diff --git a/obelics+phi3-3b-continue-training-hq-run1+stage-pretrain+x7/checkpoints/latest-checkpoint.pt b/obelics+phi3-3b-continue-training-hq-run1+stage-pretrain+x7/checkpoints/latest-checkpoint.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a5ac3cfb8c8c1b83e93797180e8b7750f0e80ef --- /dev/null +++ b/obelics+phi3-3b-continue-training-hq-run1+stage-pretrain+x7/checkpoints/latest-checkpoint.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7b1b2cfb949c4d3bbb04ae243cd747443c324e9bd3fe61630825787f5d27c39 +size 15336322587 diff --git a/obelics+phi3-3b-continue-training-hq-run1+stage-pretrain+x7/checkpoints/step-005000-epoch-00-loss=1.9222.pt b/obelics+phi3-3b-continue-training-hq-run1+stage-pretrain+x7/checkpoints/step-005000-epoch-00-loss=1.9222.pt new file mode 100644 index 0000000000000000000000000000000000000000..9d90e0a9b6d1205c008f3237d8f798026879ce10 --- /dev/null +++ b/obelics+phi3-3b-continue-training-hq-run1+stage-pretrain+x7/checkpoints/step-005000-epoch-00-loss=1.9222.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f3267e6eb19bef9395d219c34c6c2667280e37cdd8e181e0ab48eb0cfe9927f +size 15336322587 diff --git a/obelics+phi3-3b-continue-training-hq-run1+stage-pretrain+x7/checkpoints/step-009537-epoch-01-loss=2.0725.pt b/obelics+phi3-3b-continue-training-hq-run1+stage-pretrain+x7/checkpoints/step-009537-epoch-01-loss=2.0725.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a5ac3cfb8c8c1b83e93797180e8b7750f0e80ef --- /dev/null +++ b/obelics+phi3-3b-continue-training-hq-run1+stage-pretrain+x7/checkpoints/step-009537-epoch-01-loss=2.0725.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7b1b2cfb949c4d3bbb04ae243cd747443c324e9bd3fe61630825787f5d27c39 +size 15336322587 diff --git a/obelics+phi3-3b-continue-training-hq-run1+stage-pretrain+x7/config.json b/obelics+phi3-3b-continue-training-hq-run1+stage-pretrain+x7/config.json new file mode 100644 index 0000000000000000000000000000000000000000..be3ca6375ce602261f982dc624f32eda8890e70b --- /dev/null +++ b/obelics+phi3-3b-continue-training-hq-run1+stage-pretrain+x7/config.json @@ -0,0 +1,74 @@ +{ + "dataset": { + "align_stage_components": [ + "download/llava-laion-cc-sbu-558k/chat.json", + "download/llava-laion-cc-sbu-558k" + ], + "dataset_id": "obelics", + "dataset_resampled": true, + "dataset_root_dir": "/fsx-Training/shopqa-training-fsx-prod-us-east-1/home/wzwang/data/datacomp/datacomp_hq_single_pkl:/fsx-Training/shopqa-training-fsx-prod-us-east-1/home/wzwang/data/OBELICS/obelics_hq_single_pkl:/fsx-Training/shopqa-training-fsx-prod-us-east-1/home/wzwang/data/synthdog-en/synthdog_single_pkl/", + "finetune_stage_components": [ + "/fsx-training/shopqa-training-fsx-prod-us-east-1/home/wzwang/data/llava/llava_v1_5_mix665k.json", + "/fsx-training/shopqa-training-fsx-prod-us-east-1/home/wzwang/data/llava/data" + ], + "max_num_images": 6, + "min_num_images": 1, + "train_num_samples": 2441407, + "type": "obelics", + "workers": 4 + }, + "model": { + "align_epochs": 1, + "align_global_batch_size": 256, + "align_learning_rate": 0.001, + "align_lr_scheduler_type": "linear-warmup+cosine-decay", + "align_max_grad_norm": 1.0, + "align_max_steps": null, + "align_per_device_batch_size": 16, + "align_train_strategy": "fsdp-shard-grad-op", + "align_warmup_ratio": 0.03, + "align_weight_decay": 0.0, + "arch_specifier": "no-align+avgpool", + "enable_gradient_checkpointing": true, + "enable_mixed_precision_training": true, + "finetune_epochs": 1, + "finetune_global_batch_size": 128, + "finetune_learning_rate": 2e-05, + "finetune_lr_scheduler_type": "linear-warmup+cosine-decay", + "finetune_max_grad_norm": 1.0, + "finetune_max_steps": null, + "finetune_per_device_batch_size": 16, + "finetune_train_strategy": "fsdp-full-shard", + "finetune_warmup_ratio": 0.03, + "finetune_weight_decay": 0.1, + "image_resize_strategy": "resize-naive", + "llm_backbone_id": "phi3-3b", + "llm_max_length": 4096, + "model_id": "phi3-3b-continue-training-hq", + "pretrain_epochs": 1, + "pretrain_global_batch_size": 256, + "pretrain_learning_rate": 5e-05, + "pretrain_lr_scheduler_type": "linear-warmup+cosine-decay", + "pretrain_max_grad_norm": 1.0, + "pretrain_max_steps": 9537, + "pretrain_per_device_batch_size": 8, + "pretrain_train_strategy": "fsdp-full-shard", + "pretrain_warmup_ratio": 0.03, + "pretrain_weight_decay": 0.01, + "reduce_in_full_precision": false, + "type": "one-stage+7b", + "vision_backbone_id": "siglip-vit-so400m-384px" + }, + "mount_path": "/fsx-Training/shopqa-training-fsx-prod-us-east-1/home/wzwang/models", + "pretrained_checkpoint": null, + "run_id": "obelics+phi3-3b-continue-training-hq+stage-pretrain+x7", + "run_root_dir": "/fsx-Training/shopqa-training-fsx-prod-us-east-1/home/wzwang/checkpoints", + "seed": 7, + "stage": "pretrain", + "trackers": [ + "jsonl", + "wandb" + ], + "wandb_entity": null, + "wandb_project": "mmpretrain" +} \ No newline at end of file diff --git a/obelics+phi3-3b-continue-training-hq-run1+stage-pretrain+x7/config.yaml b/obelics+phi3-3b-continue-training-hq-run1+stage-pretrain+x7/config.yaml new file mode 100644 index 0000000000000000000000000000000000000000..cda1239d7d4b72b11be8eee8efe58436665d2277 --- /dev/null +++ b/obelics+phi3-3b-continue-training-hq-run1+stage-pretrain+x7/config.yaml @@ -0,0 +1,67 @@ +dataset: + align_stage_components: + - download/llava-laion-cc-sbu-558k/chat.json + - download/llava-laion-cc-sbu-558k + dataset_id: obelics + dataset_resampled: true + dataset_root_dir: /fsx-Training/shopqa-training-fsx-prod-us-east-1/home/wzwang/data/datacomp/datacomp_hq_single_pkl:/fsx-Training/shopqa-training-fsx-prod-us-east-1/home/wzwang/data/OBELICS/obelics_hq_single_pkl:/fsx-Training/shopqa-training-fsx-prod-us-east-1/home/wzwang/data/synthdog-en/synthdog_single_pkl/ + finetune_stage_components: + - /fsx-training/shopqa-training-fsx-prod-us-east-1/home/wzwang/data/llava/llava_v1_5_mix665k.json + - /fsx-training/shopqa-training-fsx-prod-us-east-1/home/wzwang/data/llava/data + max_num_images: 6 + min_num_images: 1 + train_num_samples: 2441407 + type: obelics + workers: 4 +model: + align_epochs: 1 + align_global_batch_size: 256 + align_learning_rate: 0.001 + align_lr_scheduler_type: linear-warmup+cosine-decay + align_max_grad_norm: 1.0 + align_max_steps: null + align_per_device_batch_size: 16 + align_train_strategy: fsdp-shard-grad-op + align_warmup_ratio: 0.03 + align_weight_decay: 0.0 + arch_specifier: no-align+avgpool + enable_gradient_checkpointing: true + enable_mixed_precision_training: true + finetune_epochs: 1 + finetune_global_batch_size: 128 + finetune_learning_rate: 2.0e-05 + finetune_lr_scheduler_type: linear-warmup+cosine-decay + finetune_max_grad_norm: 1.0 + finetune_max_steps: null + finetune_per_device_batch_size: 16 + finetune_train_strategy: fsdp-full-shard + finetune_warmup_ratio: 0.03 + finetune_weight_decay: 0.1 + image_resize_strategy: resize-naive + llm_backbone_id: phi3-3b + llm_max_length: 4096 + model_id: phi3-3b-continue-training-hq + pretrain_epochs: 1 + pretrain_global_batch_size: 256 + pretrain_learning_rate: 5.0e-05 + pretrain_lr_scheduler_type: linear-warmup+cosine-decay + pretrain_max_grad_norm: 1.0 + pretrain_max_steps: 9537 + pretrain_per_device_batch_size: 8 + pretrain_train_strategy: fsdp-full-shard + pretrain_warmup_ratio: 0.03 + pretrain_weight_decay: 0.01 + reduce_in_full_precision: false + type: one-stage+7b + vision_backbone_id: siglip-vit-so400m-384px +mount_path: /fsx-Training/shopqa-training-fsx-prod-us-east-1/home/wzwang/models +pretrained_checkpoint: null +run_id: obelics+phi3-3b-continue-training-hq+stage-pretrain+x7 +run_root_dir: /fsx-Training/shopqa-training-fsx-prod-us-east-1/home/wzwang/checkpoints +seed: 7 +stage: pretrain +trackers: +- jsonl +- wandb +wandb_entity: null +wandb_project: mmpretrain diff --git a/obelics+phi3-3b-continue-training-hq-run1+stage-pretrain+x7/obelics+phi3-3b-continue-training-hq+stage-pretrain+x7.jsonl b/obelics+phi3-3b-continue-training-hq-run1+stage-pretrain+x7/obelics+phi3-3b-continue-training-hq+stage-pretrain+x7.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..5992e5dbdc3ec6044a6108d11df616936123da00 --- /dev/null +++ b/obelics+phi3-3b-continue-training-hq-run1+stage-pretrain+x7/obelics+phi3-3b-continue-training-hq+stage-pretrain+x7.jsonl @@ -0,0 +1,17623 @@ +{"Pretrain/Learning Rate": 1.7482517482517484e-07, "Pretrain/Loss": 2.8460285663604736, "Pretrain/Loss (Raw)": 2.8460285663604736, "Pretrain/Step": 1, "Pretrain/Step Time": 12.032064437866211} +{"Pretrain/Learning Rate": 3.496503496503497e-07, "Pretrain/Loss": 3.249972343444824, "Pretrain/Loss (Raw)": 3.653916120529175, "Pretrain/Step": 2, "Pretrain/Step Time": 9.732903242111206} +{"Pretrain/Learning Rate": 5.244755244755246e-07, "Pretrain/Loss": 3.0853233337402344, "Pretrain/Loss (Raw)": 2.756025552749634, "Pretrain/Step": 3, "Pretrain/Step Time": 8.947766542434692} +{"Pretrain/Learning Rate": 6.993006993006994e-07, "Pretrain/Loss": 3.104240894317627, "Pretrain/Loss (Raw)": 3.1609935760498047, "Pretrain/Step": 4, "Pretrain/Step Time": 8.68039608001709} +{"Pretrain/Learning Rate": 8.741258741258743e-07, "Pretrain/Loss": 3.109840154647827, "Pretrain/Loss (Raw)": 3.1322364807128906, "Pretrain/Step": 5, "Pretrain/Step Time": 8.428513193130494} +{"Pretrain/Learning Rate": 1.0489510489510491e-06, "Pretrain/Loss": 3.110654830932617, "Pretrain/Loss (Raw)": 3.1147289276123047, "Pretrain/Step": 6, "Pretrain/Step Time": 8.257091204325357} +{"Pretrain/Learning Rate": 1.2237762237762238e-06, "Pretrain/Loss": 3.079310417175293, "Pretrain/Loss (Raw)": 2.8912436962127686, "Pretrain/Step": 7, "Pretrain/Step Time": 8.207454408918109} +{"Pretrain/Learning Rate": 1.3986013986013987e-06, "Pretrain/Loss": 3.1147851943969727, "Pretrain/Loss (Raw)": 3.363107681274414, "Pretrain/Step": 8, "Pretrain/Step Time": 8.118331164121628} +{"Pretrain/Learning Rate": 1.5734265734265736e-06, "Pretrain/Loss": 3.1069369316101074, "Pretrain/Loss (Raw)": 3.044152021408081, "Pretrain/Step": 9, "Pretrain/Step Time": 8.051265319188436} +{"Pretrain/Learning Rate": 1.7482517482517485e-06, "Pretrain/Loss": 3.066074848175049, "Pretrain/Loss (Raw)": 2.698314666748047, "Pretrain/Step": 10, "Pretrain/Step Time": 8.038108372688294} +{"Pretrain/Learning Rate": 1.9230769230769234e-06, "Pretrain/Loss": 3.044703483581543, "Pretrain/Loss (Raw)": 2.8309895992279053, "Pretrain/Step": 11, "Pretrain/Step Time": 7.9767327958887275} +{"Pretrain/Learning Rate": 2.0979020979020983e-06, "Pretrain/Loss": 3.015629291534424, "Pretrain/Loss (Raw)": 2.6958138942718506, "Pretrain/Step": 12, "Pretrain/Step Time": 7.951660593350728} +{"Pretrain/Learning Rate": 2.2727272727272728e-06, "Pretrain/Loss": 3.0195610523223877, "Pretrain/Loss (Raw)": 3.0667409896850586, "Pretrain/Step": 13, "Pretrain/Step Time": 7.910945488856389} +{"Pretrain/Learning Rate": 2.4475524475524477e-06, "Pretrain/Loss": 3.008017063140869, "Pretrain/Loss (Raw)": 2.8579440116882324, "Pretrain/Step": 14, "Pretrain/Step Time": 7.900590079171317} +{"Pretrain/Learning Rate": 2.6223776223776225e-06, "Pretrain/Loss": 2.9691388607025146, "Pretrain/Loss (Raw)": 2.4248430728912354, "Pretrain/Step": 15, "Pretrain/Step Time": 7.908502610524495} +{"Pretrain/Learning Rate": 2.7972027972027974e-06, "Pretrain/Loss": 2.9383084774017334, "Pretrain/Loss (Raw)": 2.475855588912964, "Pretrain/Step": 16, "Pretrain/Step Time": 7.885215729475021} +{"Pretrain/Learning Rate": 2.9720279720279723e-06, "Pretrain/Loss": 2.909243106842041, "Pretrain/Loss (Raw)": 2.4441981315612793, "Pretrain/Step": 17, "Pretrain/Step Time": 7.903768693699556} +{"Pretrain/Learning Rate": 3.1468531468531472e-06, "Pretrain/Loss": 2.888265371322632, "Pretrain/Loss (Raw)": 2.5316429138183594, "Pretrain/Step": 18, "Pretrain/Step Time": 7.890596124860975} +{"Pretrain/Learning Rate": 3.3216783216783217e-06, "Pretrain/Loss": 2.8690602779388428, "Pretrain/Loss (Raw)": 2.5233685970306396, "Pretrain/Step": 19, "Pretrain/Step Time": 7.896613698256643} +{"Pretrain/Learning Rate": 3.496503496503497e-06, "Pretrain/Loss": 2.8462588787078857, "Pretrain/Loss (Raw)": 2.4130349159240723, "Pretrain/Step": 20, "Pretrain/Step Time": 7.9053069114685055} +{"Pretrain/Learning Rate": 3.6713286713286715e-06, "Pretrain/Loss": 2.827967405319214, "Pretrain/Loss (Raw)": 2.462135076522827, "Pretrain/Step": 21, "Pretrain/Step Time": 7.894351811636062} +{"Pretrain/Learning Rate": 3.846153846153847e-06, "Pretrain/Loss": 2.8040499687194824, "Pretrain/Loss (Raw)": 2.3017823696136475, "Pretrain/Step": 22, "Pretrain/Step Time": 7.875464016740972} +{"Pretrain/Learning Rate": 4.020979020979021e-06, "Pretrain/Loss": 2.7928407192230225, "Pretrain/Loss (Raw)": 2.546238660812378, "Pretrain/Step": 23, "Pretrain/Step Time": 7.864544941031414} +{"Pretrain/Learning Rate": 4.195804195804197e-06, "Pretrain/Loss": 2.7817482948303223, "Pretrain/Loss (Raw)": 2.5266199111938477, "Pretrain/Step": 24, "Pretrain/Step Time": 7.845136791467667} +{"Pretrain/Learning Rate": 4.370629370629371e-06, "Pretrain/Loss": 2.7716481685638428, "Pretrain/Loss (Raw)": 2.5292534828186035, "Pretrain/Step": 25, "Pretrain/Step Time": 7.838245077133179} +{"Pretrain/Learning Rate": 4.5454545454545455e-06, "Pretrain/Loss": 2.766817092895508, "Pretrain/Loss (Raw)": 2.646033763885498, "Pretrain/Step": 26, "Pretrain/Step Time": 7.831610065240127} +{"Pretrain/Learning Rate": 4.72027972027972e-06, "Pretrain/Loss": 2.7653729915618896, "Pretrain/Loss (Raw)": 2.7278265953063965, "Pretrain/Step": 27, "Pretrain/Step Time": 7.824758741590712} +{"Pretrain/Learning Rate": 4.895104895104895e-06, "Pretrain/Loss": 2.745556116104126, "Pretrain/Loss (Raw)": 2.2105019092559814, "Pretrain/Step": 28, "Pretrain/Step Time": 7.8191874878747125} +{"Pretrain/Learning Rate": 5.06993006993007e-06, "Pretrain/Loss": 2.7283670902252197, "Pretrain/Loss (Raw)": 2.2470719814300537, "Pretrain/Step": 29, "Pretrain/Step Time": 7.809998841121279} +{"Pretrain/Learning Rate": 5.244755244755245e-06, "Pretrain/Loss": 2.7122514247894287, "Pretrain/Loss (Raw)": 2.244896173477173, "Pretrain/Step": 30, "Pretrain/Step Time": 7.79525187810262} +{"Pretrain/Learning Rate": 5.419580419580419e-06, "Pretrain/Loss": 2.695899248123169, "Pretrain/Loss (Raw)": 2.2053334712982178, "Pretrain/Step": 31, "Pretrain/Step Time": 7.789275815409999} +{"Pretrain/Learning Rate": 5.594405594405595e-06, "Pretrain/Loss": 2.6799533367156982, "Pretrain/Loss (Raw)": 2.1856322288513184, "Pretrain/Step": 32, "Pretrain/Step Time": 7.7785025760531425} +{"Pretrain/Learning Rate": 5.76923076923077e-06, "Pretrain/Loss": 2.6702280044555664, "Pretrain/Loss (Raw)": 2.3590197563171387, "Pretrain/Step": 33, "Pretrain/Step Time": 7.768782218297322} +{"Pretrain/Learning Rate": 5.944055944055945e-06, "Pretrain/Loss": 2.6562118530273438, "Pretrain/Loss (Raw)": 2.193678379058838, "Pretrain/Step": 34, "Pretrain/Step Time": 7.769338832182043} +{"Pretrain/Learning Rate": 6.1188811188811196e-06, "Pretrain/Loss": 2.6424636840820312, "Pretrain/Loss (Raw)": 2.1750247478485107, "Pretrain/Step": 35, "Pretrain/Step Time": 7.783820261274065} +{"Pretrain/Learning Rate": 6.2937062937062944e-06, "Pretrain/Loss": 2.6328208446502686, "Pretrain/Loss (Raw)": 2.295318126678467, "Pretrain/Step": 36, "Pretrain/Step Time": 7.778296675946978} +{"Pretrain/Learning Rate": 6.468531468531469e-06, "Pretrain/Loss": 2.626593828201294, "Pretrain/Loss (Raw)": 2.4024229049682617, "Pretrain/Step": 37, "Pretrain/Step Time": 7.788426940505569} +{"Pretrain/Learning Rate": 6.643356643356643e-06, "Pretrain/Loss": 2.6130504608154297, "Pretrain/Loss (Raw)": 2.11194109916687, "Pretrain/Step": 38, "Pretrain/Step Time": 7.78365863624372} +{"Pretrain/Learning Rate": 6.818181818181818e-06, "Pretrain/Loss": 2.6049559116363525, "Pretrain/Loss (Raw)": 2.29736328125, "Pretrain/Step": 39, "Pretrain/Step Time": 7.780362202570989} +{"Pretrain/Learning Rate": 6.993006993006994e-06, "Pretrain/Loss": 2.595923662185669, "Pretrain/Loss (Raw)": 2.2436695098876953, "Pretrain/Step": 40, "Pretrain/Step Time": 7.776529437303543} +{"Pretrain/Learning Rate": 7.167832167832168e-06, "Pretrain/Loss": 2.590574264526367, "Pretrain/Loss (Raw)": 2.376607656478882, "Pretrain/Step": 41, "Pretrain/Step Time": 7.769616981831993} +{"Pretrain/Learning Rate": 7.342657342657343e-06, "Pretrain/Loss": 2.579026699066162, "Pretrain/Loss (Raw)": 2.1055643558502197, "Pretrain/Step": 42, "Pretrain/Step Time": 7.759991265478588} +{"Pretrain/Learning Rate": 7.517482517482517e-06, "Pretrain/Loss": 2.5701091289520264, "Pretrain/Loss (Raw)": 2.1955790519714355, "Pretrain/Step": 43, "Pretrain/Step Time": 7.756578961084055} +{"Pretrain/Learning Rate": 7.692307692307694e-06, "Pretrain/Loss": 2.5688772201538086, "Pretrain/Loss (Raw)": 2.515897512435913, "Pretrain/Step": 44, "Pretrain/Step Time": 7.750463556159627} +{"Pretrain/Learning Rate": 7.867132867132867e-06, "Pretrain/Loss": 2.560041666030884, "Pretrain/Loss (Raw)": 2.171278953552246, "Pretrain/Step": 45, "Pretrain/Step Time": 7.744692182540893} +{"Pretrain/Learning Rate": 8.041958041958042e-06, "Pretrain/Loss": 2.554689884185791, "Pretrain/Loss (Raw)": 2.313857316970825, "Pretrain/Step": 46, "Pretrain/Step Time": 7.745205298714016} +{"Pretrain/Learning Rate": 8.216783216783217e-06, "Pretrain/Loss": 2.5530035495758057, "Pretrain/Loss (Raw)": 2.4754388332366943, "Pretrain/Step": 47, "Pretrain/Step Time": 7.743985815251127} +{"Pretrain/Learning Rate": 8.391608391608393e-06, "Pretrain/Loss": 2.54587459564209, "Pretrain/Loss (Raw)": 2.2108047008514404, "Pretrain/Step": 48, "Pretrain/Step Time": 7.738382190465927} +{"Pretrain/Learning Rate": 8.566433566433566e-06, "Pretrain/Loss": 2.5381267070770264, "Pretrain/Loss (Raw)": 2.1662354469299316, "Pretrain/Step": 49, "Pretrain/Step Time": 7.736108682593521} +{"Pretrain/Learning Rate": 8.741258741258741e-06, "Pretrain/Loss": 2.531913995742798, "Pretrain/Loss (Raw)": 2.227494478225708, "Pretrain/Step": 50, "Pretrain/Step Time": 7.735683169364929} +{"Pretrain/Learning Rate": 8.916083916083918e-06, "Pretrain/Loss": 2.527768611907959, "Pretrain/Loss (Raw)": 2.3204898834228516, "Pretrain/Step": 51, "Pretrain/Step Time": 7.731853237339094} +{"Pretrain/Learning Rate": 9.090909090909091e-06, "Pretrain/Loss": 2.521298408508301, "Pretrain/Loss (Raw)": 2.191316604614258, "Pretrain/Step": 52, "Pretrain/Step Time": 7.72695594567519} +{"Pretrain/Learning Rate": 9.265734265734266e-06, "Pretrain/Loss": 2.5148775577545166, "Pretrain/Loss (Raw)": 2.18100905418396, "Pretrain/Step": 53, "Pretrain/Step Time": 7.72657904984816} +{"Pretrain/Learning Rate": 9.44055944055944e-06, "Pretrain/Loss": 2.507702350616455, "Pretrain/Loss (Raw)": 2.127391815185547, "Pretrain/Step": 54, "Pretrain/Step Time": 7.724079463216993} +{"Pretrain/Learning Rate": 9.615384615384616e-06, "Pretrain/Loss": 2.499607563018799, "Pretrain/Loss (Raw)": 2.062511444091797, "Pretrain/Step": 55, "Pretrain/Step Time": 7.72364186373624} +{"Pretrain/Learning Rate": 9.79020979020979e-06, "Pretrain/Loss": 2.4910714626312256, "Pretrain/Loss (Raw)": 2.0215823650360107, "Pretrain/Step": 56, "Pretrain/Step Time": 7.737697733300073} +{"Pretrain/Learning Rate": 9.965034965034966e-06, "Pretrain/Loss": 2.4882900714874268, "Pretrain/Loss (Raw)": 2.3325235843658447, "Pretrain/Step": 57, "Pretrain/Step Time": 7.733085531937449} +{"Pretrain/Learning Rate": 1.013986013986014e-05, "Pretrain/Loss": 2.481330394744873, "Pretrain/Loss (Raw)": 2.0846354961395264, "Pretrain/Step": 58, "Pretrain/Step Time": 7.7346498349617265} +{"Pretrain/Learning Rate": 1.0314685314685315e-05, "Pretrain/Loss": 2.4751532077789307, "Pretrain/Loss (Raw)": 2.116873264312744, "Pretrain/Step": 59, "Pretrain/Step Time": 7.732196432048991} +{"Pretrain/Learning Rate": 1.048951048951049e-05, "Pretrain/Loss": 2.4724831581115723, "Pretrain/Loss (Raw)": 2.3149430751800537, "Pretrain/Step": 60, "Pretrain/Step Time": 7.726930816968282} +{"Pretrain/Learning Rate": 1.0664335664335665e-05, "Pretrain/Loss": 2.4681479930877686, "Pretrain/Loss (Raw)": 2.2080538272857666, "Pretrain/Step": 61, "Pretrain/Step Time": 7.7225650451222405} +{"Pretrain/Learning Rate": 1.0839160839160838e-05, "Pretrain/Loss": 2.4647984504699707, "Pretrain/Loss (Raw)": 2.2604660987854004, "Pretrain/Step": 62, "Pretrain/Step Time": 7.719342516314599} +{"Pretrain/Learning Rate": 1.1013986013986015e-05, "Pretrain/Loss": 2.458838701248169, "Pretrain/Loss (Raw)": 2.089327573776245, "Pretrain/Step": 63, "Pretrain/Step Time": 7.714977953169081} +{"Pretrain/Learning Rate": 1.118881118881119e-05, "Pretrain/Loss": 2.4549546241760254, "Pretrain/Loss (Raw)": 2.2102603912353516, "Pretrain/Step": 64, "Pretrain/Step Time": 7.713527001440525} +{"Pretrain/Learning Rate": 1.1363636363636365e-05, "Pretrain/Loss": 2.4506099224090576, "Pretrain/Loss (Raw)": 2.172550916671753, "Pretrain/Step": 65, "Pretrain/Step Time": 7.706490047161395} +{"Pretrain/Learning Rate": 1.153846153846154e-05, "Pretrain/Loss": 2.447425127029419, "Pretrain/Loss (Raw)": 2.240415573120117, "Pretrain/Step": 66, "Pretrain/Step Time": 7.70568931463993} +{"Pretrain/Learning Rate": 1.1713286713286714e-05, "Pretrain/Loss": 2.4437415599823, "Pretrain/Loss (Raw)": 2.200626850128174, "Pretrain/Step": 67, "Pretrain/Step Time": 7.70841355466131} +{"Pretrain/Learning Rate": 1.188811188811189e-05, "Pretrain/Loss": 2.441032886505127, "Pretrain/Loss (Raw)": 2.259566068649292, "Pretrain/Step": 68, "Pretrain/Step Time": 7.70924833241631} +{"Pretrain/Learning Rate": 1.2062937062937063e-05, "Pretrain/Loss": 2.438105583190918, "Pretrain/Loss (Raw)": 2.23903751373291, "Pretrain/Step": 69, "Pretrain/Step Time": 7.709068021912506} +{"Pretrain/Learning Rate": 1.2237762237762239e-05, "Pretrain/Loss": 2.434459924697876, "Pretrain/Loss (Raw)": 2.1829030513763428, "Pretrain/Step": 70, "Pretrain/Step Time": 7.705200713021415} +{"Pretrain/Learning Rate": 1.2412587412587414e-05, "Pretrain/Loss": 2.431450128555298, "Pretrain/Loss (Raw)": 2.2207674980163574, "Pretrain/Step": 71, "Pretrain/Step Time": 7.701325520663194} +{"Pretrain/Learning Rate": 1.2587412587412589e-05, "Pretrain/Loss": 2.4292750358581543, "Pretrain/Loss (Raw)": 2.274847984313965, "Pretrain/Step": 72, "Pretrain/Step Time": 7.705403847826852} +{"Pretrain/Learning Rate": 1.2762237762237764e-05, "Pretrain/Loss": 2.426279067993164, "Pretrain/Loss (Raw)": 2.210578441619873, "Pretrain/Step": 73, "Pretrain/Step Time": 7.703031690153357} +{"Pretrain/Learning Rate": 1.2937062937062939e-05, "Pretrain/Loss": 2.4233126640319824, "Pretrain/Loss (Raw)": 2.206761121749878, "Pretrain/Step": 74, "Pretrain/Step Time": 7.707880139350891} +{"Pretrain/Learning Rate": 1.3111888111888112e-05, "Pretrain/Loss": 2.424050807952881, "Pretrain/Loss (Raw)": 2.4786596298217773, "Pretrain/Step": 75, "Pretrain/Step Time": 7.7140113035837805} +{"Pretrain/Learning Rate": 1.3286713286713287e-05, "Pretrain/Loss": 2.420957088470459, "Pretrain/Loss (Raw)": 2.188944101333618, "Pretrain/Step": 76, "Pretrain/Step Time": 7.716661744996121} +{"Pretrain/Learning Rate": 1.3461538461538462e-05, "Pretrain/Loss": 2.417999744415283, "Pretrain/Loss (Raw)": 2.1932218074798584, "Pretrain/Step": 77, "Pretrain/Step Time": 7.7180050348306635} +{"Pretrain/Learning Rate": 1.3636363636363637e-05, "Pretrain/Loss": 2.415626049041748, "Pretrain/Loss (Raw)": 2.2328450679779053, "Pretrain/Step": 78, "Pretrain/Step Time": 7.743045449256897} +{"Pretrain/Learning Rate": 1.381118881118881e-05, "Pretrain/Loss": 2.4112706184387207, "Pretrain/Loss (Raw)": 2.0715560913085938, "Pretrain/Step": 79, "Pretrain/Step Time": 7.744259327272825} +{"Pretrain/Learning Rate": 1.3986013986013988e-05, "Pretrain/Loss": 2.412069082260132, "Pretrain/Loss (Raw)": 2.4751391410827637, "Pretrain/Step": 80, "Pretrain/Step Time": 7.780219694972038} +{"Pretrain/Learning Rate": 1.4160839160839163e-05, "Pretrain/Loss": 2.409661054611206, "Pretrain/Loss (Raw)": 2.2170331478118896, "Pretrain/Step": 81, "Pretrain/Step Time": 7.783876701637551} +{"Pretrain/Learning Rate": 1.4335664335664336e-05, "Pretrain/Loss": 2.406467914581299, "Pretrain/Loss (Raw)": 2.1478328704833984, "Pretrain/Step": 82, "Pretrain/Step Time": 7.798103402300579} +{"Pretrain/Learning Rate": 1.4510489510489511e-05, "Pretrain/Loss": 2.4055707454681396, "Pretrain/Loss (Raw)": 2.3320083618164062, "Pretrain/Step": 83, "Pretrain/Step Time": 7.794719084199652} +{"Pretrain/Learning Rate": 1.4685314685314686e-05, "Pretrain/Loss": 2.402594804763794, "Pretrain/Loss (Raw)": 2.1555755138397217, "Pretrain/Step": 84, "Pretrain/Step Time": 7.801240796134586} +{"Pretrain/Learning Rate": 1.486013986013986e-05, "Pretrain/Loss": 2.4015212059020996, "Pretrain/Loss (Raw)": 2.3113369941711426, "Pretrain/Step": 85, "Pretrain/Step Time": 7.79887755057391} +{"Pretrain/Learning Rate": 1.5034965034965034e-05, "Pretrain/Loss": 2.4001169204711914, "Pretrain/Loss (Raw)": 2.280766010284424, "Pretrain/Step": 86, "Pretrain/Step Time": 7.803114683129067} +{"Pretrain/Learning Rate": 1.5209790209790212e-05, "Pretrain/Loss": 2.398087739944458, "Pretrain/Loss (Raw)": 2.2235827445983887, "Pretrain/Step": 87, "Pretrain/Step Time": 7.801767672615489} +{"Pretrain/Learning Rate": 1.5384615384615387e-05, "Pretrain/Loss": 2.3955609798431396, "Pretrain/Loss (Raw)": 2.175712823867798, "Pretrain/Step": 88, "Pretrain/Step Time": 7.8064777824011715} +{"Pretrain/Learning Rate": 1.555944055944056e-05, "Pretrain/Loss": 2.3941171169281006, "Pretrain/Loss (Raw)": 2.2670726776123047, "Pretrain/Step": 89, "Pretrain/Step Time": 7.807056785969252} +{"Pretrain/Learning Rate": 1.5734265734265734e-05, "Pretrain/Loss": 2.390076160430908, "Pretrain/Loss (Raw)": 2.0304007530212402, "Pretrain/Step": 90, "Pretrain/Step Time": 7.809276201989916} +{"Pretrain/Learning Rate": 1.590909090909091e-05, "Pretrain/Loss": 2.3884809017181396, "Pretrain/Loss (Raw)": 2.244924306869507, "Pretrain/Step": 91, "Pretrain/Step Time": 7.814442008406251} +{"Pretrain/Learning Rate": 1.6083916083916083e-05, "Pretrain/Loss": 2.3889377117156982, "Pretrain/Loss (Raw)": 2.430492401123047, "Pretrain/Step": 92, "Pretrain/Step Time": 7.823402062706325} +{"Pretrain/Learning Rate": 1.625874125874126e-05, "Pretrain/Loss": 2.3862643241882324, "Pretrain/Loss (Raw)": 2.1403441429138184, "Pretrain/Step": 93, "Pretrain/Step Time": 7.8178471929283555} +{"Pretrain/Learning Rate": 1.6433566433566433e-05, "Pretrain/Loss": 2.3843934535980225, "Pretrain/Loss (Raw)": 2.2104032039642334, "Pretrain/Step": 94, "Pretrain/Step Time": 7.825227012025549} +{"Pretrain/Learning Rate": 1.660839160839161e-05, "Pretrain/Loss": 2.3848512172698975, "Pretrain/Loss (Raw)": 2.427863836288452, "Pretrain/Step": 95, "Pretrain/Step Time": 7.833561417931005} +{"Pretrain/Learning Rate": 1.6783216783216786e-05, "Pretrain/Loss": 2.38305401802063, "Pretrain/Loss (Raw)": 2.2123208045959473, "Pretrain/Step": 96, "Pretrain/Step Time": 7.845916127165158} +{"Pretrain/Learning Rate": 1.695804195804196e-05, "Pretrain/Loss": 2.380073070526123, "Pretrain/Loss (Raw)": 2.0939252376556396, "Pretrain/Step": 97, "Pretrain/Step Time": 7.84846668636676} +{"Pretrain/Learning Rate": 1.7132867132867133e-05, "Pretrain/Loss": 2.3776986598968506, "Pretrain/Loss (Raw)": 2.147359848022461, "Pretrain/Step": 98, "Pretrain/Step Time": 7.849580555546041} +{"Pretrain/Learning Rate": 1.730769230769231e-05, "Pretrain/Loss": 2.3762519359588623, "Pretrain/Loss (Raw)": 2.2344722747802734, "Pretrain/Step": 99, "Pretrain/Step Time": 7.853722767396406} +{"Pretrain/Learning Rate": 1.7482517482517483e-05, "Pretrain/Loss": 2.3744795322418213, "Pretrain/Loss (Raw)": 2.1990318298339844, "Pretrain/Step": 100, "Pretrain/Step Time": 7.849523806571961} +{"Pretrain/Learning Rate": 1.7657342657342656e-05, "Pretrain/Loss": 2.3749890327453613, "Pretrain/Loss (Raw)": 2.425929546356201, "Pretrain/Step": 101, "Pretrain/Step Time": 7.855651510824071} +{"Pretrain/Learning Rate": 1.7832167832167836e-05, "Pretrain/Loss": 2.3743205070495605, "Pretrain/Loss (Raw)": 2.306797981262207, "Pretrain/Step": 102, "Pretrain/Step Time": 7.85061496145585} +{"Pretrain/Learning Rate": 1.800699300699301e-05, "Pretrain/Loss": 2.3724265098571777, "Pretrain/Loss (Raw)": 2.179245948791504, "Pretrain/Step": 103, "Pretrain/Step Time": 7.857635766557119} +{"Pretrain/Learning Rate": 1.8181818181818182e-05, "Pretrain/Loss": 2.371295213699341, "Pretrain/Loss (Raw)": 2.2547619342803955, "Pretrain/Step": 104, "Pretrain/Step Time": 7.853264813239758} +{"Pretrain/Learning Rate": 1.835664335664336e-05, "Pretrain/Loss": 2.370499849319458, "Pretrain/Loss (Raw)": 2.287759780883789, "Pretrain/Step": 105, "Pretrain/Step Time": 7.8585426739283974} +{"Pretrain/Learning Rate": 1.8531468531468532e-05, "Pretrain/Loss": 2.3688836097717285, "Pretrain/Loss (Raw)": 2.1991984844207764, "Pretrain/Step": 106, "Pretrain/Step Time": 7.854193745918994} +{"Pretrain/Learning Rate": 1.8706293706293705e-05, "Pretrain/Loss": 2.367008686065674, "Pretrain/Loss (Raw)": 2.168264389038086, "Pretrain/Step": 107, "Pretrain/Step Time": 7.859348330542306} +{"Pretrain/Learning Rate": 1.888111888111888e-05, "Pretrain/Loss": 2.366306781768799, "Pretrain/Loss (Raw)": 2.2912001609802246, "Pretrain/Step": 108, "Pretrain/Step Time": 7.856139200705069} +{"Pretrain/Learning Rate": 1.9055944055944055e-05, "Pretrain/Loss": 2.36594820022583, "Pretrain/Loss (Raw)": 2.3272416591644287, "Pretrain/Step": 109, "Pretrain/Step Time": 7.858866989065747} +{"Pretrain/Learning Rate": 1.923076923076923e-05, "Pretrain/Loss": 2.36472225189209, "Pretrain/Loss (Raw)": 2.2310750484466553, "Pretrain/Step": 110, "Pretrain/Step Time": 7.861648173765703} +{"Pretrain/Learning Rate": 1.9405594405594408e-05, "Pretrain/Loss": 2.363757610321045, "Pretrain/Loss (Raw)": 2.257636070251465, "Pretrain/Step": 111, "Pretrain/Step Time": 7.859404374887277} +{"Pretrain/Learning Rate": 1.958041958041958e-05, "Pretrain/Loss": 2.362760305404663, "Pretrain/Loss (Raw)": 2.2520864009857178, "Pretrain/Step": 112, "Pretrain/Step Time": 7.868437879851887} +{"Pretrain/Learning Rate": 1.9755244755244758e-05, "Pretrain/Loss": 2.364232301712036, "Pretrain/Loss (Raw)": 2.529090166091919, "Pretrain/Step": 113, "Pretrain/Step Time": 7.86961821750202} +{"Pretrain/Learning Rate": 1.993006993006993e-05, "Pretrain/Loss": 2.3622453212738037, "Pretrain/Loss (Raw)": 2.137709379196167, "Pretrain/Step": 114, "Pretrain/Step Time": 7.870085197582579} +{"Pretrain/Learning Rate": 2.0104895104895104e-05, "Pretrain/Loss": 2.360063076019287, "Pretrain/Loss (Raw)": 2.111299514770508, "Pretrain/Step": 115, "Pretrain/Step Time": 7.87968869001969} +{"Pretrain/Learning Rate": 2.027972027972028e-05, "Pretrain/Loss": 2.3595733642578125, "Pretrain/Loss (Raw)": 2.3032405376434326, "Pretrain/Step": 116, "Pretrain/Step Time": 7.885045781217772} +{"Pretrain/Learning Rate": 2.0454545454545457e-05, "Pretrain/Loss": 2.358350992202759, "Pretrain/Loss (Raw)": 2.2165489196777344, "Pretrain/Step": 117, "Pretrain/Step Time": 7.882285093649839} +{"Pretrain/Learning Rate": 2.062937062937063e-05, "Pretrain/Loss": 2.3558106422424316, "Pretrain/Loss (Raw)": 2.058619260787964, "Pretrain/Step": 118, "Pretrain/Step Time": 7.886645084720547} +{"Pretrain/Learning Rate": 2.0804195804195807e-05, "Pretrain/Loss": 2.3549346923828125, "Pretrain/Loss (Raw)": 2.251528263092041, "Pretrain/Step": 119, "Pretrain/Step Time": 7.883616211033669} +{"Pretrain/Learning Rate": 2.097902097902098e-05, "Pretrain/Loss": 2.35233211517334, "Pretrain/Loss (Raw)": 2.0426244735717773, "Pretrain/Step": 120, "Pretrain/Step Time": 7.890212255716324} +{"Pretrain/Learning Rate": 2.1153846153846154e-05, "Pretrain/Loss": 2.352368116378784, "Pretrain/Loss (Raw)": 2.3567330837249756, "Pretrain/Step": 121, "Pretrain/Step Time": 7.8901123586765} +{"Pretrain/Learning Rate": 2.132867132867133e-05, "Pretrain/Loss": 2.3517189025878906, "Pretrain/Loss (Raw)": 2.273167610168457, "Pretrain/Step": 122, "Pretrain/Step Time": 7.8954030040834775} +{"Pretrain/Learning Rate": 2.1503496503496503e-05, "Pretrain/Loss": 2.350473642349243, "Pretrain/Loss (Raw)": 2.198542594909668, "Pretrain/Step": 123, "Pretrain/Step Time": 7.889473248303421} +{"Pretrain/Learning Rate": 2.1678321678321677e-05, "Pretrain/Loss": 2.350097894668579, "Pretrain/Loss (Raw)": 2.303863286972046, "Pretrain/Step": 124, "Pretrain/Step Time": 7.894464467802355} +{"Pretrain/Learning Rate": 2.1853146853146857e-05, "Pretrain/Loss": 2.3509721755981445, "Pretrain/Loss (Raw)": 2.4593615531921387, "Pretrain/Step": 125, "Pretrain/Step Time": 7.891487432479859} +{"Pretrain/Learning Rate": 2.202797202797203e-05, "Pretrain/Loss": 2.3494975566864014, "Pretrain/Loss (Raw)": 2.165160894393921, "Pretrain/Step": 126, "Pretrain/Step Time": 7.8928578278375054} +{"Pretrain/Learning Rate": 2.2202797202797203e-05, "Pretrain/Loss": 2.34889817237854, "Pretrain/Loss (Raw)": 2.273383140563965, "Pretrain/Step": 127, "Pretrain/Step Time": 7.893057286270022} +{"Pretrain/Learning Rate": 2.237762237762238e-05, "Pretrain/Loss": 2.3475518226623535, "Pretrain/Loss (Raw)": 2.176567554473877, "Pretrain/Step": 128, "Pretrain/Step Time": 7.893094075843692} +{"Pretrain/Learning Rate": 2.2552447552447553e-05, "Pretrain/Loss": 2.3430299758911133, "Pretrain/Loss (Raw)": 2.267275094985962, "Pretrain/Step": 129, "Pretrain/Step Time": 7.865392213687301} +{"Pretrain/Learning Rate": 2.272727272727273e-05, "Pretrain/Loss": 2.3314785957336426, "Pretrain/Loss (Raw)": 2.175328254699707, "Pretrain/Step": 130, "Pretrain/Step Time": 7.869465524330735} +{"Pretrain/Learning Rate": 2.2902097902097902e-05, "Pretrain/Loss": 2.3269505500793457, "Pretrain/Loss (Raw)": 2.1764626502990723, "Pretrain/Step": 131, "Pretrain/Step Time": 7.87396882660687} +{"Pretrain/Learning Rate": 2.307692307692308e-05, "Pretrain/Loss": 2.3190693855285645, "Pretrain/Loss (Raw)": 2.152157783508301, "Pretrain/Step": 132, "Pretrain/Step Time": 7.874379526823759} +{"Pretrain/Learning Rate": 2.3251748251748252e-05, "Pretrain/Loss": 2.310555934906006, "Pretrain/Loss (Raw)": 2.042534828186035, "Pretrain/Step": 133, "Pretrain/Step Time": 7.879768008366227} +{"Pretrain/Learning Rate": 2.342657342657343e-05, "Pretrain/Loss": 2.3040895462036133, "Pretrain/Loss (Raw)": 2.287010431289673, "Pretrain/Step": 134, "Pretrain/Step Time": 7.896551851183176} +{"Pretrain/Learning Rate": 2.3601398601398602e-05, "Pretrain/Loss": 2.2986507415771484, "Pretrain/Loss (Raw)": 2.195103406906128, "Pretrain/Step": 135, "Pretrain/Step Time": 7.902354979887605} +{"Pretrain/Learning Rate": 2.377622377622378e-05, "Pretrain/Loss": 2.2892005443573, "Pretrain/Loss (Raw)": 2.153459072113037, "Pretrain/Step": 136, "Pretrain/Step Time": 7.905233604833484} +{"Pretrain/Learning Rate": 2.3951048951048952e-05, "Pretrain/Loss": 2.283583402633667, "Pretrain/Loss (Raw)": 2.3251700401306152, "Pretrain/Step": 137, "Pretrain/Step Time": 7.909438701346517} +{"Pretrain/Learning Rate": 2.4125874125874125e-05, "Pretrain/Loss": 2.2793128490448, "Pretrain/Loss (Raw)": 2.1516788005828857, "Pretrain/Step": 138, "Pretrain/Step Time": 7.906712336465716} +{"Pretrain/Learning Rate": 2.43006993006993e-05, "Pretrain/Loss": 2.2732040882110596, "Pretrain/Loss (Raw)": 2.049078941345215, "Pretrain/Step": 139, "Pretrain/Step Time": 7.912155402824283} +{"Pretrain/Learning Rate": 2.4475524475524478e-05, "Pretrain/Loss": 2.2704102993011475, "Pretrain/Loss (Raw)": 2.3382019996643066, "Pretrain/Step": 140, "Pretrain/Step Time": 7.9173374231904745} +{"Pretrain/Learning Rate": 2.465034965034965e-05, "Pretrain/Loss": 2.2646350860595703, "Pretrain/Loss (Raw)": 2.3274972438812256, "Pretrain/Step": 141, "Pretrain/Step Time": 7.916531281545758} +{"Pretrain/Learning Rate": 2.4825174825174828e-05, "Pretrain/Loss": 2.258272647857666, "Pretrain/Loss (Raw)": 2.0435891151428223, "Pretrain/Step": 142, "Pretrain/Step Time": 7.917483827099204} +{"Pretrain/Learning Rate": 2.5e-05, "Pretrain/Loss": 2.257107973098755, "Pretrain/Loss (Raw)": 2.2757577896118164, "Pretrain/Step": 143, "Pretrain/Step Time": 7.91461693495512} +{"Pretrain/Learning Rate": 2.5174825174825178e-05, "Pretrain/Loss": 2.2548844814300537, "Pretrain/Loss (Raw)": 2.191223621368408, "Pretrain/Step": 144, "Pretrain/Step Time": 7.91954399086535} +{"Pretrain/Learning Rate": 2.534965034965035e-05, "Pretrain/Loss": 2.2532730102539062, "Pretrain/Loss (Raw)": 2.2379448413848877, "Pretrain/Step": 145, "Pretrain/Step Time": 7.912338078022003} +{"Pretrain/Learning Rate": 2.5524475524475528e-05, "Pretrain/Loss": 2.2508788108825684, "Pretrain/Loss (Raw)": 2.2251899242401123, "Pretrain/Step": 146, "Pretrain/Step Time": 7.916160624474287} +{"Pretrain/Learning Rate": 2.5699300699300697e-05, "Pretrain/Loss": 2.2479288578033447, "Pretrain/Loss (Raw)": 2.1457836627960205, "Pretrain/Step": 147, "Pretrain/Step Time": 7.911960165947676} +{"Pretrain/Learning Rate": 2.5874125874125877e-05, "Pretrain/Loss": 2.246023178100586, "Pretrain/Loss (Raw)": 2.1690831184387207, "Pretrain/Step": 148, "Pretrain/Step Time": 7.915043329820037} +{"Pretrain/Learning Rate": 2.6048951048951047e-05, "Pretrain/Loss": 2.244783878326416, "Pretrain/Loss (Raw)": 2.3035430908203125, "Pretrain/Step": 149, "Pretrain/Step Time": 7.91802741587162} +{"Pretrain/Learning Rate": 2.6223776223776224e-05, "Pretrain/Loss": 2.2440643310546875, "Pretrain/Loss (Raw)": 2.2096450328826904, "Pretrain/Step": 150, "Pretrain/Step Time": 7.9252060148864985} +{"Pretrain/Learning Rate": 2.6398601398601404e-05, "Pretrain/Loss": 2.2402682304382324, "Pretrain/Loss (Raw)": 2.0603232383728027, "Pretrain/Step": 151, "Pretrain/Step Time": 7.928829254582524} +{"Pretrain/Learning Rate": 2.6573426573426574e-05, "Pretrain/Loss": 2.2379486560821533, "Pretrain/Loss (Raw)": 2.229736804962158, "Pretrain/Step": 152, "Pretrain/Step Time": 7.932788606733084} +{"Pretrain/Learning Rate": 2.674825174825175e-05, "Pretrain/Loss": 2.233670949935913, "Pretrain/Loss (Raw)": 1.981695532798767, "Pretrain/Step": 153, "Pretrain/Step Time": 7.942671742290258} +{"Pretrain/Learning Rate": 2.6923076923076923e-05, "Pretrain/Loss": 2.2307229042053223, "Pretrain/Loss (Raw)": 2.2686734199523926, "Pretrain/Step": 154, "Pretrain/Step Time": 7.94517987780273} +{"Pretrain/Learning Rate": 2.70979020979021e-05, "Pretrain/Loss": 2.2264180183410645, "Pretrain/Loss (Raw)": 2.17683744430542, "Pretrain/Step": 155, "Pretrain/Step Time": 7.942617446184158} +{"Pretrain/Learning Rate": 2.7272727272727273e-05, "Pretrain/Loss": 2.2263917922973633, "Pretrain/Loss (Raw)": 2.2071378231048584, "Pretrain/Step": 156, "Pretrain/Step Time": 7.947725899517536} +{"Pretrain/Learning Rate": 2.744755244755245e-05, "Pretrain/Loss": 2.2252063751220703, "Pretrain/Loss (Raw)": 2.0953431129455566, "Pretrain/Step": 157, "Pretrain/Step Time": 7.949966115877032} +{"Pretrain/Learning Rate": 2.762237762237762e-05, "Pretrain/Loss": 2.2241921424865723, "Pretrain/Loss (Raw)": 2.1150426864624023, "Pretrain/Step": 158, "Pretrain/Step Time": 7.953859830275178} +{"Pretrain/Learning Rate": 2.77972027972028e-05, "Pretrain/Loss": 2.223588705062866, "Pretrain/Loss (Raw)": 2.128117084503174, "Pretrain/Step": 159, "Pretrain/Step Time": 7.955424748361111} +{"Pretrain/Learning Rate": 2.7972027972027976e-05, "Pretrain/Loss": 2.2245917320251465, "Pretrain/Loss (Raw)": 2.3140194416046143, "Pretrain/Step": 160, "Pretrain/Step Time": 7.955417050048709} +{"Pretrain/Learning Rate": 2.8146853146853146e-05, "Pretrain/Loss": 2.228545904159546, "Pretrain/Loss (Raw)": 2.8651340007781982, "Pretrain/Step": 161, "Pretrain/Step Time": 7.963545443490148} +{"Pretrain/Learning Rate": 2.8321678321678326e-05, "Pretrain/Loss": 2.2294633388519287, "Pretrain/Loss (Raw)": 2.3111228942871094, "Pretrain/Step": 162, "Pretrain/Step Time": 7.968349160626531} +{"Pretrain/Learning Rate": 2.8496503496503496e-05, "Pretrain/Loss": 2.229663848876953, "Pretrain/Loss (Raw)": 2.2006871700286865, "Pretrain/Step": 163, "Pretrain/Step Time": 7.964472511783242} +{"Pretrain/Learning Rate": 2.8671328671328672e-05, "Pretrain/Loss": 2.228600025177002, "Pretrain/Loss (Raw)": 2.1591596603393555, "Pretrain/Step": 164, "Pretrain/Step Time": 7.96856627240777} +{"Pretrain/Learning Rate": 2.8846153846153845e-05, "Pretrain/Loss": 2.2273271083831787, "Pretrain/Loss (Raw)": 2.2394981384277344, "Pretrain/Step": 165, "Pretrain/Step Time": 7.965479435399175} +{"Pretrain/Learning Rate": 2.9020979020979022e-05, "Pretrain/Loss": 2.227731704711914, "Pretrain/Loss (Raw)": 2.1637167930603027, "Pretrain/Step": 166, "Pretrain/Step Time": 7.969658426940441} +{"Pretrain/Learning Rate": 2.91958041958042e-05, "Pretrain/Loss": 2.227815628051758, "Pretrain/Loss (Raw)": 2.3080763816833496, "Pretrain/Step": 167, "Pretrain/Step Time": 7.97121049836278} +{"Pretrain/Learning Rate": 2.9370629370629372e-05, "Pretrain/Loss": 2.229994058609009, "Pretrain/Loss (Raw)": 2.522524118423462, "Pretrain/Step": 168, "Pretrain/Step Time": 7.971193574368954} +{"Pretrain/Learning Rate": 2.954545454545455e-05, "Pretrain/Loss": 2.2304067611694336, "Pretrain/Loss (Raw)": 2.429457664489746, "Pretrain/Step": 169, "Pretrain/Step Time": 7.985640665516257} +{"Pretrain/Learning Rate": 2.972027972027972e-05, "Pretrain/Loss": 2.2311935424804688, "Pretrain/Loss (Raw)": 2.2062621116638184, "Pretrain/Step": 170, "Pretrain/Step Time": 7.990438144654036} +{"Pretrain/Learning Rate": 2.9895104895104898e-05, "Pretrain/Loss": 2.2317566871643066, "Pretrain/Loss (Raw)": 2.267676591873169, "Pretrain/Step": 171, "Pretrain/Step Time": 7.993559844791889} +{"Pretrain/Learning Rate": 3.0069930069930068e-05, "Pretrain/Loss": 2.230510711669922, "Pretrain/Loss (Raw)": 2.3564136028289795, "Pretrain/Step": 172, "Pretrain/Step Time": 8.003391837701201} +{"Pretrain/Learning Rate": 3.0244755244755245e-05, "Pretrain/Loss": 2.230271577835083, "Pretrain/Loss (Raw)": 2.140651226043701, "Pretrain/Step": 173, "Pretrain/Step Time": 8.011209581047297} +{"Pretrain/Learning Rate": 3.0419580419580425e-05, "Pretrain/Loss": 2.2311038970947266, "Pretrain/Loss (Raw)": 2.4204025268554688, "Pretrain/Step": 174, "Pretrain/Step Time": 8.014093978330493} +{"Pretrain/Learning Rate": 3.0594405594405594e-05, "Pretrain/Loss": 2.230008602142334, "Pretrain/Loss (Raw)": 2.3352224826812744, "Pretrain/Step": 175, "Pretrain/Step Time": 8.013295117765665} +{"Pretrain/Learning Rate": 3.0769230769230774e-05, "Pretrain/Loss": 2.2305097579956055, "Pretrain/Loss (Raw)": 2.274979829788208, "Pretrain/Step": 176, "Pretrain/Step Time": 8.015647988766432} +{"Pretrain/Learning Rate": 3.094405594405594e-05, "Pretrain/Loss": 2.230487823486328, "Pretrain/Loss (Raw)": 2.163409471511841, "Pretrain/Step": 177, "Pretrain/Step Time": 8.02011350914836} +{"Pretrain/Learning Rate": 3.111888111888112e-05, "Pretrain/Loss": 2.2299623489379883, "Pretrain/Loss (Raw)": 2.160259962081909, "Pretrain/Step": 178, "Pretrain/Step Time": 8.01963804103434} +{"Pretrain/Learning Rate": 3.1293706293706294e-05, "Pretrain/Loss": 2.2295308113098145, "Pretrain/Loss (Raw)": 2.2652359008789062, "Pretrain/Step": 179, "Pretrain/Step Time": 8.019937982782722} +{"Pretrain/Learning Rate": 3.146853146853147e-05, "Pretrain/Loss": 2.2316629886627197, "Pretrain/Loss (Raw)": 2.464233160018921, "Pretrain/Step": 180, "Pretrain/Step Time": 8.026144780218601} +{"Pretrain/Learning Rate": 3.164335664335665e-05, "Pretrain/Loss": 2.2315621376037598, "Pretrain/Loss (Raw)": 2.1680846214294434, "Pretrain/Step": 181, "Pretrain/Step Time": 8.031643724069} +{"Pretrain/Learning Rate": 3.181818181818182e-05, "Pretrain/Loss": 2.2321722507476807, "Pretrain/Loss (Raw)": 2.205495834350586, "Pretrain/Step": 182, "Pretrain/Step Time": 8.03409700281918} +{"Pretrain/Learning Rate": 3.1993006993006994e-05, "Pretrain/Loss": 2.2332658767700195, "Pretrain/Loss (Raw)": 2.2024972438812256, "Pretrain/Step": 183, "Pretrain/Step Time": 8.037169901654124} +{"Pretrain/Learning Rate": 3.216783216783217e-05, "Pretrain/Loss": 2.234804630279541, "Pretrain/Loss (Raw)": 2.218524932861328, "Pretrain/Step": 184, "Pretrain/Step Time": 8.031143872067332} +{"Pretrain/Learning Rate": 3.234265734265735e-05, "Pretrain/Loss": 2.236867666244507, "Pretrain/Loss (Raw)": 2.596611499786377, "Pretrain/Step": 185, "Pretrain/Step Time": 8.039476895704865} +{"Pretrain/Learning Rate": 3.251748251748252e-05, "Pretrain/Loss": 2.2379097938537598, "Pretrain/Loss (Raw)": 2.218022108078003, "Pretrain/Step": 186, "Pretrain/Step Time": 8.037759171798825} +{"Pretrain/Learning Rate": 3.269230769230769e-05, "Pretrain/Loss": 2.238203525543213, "Pretrain/Loss (Raw)": 2.154484510421753, "Pretrain/Step": 187, "Pretrain/Step Time": 8.036490466445684} +{"Pretrain/Learning Rate": 3.2867132867132866e-05, "Pretrain/Loss": 2.237123489379883, "Pretrain/Loss (Raw)": 2.1766817569732666, "Pretrain/Step": 188, "Pretrain/Step Time": 8.047259060665965} +{"Pretrain/Learning Rate": 3.3041958041958046e-05, "Pretrain/Loss": 2.236279249191284, "Pretrain/Loss (Raw)": 2.1000101566314697, "Pretrain/Step": 189, "Pretrain/Step Time": 8.05038519948721} +{"Pretrain/Learning Rate": 3.321678321678322e-05, "Pretrain/Loss": 2.2368626594543457, "Pretrain/Loss (Raw)": 2.335108518600464, "Pretrain/Step": 190, "Pretrain/Step Time": 8.058486927300692} +{"Pretrain/Learning Rate": 3.339160839160839e-05, "Pretrain/Loss": 2.236570358276367, "Pretrain/Loss (Raw)": 2.0519256591796875, "Pretrain/Step": 191, "Pretrain/Step Time": 8.060850758105516} +{"Pretrain/Learning Rate": 3.356643356643357e-05, "Pretrain/Loss": 2.2378461360931396, "Pretrain/Loss (Raw)": 2.3735861778259277, "Pretrain/Step": 192, "Pretrain/Step Time": 8.064707038924098} +{"Pretrain/Learning Rate": 3.374125874125874e-05, "Pretrain/Loss": 2.238269329071045, "Pretrain/Loss (Raw)": 2.2267086505889893, "Pretrain/Step": 193, "Pretrain/Step Time": 8.07437290623784} +{"Pretrain/Learning Rate": 3.391608391608392e-05, "Pretrain/Loss": 2.237271785736084, "Pretrain/Loss (Raw)": 2.1127266883850098, "Pretrain/Step": 194, "Pretrain/Step Time": 8.074532322585583} +{"Pretrain/Learning Rate": 3.409090909090909e-05, "Pretrain/Loss": 2.237102508544922, "Pretrain/Loss (Raw)": 2.178969383239746, "Pretrain/Step": 195, "Pretrain/Step Time": 8.078992169350386} +{"Pretrain/Learning Rate": 3.4265734265734265e-05, "Pretrain/Loss": 2.2366957664489746, "Pretrain/Loss (Raw)": 2.2074739933013916, "Pretrain/Step": 196, "Pretrain/Step Time": 8.080507572740316} +{"Pretrain/Learning Rate": 3.4440559440559445e-05, "Pretrain/Loss": 2.235290050506592, "Pretrain/Loss (Raw)": 2.0591044425964355, "Pretrain/Step": 197, "Pretrain/Step Time": 8.081869255751371} +{"Pretrain/Learning Rate": 3.461538461538462e-05, "Pretrain/Loss": 2.235879421234131, "Pretrain/Loss (Raw)": 2.25834321975708, "Pretrain/Step": 198, "Pretrain/Step Time": 8.089990893378854} +{"Pretrain/Learning Rate": 3.479020979020979e-05, "Pretrain/Loss": 2.2362780570983887, "Pretrain/Loss (Raw)": 2.2718091011047363, "Pretrain/Step": 199, "Pretrain/Step Time": 8.094857653602958} +{"Pretrain/Learning Rate": 3.4965034965034965e-05, "Pretrain/Loss": 2.2364959716796875, "Pretrain/Loss (Raw)": 2.3027539253234863, "Pretrain/Step": 200, "Pretrain/Step Time": 8.097339518368244} +{"Pretrain/Learning Rate": 3.5139860139860145e-05, "Pretrain/Loss": 2.236598491668701, "Pretrain/Loss (Raw)": 2.223703145980835, "Pretrain/Step": 201, "Pretrain/Step Time": 8.101418558508158} +{"Pretrain/Learning Rate": 3.531468531468531e-05, "Pretrain/Loss": 2.236924886703491, "Pretrain/Loss (Raw)": 2.2485454082489014, "Pretrain/Step": 202, "Pretrain/Step Time": 8.103456191718578} +{"Pretrain/Learning Rate": 3.548951048951049e-05, "Pretrain/Loss": 2.234067916870117, "Pretrain/Loss (Raw)": 2.112954616546631, "Pretrain/Step": 203, "Pretrain/Step Time": 8.096588391810656} +{"Pretrain/Learning Rate": 3.566433566433567e-05, "Pretrain/Loss": 2.2356128692626953, "Pretrain/Loss (Raw)": 2.386667251586914, "Pretrain/Step": 204, "Pretrain/Step Time": 8.095064530149102} +{"Pretrain/Learning Rate": 3.583916083916084e-05, "Pretrain/Loss": 2.2353782653808594, "Pretrain/Loss (Raw)": 2.163235902786255, "Pretrain/Step": 205, "Pretrain/Step Time": 8.09823371656239} +{"Pretrain/Learning Rate": 3.601398601398602e-05, "Pretrain/Loss": 2.2344777584075928, "Pretrain/Loss (Raw)": 2.117563009262085, "Pretrain/Step": 206, "Pretrain/Step Time": 8.082460828125477} +{"Pretrain/Learning Rate": 3.618881118881119e-05, "Pretrain/Loss": 2.2344412803649902, "Pretrain/Loss (Raw)": 2.0668983459472656, "Pretrain/Step": 207, "Pretrain/Step Time": 8.08538307249546} +{"Pretrain/Learning Rate": 3.6363636363636364e-05, "Pretrain/Loss": 2.233112335205078, "Pretrain/Loss (Raw)": 2.3050527572631836, "Pretrain/Step": 208, "Pretrain/Step Time": 8.069754753261805} +{"Pretrain/Learning Rate": 3.653846153846154e-05, "Pretrain/Loss": 2.2335891723632812, "Pretrain/Loss (Raw)": 2.2780189514160156, "Pretrain/Step": 209, "Pretrain/Step Time": 8.070277363061905} +{"Pretrain/Learning Rate": 3.671328671328672e-05, "Pretrain/Loss": 2.234358310699463, "Pretrain/Loss (Raw)": 2.246306896209717, "Pretrain/Step": 210, "Pretrain/Step Time": 8.067379182204604} +{"Pretrain/Learning Rate": 3.688811188811189e-05, "Pretrain/Loss": 2.233132839202881, "Pretrain/Loss (Raw)": 2.1751232147216797, "Pretrain/Step": 211, "Pretrain/Step Time": 8.068842224776745} +{"Pretrain/Learning Rate": 3.7062937062937064e-05, "Pretrain/Loss": 2.235276937484741, "Pretrain/Loss (Raw)": 2.430032253265381, "Pretrain/Step": 212, "Pretrain/Step Time": 8.068392926827073} +{"Pretrain/Learning Rate": 3.7237762237762244e-05, "Pretrain/Loss": 2.2348291873931885, "Pretrain/Loss (Raw)": 2.254033327102661, "Pretrain/Step": 213, "Pretrain/Step Time": 8.06992626003921} +{"Pretrain/Learning Rate": 3.741258741258741e-05, "Pretrain/Loss": 2.2348170280456543, "Pretrain/Loss (Raw)": 2.27919602394104, "Pretrain/Step": 214, "Pretrain/Step Time": 8.071696756407619} +{"Pretrain/Learning Rate": 3.758741258741259e-05, "Pretrain/Loss": 2.2342441082000732, "Pretrain/Loss (Raw)": 2.150264024734497, "Pretrain/Step": 215, "Pretrain/Step Time": 8.073467928916216} +{"Pretrain/Learning Rate": 3.776223776223776e-05, "Pretrain/Loss": 2.235361099243164, "Pretrain/Loss (Raw)": 2.3186678886413574, "Pretrain/Step": 216, "Pretrain/Step Time": 8.072048941627145} +{"Pretrain/Learning Rate": 3.7937062937062936e-05, "Pretrain/Loss": 2.2336812019348145, "Pretrain/Loss (Raw)": 2.052074432373047, "Pretrain/Step": 217, "Pretrain/Step Time": 8.068919014185667} +{"Pretrain/Learning Rate": 3.811188811188811e-05, "Pretrain/Loss": 2.2351443767547607, "Pretrain/Loss (Raw)": 2.217686176300049, "Pretrain/Step": 218, "Pretrain/Step Time": 8.071616780012846} +{"Pretrain/Learning Rate": 3.828671328671329e-05, "Pretrain/Loss": 2.2349815368652344, "Pretrain/Loss (Raw)": 2.2240893840789795, "Pretrain/Step": 219, "Pretrain/Step Time": 8.072282085195184} +{"Pretrain/Learning Rate": 3.846153846153846e-05, "Pretrain/Loss": 2.2340734004974365, "Pretrain/Loss (Raw)": 2.3142261505126953, "Pretrain/Step": 220, "Pretrain/Step Time": 8.062667023390532} +{"Pretrain/Learning Rate": 3.8636363636363636e-05, "Pretrain/Loss": 2.235474109649658, "Pretrain/Loss (Raw)": 2.3196237087249756, "Pretrain/Step": 221, "Pretrain/Step Time": 8.07266516238451} +{"Pretrain/Learning Rate": 3.8811188811188816e-05, "Pretrain/Loss": 2.2363181114196777, "Pretrain/Loss (Raw)": 2.3184571266174316, "Pretrain/Step": 222, "Pretrain/Step Time": 8.064675187692046} +{"Pretrain/Learning Rate": 3.898601398601399e-05, "Pretrain/Loss": 2.233151912689209, "Pretrain/Loss (Raw)": 2.0225894451141357, "Pretrain/Step": 223, "Pretrain/Step Time": 8.06331011466682} +{"Pretrain/Learning Rate": 3.916083916083916e-05, "Pretrain/Loss": 2.2329297065734863, "Pretrain/Loss (Raw)": 2.1838715076446533, "Pretrain/Step": 224, "Pretrain/Step Time": 8.052124686539173} +{"Pretrain/Learning Rate": 3.9335664335664336e-05, "Pretrain/Loss": 2.2339892387390137, "Pretrain/Loss (Raw)": 2.2295634746551514, "Pretrain/Step": 225, "Pretrain/Step Time": 8.046033158898354} +{"Pretrain/Learning Rate": 3.9510489510489516e-05, "Pretrain/Loss": 2.2354321479797363, "Pretrain/Loss (Raw)": 2.332064151763916, "Pretrain/Step": 226, "Pretrain/Step Time": 8.045347230508924} +{"Pretrain/Learning Rate": 3.968531468531469e-05, "Pretrain/Loss": 2.236377716064453, "Pretrain/Loss (Raw)": 2.35547137260437, "Pretrain/Step": 227, "Pretrain/Step Time": 8.0508096460253} +{"Pretrain/Learning Rate": 3.986013986013986e-05, "Pretrain/Loss": 2.2357771396636963, "Pretrain/Loss (Raw)": 2.122171401977539, "Pretrain/Step": 228, "Pretrain/Step Time": 8.056942604482174} +{"Pretrain/Learning Rate": 4.0034965034965035e-05, "Pretrain/Loss": 2.234661340713501, "Pretrain/Loss (Raw)": 2.283118724822998, "Pretrain/Step": 229, "Pretrain/Step Time": 8.055795030668378} +{"Pretrain/Learning Rate": 4.020979020979021e-05, "Pretrain/Loss": 2.233971118927002, "Pretrain/Loss (Raw)": 2.2184505462646484, "Pretrain/Step": 230, "Pretrain/Step Time": 8.063337661325932} +{"Pretrain/Learning Rate": 4.038461538461539e-05, "Pretrain/Loss": 2.2344608306884766, "Pretrain/Loss (Raw)": 2.2418971061706543, "Pretrain/Step": 231, "Pretrain/Step Time": 8.054267942905426} +{"Pretrain/Learning Rate": 4.055944055944056e-05, "Pretrain/Loss": 2.23470401763916, "Pretrain/Loss (Raw)": 2.285910129547119, "Pretrain/Step": 232, "Pretrain/Step Time": 8.062701486051083} +{"Pretrain/Learning Rate": 4.0734265734265735e-05, "Pretrain/Loss": 2.235414505004883, "Pretrain/Loss (Raw)": 2.3786888122558594, "Pretrain/Step": 233, "Pretrain/Step Time": 8.062054734677076} +{"Pretrain/Learning Rate": 4.0909090909090915e-05, "Pretrain/Loss": 2.235593795776367, "Pretrain/Loss (Raw)": 2.2221453189849854, "Pretrain/Step": 234, "Pretrain/Step Time": 8.062570350244641} +{"Pretrain/Learning Rate": 4.108391608391609e-05, "Pretrain/Loss": 2.235562562942505, "Pretrain/Loss (Raw)": 2.16428279876709, "Pretrain/Step": 235, "Pretrain/Step Time": 8.056922620162368} +{"Pretrain/Learning Rate": 4.125874125874126e-05, "Pretrain/Loss": 2.2364161014556885, "Pretrain/Loss (Raw)": 2.4004647731781006, "Pretrain/Step": 236, "Pretrain/Step Time": 8.063176676630974} +{"Pretrain/Learning Rate": 4.1433566433566434e-05, "Pretrain/Loss": 2.2354276180267334, "Pretrain/Loss (Raw)": 2.2007157802581787, "Pretrain/Step": 237, "Pretrain/Step Time": 8.064515819773078} +{"Pretrain/Learning Rate": 4.1608391608391614e-05, "Pretrain/Loss": 2.235062599182129, "Pretrain/Loss (Raw)": 2.1843466758728027, "Pretrain/Step": 238, "Pretrain/Step Time": 8.059724520891905} +{"Pretrain/Learning Rate": 4.178321678321678e-05, "Pretrain/Loss": 2.2362399101257324, "Pretrain/Loss (Raw)": 2.408350706100464, "Pretrain/Step": 239, "Pretrain/Step Time": 8.061279840767384} +{"Pretrain/Learning Rate": 4.195804195804196e-05, "Pretrain/Loss": 2.236605644226074, "Pretrain/Loss (Raw)": 2.2988600730895996, "Pretrain/Step": 240, "Pretrain/Step Time": 8.051335705444217} +{"Pretrain/Learning Rate": 4.213286713286714e-05, "Pretrain/Loss": 2.232949733734131, "Pretrain/Loss (Raw)": 2.0611722469329834, "Pretrain/Step": 241, "Pretrain/Step Time": 8.05210598744452} +{"Pretrain/Learning Rate": 4.230769230769231e-05, "Pretrain/Loss": 2.233130931854248, "Pretrain/Loss (Raw)": 2.1608612537384033, "Pretrain/Step": 242, "Pretrain/Step Time": 8.05664455331862} +{"Pretrain/Learning Rate": 4.248251748251749e-05, "Pretrain/Loss": 2.234335422515869, "Pretrain/Loss (Raw)": 2.265507936477661, "Pretrain/Step": 243, "Pretrain/Step Time": 8.046209808439016} +{"Pretrain/Learning Rate": 4.265734265734266e-05, "Pretrain/Loss": 2.2353153228759766, "Pretrain/Loss (Raw)": 2.4286653995513916, "Pretrain/Step": 244, "Pretrain/Step Time": 8.044826477766037} +{"Pretrain/Learning Rate": 4.2832167832167833e-05, "Pretrain/Loss": 2.234959840774536, "Pretrain/Loss (Raw)": 2.171046018600464, "Pretrain/Step": 245, "Pretrain/Step Time": 8.04296763241291} +{"Pretrain/Learning Rate": 4.300699300699301e-05, "Pretrain/Loss": 2.236125946044922, "Pretrain/Loss (Raw)": 2.2078845500946045, "Pretrain/Step": 246, "Pretrain/Step Time": 8.050420010462403} +{"Pretrain/Learning Rate": 4.318181818181819e-05, "Pretrain/Loss": 2.23459529876709, "Pretrain/Loss (Raw)": 2.0555624961853027, "Pretrain/Step": 247, "Pretrain/Step Time": 8.055577024817467} +{"Pretrain/Learning Rate": 4.335664335664335e-05, "Pretrain/Loss": 2.2362546920776367, "Pretrain/Loss (Raw)": 2.25502872467041, "Pretrain/Step": 248, "Pretrain/Step Time": 8.049194939434528} +{"Pretrain/Learning Rate": 4.353146853146853e-05, "Pretrain/Loss": 2.2356784343719482, "Pretrain/Loss (Raw)": 2.2830026149749756, "Pretrain/Step": 249, "Pretrain/Step Time": 8.054760800674558} +{"Pretrain/Learning Rate": 4.370629370629371e-05, "Pretrain/Loss": 2.234468698501587, "Pretrain/Loss (Raw)": 2.118302822113037, "Pretrain/Step": 250, "Pretrain/Step Time": 8.047900328412652} +{"Pretrain/Learning Rate": 4.388111888111888e-05, "Pretrain/Loss": 2.2333202362060547, "Pretrain/Loss (Raw)": 2.0515592098236084, "Pretrain/Step": 251, "Pretrain/Step Time": 8.058158477768302} +{"Pretrain/Learning Rate": 4.405594405594406e-05, "Pretrain/Loss": 2.231539249420166, "Pretrain/Loss (Raw)": 2.075897693634033, "Pretrain/Step": 252, "Pretrain/Step Time": 8.05409892462194} +{"Pretrain/Learning Rate": 4.423076923076923e-05, "Pretrain/Loss": 2.2295949459075928, "Pretrain/Loss (Raw)": 2.2104828357696533, "Pretrain/Step": 253, "Pretrain/Step Time": 8.058936443179846} +{"Pretrain/Learning Rate": 4.4405594405594406e-05, "Pretrain/Loss": 2.2286674976348877, "Pretrain/Loss (Raw)": 2.046437978744507, "Pretrain/Step": 254, "Pretrain/Step Time": 8.057421993464231} +{"Pretrain/Learning Rate": 4.458041958041958e-05, "Pretrain/Loss": 2.227391481399536, "Pretrain/Loss (Raw)": 2.1100656986236572, "Pretrain/Step": 255, "Pretrain/Step Time": 8.055532587692142} +{"Pretrain/Learning Rate": 4.475524475524476e-05, "Pretrain/Loss": 2.2275431156158447, "Pretrain/Loss (Raw)": 2.1959640979766846, "Pretrain/Step": 256, "Pretrain/Step Time": 8.061805970966816} +{"Pretrain/Learning Rate": 4.493006993006993e-05, "Pretrain/Loss": 2.2256946563720703, "Pretrain/Loss (Raw)": 2.030672550201416, "Pretrain/Step": 257, "Pretrain/Step Time": 8.054129740223289} +{"Pretrain/Learning Rate": 4.5104895104895105e-05, "Pretrain/Loss": 2.225762367248535, "Pretrain/Loss (Raw)": 2.1840059757232666, "Pretrain/Step": 258, "Pretrain/Step Time": 8.054162392392755} +{"Pretrain/Learning Rate": 4.5279720279720285e-05, "Pretrain/Loss": 2.226297378540039, "Pretrain/Loss (Raw)": 2.244960308074951, "Pretrain/Step": 259, "Pretrain/Step Time": 8.049617789685726} +{"Pretrain/Learning Rate": 4.545454545454546e-05, "Pretrain/Loss": 2.226560592651367, "Pretrain/Loss (Raw)": 2.185807228088379, "Pretrain/Step": 260, "Pretrain/Step Time": 8.052513042464852} +{"Pretrain/Learning Rate": 4.562937062937063e-05, "Pretrain/Loss": 2.227125644683838, "Pretrain/Loss (Raw)": 2.1148972511291504, "Pretrain/Step": 261, "Pretrain/Step Time": 8.054996179416776} +{"Pretrain/Learning Rate": 4.5804195804195805e-05, "Pretrain/Loss": 2.2256479263305664, "Pretrain/Loss (Raw)": 2.0978410243988037, "Pretrain/Step": 262, "Pretrain/Step Time": 8.040004154667258} +{"Pretrain/Learning Rate": 4.597902097902098e-05, "Pretrain/Loss": 2.22576904296875, "Pretrain/Loss (Raw)": 2.2106335163116455, "Pretrain/Step": 263, "Pretrain/Step Time": 8.035961102694273} +{"Pretrain/Learning Rate": 4.615384615384616e-05, "Pretrain/Loss": 2.226400852203369, "Pretrain/Loss (Raw)": 2.234321355819702, "Pretrain/Step": 264, "Pretrain/Step Time": 8.038069920614362} +{"Pretrain/Learning Rate": 4.632867132867133e-05, "Pretrain/Loss": 2.2253947257995605, "Pretrain/Loss (Raw)": 2.196389675140381, "Pretrain/Step": 265, "Pretrain/Step Time": 8.039494873955846} +{"Pretrain/Learning Rate": 4.6503496503496505e-05, "Pretrain/Loss": 2.2256712913513184, "Pretrain/Loss (Raw)": 2.187079429626465, "Pretrain/Step": 266, "Pretrain/Step Time": 8.04673925228417} +{"Pretrain/Learning Rate": 4.667832167832168e-05, "Pretrain/Loss": 2.2284326553344727, "Pretrain/Loss (Raw)": 2.4024972915649414, "Pretrain/Step": 267, "Pretrain/Step Time": 8.044654849916697} +{"Pretrain/Learning Rate": 4.685314685314686e-05, "Pretrain/Loss": 2.2289061546325684, "Pretrain/Loss (Raw)": 2.398815631866455, "Pretrain/Step": 268, "Pretrain/Step Time": 8.038600536063313} +{"Pretrain/Learning Rate": 4.702797202797203e-05, "Pretrain/Loss": 2.2287724018096924, "Pretrain/Loss (Raw)": 2.3103830814361572, "Pretrain/Step": 269, "Pretrain/Step Time": 8.048112999647856} +{"Pretrain/Learning Rate": 4.7202797202797204e-05, "Pretrain/Loss": 2.2296066284179688, "Pretrain/Loss (Raw)": 2.1503841876983643, "Pretrain/Step": 270, "Pretrain/Step Time": 8.053927881643176} +{"Pretrain/Learning Rate": 4.7377622377622384e-05, "Pretrain/Loss": 2.228266954421997, "Pretrain/Loss (Raw)": 2.1042635440826416, "Pretrain/Step": 271, "Pretrain/Step Time": 8.055159730836749} +{"Pretrain/Learning Rate": 4.755244755244756e-05, "Pretrain/Loss": 2.229043960571289, "Pretrain/Loss (Raw)": 2.2906911373138428, "Pretrain/Step": 272, "Pretrain/Step Time": 8.051955170929432} +{"Pretrain/Learning Rate": 4.772727272727273e-05, "Pretrain/Loss": 2.228503942489624, "Pretrain/Loss (Raw)": 2.168818950653076, "Pretrain/Step": 273, "Pretrain/Step Time": 8.053078351542354} +{"Pretrain/Learning Rate": 4.7902097902097904e-05, "Pretrain/Loss": 2.229504108428955, "Pretrain/Loss (Raw)": 2.3532328605651855, "Pretrain/Step": 274, "Pretrain/Step Time": 8.052006738260388} +{"Pretrain/Learning Rate": 4.8076923076923084e-05, "Pretrain/Loss": 2.2297658920288086, "Pretrain/Loss (Raw)": 2.1792821884155273, "Pretrain/Step": 275, "Pretrain/Step Time": 8.0602612439543} +{"Pretrain/Learning Rate": 4.825174825174825e-05, "Pretrain/Loss": 2.229555368423462, "Pretrain/Loss (Raw)": 2.142124891281128, "Pretrain/Step": 276, "Pretrain/Step Time": 8.055258493870497} +{"Pretrain/Learning Rate": 4.842657342657343e-05, "Pretrain/Loss": 2.2298083305358887, "Pretrain/Loss (Raw)": 2.33593487739563, "Pretrain/Step": 277, "Pretrain/Step Time": 8.05590533837676} +{"Pretrain/Learning Rate": 4.86013986013986e-05, "Pretrain/Loss": 2.230318546295166, "Pretrain/Loss (Raw)": 2.2749359607696533, "Pretrain/Step": 278, "Pretrain/Step Time": 8.048998242244124} +{"Pretrain/Learning Rate": 4.8776223776223776e-05, "Pretrain/Loss": 2.231740713119507, "Pretrain/Loss (Raw)": 2.242382287979126, "Pretrain/Step": 279, "Pretrain/Step Time": 8.055315876379609} +{"Pretrain/Learning Rate": 4.8951048951048956e-05, "Pretrain/Loss": 2.231863498687744, "Pretrain/Loss (Raw)": 2.245426654815674, "Pretrain/Step": 280, "Pretrain/Step Time": 8.055715693160892} +{"Pretrain/Learning Rate": 4.912587412587413e-05, "Pretrain/Loss": 2.2342400550842285, "Pretrain/Loss (Raw)": 2.285885810852051, "Pretrain/Step": 281, "Pretrain/Step Time": 8.043734759092331} +{"Pretrain/Learning Rate": 4.93006993006993e-05, "Pretrain/Loss": 2.2334938049316406, "Pretrain/Loss (Raw)": 2.1731605529785156, "Pretrain/Step": 282, "Pretrain/Step Time": 8.03960082679987} +{"Pretrain/Learning Rate": 4.9475524475524476e-05, "Pretrain/Loss": 2.2335314750671387, "Pretrain/Loss (Raw)": 2.1816821098327637, "Pretrain/Step": 283, "Pretrain/Step Time": 8.049680098891258} +{"Pretrain/Learning Rate": 4.9650349650349656e-05, "Pretrain/Loss": 2.2334346771240234, "Pretrain/Loss (Raw)": 2.1947145462036133, "Pretrain/Step": 284, "Pretrain/Step Time": 8.05110034160316} +{"Pretrain/Learning Rate": 4.982517482517482e-05, "Pretrain/Loss": 2.2346744537353516, "Pretrain/Loss (Raw)": 2.254074811935425, "Pretrain/Step": 285, "Pretrain/Step Time": 8.05755541101098} +{"Pretrain/Learning Rate": 5e-05, "Pretrain/Loss": 2.23551607131958, "Pretrain/Loss (Raw)": 2.2227413654327393, "Pretrain/Step": 286, "Pretrain/Step Time": 8.055443044751883} +{"Pretrain/Learning Rate": 4.9999998558441094e-05, "Pretrain/Loss": 2.2362632751464844, "Pretrain/Loss (Raw)": 2.223783493041992, "Pretrain/Step": 287, "Pretrain/Step Time": 8.062777044251561} +{"Pretrain/Learning Rate": 4.999999423376456e-05, "Pretrain/Loss": 2.2348361015319824, "Pretrain/Loss (Raw)": 2.131338596343994, "Pretrain/Step": 288, "Pretrain/Step Time": 8.06797069311142} +{"Pretrain/Learning Rate": 4.9999987025970884e-05, "Pretrain/Loss": 2.229933261871338, "Pretrain/Loss (Raw)": 2.2375752925872803, "Pretrain/Step": 289, "Pretrain/Step Time": 8.066059542819858} +{"Pretrain/Learning Rate": 4.99999769350609e-05, "Pretrain/Loss": 2.2300920486450195, "Pretrain/Loss (Raw)": 2.3314077854156494, "Pretrain/Step": 290, "Pretrain/Step Time": 8.060436863452196} +{"Pretrain/Learning Rate": 4.999996396103577e-05, "Pretrain/Loss": 2.230855941772461, "Pretrain/Loss (Raw)": 2.2985031604766846, "Pretrain/Step": 291, "Pretrain/Step Time": 8.063612539321184} +{"Pretrain/Learning Rate": 4.999994810389699e-05, "Pretrain/Loss": 2.231572151184082, "Pretrain/Loss (Raw)": 2.250809907913208, "Pretrain/Step": 292, "Pretrain/Step Time": 8.058250593021512} +{"Pretrain/Learning Rate": 4.999992936364639e-05, "Pretrain/Loss": 2.2307190895080566, "Pretrain/Loss (Raw)": 2.1303346157073975, "Pretrain/Step": 293, "Pretrain/Step Time": 8.060170389711857} +{"Pretrain/Learning Rate": 4.9999907740286136e-05, "Pretrain/Loss": 2.230093479156494, "Pretrain/Loss (Raw)": 2.083646297454834, "Pretrain/Step": 294, "Pretrain/Step Time": 8.061421561986208} +{"Pretrain/Learning Rate": 4.9999883233818724e-05, "Pretrain/Loss": 2.228330612182617, "Pretrain/Loss (Raw)": 2.082425832748413, "Pretrain/Step": 295, "Pretrain/Step Time": 8.057590238749981} +{"Pretrain/Learning Rate": 4.999985584424696e-05, "Pretrain/Loss": 2.2259583473205566, "Pretrain/Loss (Raw)": 2.218867778778076, "Pretrain/Step": 296, "Pretrain/Step Time": 8.064342366531491} +{"Pretrain/Learning Rate": 4.999982557157403e-05, "Pretrain/Loss": 2.2243452072143555, "Pretrain/Loss (Raw)": 2.222968101501465, "Pretrain/Step": 297, "Pretrain/Step Time": 8.050155524164438} +{"Pretrain/Learning Rate": 4.9999792415803405e-05, "Pretrain/Loss": 2.22416353225708, "Pretrain/Loss (Raw)": 2.1829910278320312, "Pretrain/Step": 298, "Pretrain/Step Time": 8.05228284187615} +{"Pretrain/Learning Rate": 4.999975637693892e-05, "Pretrain/Loss": 2.2232203483581543, "Pretrain/Loss (Raw)": 2.146963357925415, "Pretrain/Step": 299, "Pretrain/Step Time": 8.055387888103724} +{"Pretrain/Learning Rate": 4.999971745498472e-05, "Pretrain/Loss": 2.2215559482574463, "Pretrain/Loss (Raw)": 2.1433608531951904, "Pretrain/Step": 300, "Pretrain/Step Time": 8.051011620089412} +{"Pretrain/Learning Rate": 4.999967564994531e-05, "Pretrain/Loss": 2.2223339080810547, "Pretrain/Loss (Raw)": 2.2402596473693848, "Pretrain/Step": 301, "Pretrain/Step Time": 8.041653499007225} +{"Pretrain/Learning Rate": 4.999963096182549e-05, "Pretrain/Loss": 2.219878673553467, "Pretrain/Loss (Raw)": 2.1061346530914307, "Pretrain/Step": 302, "Pretrain/Step Time": 8.040825633332133} +{"Pretrain/Learning Rate": 4.9999583390630435e-05, "Pretrain/Loss": 2.2193665504455566, "Pretrain/Loss (Raw)": 2.269665241241455, "Pretrain/Step": 303, "Pretrain/Step Time": 8.048758704215288} +{"Pretrain/Learning Rate": 4.999953293636562e-05, "Pretrain/Loss": 2.220187187194824, "Pretrain/Loss (Raw)": 2.379987955093384, "Pretrain/Step": 304, "Pretrain/Step Time": 8.047872241586447} +{"Pretrain/Learning Rate": 4.9999479599036856e-05, "Pretrain/Loss": 2.2198891639709473, "Pretrain/Loss (Raw)": 2.12530517578125, "Pretrain/Step": 305, "Pretrain/Step Time": 8.049366852268577} +{"Pretrain/Learning Rate": 4.9999423378650315e-05, "Pretrain/Loss": 2.220057487487793, "Pretrain/Loss (Raw)": 2.1818015575408936, "Pretrain/Step": 306, "Pretrain/Step Time": 8.050616879016161} +{"Pretrain/Learning Rate": 4.9999364275212466e-05, "Pretrain/Loss": 2.218601703643799, "Pretrain/Loss (Raw)": 2.078880548477173, "Pretrain/Step": 307, "Pretrain/Step Time": 8.058963568881154} +{"Pretrain/Learning Rate": 4.9999302288730126e-05, "Pretrain/Loss": 2.2165136337280273, "Pretrain/Loss (Raw)": 2.1969308853149414, "Pretrain/Step": 308, "Pretrain/Step Time": 8.061523407697678} +{"Pretrain/Learning Rate": 4.9999237419210445e-05, "Pretrain/Loss": 2.217175006866455, "Pretrain/Loss (Raw)": 2.252775192260742, "Pretrain/Step": 309, "Pretrain/Step Time": 8.054753623902798} +{"Pretrain/Learning Rate": 4.99991696666609e-05, "Pretrain/Loss": 2.216940402984619, "Pretrain/Loss (Raw)": 2.175457239151001, "Pretrain/Step": 310, "Pretrain/Step Time": 8.06078041344881} +{"Pretrain/Learning Rate": 4.999909903108932e-05, "Pretrain/Loss": 2.216033935546875, "Pretrain/Loss (Raw)": 2.086452007293701, "Pretrain/Step": 311, "Pretrain/Step Time": 8.0568329654634} +{"Pretrain/Learning Rate": 4.999902551250384e-05, "Pretrain/Loss": 2.2149572372436523, "Pretrain/Loss (Raw)": 2.080704689025879, "Pretrain/Step": 312, "Pretrain/Step Time": 8.058758748695254} +{"Pretrain/Learning Rate": 4.999894911091293e-05, "Pretrain/Loss": 2.212143898010254, "Pretrain/Loss (Raw)": 2.23652982711792, "Pretrain/Step": 313, "Pretrain/Step Time": 8.053199475631118} +{"Pretrain/Learning Rate": 4.999886982632541e-05, "Pretrain/Loss": 2.212125778198242, "Pretrain/Loss (Raw)": 2.2156848907470703, "Pretrain/Step": 314, "Pretrain/Step Time": 8.057986877858639} +{"Pretrain/Learning Rate": 4.999878765875042e-05, "Pretrain/Loss": 2.214221715927124, "Pretrain/Loss (Raw)": 2.4227566719055176, "Pretrain/Step": 315, "Pretrain/Step Time": 8.059115746989846} +{"Pretrain/Learning Rate": 4.999870260819745e-05, "Pretrain/Loss": 2.2146501541137695, "Pretrain/Loss (Raw)": 2.231550693511963, "Pretrain/Step": 316, "Pretrain/Step Time": 8.05167449824512} +{"Pretrain/Learning Rate": 4.999861467467629e-05, "Pretrain/Loss": 2.215254783630371, "Pretrain/Loss (Raw)": 2.177381992340088, "Pretrain/Step": 317, "Pretrain/Step Time": 8.052718972787261} +{"Pretrain/Learning Rate": 4.9998523858197094e-05, "Pretrain/Loss": 2.2145700454711914, "Pretrain/Loss (Raw)": 2.247474193572998, "Pretrain/Step": 318, "Pretrain/Step Time": 8.046191090717912} +{"Pretrain/Learning Rate": 4.999843015877032e-05, "Pretrain/Loss": 2.2150416374206543, "Pretrain/Loss (Raw)": 2.1122944355010986, "Pretrain/Step": 319, "Pretrain/Step Time": 8.054454039782286} +{"Pretrain/Learning Rate": 4.99983335764068e-05, "Pretrain/Loss": 2.213552236557007, "Pretrain/Loss (Raw)": 2.182935953140259, "Pretrain/Step": 320, "Pretrain/Step Time": 8.050267046317458} +{"Pretrain/Learning Rate": 4.999823411111765e-05, "Pretrain/Loss": 2.2131271362304688, "Pretrain/Loss (Raw)": 2.1722991466522217, "Pretrain/Step": 321, "Pretrain/Step Time": 8.044201374053955} +{"Pretrain/Learning Rate": 4.999813176291433e-05, "Pretrain/Loss": 2.213470220565796, "Pretrain/Loss (Raw)": 2.1566574573516846, "Pretrain/Step": 322, "Pretrain/Step Time": 8.051040600985289} +{"Pretrain/Learning Rate": 4.999802653180868e-05, "Pretrain/Loss": 2.213672399520874, "Pretrain/Loss (Raw)": 2.2048089504241943, "Pretrain/Step": 323, "Pretrain/Step Time": 8.045480037108064} +{"Pretrain/Learning Rate": 4.9997918417812805e-05, "Pretrain/Loss": 2.2134337425231934, "Pretrain/Loss (Raw)": 2.1769556999206543, "Pretrain/Step": 324, "Pretrain/Step Time": 8.055071221664548} +{"Pretrain/Learning Rate": 4.999780742093919e-05, "Pretrain/Loss": 2.213973045349121, "Pretrain/Loss (Raw)": 2.1281261444091797, "Pretrain/Step": 325, "Pretrain/Step Time": 8.05218249745667} +{"Pretrain/Learning Rate": 4.999769354120063e-05, "Pretrain/Loss": 2.213573455810547, "Pretrain/Loss (Raw)": 2.2071712017059326, "Pretrain/Step": 326, "Pretrain/Step Time": 8.051994821056724} +{"Pretrain/Learning Rate": 4.9997576778610254e-05, "Pretrain/Loss": 2.2122769355773926, "Pretrain/Loss (Raw)": 2.105867385864258, "Pretrain/Step": 327, "Pretrain/Step Time": 8.056887429207563} +{"Pretrain/Learning Rate": 4.999745713318154e-05, "Pretrain/Loss": 2.2114224433898926, "Pretrain/Loss (Raw)": 2.1933581829071045, "Pretrain/Step": 328, "Pretrain/Step Time": 8.049233233556151} +{"Pretrain/Learning Rate": 4.999733460492826e-05, "Pretrain/Loss": 2.2109131813049316, "Pretrain/Loss (Raw)": 2.1585326194763184, "Pretrain/Step": 329, "Pretrain/Step Time": 8.053010273724794} +{"Pretrain/Learning Rate": 4.999720919386457e-05, "Pretrain/Loss": 2.209174633026123, "Pretrain/Loss (Raw)": 2.0260508060455322, "Pretrain/Step": 330, "Pretrain/Step Time": 8.049487179145217} +{"Pretrain/Learning Rate": 4.999708090000493e-05, "Pretrain/Loss": 2.2088217735290527, "Pretrain/Loss (Raw)": 2.067746162414551, "Pretrain/Step": 331, "Pretrain/Step Time": 8.056282870471478} +{"Pretrain/Learning Rate": 4.999694972336413e-05, "Pretrain/Loss": 2.206923484802246, "Pretrain/Loss (Raw)": 2.143690824508667, "Pretrain/Step": 332, "Pretrain/Step Time": 8.060101399198174} +{"Pretrain/Learning Rate": 4.9996815663957296e-05, "Pretrain/Loss": 2.2067532539367676, "Pretrain/Loss (Raw)": 2.1414270401000977, "Pretrain/Step": 333, "Pretrain/Step Time": 8.061454897746444} +{"Pretrain/Learning Rate": 4.9996678721799893e-05, "Pretrain/Loss": 2.207033157348633, "Pretrain/Loss (Raw)": 2.1534266471862793, "Pretrain/Step": 334, "Pretrain/Step Time": 8.059062954038382} +{"Pretrain/Learning Rate": 4.999653889690771e-05, "Pretrain/Loss": 2.20761775970459, "Pretrain/Loss (Raw)": 2.141706943511963, "Pretrain/Step": 335, "Pretrain/Step Time": 8.055363958701491} +{"Pretrain/Learning Rate": 4.9996396189296865e-05, "Pretrain/Loss": 2.20556640625, "Pretrain/Loss (Raw)": 2.042487144470215, "Pretrain/Step": 336, "Pretrain/Step Time": 8.057020688429475} +{"Pretrain/Learning Rate": 4.999625059898384e-05, "Pretrain/Loss": 2.2050156593322754, "Pretrain/Loss (Raw)": 2.207519054412842, "Pretrain/Step": 337, "Pretrain/Step Time": 8.051084792241454} +{"Pretrain/Learning Rate": 4.99961021259854e-05, "Pretrain/Loss": 2.2052884101867676, "Pretrain/Loss (Raw)": 2.281247854232788, "Pretrain/Step": 338, "Pretrain/Step Time": 8.050762016326189} +{"Pretrain/Learning Rate": 4.999595077031868e-05, "Pretrain/Loss": 2.205070734024048, "Pretrain/Loss (Raw)": 2.1472415924072266, "Pretrain/Step": 339, "Pretrain/Step Time": 8.047734601423144} +{"Pretrain/Learning Rate": 4.9995796532001136e-05, "Pretrain/Loss": 2.2037391662597656, "Pretrain/Loss (Raw)": 2.259587526321411, "Pretrain/Step": 340, "Pretrain/Step Time": 8.048076560720801} +{"Pretrain/Learning Rate": 4.999563941105054e-05, "Pretrain/Loss": 2.203660726547241, "Pretrain/Loss (Raw)": 2.2439963817596436, "Pretrain/Step": 341, "Pretrain/Step Time": 8.049464894458652} +{"Pretrain/Learning Rate": 4.9995479407485035e-05, "Pretrain/Loss": 2.2022933959960938, "Pretrain/Loss (Raw)": 2.1041982173919678, "Pretrain/Step": 342, "Pretrain/Step Time": 8.043431598693132} +{"Pretrain/Learning Rate": 4.9995316521323066e-05, "Pretrain/Loss": 2.2023568153381348, "Pretrain/Loss (Raw)": 2.158332109451294, "Pretrain/Step": 343, "Pretrain/Step Time": 8.041945056989789} +{"Pretrain/Learning Rate": 4.99951507525834e-05, "Pretrain/Loss": 2.202014446258545, "Pretrain/Loss (Raw)": 2.274890422821045, "Pretrain/Step": 344, "Pretrain/Step Time": 8.047222562134266} +{"Pretrain/Learning Rate": 4.999498210128518e-05, "Pretrain/Loss": 2.202500104904175, "Pretrain/Loss (Raw)": 2.1141979694366455, "Pretrain/Step": 345, "Pretrain/Step Time": 8.056734150275588} +{"Pretrain/Learning Rate": 4.9994810567447834e-05, "Pretrain/Loss": 2.2030372619628906, "Pretrain/Loss (Raw)": 2.2864632606506348, "Pretrain/Step": 346, "Pretrain/Step Time": 8.053876552730799} +{"Pretrain/Learning Rate": 4.9994636151091165e-05, "Pretrain/Loss": 2.203896999359131, "Pretrain/Loss (Raw)": 2.334150552749634, "Pretrain/Step": 347, "Pretrain/Step Time": 8.052391063421965} +{"Pretrain/Learning Rate": 4.999445885223527e-05, "Pretrain/Loss": 2.2035470008850098, "Pretrain/Loss (Raw)": 2.2694151401519775, "Pretrain/Step": 348, "Pretrain/Step Time": 8.051754618063569} +{"Pretrain/Learning Rate": 4.99942786709006e-05, "Pretrain/Loss": 2.2045507431030273, "Pretrain/Loss (Raw)": 2.448092222213745, "Pretrain/Step": 349, "Pretrain/Step Time": 8.048379424959421} +{"Pretrain/Learning Rate": 4.999409560710794e-05, "Pretrain/Loss": 2.204066276550293, "Pretrain/Loss (Raw)": 2.25646710395813, "Pretrain/Step": 350, "Pretrain/Step Time": 8.051999021321535} +{"Pretrain/Learning Rate": 4.99939096608784e-05, "Pretrain/Loss": 2.2052266597747803, "Pretrain/Loss (Raw)": 2.1710987091064453, "Pretrain/Step": 351, "Pretrain/Step Time": 8.04448022134602} +{"Pretrain/Learning Rate": 4.999372083223343e-05, "Pretrain/Loss": 2.205410957336426, "Pretrain/Loss (Raw)": 2.207462787628174, "Pretrain/Step": 352, "Pretrain/Step Time": 8.05002212151885} +{"Pretrain/Learning Rate": 4.999352912119478e-05, "Pretrain/Loss": 2.2042462825775146, "Pretrain/Loss (Raw)": 2.0804967880249023, "Pretrain/Step": 353, "Pretrain/Step Time": 8.051285557448864} +{"Pretrain/Learning Rate": 4.999333452778459e-05, "Pretrain/Loss": 2.203596591949463, "Pretrain/Loss (Raw)": 2.2489194869995117, "Pretrain/Step": 354, "Pretrain/Step Time": 8.055480962619185} +{"Pretrain/Learning Rate": 4.999313705202529e-05, "Pretrain/Loss": 2.2014963626861572, "Pretrain/Loss (Raw)": 2.0866305828094482, "Pretrain/Step": 355, "Pretrain/Step Time": 8.051485478878021} +{"Pretrain/Learning Rate": 4.999293669393965e-05, "Pretrain/Loss": 2.20298433303833, "Pretrain/Loss (Raw)": 2.3126258850097656, "Pretrain/Step": 356, "Pretrain/Step Time": 8.051901975646615} +{"Pretrain/Learning Rate": 4.999273345355078e-05, "Pretrain/Loss": 2.203016996383667, "Pretrain/Loss (Raw)": 2.2872819900512695, "Pretrain/Step": 357, "Pretrain/Step Time": 8.046037044376135} +{"Pretrain/Learning Rate": 4.9992527330882125e-05, "Pretrain/Loss": 2.203291416168213, "Pretrain/Loss (Raw)": 2.25358247756958, "Pretrain/Step": 358, "Pretrain/Step Time": 8.041856212541461} +{"Pretrain/Learning Rate": 4.999231832595744e-05, "Pretrain/Loss": 2.2024991512298584, "Pretrain/Loss (Raw)": 2.1404850482940674, "Pretrain/Step": 359, "Pretrain/Step Time": 8.050047254189849} +{"Pretrain/Learning Rate": 4.9992106438800846e-05, "Pretrain/Loss": 2.201883316040039, "Pretrain/Loss (Raw)": 2.2071051597595215, "Pretrain/Step": 360, "Pretrain/Step Time": 8.045216294005513} +{"Pretrain/Learning Rate": 4.999189166943677e-05, "Pretrain/Loss": 2.201341390609741, "Pretrain/Loss (Raw)": 2.3092899322509766, "Pretrain/Step": 361, "Pretrain/Step Time": 8.04494028352201} +{"Pretrain/Learning Rate": 4.999167401788998e-05, "Pretrain/Loss": 2.200697898864746, "Pretrain/Loss (Raw)": 2.139808177947998, "Pretrain/Step": 362, "Pretrain/Step Time": 8.044202173128724} +{"Pretrain/Learning Rate": 4.9991453484185577e-05, "Pretrain/Loss": 2.200878620147705, "Pretrain/Loss (Raw)": 2.1873738765716553, "Pretrain/Step": 363, "Pretrain/Step Time": 8.05475004389882} +{"Pretrain/Learning Rate": 4.999123006834899e-05, "Pretrain/Loss": 2.201353073120117, "Pretrain/Loss (Raw)": 2.461226463317871, "Pretrain/Step": 364, "Pretrain/Step Time": 8.055300269275904} +{"Pretrain/Learning Rate": 4.9991003770405994e-05, "Pretrain/Loss": 2.2019686698913574, "Pretrain/Loss (Raw)": 2.2794978618621826, "Pretrain/Step": 365, "Pretrain/Step Time": 8.04997332394123} +{"Pretrain/Learning Rate": 4.999077459038268e-05, "Pretrain/Loss": 2.2014951705932617, "Pretrain/Loss (Raw)": 2.1237547397613525, "Pretrain/Step": 366, "Pretrain/Step Time": 8.057446897029877} +{"Pretrain/Learning Rate": 4.9990542528305484e-05, "Pretrain/Loss": 2.1998305320739746, "Pretrain/Loss (Raw)": 2.195246458053589, "Pretrain/Step": 367, "Pretrain/Step Time": 8.056007189676166} +{"Pretrain/Learning Rate": 4.999030758420116e-05, "Pretrain/Loss": 2.1990487575531006, "Pretrain/Loss (Raw)": 2.1988186836242676, "Pretrain/Step": 368, "Pretrain/Step Time": 8.058504352346063} +{"Pretrain/Learning Rate": 4.999006975809681e-05, "Pretrain/Loss": 2.199457883834839, "Pretrain/Loss (Raw)": 2.1135571002960205, "Pretrain/Step": 369, "Pretrain/Step Time": 8.058579534292221} +{"Pretrain/Learning Rate": 4.998982905001986e-05, "Pretrain/Loss": 2.199216365814209, "Pretrain/Loss (Raw)": 2.1299424171447754, "Pretrain/Step": 370, "Pretrain/Step Time": 8.055971654132009} +{"Pretrain/Learning Rate": 4.998958545999806e-05, "Pretrain/Loss": 2.196934938430786, "Pretrain/Loss (Raw)": 1.973483681678772, "Pretrain/Step": 371, "Pretrain/Step Time": 8.053688386455178} +{"Pretrain/Learning Rate": 4.998933898805951e-05, "Pretrain/Loss": 2.1951396465301514, "Pretrain/Loss (Raw)": 2.1988637447357178, "Pretrain/Step": 372, "Pretrain/Step Time": 8.057731945067644} +{"Pretrain/Learning Rate": 4.9989089634232645e-05, "Pretrain/Loss": 2.1956140995025635, "Pretrain/Loss (Raw)": 2.231764793395996, "Pretrain/Step": 373, "Pretrain/Step Time": 8.065520565956831} +{"Pretrain/Learning Rate": 4.9988837398546206e-05, "Pretrain/Loss": 2.194514274597168, "Pretrain/Loss (Raw)": 2.067101240158081, "Pretrain/Step": 374, "Pretrain/Step Time": 8.052719939500093} +{"Pretrain/Learning Rate": 4.9988582281029284e-05, "Pretrain/Loss": 2.1965365409851074, "Pretrain/Loss (Raw)": 2.314451217651367, "Pretrain/Step": 375, "Pretrain/Step Time": 8.052567513659596} +{"Pretrain/Learning Rate": 4.998832428171131e-05, "Pretrain/Loss": 2.1963186264038086, "Pretrain/Loss (Raw)": 2.227100133895874, "Pretrain/Step": 376, "Pretrain/Step Time": 8.049040652811527} +{"Pretrain/Learning Rate": 4.998806340062202e-05, "Pretrain/Loss": 2.1959173679351807, "Pretrain/Loss (Raw)": 2.2316532135009766, "Pretrain/Step": 377, "Pretrain/Step Time": 8.047296609729528} +{"Pretrain/Learning Rate": 4.998779963779152e-05, "Pretrain/Loss": 2.196237564086914, "Pretrain/Loss (Raw)": 2.159289836883545, "Pretrain/Step": 378, "Pretrain/Step Time": 8.054965265095234} +{"Pretrain/Learning Rate": 4.998753299325021e-05, "Pretrain/Loss": 2.197739601135254, "Pretrain/Loss (Raw)": 2.243791103363037, "Pretrain/Step": 379, "Pretrain/Step Time": 8.053795032203197} +{"Pretrain/Learning Rate": 4.998726346702886e-05, "Pretrain/Loss": 2.1979825496673584, "Pretrain/Loss (Raw)": 2.1070303916931152, "Pretrain/Step": 380, "Pretrain/Step Time": 8.059285122901201} +{"Pretrain/Learning Rate": 4.998699105915854e-05, "Pretrain/Loss": 2.1981494426727295, "Pretrain/Loss (Raw)": 2.231837272644043, "Pretrain/Step": 381, "Pretrain/Step Time": 8.055380698293447} +{"Pretrain/Learning Rate": 4.9986715769670665e-05, "Pretrain/Loss": 2.1992239952087402, "Pretrain/Loss (Raw)": 2.183979034423828, "Pretrain/Step": 382, "Pretrain/Step Time": 8.05484108813107} +{"Pretrain/Learning Rate": 4.998643759859699e-05, "Pretrain/Loss": 2.1998391151428223, "Pretrain/Loss (Raw)": 2.188778877258301, "Pretrain/Step": 383, "Pretrain/Step Time": 8.06285398826003} +{"Pretrain/Learning Rate": 4.998615654596959e-05, "Pretrain/Loss": 2.2010250091552734, "Pretrain/Loss (Raw)": 2.3477623462677, "Pretrain/Step": 384, "Pretrain/Step Time": 8.054545171558857} +{"Pretrain/Learning Rate": 4.9985872611820885e-05, "Pretrain/Loss": 2.203226089477539, "Pretrain/Loss (Raw)": 2.3124277591705322, "Pretrain/Step": 385, "Pretrain/Step Time": 8.066788235679269} +{"Pretrain/Learning Rate": 4.9985585796183605e-05, "Pretrain/Loss": 2.2040698528289795, "Pretrain/Loss (Raw)": 2.2920117378234863, "Pretrain/Step": 386, "Pretrain/Step Time": 8.062872624024749} +{"Pretrain/Learning Rate": 4.998529609909084e-05, "Pretrain/Loss": 2.203425407409668, "Pretrain/Loss (Raw)": 2.162490129470825, "Pretrain/Step": 387, "Pretrain/Step Time": 8.069517521187663} +{"Pretrain/Learning Rate": 4.998500352057599e-05, "Pretrain/Loss": 2.2037606239318848, "Pretrain/Loss (Raw)": 2.2286994457244873, "Pretrain/Step": 388, "Pretrain/Step Time": 8.067393571138382} +{"Pretrain/Learning Rate": 4.9984708060672805e-05, "Pretrain/Loss": 2.2053487300872803, "Pretrain/Loss (Raw)": 2.3181581497192383, "Pretrain/Step": 389, "Pretrain/Step Time": 8.061730071902275} +{"Pretrain/Learning Rate": 4.9984409719415345e-05, "Pretrain/Loss": 2.2063162326812744, "Pretrain/Loss (Raw)": 2.2216784954071045, "Pretrain/Step": 390, "Pretrain/Step Time": 8.058999072760344} +{"Pretrain/Learning Rate": 4.9984108496838034e-05, "Pretrain/Loss": 2.206132411956787, "Pretrain/Loss (Raw)": 2.187113046646118, "Pretrain/Step": 391, "Pretrain/Step Time": 8.062902530655265} +{"Pretrain/Learning Rate": 4.99838043929756e-05, "Pretrain/Loss": 2.2043750286102295, "Pretrain/Loss (Raw)": 2.009385824203491, "Pretrain/Step": 392, "Pretrain/Step Time": 8.065376041457057} +{"Pretrain/Learning Rate": 4.9983497407863114e-05, "Pretrain/Loss": 2.2045998573303223, "Pretrain/Loss (Raw)": 2.225165605545044, "Pretrain/Step": 393, "Pretrain/Step Time": 8.059884609654546} +{"Pretrain/Learning Rate": 4.9983187541535984e-05, "Pretrain/Loss": 2.2052927017211914, "Pretrain/Loss (Raw)": 2.275761842727661, "Pretrain/Step": 394, "Pretrain/Step Time": 8.059520039707422} +{"Pretrain/Learning Rate": 4.998287479402994e-05, "Pretrain/Loss": 2.205653667449951, "Pretrain/Loss (Raw)": 2.4486851692199707, "Pretrain/Step": 395, "Pretrain/Step Time": 8.05561269260943} +{"Pretrain/Learning Rate": 4.998255916538106e-05, "Pretrain/Loss": 2.2044894695281982, "Pretrain/Loss (Raw)": 2.2498128414154053, "Pretrain/Step": 396, "Pretrain/Step Time": 8.062423124909401} +{"Pretrain/Learning Rate": 4.998224065562572e-05, "Pretrain/Loss": 2.2032828330993652, "Pretrain/Loss (Raw)": 2.1559340953826904, "Pretrain/Step": 397, "Pretrain/Step Time": 8.053631762042642} +{"Pretrain/Learning Rate": 4.998191926480068e-05, "Pretrain/Loss": 2.2042622566223145, "Pretrain/Loss (Raw)": 2.275761127471924, "Pretrain/Step": 398, "Pretrain/Step Time": 8.04611306451261} +{"Pretrain/Learning Rate": 4.998159499294299e-05, "Pretrain/Loss": 2.205826759338379, "Pretrain/Loss (Raw)": 2.304489850997925, "Pretrain/Step": 399, "Pretrain/Step Time": 8.050689958035946} +{"Pretrain/Learning Rate": 4.998126784009005e-05, "Pretrain/Loss": 2.2052884101867676, "Pretrain/Loss (Raw)": 2.221780776977539, "Pretrain/Step": 400, "Pretrain/Step Time": 8.051179226487875} +{"Pretrain/Learning Rate": 4.998093780627958e-05, "Pretrain/Loss": 2.2088375091552734, "Pretrain/Loss (Raw)": 2.6231014728546143, "Pretrain/Step": 401, "Pretrain/Step Time": 8.06421815045178} +{"Pretrain/Learning Rate": 4.9980604891549656e-05, "Pretrain/Loss": 2.208101272583008, "Pretrain/Loss (Raw)": 2.2590348720550537, "Pretrain/Step": 402, "Pretrain/Step Time": 8.064342861995101} +{"Pretrain/Learning Rate": 4.998026909593865e-05, "Pretrain/Loss": 2.2071590423583984, "Pretrain/Loss (Raw)": 2.0586814880371094, "Pretrain/Step": 403, "Pretrain/Step Time": 8.056301763281226} +{"Pretrain/Learning Rate": 4.997993041948531e-05, "Pretrain/Loss": 2.207634925842285, "Pretrain/Loss (Raw)": 2.2029998302459717, "Pretrain/Step": 404, "Pretrain/Step Time": 8.061513436958194} +{"Pretrain/Learning Rate": 4.997958886222869e-05, "Pretrain/Loss": 2.207609176635742, "Pretrain/Loss (Raw)": 2.3326382637023926, "Pretrain/Step": 405, "Pretrain/Step Time": 8.058938844129443} +{"Pretrain/Learning Rate": 4.9979244424208165e-05, "Pretrain/Loss": 2.2069525718688965, "Pretrain/Loss (Raw)": 2.190910577774048, "Pretrain/Step": 406, "Pretrain/Step Time": 8.065968016162515} +{"Pretrain/Learning Rate": 4.997889710546347e-05, "Pretrain/Loss": 2.205575704574585, "Pretrain/Loss (Raw)": 2.0661399364471436, "Pretrain/Step": 407, "Pretrain/Step Time": 8.05753268301487} +{"Pretrain/Learning Rate": 4.9978546906034655e-05, "Pretrain/Loss": 2.2061076164245605, "Pretrain/Loss (Raw)": 2.3135106563568115, "Pretrain/Step": 408, "Pretrain/Step Time": 8.05532991886139} +{"Pretrain/Learning Rate": 4.997819382596212e-05, "Pretrain/Loss": 2.2049174308776855, "Pretrain/Loss (Raw)": 2.133545398712158, "Pretrain/Step": 409, "Pretrain/Step Time": 8.05612881295383} +{"Pretrain/Learning Rate": 4.997783786528656e-05, "Pretrain/Loss": 2.205338954925537, "Pretrain/Loss (Raw)": 2.2271194458007812, "Pretrain/Step": 410, "Pretrain/Step Time": 8.066197210922837} +{"Pretrain/Learning Rate": 4.997747902404904e-05, "Pretrain/Loss": 2.2043704986572266, "Pretrain/Loss (Raw)": 2.0576982498168945, "Pretrain/Step": 411, "Pretrain/Step Time": 8.065805466845632} +{"Pretrain/Learning Rate": 4.997711730229094e-05, "Pretrain/Loss": 2.204305648803711, "Pretrain/Loss (Raw)": 2.1864380836486816, "Pretrain/Step": 412, "Pretrain/Step Time": 8.060893489047885} +{"Pretrain/Learning Rate": 4.9976752700053975e-05, "Pretrain/Loss": 2.2022042274475098, "Pretrain/Loss (Raw)": 1.9850552082061768, "Pretrain/Step": 413, "Pretrain/Step Time": 8.057349763810635} +{"Pretrain/Learning Rate": 4.9976385217380195e-05, "Pretrain/Loss": 2.2002925872802734, "Pretrain/Loss (Raw)": 1.9780504703521729, "Pretrain/Step": 414, "Pretrain/Step Time": 8.055588129907846} +{"Pretrain/Learning Rate": 4.997601485431198e-05, "Pretrain/Loss": 2.2004241943359375, "Pretrain/Loss (Raw)": 2.2406680583953857, "Pretrain/Step": 415, "Pretrain/Step Time": 8.052763333544135} +{"Pretrain/Learning Rate": 4.997564161089204e-05, "Pretrain/Loss": 2.2006521224975586, "Pretrain/Loss (Raw)": 2.160487413406372, "Pretrain/Step": 416, "Pretrain/Step Time": 8.05272801592946} +{"Pretrain/Learning Rate": 4.9975265487163424e-05, "Pretrain/Loss": 2.200664520263672, "Pretrain/Loss (Raw)": 2.239197254180908, "Pretrain/Step": 417, "Pretrain/Step Time": 8.05370082706213} +{"Pretrain/Learning Rate": 4.997488648316951e-05, "Pretrain/Loss": 2.1995019912719727, "Pretrain/Loss (Raw)": 2.1825735569000244, "Pretrain/Step": 418, "Pretrain/Step Time": 8.052868025377393} +{"Pretrain/Learning Rate": 4.997450459895399e-05, "Pretrain/Loss": 2.198330879211426, "Pretrain/Loss (Raw)": 2.1486308574676514, "Pretrain/Step": 419, "Pretrain/Step Time": 8.050003625452518} +{"Pretrain/Learning Rate": 4.997411983456092e-05, "Pretrain/Loss": 2.1980466842651367, "Pretrain/Loss (Raw)": 2.2144105434417725, "Pretrain/Step": 420, "Pretrain/Step Time": 8.060606410726905} +{"Pretrain/Learning Rate": 4.9973732190034674e-05, "Pretrain/Loss": 2.19828462600708, "Pretrain/Loss (Raw)": 2.1608006954193115, "Pretrain/Step": 421, "Pretrain/Step Time": 8.060072047635913} +{"Pretrain/Learning Rate": 4.9973341665419946e-05, "Pretrain/Loss": 2.1984786987304688, "Pretrain/Loss (Raw)": 2.108448028564453, "Pretrain/Step": 422, "Pretrain/Step Time": 8.06127797998488} +{"Pretrain/Learning Rate": 4.997294826076178e-05, "Pretrain/Loss": 2.200657367706299, "Pretrain/Loss (Raw)": 2.3613171577453613, "Pretrain/Step": 423, "Pretrain/Step Time": 8.064401620998979} +{"Pretrain/Learning Rate": 4.9972551976105545e-05, "Pretrain/Loss": 2.199540138244629, "Pretrain/Loss (Raw)": 2.0758726596832275, "Pretrain/Step": 424, "Pretrain/Step Time": 8.060153419151902} +{"Pretrain/Learning Rate": 4.9972152811496945e-05, "Pretrain/Loss": 2.199586868286133, "Pretrain/Loss (Raw)": 2.2289605140686035, "Pretrain/Step": 425, "Pretrain/Step Time": 8.071748742833734} +{"Pretrain/Learning Rate": 4.9971750766982e-05, "Pretrain/Loss": 2.1994519233703613, "Pretrain/Loss (Raw)": 2.165682554244995, "Pretrain/Step": 426, "Pretrain/Step Time": 8.065558295696974} +{"Pretrain/Learning Rate": 4.9971345842607095e-05, "Pretrain/Loss": 2.1993155479431152, "Pretrain/Loss (Raw)": 2.129539966583252, "Pretrain/Step": 427, "Pretrain/Step Time": 8.06505292467773} +{"Pretrain/Learning Rate": 4.997093803841891e-05, "Pretrain/Loss": 2.198472023010254, "Pretrain/Loss (Raw)": 2.035402774810791, "Pretrain/Step": 428, "Pretrain/Step Time": 8.057957824319601} +{"Pretrain/Learning Rate": 4.997052735446449e-05, "Pretrain/Loss": 2.1988677978515625, "Pretrain/Loss (Raw)": 2.290883779525757, "Pretrain/Step": 429, "Pretrain/Step Time": 8.068207060918212} +{"Pretrain/Learning Rate": 4.997011379079119e-05, "Pretrain/Loss": 2.1988492012023926, "Pretrain/Loss (Raw)": 2.1037559509277344, "Pretrain/Step": 430, "Pretrain/Step Time": 8.063309364020824} +{"Pretrain/Learning Rate": 4.996969734744671e-05, "Pretrain/Loss": 2.197219133377075, "Pretrain/Loss (Raw)": 2.0610172748565674, "Pretrain/Step": 431, "Pretrain/Step Time": 8.058369372040033} +{"Pretrain/Learning Rate": 4.996927802447906e-05, "Pretrain/Loss": 2.1960930824279785, "Pretrain/Loss (Raw)": 2.2358508110046387, "Pretrain/Step": 432, "Pretrain/Step Time": 8.056342812255025} +{"Pretrain/Learning Rate": 4.9968855821936613e-05, "Pretrain/Loss": 2.196909189224243, "Pretrain/Loss (Raw)": 2.2297897338867188, "Pretrain/Step": 433, "Pretrain/Step Time": 8.056045485660434} +{"Pretrain/Learning Rate": 4.9968430739868056e-05, "Pretrain/Loss": 2.1960055828094482, "Pretrain/Loss (Raw)": 2.0661206245422363, "Pretrain/Step": 434, "Pretrain/Step Time": 8.063656253740191} +{"Pretrain/Learning Rate": 4.9968002778322406e-05, "Pretrain/Loss": 2.1960859298706055, "Pretrain/Loss (Raw)": 2.0891854763031006, "Pretrain/Step": 435, "Pretrain/Step Time": 8.056731963530183} +{"Pretrain/Learning Rate": 4.9967571937349034e-05, "Pretrain/Loss": 2.195619583129883, "Pretrain/Loss (Raw)": 2.1372456550598145, "Pretrain/Step": 436, "Pretrain/Step Time": 8.055352926254272} +{"Pretrain/Learning Rate": 4.996713821699761e-05, "Pretrain/Loss": 2.195378303527832, "Pretrain/Loss (Raw)": 2.221881628036499, "Pretrain/Step": 437, "Pretrain/Step Time": 8.057575788348913} +{"Pretrain/Learning Rate": 4.9966701617318154e-05, "Pretrain/Loss": 2.1954751014709473, "Pretrain/Loss (Raw)": 2.1878445148468018, "Pretrain/Step": 438, "Pretrain/Step Time": 8.050806377083063} +{"Pretrain/Learning Rate": 4.996626213836103e-05, "Pretrain/Loss": 2.1960394382476807, "Pretrain/Loss (Raw)": 2.1586735248565674, "Pretrain/Step": 439, "Pretrain/Step Time": 8.057886891067028} +{"Pretrain/Learning Rate": 4.99658197801769e-05, "Pretrain/Loss": 2.1973750591278076, "Pretrain/Loss (Raw)": 2.2516682147979736, "Pretrain/Step": 440, "Pretrain/Step Time": 8.061797445639968} +{"Pretrain/Learning Rate": 4.99653745428168e-05, "Pretrain/Loss": 2.1994211673736572, "Pretrain/Loss (Raw)": 2.4984419345855713, "Pretrain/Step": 441, "Pretrain/Step Time": 8.071360290050507} +{"Pretrain/Learning Rate": 4.9964926426332056e-05, "Pretrain/Loss": 2.19864559173584, "Pretrain/Loss (Raw)": 2.1163907051086426, "Pretrain/Step": 442, "Pretrain/Step Time": 8.065562972798944} +{"Pretrain/Learning Rate": 4.9964475430774364e-05, "Pretrain/Loss": 2.196643352508545, "Pretrain/Loss (Raw)": 2.166513204574585, "Pretrain/Step": 443, "Pretrain/Step Time": 8.07373488880694} +{"Pretrain/Learning Rate": 4.996402155619573e-05, "Pretrain/Loss": 2.1952245235443115, "Pretrain/Loss (Raw)": 2.049931526184082, "Pretrain/Step": 444, "Pretrain/Step Time": 8.072592221200466} +{"Pretrain/Learning Rate": 4.9963564802648494e-05, "Pretrain/Loss": 2.195435047149658, "Pretrain/Loss (Raw)": 2.2043204307556152, "Pretrain/Step": 445, "Pretrain/Step Time": 8.068250875920057} +{"Pretrain/Learning Rate": 4.9963105170185334e-05, "Pretrain/Loss": 2.1954989433288574, "Pretrain/Loss (Raw)": 2.255632162094116, "Pretrain/Step": 446, "Pretrain/Step Time": 8.073670621961355} +{"Pretrain/Learning Rate": 4.9962642658859255e-05, "Pretrain/Loss": 2.1963276863098145, "Pretrain/Loss (Raw)": 2.2183849811553955, "Pretrain/Step": 447, "Pretrain/Step Time": 8.066049626097083} +{"Pretrain/Learning Rate": 4.99621772687236e-05, "Pretrain/Loss": 2.198397636413574, "Pretrain/Loss (Raw)": 2.447869062423706, "Pretrain/Step": 448, "Pretrain/Step Time": 8.07173177972436} +{"Pretrain/Learning Rate": 4.996170899983203e-05, "Pretrain/Loss": 2.1989316940307617, "Pretrain/Loss (Raw)": 2.2406928539276123, "Pretrain/Step": 449, "Pretrain/Step Time": 8.069910196587443} +{"Pretrain/Learning Rate": 4.9961237852238554e-05, "Pretrain/Loss": 2.199220657348633, "Pretrain/Loss (Raw)": 2.1936049461364746, "Pretrain/Step": 450, "Pretrain/Step Time": 8.069831784814596} +{"Pretrain/Learning Rate": 4.996076382599752e-05, "Pretrain/Loss": 2.1980478763580322, "Pretrain/Loss (Raw)": 2.05472469329834, "Pretrain/Step": 451, "Pretrain/Step Time": 8.067646160721779} +{"Pretrain/Learning Rate": 4.996028692116357e-05, "Pretrain/Loss": 2.197746515274048, "Pretrain/Loss (Raw)": 2.1383726596832275, "Pretrain/Step": 452, "Pretrain/Step Time": 8.060144387185574} +{"Pretrain/Learning Rate": 4.995980713779172e-05, "Pretrain/Loss": 2.1985692977905273, "Pretrain/Loss (Raw)": 2.233417510986328, "Pretrain/Step": 453, "Pretrain/Step Time": 8.069192856550217} +{"Pretrain/Learning Rate": 4.9959324475937297e-05, "Pretrain/Loss": 2.196666717529297, "Pretrain/Loss (Raw)": 1.9636858701705933, "Pretrain/Step": 454, "Pretrain/Step Time": 8.063187731429935} +{"Pretrain/Learning Rate": 4.995883893565596e-05, "Pretrain/Loss": 2.1965882778167725, "Pretrain/Loss (Raw)": 2.095813274383545, "Pretrain/Step": 455, "Pretrain/Step Time": 8.060787426307797} +{"Pretrain/Learning Rate": 4.995835051700371e-05, "Pretrain/Loss": 2.1962664127349854, "Pretrain/Loss (Raw)": 2.152158498764038, "Pretrain/Step": 456, "Pretrain/Step Time": 8.06275336816907} +{"Pretrain/Learning Rate": 4.995785922003687e-05, "Pretrain/Loss": 2.196129322052002, "Pretrain/Loss (Raw)": 2.1409852504730225, "Pretrain/Step": 457, "Pretrain/Step Time": 8.057483781129122} +{"Pretrain/Learning Rate": 4.9957365044812097e-05, "Pretrain/Loss": 2.1971960067749023, "Pretrain/Loss (Raw)": 2.1625852584838867, "Pretrain/Step": 458, "Pretrain/Step Time": 8.066571360453963} +{"Pretrain/Learning Rate": 4.995686799138639e-05, "Pretrain/Loss": 2.1992568969726562, "Pretrain/Loss (Raw)": 2.331552505493164, "Pretrain/Step": 459, "Pretrain/Step Time": 8.065759977325797} +{"Pretrain/Learning Rate": 4.995636805981706e-05, "Pretrain/Loss": 2.1997315883636475, "Pretrain/Loss (Raw)": 2.2044363021850586, "Pretrain/Step": 460, "Pretrain/Step Time": 8.069208275526762} +{"Pretrain/Learning Rate": 4.9955865250161774e-05, "Pretrain/Loss": 2.2001280784606934, "Pretrain/Loss (Raw)": 2.192183017730713, "Pretrain/Step": 461, "Pretrain/Step Time": 8.061498617753386} +{"Pretrain/Learning Rate": 4.9955359562478504e-05, "Pretrain/Loss": 2.200136661529541, "Pretrain/Loss (Raw)": 2.154501438140869, "Pretrain/Step": 462, "Pretrain/Step Time": 8.069398356601596} +{"Pretrain/Learning Rate": 4.995485099682558e-05, "Pretrain/Loss": 2.2001962661743164, "Pretrain/Loss (Raw)": 2.149350881576538, "Pretrain/Step": 463, "Pretrain/Step Time": 8.078544886782765} +{"Pretrain/Learning Rate": 4.995433955326165e-05, "Pretrain/Loss": 2.203188896179199, "Pretrain/Loss (Raw)": 2.4255831241607666, "Pretrain/Step": 464, "Pretrain/Step Time": 8.066691460087895} +{"Pretrain/Learning Rate": 4.995382523184569e-05, "Pretrain/Loss": 2.2023348808288574, "Pretrain/Loss (Raw)": 2.0981698036193848, "Pretrain/Step": 465, "Pretrain/Step Time": 8.078463731333613} +{"Pretrain/Learning Rate": 4.9953308032637016e-05, "Pretrain/Loss": 2.2001290321350098, "Pretrain/Loss (Raw)": 1.9989060163497925, "Pretrain/Step": 466, "Pretrain/Step Time": 8.071351312100887} +{"Pretrain/Learning Rate": 4.995278795569528e-05, "Pretrain/Loss": 2.200211763381958, "Pretrain/Loss (Raw)": 2.1578354835510254, "Pretrain/Step": 467, "Pretrain/Step Time": 8.077995955944061} +{"Pretrain/Learning Rate": 4.995226500108046e-05, "Pretrain/Loss": 2.1993818283081055, "Pretrain/Loss (Raw)": 2.153348445892334, "Pretrain/Step": 468, "Pretrain/Step Time": 8.075411038473248} +{"Pretrain/Learning Rate": 4.995173916885285e-05, "Pretrain/Loss": 2.198611259460449, "Pretrain/Loss (Raw)": 2.145364999771118, "Pretrain/Step": 469, "Pretrain/Step Time": 8.07791893556714} +{"Pretrain/Learning Rate": 4.9951210459073105e-05, "Pretrain/Loss": 2.1982951164245605, "Pretrain/Loss (Raw)": 2.0637218952178955, "Pretrain/Step": 470, "Pretrain/Step Time": 8.080645712092519} +{"Pretrain/Learning Rate": 4.99506788718022e-05, "Pretrain/Loss": 2.198115348815918, "Pretrain/Loss (Raw)": 2.1353342533111572, "Pretrain/Step": 471, "Pretrain/Step Time": 8.083542162552476} +{"Pretrain/Learning Rate": 4.995014440710144e-05, "Pretrain/Loss": 2.19734787940979, "Pretrain/Loss (Raw)": 2.1766622066497803, "Pretrain/Step": 472, "Pretrain/Step Time": 8.079264713451266} +{"Pretrain/Learning Rate": 4.9949607065032445e-05, "Pretrain/Loss": 2.197478771209717, "Pretrain/Loss (Raw)": 2.130915403366089, "Pretrain/Step": 473, "Pretrain/Step Time": 8.072323946282268} +{"Pretrain/Learning Rate": 4.99490668456572e-05, "Pretrain/Loss": 2.1965889930725098, "Pretrain/Loss (Raw)": 2.17258620262146, "Pretrain/Step": 474, "Pretrain/Step Time": 8.074503626674414} +{"Pretrain/Learning Rate": 4.994852374903801e-05, "Pretrain/Loss": 2.1961522102355957, "Pretrain/Loss (Raw)": 2.2782528400421143, "Pretrain/Step": 475, "Pretrain/Step Time": 8.075883854180574} +{"Pretrain/Learning Rate": 4.99479777752375e-05, "Pretrain/Loss": 2.195675849914551, "Pretrain/Loss (Raw)": 2.208444833755493, "Pretrain/Step": 476, "Pretrain/Step Time": 8.078973393887281} +{"Pretrain/Learning Rate": 4.994742892431863e-05, "Pretrain/Loss": 2.193317174911499, "Pretrain/Loss (Raw)": 2.1461708545684814, "Pretrain/Step": 477, "Pretrain/Step Time": 8.0818413477391} +{"Pretrain/Learning Rate": 4.99468771963447e-05, "Pretrain/Loss": 2.192837715148926, "Pretrain/Loss (Raw)": 2.195122003555298, "Pretrain/Step": 478, "Pretrain/Step Time": 8.079889174550772} +{"Pretrain/Learning Rate": 4.994632259137935e-05, "Pretrain/Loss": 2.1949026584625244, "Pretrain/Loss (Raw)": 2.4353830814361572, "Pretrain/Step": 479, "Pretrain/Step Time": 8.0875474344939} +{"Pretrain/Learning Rate": 4.9945765109486506e-05, "Pretrain/Loss": 2.1940531730651855, "Pretrain/Loss (Raw)": 2.0987484455108643, "Pretrain/Step": 480, "Pretrain/Step Time": 8.082680948078632} +{"Pretrain/Learning Rate": 4.99452047507305e-05, "Pretrain/Loss": 2.194573163986206, "Pretrain/Loss (Raw)": 2.147035837173462, "Pretrain/Step": 481, "Pretrain/Step Time": 8.09141312353313} +{"Pretrain/Learning Rate": 4.994464151517593e-05, "Pretrain/Loss": 2.1943368911743164, "Pretrain/Loss (Raw)": 2.2186665534973145, "Pretrain/Step": 482, "Pretrain/Step Time": 8.093504942953587} +{"Pretrain/Learning Rate": 4.994407540288775e-05, "Pretrain/Loss": 2.1945316791534424, "Pretrain/Loss (Raw)": 2.111589193344116, "Pretrain/Step": 483, "Pretrain/Step Time": 8.092761168256402} +{"Pretrain/Learning Rate": 4.994350641393126e-05, "Pretrain/Loss": 2.1932973861694336, "Pretrain/Loss (Raw)": 2.15464186668396, "Pretrain/Step": 484, "Pretrain/Step Time": 8.087594132870436} +{"Pretrain/Learning Rate": 4.9942934548372077e-05, "Pretrain/Loss": 2.1924989223480225, "Pretrain/Loss (Raw)": 2.185063362121582, "Pretrain/Step": 485, "Pretrain/Step Time": 8.085650747641921} +{"Pretrain/Learning Rate": 4.994235980627614e-05, "Pretrain/Loss": 2.1928887367248535, "Pretrain/Loss (Raw)": 2.3035025596618652, "Pretrain/Step": 486, "Pretrain/Step Time": 8.090913331136107} +{"Pretrain/Learning Rate": 4.9941782187709746e-05, "Pretrain/Loss": 2.1939198970794678, "Pretrain/Loss (Raw)": 2.272449493408203, "Pretrain/Step": 487, "Pretrain/Step Time": 8.085046773776412} +{"Pretrain/Learning Rate": 4.994120169273949e-05, "Pretrain/Loss": 2.1949753761291504, "Pretrain/Loss (Raw)": 2.342238426208496, "Pretrain/Step": 488, "Pretrain/Step Time": 8.08761983923614} +{"Pretrain/Learning Rate": 4.9940618321432344e-05, "Pretrain/Loss": 2.1952009201049805, "Pretrain/Loss (Raw)": 2.338102340698242, "Pretrain/Step": 489, "Pretrain/Step Time": 8.080235987901688} +{"Pretrain/Learning Rate": 4.994003207385556e-05, "Pretrain/Loss": 2.195314884185791, "Pretrain/Loss (Raw)": 2.154452085494995, "Pretrain/Step": 490, "Pretrain/Step Time": 8.083678677678108} +{"Pretrain/Learning Rate": 4.9939442950076755e-05, "Pretrain/Loss": 2.194845676422119, "Pretrain/Loss (Raw)": 2.1272737979888916, "Pretrain/Step": 491, "Pretrain/Step Time": 8.076857326552272} +{"Pretrain/Learning Rate": 4.9938850950163864e-05, "Pretrain/Loss": 2.1920385360717773, "Pretrain/Loss (Raw)": 2.101949453353882, "Pretrain/Step": 492, "Pretrain/Step Time": 8.070802103728056} +{"Pretrain/Learning Rate": 4.9938256074185174e-05, "Pretrain/Loss": 2.190469264984131, "Pretrain/Loss (Raw)": 2.078603506088257, "Pretrain/Step": 493, "Pretrain/Step Time": 8.080397799611092} +{"Pretrain/Learning Rate": 4.993765832220928e-05, "Pretrain/Loss": 2.1915597915649414, "Pretrain/Loss (Raw)": 2.263364791870117, "Pretrain/Step": 494, "Pretrain/Step Time": 8.073355834931135} +{"Pretrain/Learning Rate": 4.993705769430511e-05, "Pretrain/Loss": 2.1926722526550293, "Pretrain/Loss (Raw)": 2.3376026153564453, "Pretrain/Step": 495, "Pretrain/Step Time": 8.074403146281838} +{"Pretrain/Learning Rate": 4.9936454190541945e-05, "Pretrain/Loss": 2.191051483154297, "Pretrain/Loss (Raw)": 1.9913874864578247, "Pretrain/Step": 496, "Pretrain/Step Time": 8.075108993798494} +{"Pretrain/Learning Rate": 4.993584781098939e-05, "Pretrain/Loss": 2.192216396331787, "Pretrain/Loss (Raw)": 2.262655258178711, "Pretrain/Step": 497, "Pretrain/Step Time": 8.075637893751264} +{"Pretrain/Learning Rate": 4.993523855571735e-05, "Pretrain/Loss": 2.1931028366088867, "Pretrain/Loss (Raw)": 2.24340558052063, "Pretrain/Step": 498, "Pretrain/Step Time": 8.078797716647387} +{"Pretrain/Learning Rate": 4.99346264247961e-05, "Pretrain/Loss": 2.195765972137451, "Pretrain/Loss (Raw)": 2.314375400543213, "Pretrain/Step": 499, "Pretrain/Step Time": 8.081407111138105} +{"Pretrain/Learning Rate": 4.993401141829625e-05, "Pretrain/Loss": 2.1953277587890625, "Pretrain/Loss (Raw)": 2.142777442932129, "Pretrain/Step": 500, "Pretrain/Step Time": 8.07463769800961} +{"Pretrain/Learning Rate": 4.99333935362887e-05, "Pretrain/Loss": 2.1954424381256104, "Pretrain/Loss (Raw)": 2.246447801589966, "Pretrain/Step": 501, "Pretrain/Step Time": 8.072352856397629} +{"Pretrain/Learning Rate": 4.993277277884471e-05, "Pretrain/Loss": 2.196904182434082, "Pretrain/Loss (Raw)": 2.254197597503662, "Pretrain/Step": 502, "Pretrain/Step Time": 8.079239783808589} +{"Pretrain/Learning Rate": 4.993214914603588e-05, "Pretrain/Loss": 2.1957480907440186, "Pretrain/Loss (Raw)": 2.1664488315582275, "Pretrain/Step": 503, "Pretrain/Step Time": 8.073407409712672} +{"Pretrain/Learning Rate": 4.993152263793414e-05, "Pretrain/Loss": 2.1955790519714355, "Pretrain/Loss (Raw)": 2.205467462539673, "Pretrain/Step": 504, "Pretrain/Step Time": 8.079254472628236} +{"Pretrain/Learning Rate": 4.993089325461171e-05, "Pretrain/Loss": 2.194660186767578, "Pretrain/Loss (Raw)": 2.114043712615967, "Pretrain/Step": 505, "Pretrain/Step Time": 8.07788553647697} +{"Pretrain/Learning Rate": 4.99302609961412e-05, "Pretrain/Loss": 2.1947264671325684, "Pretrain/Loss (Raw)": 2.1677920818328857, "Pretrain/Step": 506, "Pretrain/Step Time": 8.07044698484242} +{"Pretrain/Learning Rate": 4.9929625862595516e-05, "Pretrain/Loss": 2.193361282348633, "Pretrain/Loss (Raw)": 2.0690455436706543, "Pretrain/Step": 507, "Pretrain/Step Time": 8.071529442444444} +{"Pretrain/Learning Rate": 4.9928987854047905e-05, "Pretrain/Loss": 2.1954002380371094, "Pretrain/Loss (Raw)": 2.368009567260742, "Pretrain/Step": 508, "Pretrain/Step Time": 8.061878029257059} +{"Pretrain/Learning Rate": 4.992834697057195e-05, "Pretrain/Loss": 2.1948721408843994, "Pretrain/Loss (Raw)": 2.164228677749634, "Pretrain/Step": 509, "Pretrain/Step Time": 8.066523190587759} +{"Pretrain/Learning Rate": 4.992770321224155e-05, "Pretrain/Loss": 2.196357250213623, "Pretrain/Loss (Raw)": 2.374079465866089, "Pretrain/Step": 510, "Pretrain/Step Time": 8.065674977377057} +{"Pretrain/Learning Rate": 4.992705657913095e-05, "Pretrain/Loss": 2.195512056350708, "Pretrain/Loss (Raw)": 2.0805866718292236, "Pretrain/Step": 511, "Pretrain/Step Time": 8.055133655667305} +{"Pretrain/Learning Rate": 4.9926407071314736e-05, "Pretrain/Loss": 2.194481611251831, "Pretrain/Loss (Raw)": 2.215895891189575, "Pretrain/Step": 512, "Pretrain/Step Time": 8.062401516363025} +{"Pretrain/Learning Rate": 4.9925754688867796e-05, "Pretrain/Loss": 2.1923627853393555, "Pretrain/Loss (Raw)": 2.041189193725586, "Pretrain/Step": 513, "Pretrain/Step Time": 8.055243831127882} +{"Pretrain/Learning Rate": 4.992509943186537e-05, "Pretrain/Loss": 2.1907601356506348, "Pretrain/Loss (Raw)": 2.086886405944824, "Pretrain/Step": 514, "Pretrain/Step Time": 8.057624664157629} +{"Pretrain/Learning Rate": 4.992444130038302e-05, "Pretrain/Loss": 2.1899001598358154, "Pretrain/Loss (Raw)": 2.052393913269043, "Pretrain/Step": 515, "Pretrain/Step Time": 8.0582956969738} +{"Pretrain/Learning Rate": 4.992378029449666e-05, "Pretrain/Loss": 2.190101146697998, "Pretrain/Loss (Raw)": 2.2544467449188232, "Pretrain/Step": 516, "Pretrain/Step Time": 8.05405399389565} +{"Pretrain/Learning Rate": 4.9923116414282514e-05, "Pretrain/Loss": 2.1871280670166016, "Pretrain/Loss (Raw)": 1.9376060962677002, "Pretrain/Step": 517, "Pretrain/Step Time": 8.060561161488295} +{"Pretrain/Learning Rate": 4.992244965981714e-05, "Pretrain/Loss": 2.1883277893066406, "Pretrain/Loss (Raw)": 2.3752381801605225, "Pretrain/Step": 518, "Pretrain/Step Time": 8.065918397158384} +{"Pretrain/Learning Rate": 4.9921780031177425e-05, "Pretrain/Loss": 2.1883397102355957, "Pretrain/Loss (Raw)": 2.1886181831359863, "Pretrain/Step": 519, "Pretrain/Step Time": 8.064090823754668} +{"Pretrain/Learning Rate": 4.992110752844061e-05, "Pretrain/Loss": 2.189755439758301, "Pretrain/Loss (Raw)": 2.190598964691162, "Pretrain/Step": 520, "Pretrain/Step Time": 8.058348949998617} +{"Pretrain/Learning Rate": 4.992043215168424e-05, "Pretrain/Loss": 2.1898252964019775, "Pretrain/Loss (Raw)": 2.2341253757476807, "Pretrain/Step": 521, "Pretrain/Step Time": 8.063181387260556} +{"Pretrain/Learning Rate": 4.99197539009862e-05, "Pretrain/Loss": 2.18859601020813, "Pretrain/Loss (Raw)": 2.1184194087982178, "Pretrain/Step": 522, "Pretrain/Step Time": 8.054439390078187} +{"Pretrain/Learning Rate": 4.9919072776424726e-05, "Pretrain/Loss": 2.186582326889038, "Pretrain/Loss (Raw)": 2.190922498703003, "Pretrain/Step": 523, "Pretrain/Step Time": 8.065062088891864} +{"Pretrain/Learning Rate": 4.9918388778078347e-05, "Pretrain/Loss": 2.187014102935791, "Pretrain/Loss (Raw)": 2.305076837539673, "Pretrain/Step": 524, "Pretrain/Step Time": 8.06455908715725} +{"Pretrain/Learning Rate": 4.991770190602596e-05, "Pretrain/Loss": 2.186307907104492, "Pretrain/Loss (Raw)": 2.0655386447906494, "Pretrain/Step": 525, "Pretrain/Step Time": 8.067175665870309} +{"Pretrain/Learning Rate": 4.991701216034677e-05, "Pretrain/Loss": 2.185346841812134, "Pretrain/Loss (Raw)": 2.152757406234741, "Pretrain/Step": 526, "Pretrain/Step Time": 8.071295181289315} +{"Pretrain/Learning Rate": 4.9916319541120324e-05, "Pretrain/Loss": 2.184445858001709, "Pretrain/Loss (Raw)": 2.1891589164733887, "Pretrain/Step": 527, "Pretrain/Step Time": 8.062651570886374} +{"Pretrain/Learning Rate": 4.99156240484265e-05, "Pretrain/Loss": 2.183328151702881, "Pretrain/Loss (Raw)": 2.078721284866333, "Pretrain/Step": 528, "Pretrain/Step Time": 8.066786846145988} +{"Pretrain/Learning Rate": 4.9914925682345504e-05, "Pretrain/Loss": 2.179297924041748, "Pretrain/Loss (Raw)": 2.107229471206665, "Pretrain/Step": 529, "Pretrain/Step Time": 8.060474319383502} +{"Pretrain/Learning Rate": 4.991422444295788e-05, "Pretrain/Loss": 2.1807701587677, "Pretrain/Loss (Raw)": 2.447482109069824, "Pretrain/Step": 530, "Pretrain/Step Time": 8.056635279208422} +{"Pretrain/Learning Rate": 4.9913520330344486e-05, "Pretrain/Loss": 2.183448314666748, "Pretrain/Loss (Raw)": 2.4014692306518555, "Pretrain/Step": 531, "Pretrain/Step Time": 8.064208324998617} +{"Pretrain/Learning Rate": 4.991281334458654e-05, "Pretrain/Loss": 2.183256149291992, "Pretrain/Loss (Raw)": 2.1784234046936035, "Pretrain/Step": 532, "Pretrain/Step Time": 8.06072368659079} +{"Pretrain/Learning Rate": 4.991210348576556e-05, "Pretrain/Loss": 2.181814670562744, "Pretrain/Loss (Raw)": 2.148135185241699, "Pretrain/Step": 533, "Pretrain/Step Time": 8.065729681402445} +{"Pretrain/Learning Rate": 4.991139075396342e-05, "Pretrain/Loss": 2.181674003601074, "Pretrain/Loss (Raw)": 2.172908306121826, "Pretrain/Step": 534, "Pretrain/Step Time": 8.064306519925594} +{"Pretrain/Learning Rate": 4.991067514926231e-05, "Pretrain/Loss": 2.1821165084838867, "Pretrain/Loss (Raw)": 2.122748374938965, "Pretrain/Step": 535, "Pretrain/Step Time": 8.064444804564118} +{"Pretrain/Learning Rate": 4.990995667174476e-05, "Pretrain/Loss": 2.180873394012451, "Pretrain/Loss (Raw)": 2.1543991565704346, "Pretrain/Step": 536, "Pretrain/Step Time": 8.074201749637723} +{"Pretrain/Learning Rate": 4.990923532149362e-05, "Pretrain/Loss": 2.1810460090637207, "Pretrain/Loss (Raw)": 2.155646800994873, "Pretrain/Step": 537, "Pretrain/Step Time": 8.07346374541521} +{"Pretrain/Learning Rate": 4.990851109859209e-05, "Pretrain/Loss": 2.1801137924194336, "Pretrain/Loss (Raw)": 2.107790470123291, "Pretrain/Step": 538, "Pretrain/Step Time": 8.070365538820624} +{"Pretrain/Learning Rate": 4.9907784003123695e-05, "Pretrain/Loss": 2.1818203926086426, "Pretrain/Loss (Raw)": 2.276149034500122, "Pretrain/Step": 539, "Pretrain/Step Time": 8.067496977746487} +{"Pretrain/Learning Rate": 4.9907054035172273e-05, "Pretrain/Loss": 2.1817898750305176, "Pretrain/Loss (Raw)": 2.1825170516967773, "Pretrain/Step": 540, "Pretrain/Step Time": 8.068934917449951} +{"Pretrain/Learning Rate": 4.9906321194822014e-05, "Pretrain/Loss": 2.184134006500244, "Pretrain/Loss (Raw)": 2.28513503074646, "Pretrain/Step": 541, "Pretrain/Step Time": 8.073799535632133} +{"Pretrain/Learning Rate": 4.9905585482157436e-05, "Pretrain/Loss": 2.1853723526000977, "Pretrain/Loss (Raw)": 2.136547565460205, "Pretrain/Step": 542, "Pretrain/Step Time": 8.078221585601568} +{"Pretrain/Learning Rate": 4.990484689726338e-05, "Pretrain/Loss": 2.183725357055664, "Pretrain/Loss (Raw)": 2.029874324798584, "Pretrain/Step": 543, "Pretrain/Step Time": 8.076811091974378} +{"Pretrain/Learning Rate": 4.990410544022502e-05, "Pretrain/Loss": 2.1835153102874756, "Pretrain/Loss (Raw)": 2.1335678100585938, "Pretrain/Step": 544, "Pretrain/Step Time": 8.075057979673147} +{"Pretrain/Learning Rate": 4.9903361111127864e-05, "Pretrain/Loss": 2.1833951473236084, "Pretrain/Loss (Raw)": 2.2238364219665527, "Pretrain/Step": 545, "Pretrain/Step Time": 8.071253491565585} +{"Pretrain/Learning Rate": 4.990261391005777e-05, "Pretrain/Loss": 2.183115005493164, "Pretrain/Loss (Raw)": 2.1466786861419678, "Pretrain/Step": 546, "Pretrain/Step Time": 8.070346422493458} +{"Pretrain/Learning Rate": 4.9901863837100886e-05, "Pretrain/Loss": 2.1834702491760254, "Pretrain/Loss (Raw)": 2.1941447257995605, "Pretrain/Step": 547, "Pretrain/Step Time": 8.075747331604362} +{"Pretrain/Learning Rate": 4.9901110892343724e-05, "Pretrain/Loss": 2.182668924331665, "Pretrain/Loss (Raw)": 2.111833333969116, "Pretrain/Step": 548, "Pretrain/Step Time": 8.072244297713041} +{"Pretrain/Learning Rate": 4.9900355075873116e-05, "Pretrain/Loss": 2.1819896697998047, "Pretrain/Loss (Raw)": 2.073852300643921, "Pretrain/Step": 549, "Pretrain/Step Time": 8.069337153807282} +{"Pretrain/Learning Rate": 4.989959638777623e-05, "Pretrain/Loss": 2.1822471618652344, "Pretrain/Loss (Raw)": 2.1413986682891846, "Pretrain/Step": 550, "Pretrain/Step Time": 8.068347359076142} +{"Pretrain/Learning Rate": 4.989883482814056e-05, "Pretrain/Loss": 2.1815505027770996, "Pretrain/Loss (Raw)": 2.2721540927886963, "Pretrain/Step": 551, "Pretrain/Step Time": 8.067758785560727} +{"Pretrain/Learning Rate": 4.989807039705392e-05, "Pretrain/Loss": 2.183821678161621, "Pretrain/Loss (Raw)": 2.3665833473205566, "Pretrain/Step": 552, "Pretrain/Step Time": 8.072942910715938} +{"Pretrain/Learning Rate": 4.989730309460449e-05, "Pretrain/Loss": 2.1847033500671387, "Pretrain/Loss (Raw)": 2.3418004512786865, "Pretrain/Step": 553, "Pretrain/Step Time": 8.065993832424283} +{"Pretrain/Learning Rate": 4.989653292088074e-05, "Pretrain/Loss": 2.1846256256103516, "Pretrain/Loss (Raw)": 2.1557319164276123, "Pretrain/Step": 554, "Pretrain/Step Time": 8.067754922434688} +{"Pretrain/Learning Rate": 4.9895759875971495e-05, "Pretrain/Loss": 2.185408592224121, "Pretrain/Loss (Raw)": 2.229745864868164, "Pretrain/Step": 555, "Pretrain/Step Time": 8.068926254287362} +{"Pretrain/Learning Rate": 4.9894983959965915e-05, "Pretrain/Loss": 2.186112880706787, "Pretrain/Loss (Raw)": 2.1255791187286377, "Pretrain/Step": 556, "Pretrain/Step Time": 8.07198067381978} +{"Pretrain/Learning Rate": 4.989420517295347e-05, "Pretrain/Loss": 2.1853058338165283, "Pretrain/Loss (Raw)": 2.187568426132202, "Pretrain/Step": 557, "Pretrain/Step Time": 8.062135964632034} +{"Pretrain/Learning Rate": 4.9893423515023986e-05, "Pretrain/Loss": 2.1862401962280273, "Pretrain/Loss (Raw)": 2.2233550548553467, "Pretrain/Step": 558, "Pretrain/Step Time": 8.077137744054198} +{"Pretrain/Learning Rate": 4.9892638986267594e-05, "Pretrain/Loss": 2.1865196228027344, "Pretrain/Loss (Raw)": 2.0967864990234375, "Pretrain/Step": 559, "Pretrain/Step Time": 8.073886767029762} +{"Pretrain/Learning Rate": 4.989185158677478e-05, "Pretrain/Loss": 2.1855740547180176, "Pretrain/Loss (Raw)": 2.1148033142089844, "Pretrain/Step": 560, "Pretrain/Step Time": 8.076345428824425} +{"Pretrain/Learning Rate": 4.9891061316636346e-05, "Pretrain/Loss": 2.1855363845825195, "Pretrain/Loss (Raw)": 2.224998950958252, "Pretrain/Step": 561, "Pretrain/Step Time": 8.078784227371216} +{"Pretrain/Learning Rate": 4.9890268175943425e-05, "Pretrain/Loss": 2.1866984367370605, "Pretrain/Loss (Raw)": 2.2148725986480713, "Pretrain/Step": 562, "Pretrain/Step Time": 8.078295212239027} +{"Pretrain/Learning Rate": 4.9889472164787496e-05, "Pretrain/Loss": 2.1875979900360107, "Pretrain/Loss (Raw)": 2.2043063640594482, "Pretrain/Step": 563, "Pretrain/Step Time": 8.076926328241825} +{"Pretrain/Learning Rate": 4.9888673283260355e-05, "Pretrain/Loss": 2.187649965286255, "Pretrain/Loss (Raw)": 2.143893241882324, "Pretrain/Step": 564, "Pretrain/Step Time": 8.076806535944343} +{"Pretrain/Learning Rate": 4.9887871531454134e-05, "Pretrain/Loss": 2.1878280639648438, "Pretrain/Loss (Raw)": 2.2446932792663574, "Pretrain/Step": 565, "Pretrain/Step Time": 8.073543563485146} +{"Pretrain/Learning Rate": 4.988706690946129e-05, "Pretrain/Loss": 2.1898248195648193, "Pretrain/Loss (Raw)": 2.4434266090393066, "Pretrain/Step": 566, "Pretrain/Step Time": 8.072905231267214} +{"Pretrain/Learning Rate": 4.9886259417374616e-05, "Pretrain/Loss": 2.1898388862609863, "Pretrain/Loss (Raw)": 2.160485029220581, "Pretrain/Step": 567, "Pretrain/Step Time": 8.070720108225942} +{"Pretrain/Learning Rate": 4.988544905528724e-05, "Pretrain/Loss": 2.190321922302246, "Pretrain/Loss (Raw)": 2.313471794128418, "Pretrain/Step": 568, "Pretrain/Step Time": 8.062981314957142} +{"Pretrain/Learning Rate": 4.9884635823292615e-05, "Pretrain/Loss": 2.187842845916748, "Pretrain/Loss (Raw)": 2.181110143661499, "Pretrain/Step": 569, "Pretrain/Step Time": 8.055290644988418} +{"Pretrain/Learning Rate": 4.988381972148452e-05, "Pretrain/Loss": 2.1907548904418945, "Pretrain/Loss (Raw)": 2.4891765117645264, "Pretrain/Step": 570, "Pretrain/Step Time": 8.062371511012316} +{"Pretrain/Learning Rate": 4.9883000749957086e-05, "Pretrain/Loss": 2.191157579421997, "Pretrain/Loss (Raw)": 2.2180233001708984, "Pretrain/Step": 571, "Pretrain/Step Time": 8.059986893087626} +{"Pretrain/Learning Rate": 4.988217890880475e-05, "Pretrain/Loss": 2.1929025650024414, "Pretrain/Loss (Raw)": 2.273319721221924, "Pretrain/Step": 572, "Pretrain/Step Time": 8.060307823121548} +{"Pretrain/Learning Rate": 4.98813541981223e-05, "Pretrain/Loss": 2.1928868293762207, "Pretrain/Loss (Raw)": 2.2022547721862793, "Pretrain/Step": 573, "Pretrain/Step Time": 8.071028839796782} +{"Pretrain/Learning Rate": 4.988052661800483e-05, "Pretrain/Loss": 2.1924185752868652, "Pretrain/Loss (Raw)": 2.1957218647003174, "Pretrain/Step": 574, "Pretrain/Step Time": 8.063451711088419} +{"Pretrain/Learning Rate": 4.98796961685478e-05, "Pretrain/Loss": 2.192089080810547, "Pretrain/Loss (Raw)": 2.176227569580078, "Pretrain/Step": 575, "Pretrain/Step Time": 8.068130515515804} +{"Pretrain/Learning Rate": 4.987886284984695e-05, "Pretrain/Loss": 2.1887454986572266, "Pretrain/Loss (Raw)": 2.0198898315429688, "Pretrain/Step": 576, "Pretrain/Step Time": 8.06890837661922} +{"Pretrain/Learning Rate": 4.987802666199842e-05, "Pretrain/Loss": 2.1880714893341064, "Pretrain/Loss (Raw)": 2.1544034481048584, "Pretrain/Step": 577, "Pretrain/Step Time": 8.073390364646912} +{"Pretrain/Learning Rate": 4.987718760509863e-05, "Pretrain/Loss": 2.186735153198242, "Pretrain/Loss (Raw)": 2.022559404373169, "Pretrain/Step": 578, "Pretrain/Step Time": 8.072054335847497} +{"Pretrain/Learning Rate": 4.987634567924433e-05, "Pretrain/Loss": 2.1875905990600586, "Pretrain/Loss (Raw)": 2.1642282009124756, "Pretrain/Step": 579, "Pretrain/Step Time": 8.072888650000095} +{"Pretrain/Learning Rate": 4.9875500884532634e-05, "Pretrain/Loss": 2.188145637512207, "Pretrain/Loss (Raw)": 2.2094109058380127, "Pretrain/Step": 580, "Pretrain/Step Time": 8.06982772052288} +{"Pretrain/Learning Rate": 4.987465322106095e-05, "Pretrain/Loss": 2.1877832412719727, "Pretrain/Loss (Raw)": 2.18699049949646, "Pretrain/Step": 581, "Pretrain/Step Time": 8.070825146511197} +{"Pretrain/Learning Rate": 4.987380268892705e-05, "Pretrain/Loss": 2.1886134147644043, "Pretrain/Loss (Raw)": 2.0699706077575684, "Pretrain/Step": 582, "Pretrain/Step Time": 8.07280932366848} +{"Pretrain/Learning Rate": 4.987294928822901e-05, "Pretrain/Loss": 2.189168930053711, "Pretrain/Loss (Raw)": 2.1669423580169678, "Pretrain/Step": 583, "Pretrain/Step Time": 8.073702277615666} +{"Pretrain/Learning Rate": 4.9872093019065255e-05, "Pretrain/Loss": 2.190746545791626, "Pretrain/Loss (Raw)": 2.3540852069854736, "Pretrain/Step": 584, "Pretrain/Step Time": 8.074821677058935} +{"Pretrain/Learning Rate": 4.987123388153453e-05, "Pretrain/Loss": 2.1911072731018066, "Pretrain/Loss (Raw)": 2.187117099761963, "Pretrain/Step": 585, "Pretrain/Step Time": 8.076716635376215} +{"Pretrain/Learning Rate": 4.9870371875735916e-05, "Pretrain/Loss": 2.1908276081085205, "Pretrain/Loss (Raw)": 2.1268348693847656, "Pretrain/Step": 586, "Pretrain/Step Time": 8.064950494095683} +{"Pretrain/Learning Rate": 4.986950700176882e-05, "Pretrain/Loss": 2.188422203063965, "Pretrain/Loss (Raw)": 2.0236308574676514, "Pretrain/Step": 587, "Pretrain/Step Time": 8.066256634891033} +{"Pretrain/Learning Rate": 4.9868639259732996e-05, "Pretrain/Loss": 2.1874680519104004, "Pretrain/Loss (Raw)": 2.0823280811309814, "Pretrain/Step": 588, "Pretrain/Step Time": 8.056780053302646} +{"Pretrain/Learning Rate": 4.986776864972851e-05, "Pretrain/Loss": 2.186457633972168, "Pretrain/Loss (Raw)": 2.0628457069396973, "Pretrain/Step": 589, "Pretrain/Step Time": 8.057741580531001} +{"Pretrain/Learning Rate": 4.9866895171855756e-05, "Pretrain/Loss": 2.185839891433716, "Pretrain/Loss (Raw)": 2.0754265785217285, "Pretrain/Step": 590, "Pretrain/Step Time": 8.055345738306642} +{"Pretrain/Learning Rate": 4.9866018826215475e-05, "Pretrain/Loss": 2.187296152114868, "Pretrain/Loss (Raw)": 2.3357551097869873, "Pretrain/Step": 591, "Pretrain/Step Time": 8.053553238511086} +{"Pretrain/Learning Rate": 4.9865139612908736e-05, "Pretrain/Loss": 2.185687780380249, "Pretrain/Loss (Raw)": 2.219705820083618, "Pretrain/Step": 592, "Pretrain/Step Time": 8.054207308217883} +{"Pretrain/Learning Rate": 4.9864257532036924e-05, "Pretrain/Loss": 2.1871907711029053, "Pretrain/Loss (Raw)": 2.2905662059783936, "Pretrain/Step": 593, "Pretrain/Step Time": 8.049402521923184} +{"Pretrain/Learning Rate": 4.9863372583701765e-05, "Pretrain/Loss": 2.188800573348999, "Pretrain/Loss (Raw)": 2.2049386501312256, "Pretrain/Step": 594, "Pretrain/Step Time": 8.053883492946625} +{"Pretrain/Learning Rate": 4.9862484768005324e-05, "Pretrain/Loss": 2.188680410385132, "Pretrain/Loss (Raw)": 2.1424689292907715, "Pretrain/Step": 595, "Pretrain/Step Time": 8.05335945263505} +{"Pretrain/Learning Rate": 4.986159408504999e-05, "Pretrain/Loss": 2.188995838165283, "Pretrain/Loss (Raw)": 2.193730354309082, "Pretrain/Step": 596, "Pretrain/Step Time": 8.055088764056563} +{"Pretrain/Learning Rate": 4.986070053493846e-05, "Pretrain/Loss": 2.189751148223877, "Pretrain/Loss (Raw)": 2.2420482635498047, "Pretrain/Step": 597, "Pretrain/Step Time": 8.047985984012485} +{"Pretrain/Learning Rate": 4.985980411777381e-05, "Pretrain/Loss": 2.190605401992798, "Pretrain/Loss (Raw)": 2.173043727874756, "Pretrain/Step": 598, "Pretrain/Step Time": 8.052114024758339} +{"Pretrain/Learning Rate": 4.9858904833659404e-05, "Pretrain/Loss": 2.190117120742798, "Pretrain/Loss (Raw)": 2.0728423595428467, "Pretrain/Step": 599, "Pretrain/Step Time": 8.052297869697213} +{"Pretrain/Learning Rate": 4.985800268269895e-05, "Pretrain/Loss": 2.1891517639160156, "Pretrain/Loss (Raw)": 2.053101062774658, "Pretrain/Step": 600, "Pretrain/Step Time": 8.049410128965974} +{"Pretrain/Learning Rate": 4.9857097664996486e-05, "Pretrain/Loss": 2.1903655529022217, "Pretrain/Loss (Raw)": 2.286278009414673, "Pretrain/Step": 601, "Pretrain/Step Time": 8.052995013073087} +{"Pretrain/Learning Rate": 4.98561897806564e-05, "Pretrain/Loss": 2.189699172973633, "Pretrain/Loss (Raw)": 2.0873048305511475, "Pretrain/Step": 602, "Pretrain/Step Time": 8.047187762334943} +{"Pretrain/Learning Rate": 4.985527902978337e-05, "Pretrain/Loss": 2.189361095428467, "Pretrain/Loss (Raw)": 2.2349469661712646, "Pretrain/Step": 603, "Pretrain/Step Time": 8.045446041971445} +{"Pretrain/Learning Rate": 4.985436541248245e-05, "Pretrain/Loss": 2.189481735229492, "Pretrain/Loss (Raw)": 2.223889112472534, "Pretrain/Step": 604, "Pretrain/Step Time": 8.044653667137027} +{"Pretrain/Learning Rate": 4.985344892885899e-05, "Pretrain/Loss": 2.18891978263855, "Pretrain/Loss (Raw)": 2.0742437839508057, "Pretrain/Step": 605, "Pretrain/Step Time": 8.039175925776362} +{"Pretrain/Learning Rate": 4.985252957901869e-05, "Pretrain/Loss": 2.1889941692352295, "Pretrain/Loss (Raw)": 2.2046568393707275, "Pretrain/Step": 606, "Pretrain/Step Time": 8.041460450738668} +{"Pretrain/Learning Rate": 4.985160736306756e-05, "Pretrain/Loss": 2.187018871307373, "Pretrain/Loss (Raw)": 2.1825549602508545, "Pretrain/Step": 607, "Pretrain/Step Time": 8.036849308758974} +{"Pretrain/Learning Rate": 4.985068228111198e-05, "Pretrain/Loss": 2.1885061264038086, "Pretrain/Loss (Raw)": 2.28910231590271, "Pretrain/Step": 608, "Pretrain/Step Time": 8.046133918687701} +{"Pretrain/Learning Rate": 4.984975433325861e-05, "Pretrain/Loss": 2.1872668266296387, "Pretrain/Loss (Raw)": 1.9884177446365356, "Pretrain/Step": 609, "Pretrain/Step Time": 8.03931525349617} +{"Pretrain/Learning Rate": 4.9848823519614475e-05, "Pretrain/Loss": 2.1861517429351807, "Pretrain/Loss (Raw)": 2.075932025909424, "Pretrain/Step": 610, "Pretrain/Step Time": 8.034338371828198} +{"Pretrain/Learning Rate": 4.9847889840286924e-05, "Pretrain/Loss": 2.1868948936462402, "Pretrain/Loss (Raw)": 2.2067208290100098, "Pretrain/Step": 611, "Pretrain/Step Time": 8.02855241857469} +{"Pretrain/Learning Rate": 4.984695329538362e-05, "Pretrain/Loss": 2.185563087463379, "Pretrain/Loss (Raw)": 1.9841418266296387, "Pretrain/Step": 612, "Pretrain/Step Time": 8.032895810902119} +{"Pretrain/Learning Rate": 4.984601388501258e-05, "Pretrain/Loss": 2.1856701374053955, "Pretrain/Loss (Raw)": 2.1987860202789307, "Pretrain/Step": 613, "Pretrain/Step Time": 8.042778141796589} +{"Pretrain/Learning Rate": 4.9845071609282145e-05, "Pretrain/Loss": 2.1827785968780518, "Pretrain/Loss (Raw)": 1.9333887100219727, "Pretrain/Step": 614, "Pretrain/Step Time": 8.039278967306018} +{"Pretrain/Learning Rate": 4.984412646830098e-05, "Pretrain/Loss": 2.1817846298217773, "Pretrain/Loss (Raw)": 2.1451919078826904, "Pretrain/Step": 615, "Pretrain/Step Time": 8.038822915405035} +{"Pretrain/Learning Rate": 4.9843178462178084e-05, "Pretrain/Loss": 2.179464340209961, "Pretrain/Loss (Raw)": 2.04524827003479, "Pretrain/Step": 616, "Pretrain/Step Time": 8.040762325748801} +{"Pretrain/Learning Rate": 4.984222759102277e-05, "Pretrain/Loss": 2.1773681640625, "Pretrain/Loss (Raw)": 2.0698063373565674, "Pretrain/Step": 617, "Pretrain/Step Time": 8.05276295915246} +{"Pretrain/Learning Rate": 4.984127385494472e-05, "Pretrain/Loss": 2.1775898933410645, "Pretrain/Loss (Raw)": 2.182847261428833, "Pretrain/Step": 618, "Pretrain/Step Time": 8.057454762980342} +{"Pretrain/Learning Rate": 4.984031725405392e-05, "Pretrain/Loss": 2.1789774894714355, "Pretrain/Loss (Raw)": 2.3048765659332275, "Pretrain/Step": 619, "Pretrain/Step Time": 8.055783972144127} +{"Pretrain/Learning Rate": 4.983935778846067e-05, "Pretrain/Loss": 2.179382562637329, "Pretrain/Loss (Raw)": 2.153784990310669, "Pretrain/Step": 620, "Pretrain/Step Time": 8.059151817113161} +{"Pretrain/Learning Rate": 4.9838395458275636e-05, "Pretrain/Loss": 2.1801414489746094, "Pretrain/Loss (Raw)": 2.175740957260132, "Pretrain/Step": 621, "Pretrain/Step Time": 8.047245644032955} +{"Pretrain/Learning Rate": 4.98374302636098e-05, "Pretrain/Loss": 2.1799659729003906, "Pretrain/Loss (Raw)": 2.2409133911132812, "Pretrain/Step": 622, "Pretrain/Step Time": 8.050001453608274} +{"Pretrain/Learning Rate": 4.983646220457446e-05, "Pretrain/Loss": 2.1779580116271973, "Pretrain/Loss (Raw)": 2.0806002616882324, "Pretrain/Step": 623, "Pretrain/Step Time": 8.05632590688765} +{"Pretrain/Learning Rate": 4.9835491281281274e-05, "Pretrain/Loss": 2.1793365478515625, "Pretrain/Loss (Raw)": 2.167820692062378, "Pretrain/Step": 624, "Pretrain/Step Time": 8.053273590281606} +{"Pretrain/Learning Rate": 4.9834517493842196e-05, "Pretrain/Loss": 2.1779627799987793, "Pretrain/Loss (Raw)": 2.0868215560913086, "Pretrain/Step": 625, "Pretrain/Step Time": 8.053550951182842} +{"Pretrain/Learning Rate": 4.983354084236954e-05, "Pretrain/Loss": 2.177051544189453, "Pretrain/Loss (Raw)": 2.126793146133423, "Pretrain/Step": 626, "Pretrain/Step Time": 8.04677333123982} +{"Pretrain/Learning Rate": 4.983256132697594e-05, "Pretrain/Loss": 2.17529296875, "Pretrain/Loss (Raw)": 2.0892364978790283, "Pretrain/Step": 627, "Pretrain/Step Time": 8.054092092439532} +{"Pretrain/Learning Rate": 4.983157894777435e-05, "Pretrain/Loss": 2.17520809173584, "Pretrain/Loss (Raw)": 2.131943941116333, "Pretrain/Step": 628, "Pretrain/Step Time": 8.05403671786189} +{"Pretrain/Learning Rate": 4.983059370487806e-05, "Pretrain/Loss": 2.1741445064544678, "Pretrain/Loss (Raw)": 2.110300064086914, "Pretrain/Step": 629, "Pretrain/Step Time": 8.05591206997633} +{"Pretrain/Learning Rate": 4.9829605598400705e-05, "Pretrain/Loss": 2.17285418510437, "Pretrain/Loss (Raw)": 2.089033603668213, "Pretrain/Step": 630, "Pretrain/Step Time": 8.047805340960622} +{"Pretrain/Learning Rate": 4.982861462845623e-05, "Pretrain/Loss": 2.1721243858337402, "Pretrain/Loss (Raw)": 2.073012590408325, "Pretrain/Step": 631, "Pretrain/Step Time": 8.054337283596396} +{"Pretrain/Learning Rate": 4.982762079515892e-05, "Pretrain/Loss": 2.1724767684936523, "Pretrain/Loss (Raw)": 2.250575304031372, "Pretrain/Step": 632, "Pretrain/Step Time": 8.05988179706037} +{"Pretrain/Learning Rate": 4.982662409862339e-05, "Pretrain/Loss": 2.1721456050872803, "Pretrain/Loss (Raw)": 2.0716779232025146, "Pretrain/Step": 633, "Pretrain/Step Time": 8.058339977636933} +{"Pretrain/Learning Rate": 4.9825624538964576e-05, "Pretrain/Loss": 2.1726760864257812, "Pretrain/Loss (Raw)": 2.2356956005096436, "Pretrain/Step": 634, "Pretrain/Step Time": 8.063290083780885} +{"Pretrain/Learning Rate": 4.982462211629776e-05, "Pretrain/Loss": 2.1731438636779785, "Pretrain/Loss (Raw)": 2.1288959980010986, "Pretrain/Step": 635, "Pretrain/Step Time": 8.055112231522799} +{"Pretrain/Learning Rate": 4.9823616830738546e-05, "Pretrain/Loss": 2.170475482940674, "Pretrain/Loss (Raw)": 2.026453733444214, "Pretrain/Step": 636, "Pretrain/Step Time": 8.059967655688524} +{"Pretrain/Learning Rate": 4.9822608682402866e-05, "Pretrain/Loss": 2.170660972595215, "Pretrain/Loss (Raw)": 2.1879849433898926, "Pretrain/Step": 637, "Pretrain/Step Time": 8.065466176718473} +{"Pretrain/Learning Rate": 4.9821597671406984e-05, "Pretrain/Loss": 2.168245792388916, "Pretrain/Loss (Raw)": 2.064953565597534, "Pretrain/Step": 638, "Pretrain/Step Time": 8.066601464524865} +{"Pretrain/Learning Rate": 4.982058379786749e-05, "Pretrain/Loss": 2.1695046424865723, "Pretrain/Loss (Raw)": 2.2417099475860596, "Pretrain/Step": 639, "Pretrain/Step Time": 8.067866234108806} +{"Pretrain/Learning Rate": 4.9819567061901327e-05, "Pretrain/Loss": 2.168966770172119, "Pretrain/Loss (Raw)": 2.1470372676849365, "Pretrain/Step": 640, "Pretrain/Step Time": 8.060141509398818} +{"Pretrain/Learning Rate": 4.981854746362573e-05, "Pretrain/Loss": 2.1693832874298096, "Pretrain/Loss (Raw)": 2.0945215225219727, "Pretrain/Step": 641, "Pretrain/Step Time": 8.0621316768229} +{"Pretrain/Learning Rate": 4.981752500315829e-05, "Pretrain/Loss": 2.1700382232666016, "Pretrain/Loss (Raw)": 2.1707139015197754, "Pretrain/Step": 642, "Pretrain/Step Time": 8.064848575741053} +{"Pretrain/Learning Rate": 4.981649968061692e-05, "Pretrain/Loss": 2.1695594787597656, "Pretrain/Loss (Raw)": 1.9911155700683594, "Pretrain/Step": 643, "Pretrain/Step Time": 8.06006195396185} +{"Pretrain/Learning Rate": 4.981547149611987e-05, "Pretrain/Loss": 2.1697568893432617, "Pretrain/Loss (Raw)": 2.2796902656555176, "Pretrain/Step": 644, "Pretrain/Step Time": 8.067659886553884} +{"Pretrain/Learning Rate": 4.9814440449785715e-05, "Pretrain/Loss": 2.1714489459991455, "Pretrain/Loss (Raw)": 2.15421986579895, "Pretrain/Step": 645, "Pretrain/Step Time": 8.060419274494052} +{"Pretrain/Learning Rate": 4.9813406541733355e-05, "Pretrain/Loss": 2.170919895172119, "Pretrain/Loss (Raw)": 2.3075244426727295, "Pretrain/Step": 646, "Pretrain/Step Time": 8.064558565616608} +{"Pretrain/Learning Rate": 4.981236977208203e-05, "Pretrain/Loss": 2.171013832092285, "Pretrain/Loss (Raw)": 2.2006068229675293, "Pretrain/Step": 647, "Pretrain/Step Time": 8.059841744601727} +{"Pretrain/Learning Rate": 4.98113301409513e-05, "Pretrain/Loss": 2.1706862449645996, "Pretrain/Loss (Raw)": 2.1486928462982178, "Pretrain/Step": 648, "Pretrain/Step Time": 8.060815641656518} +{"Pretrain/Learning Rate": 4.981028764846106e-05, "Pretrain/Loss": 2.1696090698242188, "Pretrain/Loss (Raw)": 2.0962343215942383, "Pretrain/Step": 649, "Pretrain/Step Time": 8.06031572073698} +{"Pretrain/Learning Rate": 4.980924229473155e-05, "Pretrain/Loss": 2.1699748039245605, "Pretrain/Loss (Raw)": 2.165239095687866, "Pretrain/Step": 650, "Pretrain/Step Time": 8.066511500626802} +{"Pretrain/Learning Rate": 4.980819407988331e-05, "Pretrain/Loss": 2.169480323791504, "Pretrain/Loss (Raw)": 2.127634048461914, "Pretrain/Step": 651, "Pretrain/Step Time": 8.069953819736838} +{"Pretrain/Learning Rate": 4.980714300403723e-05, "Pretrain/Loss": 2.1684155464172363, "Pretrain/Loss (Raw)": 2.1687958240509033, "Pretrain/Step": 652, "Pretrain/Step Time": 8.066983487457037} +{"Pretrain/Learning Rate": 4.9806089067314515e-05, "Pretrain/Loss": 2.1680665016174316, "Pretrain/Loss (Raw)": 2.0208399295806885, "Pretrain/Step": 653, "Pretrain/Step Time": 8.066629497334361} +{"Pretrain/Learning Rate": 4.980503226983673e-05, "Pretrain/Loss": 2.1683921813964844, "Pretrain/Loss (Raw)": 2.1944713592529297, "Pretrain/Step": 654, "Pretrain/Step Time": 8.063855966553092} +{"Pretrain/Learning Rate": 4.980397261172573e-05, "Pretrain/Loss": 2.1689765453338623, "Pretrain/Loss (Raw)": 2.263944149017334, "Pretrain/Step": 655, "Pretrain/Step Time": 8.073259817436337} +{"Pretrain/Learning Rate": 4.9802910093103725e-05, "Pretrain/Loss": 2.1703600883483887, "Pretrain/Loss (Raw)": 2.2558207511901855, "Pretrain/Step": 656, "Pretrain/Step Time": 8.075067089870572} +{"Pretrain/Learning Rate": 4.980184471409326e-05, "Pretrain/Loss": 2.170743465423584, "Pretrain/Loss (Raw)": 2.1563031673431396, "Pretrain/Step": 657, "Pretrain/Step Time": 8.070077383890748} +{"Pretrain/Learning Rate": 4.980077647481719e-05, "Pretrain/Loss": 2.1674869060516357, "Pretrain/Loss (Raw)": 2.030622720718384, "Pretrain/Step": 658, "Pretrain/Step Time": 8.077365841716528} +{"Pretrain/Learning Rate": 4.979970537539871e-05, "Pretrain/Loss": 2.1654787063598633, "Pretrain/Loss (Raw)": 2.1444149017333984, "Pretrain/Step": 659, "Pretrain/Step Time": 8.070152023807168} +{"Pretrain/Learning Rate": 4.979863141596135e-05, "Pretrain/Loss": 2.165353298187256, "Pretrain/Loss (Raw)": 2.1624081134796143, "Pretrain/Step": 660, "Pretrain/Step Time": 8.07037778571248} +{"Pretrain/Learning Rate": 4.979755459662896e-05, "Pretrain/Loss": 2.164722204208374, "Pretrain/Loss (Raw)": 2.067340612411499, "Pretrain/Step": 661, "Pretrain/Step Time": 8.070735121145844} +{"Pretrain/Learning Rate": 4.979647491752572e-05, "Pretrain/Loss": 2.1654233932495117, "Pretrain/Loss (Raw)": 2.262664318084717, "Pretrain/Step": 662, "Pretrain/Step Time": 8.065204709768295} +{"Pretrain/Learning Rate": 4.979539237877615e-05, "Pretrain/Loss": 2.165457010269165, "Pretrain/Loss (Raw)": 2.127033233642578, "Pretrain/Step": 663, "Pretrain/Step Time": 8.065369946882129} +{"Pretrain/Learning Rate": 4.979430698050509e-05, "Pretrain/Loss": 2.1656546592712402, "Pretrain/Loss (Raw)": 2.1796910762786865, "Pretrain/Step": 664, "Pretrain/Step Time": 8.056694157421589} +{"Pretrain/Learning Rate": 4.979321872283772e-05, "Pretrain/Loss": 2.165304660797119, "Pretrain/Loss (Raw)": 2.1108596324920654, "Pretrain/Step": 665, "Pretrain/Step Time": 8.070790871977806} +{"Pretrain/Learning Rate": 4.979212760589953e-05, "Pretrain/Loss": 2.167137384414673, "Pretrain/Loss (Raw)": 2.3423736095428467, "Pretrain/Step": 666, "Pretrain/Step Time": 8.065280191600323} +{"Pretrain/Learning Rate": 4.9791033629816364e-05, "Pretrain/Loss": 2.165400981903076, "Pretrain/Loss (Raw)": 2.0538878440856934, "Pretrain/Step": 667, "Pretrain/Step Time": 8.06968393549323} +{"Pretrain/Learning Rate": 4.978993679471438e-05, "Pretrain/Loss": 2.1653828620910645, "Pretrain/Loss (Raw)": 2.18019700050354, "Pretrain/Step": 668, "Pretrain/Step Time": 8.06491401977837} +{"Pretrain/Learning Rate": 4.978883710072008e-05, "Pretrain/Loss": 2.164527177810669, "Pretrain/Loss (Raw)": 2.1756203174591064, "Pretrain/Step": 669, "Pretrain/Step Time": 8.06006184592843} +{"Pretrain/Learning Rate": 4.978773454796026e-05, "Pretrain/Loss": 2.16593599319458, "Pretrain/Loss (Raw)": 2.3168785572052, "Pretrain/Step": 670, "Pretrain/Step Time": 8.061800431460142} +{"Pretrain/Learning Rate": 4.9786629136562095e-05, "Pretrain/Loss": 2.167717695236206, "Pretrain/Loss (Raw)": 2.2579386234283447, "Pretrain/Step": 671, "Pretrain/Step Time": 8.058357922360301} +{"Pretrain/Learning Rate": 4.978552086665306e-05, "Pretrain/Loss": 2.1689369678497314, "Pretrain/Loss (Raw)": 2.2896318435668945, "Pretrain/Step": 672, "Pretrain/Step Time": 8.062893951311707} +{"Pretrain/Learning Rate": 4.9784409738360973e-05, "Pretrain/Loss": 2.1695423126220703, "Pretrain/Loss (Raw)": 2.301314115524292, "Pretrain/Step": 673, "Pretrain/Step Time": 8.065315729007125} +{"Pretrain/Learning Rate": 4.978329575181395e-05, "Pretrain/Loss": 2.170527458190918, "Pretrain/Loss (Raw)": 2.2727530002593994, "Pretrain/Step": 674, "Pretrain/Step Time": 8.069206777960062} +{"Pretrain/Learning Rate": 4.978217890714049e-05, "Pretrain/Loss": 2.1695659160614014, "Pretrain/Loss (Raw)": 2.071070671081543, "Pretrain/Step": 675, "Pretrain/Step Time": 8.065087081864476} +{"Pretrain/Learning Rate": 4.978105920446938e-05, "Pretrain/Loss": 2.169718027114868, "Pretrain/Loss (Raw)": 2.1313283443450928, "Pretrain/Step": 676, "Pretrain/Step Time": 8.062928525730968} +{"Pretrain/Learning Rate": 4.977993664392975e-05, "Pretrain/Loss": 2.1702194213867188, "Pretrain/Loss (Raw)": 2.138023853302002, "Pretrain/Step": 677, "Pretrain/Step Time": 8.061824770644307} +{"Pretrain/Learning Rate": 4.9778811225651056e-05, "Pretrain/Loss": 2.169638156890869, "Pretrain/Loss (Raw)": 2.0669755935668945, "Pretrain/Step": 678, "Pretrain/Step Time": 8.060354474931955} +{"Pretrain/Learning Rate": 4.9777682949763096e-05, "Pretrain/Loss": 2.1686007976531982, "Pretrain/Loss (Raw)": 2.139390230178833, "Pretrain/Step": 679, "Pretrain/Step Time": 8.06570882909} +{"Pretrain/Learning Rate": 4.9776551816395975e-05, "Pretrain/Loss": 2.1671009063720703, "Pretrain/Loss (Raw)": 2.174611806869507, "Pretrain/Step": 680, "Pretrain/Step Time": 8.057532165199518} +{"Pretrain/Learning Rate": 4.977541782568015e-05, "Pretrain/Loss": 2.1671066284179688, "Pretrain/Loss (Raw)": 2.3425087928771973, "Pretrain/Step": 681, "Pretrain/Step Time": 8.053234135732055} +{"Pretrain/Learning Rate": 4.97742809777464e-05, "Pretrain/Loss": 2.169391393661499, "Pretrain/Loss (Raw)": 2.4481728076934814, "Pretrain/Step": 682, "Pretrain/Step Time": 8.05745056271553} +{"Pretrain/Learning Rate": 4.9773141272725824e-05, "Pretrain/Loss": 2.168191432952881, "Pretrain/Loss (Raw)": 2.0761656761169434, "Pretrain/Step": 683, "Pretrain/Step Time": 8.055622678250074} +{"Pretrain/Learning Rate": 4.9771998710749864e-05, "Pretrain/Loss": 2.1673471927642822, "Pretrain/Loss (Raw)": 2.017514228820801, "Pretrain/Step": 684, "Pretrain/Step Time": 8.055236209183931} +{"Pretrain/Learning Rate": 4.977085329195028e-05, "Pretrain/Loss": 2.1674752235412598, "Pretrain/Loss (Raw)": 2.203969955444336, "Pretrain/Step": 685, "Pretrain/Step Time": 8.064060788601637} +{"Pretrain/Learning Rate": 4.9769705016459164e-05, "Pretrain/Loss": 2.1680679321289062, "Pretrain/Loss (Raw)": 2.299203634262085, "Pretrain/Step": 686, "Pretrain/Step Time": 8.050788732245564} +{"Pretrain/Learning Rate": 4.976855388440896e-05, "Pretrain/Loss": 2.168924570083618, "Pretrain/Loss (Raw)": 2.206463098526001, "Pretrain/Step": 687, "Pretrain/Step Time": 8.055072646588087} +{"Pretrain/Learning Rate": 4.97673998959324e-05, "Pretrain/Loss": 2.169373035430908, "Pretrain/Loss (Raw)": 2.1721913814544678, "Pretrain/Step": 688, "Pretrain/Step Time": 8.062664173543453} +{"Pretrain/Learning Rate": 4.976624305116259e-05, "Pretrain/Loss": 2.1687169075012207, "Pretrain/Loss (Raw)": 2.141026258468628, "Pretrain/Step": 689, "Pretrain/Step Time": 8.0549789480865} +{"Pretrain/Learning Rate": 4.9765083350232913e-05, "Pretrain/Loss": 2.168821096420288, "Pretrain/Loss (Raw)": 2.228165626525879, "Pretrain/Step": 690, "Pretrain/Step Time": 8.053290029987693} +{"Pretrain/Learning Rate": 4.976392079327713e-05, "Pretrain/Loss": 2.1685538291931152, "Pretrain/Loss (Raw)": 2.170105218887329, "Pretrain/Step": 691, "Pretrain/Step Time": 8.052497578784823} +{"Pretrain/Learning Rate": 4.976275538042932e-05, "Pretrain/Loss": 2.1690778732299805, "Pretrain/Loss (Raw)": 2.2109897136688232, "Pretrain/Step": 692, "Pretrain/Step Time": 8.04825309664011} +{"Pretrain/Learning Rate": 4.976158711182386e-05, "Pretrain/Loss": 2.167832374572754, "Pretrain/Loss (Raw)": 2.0852549076080322, "Pretrain/Step": 693, "Pretrain/Step Time": 8.059906931594014} +{"Pretrain/Learning Rate": 4.9760415987595496e-05, "Pretrain/Loss": 2.1647653579711914, "Pretrain/Loss (Raw)": 2.050861358642578, "Pretrain/Step": 694, "Pretrain/Step Time": 8.060624171048403} +{"Pretrain/Learning Rate": 4.9759242007879295e-05, "Pretrain/Loss": 2.1637489795684814, "Pretrain/Loss (Raw)": 2.0303845405578613, "Pretrain/Step": 695, "Pretrain/Step Time": 8.061178924515843} +{"Pretrain/Learning Rate": 4.975806517281062e-05, "Pretrain/Loss": 2.16279935836792, "Pretrain/Loss (Raw)": 2.1919376850128174, "Pretrain/Step": 696, "Pretrain/Step Time": 8.061877308413386} +{"Pretrain/Learning Rate": 4.975688548252522e-05, "Pretrain/Loss": 2.1625804901123047, "Pretrain/Loss (Raw)": 2.1530861854553223, "Pretrain/Step": 697, "Pretrain/Step Time": 8.061944788321853} +{"Pretrain/Learning Rate": 4.9755702937159124e-05, "Pretrain/Loss": 2.161691188812256, "Pretrain/Loss (Raw)": 2.3753318786621094, "Pretrain/Step": 698, "Pretrain/Step Time": 8.064764665439725} +{"Pretrain/Learning Rate": 4.975451753684871e-05, "Pretrain/Loss": 2.1607165336608887, "Pretrain/Loss (Raw)": 2.0932862758636475, "Pretrain/Step": 699, "Pretrain/Step Time": 8.0588951241225} +{"Pretrain/Learning Rate": 4.975332928173069e-05, "Pretrain/Loss": 2.1587600708007812, "Pretrain/Loss (Raw)": 2.0228757858276367, "Pretrain/Step": 700, "Pretrain/Step Time": 8.066409224644303} +{"Pretrain/Learning Rate": 4.975213817194209e-05, "Pretrain/Loss": 2.1594173908233643, "Pretrain/Loss (Raw)": 2.2863945960998535, "Pretrain/Step": 701, "Pretrain/Step Time": 8.0546342600137} +{"Pretrain/Learning Rate": 4.975094420762029e-05, "Pretrain/Loss": 2.1587297916412354, "Pretrain/Loss (Raw)": 2.107710361480713, "Pretrain/Step": 702, "Pretrain/Step Time": 8.063912011682987} +{"Pretrain/Learning Rate": 4.9749747388902964e-05, "Pretrain/Loss": 2.159501552581787, "Pretrain/Loss (Raw)": 2.275029420852661, "Pretrain/Step": 703, "Pretrain/Step Time": 8.057826027274132} +{"Pretrain/Learning Rate": 4.974854771592815e-05, "Pretrain/Loss": 2.1600046157836914, "Pretrain/Loss (Raw)": 2.0842511653900146, "Pretrain/Step": 704, "Pretrain/Step Time": 8.0510019287467} +{"Pretrain/Learning Rate": 4.974734518883419e-05, "Pretrain/Loss": 2.1589884757995605, "Pretrain/Loss (Raw)": 2.0243701934814453, "Pretrain/Step": 705, "Pretrain/Step Time": 8.053199818357825} +{"Pretrain/Learning Rate": 4.974613980775977e-05, "Pretrain/Loss": 2.1608595848083496, "Pretrain/Loss (Raw)": 2.2620327472686768, "Pretrain/Step": 706, "Pretrain/Step Time": 8.049537705257535} +{"Pretrain/Learning Rate": 4.974493157284391e-05, "Pretrain/Loss": 2.1607918739318848, "Pretrain/Loss (Raw)": 2.1555933952331543, "Pretrain/Step": 707, "Pretrain/Step Time": 8.055004691705108} +{"Pretrain/Learning Rate": 4.974372048422593e-05, "Pretrain/Loss": 2.160614252090454, "Pretrain/Loss (Raw)": 2.1866660118103027, "Pretrain/Step": 708, "Pretrain/Step Time": 8.054371524602175} +{"Pretrain/Learning Rate": 4.974250654204551e-05, "Pretrain/Loss": 2.158987283706665, "Pretrain/Loss (Raw)": 1.978726863861084, "Pretrain/Step": 709, "Pretrain/Step Time": 8.04972319304943} +{"Pretrain/Learning Rate": 4.974128974644264e-05, "Pretrain/Loss": 2.1594715118408203, "Pretrain/Loss (Raw)": 2.1319468021392822, "Pretrain/Step": 710, "Pretrain/Step Time": 8.051254861056805} +{"Pretrain/Learning Rate": 4.9740070097557656e-05, "Pretrain/Loss": 2.1608309745788574, "Pretrain/Loss (Raw)": 2.3409643173217773, "Pretrain/Step": 711, "Pretrain/Step Time": 8.047808973118663} +{"Pretrain/Learning Rate": 4.973884759553121e-05, "Pretrain/Loss": 2.1594648361206055, "Pretrain/Loss (Raw)": 2.179206132888794, "Pretrain/Step": 712, "Pretrain/Step Time": 8.053746528923512} +{"Pretrain/Learning Rate": 4.973762224050428e-05, "Pretrain/Loss": 2.1586081981658936, "Pretrain/Loss (Raw)": 2.077467679977417, "Pretrain/Step": 713, "Pretrain/Step Time": 8.053891994059086} +{"Pretrain/Learning Rate": 4.973639403261819e-05, "Pretrain/Loss": 2.158623695373535, "Pretrain/Loss (Raw)": 2.12882399559021, "Pretrain/Step": 714, "Pretrain/Step Time": 8.059122806414962} +{"Pretrain/Learning Rate": 4.9735162972014584e-05, "Pretrain/Loss": 2.1600868701934814, "Pretrain/Loss (Raw)": 2.210930824279785, "Pretrain/Step": 715, "Pretrain/Step Time": 8.053435508161783} +{"Pretrain/Learning Rate": 4.9733929058835425e-05, "Pretrain/Loss": 2.160249948501587, "Pretrain/Loss (Raw)": 2.103198528289795, "Pretrain/Step": 716, "Pretrain/Step Time": 8.056827267631888} +{"Pretrain/Learning Rate": 4.973269229322301e-05, "Pretrain/Loss": 2.161304473876953, "Pretrain/Loss (Raw)": 2.1978249549865723, "Pretrain/Step": 717, "Pretrain/Step Time": 8.061292437836528} +{"Pretrain/Learning Rate": 4.973145267531998e-05, "Pretrain/Loss": 2.1619510650634766, "Pretrain/Loss (Raw)": 2.1581692695617676, "Pretrain/Step": 718, "Pretrain/Step Time": 8.058358259499073} +{"Pretrain/Learning Rate": 4.973021020526929e-05, "Pretrain/Loss": 2.159944772720337, "Pretrain/Loss (Raw)": 2.078972339630127, "Pretrain/Step": 719, "Pretrain/Step Time": 8.057297874242067} +{"Pretrain/Learning Rate": 4.972896488321422e-05, "Pretrain/Loss": 2.158754348754883, "Pretrain/Loss (Raw)": 2.0673277378082275, "Pretrain/Step": 720, "Pretrain/Step Time": 8.057609943673015} +{"Pretrain/Learning Rate": 4.97277167092984e-05, "Pretrain/Loss": 2.1576337814331055, "Pretrain/Loss (Raw)": 2.147122383117676, "Pretrain/Step": 721, "Pretrain/Step Time": 8.060625800862908} +{"Pretrain/Learning Rate": 4.972646568366577e-05, "Pretrain/Loss": 2.1572346687316895, "Pretrain/Loss (Raw)": 2.153867721557617, "Pretrain/Step": 722, "Pretrain/Step Time": 8.055454056710005} +{"Pretrain/Learning Rate": 4.9725211806460604e-05, "Pretrain/Loss": 2.1565165519714355, "Pretrain/Loss (Raw)": 2.050532341003418, "Pretrain/Step": 723, "Pretrain/Step Time": 8.06125227175653} +{"Pretrain/Learning Rate": 4.97239550778275e-05, "Pretrain/Loss": 2.1560158729553223, "Pretrain/Loss (Raw)": 2.129646062850952, "Pretrain/Step": 724, "Pretrain/Step Time": 8.055563317611814} +{"Pretrain/Learning Rate": 4.972269549791139e-05, "Pretrain/Loss": 2.1551084518432617, "Pretrain/Loss (Raw)": 2.1259169578552246, "Pretrain/Step": 725, "Pretrain/Step Time": 8.063870346173644} +{"Pretrain/Learning Rate": 4.9721433066857535e-05, "Pretrain/Loss": 2.1542248725891113, "Pretrain/Loss (Raw)": 2.059910774230957, "Pretrain/Step": 726, "Pretrain/Step Time": 8.064402371644974} +{"Pretrain/Learning Rate": 4.9720167784811535e-05, "Pretrain/Loss": 2.1559996604919434, "Pretrain/Loss (Raw)": 2.3000569343566895, "Pretrain/Step": 727, "Pretrain/Step Time": 8.061191629618406} +{"Pretrain/Learning Rate": 4.97188996519193e-05, "Pretrain/Loss": 2.156214952468872, "Pretrain/Loss (Raw)": 2.0806257724761963, "Pretrain/Step": 728, "Pretrain/Step Time": 8.065215954557061} +{"Pretrain/Learning Rate": 4.971762866832708e-05, "Pretrain/Loss": 2.154587507247925, "Pretrain/Loss (Raw)": 2.077981948852539, "Pretrain/Step": 729, "Pretrain/Step Time": 8.058714324608445} +{"Pretrain/Learning Rate": 4.971635483418144e-05, "Pretrain/Loss": 2.155235528945923, "Pretrain/Loss (Raw)": 2.1702523231506348, "Pretrain/Step": 730, "Pretrain/Step Time": 8.065703658387065} +{"Pretrain/Learning Rate": 4.97150781496293e-05, "Pretrain/Loss": 2.154758930206299, "Pretrain/Loss (Raw)": 2.173964738845825, "Pretrain/Step": 731, "Pretrain/Step Time": 8.071284782141447} +{"Pretrain/Learning Rate": 4.971379861481789e-05, "Pretrain/Loss": 2.1540396213531494, "Pretrain/Loss (Raw)": 2.131788969039917, "Pretrain/Step": 732, "Pretrain/Step Time": 8.074681598693132} +{"Pretrain/Learning Rate": 4.9712516229894756e-05, "Pretrain/Loss": 2.1550588607788086, "Pretrain/Loss (Raw)": 2.2047057151794434, "Pretrain/Step": 733, "Pretrain/Step Time": 8.08194193802774} +{"Pretrain/Learning Rate": 4.971123099500781e-05, "Pretrain/Loss": 2.155190944671631, "Pretrain/Loss (Raw)": 2.2215447425842285, "Pretrain/Step": 734, "Pretrain/Step Time": 8.079595005139709} +{"Pretrain/Learning Rate": 4.970994291030526e-05, "Pretrain/Loss": 2.1555683612823486, "Pretrain/Loss (Raw)": 2.230883836746216, "Pretrain/Step": 735, "Pretrain/Step Time": 8.076135145500302} +{"Pretrain/Learning Rate": 4.970865197593566e-05, "Pretrain/Loss": 2.154025077819824, "Pretrain/Loss (Raw)": 2.091573715209961, "Pretrain/Step": 736, "Pretrain/Step Time": 8.074538925662637} +{"Pretrain/Learning Rate": 4.9707358192047885e-05, "Pretrain/Loss": 2.1546239852905273, "Pretrain/Loss (Raw)": 2.0650458335876465, "Pretrain/Step": 737, "Pretrain/Step Time": 8.07619079388678} +{"Pretrain/Learning Rate": 4.970606155879113e-05, "Pretrain/Loss": 2.154651641845703, "Pretrain/Loss (Raw)": 2.0794854164123535, "Pretrain/Step": 738, "Pretrain/Step Time": 8.076209124177694} +{"Pretrain/Learning Rate": 4.970476207631494e-05, "Pretrain/Loss": 2.1538336277008057, "Pretrain/Loss (Raw)": 2.1020314693450928, "Pretrain/Step": 739, "Pretrain/Step Time": 8.074352372437716} +{"Pretrain/Learning Rate": 4.970345974476918e-05, "Pretrain/Loss": 2.1545395851135254, "Pretrain/Loss (Raw)": 2.0744802951812744, "Pretrain/Step": 740, "Pretrain/Step Time": 8.074063405394554} +{"Pretrain/Learning Rate": 4.970215456430403e-05, "Pretrain/Loss": 2.1539340019226074, "Pretrain/Loss (Raw)": 2.121299982070923, "Pretrain/Step": 741, "Pretrain/Step Time": 8.069562030956149} +{"Pretrain/Learning Rate": 4.970084653507001e-05, "Pretrain/Loss": 2.1549012660980225, "Pretrain/Loss (Raw)": 2.057191848754883, "Pretrain/Step": 742, "Pretrain/Step Time": 8.06542506814003} +{"Pretrain/Learning Rate": 4.969953565721799e-05, "Pretrain/Loss": 2.154404640197754, "Pretrain/Loss (Raw)": 2.0815963745117188, "Pretrain/Step": 743, "Pretrain/Step Time": 8.074742456898093} +{"Pretrain/Learning Rate": 4.969822193089911e-05, "Pretrain/Loss": 2.156052589416504, "Pretrain/Loss (Raw)": 2.256197929382324, "Pretrain/Step": 744, "Pretrain/Step Time": 8.069614488631487} +{"Pretrain/Learning Rate": 4.969690535626491e-05, "Pretrain/Loss": 2.1560122966766357, "Pretrain/Loss (Raw)": 2.064650535583496, "Pretrain/Step": 745, "Pretrain/Step Time": 8.067923218011856} +{"Pretrain/Learning Rate": 4.96955859334672e-05, "Pretrain/Loss": 2.155621290206909, "Pretrain/Loss (Raw)": 2.132814645767212, "Pretrain/Step": 746, "Pretrain/Step Time": 8.062701696529984} +{"Pretrain/Learning Rate": 4.9694263662658156e-05, "Pretrain/Loss": 2.1560616493225098, "Pretrain/Loss (Raw)": 2.36124587059021, "Pretrain/Step": 747, "Pretrain/Step Time": 8.062760405242443} +{"Pretrain/Learning Rate": 4.9692938543990265e-05, "Pretrain/Loss": 2.1568562984466553, "Pretrain/Loss (Raw)": 2.255486249923706, "Pretrain/Step": 748, "Pretrain/Step Time": 8.058746095746756} +{"Pretrain/Learning Rate": 4.969161057761634e-05, "Pretrain/Loss": 2.1575417518615723, "Pretrain/Loss (Raw)": 2.2634530067443848, "Pretrain/Step": 749, "Pretrain/Step Time": 8.069188244640827} +{"Pretrain/Learning Rate": 4.969027976368954e-05, "Pretrain/Loss": 2.1564042568206787, "Pretrain/Loss (Raw)": 2.095337152481079, "Pretrain/Step": 750, "Pretrain/Step Time": 8.070373628288507} +{"Pretrain/Learning Rate": 4.968894610236332e-05, "Pretrain/Loss": 2.1569879055023193, "Pretrain/Loss (Raw)": 2.1553144454956055, "Pretrain/Step": 751, "Pretrain/Step Time": 8.066992994397879} +{"Pretrain/Learning Rate": 4.968760959379151e-05, "Pretrain/Loss": 2.156479835510254, "Pretrain/Loss (Raw)": 2.1027560234069824, "Pretrain/Step": 752, "Pretrain/Step Time": 8.075053980574012} +{"Pretrain/Learning Rate": 4.968627023812822e-05, "Pretrain/Loss": 2.1590819358825684, "Pretrain/Loss (Raw)": 2.419891834259033, "Pretrain/Step": 753, "Pretrain/Step Time": 8.07009800337255} +{"Pretrain/Learning Rate": 4.968492803552793e-05, "Pretrain/Loss": 2.1602203845977783, "Pretrain/Loss (Raw)": 2.2725419998168945, "Pretrain/Step": 754, "Pretrain/Step Time": 8.069279689341784} +{"Pretrain/Learning Rate": 4.968358298614541e-05, "Pretrain/Loss": 2.160335063934326, "Pretrain/Loss (Raw)": 2.103933095932007, "Pretrain/Step": 755, "Pretrain/Step Time": 8.06618364714086} +{"Pretrain/Learning Rate": 4.968223509013579e-05, "Pretrain/Loss": 2.162092685699463, "Pretrain/Loss (Raw)": 2.3568801879882812, "Pretrain/Step": 756, "Pretrain/Step Time": 8.062963841482997} +{"Pretrain/Learning Rate": 4.968088434765452e-05, "Pretrain/Loss": 2.163517951965332, "Pretrain/Loss (Raw)": 2.2927658557891846, "Pretrain/Step": 757, "Pretrain/Step Time": 8.061346933245659} +{"Pretrain/Learning Rate": 4.967953075885736e-05, "Pretrain/Loss": 2.1635570526123047, "Pretrain/Loss (Raw)": 2.09403133392334, "Pretrain/Step": 758, "Pretrain/Step Time": 8.063801154494286} +{"Pretrain/Learning Rate": 4.9678174323900415e-05, "Pretrain/Loss": 2.1647934913635254, "Pretrain/Loss (Raw)": 2.2312610149383545, "Pretrain/Step": 759, "Pretrain/Step Time": 8.068189138546586} +{"Pretrain/Learning Rate": 4.9676815042940125e-05, "Pretrain/Loss": 2.1631669998168945, "Pretrain/Loss (Raw)": 2.0424039363861084, "Pretrain/Step": 760, "Pretrain/Step Time": 8.06068609841168} +{"Pretrain/Learning Rate": 4.967545291613325e-05, "Pretrain/Loss": 2.163910388946533, "Pretrain/Loss (Raw)": 2.1668283939361572, "Pretrain/Step": 761, "Pretrain/Step Time": 8.062617104500532} +{"Pretrain/Learning Rate": 4.967408794363686e-05, "Pretrain/Loss": 2.164132595062256, "Pretrain/Loss (Raw)": 2.2641544342041016, "Pretrain/Step": 762, "Pretrain/Step Time": 8.058175258338451} +{"Pretrain/Learning Rate": 4.9672720125608384e-05, "Pretrain/Loss": 2.16471791267395, "Pretrain/Loss (Raw)": 2.203794002532959, "Pretrain/Step": 763, "Pretrain/Step Time": 8.059578750282526} +{"Pretrain/Learning Rate": 4.9671349462205565e-05, "Pretrain/Loss": 2.1670236587524414, "Pretrain/Loss (Raw)": 2.321589231491089, "Pretrain/Step": 764, "Pretrain/Step Time": 8.061157451942563} +{"Pretrain/Learning Rate": 4.966997595358647e-05, "Pretrain/Loss": 2.1675686836242676, "Pretrain/Loss (Raw)": 2.257748603820801, "Pretrain/Step": 765, "Pretrain/Step Time": 8.04993057437241} +{"Pretrain/Learning Rate": 4.966859959990949e-05, "Pretrain/Loss": 2.1697838306427, "Pretrain/Loss (Raw)": 2.3485023975372314, "Pretrain/Step": 766, "Pretrain/Step Time": 8.061697313562036} +{"Pretrain/Learning Rate": 4.966722040133337e-05, "Pretrain/Loss": 2.168884515762329, "Pretrain/Loss (Raw)": 2.1265926361083984, "Pretrain/Step": 767, "Pretrain/Step Time": 8.060660755261779} +{"Pretrain/Learning Rate": 4.9665838358017156e-05, "Pretrain/Loss": 2.16983962059021, "Pretrain/Loss (Raw)": 2.2692558765411377, "Pretrain/Step": 768, "Pretrain/Step Time": 8.068068496882915} +{"Pretrain/Learning Rate": 4.966445347012023e-05, "Pretrain/Loss": 2.169154405593872, "Pretrain/Loss (Raw)": 2.0068345069885254, "Pretrain/Step": 769, "Pretrain/Step Time": 8.063778840005398} +{"Pretrain/Learning Rate": 4.9663065737802316e-05, "Pretrain/Loss": 2.169257164001465, "Pretrain/Loss (Raw)": 2.183851480484009, "Pretrain/Step": 770, "Pretrain/Step Time": 8.058704713359475} +{"Pretrain/Learning Rate": 4.9661675161223435e-05, "Pretrain/Loss": 2.170185089111328, "Pretrain/Loss (Raw)": 2.1099231243133545, "Pretrain/Step": 771, "Pretrain/Step Time": 8.06119403988123} +{"Pretrain/Learning Rate": 4.966028174054397e-05, "Pretrain/Loss": 2.170396327972412, "Pretrain/Loss (Raw)": 2.3067386150360107, "Pretrain/Step": 772, "Pretrain/Step Time": 8.058356510475278} +{"Pretrain/Learning Rate": 4.965888547592461e-05, "Pretrain/Loss": 2.1693668365478516, "Pretrain/Loss (Raw)": 2.0224485397338867, "Pretrain/Step": 773, "Pretrain/Step Time": 8.067434668540955} +{"Pretrain/Learning Rate": 4.965748636752638e-05, "Pretrain/Loss": 2.168097734451294, "Pretrain/Loss (Raw)": 2.145052909851074, "Pretrain/Step": 774, "Pretrain/Step Time": 8.064396515488625} +{"Pretrain/Learning Rate": 4.965608441551063e-05, "Pretrain/Loss": 2.1678967475891113, "Pretrain/Loss (Raw)": 2.174872636795044, "Pretrain/Step": 775, "Pretrain/Step Time": 8.065306210890412} +{"Pretrain/Learning Rate": 4.965467962003905e-05, "Pretrain/Loss": 2.167965888977051, "Pretrain/Loss (Raw)": 2.1575541496276855, "Pretrain/Step": 776, "Pretrain/Step Time": 8.060714647173882} +{"Pretrain/Learning Rate": 4.965327198127363e-05, "Pretrain/Loss": 2.1688852310180664, "Pretrain/Loss (Raw)": 2.2139031887054443, "Pretrain/Step": 777, "Pretrain/Step Time": 8.063269095495343} +{"Pretrain/Learning Rate": 4.965186149937672e-05, "Pretrain/Loss": 2.1689696311950684, "Pretrain/Loss (Raw)": 2.176039457321167, "Pretrain/Step": 778, "Pretrain/Step Time": 8.067697864025831} +{"Pretrain/Learning Rate": 4.9650448174510986e-05, "Pretrain/Loss": 2.1710355281829834, "Pretrain/Loss (Raw)": 2.392080783843994, "Pretrain/Step": 779, "Pretrain/Step Time": 8.058114893734455} +{"Pretrain/Learning Rate": 4.9649032006839404e-05, "Pretrain/Loss": 2.1707518100738525, "Pretrain/Loss (Raw)": 2.1324825286865234, "Pretrain/Step": 780, "Pretrain/Step Time": 8.060820039361715} +{"Pretrain/Learning Rate": 4.964761299652529e-05, "Pretrain/Loss": 2.171341896057129, "Pretrain/Loss (Raw)": 2.096407175064087, "Pretrain/Step": 781, "Pretrain/Step Time": 8.061034152284265} +{"Pretrain/Learning Rate": 4.9646191143732324e-05, "Pretrain/Loss": 2.1723501682281494, "Pretrain/Loss (Raw)": 2.323491334915161, "Pretrain/Step": 782, "Pretrain/Step Time": 8.06283081509173} +{"Pretrain/Learning Rate": 4.9644766448624444e-05, "Pretrain/Loss": 2.1723551750183105, "Pretrain/Loss (Raw)": 2.264592409133911, "Pretrain/Step": 783, "Pretrain/Step Time": 8.057528832927346} +{"Pretrain/Learning Rate": 4.9643338911365964e-05, "Pretrain/Loss": 2.17114520072937, "Pretrain/Loss (Raw)": 2.1009345054626465, "Pretrain/Step": 784, "Pretrain/Step Time": 8.057224694639444} +{"Pretrain/Learning Rate": 4.9641908532121525e-05, "Pretrain/Loss": 2.171466112136841, "Pretrain/Loss (Raw)": 2.1974010467529297, "Pretrain/Step": 785, "Pretrain/Step Time": 8.056316191330552} +{"Pretrain/Learning Rate": 4.964047531105608e-05, "Pretrain/Loss": 2.1726317405700684, "Pretrain/Loss (Raw)": 2.1798102855682373, "Pretrain/Step": 786, "Pretrain/Step Time": 8.05619447119534} +{"Pretrain/Learning Rate": 4.963903924833491e-05, "Pretrain/Loss": 2.1719133853912354, "Pretrain/Loss (Raw)": 2.052457571029663, "Pretrain/Step": 787, "Pretrain/Step Time": 8.061881644651294} +{"Pretrain/Learning Rate": 4.963760034412363e-05, "Pretrain/Loss": 2.1724472045898438, "Pretrain/Loss (Raw)": 2.2307486534118652, "Pretrain/Step": 788, "Pretrain/Step Time": 8.056928368285298} +{"Pretrain/Learning Rate": 4.9636158598588185e-05, "Pretrain/Loss": 2.172201156616211, "Pretrain/Loss (Raw)": 2.035827875137329, "Pretrain/Step": 789, "Pretrain/Step Time": 8.053231438621879} +{"Pretrain/Learning Rate": 4.9634714011894836e-05, "Pretrain/Loss": 2.171020984649658, "Pretrain/Loss (Raw)": 2.1116130352020264, "Pretrain/Step": 790, "Pretrain/Step Time": 8.051036247983575} +{"Pretrain/Learning Rate": 4.963326658421019e-05, "Pretrain/Loss": 2.17112398147583, "Pretrain/Loss (Raw)": 2.1402056217193604, "Pretrain/Step": 791, "Pretrain/Step Time": 8.058659302070737} +{"Pretrain/Learning Rate": 4.9631816315701165e-05, "Pretrain/Loss": 2.170422077178955, "Pretrain/Loss (Raw)": 2.089846134185791, "Pretrain/Step": 792, "Pretrain/Step Time": 8.060361001640558} +{"Pretrain/Learning Rate": 4.9630363206535e-05, "Pretrain/Loss": 2.171837091445923, "Pretrain/Loss (Raw)": 2.2920093536376953, "Pretrain/Step": 793, "Pretrain/Step Time": 8.046535274013877} +{"Pretrain/Learning Rate": 4.962890725687931e-05, "Pretrain/Loss": 2.169668197631836, "Pretrain/Loss (Raw)": 2.0647449493408203, "Pretrain/Step": 794, "Pretrain/Step Time": 8.054052099585533} +{"Pretrain/Learning Rate": 4.962744846690196e-05, "Pretrain/Loss": 2.1710753440856934, "Pretrain/Loss (Raw)": 2.2339863777160645, "Pretrain/Step": 795, "Pretrain/Step Time": 8.043112488463521} +{"Pretrain/Learning Rate": 4.962598683677122e-05, "Pretrain/Loss": 2.1708950996398926, "Pretrain/Loss (Raw)": 2.157160758972168, "Pretrain/Step": 796, "Pretrain/Step Time": 8.051904240623116} +{"Pretrain/Learning Rate": 4.9624522366655625e-05, "Pretrain/Loss": 2.1700799465179443, "Pretrain/Loss (Raw)": 2.071288824081421, "Pretrain/Step": 797, "Pretrain/Step Time": 8.048221129924059} +{"Pretrain/Learning Rate": 4.962305505672408e-05, "Pretrain/Loss": 2.1678943634033203, "Pretrain/Loss (Raw)": 2.0370731353759766, "Pretrain/Step": 798, "Pretrain/Step Time": 8.043371617794037} +{"Pretrain/Learning Rate": 4.96215849071458e-05, "Pretrain/Loss": 2.166720151901245, "Pretrain/Loss (Raw)": 2.1076581478118896, "Pretrain/Step": 799, "Pretrain/Step Time": 8.044056635349989} +{"Pretrain/Learning Rate": 4.962011191809033e-05, "Pretrain/Loss": 2.165496826171875, "Pretrain/Loss (Raw)": 2.133038282394409, "Pretrain/Step": 800, "Pretrain/Step Time": 8.043572587892413} +{"Pretrain/Learning Rate": 4.961863608972753e-05, "Pretrain/Loss": 2.164801597595215, "Pretrain/Loss (Raw)": 2.2123358249664307, "Pretrain/Step": 801, "Pretrain/Step Time": 8.046874791383743} +{"Pretrain/Learning Rate": 4.961715742222762e-05, "Pretrain/Loss": 2.1640636920928955, "Pretrain/Loss (Raw)": 2.178279399871826, "Pretrain/Step": 802, "Pretrain/Step Time": 8.04427707195282} +{"Pretrain/Learning Rate": 4.961567591576112e-05, "Pretrain/Loss": 2.1640915870666504, "Pretrain/Loss (Raw)": 2.074659585952759, "Pretrain/Step": 803, "Pretrain/Step Time": 8.047620078548789} +{"Pretrain/Learning Rate": 4.961419157049887e-05, "Pretrain/Loss": 2.1649725437164307, "Pretrain/Loss (Raw)": 2.244105577468872, "Pretrain/Step": 804, "Pretrain/Step Time": 8.041760483756661} +{"Pretrain/Learning Rate": 4.9612704386612066e-05, "Pretrain/Loss": 2.1639864444732666, "Pretrain/Loss (Raw)": 2.0118024349212646, "Pretrain/Step": 805, "Pretrain/Step Time": 8.050812615081668} +{"Pretrain/Learning Rate": 4.9611214364272206e-05, "Pretrain/Loss": 2.1648287773132324, "Pretrain/Loss (Raw)": 2.1747732162475586, "Pretrain/Step": 806, "Pretrain/Step Time": 8.052702959626913} +{"Pretrain/Learning Rate": 4.960972150365114e-05, "Pretrain/Loss": 2.1648504734039307, "Pretrain/Loss (Raw)": 2.142165184020996, "Pretrain/Step": 807, "Pretrain/Step Time": 8.047347089275718} +{"Pretrain/Learning Rate": 4.960822580492103e-05, "Pretrain/Loss": 2.163548231124878, "Pretrain/Loss (Raw)": 2.0079331398010254, "Pretrain/Step": 808, "Pretrain/Step Time": 8.048061868175864} +{"Pretrain/Learning Rate": 4.960672726825436e-05, "Pretrain/Loss": 2.1625092029571533, "Pretrain/Loss (Raw)": 2.209524393081665, "Pretrain/Step": 809, "Pretrain/Step Time": 8.049795847386122} +{"Pretrain/Learning Rate": 4.960522589382395e-05, "Pretrain/Loss": 2.1601762771606445, "Pretrain/Loss (Raw)": 2.149559497833252, "Pretrain/Step": 810, "Pretrain/Step Time": 8.050859598442912} +{"Pretrain/Learning Rate": 4.960372168180294e-05, "Pretrain/Loss": 2.1599953174591064, "Pretrain/Loss (Raw)": 2.0529897212982178, "Pretrain/Step": 811, "Pretrain/Step Time": 8.057140870019794} +{"Pretrain/Learning Rate": 4.9602214632364816e-05, "Pretrain/Loss": 2.1613359451293945, "Pretrain/Loss (Raw)": 2.1891229152679443, "Pretrain/Step": 812, "Pretrain/Step Time": 8.056501938030124} +{"Pretrain/Learning Rate": 4.9600704745683367e-05, "Pretrain/Loss": 2.1616830825805664, "Pretrain/Loss (Raw)": 2.248422384262085, "Pretrain/Step": 813, "Pretrain/Step Time": 8.055170461535454} +{"Pretrain/Learning Rate": 4.959919202193273e-05, "Pretrain/Loss": 2.161113977432251, "Pretrain/Loss (Raw)": 2.226341724395752, "Pretrain/Step": 814, "Pretrain/Step Time": 8.057387487962842} +{"Pretrain/Learning Rate": 4.959767646128735e-05, "Pretrain/Loss": 2.1600067615509033, "Pretrain/Loss (Raw)": 2.0647149085998535, "Pretrain/Step": 815, "Pretrain/Step Time": 8.059786839410663} +{"Pretrain/Learning Rate": 4.959615806392201e-05, "Pretrain/Loss": 2.15864896774292, "Pretrain/Loss (Raw)": 1.9983899593353271, "Pretrain/Step": 816, "Pretrain/Step Time": 8.054230198264122} +{"Pretrain/Learning Rate": 4.959463683001182e-05, "Pretrain/Loss": 2.1578598022460938, "Pretrain/Loss (Raw)": 2.0400116443634033, "Pretrain/Step": 817, "Pretrain/Step Time": 8.059471325948834} +{"Pretrain/Learning Rate": 4.959311275973223e-05, "Pretrain/Loss": 2.1578547954559326, "Pretrain/Loss (Raw)": 2.227543592453003, "Pretrain/Step": 818, "Pretrain/Step Time": 8.053293848410249} +{"Pretrain/Learning Rate": 4.959158585325898e-05, "Pretrain/Loss": 2.157595634460449, "Pretrain/Loss (Raw)": 2.136937141418457, "Pretrain/Step": 819, "Pretrain/Step Time": 8.06110555306077} +{"Pretrain/Learning Rate": 4.959005611076817e-05, "Pretrain/Loss": 2.1571459770202637, "Pretrain/Loss (Raw)": 2.153465986251831, "Pretrain/Step": 820, "Pretrain/Step Time": 8.066182071343064} +{"Pretrain/Learning Rate": 4.9588523532436214e-05, "Pretrain/Loss": 2.157487154006958, "Pretrain/Loss (Raw)": 2.128899097442627, "Pretrain/Step": 821, "Pretrain/Step Time": 8.059834571555257} +{"Pretrain/Learning Rate": 4.9586988118439863e-05, "Pretrain/Loss": 2.1579415798187256, "Pretrain/Loss (Raw)": 2.109008312225342, "Pretrain/Step": 822, "Pretrain/Step Time": 8.06205339729786} +{"Pretrain/Learning Rate": 4.958544986895619e-05, "Pretrain/Loss": 2.158611297607422, "Pretrain/Loss (Raw)": 2.1160976886749268, "Pretrain/Step": 823, "Pretrain/Step Time": 8.055891528725624} +{"Pretrain/Learning Rate": 4.958390878416258e-05, "Pretrain/Loss": 2.158125400543213, "Pretrain/Loss (Raw)": 2.129772901535034, "Pretrain/Step": 824, "Pretrain/Step Time": 8.057458071038127} +{"Pretrain/Learning Rate": 4.9582364864236765e-05, "Pretrain/Loss": 2.1582112312316895, "Pretrain/Loss (Raw)": 2.164066791534424, "Pretrain/Step": 825, "Pretrain/Step Time": 8.062747027724981} +{"Pretrain/Learning Rate": 4.95808181093568e-05, "Pretrain/Loss": 2.1563429832458496, "Pretrain/Loss (Raw)": 2.1362011432647705, "Pretrain/Step": 826, "Pretrain/Step Time": 8.052077459171414} +{"Pretrain/Learning Rate": 4.9579268519701063e-05, "Pretrain/Loss": 2.157235622406006, "Pretrain/Loss (Raw)": 2.2075448036193848, "Pretrain/Step": 827, "Pretrain/Step Time": 8.05860504321754} +{"Pretrain/Learning Rate": 4.957771609544826e-05, "Pretrain/Loss": 2.1587886810302734, "Pretrain/Loss (Raw)": 2.2216553688049316, "Pretrain/Step": 828, "Pretrain/Step Time": 8.049628401175141} +{"Pretrain/Learning Rate": 4.957616083677742e-05, "Pretrain/Loss": 2.1572184562683105, "Pretrain/Loss (Raw)": 2.0854036808013916, "Pretrain/Step": 829, "Pretrain/Step Time": 8.058984108269215} +{"Pretrain/Learning Rate": 4.9574602743867916e-05, "Pretrain/Loss": 2.1573610305786133, "Pretrain/Loss (Raw)": 2.1259467601776123, "Pretrain/Step": 830, "Pretrain/Step Time": 8.05671763792634} +{"Pretrain/Learning Rate": 4.957304181689941e-05, "Pretrain/Loss": 2.1570701599121094, "Pretrain/Loss (Raw)": 2.237797498703003, "Pretrain/Step": 831, "Pretrain/Step Time": 8.061393344774842} +{"Pretrain/Learning Rate": 4.957147805605194e-05, "Pretrain/Loss": 2.1569039821624756, "Pretrain/Loss (Raw)": 2.062998056411743, "Pretrain/Step": 832, "Pretrain/Step Time": 8.062589161098003} +{"Pretrain/Learning Rate": 4.956991146150583e-05, "Pretrain/Loss": 2.1578314304351807, "Pretrain/Loss (Raw)": 2.143066644668579, "Pretrain/Step": 833, "Pretrain/Step Time": 8.058039903640747} +{"Pretrain/Learning Rate": 4.9568342033441755e-05, "Pretrain/Loss": 2.156862497329712, "Pretrain/Loss (Raw)": 2.13804292678833, "Pretrain/Step": 834, "Pretrain/Step Time": 8.063599899411201} +{"Pretrain/Learning Rate": 4.956676977204071e-05, "Pretrain/Loss": 2.156766891479492, "Pretrain/Loss (Raw)": 2.1433465480804443, "Pretrain/Step": 835, "Pretrain/Step Time": 8.060025358572602} +{"Pretrain/Learning Rate": 4.9565194677484e-05, "Pretrain/Loss": 2.156618118286133, "Pretrain/Loss (Raw)": 2.1676199436187744, "Pretrain/Step": 836, "Pretrain/Step Time": 8.062826115638018} +{"Pretrain/Learning Rate": 4.95636167499533e-05, "Pretrain/Loss": 2.1576950550079346, "Pretrain/Loss (Raw)": 2.1165690422058105, "Pretrain/Step": 837, "Pretrain/Step Time": 8.058042565360665} +{"Pretrain/Learning Rate": 4.9562035989630564e-05, "Pretrain/Loss": 2.159316301345825, "Pretrain/Loss (Raw)": 2.3394510746002197, "Pretrain/Step": 838, "Pretrain/Step Time": 8.059746790677309} +{"Pretrain/Learning Rate": 4.95604523966981e-05, "Pretrain/Loss": 2.1580278873443604, "Pretrain/Loss (Raw)": 2.1760752201080322, "Pretrain/Step": 839, "Pretrain/Step Time": 8.06667511165142} +{"Pretrain/Learning Rate": 4.9558865971338524e-05, "Pretrain/Loss": 2.158447265625, "Pretrain/Loss (Raw)": 2.2328860759735107, "Pretrain/Step": 840, "Pretrain/Step Time": 8.05978555418551} +{"Pretrain/Learning Rate": 4.9557276713734805e-05, "Pretrain/Loss": 2.1605281829833984, "Pretrain/Loss (Raw)": 2.343824625015259, "Pretrain/Step": 841, "Pretrain/Step Time": 8.063766127452254} +{"Pretrain/Learning Rate": 4.955568462407022e-05, "Pretrain/Loss": 2.1609995365142822, "Pretrain/Loss (Raw)": 2.1891322135925293, "Pretrain/Step": 842, "Pretrain/Step Time": 8.056729979813099} +{"Pretrain/Learning Rate": 4.955408970252837e-05, "Pretrain/Loss": 2.1608352661132812, "Pretrain/Loss (Raw)": 2.18992018699646, "Pretrain/Step": 843, "Pretrain/Step Time": 8.060201631858945} +{"Pretrain/Learning Rate": 4.955249194929319e-05, "Pretrain/Loss": 2.162574291229248, "Pretrain/Loss (Raw)": 2.3258118629455566, "Pretrain/Step": 844, "Pretrain/Step Time": 8.06527223996818} +{"Pretrain/Learning Rate": 4.955089136454895e-05, "Pretrain/Loss": 2.1616547107696533, "Pretrain/Loss (Raw)": 2.0800931453704834, "Pretrain/Step": 845, "Pretrain/Step Time": 8.066009882837534} +{"Pretrain/Learning Rate": 4.954928794848023e-05, "Pretrain/Loss": 2.160506010055542, "Pretrain/Loss (Raw)": 2.0111260414123535, "Pretrain/Step": 846, "Pretrain/Step Time": 8.065563211217523} +{"Pretrain/Learning Rate": 4.954768170127194e-05, "Pretrain/Loss": 2.1616835594177246, "Pretrain/Loss (Raw)": 2.229701519012451, "Pretrain/Step": 847, "Pretrain/Step Time": 8.065057272091508} +{"Pretrain/Learning Rate": 4.9546072623109325e-05, "Pretrain/Loss": 2.1617650985717773, "Pretrain/Loss (Raw)": 2.077772378921509, "Pretrain/Step": 848, "Pretrain/Step Time": 8.073290627449751} +{"Pretrain/Learning Rate": 4.954446071417795e-05, "Pretrain/Loss": 2.162139654159546, "Pretrain/Loss (Raw)": 2.1950762271881104, "Pretrain/Step": 849, "Pretrain/Step Time": 8.06609451957047} +{"Pretrain/Learning Rate": 4.954284597466371e-05, "Pretrain/Loss": 2.1618432998657227, "Pretrain/Loss (Raw)": 2.115933656692505, "Pretrain/Step": 850, "Pretrain/Step Time": 8.074477352201939} +{"Pretrain/Learning Rate": 4.954122840475281e-05, "Pretrain/Loss": 2.1623754501342773, "Pretrain/Loss (Raw)": 2.1186649799346924, "Pretrain/Step": 851, "Pretrain/Step Time": 8.06448569148779} +{"Pretrain/Learning Rate": 4.9539608004631825e-05, "Pretrain/Loss": 2.1629133224487305, "Pretrain/Loss (Raw)": 2.1984705924987793, "Pretrain/Step": 852, "Pretrain/Step Time": 8.068697990849614} +{"Pretrain/Learning Rate": 4.9537984774487606e-05, "Pretrain/Loss": 2.163867473602295, "Pretrain/Loss (Raw)": 2.2480695247650146, "Pretrain/Step": 853, "Pretrain/Step Time": 8.06640774011612} +{"Pretrain/Learning Rate": 4.953635871450736e-05, "Pretrain/Loss": 2.1639060974121094, "Pretrain/Loss (Raw)": 2.0648069381713867, "Pretrain/Step": 854, "Pretrain/Step Time": 8.060684019699693} +{"Pretrain/Learning Rate": 4.95347298248786e-05, "Pretrain/Loss": 2.162395477294922, "Pretrain/Loss (Raw)": 2.1067147254943848, "Pretrain/Step": 855, "Pretrain/Step Time": 8.070185173302889} +{"Pretrain/Learning Rate": 4.953309810578918e-05, "Pretrain/Loss": 2.161939859390259, "Pretrain/Loss (Raw)": 2.0223066806793213, "Pretrain/Step": 856, "Pretrain/Step Time": 8.065459543839097} +{"Pretrain/Learning Rate": 4.953146355742729e-05, "Pretrain/Loss": 2.162788152694702, "Pretrain/Loss (Raw)": 2.186577081680298, "Pretrain/Step": 857, "Pretrain/Step Time": 8.067112470045686} +{"Pretrain/Learning Rate": 4.952982617998143e-05, "Pretrain/Loss": 2.1616969108581543, "Pretrain/Loss (Raw)": 2.0305471420288086, "Pretrain/Step": 858, "Pretrain/Step Time": 8.068572031334043} +{"Pretrain/Learning Rate": 4.952818597364043e-05, "Pretrain/Loss": 2.1611790657043457, "Pretrain/Loss (Raw)": 2.1076903343200684, "Pretrain/Step": 859, "Pretrain/Step Time": 8.062112174928188} +{"Pretrain/Learning Rate": 4.952654293859344e-05, "Pretrain/Loss": 2.1600723266601562, "Pretrain/Loss (Raw)": 1.9901498556137085, "Pretrain/Step": 860, "Pretrain/Step Time": 8.058921828866005} +{"Pretrain/Learning Rate": 4.952489707502993e-05, "Pretrain/Loss": 2.1608152389526367, "Pretrain/Loss (Raw)": 2.2997803688049316, "Pretrain/Step": 861, "Pretrain/Step Time": 8.052897579967976} +{"Pretrain/Learning Rate": 4.952324838313974e-05, "Pretrain/Loss": 2.159822463989258, "Pretrain/Loss (Raw)": 2.094487190246582, "Pretrain/Step": 862, "Pretrain/Step Time": 8.055343639105558} +{"Pretrain/Learning Rate": 4.9521596863112986e-05, "Pretrain/Loss": 2.1589889526367188, "Pretrain/Loss (Raw)": 2.124175548553467, "Pretrain/Step": 863, "Pretrain/Step Time": 8.061600910499692} +{"Pretrain/Learning Rate": 4.951994251514013e-05, "Pretrain/Loss": 2.159176826477051, "Pretrain/Loss (Raw)": 2.1156253814697266, "Pretrain/Step": 864, "Pretrain/Step Time": 8.063205866143107} +{"Pretrain/Learning Rate": 4.9518285339411966e-05, "Pretrain/Loss": 2.1588449478149414, "Pretrain/Loss (Raw)": 2.022589921951294, "Pretrain/Step": 865, "Pretrain/Step Time": 8.061173079535365} +{"Pretrain/Learning Rate": 4.9516625336119595e-05, "Pretrain/Loss": 2.159703016281128, "Pretrain/Loss (Raw)": 2.189291477203369, "Pretrain/Step": 866, "Pretrain/Step Time": 8.060343496501446} +{"Pretrain/Learning Rate": 4.951496250545446e-05, "Pretrain/Loss": 2.1602463722229004, "Pretrain/Loss (Raw)": 2.171605110168457, "Pretrain/Step": 867, "Pretrain/Step Time": 8.066258953884244} +{"Pretrain/Learning Rate": 4.951329684760835e-05, "Pretrain/Loss": 2.1605019569396973, "Pretrain/Loss (Raw)": 2.1071693897247314, "Pretrain/Step": 868, "Pretrain/Step Time": 8.067846456542611} +{"Pretrain/Learning Rate": 4.951162836277332e-05, "Pretrain/Loss": 2.159618854522705, "Pretrain/Loss (Raw)": 2.0082592964172363, "Pretrain/Step": 869, "Pretrain/Step Time": 8.070172740146518} +{"Pretrain/Learning Rate": 4.950995705114182e-05, "Pretrain/Loss": 2.162876844406128, "Pretrain/Loss (Raw)": 2.4742259979248047, "Pretrain/Step": 870, "Pretrain/Step Time": 8.070432534441352} +{"Pretrain/Learning Rate": 4.950828291290656e-05, "Pretrain/Loss": 2.164869785308838, "Pretrain/Loss (Raw)": 2.336690902709961, "Pretrain/Step": 871, "Pretrain/Step Time": 8.064286654815078} +{"Pretrain/Learning Rate": 4.950660594826064e-05, "Pretrain/Loss": 2.164882183074951, "Pretrain/Loss (Raw)": 2.2577662467956543, "Pretrain/Step": 872, "Pretrain/Step Time": 8.064099969342351} +{"Pretrain/Learning Rate": 4.9504926157397436e-05, "Pretrain/Loss": 2.16512393951416, "Pretrain/Loss (Raw)": 2.095614194869995, "Pretrain/Step": 873, "Pretrain/Step Time": 8.063573379069567} +{"Pretrain/Learning Rate": 4.950324354051068e-05, "Pretrain/Loss": 2.1673030853271484, "Pretrain/Loss (Raw)": 2.4117252826690674, "Pretrain/Step": 874, "Pretrain/Step Time": 8.060618130490184} +{"Pretrain/Learning Rate": 4.950155809779442e-05, "Pretrain/Loss": 2.1655030250549316, "Pretrain/Loss (Raw)": 2.130862236022949, "Pretrain/Step": 875, "Pretrain/Step Time": 8.055990485474467} +{"Pretrain/Learning Rate": 4.9499869829443026e-05, "Pretrain/Loss": 2.165147066116333, "Pretrain/Loss (Raw)": 2.209902286529541, "Pretrain/Step": 876, "Pretrain/Step Time": 8.065637903288007} +{"Pretrain/Learning Rate": 4.9498178735651184e-05, "Pretrain/Loss": 2.1640830039978027, "Pretrain/Loss (Raw)": 2.1272947788238525, "Pretrain/Step": 877, "Pretrain/Step Time": 8.058637030422688} +{"Pretrain/Learning Rate": 4.949648481661394e-05, "Pretrain/Loss": 2.1653079986572266, "Pretrain/Loss (Raw)": 2.2521023750305176, "Pretrain/Step": 878, "Pretrain/Step Time": 8.061370715498924} +{"Pretrain/Learning Rate": 4.949478807252663e-05, "Pretrain/Loss": 2.1644506454467773, "Pretrain/Loss (Raw)": 2.0455822944641113, "Pretrain/Step": 879, "Pretrain/Step Time": 8.056950071826577} +{"Pretrain/Learning Rate": 4.949308850358494e-05, "Pretrain/Loss": 2.1643502712249756, "Pretrain/Loss (Raw)": 2.089916706085205, "Pretrain/Step": 880, "Pretrain/Step Time": 8.051101239398122} +{"Pretrain/Learning Rate": 4.949138610998487e-05, "Pretrain/Loss": 2.162539005279541, "Pretrain/Loss (Raw)": 2.188060998916626, "Pretrain/Step": 881, "Pretrain/Step Time": 8.05762418359518} +{"Pretrain/Learning Rate": 4.9489680891922746e-05, "Pretrain/Loss": 2.1619973182678223, "Pretrain/Loss (Raw)": 2.2031683921813965, "Pretrain/Step": 882, "Pretrain/Step Time": 8.057269321754575} +{"Pretrain/Learning Rate": 4.948797284959522e-05, "Pretrain/Loss": 2.161529541015625, "Pretrain/Loss (Raw)": 2.0440874099731445, "Pretrain/Step": 883, "Pretrain/Step Time": 8.06339617073536} +{"Pretrain/Learning Rate": 4.948626198319928e-05, "Pretrain/Loss": 2.1601600646972656, "Pretrain/Loss (Raw)": 2.181567907333374, "Pretrain/Step": 884, "Pretrain/Step Time": 8.064135916531086} +{"Pretrain/Learning Rate": 4.948454829293222e-05, "Pretrain/Loss": 2.1580071449279785, "Pretrain/Loss (Raw)": 2.0172207355499268, "Pretrain/Step": 885, "Pretrain/Step Time": 8.066069858148694} +{"Pretrain/Learning Rate": 4.9482831778991676e-05, "Pretrain/Loss": 2.1592154502868652, "Pretrain/Loss (Raw)": 2.248669147491455, "Pretrain/Step": 886, "Pretrain/Step Time": 8.069319183006883} +{"Pretrain/Learning Rate": 4.9481112441575605e-05, "Pretrain/Loss": 2.157639741897583, "Pretrain/Loss (Raw)": 2.0295863151550293, "Pretrain/Step": 887, "Pretrain/Step Time": 8.059883378446102} +{"Pretrain/Learning Rate": 4.947939028088229e-05, "Pretrain/Loss": 2.1585206985473633, "Pretrain/Loss (Raw)": 2.1551239490509033, "Pretrain/Step": 888, "Pretrain/Step Time": 8.066268293187022} +{"Pretrain/Learning Rate": 4.947766529711033e-05, "Pretrain/Loss": 2.158444881439209, "Pretrain/Loss (Raw)": 2.1571767330169678, "Pretrain/Step": 889, "Pretrain/Step Time": 8.060823248699307} +{"Pretrain/Learning Rate": 4.947593749045867e-05, "Pretrain/Loss": 2.1590981483459473, "Pretrain/Loss (Raw)": 2.3477392196655273, "Pretrain/Step": 890, "Pretrain/Step Time": 8.06870225071907} +{"Pretrain/Learning Rate": 4.947420686112657e-05, "Pretrain/Loss": 2.158334255218506, "Pretrain/Loss (Raw)": 2.106065511703491, "Pretrain/Step": 891, "Pretrain/Step Time": 8.07016378454864} +{"Pretrain/Learning Rate": 4.9472473409313605e-05, "Pretrain/Loss": 2.157668352127075, "Pretrain/Loss (Raw)": 2.2363121509552, "Pretrain/Step": 892, "Pretrain/Step Time": 8.069791404530406} +{"Pretrain/Learning Rate": 4.947073713521968e-05, "Pretrain/Loss": 2.157262086868286, "Pretrain/Loss (Raw)": 2.205775737762451, "Pretrain/Step": 893, "Pretrain/Step Time": 8.072446728125215} +{"Pretrain/Learning Rate": 4.9468998039045046e-05, "Pretrain/Loss": 2.1555240154266357, "Pretrain/Loss (Raw)": 2.126004934310913, "Pretrain/Step": 894, "Pretrain/Step Time": 8.062078639864922} +{"Pretrain/Learning Rate": 4.946725612099026e-05, "Pretrain/Loss": 2.1556007862091064, "Pretrain/Loss (Raw)": 2.1364409923553467, "Pretrain/Step": 895, "Pretrain/Step Time": 8.06737214513123} +{"Pretrain/Learning Rate": 4.9465511381256204e-05, "Pretrain/Loss": 2.1544432640075684, "Pretrain/Loss (Raw)": 2.12109637260437, "Pretrain/Step": 896, "Pretrain/Step Time": 8.060794251039624} +{"Pretrain/Learning Rate": 4.946376382004408e-05, "Pretrain/Loss": 2.1557328701019287, "Pretrain/Loss (Raw)": 2.171902894973755, "Pretrain/Step": 897, "Pretrain/Step Time": 8.06650366820395} +{"Pretrain/Learning Rate": 4.9462013437555446e-05, "Pretrain/Loss": 2.1563611030578613, "Pretrain/Loss (Raw)": 2.264228343963623, "Pretrain/Step": 898, "Pretrain/Step Time": 8.067040096968412} +{"Pretrain/Learning Rate": 4.946026023399215e-05, "Pretrain/Loss": 2.1572093963623047, "Pretrain/Loss (Raw)": 2.218540906906128, "Pretrain/Step": 899, "Pretrain/Step Time": 8.069902820512652} +{"Pretrain/Learning Rate": 4.9458504209556377e-05, "Pretrain/Loss": 2.1553516387939453, "Pretrain/Loss (Raw)": 2.068902015686035, "Pretrain/Step": 900, "Pretrain/Step Time": 8.070419440045953} +{"Pretrain/Learning Rate": 4.945674536445065e-05, "Pretrain/Loss": 2.158125162124634, "Pretrain/Loss (Raw)": 2.3774986267089844, "Pretrain/Step": 901, "Pretrain/Step Time": 8.061173347756267} +{"Pretrain/Learning Rate": 4.945498369887781e-05, "Pretrain/Loss": 2.1583945751190186, "Pretrain/Loss (Raw)": 2.179513454437256, "Pretrain/Step": 902, "Pretrain/Step Time": 8.06458718329668} +{"Pretrain/Learning Rate": 4.945321921304101e-05, "Pretrain/Loss": 2.1581482887268066, "Pretrain/Loss (Raw)": 2.1433539390563965, "Pretrain/Step": 903, "Pretrain/Step Time": 8.06367040798068} +{"Pretrain/Learning Rate": 4.945145190714374e-05, "Pretrain/Loss": 2.1591506004333496, "Pretrain/Loss (Raw)": 2.2858493328094482, "Pretrain/Step": 904, "Pretrain/Step Time": 8.06888441182673} +{"Pretrain/Learning Rate": 4.944968178138982e-05, "Pretrain/Loss": 2.1591696739196777, "Pretrain/Loss (Raw)": 2.216376543045044, "Pretrain/Step": 905, "Pretrain/Step Time": 8.067364564165473} +{"Pretrain/Learning Rate": 4.944790883598339e-05, "Pretrain/Loss": 2.1587672233581543, "Pretrain/Loss (Raw)": 2.1244733333587646, "Pretrain/Step": 906, "Pretrain/Step Time": 8.062888577580452} +{"Pretrain/Learning Rate": 4.9446133071128905e-05, "Pretrain/Loss": 2.1560263633728027, "Pretrain/Loss (Raw)": 2.041303873062134, "Pretrain/Step": 907, "Pretrain/Step Time": 8.068951986730099} +{"Pretrain/Learning Rate": 4.944435448703116e-05, "Pretrain/Loss": 2.1567962169647217, "Pretrain/Loss (Raw)": 2.230982542037964, "Pretrain/Step": 908, "Pretrain/Step Time": 8.062280509620905} +{"Pretrain/Learning Rate": 4.944257308389528e-05, "Pretrain/Loss": 2.157201051712036, "Pretrain/Loss (Raw)": 2.1482467651367188, "Pretrain/Step": 909, "Pretrain/Step Time": 8.066955842077732} +{"Pretrain/Learning Rate": 4.944078886192668e-05, "Pretrain/Loss": 2.1574254035949707, "Pretrain/Loss (Raw)": 2.3522138595581055, "Pretrain/Step": 910, "Pretrain/Step Time": 8.06364274583757} +{"Pretrain/Learning Rate": 4.943900182133116e-05, "Pretrain/Loss": 2.156351327896118, "Pretrain/Loss (Raw)": 2.12712025642395, "Pretrain/Step": 911, "Pretrain/Step Time": 8.06750439107418} +{"Pretrain/Learning Rate": 4.943721196231477e-05, "Pretrain/Loss": 2.156963586807251, "Pretrain/Loss (Raw)": 2.1792852878570557, "Pretrain/Step": 912, "Pretrain/Step Time": 8.059215856716037} +{"Pretrain/Learning Rate": 4.943541928508395e-05, "Pretrain/Loss": 2.1622238159179688, "Pretrain/Loss (Raw)": 2.870706081390381, "Pretrain/Step": 913, "Pretrain/Step Time": 8.065347710624337} +{"Pretrain/Learning Rate": 4.9433623789845426e-05, "Pretrain/Loss": 2.161633014678955, "Pretrain/Loss (Raw)": 2.104182720184326, "Pretrain/Step": 914, "Pretrain/Step Time": 8.06397440098226} +{"Pretrain/Learning Rate": 4.943182547680629e-05, "Pretrain/Loss": 2.161078691482544, "Pretrain/Loss (Raw)": 1.9815080165863037, "Pretrain/Step": 915, "Pretrain/Step Time": 8.059601370245218} +{"Pretrain/Learning Rate": 4.94300243461739e-05, "Pretrain/Loss": 2.161771535873413, "Pretrain/Loss (Raw)": 2.3194150924682617, "Pretrain/Step": 916, "Pretrain/Step Time": 8.064423017203808} +{"Pretrain/Learning Rate": 4.9428220398155986e-05, "Pretrain/Loss": 2.161973237991333, "Pretrain/Loss (Raw)": 2.0616605281829834, "Pretrain/Step": 917, "Pretrain/Step Time": 8.062001721933484} +{"Pretrain/Learning Rate": 4.94264136329606e-05, "Pretrain/Loss": 2.1632871627807617, "Pretrain/Loss (Raw)": 2.2797765731811523, "Pretrain/Step": 918, "Pretrain/Step Time": 8.069355178624392} +{"Pretrain/Learning Rate": 4.942460405079608e-05, "Pretrain/Loss": 2.1644020080566406, "Pretrain/Loss (Raw)": 2.282925605773926, "Pretrain/Step": 919, "Pretrain/Step Time": 8.066639861091971} +{"Pretrain/Learning Rate": 4.942279165187113e-05, "Pretrain/Loss": 2.1658072471618652, "Pretrain/Loss (Raw)": 2.269707441329956, "Pretrain/Step": 920, "Pretrain/Step Time": 8.06310692243278} +{"Pretrain/Learning Rate": 4.9420976436394764e-05, "Pretrain/Loss": 2.164958953857422, "Pretrain/Loss (Raw)": 2.183452844619751, "Pretrain/Step": 921, "Pretrain/Step Time": 8.074892826378345} +{"Pretrain/Learning Rate": 4.941915840457632e-05, "Pretrain/Loss": 2.1671409606933594, "Pretrain/Loss (Raw)": 2.3440160751342773, "Pretrain/Step": 922, "Pretrain/Step Time": 8.068095894530416} +{"Pretrain/Learning Rate": 4.941733755662545e-05, "Pretrain/Loss": 2.1667256355285645, "Pretrain/Loss (Raw)": 2.1808652877807617, "Pretrain/Step": 923, "Pretrain/Step Time": 8.072865949943662} +{"Pretrain/Learning Rate": 4.941551389275217e-05, "Pretrain/Loss": 2.1656012535095215, "Pretrain/Loss (Raw)": 2.013188123703003, "Pretrain/Step": 924, "Pretrain/Step Time": 8.068618088960648} +{"Pretrain/Learning Rate": 4.9413687413166777e-05, "Pretrain/Loss": 2.165383815765381, "Pretrain/Loss (Raw)": 2.043469190597534, "Pretrain/Step": 925, "Pretrain/Step Time": 8.071688549593091} +{"Pretrain/Learning Rate": 4.94118581180799e-05, "Pretrain/Loss": 2.1667351722717285, "Pretrain/Loss (Raw)": 2.2100412845611572, "Pretrain/Step": 926, "Pretrain/Step Time": 8.081118075177073} +{"Pretrain/Learning Rate": 4.9410026007702525e-05, "Pretrain/Loss": 2.1653385162353516, "Pretrain/Loss (Raw)": 1.9289342164993286, "Pretrain/Step": 927, "Pretrain/Step Time": 8.078146519139409} +{"Pretrain/Learning Rate": 4.940819108224592e-05, "Pretrain/Loss": 2.165647029876709, "Pretrain/Loss (Raw)": 2.1725075244903564, "Pretrain/Step": 928, "Pretrain/Step Time": 8.072784457355738} +{"Pretrain/Learning Rate": 4.940635334192171e-05, "Pretrain/Loss": 2.1640944480895996, "Pretrain/Loss (Raw)": 2.0136077404022217, "Pretrain/Step": 929, "Pretrain/Step Time": 8.070720026269555} +{"Pretrain/Learning Rate": 4.940451278694181e-05, "Pretrain/Loss": 2.163456439971924, "Pretrain/Loss (Raw)": 2.0966179370880127, "Pretrain/Step": 930, "Pretrain/Step Time": 8.071422001346946} +{"Pretrain/Learning Rate": 4.9402669417518514e-05, "Pretrain/Loss": 2.16326904296875, "Pretrain/Loss (Raw)": 2.0506436824798584, "Pretrain/Step": 931, "Pretrain/Step Time": 8.071433860808611} +{"Pretrain/Learning Rate": 4.940082323386439e-05, "Pretrain/Loss": 2.16267991065979, "Pretrain/Loss (Raw)": 2.1686959266662598, "Pretrain/Step": 932, "Pretrain/Step Time": 8.074826976284385} +{"Pretrain/Learning Rate": 4.939897423619234e-05, "Pretrain/Loss": 2.164207696914673, "Pretrain/Loss (Raw)": 2.2073585987091064, "Pretrain/Step": 933, "Pretrain/Step Time": 8.078257760033011} +{"Pretrain/Learning Rate": 4.9397122424715624e-05, "Pretrain/Loss": 2.163844108581543, "Pretrain/Loss (Raw)": 2.1282589435577393, "Pretrain/Step": 934, "Pretrain/Step Time": 8.071717014536262} +{"Pretrain/Learning Rate": 4.939526779964778e-05, "Pretrain/Loss": 2.1633808612823486, "Pretrain/Loss (Raw)": 2.082873582839966, "Pretrain/Step": 935, "Pretrain/Step Time": 8.074423637241125} +{"Pretrain/Learning Rate": 4.9393410361202694e-05, "Pretrain/Loss": 2.1654739379882812, "Pretrain/Loss (Raw)": 2.275826930999756, "Pretrain/Step": 936, "Pretrain/Step Time": 8.074440667405725} +{"Pretrain/Learning Rate": 4.9391550109594584e-05, "Pretrain/Loss": 2.1635231971740723, "Pretrain/Loss (Raw)": 1.959814429283142, "Pretrain/Step": 937, "Pretrain/Step Time": 8.077500995248556} +{"Pretrain/Learning Rate": 4.938968704503798e-05, "Pretrain/Loss": 2.164310932159424, "Pretrain/Loss (Raw)": 2.25042724609375, "Pretrain/Step": 938, "Pretrain/Step Time": 8.075708577409387} +{"Pretrain/Learning Rate": 4.938782116774774e-05, "Pretrain/Loss": 2.1661365032196045, "Pretrain/Loss (Raw)": 2.2866528034210205, "Pretrain/Step": 939, "Pretrain/Step Time": 8.065524205565453} +{"Pretrain/Learning Rate": 4.938595247793903e-05, "Pretrain/Loss": 2.165217399597168, "Pretrain/Loss (Raw)": 2.071445941925049, "Pretrain/Step": 940, "Pretrain/Step Time": 8.073932062834501} +{"Pretrain/Learning Rate": 4.938408097582738e-05, "Pretrain/Loss": 2.1637933254241943, "Pretrain/Loss (Raw)": 2.0661516189575195, "Pretrain/Step": 941, "Pretrain/Step Time": 8.067784549668431} +{"Pretrain/Learning Rate": 4.9382206661628615e-05, "Pretrain/Loss": 2.1627137660980225, "Pretrain/Loss (Raw)": 2.088188886642456, "Pretrain/Step": 942, "Pretrain/Step Time": 8.069412991404533} +{"Pretrain/Learning Rate": 4.9380329535558887e-05, "Pretrain/Loss": 2.162860631942749, "Pretrain/Loss (Raw)": 2.083508014678955, "Pretrain/Step": 943, "Pretrain/Step Time": 8.070472534745932} +{"Pretrain/Learning Rate": 4.9378449597834664e-05, "Pretrain/Loss": 2.1634750366210938, "Pretrain/Loss (Raw)": 2.0769975185394287, "Pretrain/Step": 944, "Pretrain/Step Time": 8.067805916070938} +{"Pretrain/Learning Rate": 4.937656684867276e-05, "Pretrain/Loss": 2.164407253265381, "Pretrain/Loss (Raw)": 2.15934419631958, "Pretrain/Step": 945, "Pretrain/Step Time": 8.072548806667328} +{"Pretrain/Learning Rate": 4.93746812882903e-05, "Pretrain/Loss": 2.1648073196411133, "Pretrain/Loss (Raw)": 2.2787961959838867, "Pretrain/Step": 946, "Pretrain/Step Time": 8.07045141607523} +{"Pretrain/Learning Rate": 4.937279291690474e-05, "Pretrain/Loss": 2.1641135215759277, "Pretrain/Loss (Raw)": 2.0481131076812744, "Pretrain/Step": 947, "Pretrain/Step Time": 8.071672551333904} +{"Pretrain/Learning Rate": 4.9370901734733856e-05, "Pretrain/Loss": 2.1646578311920166, "Pretrain/Loss (Raw)": 2.223115921020508, "Pretrain/Step": 948, "Pretrain/Step Time": 8.066579710692167} +{"Pretrain/Learning Rate": 4.936900774199573e-05, "Pretrain/Loss": 2.164884567260742, "Pretrain/Loss (Raw)": 2.157914876937866, "Pretrain/Step": 949, "Pretrain/Step Time": 8.069760259240866} +{"Pretrain/Learning Rate": 4.936711093890881e-05, "Pretrain/Loss": 2.163681983947754, "Pretrain/Loss (Raw)": 1.9551013708114624, "Pretrain/Step": 950, "Pretrain/Step Time": 8.066501906141639} +{"Pretrain/Learning Rate": 4.936521132569184e-05, "Pretrain/Loss": 2.163592576980591, "Pretrain/Loss (Raw)": 2.1046667098999023, "Pretrain/Step": 951, "Pretrain/Step Time": 8.06778885051608} +{"Pretrain/Learning Rate": 4.936330890256388e-05, "Pretrain/Loss": 2.1637299060821533, "Pretrain/Loss (Raw)": 2.147334098815918, "Pretrain/Step": 952, "Pretrain/Step Time": 8.074548453092575} +{"Pretrain/Learning Rate": 4.9361403669744336e-05, "Pretrain/Loss": 2.1632957458496094, "Pretrain/Loss (Raw)": 2.1084883213043213, "Pretrain/Step": 953, "Pretrain/Step Time": 8.06737500242889} +{"Pretrain/Learning Rate": 4.935949562745293e-05, "Pretrain/Loss": 2.162773370742798, "Pretrain/Loss (Raw)": 2.0693461894989014, "Pretrain/Step": 954, "Pretrain/Step Time": 8.07490037754178} +{"Pretrain/Learning Rate": 4.93575847759097e-05, "Pretrain/Loss": 2.1634955406188965, "Pretrain/Loss (Raw)": 2.299971342086792, "Pretrain/Step": 955, "Pretrain/Step Time": 8.069071497768164} +{"Pretrain/Learning Rate": 4.9355671115335015e-05, "Pretrain/Loss": 2.162670373916626, "Pretrain/Loss (Raw)": 2.1160356998443604, "Pretrain/Step": 956, "Pretrain/Step Time": 8.072796994820237} +{"Pretrain/Learning Rate": 4.935375464594957e-05, "Pretrain/Loss": 2.1626486778259277, "Pretrain/Loss (Raw)": 2.082624912261963, "Pretrain/Step": 957, "Pretrain/Step Time": 8.067058557644486} +{"Pretrain/Learning Rate": 4.9351835367974375e-05, "Pretrain/Loss": 2.1632862091064453, "Pretrain/Loss (Raw)": 2.207569122314453, "Pretrain/Step": 958, "Pretrain/Step Time": 8.06015731394291} +{"Pretrain/Learning Rate": 4.9349913281630786e-05, "Pretrain/Loss": 2.1631388664245605, "Pretrain/Loss (Raw)": 2.2189254760742188, "Pretrain/Step": 959, "Pretrain/Step Time": 8.060433262959123} +{"Pretrain/Learning Rate": 4.934798838714045e-05, "Pretrain/Loss": 2.163358449935913, "Pretrain/Loss (Raw)": 2.0911128520965576, "Pretrain/Step": 960, "Pretrain/Step Time": 8.063333364203572} +{"Pretrain/Learning Rate": 4.9346060684725364e-05, "Pretrain/Loss": 2.1632654666900635, "Pretrain/Loss (Raw)": 2.1311569213867188, "Pretrain/Step": 961, "Pretrain/Step Time": 8.070519035682082} +{"Pretrain/Learning Rate": 4.934413017460784e-05, "Pretrain/Loss": 2.1633458137512207, "Pretrain/Loss (Raw)": 2.1483383178710938, "Pretrain/Step": 962, "Pretrain/Step Time": 8.062358593568206} +{"Pretrain/Learning Rate": 4.93421968570105e-05, "Pretrain/Loss": 2.162529468536377, "Pretrain/Loss (Raw)": 2.0388479232788086, "Pretrain/Step": 963, "Pretrain/Step Time": 8.06890799663961} +{"Pretrain/Learning Rate": 4.934026073215633e-05, "Pretrain/Loss": 2.1624789237976074, "Pretrain/Loss (Raw)": 2.1611387729644775, "Pretrain/Step": 964, "Pretrain/Step Time": 8.068770134821534} +{"Pretrain/Learning Rate": 4.933832180026858e-05, "Pretrain/Loss": 2.1643459796905518, "Pretrain/Loss (Raw)": 2.3555588722229004, "Pretrain/Step": 965, "Pretrain/Step Time": 8.072773043066263} +{"Pretrain/Learning Rate": 4.933638006157089e-05, "Pretrain/Loss": 2.1637821197509766, "Pretrain/Loss (Raw)": 2.267299175262451, "Pretrain/Step": 966, "Pretrain/Step Time": 8.07241085730493} +{"Pretrain/Learning Rate": 4.933443551628717e-05, "Pretrain/Loss": 2.163865566253662, "Pretrain/Loss (Raw)": 2.186739206314087, "Pretrain/Step": 967, "Pretrain/Step Time": 8.063726613298059} +{"Pretrain/Learning Rate": 4.933248816464168e-05, "Pretrain/Loss": 2.163619041442871, "Pretrain/Loss (Raw)": 2.2013373374938965, "Pretrain/Step": 968, "Pretrain/Step Time": 8.067944381386042} +{"Pretrain/Learning Rate": 4.933053800685899e-05, "Pretrain/Loss": 2.162328004837036, "Pretrain/Loss (Raw)": 2.1785452365875244, "Pretrain/Step": 969, "Pretrain/Step Time": 8.057458858937025} +{"Pretrain/Learning Rate": 4.932858504316401e-05, "Pretrain/Loss": 2.160999298095703, "Pretrain/Loss (Raw)": 2.019080877304077, "Pretrain/Step": 970, "Pretrain/Step Time": 8.065940512344241} +{"Pretrain/Learning Rate": 4.932662927378196e-05, "Pretrain/Loss": 2.1614291667938232, "Pretrain/Loss (Raw)": 2.244953155517578, "Pretrain/Step": 971, "Pretrain/Step Time": 8.069538861513138} +{"Pretrain/Learning Rate": 4.93246706989384e-05, "Pretrain/Loss": 2.159677267074585, "Pretrain/Loss (Raw)": 2.1015563011169434, "Pretrain/Step": 972, "Pretrain/Step Time": 8.065044023096561} +{"Pretrain/Learning Rate": 4.932270931885918e-05, "Pretrain/Loss": 2.161454200744629, "Pretrain/Loss (Raw)": 2.307541847229004, "Pretrain/Step": 973, "Pretrain/Step Time": 8.066420504823327} +{"Pretrain/Learning Rate": 4.9320745133770524e-05, "Pretrain/Loss": 2.1646134853363037, "Pretrain/Loss (Raw)": 2.4155032634735107, "Pretrain/Step": 974, "Pretrain/Step Time": 8.067888636142015} +{"Pretrain/Learning Rate": 4.931877814389893e-05, "Pretrain/Loss": 2.1647589206695557, "Pretrain/Loss (Raw)": 2.2483208179473877, "Pretrain/Step": 975, "Pretrain/Step Time": 8.061216136440635} +{"Pretrain/Learning Rate": 4.931680834947124e-05, "Pretrain/Loss": 2.165771484375, "Pretrain/Loss (Raw)": 2.207374095916748, "Pretrain/Step": 976, "Pretrain/Step Time": 8.057087237015367} +{"Pretrain/Learning Rate": 4.9314835750714635e-05, "Pretrain/Loss": 2.165811061859131, "Pretrain/Loss (Raw)": 2.2001497745513916, "Pretrain/Step": 977, "Pretrain/Step Time": 8.056065859273076} +{"Pretrain/Learning Rate": 4.9312860347856595e-05, "Pretrain/Loss": 2.1652355194091797, "Pretrain/Loss (Raw)": 2.0422563552856445, "Pretrain/Step": 978, "Pretrain/Step Time": 8.058817185461521} +{"Pretrain/Learning Rate": 4.931088214112494e-05, "Pretrain/Loss": 2.165158748626709, "Pretrain/Loss (Raw)": 2.1088688373565674, "Pretrain/Step": 979, "Pretrain/Step Time": 8.05976534076035} +{"Pretrain/Learning Rate": 4.930890113074779e-05, "Pretrain/Loss": 2.1643402576446533, "Pretrain/Loss (Raw)": 2.093672752380371, "Pretrain/Step": 980, "Pretrain/Step Time": 8.063389310613275} +{"Pretrain/Learning Rate": 4.930691731695362e-05, "Pretrain/Loss": 2.1629185676574707, "Pretrain/Loss (Raw)": 2.0661027431488037, "Pretrain/Step": 981, "Pretrain/Step Time": 8.060446286574006} +{"Pretrain/Learning Rate": 4.9304930699971194e-05, "Pretrain/Loss": 2.1635923385620117, "Pretrain/Loss (Raw)": 2.151033878326416, "Pretrain/Step": 982, "Pretrain/Step Time": 8.065017562359571} +{"Pretrain/Learning Rate": 4.9302941280029645e-05, "Pretrain/Loss": 2.164271831512451, "Pretrain/Loss (Raw)": 2.1937129497528076, "Pretrain/Step": 983, "Pretrain/Step Time": 8.0598910972476} +{"Pretrain/Learning Rate": 4.930094905735838e-05, "Pretrain/Loss": 2.1652603149414062, "Pretrain/Loss (Raw)": 2.148831844329834, "Pretrain/Step": 984, "Pretrain/Step Time": 8.05853195860982} +{"Pretrain/Learning Rate": 4.929895403218717e-05, "Pretrain/Loss": 2.1653952598571777, "Pretrain/Loss (Raw)": 2.203822612762451, "Pretrain/Step": 985, "Pretrain/Step Time": 8.06705217063427} +{"Pretrain/Learning Rate": 4.929695620474607e-05, "Pretrain/Loss": 2.1654767990112305, "Pretrain/Loss (Raw)": 2.0409862995147705, "Pretrain/Step": 986, "Pretrain/Step Time": 8.05942327156663} +{"Pretrain/Learning Rate": 4.9294955575265494e-05, "Pretrain/Loss": 2.165492057800293, "Pretrain/Loss (Raw)": 2.109673500061035, "Pretrain/Step": 987, "Pretrain/Step Time": 8.061445327475667} +{"Pretrain/Learning Rate": 4.929295214397616e-05, "Pretrain/Loss": 2.1665244102478027, "Pretrain/Loss (Raw)": 2.122286081314087, "Pretrain/Step": 988, "Pretrain/Step Time": 8.060098556801677} +{"Pretrain/Learning Rate": 4.929094591110911e-05, "Pretrain/Loss": 2.1646041870117188, "Pretrain/Loss (Raw)": 2.054002523422241, "Pretrain/Step": 989, "Pretrain/Step Time": 8.062792923301458} +{"Pretrain/Learning Rate": 4.928893687689572e-05, "Pretrain/Loss": 2.1651933193206787, "Pretrain/Loss (Raw)": 2.1698720455169678, "Pretrain/Step": 990, "Pretrain/Step Time": 8.062945710495114} +{"Pretrain/Learning Rate": 4.928692504156767e-05, "Pretrain/Loss": 2.1652326583862305, "Pretrain/Loss (Raw)": 2.1292266845703125, "Pretrain/Step": 991, "Pretrain/Step Time": 8.063398597761989} +{"Pretrain/Learning Rate": 4.928491040535699e-05, "Pretrain/Loss": 2.1675684452056885, "Pretrain/Loss (Raw)": 2.414604425430298, "Pretrain/Step": 992, "Pretrain/Step Time": 8.05456968024373} +{"Pretrain/Learning Rate": 4.9282892968495995e-05, "Pretrain/Loss": 2.1678948402404785, "Pretrain/Loss (Raw)": 2.0643651485443115, "Pretrain/Step": 993, "Pretrain/Step Time": 8.058682383969426} +{"Pretrain/Learning Rate": 4.928087273121737e-05, "Pretrain/Loss": 2.167287826538086, "Pretrain/Loss (Raw)": 2.1115972995758057, "Pretrain/Step": 994, "Pretrain/Step Time": 8.065399333834648} +{"Pretrain/Learning Rate": 4.9278849693754076e-05, "Pretrain/Loss": 2.166998863220215, "Pretrain/Loss (Raw)": 2.134636163711548, "Pretrain/Step": 995, "Pretrain/Step Time": 8.06099621579051} +{"Pretrain/Learning Rate": 4.927682385633944e-05, "Pretrain/Loss": 2.166490316390991, "Pretrain/Loss (Raw)": 2.042026996612549, "Pretrain/Step": 996, "Pretrain/Step Time": 8.06129814311862} +{"Pretrain/Learning Rate": 4.927479521920707e-05, "Pretrain/Loss": 2.166378974914551, "Pretrain/Loss (Raw)": 1.9940459728240967, "Pretrain/Step": 997, "Pretrain/Step Time": 8.055248541757464} +{"Pretrain/Learning Rate": 4.927276378259094e-05, "Pretrain/Loss": 2.16402530670166, "Pretrain/Loss (Raw)": 2.1729421615600586, "Pretrain/Step": 998, "Pretrain/Step Time": 8.060685064643621} +{"Pretrain/Learning Rate": 4.9270729546725305e-05, "Pretrain/Loss": 2.1628518104553223, "Pretrain/Loss (Raw)": 2.1864871978759766, "Pretrain/Step": 999, "Pretrain/Step Time": 8.063988266512752} +{"Pretrain/Learning Rate": 4.9268692511844774e-05, "Pretrain/Loss": 2.1619889736175537, "Pretrain/Loss (Raw)": 2.1473116874694824, "Pretrain/Step": 1000, "Pretrain/Step Time": 8.064258962869644} +{"Pretrain/Learning Rate": 4.926665267818426e-05, "Pretrain/Loss": 2.162038803100586, "Pretrain/Loss (Raw)": 2.101994276046753, "Pretrain/Step": 1001, "Pretrain/Step Time": 8.064788727089763} +{"Pretrain/Learning Rate": 4.926461004597901e-05, "Pretrain/Loss": 2.1616311073303223, "Pretrain/Loss (Raw)": 2.359551429748535, "Pretrain/Step": 1002, "Pretrain/Step Time": 8.069265199825168} +{"Pretrain/Learning Rate": 4.92625646154646e-05, "Pretrain/Loss": 2.160623550415039, "Pretrain/Loss (Raw)": 2.00189471244812, "Pretrain/Step": 1003, "Pretrain/Step Time": 8.071100734174252} +{"Pretrain/Learning Rate": 4.926051638687691e-05, "Pretrain/Loss": 2.1598620414733887, "Pretrain/Loss (Raw)": 2.112420082092285, "Pretrain/Step": 1004, "Pretrain/Step Time": 8.066389951854944} +{"Pretrain/Learning Rate": 4.925846536045215e-05, "Pretrain/Loss": 2.161090612411499, "Pretrain/Loss (Raw)": 2.2845587730407715, "Pretrain/Step": 1005, "Pretrain/Step Time": 8.068259241059422} +{"Pretrain/Learning Rate": 4.925641153642684e-05, "Pretrain/Loss": 2.1618406772613525, "Pretrain/Loss (Raw)": 2.348085880279541, "Pretrain/Step": 1006, "Pretrain/Step Time": 8.063225504010916} +{"Pretrain/Learning Rate": 4.925435491503787e-05, "Pretrain/Loss": 2.1623449325561523, "Pretrain/Loss (Raw)": 2.1101503372192383, "Pretrain/Step": 1007, "Pretrain/Step Time": 8.06606225669384} +{"Pretrain/Learning Rate": 4.9252295496522395e-05, "Pretrain/Loss": 2.163037061691284, "Pretrain/Loss (Raw)": 2.178527593612671, "Pretrain/Step": 1008, "Pretrain/Step Time": 8.068206677213311} +{"Pretrain/Learning Rate": 4.925023328111792e-05, "Pretrain/Loss": 2.16198992729187, "Pretrain/Loss (Raw)": 2.0540201663970947, "Pretrain/Step": 1009, "Pretrain/Step Time": 8.062690975144506} +{"Pretrain/Learning Rate": 4.924816826906227e-05, "Pretrain/Loss": 2.159668445587158, "Pretrain/Loss (Raw)": 1.9059758186340332, "Pretrain/Step": 1010, "Pretrain/Step Time": 8.067598663270473} +{"Pretrain/Learning Rate": 4.92461004605936e-05, "Pretrain/Loss": 2.159996509552002, "Pretrain/Loss (Raw)": 2.086107015609741, "Pretrain/Step": 1011, "Pretrain/Step Time": 8.055213667452335} +{"Pretrain/Learning Rate": 4.924402985595037e-05, "Pretrain/Loss": 2.1596641540527344, "Pretrain/Loss (Raw)": 2.1390228271484375, "Pretrain/Step": 1012, "Pretrain/Step Time": 8.058932533487678} +{"Pretrain/Learning Rate": 4.924195645537138e-05, "Pretrain/Loss": 2.1596765518188477, "Pretrain/Loss (Raw)": 2.0188043117523193, "Pretrain/Step": 1013, "Pretrain/Step Time": 8.063077000901103} +{"Pretrain/Learning Rate": 4.923988025909574e-05, "Pretrain/Loss": 2.1588265895843506, "Pretrain/Loss (Raw)": 2.139880657196045, "Pretrain/Step": 1014, "Pretrain/Step Time": 8.057889992371202} +{"Pretrain/Learning Rate": 4.923780126736288e-05, "Pretrain/Loss": 2.1585421562194824, "Pretrain/Loss (Raw)": 1.993196964263916, "Pretrain/Step": 1015, "Pretrain/Step Time": 8.06616211682558} +{"Pretrain/Learning Rate": 4.923571948041257e-05, "Pretrain/Loss": 2.158766031265259, "Pretrain/Loss (Raw)": 2.183743476867676, "Pretrain/Step": 1016, "Pretrain/Step Time": 8.055845925584435} +{"Pretrain/Learning Rate": 4.923363489848489e-05, "Pretrain/Loss": 2.1578681468963623, "Pretrain/Loss (Raw)": 2.0422792434692383, "Pretrain/Step": 1017, "Pretrain/Step Time": 8.058359241113067} +{"Pretrain/Learning Rate": 4.923154752182023e-05, "Pretrain/Loss": 2.155917167663574, "Pretrain/Loss (Raw)": 2.0980172157287598, "Pretrain/Step": 1018, "Pretrain/Step Time": 8.05230195261538} +{"Pretrain/Learning Rate": 4.922945735065934e-05, "Pretrain/Loss": 2.156395673751831, "Pretrain/Loss (Raw)": 2.167292356491089, "Pretrain/Step": 1019, "Pretrain/Step Time": 8.051965175196528} +{"Pretrain/Learning Rate": 4.9227364385243246e-05, "Pretrain/Loss": 2.1573421955108643, "Pretrain/Loss (Raw)": 2.357450246810913, "Pretrain/Step": 1020, "Pretrain/Step Time": 8.055741297081113} +{"Pretrain/Learning Rate": 4.922526862581333e-05, "Pretrain/Loss": 2.157120943069458, "Pretrain/Loss (Raw)": 2.1774790287017822, "Pretrain/Step": 1021, "Pretrain/Step Time": 8.05325779132545} +{"Pretrain/Learning Rate": 4.922317007261129e-05, "Pretrain/Loss": 2.1577658653259277, "Pretrain/Loss (Raw)": 2.208527088165283, "Pretrain/Step": 1022, "Pretrain/Step Time": 8.056073719635606} +{"Pretrain/Learning Rate": 4.922106872587913e-05, "Pretrain/Loss": 2.158381700515747, "Pretrain/Loss (Raw)": 2.2153122425079346, "Pretrain/Step": 1023, "Pretrain/Step Time": 8.05755354091525} +{"Pretrain/Learning Rate": 4.921896458585919e-05, "Pretrain/Loss": 2.159853458404541, "Pretrain/Loss (Raw)": 2.3094608783721924, "Pretrain/Step": 1024, "Pretrain/Step Time": 8.057257313281298} +{"Pretrain/Learning Rate": 4.9216857652794125e-05, "Pretrain/Loss": 2.1590700149536133, "Pretrain/Loss (Raw)": 2.0716090202331543, "Pretrain/Step": 1025, "Pretrain/Step Time": 8.055192962288857} +{"Pretrain/Learning Rate": 4.921474792692692e-05, "Pretrain/Loss": 2.1575851440429688, "Pretrain/Loss (Raw)": 2.07419490814209, "Pretrain/Step": 1026, "Pretrain/Step Time": 8.060136321932077} +{"Pretrain/Learning Rate": 4.921263540850089e-05, "Pretrain/Loss": 2.157238483428955, "Pretrain/Loss (Raw)": 2.1741394996643066, "Pretrain/Step": 1027, "Pretrain/Step Time": 8.064041808247566} +{"Pretrain/Learning Rate": 4.921052009775965e-05, "Pretrain/Loss": 2.158745288848877, "Pretrain/Loss (Raw)": 2.2617976665496826, "Pretrain/Step": 1028, "Pretrain/Step Time": 8.060526298359036} +{"Pretrain/Learning Rate": 4.9208401994947144e-05, "Pretrain/Loss": 2.157230854034424, "Pretrain/Loss (Raw)": 2.1836612224578857, "Pretrain/Step": 1029, "Pretrain/Step Time": 8.065095515921712} +{"Pretrain/Learning Rate": 4.920628110030765e-05, "Pretrain/Loss": 2.1562063694000244, "Pretrain/Loss (Raw)": 2.0483779907226562, "Pretrain/Step": 1030, "Pretrain/Step Time": 8.05618335492909} +{"Pretrain/Learning Rate": 4.920415741408575e-05, "Pretrain/Loss": 2.1563496589660645, "Pretrain/Loss (Raw)": 2.1616640090942383, "Pretrain/Step": 1031, "Pretrain/Step Time": 8.060670256614685} +{"Pretrain/Learning Rate": 4.920203093652637e-05, "Pretrain/Loss": 2.154529571533203, "Pretrain/Loss (Raw)": 2.052898406982422, "Pretrain/Step": 1032, "Pretrain/Step Time": 8.066325634717941} +{"Pretrain/Learning Rate": 4.919990166787474e-05, "Pretrain/Loss": 2.1537413597106934, "Pretrain/Loss (Raw)": 2.115455389022827, "Pretrain/Step": 1033, "Pretrain/Step Time": 8.062957689166069} +{"Pretrain/Learning Rate": 4.919776960837641e-05, "Pretrain/Loss": 2.1547412872314453, "Pretrain/Loss (Raw)": 2.25249981880188, "Pretrain/Step": 1034, "Pretrain/Step Time": 8.067697359248996} +{"Pretrain/Learning Rate": 4.9195634758277264e-05, "Pretrain/Loss": 2.15625, "Pretrain/Loss (Raw)": 2.234410524368286, "Pretrain/Step": 1035, "Pretrain/Step Time": 8.057497439906001} +{"Pretrain/Learning Rate": 4.919349711782351e-05, "Pretrain/Loss": 2.1559629440307617, "Pretrain/Loss (Raw)": 2.1942200660705566, "Pretrain/Step": 1036, "Pretrain/Step Time": 8.064771918579936} +{"Pretrain/Learning Rate": 4.919135668726167e-05, "Pretrain/Loss": 2.157505512237549, "Pretrain/Loss (Raw)": 2.3457300662994385, "Pretrain/Step": 1037, "Pretrain/Step Time": 8.05942516028881} +{"Pretrain/Learning Rate": 4.9189213466838565e-05, "Pretrain/Loss": 2.154906749725342, "Pretrain/Loss (Raw)": 2.019533157348633, "Pretrain/Step": 1038, "Pretrain/Step Time": 8.059754516929388} +{"Pretrain/Learning Rate": 4.91870674568014e-05, "Pretrain/Loss": 2.1551947593688965, "Pretrain/Loss (Raw)": 2.164015054702759, "Pretrain/Step": 1039, "Pretrain/Step Time": 8.058075034990907} +{"Pretrain/Learning Rate": 4.9184918657397625e-05, "Pretrain/Loss": 2.1551949977874756, "Pretrain/Loss (Raw)": 2.179302453994751, "Pretrain/Step": 1040, "Pretrain/Step Time": 8.062663048505783} +{"Pretrain/Learning Rate": 4.918276706887508e-05, "Pretrain/Loss": 2.149132251739502, "Pretrain/Loss (Raw)": 2.0946831703186035, "Pretrain/Step": 1041, "Pretrain/Step Time": 8.06398844346404} +{"Pretrain/Learning Rate": 4.918061269148187e-05, "Pretrain/Loss": 2.150247573852539, "Pretrain/Loss (Raw)": 2.246945381164551, "Pretrain/Step": 1042, "Pretrain/Step Time": 8.060266707092524} +{"Pretrain/Learning Rate": 4.9178455525466484e-05, "Pretrain/Loss": 2.150907516479492, "Pretrain/Loss (Raw)": 2.065988063812256, "Pretrain/Step": 1043, "Pretrain/Step Time": 8.065584218129516} +{"Pretrain/Learning Rate": 4.9176295571077655e-05, "Pretrain/Loss": 2.149811267852783, "Pretrain/Loss (Raw)": 2.1790759563446045, "Pretrain/Step": 1044, "Pretrain/Step Time": 8.060089029371738} +{"Pretrain/Learning Rate": 4.917413282856451e-05, "Pretrain/Loss": 2.1505017280578613, "Pretrain/Loss (Raw)": 2.1500461101531982, "Pretrain/Step": 1045, "Pretrain/Step Time": 8.064015813171864} +{"Pretrain/Learning Rate": 4.917196729817645e-05, "Pretrain/Loss": 2.1500017642974854, "Pretrain/Loss (Raw)": 2.2157723903656006, "Pretrain/Step": 1046, "Pretrain/Step Time": 8.068412424996495} +{"Pretrain/Learning Rate": 4.9169798980163215e-05, "Pretrain/Loss": 2.1490960121154785, "Pretrain/Loss (Raw)": 2.166987895965576, "Pretrain/Step": 1047, "Pretrain/Step Time": 8.061955224722624} +{"Pretrain/Learning Rate": 4.916762787477487e-05, "Pretrain/Loss": 2.1495237350463867, "Pretrain/Loss (Raw)": 2.324460744857788, "Pretrain/Step": 1048, "Pretrain/Step Time": 8.066667614504695} +{"Pretrain/Learning Rate": 4.91654539822618e-05, "Pretrain/Loss": 2.1491360664367676, "Pretrain/Loss (Raw)": 2.133801221847534, "Pretrain/Step": 1049, "Pretrain/Step Time": 8.057191235944629} +{"Pretrain/Learning Rate": 4.916327730287471e-05, "Pretrain/Loss": 2.1476938724517822, "Pretrain/Loss (Raw)": 2.159438133239746, "Pretrain/Step": 1050, "Pretrain/Step Time": 8.060708912089467} +{"Pretrain/Learning Rate": 4.916109783686461e-05, "Pretrain/Loss": 2.147397994995117, "Pretrain/Loss (Raw)": 2.1430046558380127, "Pretrain/Step": 1051, "Pretrain/Step Time": 8.059761341661215} +{"Pretrain/Learning Rate": 4.915891558448287e-05, "Pretrain/Loss": 2.148817539215088, "Pretrain/Loss (Raw)": 2.19488263130188, "Pretrain/Step": 1052, "Pretrain/Step Time": 8.05582413263619} +{"Pretrain/Learning Rate": 4.915673054598113e-05, "Pretrain/Loss": 2.1491284370422363, "Pretrain/Loss (Raw)": 2.0832390785217285, "Pretrain/Step": 1053, "Pretrain/Step Time": 8.052538430318236} +{"Pretrain/Learning Rate": 4.91545427216114e-05, "Pretrain/Loss": 2.148239850997925, "Pretrain/Loss (Raw)": 2.0963213443756104, "Pretrain/Step": 1054, "Pretrain/Step Time": 8.049332033842802} +{"Pretrain/Learning Rate": 4.915235211162599e-05, "Pretrain/Loss": 2.149259567260742, "Pretrain/Loss (Raw)": 2.059492349624634, "Pretrain/Step": 1055, "Pretrain/Step Time": 8.054853493347764} +{"Pretrain/Learning Rate": 4.9150158716277516e-05, "Pretrain/Loss": 2.148158550262451, "Pretrain/Loss (Raw)": 2.031569719314575, "Pretrain/Step": 1056, "Pretrain/Step Time": 8.055578703060746} +{"Pretrain/Learning Rate": 4.9147962535818935e-05, "Pretrain/Loss": 2.150655746459961, "Pretrain/Loss (Raw)": 2.3332314491271973, "Pretrain/Step": 1057, "Pretrain/Step Time": 8.053639341145754} +{"Pretrain/Learning Rate": 4.9145763570503536e-05, "Pretrain/Loss": 2.152010440826416, "Pretrain/Loss (Raw)": 2.2700369358062744, "Pretrain/Step": 1058, "Pretrain/Step Time": 8.053103199228644} +{"Pretrain/Learning Rate": 4.914356182058491e-05, "Pretrain/Loss": 2.152282238006592, "Pretrain/Loss (Raw)": 2.0854337215423584, "Pretrain/Step": 1059, "Pretrain/Step Time": 8.055033864453435} +{"Pretrain/Learning Rate": 4.914135728631695e-05, "Pretrain/Loss": 2.1524837017059326, "Pretrain/Loss (Raw)": 2.1944565773010254, "Pretrain/Step": 1060, "Pretrain/Step Time": 8.05982786603272} +{"Pretrain/Learning Rate": 4.913914996795391e-05, "Pretrain/Loss": 2.152146816253662, "Pretrain/Loss (Raw)": 2.164219617843628, "Pretrain/Step": 1061, "Pretrain/Step Time": 8.047182677313685} +{"Pretrain/Learning Rate": 4.9136939865750357e-05, "Pretrain/Loss": 2.1541450023651123, "Pretrain/Loss (Raw)": 2.3840322494506836, "Pretrain/Step": 1062, "Pretrain/Step Time": 8.053940296173096} +{"Pretrain/Learning Rate": 4.913472697996116e-05, "Pretrain/Loss": 2.154226779937744, "Pretrain/Loss (Raw)": 2.093380928039551, "Pretrain/Step": 1063, "Pretrain/Step Time": 8.049779005348682} +{"Pretrain/Learning Rate": 4.913251131084152e-05, "Pretrain/Loss": 2.152853012084961, "Pretrain/Loss (Raw)": 2.099940299987793, "Pretrain/Step": 1064, "Pretrain/Step Time": 8.054744649678469} +{"Pretrain/Learning Rate": 4.9130292858646966e-05, "Pretrain/Loss": 2.1559813022613525, "Pretrain/Loss (Raw)": 2.3602423667907715, "Pretrain/Step": 1065, "Pretrain/Step Time": 8.0578851159662} +{"Pretrain/Learning Rate": 4.912807162363332e-05, "Pretrain/Loss": 2.154515504837036, "Pretrain/Loss (Raw)": 2.0628182888031006, "Pretrain/Step": 1066, "Pretrain/Step Time": 8.05347746424377} +{"Pretrain/Learning Rate": 4.912584760605677e-05, "Pretrain/Loss": 2.153777599334717, "Pretrain/Loss (Raw)": 2.1922240257263184, "Pretrain/Step": 1067, "Pretrain/Step Time": 8.052728794515133} +{"Pretrain/Learning Rate": 4.9123620806173785e-05, "Pretrain/Loss": 2.154451847076416, "Pretrain/Loss (Raw)": 2.1577515602111816, "Pretrain/Step": 1068, "Pretrain/Step Time": 8.05261031538248} +{"Pretrain/Learning Rate": 4.9121391224241174e-05, "Pretrain/Loss": 2.1554012298583984, "Pretrain/Loss (Raw)": 2.187636137008667, "Pretrain/Step": 1069, "Pretrain/Step Time": 8.05758137628436} +{"Pretrain/Learning Rate": 4.9119158860516066e-05, "Pretrain/Loss": 2.1563563346862793, "Pretrain/Loss (Raw)": 2.2104713916778564, "Pretrain/Step": 1070, "Pretrain/Step Time": 8.062244612723589} +{"Pretrain/Learning Rate": 4.9116923715255905e-05, "Pretrain/Loss": 2.1567115783691406, "Pretrain/Loss (Raw)": 2.1289689540863037, "Pretrain/Step": 1071, "Pretrain/Step Time": 8.053993448615074} +{"Pretrain/Learning Rate": 4.9114685788718454e-05, "Pretrain/Loss": 2.1576759815216064, "Pretrain/Loss (Raw)": 2.2004411220550537, "Pretrain/Step": 1072, "Pretrain/Step Time": 8.060988578945398} +{"Pretrain/Learning Rate": 4.9112445081161813e-05, "Pretrain/Loss": 2.156472682952881, "Pretrain/Loss (Raw)": 2.005331516265869, "Pretrain/Step": 1073, "Pretrain/Step Time": 8.053016325458884} +{"Pretrain/Learning Rate": 4.9110201592844376e-05, "Pretrain/Loss": 2.1548075675964355, "Pretrain/Loss (Raw)": 2.0656394958496094, "Pretrain/Step": 1074, "Pretrain/Step Time": 8.061153817921877} +{"Pretrain/Learning Rate": 4.910795532402489e-05, "Pretrain/Loss": 2.154651641845703, "Pretrain/Loss (Raw)": 2.028172254562378, "Pretrain/Step": 1075, "Pretrain/Step Time": 8.0561758633703} +{"Pretrain/Learning Rate": 4.910570627496239e-05, "Pretrain/Loss": 2.1527457237243652, "Pretrain/Loss (Raw)": 1.9791380167007446, "Pretrain/Step": 1076, "Pretrain/Step Time": 8.051624368876219} +{"Pretrain/Learning Rate": 4.9103454445916256e-05, "Pretrain/Loss": 2.1521754264831543, "Pretrain/Loss (Raw)": 2.0849459171295166, "Pretrain/Step": 1077, "Pretrain/Step Time": 8.057338273152709} +{"Pretrain/Learning Rate": 4.910119983714616e-05, "Pretrain/Loss": 2.1543235778808594, "Pretrain/Loss (Raw)": 2.230048894882202, "Pretrain/Step": 1078, "Pretrain/Step Time": 8.057840390130877} +{"Pretrain/Learning Rate": 4.909894244891214e-05, "Pretrain/Loss": 2.155118942260742, "Pretrain/Loss (Raw)": 2.206488847732544, "Pretrain/Step": 1079, "Pretrain/Step Time": 8.067128850147128} +{"Pretrain/Learning Rate": 4.909668228147453e-05, "Pretrain/Loss": 2.1551074981689453, "Pretrain/Loss (Raw)": 2.1458327770233154, "Pretrain/Step": 1080, "Pretrain/Step Time": 8.060469785705209} +{"Pretrain/Learning Rate": 4.9094419335093966e-05, "Pretrain/Loss": 2.1560885906219482, "Pretrain/Loss (Raw)": 2.2340810298919678, "Pretrain/Step": 1081, "Pretrain/Step Time": 8.063943102955818} +{"Pretrain/Learning Rate": 4.909215361003142e-05, "Pretrain/Loss": 2.1577324867248535, "Pretrain/Loss (Raw)": 2.2797751426696777, "Pretrain/Step": 1082, "Pretrain/Step Time": 8.058837622404099} +{"Pretrain/Learning Rate": 4.90898851065482e-05, "Pretrain/Loss": 2.1563875675201416, "Pretrain/Loss (Raw)": 2.127812147140503, "Pretrain/Step": 1083, "Pretrain/Step Time": 8.059619307518005} +{"Pretrain/Learning Rate": 4.908761382490591e-05, "Pretrain/Loss": 2.1560816764831543, "Pretrain/Loss (Raw)": 2.0769248008728027, "Pretrain/Step": 1084, "Pretrain/Step Time": 8.060038240626454} +{"Pretrain/Learning Rate": 4.908533976536649e-05, "Pretrain/Loss": 2.1569504737854004, "Pretrain/Loss (Raw)": 2.1938109397888184, "Pretrain/Step": 1085, "Pretrain/Step Time": 8.061533072963357} +{"Pretrain/Learning Rate": 4.90830629281922e-05, "Pretrain/Loss": 2.1557044982910156, "Pretrain/Loss (Raw)": 2.0480797290802, "Pretrain/Step": 1086, "Pretrain/Step Time": 8.069762280210853} +{"Pretrain/Learning Rate": 4.908078331364561e-05, "Pretrain/Loss": 2.1548147201538086, "Pretrain/Loss (Raw)": 2.105034828186035, "Pretrain/Step": 1087, "Pretrain/Step Time": 8.064448429271579} +{"Pretrain/Learning Rate": 4.907850092198961e-05, "Pretrain/Loss": 2.1547372341156006, "Pretrain/Loss (Raw)": 2.0811808109283447, "Pretrain/Step": 1088, "Pretrain/Step Time": 8.06962795369327} +{"Pretrain/Learning Rate": 4.9076215753487425e-05, "Pretrain/Loss": 2.154372215270996, "Pretrain/Loss (Raw)": 2.084453582763672, "Pretrain/Step": 1089, "Pretrain/Step Time": 8.059321599081159} +{"Pretrain/Learning Rate": 4.9073927808402585e-05, "Pretrain/Loss": 2.1547465324401855, "Pretrain/Loss (Raw)": 2.1962623596191406, "Pretrain/Step": 1090, "Pretrain/Step Time": 8.067461485043168} +{"Pretrain/Learning Rate": 4.907163708699896e-05, "Pretrain/Loss": 2.1553549766540527, "Pretrain/Loss (Raw)": 2.1167027950286865, "Pretrain/Step": 1091, "Pretrain/Step Time": 8.058506473898888} +{"Pretrain/Learning Rate": 4.9069343589540704e-05, "Pretrain/Loss": 2.154597759246826, "Pretrain/Loss (Raw)": 2.0642340183258057, "Pretrain/Step": 1092, "Pretrain/Step Time": 8.05893444083631} +{"Pretrain/Learning Rate": 4.906704731629233e-05, "Pretrain/Loss": 2.1528871059417725, "Pretrain/Loss (Raw)": 2.136580228805542, "Pretrain/Step": 1093, "Pretrain/Step Time": 8.066719321534038} +{"Pretrain/Learning Rate": 4.9064748267518656e-05, "Pretrain/Loss": 2.1525325775146484, "Pretrain/Loss (Raw)": 2.221937894821167, "Pretrain/Step": 1094, "Pretrain/Step Time": 8.060680862516165} +{"Pretrain/Learning Rate": 4.9062446443484813e-05, "Pretrain/Loss": 2.154453992843628, "Pretrain/Loss (Raw)": 2.43264102935791, "Pretrain/Step": 1095, "Pretrain/Step Time": 8.066849334165454} +{"Pretrain/Learning Rate": 4.9060141844456267e-05, "Pretrain/Loss": 2.1549391746520996, "Pretrain/Loss (Raw)": 2.26343035697937, "Pretrain/Step": 1096, "Pretrain/Step Time": 8.061478029936552} +{"Pretrain/Learning Rate": 4.905783447069878e-05, "Pretrain/Loss": 2.1554367542266846, "Pretrain/Loss (Raw)": 2.2422728538513184, "Pretrain/Step": 1097, "Pretrain/Step Time": 8.07065712660551} +{"Pretrain/Learning Rate": 4.905552432247846e-05, "Pretrain/Loss": 2.156464099884033, "Pretrain/Loss (Raw)": 2.150592803955078, "Pretrain/Step": 1098, "Pretrain/Step Time": 8.066569084301591} +{"Pretrain/Learning Rate": 4.905321140006172e-05, "Pretrain/Loss": 2.1554455757141113, "Pretrain/Loss (Raw)": 2.1145591735839844, "Pretrain/Step": 1099, "Pretrain/Step Time": 8.066258391365409} +{"Pretrain/Learning Rate": 4.90508957037153e-05, "Pretrain/Loss": 2.1561999320983887, "Pretrain/Loss (Raw)": 2.198141098022461, "Pretrain/Step": 1100, "Pretrain/Step Time": 8.063095731660724} +{"Pretrain/Learning Rate": 4.9048577233706264e-05, "Pretrain/Loss": 2.156071424484253, "Pretrain/Loss (Raw)": 2.291053533554077, "Pretrain/Step": 1101, "Pretrain/Step Time": 8.06185488961637} +{"Pretrain/Learning Rate": 4.9046255990301965e-05, "Pretrain/Loss": 2.1541638374328613, "Pretrain/Loss (Raw)": 2.1713287830352783, "Pretrain/Step": 1102, "Pretrain/Step Time": 8.0636120531708} +{"Pretrain/Learning Rate": 4.904393197377012e-05, "Pretrain/Loss": 2.1534016132354736, "Pretrain/Loss (Raw)": 2.1507554054260254, "Pretrain/Step": 1103, "Pretrain/Step Time": 8.067792400717735} +{"Pretrain/Learning Rate": 4.9041605184378746e-05, "Pretrain/Loss": 2.1523008346557617, "Pretrain/Loss (Raw)": 2.0664899349212646, "Pretrain/Step": 1104, "Pretrain/Step Time": 8.067838858813047} +{"Pretrain/Learning Rate": 4.903927562239617e-05, "Pretrain/Loss": 2.151876926422119, "Pretrain/Loss (Raw)": 2.1458871364593506, "Pretrain/Step": 1105, "Pretrain/Step Time": 8.066638860851526} +{"Pretrain/Learning Rate": 4.9036943288091066e-05, "Pretrain/Loss": 2.152336597442627, "Pretrain/Loss (Raw)": 2.101076602935791, "Pretrain/Step": 1106, "Pretrain/Step Time": 8.059591321274638} +{"Pretrain/Learning Rate": 4.903460818173238e-05, "Pretrain/Loss": 2.1525561809539795, "Pretrain/Loss (Raw)": 2.1369943618774414, "Pretrain/Step": 1107, "Pretrain/Step Time": 8.066321386024356} +{"Pretrain/Learning Rate": 4.9032270303589435e-05, "Pretrain/Loss": 2.154252052307129, "Pretrain/Loss (Raw)": 2.310744047164917, "Pretrain/Step": 1108, "Pretrain/Step Time": 8.0622474309057} +{"Pretrain/Learning Rate": 4.9029929653931826e-05, "Pretrain/Loss": 2.155648708343506, "Pretrain/Loss (Raw)": 2.2448689937591553, "Pretrain/Step": 1109, "Pretrain/Step Time": 8.064263336360455} +{"Pretrain/Learning Rate": 4.90275862330295e-05, "Pretrain/Loss": 2.154961585998535, "Pretrain/Loss (Raw)": 2.0631113052368164, "Pretrain/Step": 1110, "Pretrain/Step Time": 8.055904116481543} +{"Pretrain/Learning Rate": 4.902524004115271e-05, "Pretrain/Loss": 2.1541004180908203, "Pretrain/Loss (Raw)": 2.0834574699401855, "Pretrain/Step": 1111, "Pretrain/Step Time": 8.058480139821768} +{"Pretrain/Learning Rate": 4.902289107857202e-05, "Pretrain/Loss": 2.153921604156494, "Pretrain/Loss (Raw)": 2.1259210109710693, "Pretrain/Step": 1112, "Pretrain/Step Time": 8.068821934983134} +{"Pretrain/Learning Rate": 4.9020539345558335e-05, "Pretrain/Loss": 2.1561179161071777, "Pretrain/Loss (Raw)": 2.48496413230896, "Pretrain/Step": 1113, "Pretrain/Step Time": 8.061947559937835} +{"Pretrain/Learning Rate": 4.9018184842382866e-05, "Pretrain/Loss": 2.157371997833252, "Pretrain/Loss (Raw)": 2.201538562774658, "Pretrain/Step": 1114, "Pretrain/Step Time": 8.073086207732558} +{"Pretrain/Learning Rate": 4.901582756931715e-05, "Pretrain/Loss": 2.158083915710449, "Pretrain/Loss (Raw)": 2.2007884979248047, "Pretrain/Step": 1115, "Pretrain/Step Time": 8.068224553018808} +{"Pretrain/Learning Rate": 4.901346752663302e-05, "Pretrain/Loss": 2.158107280731201, "Pretrain/Loss (Raw)": 2.1252493858337402, "Pretrain/Step": 1116, "Pretrain/Step Time": 8.072342846542597} +{"Pretrain/Learning Rate": 4.9011104714602666e-05, "Pretrain/Loss": 2.158815383911133, "Pretrain/Loss (Raw)": 2.1446359157562256, "Pretrain/Step": 1117, "Pretrain/Step Time": 8.071110557764769} +{"Pretrain/Learning Rate": 4.900873913349857e-05, "Pretrain/Loss": 2.158165454864502, "Pretrain/Loss (Raw)": 2.086691379547119, "Pretrain/Step": 1118, "Pretrain/Step Time": 8.06693321838975} +{"Pretrain/Learning Rate": 4.9006370783593544e-05, "Pretrain/Loss": 2.1588833332061768, "Pretrain/Loss (Raw)": 2.221118211746216, "Pretrain/Step": 1119, "Pretrain/Step Time": 8.063810395076871} +{"Pretrain/Learning Rate": 4.900399966516073e-05, "Pretrain/Loss": 2.156606674194336, "Pretrain/Loss (Raw)": 2.123206377029419, "Pretrain/Step": 1120, "Pretrain/Step Time": 8.07260993681848} +{"Pretrain/Learning Rate": 4.900162577847355e-05, "Pretrain/Loss": 2.1557092666625977, "Pretrain/Loss (Raw)": 1.9494832754135132, "Pretrain/Step": 1121, "Pretrain/Step Time": 8.068561622872949} +{"Pretrain/Learning Rate": 4.899924912380579e-05, "Pretrain/Loss": 2.1552672386169434, "Pretrain/Loss (Raw)": 2.0550031661987305, "Pretrain/Step": 1122, "Pretrain/Step Time": 8.059837009757757} +{"Pretrain/Learning Rate": 4.899686970143153e-05, "Pretrain/Loss": 2.1557672023773193, "Pretrain/Loss (Raw)": 2.198674201965332, "Pretrain/Step": 1123, "Pretrain/Step Time": 8.07004076614976} +{"Pretrain/Learning Rate": 4.8994487511625184e-05, "Pretrain/Loss": 2.1568167209625244, "Pretrain/Loss (Raw)": 2.176344633102417, "Pretrain/Step": 1124, "Pretrain/Step Time": 8.062576495110989} +{"Pretrain/Learning Rate": 4.899210255466147e-05, "Pretrain/Loss": 2.158046245574951, "Pretrain/Loss (Raw)": 2.151437282562256, "Pretrain/Step": 1125, "Pretrain/Step Time": 8.067579274997115} +{"Pretrain/Learning Rate": 4.898971483081543e-05, "Pretrain/Loss": 2.157714366912842, "Pretrain/Loss (Raw)": 2.130474328994751, "Pretrain/Step": 1126, "Pretrain/Step Time": 8.06847708672285} +{"Pretrain/Learning Rate": 4.898732434036244e-05, "Pretrain/Loss": 2.156777858734131, "Pretrain/Loss (Raw)": 2.0665838718414307, "Pretrain/Step": 1127, "Pretrain/Step Time": 8.061650542542338} +{"Pretrain/Learning Rate": 4.898493108357817e-05, "Pretrain/Loss": 2.156461238861084, "Pretrain/Loss (Raw)": 2.1067841053009033, "Pretrain/Step": 1128, "Pretrain/Step Time": 8.065651718527079} +{"Pretrain/Learning Rate": 4.898253506073863e-05, "Pretrain/Loss": 2.1553964614868164, "Pretrain/Loss (Raw)": 1.9656885862350464, "Pretrain/Step": 1129, "Pretrain/Step Time": 8.063924660906196} +{"Pretrain/Learning Rate": 4.8980136272120136e-05, "Pretrain/Loss": 2.1542348861694336, "Pretrain/Loss (Raw)": 2.21091628074646, "Pretrain/Step": 1130, "Pretrain/Step Time": 8.066026760265231} +{"Pretrain/Learning Rate": 4.8977734717999326e-05, "Pretrain/Loss": 2.156059503555298, "Pretrain/Loss (Raw)": 2.235426425933838, "Pretrain/Step": 1131, "Pretrain/Step Time": 8.06735796481371} +{"Pretrain/Learning Rate": 4.8975330398653164e-05, "Pretrain/Loss": 2.1577677726745605, "Pretrain/Loss (Raw)": 2.331056833267212, "Pretrain/Step": 1132, "Pretrain/Step Time": 8.070657467469573} +{"Pretrain/Learning Rate": 4.8972923314358934e-05, "Pretrain/Loss": 2.1573495864868164, "Pretrain/Loss (Raw)": 2.231015682220459, "Pretrain/Step": 1133, "Pretrain/Step Time": 8.065077718347311} +{"Pretrain/Learning Rate": 4.8970513465394206e-05, "Pretrain/Loss": 2.1550941467285156, "Pretrain/Loss (Raw)": 2.0594120025634766, "Pretrain/Step": 1134, "Pretrain/Step Time": 8.064785122871399} +{"Pretrain/Learning Rate": 4.896810085203692e-05, "Pretrain/Loss": 2.1546037197113037, "Pretrain/Loss (Raw)": 2.0473806858062744, "Pretrain/Step": 1135, "Pretrain/Step Time": 8.067277831956744} +{"Pretrain/Learning Rate": 4.896568547456531e-05, "Pretrain/Loss": 2.154388904571533, "Pretrain/Loss (Raw)": 2.1510322093963623, "Pretrain/Step": 1136, "Pretrain/Step Time": 8.063922533765435} +{"Pretrain/Learning Rate": 4.896326733325791e-05, "Pretrain/Loss": 2.1540560722351074, "Pretrain/Loss (Raw)": 2.0114216804504395, "Pretrain/Step": 1137, "Pretrain/Step Time": 8.069583414122462} +{"Pretrain/Learning Rate": 4.8960846428393615e-05, "Pretrain/Loss": 2.156445026397705, "Pretrain/Loss (Raw)": 2.2117857933044434, "Pretrain/Step": 1138, "Pretrain/Step Time": 8.064681004732847} +{"Pretrain/Learning Rate": 4.8958422760251585e-05, "Pretrain/Loss": 2.155911445617676, "Pretrain/Loss (Raw)": 2.017808198928833, "Pretrain/Step": 1139, "Pretrain/Step Time": 8.071582304313779} +{"Pretrain/Learning Rate": 4.8955996329111364e-05, "Pretrain/Loss": 2.1558449268341064, "Pretrain/Loss (Raw)": 2.1304867267608643, "Pretrain/Step": 1140, "Pretrain/Step Time": 8.069505026564002} +{"Pretrain/Learning Rate": 4.895356713525275e-05, "Pretrain/Loss": 2.1563503742218018, "Pretrain/Loss (Raw)": 2.083496570587158, "Pretrain/Step": 1141, "Pretrain/Step Time": 8.061304572969675} +{"Pretrain/Learning Rate": 4.895113517895591e-05, "Pretrain/Loss": 2.156632423400879, "Pretrain/Loss (Raw)": 2.1759917736053467, "Pretrain/Step": 1142, "Pretrain/Step Time": 8.062442822381854} +{"Pretrain/Learning Rate": 4.8948700460501294e-05, "Pretrain/Loss": 2.1584653854370117, "Pretrain/Loss (Raw)": 2.2278201580047607, "Pretrain/Step": 1143, "Pretrain/Step Time": 8.056606007739902} +{"Pretrain/Learning Rate": 4.8946262980169686e-05, "Pretrain/Loss": 2.15932297706604, "Pretrain/Loss (Raw)": 2.293501853942871, "Pretrain/Step": 1144, "Pretrain/Step Time": 8.064538953825831} +{"Pretrain/Learning Rate": 4.894382273824221e-05, "Pretrain/Loss": 2.160569429397583, "Pretrain/Loss (Raw)": 2.201829195022583, "Pretrain/Step": 1145, "Pretrain/Step Time": 8.061386987566948} +{"Pretrain/Learning Rate": 4.894137973500025e-05, "Pretrain/Loss": 2.161679744720459, "Pretrain/Loss (Raw)": 2.2401645183563232, "Pretrain/Step": 1146, "Pretrain/Step Time": 8.063918625935912} +{"Pretrain/Learning Rate": 4.893893397072558e-05, "Pretrain/Loss": 2.1616227626800537, "Pretrain/Loss (Raw)": 2.1599884033203125, "Pretrain/Step": 1147, "Pretrain/Step Time": 8.06211294978857} +{"Pretrain/Learning Rate": 4.893648544570022e-05, "Pretrain/Loss": 2.1601104736328125, "Pretrain/Loss (Raw)": 2.1638691425323486, "Pretrain/Step": 1148, "Pretrain/Step Time": 8.05535594932735} +{"Pretrain/Learning Rate": 4.893403416020658e-05, "Pretrain/Loss": 2.1599998474121094, "Pretrain/Loss (Raw)": 2.163297176361084, "Pretrain/Step": 1149, "Pretrain/Step Time": 8.06511539593339} +{"Pretrain/Learning Rate": 4.893158011452734e-05, "Pretrain/Loss": 2.158440589904785, "Pretrain/Loss (Raw)": 2.0089569091796875, "Pretrain/Step": 1150, "Pretrain/Step Time": 8.060504643246531} +{"Pretrain/Learning Rate": 4.8929123308945505e-05, "Pretrain/Loss": 2.1586172580718994, "Pretrain/Loss (Raw)": 2.237924337387085, "Pretrain/Step": 1151, "Pretrain/Step Time": 8.059699574485421} +{"Pretrain/Learning Rate": 4.8926663743744414e-05, "Pretrain/Loss": 2.1567018032073975, "Pretrain/Loss (Raw)": 2.0642871856689453, "Pretrain/Step": 1152, "Pretrain/Step Time": 8.057551680132747} +{"Pretrain/Learning Rate": 4.892420141920772e-05, "Pretrain/Loss": 2.1576452255249023, "Pretrain/Loss (Raw)": 2.1923677921295166, "Pretrain/Step": 1153, "Pretrain/Step Time": 8.055922081694007} +{"Pretrain/Learning Rate": 4.8921736335619385e-05, "Pretrain/Loss": 2.1578118801116943, "Pretrain/Loss (Raw)": 2.095534324645996, "Pretrain/Step": 1154, "Pretrain/Step Time": 8.060229048132896} +{"Pretrain/Learning Rate": 4.8919268493263684e-05, "Pretrain/Loss": 2.155829906463623, "Pretrain/Loss (Raw)": 1.9204657077789307, "Pretrain/Step": 1155, "Pretrain/Step Time": 8.049093836918473} +{"Pretrain/Learning Rate": 4.891679789242524e-05, "Pretrain/Loss": 2.154308795928955, "Pretrain/Loss (Raw)": 2.067080497741699, "Pretrain/Step": 1156, "Pretrain/Step Time": 8.054344341158867} +{"Pretrain/Learning Rate": 4.891432453338895e-05, "Pretrain/Loss": 2.1546716690063477, "Pretrain/Loss (Raw)": 2.2300832271575928, "Pretrain/Step": 1157, "Pretrain/Step Time": 8.048044633120298} +{"Pretrain/Learning Rate": 4.8911848416440075e-05, "Pretrain/Loss": 2.1552224159240723, "Pretrain/Loss (Raw)": 2.118889331817627, "Pretrain/Step": 1158, "Pretrain/Step Time": 8.05721060745418} +{"Pretrain/Learning Rate": 4.890936954186416e-05, "Pretrain/Loss": 2.1547019481658936, "Pretrain/Loss (Raw)": 2.0950539112091064, "Pretrain/Step": 1159, "Pretrain/Step Time": 8.058918604627252} +{"Pretrain/Learning Rate": 4.890688790994709e-05, "Pretrain/Loss": 2.156602382659912, "Pretrain/Loss (Raw)": 2.296119451522827, "Pretrain/Step": 1160, "Pretrain/Step Time": 8.05024884454906} +{"Pretrain/Learning Rate": 4.890440352097505e-05, "Pretrain/Loss": 2.1556191444396973, "Pretrain/Loss (Raw)": 1.9896131753921509, "Pretrain/Step": 1161, "Pretrain/Step Time": 8.05924609862268} +{"Pretrain/Learning Rate": 4.8901916375234556e-05, "Pretrain/Loss": 2.1553969383239746, "Pretrain/Loss (Raw)": 2.2240519523620605, "Pretrain/Step": 1162, "Pretrain/Step Time": 8.049959111958742} +{"Pretrain/Learning Rate": 4.889942647301243e-05, "Pretrain/Loss": 2.1560018062591553, "Pretrain/Loss (Raw)": 2.311870574951172, "Pretrain/Step": 1163, "Pretrain/Step Time": 8.056878998875618} +{"Pretrain/Learning Rate": 4.8896933814595834e-05, "Pretrain/Loss": 2.154780864715576, "Pretrain/Loss (Raw)": 2.03790283203125, "Pretrain/Step": 1164, "Pretrain/Step Time": 8.05648284777999} +{"Pretrain/Learning Rate": 4.8894438400272224e-05, "Pretrain/Loss": 2.153319835662842, "Pretrain/Loss (Raw)": 2.158729076385498, "Pretrain/Step": 1165, "Pretrain/Step Time": 8.058861861005425} +{"Pretrain/Learning Rate": 4.889194023032938e-05, "Pretrain/Loss": 2.1534781455993652, "Pretrain/Loss (Raw)": 2.0397961139678955, "Pretrain/Step": 1166, "Pretrain/Step Time": 8.06633304618299} +{"Pretrain/Learning Rate": 4.8889439305055406e-05, "Pretrain/Loss": 2.1538782119750977, "Pretrain/Loss (Raw)": 2.215219020843506, "Pretrain/Step": 1167, "Pretrain/Step Time": 8.060965053737164} +{"Pretrain/Learning Rate": 4.8886935624738715e-05, "Pretrain/Loss": 2.152069091796875, "Pretrain/Loss (Raw)": 1.9477598667144775, "Pretrain/Step": 1168, "Pretrain/Step Time": 8.066582383587956} +{"Pretrain/Learning Rate": 4.888442918966806e-05, "Pretrain/Loss": 2.1542818546295166, "Pretrain/Loss (Raw)": 2.3779187202453613, "Pretrain/Step": 1169, "Pretrain/Step Time": 8.062860809266567} +{"Pretrain/Learning Rate": 4.888192000013248e-05, "Pretrain/Loss": 2.1526427268981934, "Pretrain/Loss (Raw)": 2.0371036529541016, "Pretrain/Step": 1170, "Pretrain/Step Time": 8.060270050540566} +{"Pretrain/Learning Rate": 4.887940805642135e-05, "Pretrain/Loss": 2.1532130241394043, "Pretrain/Loss (Raw)": 2.138981819152832, "Pretrain/Step": 1171, "Pretrain/Step Time": 8.057116352021694} +{"Pretrain/Learning Rate": 4.887689335882436e-05, "Pretrain/Loss": 2.152766227722168, "Pretrain/Loss (Raw)": 2.121905565261841, "Pretrain/Step": 1172, "Pretrain/Step Time": 8.066935766488314} +{"Pretrain/Learning Rate": 4.8874375907631506e-05, "Pretrain/Loss": 2.151996612548828, "Pretrain/Loss (Raw)": 2.0515506267547607, "Pretrain/Step": 1173, "Pretrain/Step Time": 8.06980157457292} +{"Pretrain/Learning Rate": 4.887185570313314e-05, "Pretrain/Loss": 2.1511058807373047, "Pretrain/Loss (Raw)": 2.101745367050171, "Pretrain/Step": 1174, "Pretrain/Step Time": 8.06258606724441} +{"Pretrain/Learning Rate": 4.886933274561988e-05, "Pretrain/Loss": 2.1507887840270996, "Pretrain/Loss (Raw)": 2.1263887882232666, "Pretrain/Step": 1175, "Pretrain/Step Time": 8.070717072114348} +{"Pretrain/Learning Rate": 4.886680703538269e-05, "Pretrain/Loss": 2.1474108695983887, "Pretrain/Loss (Raw)": 1.8921293020248413, "Pretrain/Step": 1176, "Pretrain/Step Time": 8.063320025801659} +{"Pretrain/Learning Rate": 4.886427857271284e-05, "Pretrain/Loss": 2.146461009979248, "Pretrain/Loss (Raw)": 2.012218952178955, "Pretrain/Step": 1177, "Pretrain/Step Time": 8.068383757025003} +{"Pretrain/Learning Rate": 4.886174735790194e-05, "Pretrain/Loss": 2.1459028720855713, "Pretrain/Loss (Raw)": 2.087958812713623, "Pretrain/Step": 1178, "Pretrain/Step Time": 8.07468468695879} +{"Pretrain/Learning Rate": 4.88592133912419e-05, "Pretrain/Loss": 2.146456480026245, "Pretrain/Loss (Raw)": 2.213878631591797, "Pretrain/Step": 1179, "Pretrain/Step Time": 8.073544293642044} +{"Pretrain/Learning Rate": 4.885667667302494e-05, "Pretrain/Loss": 2.145829916000366, "Pretrain/Loss (Raw)": 2.114668369293213, "Pretrain/Step": 1180, "Pretrain/Step Time": 8.081683203577995} +{"Pretrain/Learning Rate": 4.88541372035436e-05, "Pretrain/Loss": 2.145942449569702, "Pretrain/Loss (Raw)": 2.0976600646972656, "Pretrain/Step": 1181, "Pretrain/Step Time": 8.079770244657993} +{"Pretrain/Learning Rate": 4.885159498309077e-05, "Pretrain/Loss": 2.1462206840515137, "Pretrain/Loss (Raw)": 2.1319122314453125, "Pretrain/Step": 1182, "Pretrain/Step Time": 8.07792516052723} +{"Pretrain/Learning Rate": 4.884905001195961e-05, "Pretrain/Loss": 2.146589756011963, "Pretrain/Loss (Raw)": 2.106727123260498, "Pretrain/Step": 1183, "Pretrain/Step Time": 8.075028007850051} +{"Pretrain/Learning Rate": 4.884650229044361e-05, "Pretrain/Loss": 2.148909568786621, "Pretrain/Loss (Raw)": 2.328530788421631, "Pretrain/Step": 1184, "Pretrain/Step Time": 8.076850827783346} +{"Pretrain/Learning Rate": 4.884395181883661e-05, "Pretrain/Loss": 2.1467936038970947, "Pretrain/Loss (Raw)": 2.0623905658721924, "Pretrain/Step": 1185, "Pretrain/Step Time": 8.073230477049947} +{"Pretrain/Learning Rate": 4.8841398597432725e-05, "Pretrain/Loss": 2.145143985748291, "Pretrain/Loss (Raw)": 2.058866024017334, "Pretrain/Step": 1186, "Pretrain/Step Time": 8.076593147590756} +{"Pretrain/Learning Rate": 4.883884262652641e-05, "Pretrain/Loss": 2.145564556121826, "Pretrain/Loss (Raw)": 2.139270067214966, "Pretrain/Step": 1187, "Pretrain/Step Time": 8.074627300724387} +{"Pretrain/Learning Rate": 4.883628390641243e-05, "Pretrain/Loss": 2.146977424621582, "Pretrain/Loss (Raw)": 2.3753087520599365, "Pretrain/Step": 1188, "Pretrain/Step Time": 8.067856011912227} +{"Pretrain/Learning Rate": 4.883372243738588e-05, "Pretrain/Loss": 2.1463165283203125, "Pretrain/Loss (Raw)": 2.0796263217926025, "Pretrain/Step": 1189, "Pretrain/Step Time": 8.069203583523631} +{"Pretrain/Learning Rate": 4.883115821974213e-05, "Pretrain/Loss": 2.1433987617492676, "Pretrain/Loss (Raw)": 2.010561943054199, "Pretrain/Step": 1190, "Pretrain/Step Time": 8.062736760824919} +{"Pretrain/Learning Rate": 4.8828591253776937e-05, "Pretrain/Loss": 2.143739700317383, "Pretrain/Loss (Raw)": 2.1370344161987305, "Pretrain/Step": 1191, "Pretrain/Step Time": 8.075892930850387} +{"Pretrain/Learning Rate": 4.88260215397863e-05, "Pretrain/Loss": 2.14648699760437, "Pretrain/Loss (Raw)": 2.4515786170959473, "Pretrain/Step": 1192, "Pretrain/Step Time": 8.085111159831285} +{"Pretrain/Learning Rate": 4.882344907806659e-05, "Pretrain/Loss": 2.1464903354644775, "Pretrain/Loss (Raw)": 2.360677480697632, "Pretrain/Step": 1193, "Pretrain/Step Time": 8.078592149540782} +{"Pretrain/Learning Rate": 4.882087386891448e-05, "Pretrain/Loss": 2.1463141441345215, "Pretrain/Loss (Raw)": 2.040257453918457, "Pretrain/Step": 1194, "Pretrain/Step Time": 8.083161860704422} +{"Pretrain/Learning Rate": 4.8818295912626955e-05, "Pretrain/Loss": 2.145415782928467, "Pretrain/Loss (Raw)": 2.0772345066070557, "Pretrain/Step": 1195, "Pretrain/Step Time": 8.080945448949933} +{"Pretrain/Learning Rate": 4.88157152095013e-05, "Pretrain/Loss": 2.145261287689209, "Pretrain/Loss (Raw)": 2.137974739074707, "Pretrain/Step": 1196, "Pretrain/Step Time": 8.080104926601052} +{"Pretrain/Learning Rate": 4.881313175983515e-05, "Pretrain/Loss": 2.1440510749816895, "Pretrain/Loss (Raw)": 2.0327470302581787, "Pretrain/Step": 1197, "Pretrain/Step Time": 8.082498682662845} +{"Pretrain/Learning Rate": 4.881054556392642e-05, "Pretrain/Loss": 2.143796682357788, "Pretrain/Loss (Raw)": 2.1778836250305176, "Pretrain/Step": 1198, "Pretrain/Step Time": 8.073620645329356} +{"Pretrain/Learning Rate": 4.8807956622073394e-05, "Pretrain/Loss": 2.1432337760925293, "Pretrain/Loss (Raw)": 2.056926727294922, "Pretrain/Step": 1199, "Pretrain/Step Time": 8.081625929102302} +{"Pretrain/Learning Rate": 4.880536493457461e-05, "Pretrain/Loss": 2.1431427001953125, "Pretrain/Loss (Raw)": 2.188776731491089, "Pretrain/Step": 1200, "Pretrain/Step Time": 8.07615640759468} +{"Pretrain/Learning Rate": 4.880277050172897e-05, "Pretrain/Loss": 2.1435062885284424, "Pretrain/Loss (Raw)": 2.0518710613250732, "Pretrain/Step": 1201, "Pretrain/Step Time": 8.075709322467446} +{"Pretrain/Learning Rate": 4.880017332383567e-05, "Pretrain/Loss": 2.1438300609588623, "Pretrain/Loss (Raw)": 2.1070778369903564, "Pretrain/Step": 1202, "Pretrain/Step Time": 8.075875511392951} +{"Pretrain/Learning Rate": 4.879757340119425e-05, "Pretrain/Loss": 2.1444003582000732, "Pretrain/Loss (Raw)": 2.1011645793914795, "Pretrain/Step": 1203, "Pretrain/Step Time": 8.07437041029334} +{"Pretrain/Learning Rate": 4.879497073410451e-05, "Pretrain/Loss": 2.1452832221984863, "Pretrain/Loss (Raw)": 2.0921761989593506, "Pretrain/Step": 1204, "Pretrain/Step Time": 8.08631275780499} +{"Pretrain/Learning Rate": 4.8792365322866626e-05, "Pretrain/Loss": 2.143951416015625, "Pretrain/Loss (Raw)": 1.914471983909607, "Pretrain/Step": 1205, "Pretrain/Step Time": 8.071851469576359} +{"Pretrain/Learning Rate": 4.878975716778106e-05, "Pretrain/Loss": 2.143655300140381, "Pretrain/Loss (Raw)": 2.192112684249878, "Pretrain/Step": 1206, "Pretrain/Step Time": 8.078796859830618} +{"Pretrain/Learning Rate": 4.878714626914859e-05, "Pretrain/Loss": 2.1448893547058105, "Pretrain/Loss (Raw)": 2.3644745349884033, "Pretrain/Step": 1207, "Pretrain/Step Time": 8.06867951899767} +{"Pretrain/Learning Rate": 4.878453262727033e-05, "Pretrain/Loss": 2.1441850662231445, "Pretrain/Loss (Raw)": 2.0556530952453613, "Pretrain/Step": 1208, "Pretrain/Step Time": 8.072866421192884} +{"Pretrain/Learning Rate": 4.878191624244769e-05, "Pretrain/Loss": 2.1433310508728027, "Pretrain/Loss (Raw)": 2.124783754348755, "Pretrain/Step": 1209, "Pretrain/Step Time": 8.067775571718812} +{"Pretrain/Learning Rate": 4.8779297114982406e-05, "Pretrain/Loss": 2.1424179077148438, "Pretrain/Loss (Raw)": 2.1629133224487305, "Pretrain/Step": 1210, "Pretrain/Step Time": 8.071656135842204} +{"Pretrain/Learning Rate": 4.877667524517652e-05, "Pretrain/Loss": 2.1425223350524902, "Pretrain/Loss (Raw)": 2.141186475753784, "Pretrain/Step": 1211, "Pretrain/Step Time": 8.076124001294374} +{"Pretrain/Learning Rate": 4.877405063333241e-05, "Pretrain/Loss": 2.141833782196045, "Pretrain/Loss (Raw)": 1.9887861013412476, "Pretrain/Step": 1212, "Pretrain/Step Time": 8.071279365569353} +{"Pretrain/Learning Rate": 4.877142327975276e-05, "Pretrain/Loss": 2.1406259536743164, "Pretrain/Loss (Raw)": 2.039198398590088, "Pretrain/Step": 1213, "Pretrain/Step Time": 8.078785562887788} +{"Pretrain/Learning Rate": 4.8768793184740556e-05, "Pretrain/Loss": 2.140878200531006, "Pretrain/Loss (Raw)": 2.080357551574707, "Pretrain/Step": 1214, "Pretrain/Step Time": 8.072769520804286} +{"Pretrain/Learning Rate": 4.8766160348599125e-05, "Pretrain/Loss": 2.1418886184692383, "Pretrain/Loss (Raw)": 2.2343790531158447, "Pretrain/Step": 1215, "Pretrain/Step Time": 8.079150587320328} +{"Pretrain/Learning Rate": 4.876352477163209e-05, "Pretrain/Loss": 2.1424624919891357, "Pretrain/Loss (Raw)": 2.154616117477417, "Pretrain/Step": 1216, "Pretrain/Step Time": 8.074995083734393} +{"Pretrain/Learning Rate": 4.8760886454143394e-05, "Pretrain/Loss": 2.143077850341797, "Pretrain/Loss (Raw)": 2.1632208824157715, "Pretrain/Step": 1217, "Pretrain/Step Time": 8.081629283726215} +{"Pretrain/Learning Rate": 4.875824539643731e-05, "Pretrain/Loss": 2.14237642288208, "Pretrain/Loss (Raw)": 2.106491804122925, "Pretrain/Step": 1218, "Pretrain/Step Time": 8.073240192607045} +{"Pretrain/Learning Rate": 4.8755601598818427e-05, "Pretrain/Loss": 2.1414990425109863, "Pretrain/Loss (Raw)": 2.0043888092041016, "Pretrain/Step": 1219, "Pretrain/Step Time": 8.078689765185118} +{"Pretrain/Learning Rate": 4.875295506159161e-05, "Pretrain/Loss": 2.1425302028656006, "Pretrain/Loss (Raw)": 2.196237087249756, "Pretrain/Step": 1220, "Pretrain/Step Time": 8.079525042325258} +{"Pretrain/Learning Rate": 4.87503057850621e-05, "Pretrain/Loss": 2.142510414123535, "Pretrain/Loss (Raw)": 2.1340644359588623, "Pretrain/Step": 1221, "Pretrain/Step Time": 8.065360087901354} +{"Pretrain/Learning Rate": 4.874765376953541e-05, "Pretrain/Loss": 2.1425044536590576, "Pretrain/Loss (Raw)": 2.2211477756500244, "Pretrain/Step": 1222, "Pretrain/Step Time": 8.076520316302776} +{"Pretrain/Learning Rate": 4.874499901531737e-05, "Pretrain/Loss": 2.139882802963257, "Pretrain/Loss (Raw)": 2.0970709323883057, "Pretrain/Step": 1223, "Pretrain/Step Time": 8.066555742174387} +{"Pretrain/Learning Rate": 4.874234152271418e-05, "Pretrain/Loss": 2.138704299926758, "Pretrain/Loss (Raw)": 2.112607479095459, "Pretrain/Step": 1224, "Pretrain/Step Time": 8.076154323294759} +{"Pretrain/Learning Rate": 4.8739681292032266e-05, "Pretrain/Loss": 2.1380701065063477, "Pretrain/Loss (Raw)": 2.161076545715332, "Pretrain/Step": 1225, "Pretrain/Step Time": 8.067228885367513} +{"Pretrain/Learning Rate": 4.8737018323578445e-05, "Pretrain/Loss": 2.1395649909973145, "Pretrain/Loss (Raw)": 2.3419647216796875, "Pretrain/Step": 1226, "Pretrain/Step Time": 8.069472510367632} +{"Pretrain/Learning Rate": 4.873435261765982e-05, "Pretrain/Loss": 2.1392064094543457, "Pretrain/Loss (Raw)": 2.068619728088379, "Pretrain/Step": 1227, "Pretrain/Step Time": 8.061321998015046} +{"Pretrain/Learning Rate": 4.873168417458381e-05, "Pretrain/Loss": 2.1379446983337402, "Pretrain/Loss (Raw)": 2.0366435050964355, "Pretrain/Step": 1228, "Pretrain/Step Time": 8.067097390070558} +{"Pretrain/Learning Rate": 4.8729012994658166e-05, "Pretrain/Loss": 2.135253667831421, "Pretrain/Loss (Raw)": 1.9466110467910767, "Pretrain/Step": 1229, "Pretrain/Step Time": 8.066314356401563} +{"Pretrain/Learning Rate": 4.8726339078190914e-05, "Pretrain/Loss": 2.1346325874328613, "Pretrain/Loss (Raw)": 2.091852903366089, "Pretrain/Step": 1230, "Pretrain/Step Time": 8.063647974282503} +{"Pretrain/Learning Rate": 4.872366242549044e-05, "Pretrain/Loss": 2.134182929992676, "Pretrain/Loss (Raw)": 2.093172073364258, "Pretrain/Step": 1231, "Pretrain/Step Time": 8.06672052666545} +{"Pretrain/Learning Rate": 4.872098303686543e-05, "Pretrain/Loss": 2.1356444358825684, "Pretrain/Loss (Raw)": 2.253568649291992, "Pretrain/Step": 1232, "Pretrain/Step Time": 8.066283797845244} +{"Pretrain/Learning Rate": 4.871830091262488e-05, "Pretrain/Loss": 2.134244441986084, "Pretrain/Loss (Raw)": 1.9666838645935059, "Pretrain/Step": 1233, "Pretrain/Step Time": 8.069474067538977} +{"Pretrain/Learning Rate": 4.8715616053078095e-05, "Pretrain/Loss": 2.136058807373047, "Pretrain/Loss (Raw)": 2.3333423137664795, "Pretrain/Step": 1234, "Pretrain/Step Time": 8.066764594987035} +{"Pretrain/Learning Rate": 4.871292845853472e-05, "Pretrain/Loss": 2.135124683380127, "Pretrain/Loss (Raw)": 2.017394781112671, "Pretrain/Step": 1235, "Pretrain/Step Time": 8.063864208757877} +{"Pretrain/Learning Rate": 4.87102381293047e-05, "Pretrain/Loss": 2.1336162090301514, "Pretrain/Loss (Raw)": 2.1176583766937256, "Pretrain/Step": 1236, "Pretrain/Step Time": 8.0690295137465} +{"Pretrain/Learning Rate": 4.870754506569829e-05, "Pretrain/Loss": 2.1319363117218018, "Pretrain/Loss (Raw)": 2.029873847961426, "Pretrain/Step": 1237, "Pretrain/Step Time": 8.065536998212337} +{"Pretrain/Learning Rate": 4.870484926802606e-05, "Pretrain/Loss": 2.1323649883270264, "Pretrain/Loss (Raw)": 2.1179590225219727, "Pretrain/Step": 1238, "Pretrain/Step Time": 8.073407495394349} +{"Pretrain/Learning Rate": 4.8702150736598925e-05, "Pretrain/Loss": 2.135336399078369, "Pretrain/Loss (Raw)": 2.4637908935546875, "Pretrain/Step": 1239, "Pretrain/Step Time": 8.065521381795406} +{"Pretrain/Learning Rate": 4.8699449471728075e-05, "Pretrain/Loss": 2.134639263153076, "Pretrain/Loss (Raw)": 2.036708116531372, "Pretrain/Step": 1240, "Pretrain/Step Time": 8.058315861970186} +{"Pretrain/Learning Rate": 4.869674547372504e-05, "Pretrain/Loss": 2.1324405670166016, "Pretrain/Loss (Raw)": 2.2035300731658936, "Pretrain/Step": 1241, "Pretrain/Step Time": 8.058823892846704} +{"Pretrain/Learning Rate": 4.8694038742901646e-05, "Pretrain/Loss": 2.131941795349121, "Pretrain/Loss (Raw)": 2.1377131938934326, "Pretrain/Step": 1242, "Pretrain/Step Time": 8.050587892532349} +{"Pretrain/Learning Rate": 4.869132927957007e-05, "Pretrain/Loss": 2.1321487426757812, "Pretrain/Loss (Raw)": 2.22724986076355, "Pretrain/Step": 1243, "Pretrain/Step Time": 8.05532538332045} +{"Pretrain/Learning Rate": 4.868861708404275e-05, "Pretrain/Loss": 2.1310863494873047, "Pretrain/Loss (Raw)": 1.9892762899398804, "Pretrain/Step": 1244, "Pretrain/Step Time": 8.054668860509992} +{"Pretrain/Learning Rate": 4.868590215663248e-05, "Pretrain/Loss": 2.1318459510803223, "Pretrain/Loss (Raw)": 2.2418439388275146, "Pretrain/Step": 1245, "Pretrain/Step Time": 8.054880315437913} +{"Pretrain/Learning Rate": 4.8683184497652366e-05, "Pretrain/Loss": 2.1330177783966064, "Pretrain/Loss (Raw)": 2.2367045879364014, "Pretrain/Step": 1246, "Pretrain/Step Time": 8.05622454546392} +{"Pretrain/Learning Rate": 4.868046410741582e-05, "Pretrain/Loss": 2.130802631378174, "Pretrain/Loss (Raw)": 1.937562346458435, "Pretrain/Step": 1247, "Pretrain/Step Time": 8.057256599888206} +{"Pretrain/Learning Rate": 4.867774098623657e-05, "Pretrain/Loss": 2.130308151245117, "Pretrain/Loss (Raw)": 2.059922933578491, "Pretrain/Step": 1248, "Pretrain/Step Time": 8.05493026226759} +{"Pretrain/Learning Rate": 4.8675015134428654e-05, "Pretrain/Loss": 2.1317901611328125, "Pretrain/Loss (Raw)": 2.1391608715057373, "Pretrain/Step": 1249, "Pretrain/Step Time": 8.056234907358885} +{"Pretrain/Learning Rate": 4.867228655230643e-05, "Pretrain/Loss": 2.1320011615753174, "Pretrain/Loss (Raw)": 2.0820395946502686, "Pretrain/Step": 1250, "Pretrain/Step Time": 8.056851457804441} +{"Pretrain/Learning Rate": 4.866955524018457e-05, "Pretrain/Loss": 2.13106632232666, "Pretrain/Loss (Raw)": 2.079019069671631, "Pretrain/Step": 1251, "Pretrain/Step Time": 8.045186031609774} +{"Pretrain/Learning Rate": 4.866682119837807e-05, "Pretrain/Loss": 2.1306166648864746, "Pretrain/Loss (Raw)": 2.1187503337860107, "Pretrain/Step": 1252, "Pretrain/Step Time": 8.057089200243354} +{"Pretrain/Learning Rate": 4.866408442720223e-05, "Pretrain/Loss": 2.1299378871917725, "Pretrain/Loss (Raw)": 2.064594030380249, "Pretrain/Step": 1253, "Pretrain/Step Time": 8.059917679056525} +{"Pretrain/Learning Rate": 4.8661344926972666e-05, "Pretrain/Loss": 2.129660129547119, "Pretrain/Loss (Raw)": 2.0948896408081055, "Pretrain/Step": 1254, "Pretrain/Step Time": 8.056294567883015} +{"Pretrain/Learning Rate": 4.8658602698005294e-05, "Pretrain/Loss": 2.1301560401916504, "Pretrain/Loss (Raw)": 2.1300699710845947, "Pretrain/Step": 1255, "Pretrain/Step Time": 8.058590916916728} +{"Pretrain/Learning Rate": 4.8655857740616395e-05, "Pretrain/Loss": 2.129572629928589, "Pretrain/Loss (Raw)": 2.0321133136749268, "Pretrain/Step": 1256, "Pretrain/Step Time": 8.052129341289401} +{"Pretrain/Learning Rate": 4.8653110055122496e-05, "Pretrain/Loss": 2.129631757736206, "Pretrain/Loss (Raw)": 1.9732482433319092, "Pretrain/Step": 1257, "Pretrain/Step Time": 8.05496665649116} +{"Pretrain/Learning Rate": 4.8650359641840495e-05, "Pretrain/Loss": 2.128835916519165, "Pretrain/Loss (Raw)": 2.109053134918213, "Pretrain/Step": 1258, "Pretrain/Step Time": 8.054996222257614} +{"Pretrain/Learning Rate": 4.864760650108758e-05, "Pretrain/Loss": 2.1270737648010254, "Pretrain/Loss (Raw)": 2.0098793506622314, "Pretrain/Step": 1259, "Pretrain/Step Time": 8.053847325965762} +{"Pretrain/Learning Rate": 4.864485063318125e-05, "Pretrain/Loss": 2.1258175373077393, "Pretrain/Loss (Raw)": 2.1702582836151123, "Pretrain/Step": 1260, "Pretrain/Step Time": 8.056276692077518} +{"Pretrain/Learning Rate": 4.864209203843932e-05, "Pretrain/Loss": 2.1248865127563477, "Pretrain/Loss (Raw)": 2.111821174621582, "Pretrain/Step": 1261, "Pretrain/Step Time": 8.05965430662036} +{"Pretrain/Learning Rate": 4.8639330717179946e-05, "Pretrain/Loss": 2.124472141265869, "Pretrain/Loss (Raw)": 2.0063693523406982, "Pretrain/Step": 1262, "Pretrain/Step Time": 8.05998032912612} +{"Pretrain/Learning Rate": 4.863656666972154e-05, "Pretrain/Loss": 2.125046730041504, "Pretrain/Loss (Raw)": 2.12095046043396, "Pretrain/Step": 1263, "Pretrain/Step Time": 8.059153350070119} +{"Pretrain/Learning Rate": 4.86337998963829e-05, "Pretrain/Loss": 2.1245667934417725, "Pretrain/Loss (Raw)": 2.0895895957946777, "Pretrain/Step": 1264, "Pretrain/Step Time": 8.06454361230135} +{"Pretrain/Learning Rate": 4.863103039748309e-05, "Pretrain/Loss": 2.1272411346435547, "Pretrain/Loss (Raw)": 2.3537259101867676, "Pretrain/Step": 1265, "Pretrain/Step Time": 8.056312285363674} +{"Pretrain/Learning Rate": 4.86282581733415e-05, "Pretrain/Loss": 2.1280879974365234, "Pretrain/Loss (Raw)": 2.320213556289673, "Pretrain/Step": 1266, "Pretrain/Step Time": 8.056214835494757} +{"Pretrain/Learning Rate": 4.8625483224277835e-05, "Pretrain/Loss": 2.1288814544677734, "Pretrain/Loss (Raw)": 2.1193747520446777, "Pretrain/Step": 1267, "Pretrain/Step Time": 8.061419880017638} +{"Pretrain/Learning Rate": 4.8622705550612126e-05, "Pretrain/Loss": 2.1301486492156982, "Pretrain/Loss (Raw)": 2.292673349380493, "Pretrain/Step": 1268, "Pretrain/Step Time": 8.060488913208246} +{"Pretrain/Learning Rate": 4.861992515266469e-05, "Pretrain/Loss": 2.1295933723449707, "Pretrain/Loss (Raw)": 2.012451648712158, "Pretrain/Step": 1269, "Pretrain/Step Time": 8.061678690835834} +{"Pretrain/Learning Rate": 4.8617142030756194e-05, "Pretrain/Loss": 2.1290602684020996, "Pretrain/Loss (Raw)": 2.1077234745025635, "Pretrain/Step": 1270, "Pretrain/Step Time": 8.062757382169366} +{"Pretrain/Learning Rate": 4.8614356185207575e-05, "Pretrain/Loss": 2.1286113262176514, "Pretrain/Loss (Raw)": 2.170358180999756, "Pretrain/Step": 1271, "Pretrain/Step Time": 8.068088496103883} +{"Pretrain/Learning Rate": 4.861156761634014e-05, "Pretrain/Loss": 2.1272358894348145, "Pretrain/Loss (Raw)": 2.11743426322937, "Pretrain/Step": 1272, "Pretrain/Step Time": 8.069107865914702} +{"Pretrain/Learning Rate": 4.860877632447546e-05, "Pretrain/Loss": 2.1278085708618164, "Pretrain/Loss (Raw)": 2.275122880935669, "Pretrain/Step": 1273, "Pretrain/Step Time": 8.072328304871917} +{"Pretrain/Learning Rate": 4.8605982309935446e-05, "Pretrain/Loss": 2.1265769004821777, "Pretrain/Loss (Raw)": 2.082502841949463, "Pretrain/Step": 1274, "Pretrain/Step Time": 8.07198191806674} +{"Pretrain/Learning Rate": 4.860318557304232e-05, "Pretrain/Loss": 2.12528920173645, "Pretrain/Loss (Raw)": 1.9951984882354736, "Pretrain/Step": 1275, "Pretrain/Step Time": 8.07323369383812} +{"Pretrain/Learning Rate": 4.860038611411861e-05, "Pretrain/Loss": 2.1254122257232666, "Pretrain/Loss (Raw)": 2.1796083450317383, "Pretrain/Step": 1276, "Pretrain/Step Time": 8.076876109465957} +{"Pretrain/Learning Rate": 4.8597583933487165e-05, "Pretrain/Loss": 2.125889778137207, "Pretrain/Loss (Raw)": 2.2244064807891846, "Pretrain/Step": 1277, "Pretrain/Step Time": 8.072475410997868} +{"Pretrain/Learning Rate": 4.859477903147115e-05, "Pretrain/Loss": 2.128392219543457, "Pretrain/Loss (Raw)": 2.329286813735962, "Pretrain/Step": 1278, "Pretrain/Step Time": 8.072773840278387} +{"Pretrain/Learning Rate": 4.8591971408394034e-05, "Pretrain/Loss": 2.127401828765869, "Pretrain/Loss (Raw)": 2.1111526489257812, "Pretrain/Step": 1279, "Pretrain/Step Time": 8.076342107728124} +{"Pretrain/Learning Rate": 4.85891610645796e-05, "Pretrain/Loss": 2.1287384033203125, "Pretrain/Loss (Raw)": 2.2353508472442627, "Pretrain/Step": 1280, "Pretrain/Step Time": 8.076506907120347} +{"Pretrain/Learning Rate": 4.8586348000351956e-05, "Pretrain/Loss": 2.1278445720672607, "Pretrain/Loss (Raw)": 2.077960729598999, "Pretrain/Step": 1281, "Pretrain/Step Time": 8.077049830928445} +{"Pretrain/Learning Rate": 4.8583532216035524e-05, "Pretrain/Loss": 2.1276371479034424, "Pretrain/Loss (Raw)": 2.0689949989318848, "Pretrain/Step": 1282, "Pretrain/Step Time": 8.075805382803082} +{"Pretrain/Learning Rate": 4.858071371195502e-05, "Pretrain/Loss": 2.13075852394104, "Pretrain/Loss (Raw)": 2.320011615753174, "Pretrain/Step": 1283, "Pretrain/Step Time": 8.07737197354436} +{"Pretrain/Learning Rate": 4.8577892488435504e-05, "Pretrain/Loss": 2.131194591522217, "Pretrain/Loss (Raw)": 2.1228647232055664, "Pretrain/Step": 1284, "Pretrain/Step Time": 8.076463606208563} +{"Pretrain/Learning Rate": 4.8575068545802316e-05, "Pretrain/Loss": 2.130154609680176, "Pretrain/Loss (Raw)": 2.0969791412353516, "Pretrain/Step": 1285, "Pretrain/Step Time": 8.082025401294231} +{"Pretrain/Learning Rate": 4.8572241884381145e-05, "Pretrain/Loss": 2.1303043365478516, "Pretrain/Loss (Raw)": 2.138047695159912, "Pretrain/Step": 1286, "Pretrain/Step Time": 8.079783473163843} +{"Pretrain/Learning Rate": 4.856941250449795e-05, "Pretrain/Loss": 2.1295816898345947, "Pretrain/Loss (Raw)": 2.0025601387023926, "Pretrain/Step": 1287, "Pretrain/Step Time": 8.074181448668242} +{"Pretrain/Learning Rate": 4.8566580406479045e-05, "Pretrain/Loss": 2.128781795501709, "Pretrain/Loss (Raw)": 2.1937191486358643, "Pretrain/Step": 1288, "Pretrain/Step Time": 8.076086297631264} +{"Pretrain/Learning Rate": 4.856374559065104e-05, "Pretrain/Loss": 2.1303672790527344, "Pretrain/Loss (Raw)": 2.1925859451293945, "Pretrain/Step": 1289, "Pretrain/Step Time": 8.072472648695111} +{"Pretrain/Learning Rate": 4.856090805734086e-05, "Pretrain/Loss": 2.1291251182556152, "Pretrain/Loss (Raw)": 2.0650382041931152, "Pretrain/Step": 1290, "Pretrain/Step Time": 8.077432189136744} +{"Pretrain/Learning Rate": 4.855806780687574e-05, "Pretrain/Loss": 2.1274824142456055, "Pretrain/Loss (Raw)": 2.101605176925659, "Pretrain/Step": 1291, "Pretrain/Step Time": 8.07811600342393} +{"Pretrain/Learning Rate": 4.8555224839583236e-05, "Pretrain/Loss": 2.1289491653442383, "Pretrain/Loss (Raw)": 2.2256548404693604, "Pretrain/Step": 1292, "Pretrain/Step Time": 8.073727065697312} +{"Pretrain/Learning Rate": 4.8552379155791194e-05, "Pretrain/Loss": 2.1283602714538574, "Pretrain/Loss (Raw)": 2.083353281021118, "Pretrain/Step": 1293, "Pretrain/Step Time": 8.07243357412517} +{"Pretrain/Learning Rate": 4.854953075582782e-05, "Pretrain/Loss": 2.1296119689941406, "Pretrain/Loss (Raw)": 2.200028657913208, "Pretrain/Step": 1294, "Pretrain/Step Time": 8.06588913500309} +{"Pretrain/Learning Rate": 4.854667964002158e-05, "Pretrain/Loss": 2.1287293434143066, "Pretrain/Loss (Raw)": 2.1022491455078125, "Pretrain/Step": 1295, "Pretrain/Step Time": 8.0758633967489} +{"Pretrain/Learning Rate": 4.8543825808701294e-05, "Pretrain/Loss": 2.1300439834594727, "Pretrain/Loss (Raw)": 2.11601185798645, "Pretrain/Step": 1296, "Pretrain/Step Time": 8.06997450813651} +{"Pretrain/Learning Rate": 4.854096926219607e-05, "Pretrain/Loss": 2.1285595893859863, "Pretrain/Loss (Raw)": 2.1879072189331055, "Pretrain/Step": 1297, "Pretrain/Step Time": 8.065744154155254} +{"Pretrain/Learning Rate": 4.853811000083535e-05, "Pretrain/Loss": 2.1283535957336426, "Pretrain/Loss (Raw)": 2.0107481479644775, "Pretrain/Step": 1298, "Pretrain/Step Time": 8.072951992973685} +{"Pretrain/Learning Rate": 4.8535248024948854e-05, "Pretrain/Loss": 2.128068447113037, "Pretrain/Loss (Raw)": 2.102478265762329, "Pretrain/Step": 1299, "Pretrain/Step Time": 8.067631516605616} +{"Pretrain/Learning Rate": 4.853238333486666e-05, "Pretrain/Loss": 2.128037929534912, "Pretrain/Loss (Raw)": 2.1180026531219482, "Pretrain/Step": 1300, "Pretrain/Step Time": 8.07334890589118} +{"Pretrain/Learning Rate": 4.852951593091914e-05, "Pretrain/Loss": 2.129085063934326, "Pretrain/Loss (Raw)": 2.185594081878662, "Pretrain/Step": 1301, "Pretrain/Step Time": 8.069537922739983} +{"Pretrain/Learning Rate": 4.852664581343696e-05, "Pretrain/Loss": 2.130084753036499, "Pretrain/Loss (Raw)": 2.229705572128296, "Pretrain/Step": 1302, "Pretrain/Step Time": 8.065998708829284} +{"Pretrain/Learning Rate": 4.852377298275113e-05, "Pretrain/Loss": 2.1307830810546875, "Pretrain/Loss (Raw)": 2.2157576084136963, "Pretrain/Step": 1303, "Pretrain/Step Time": 8.059204705059528} +{"Pretrain/Learning Rate": 4.852089743919295e-05, "Pretrain/Loss": 2.1332736015319824, "Pretrain/Loss (Raw)": 2.210900068283081, "Pretrain/Step": 1304, "Pretrain/Step Time": 8.068271996453404} +{"Pretrain/Learning Rate": 4.851801918309403e-05, "Pretrain/Loss": 2.1355371475219727, "Pretrain/Loss (Raw)": 2.3019514083862305, "Pretrain/Step": 1305, "Pretrain/Step Time": 8.070897674188018} +{"Pretrain/Learning Rate": 4.8515138214786335e-05, "Pretrain/Loss": 2.136064291000366, "Pretrain/Loss (Raw)": 2.155470609664917, "Pretrain/Step": 1306, "Pretrain/Step Time": 8.05885792709887} +{"Pretrain/Learning Rate": 4.851225453460209e-05, "Pretrain/Loss": 2.135108232498169, "Pretrain/Loss (Raw)": 2.09149169921875, "Pretrain/Step": 1307, "Pretrain/Step Time": 8.066593740135431} +{"Pretrain/Learning Rate": 4.850936814287386e-05, "Pretrain/Loss": 2.135648250579834, "Pretrain/Loss (Raw)": 2.1837844848632812, "Pretrain/Step": 1308, "Pretrain/Step Time": 8.059533979743719} +{"Pretrain/Learning Rate": 4.85064790399345e-05, "Pretrain/Loss": 2.1370766162872314, "Pretrain/Loss (Raw)": 2.280496120452881, "Pretrain/Step": 1309, "Pretrain/Step Time": 8.065040711313486} +{"Pretrain/Learning Rate": 4.850358722611723e-05, "Pretrain/Loss": 2.138448715209961, "Pretrain/Loss (Raw)": 2.307558536529541, "Pretrain/Step": 1310, "Pretrain/Step Time": 8.061616199091077} +{"Pretrain/Learning Rate": 4.850069270175552e-05, "Pretrain/Loss": 2.138697385787964, "Pretrain/Loss (Raw)": 2.1385533809661865, "Pretrain/Step": 1311, "Pretrain/Step Time": 8.063050573691726} +{"Pretrain/Learning Rate": 4.849779546718319e-05, "Pretrain/Loss": 2.1375961303710938, "Pretrain/Loss (Raw)": 2.1875791549682617, "Pretrain/Step": 1312, "Pretrain/Step Time": 8.068036586046219} +{"Pretrain/Learning Rate": 4.8494895522734364e-05, "Pretrain/Loss": 2.139500856399536, "Pretrain/Loss (Raw)": 2.306178092956543, "Pretrain/Step": 1313, "Pretrain/Step Time": 8.067276570945978} +{"Pretrain/Learning Rate": 4.849199286874347e-05, "Pretrain/Loss": 2.139626979827881, "Pretrain/Loss (Raw)": 2.0750274658203125, "Pretrain/Step": 1314, "Pretrain/Step Time": 8.068705033510923} +{"Pretrain/Learning Rate": 4.8489087505545266e-05, "Pretrain/Loss": 2.1392157077789307, "Pretrain/Loss (Raw)": 2.0866100788116455, "Pretrain/Step": 1315, "Pretrain/Step Time": 8.060651954263449} +{"Pretrain/Learning Rate": 4.84861794334748e-05, "Pretrain/Loss": 2.1364946365356445, "Pretrain/Loss (Raw)": 2.027012348175049, "Pretrain/Step": 1316, "Pretrain/Step Time": 8.06956871971488} +{"Pretrain/Learning Rate": 4.848326865286746e-05, "Pretrain/Loss": 2.1369662284851074, "Pretrain/Loss (Raw)": 2.1400089263916016, "Pretrain/Step": 1317, "Pretrain/Step Time": 8.068039426580071} +{"Pretrain/Learning Rate": 4.848035516405892e-05, "Pretrain/Loss": 2.1381638050079346, "Pretrain/Loss (Raw)": 2.1638295650482178, "Pretrain/Step": 1318, "Pretrain/Step Time": 8.07304229773581} +{"Pretrain/Learning Rate": 4.847743896738517e-05, "Pretrain/Loss": 2.1383213996887207, "Pretrain/Loss (Raw)": 2.1571803092956543, "Pretrain/Step": 1319, "Pretrain/Step Time": 8.069967065006495} +{"Pretrain/Learning Rate": 4.847452006318254e-05, "Pretrain/Loss": 2.135080337524414, "Pretrain/Loss (Raw)": 2.0367376804351807, "Pretrain/Step": 1320, "Pretrain/Step Time": 8.05661610327661} +{"Pretrain/Learning Rate": 4.8471598451787635e-05, "Pretrain/Loss": 2.1325337886810303, "Pretrain/Loss (Raw)": 2.0347208976745605, "Pretrain/Step": 1321, "Pretrain/Step Time": 8.059252232313156} +{"Pretrain/Learning Rate": 4.8468674133537395e-05, "Pretrain/Loss": 2.1335701942443848, "Pretrain/Loss (Raw)": 2.1729276180267334, "Pretrain/Step": 1322, "Pretrain/Step Time": 8.055442215874791} +{"Pretrain/Learning Rate": 4.846574710876907e-05, "Pretrain/Loss": 2.1336090564727783, "Pretrain/Loss (Raw)": 2.0821969509124756, "Pretrain/Step": 1323, "Pretrain/Step Time": 8.061463495716453} +{"Pretrain/Learning Rate": 4.846281737782021e-05, "Pretrain/Loss": 2.13191819190979, "Pretrain/Loss (Raw)": 1.9215646982192993, "Pretrain/Step": 1324, "Pretrain/Step Time": 8.056267838925123} +{"Pretrain/Learning Rate": 4.845988494102869e-05, "Pretrain/Loss": 2.13175106048584, "Pretrain/Loss (Raw)": 2.01131534576416, "Pretrain/Step": 1325, "Pretrain/Step Time": 8.058423481881618} +{"Pretrain/Learning Rate": 4.845694979873269e-05, "Pretrain/Loss": 2.131549835205078, "Pretrain/Loss (Raw)": 2.152156352996826, "Pretrain/Step": 1326, "Pretrain/Step Time": 8.05725414864719} +{"Pretrain/Learning Rate": 4.845401195127071e-05, "Pretrain/Loss": 2.132025718688965, "Pretrain/Loss (Raw)": 2.1178414821624756, "Pretrain/Step": 1327, "Pretrain/Step Time": 8.058523239567876} +{"Pretrain/Learning Rate": 4.845107139898155e-05, "Pretrain/Loss": 2.132070541381836, "Pretrain/Loss (Raw)": 2.1945278644561768, "Pretrain/Step": 1328, "Pretrain/Step Time": 8.060036703944206} +{"Pretrain/Learning Rate": 4.8448128142204334e-05, "Pretrain/Loss": 2.1331355571746826, "Pretrain/Loss (Raw)": 2.1881628036499023, "Pretrain/Step": 1329, "Pretrain/Step Time": 8.060559211298823} +{"Pretrain/Learning Rate": 4.8445182181278494e-05, "Pretrain/Loss": 2.13210391998291, "Pretrain/Loss (Raw)": 1.975022315979004, "Pretrain/Step": 1330, "Pretrain/Step Time": 8.06487420015037} +{"Pretrain/Learning Rate": 4.8442233516543756e-05, "Pretrain/Loss": 2.1323838233947754, "Pretrain/Loss (Raw)": 2.1370060443878174, "Pretrain/Step": 1331, "Pretrain/Step Time": 8.063962547108531} +{"Pretrain/Learning Rate": 4.8439282148340195e-05, "Pretrain/Loss": 2.1330416202545166, "Pretrain/Loss (Raw)": 2.176379919052124, "Pretrain/Step": 1332, "Pretrain/Step Time": 8.056842349469662} +{"Pretrain/Learning Rate": 4.843632807700816e-05, "Pretrain/Loss": 2.135427713394165, "Pretrain/Loss (Raw)": 2.2198994159698486, "Pretrain/Step": 1333, "Pretrain/Step Time": 8.061927646398544} +{"Pretrain/Learning Rate": 4.843337130288834e-05, "Pretrain/Loss": 2.1362380981445312, "Pretrain/Loss (Raw)": 2.2958316802978516, "Pretrain/Step": 1334, "Pretrain/Step Time": 8.055935863405466} +{"Pretrain/Learning Rate": 4.843041182632172e-05, "Pretrain/Loss": 2.1341447830200195, "Pretrain/Loss (Raw)": 2.0965161323547363, "Pretrain/Step": 1335, "Pretrain/Step Time": 8.059108532965183} +{"Pretrain/Learning Rate": 4.84274496476496e-05, "Pretrain/Loss": 2.134636402130127, "Pretrain/Loss (Raw)": 2.1185951232910156, "Pretrain/Step": 1336, "Pretrain/Step Time": 8.052103638648987} +{"Pretrain/Learning Rate": 4.84244847672136e-05, "Pretrain/Loss": 2.134986162185669, "Pretrain/Loss (Raw)": 2.169548749923706, "Pretrain/Step": 1337, "Pretrain/Step Time": 8.058439645916224} +{"Pretrain/Learning Rate": 4.842151718535563e-05, "Pretrain/Loss": 2.1339306831359863, "Pretrain/Loss (Raw)": 2.0277981758117676, "Pretrain/Step": 1338, "Pretrain/Step Time": 8.060949699953198} +{"Pretrain/Learning Rate": 4.841854690241793e-05, "Pretrain/Loss": 2.135364294052124, "Pretrain/Loss (Raw)": 2.3247017860412598, "Pretrain/Step": 1339, "Pretrain/Step Time": 8.060164012014866} +{"Pretrain/Learning Rate": 4.841557391874304e-05, "Pretrain/Loss": 2.1364941596984863, "Pretrain/Loss (Raw)": 2.133434295654297, "Pretrain/Step": 1340, "Pretrain/Step Time": 8.067352084442973} +{"Pretrain/Learning Rate": 4.8412598234673845e-05, "Pretrain/Loss": 2.1374404430389404, "Pretrain/Loss (Raw)": 2.1603009700775146, "Pretrain/Step": 1341, "Pretrain/Step Time": 8.054869120940566} +{"Pretrain/Learning Rate": 4.840961985055349e-05, "Pretrain/Loss": 2.1379752159118652, "Pretrain/Loss (Raw)": 2.1487889289855957, "Pretrain/Step": 1342, "Pretrain/Step Time": 8.06464010849595} +{"Pretrain/Learning Rate": 4.8406638766725464e-05, "Pretrain/Loss": 2.137617588043213, "Pretrain/Loss (Raw)": 2.1886165142059326, "Pretrain/Step": 1343, "Pretrain/Step Time": 8.057901741936803} +{"Pretrain/Learning Rate": 4.840365498353357e-05, "Pretrain/Loss": 2.137178421020508, "Pretrain/Loss (Raw)": 2.0984396934509277, "Pretrain/Step": 1344, "Pretrain/Step Time": 8.060003845021129} +{"Pretrain/Learning Rate": 4.840066850132189e-05, "Pretrain/Loss": 2.1367907524108887, "Pretrain/Loss (Raw)": 2.1135408878326416, "Pretrain/Step": 1345, "Pretrain/Step Time": 8.054843751713634} +{"Pretrain/Learning Rate": 4.839767932043485e-05, "Pretrain/Loss": 2.136673927307129, "Pretrain/Loss (Raw)": 2.09155011177063, "Pretrain/Step": 1346, "Pretrain/Step Time": 8.058397985994816} +{"Pretrain/Learning Rate": 4.839468744121718e-05, "Pretrain/Loss": 2.1377086639404297, "Pretrain/Loss (Raw)": 2.1368470191955566, "Pretrain/Step": 1347, "Pretrain/Step Time": 8.060489639639854} +{"Pretrain/Learning Rate": 4.8391692864013916e-05, "Pretrain/Loss": 2.137153387069702, "Pretrain/Loss (Raw)": 2.125159502029419, "Pretrain/Step": 1348, "Pretrain/Step Time": 8.055890226736665} +{"Pretrain/Learning Rate": 4.838869558917041e-05, "Pretrain/Loss": 2.136462926864624, "Pretrain/Loss (Raw)": 2.045681953430176, "Pretrain/Step": 1349, "Pretrain/Step Time": 8.064461728557944} +{"Pretrain/Learning Rate": 4.838569561703231e-05, "Pretrain/Loss": 2.135310173034668, "Pretrain/Loss (Raw)": 2.0735902786254883, "Pretrain/Step": 1350, "Pretrain/Step Time": 8.055694444105029} +{"Pretrain/Learning Rate": 4.83826929479456e-05, "Pretrain/Loss": 2.1380515098571777, "Pretrain/Loss (Raw)": 2.4479820728302, "Pretrain/Step": 1351, "Pretrain/Step Time": 8.060463573783636} +{"Pretrain/Learning Rate": 4.837968758225655e-05, "Pretrain/Loss": 2.138310194015503, "Pretrain/Loss (Raw)": 2.1457252502441406, "Pretrain/Step": 1352, "Pretrain/Step Time": 8.05967271886766} +{"Pretrain/Learning Rate": 4.837667952031176e-05, "Pretrain/Loss": 2.1376380920410156, "Pretrain/Loss (Raw)": 2.0750174522399902, "Pretrain/Step": 1353, "Pretrain/Step Time": 8.060951532796025} +{"Pretrain/Learning Rate": 4.8373668762458144e-05, "Pretrain/Loss": 2.135143756866455, "Pretrain/Loss (Raw)": 2.022703170776367, "Pretrain/Step": 1354, "Pretrain/Step Time": 8.063147952780128} +{"Pretrain/Learning Rate": 4.8370655309042896e-05, "Pretrain/Loss": 2.135366916656494, "Pretrain/Loss (Raw)": 2.0971789360046387, "Pretrain/Step": 1355, "Pretrain/Step Time": 8.064867094159126} +{"Pretrain/Learning Rate": 4.8367639160413553e-05, "Pretrain/Loss": 2.1359877586364746, "Pretrain/Loss (Raw)": 2.1161344051361084, "Pretrain/Step": 1356, "Pretrain/Step Time": 8.063445085659623} +{"Pretrain/Learning Rate": 4.8364620316917956e-05, "Pretrain/Loss": 2.1382083892822266, "Pretrain/Loss (Raw)": 2.230862855911255, "Pretrain/Step": 1357, "Pretrain/Step Time": 8.061414802446961} +{"Pretrain/Learning Rate": 4.836159877890424e-05, "Pretrain/Loss": 2.1386380195617676, "Pretrain/Loss (Raw)": 2.1468255519866943, "Pretrain/Step": 1358, "Pretrain/Step Time": 8.060815956443548} +{"Pretrain/Learning Rate": 4.835857454672087e-05, "Pretrain/Loss": 2.138612747192383, "Pretrain/Loss (Raw)": 2.0899558067321777, "Pretrain/Step": 1359, "Pretrain/Step Time": 8.057112837210298} +{"Pretrain/Learning Rate": 4.835554762071661e-05, "Pretrain/Loss": 2.138054370880127, "Pretrain/Loss (Raw)": 2.1820924282073975, "Pretrain/Step": 1360, "Pretrain/Step Time": 8.05475177615881} +{"Pretrain/Learning Rate": 4.8352518001240555e-05, "Pretrain/Loss": 2.140024185180664, "Pretrain/Loss (Raw)": 2.2187979221343994, "Pretrain/Step": 1361, "Pretrain/Step Time": 8.0610023252666} +{"Pretrain/Learning Rate": 4.834948568864207e-05, "Pretrain/Loss": 2.1378211975097656, "Pretrain/Loss (Raw)": 2.0513572692871094, "Pretrain/Step": 1362, "Pretrain/Step Time": 8.065361248329282} +{"Pretrain/Learning Rate": 4.8346450683270875e-05, "Pretrain/Loss": 2.1393072605133057, "Pretrain/Loss (Raw)": 2.2076199054718018, "Pretrain/Step": 1363, "Pretrain/Step Time": 8.06771749816835} +{"Pretrain/Learning Rate": 4.8343412985476974e-05, "Pretrain/Loss": 2.1389758586883545, "Pretrain/Loss (Raw)": 2.0752320289611816, "Pretrain/Step": 1364, "Pretrain/Step Time": 8.058690216392279} +{"Pretrain/Learning Rate": 4.83403725956107e-05, "Pretrain/Loss": 2.140310525894165, "Pretrain/Loss (Raw)": 2.2007062435150146, "Pretrain/Step": 1365, "Pretrain/Step Time": 8.069288050755858} +{"Pretrain/Learning Rate": 4.8337329514022664e-05, "Pretrain/Loss": 2.1401872634887695, "Pretrain/Loss (Raw)": 2.102207899093628, "Pretrain/Step": 1366, "Pretrain/Step Time": 8.067678643390536} +{"Pretrain/Learning Rate": 4.833428374106382e-05, "Pretrain/Loss": 2.137402057647705, "Pretrain/Loss (Raw)": 2.1072499752044678, "Pretrain/Step": 1367, "Pretrain/Step Time": 8.068377623334527} +{"Pretrain/Learning Rate": 4.833123527708542e-05, "Pretrain/Loss": 2.1389026641845703, "Pretrain/Loss (Raw)": 2.228832721710205, "Pretrain/Step": 1368, "Pretrain/Step Time": 8.070634242147207} +{"Pretrain/Learning Rate": 4.832818412243904e-05, "Pretrain/Loss": 2.1379518508911133, "Pretrain/Loss (Raw)": 2.081815719604492, "Pretrain/Step": 1369, "Pretrain/Step Time": 8.067745506763458} +{"Pretrain/Learning Rate": 4.8325130277476526e-05, "Pretrain/Loss": 2.137693405151367, "Pretrain/Loss (Raw)": 2.1046290397644043, "Pretrain/Step": 1370, "Pretrain/Step Time": 8.066463150084019} +{"Pretrain/Learning Rate": 4.832207374255008e-05, "Pretrain/Loss": 2.1376049518585205, "Pretrain/Loss (Raw)": 2.2159180641174316, "Pretrain/Step": 1371, "Pretrain/Step Time": 8.06534075178206} +{"Pretrain/Learning Rate": 4.8319014518012195e-05, "Pretrain/Loss": 2.138153553009033, "Pretrain/Loss (Raw)": 2.0594916343688965, "Pretrain/Step": 1372, "Pretrain/Step Time": 8.063251420855522} +{"Pretrain/Learning Rate": 4.831595260421567e-05, "Pretrain/Loss": 2.1365270614624023, "Pretrain/Loss (Raw)": 2.033674716949463, "Pretrain/Step": 1373, "Pretrain/Step Time": 8.063847003504634} +{"Pretrain/Learning Rate": 4.8312888001513624e-05, "Pretrain/Loss": 2.134847402572632, "Pretrain/Loss (Raw)": 2.0216822624206543, "Pretrain/Step": 1374, "Pretrain/Step Time": 8.065540863201022} +{"Pretrain/Learning Rate": 4.830982071025948e-05, "Pretrain/Loss": 2.136789321899414, "Pretrain/Loss (Raw)": 2.186103582382202, "Pretrain/Step": 1375, "Pretrain/Step Time": 8.065402783453465} +{"Pretrain/Learning Rate": 4.830675073080697e-05, "Pretrain/Loss": 2.137136936187744, "Pretrain/Loss (Raw)": 2.104461669921875, "Pretrain/Step": 1376, "Pretrain/Step Time": 8.065081031993032} +{"Pretrain/Learning Rate": 4.830367806351015e-05, "Pretrain/Loss": 2.1362857818603516, "Pretrain/Loss (Raw)": 2.030198812484741, "Pretrain/Step": 1377, "Pretrain/Step Time": 8.063875943422318} +{"Pretrain/Learning Rate": 4.830060270872335e-05, "Pretrain/Loss": 2.137352228164673, "Pretrain/Loss (Raw)": 2.2185559272766113, "Pretrain/Step": 1378, "Pretrain/Step Time": 8.066559836268425} +{"Pretrain/Learning Rate": 4.8297524666801265e-05, "Pretrain/Loss": 2.137259006500244, "Pretrain/Loss (Raw)": 2.0670714378356934, "Pretrain/Step": 1379, "Pretrain/Step Time": 8.069806193932891} +{"Pretrain/Learning Rate": 4.829444393809884e-05, "Pretrain/Loss": 2.1377201080322266, "Pretrain/Loss (Raw)": 2.1777987480163574, "Pretrain/Step": 1380, "Pretrain/Step Time": 8.06870792247355} +{"Pretrain/Learning Rate": 4.829136052297138e-05, "Pretrain/Loss": 2.137829303741455, "Pretrain/Loss (Raw)": 2.0785531997680664, "Pretrain/Step": 1381, "Pretrain/Step Time": 8.064131053164601} +{"Pretrain/Learning Rate": 4.828827442177447e-05, "Pretrain/Loss": 2.1382029056549072, "Pretrain/Loss (Raw)": 2.1427090167999268, "Pretrain/Step": 1382, "Pretrain/Step Time": 8.0623867996037} +{"Pretrain/Learning Rate": 4.8285185634864024e-05, "Pretrain/Loss": 2.1386189460754395, "Pretrain/Loss (Raw)": 2.183318853378296, "Pretrain/Step": 1383, "Pretrain/Step Time": 8.059813218191266} +{"Pretrain/Learning Rate": 4.8282094162596235e-05, "Pretrain/Loss": 2.1401448249816895, "Pretrain/Loss (Raw)": 2.22744083404541, "Pretrain/Step": 1384, "Pretrain/Step Time": 8.06970389932394} +{"Pretrain/Learning Rate": 4.8279000005327644e-05, "Pretrain/Loss": 2.1407761573791504, "Pretrain/Loss (Raw)": 2.054032802581787, "Pretrain/Step": 1385, "Pretrain/Step Time": 8.073034273460507} +{"Pretrain/Learning Rate": 4.827590316341508e-05, "Pretrain/Loss": 2.1413497924804688, "Pretrain/Loss (Raw)": 2.1825129985809326, "Pretrain/Step": 1386, "Pretrain/Step Time": 8.06894594244659} +{"Pretrain/Learning Rate": 4.827280363721568e-05, "Pretrain/Loss": 2.1417410373687744, "Pretrain/Loss (Raw)": 2.05993390083313, "Pretrain/Step": 1387, "Pretrain/Step Time": 8.07460823468864} +{"Pretrain/Learning Rate": 4.82697014270869e-05, "Pretrain/Loss": 2.141390800476074, "Pretrain/Loss (Raw)": 2.1254189014434814, "Pretrain/Step": 1388, "Pretrain/Step Time": 8.064592532813549} +{"Pretrain/Learning Rate": 4.8266596533386505e-05, "Pretrain/Loss": 2.1413302421569824, "Pretrain/Loss (Raw)": 2.104094982147217, "Pretrain/Step": 1389, "Pretrain/Step Time": 8.067903256043792} +{"Pretrain/Learning Rate": 4.8263488956472555e-05, "Pretrain/Loss": 2.142106056213379, "Pretrain/Loss (Raw)": 2.1056675910949707, "Pretrain/Step": 1390, "Pretrain/Step Time": 8.070588449016213} +{"Pretrain/Learning Rate": 4.826037869670345e-05, "Pretrain/Loss": 2.142162322998047, "Pretrain/Loss (Raw)": 2.1281538009643555, "Pretrain/Step": 1391, "Pretrain/Step Time": 8.067073760554194} +{"Pretrain/Learning Rate": 4.8257265754437854e-05, "Pretrain/Loss": 2.1432182788848877, "Pretrain/Loss (Raw)": 2.2247440814971924, "Pretrain/Step": 1392, "Pretrain/Step Time": 8.0682922154665} +{"Pretrain/Learning Rate": 4.825415013003478e-05, "Pretrain/Loss": 2.1408257484436035, "Pretrain/Loss (Raw)": 2.0474791526794434, "Pretrain/Step": 1393, "Pretrain/Step Time": 8.069143451750278} +{"Pretrain/Learning Rate": 4.8251031823853546e-05, "Pretrain/Loss": 2.13956356048584, "Pretrain/Loss (Raw)": 2.1586804389953613, "Pretrain/Step": 1394, "Pretrain/Step Time": 8.07422187179327} +{"Pretrain/Learning Rate": 4.824791083625375e-05, "Pretrain/Loss": 2.140671730041504, "Pretrain/Loss (Raw)": 2.2611987590789795, "Pretrain/Step": 1395, "Pretrain/Step Time": 8.065352641046047} +{"Pretrain/Learning Rate": 4.8244787167595335e-05, "Pretrain/Loss": 2.140620708465576, "Pretrain/Loss (Raw)": 2.286125421524048, "Pretrain/Step": 1396, "Pretrain/Step Time": 8.070134038105607} +{"Pretrain/Learning Rate": 4.824166081823853e-05, "Pretrain/Loss": 2.140608787536621, "Pretrain/Loss (Raw)": 2.0109567642211914, "Pretrain/Step": 1397, "Pretrain/Step Time": 8.065959263592958} +{"Pretrain/Learning Rate": 4.823853178854387e-05, "Pretrain/Loss": 2.1397411823272705, "Pretrain/Loss (Raw)": 1.9966503381729126, "Pretrain/Step": 1398, "Pretrain/Step Time": 8.06856414489448} +{"Pretrain/Learning Rate": 4.8235400078872234e-05, "Pretrain/Loss": 2.1394386291503906, "Pretrain/Loss (Raw)": 2.1316304206848145, "Pretrain/Step": 1399, "Pretrain/Step Time": 8.069700745865703} +{"Pretrain/Learning Rate": 4.823226568958477e-05, "Pretrain/Loss": 2.139690399169922, "Pretrain/Loss (Raw)": 2.1496450901031494, "Pretrain/Step": 1400, "Pretrain/Step Time": 8.06424537859857} +{"Pretrain/Learning Rate": 4.822912862104295e-05, "Pretrain/Loss": 2.1387939453125, "Pretrain/Loss (Raw)": 2.160384178161621, "Pretrain/Step": 1401, "Pretrain/Step Time": 8.06750387698412} +{"Pretrain/Learning Rate": 4.8225988873608554e-05, "Pretrain/Loss": 2.139090061187744, "Pretrain/Loss (Raw)": 2.1204075813293457, "Pretrain/Step": 1402, "Pretrain/Step Time": 8.061362937092781} +{"Pretrain/Learning Rate": 4.8222846447643686e-05, "Pretrain/Loss": 2.141037940979004, "Pretrain/Loss (Raw)": 2.244537115097046, "Pretrain/Step": 1403, "Pretrain/Step Time": 8.062337597832084} +{"Pretrain/Learning Rate": 4.8219701343510727e-05, "Pretrain/Loss": 2.1415627002716064, "Pretrain/Loss (Raw)": 2.246758222579956, "Pretrain/Step": 1404, "Pretrain/Step Time": 8.063080022111535} +{"Pretrain/Learning Rate": 4.8216553561572395e-05, "Pretrain/Loss": 2.1415200233459473, "Pretrain/Loss (Raw)": 2.2189624309539795, "Pretrain/Step": 1405, "Pretrain/Step Time": 8.06010303273797} +{"Pretrain/Learning Rate": 4.821340310219171e-05, "Pretrain/Loss": 2.140421152114868, "Pretrain/Loss (Raw)": 2.188631534576416, "Pretrain/Step": 1406, "Pretrain/Step Time": 8.066342314705253} +{"Pretrain/Learning Rate": 4.8210249965732e-05, "Pretrain/Loss": 2.14017915725708, "Pretrain/Loss (Raw)": 2.080206871032715, "Pretrain/Step": 1407, "Pretrain/Step Time": 8.058548498898745} +{"Pretrain/Learning Rate": 4.8207094152556886e-05, "Pretrain/Loss": 2.1391055583953857, "Pretrain/Loss (Raw)": 2.0978991985321045, "Pretrain/Step": 1408, "Pretrain/Step Time": 8.06456913240254} +{"Pretrain/Learning Rate": 4.820393566303032e-05, "Pretrain/Loss": 2.140292167663574, "Pretrain/Loss (Raw)": 2.2298455238342285, "Pretrain/Step": 1409, "Pretrain/Step Time": 8.067023579031229} +{"Pretrain/Learning Rate": 4.8200774497516555e-05, "Pretrain/Loss": 2.1422276496887207, "Pretrain/Loss (Raw)": 2.316741943359375, "Pretrain/Step": 1410, "Pretrain/Step Time": 8.062533477321267} +{"Pretrain/Learning Rate": 4.8197610656380144e-05, "Pretrain/Loss": 2.1420605182647705, "Pretrain/Loss (Raw)": 2.2986104488372803, "Pretrain/Step": 1411, "Pretrain/Step Time": 8.063355140388012} +{"Pretrain/Learning Rate": 4.8194444139985965e-05, "Pretrain/Loss": 2.141371965408325, "Pretrain/Loss (Raw)": 2.0347368717193604, "Pretrain/Step": 1412, "Pretrain/Step Time": 8.063110379502177} +{"Pretrain/Learning Rate": 4.81912749486992e-05, "Pretrain/Loss": 2.1407876014709473, "Pretrain/Loss (Raw)": 2.022188663482666, "Pretrain/Step": 1413, "Pretrain/Step Time": 8.066953428089619} +{"Pretrain/Learning Rate": 4.818810308288531e-05, "Pretrain/Loss": 2.1407816410064697, "Pretrain/Loss (Raw)": 2.1372601985931396, "Pretrain/Step": 1414, "Pretrain/Step Time": 8.062105536460876} +{"Pretrain/Learning Rate": 4.818492854291012e-05, "Pretrain/Loss": 2.1418447494506836, "Pretrain/Loss (Raw)": 2.1386537551879883, "Pretrain/Step": 1415, "Pretrain/Step Time": 8.06206283159554} +{"Pretrain/Learning Rate": 4.818175132913971e-05, "Pretrain/Loss": 2.140801429748535, "Pretrain/Loss (Raw)": 2.0601654052734375, "Pretrain/Step": 1416, "Pretrain/Step Time": 8.058708285912871} +{"Pretrain/Learning Rate": 4.817857144194051e-05, "Pretrain/Loss": 2.140636682510376, "Pretrain/Loss (Raw)": 2.171506404876709, "Pretrain/Step": 1417, "Pretrain/Step Time": 8.05824864283204} +{"Pretrain/Learning Rate": 4.817538888167923e-05, "Pretrain/Loss": 2.1416327953338623, "Pretrain/Loss (Raw)": 2.192549228668213, "Pretrain/Step": 1418, "Pretrain/Step Time": 8.059465445578098} +{"Pretrain/Learning Rate": 4.817220364872289e-05, "Pretrain/Loss": 2.1418232917785645, "Pretrain/Loss (Raw)": 2.125994920730591, "Pretrain/Step": 1419, "Pretrain/Step Time": 8.052811311557889} +{"Pretrain/Learning Rate": 4.816901574343884e-05, "Pretrain/Loss": 2.140077829360962, "Pretrain/Loss (Raw)": 2.0022175312042236, "Pretrain/Step": 1420, "Pretrain/Step Time": 8.058842049911618} +{"Pretrain/Learning Rate": 4.816582516619471e-05, "Pretrain/Loss": 2.140317440032959, "Pretrain/Loss (Raw)": 2.114011287689209, "Pretrain/Step": 1421, "Pretrain/Step Time": 8.056857902556658} +{"Pretrain/Learning Rate": 4.816263191735847e-05, "Pretrain/Loss": 2.1403141021728516, "Pretrain/Loss (Raw)": 2.199631452560425, "Pretrain/Step": 1422, "Pretrain/Step Time": 8.059591045603156} +{"Pretrain/Learning Rate": 4.8159435997298375e-05, "Pretrain/Loss": 2.139585018157959, "Pretrain/Loss (Raw)": 2.0089006423950195, "Pretrain/Step": 1423, "Pretrain/Step Time": 8.058941749855876} +{"Pretrain/Learning Rate": 4.8156237406382975e-05, "Pretrain/Loss": 2.140552282333374, "Pretrain/Loss (Raw)": 2.239823341369629, "Pretrain/Step": 1424, "Pretrain/Step Time": 8.05549143999815} +{"Pretrain/Learning Rate": 4.815303614498118e-05, "Pretrain/Loss": 2.140103578567505, "Pretrain/Loss (Raw)": 2.130479335784912, "Pretrain/Step": 1425, "Pretrain/Step Time": 8.067630145698786} +{"Pretrain/Learning Rate": 4.814983221346214e-05, "Pretrain/Loss": 2.140852928161621, "Pretrain/Loss (Raw)": 2.1066837310791016, "Pretrain/Step": 1426, "Pretrain/Step Time": 8.062921347096562} +{"Pretrain/Learning Rate": 4.814662561219537e-05, "Pretrain/Loss": 2.1410775184631348, "Pretrain/Loss (Raw)": 2.1312096118927, "Pretrain/Step": 1427, "Pretrain/Step Time": 8.069950258359313} +{"Pretrain/Learning Rate": 4.814341634155066e-05, "Pretrain/Loss": 2.1420633792877197, "Pretrain/Loss (Raw)": 2.2441959381103516, "Pretrain/Step": 1428, "Pretrain/Step Time": 8.060843845829368} +{"Pretrain/Learning Rate": 4.8140204401898134e-05, "Pretrain/Loss": 2.1411619186401367, "Pretrain/Loss (Raw)": 2.070200204849243, "Pretrain/Step": 1429, "Pretrain/Step Time": 8.063700649887323} +{"Pretrain/Learning Rate": 4.813698979360819e-05, "Pretrain/Loss": 2.1401467323303223, "Pretrain/Loss (Raw)": 2.09975266456604, "Pretrain/Step": 1430, "Pretrain/Step Time": 8.063889235258102} +{"Pretrain/Learning Rate": 4.813377251705156e-05, "Pretrain/Loss": 2.1402130126953125, "Pretrain/Loss (Raw)": 2.2242398262023926, "Pretrain/Step": 1431, "Pretrain/Step Time": 8.069735640659928} +{"Pretrain/Learning Rate": 4.8130552572599265e-05, "Pretrain/Loss": 2.139435291290283, "Pretrain/Loss (Raw)": 2.111370086669922, "Pretrain/Step": 1432, "Pretrain/Step Time": 8.069483283907175} +{"Pretrain/Learning Rate": 4.8127329960622656e-05, "Pretrain/Loss": 2.136995315551758, "Pretrain/Loss (Raw)": 1.9896295070648193, "Pretrain/Step": 1433, "Pretrain/Step Time": 8.059613890945911} +{"Pretrain/Learning Rate": 4.8124104681493375e-05, "Pretrain/Loss": 2.1363773345947266, "Pretrain/Loss (Raw)": 2.0763843059539795, "Pretrain/Step": 1434, "Pretrain/Step Time": 8.067585412412882} +{"Pretrain/Learning Rate": 4.8120876735583384e-05, "Pretrain/Loss": 2.136932849884033, "Pretrain/Loss (Raw)": 2.1625609397888184, "Pretrain/Step": 1435, "Pretrain/Step Time": 8.059319032356143} +{"Pretrain/Learning Rate": 4.811764612326493e-05, "Pretrain/Loss": 2.1363332271575928, "Pretrain/Loss (Raw)": 2.107057809829712, "Pretrain/Step": 1436, "Pretrain/Step Time": 8.061562804505229} +{"Pretrain/Learning Rate": 4.8114412844910595e-05, "Pretrain/Loss": 2.13504958152771, "Pretrain/Loss (Raw)": 2.11619234085083, "Pretrain/Step": 1437, "Pretrain/Step Time": 8.056381298229098} +{"Pretrain/Learning Rate": 4.8111176900893254e-05, "Pretrain/Loss": 2.133664608001709, "Pretrain/Loss (Raw)": 2.1302688121795654, "Pretrain/Step": 1438, "Pretrain/Step Time": 8.05842524021864} +{"Pretrain/Learning Rate": 4.810793829158609e-05, "Pretrain/Loss": 2.136505126953125, "Pretrain/Loss (Raw)": 2.5021398067474365, "Pretrain/Step": 1439, "Pretrain/Step Time": 8.061534814536572} +{"Pretrain/Learning Rate": 4.8104697017362595e-05, "Pretrain/Loss": 2.135951042175293, "Pretrain/Loss (Raw)": 2.116677761077881, "Pretrain/Step": 1440, "Pretrain/Step Time": 8.053320562466979} +{"Pretrain/Learning Rate": 4.8101453078596565e-05, "Pretrain/Loss": 2.134751796722412, "Pretrain/Loss (Raw)": 2.1526687145233154, "Pretrain/Step": 1441, "Pretrain/Step Time": 8.060148334130645} +{"Pretrain/Learning Rate": 4.809820647566211e-05, "Pretrain/Loss": 2.135937213897705, "Pretrain/Loss (Raw)": 2.226750612258911, "Pretrain/Step": 1442, "Pretrain/Step Time": 8.059102848172188} +{"Pretrain/Learning Rate": 4.8094957208933635e-05, "Pretrain/Loss": 2.1386735439300537, "Pretrain/Loss (Raw)": 2.4368700981140137, "Pretrain/Step": 1443, "Pretrain/Step Time": 8.067573430016637} +{"Pretrain/Learning Rate": 4.809170527878587e-05, "Pretrain/Loss": 2.1389636993408203, "Pretrain/Loss (Raw)": 2.0641531944274902, "Pretrain/Step": 1444, "Pretrain/Step Time": 8.061140548437834} +{"Pretrain/Learning Rate": 4.808845068559384e-05, "Pretrain/Loss": 2.1383657455444336, "Pretrain/Loss (Raw)": 2.0634686946868896, "Pretrain/Step": 1445, "Pretrain/Step Time": 8.065444748848677} +{"Pretrain/Learning Rate": 4.808519342973289e-05, "Pretrain/Loss": 2.1382718086242676, "Pretrain/Loss (Raw)": 2.1518054008483887, "Pretrain/Step": 1446, "Pretrain/Step Time": 8.067560287192464} +{"Pretrain/Learning Rate": 4.808193351157865e-05, "Pretrain/Loss": 2.137071371078491, "Pretrain/Loss (Raw)": 2.0035181045532227, "Pretrain/Step": 1447, "Pretrain/Step Time": 8.057208877056837} +{"Pretrain/Learning Rate": 4.8078670931507064e-05, "Pretrain/Loss": 2.137360095977783, "Pretrain/Loss (Raw)": 2.073683738708496, "Pretrain/Step": 1448, "Pretrain/Step Time": 8.06404983624816} +{"Pretrain/Learning Rate": 4.80754056898944e-05, "Pretrain/Loss": 2.1378889083862305, "Pretrain/Loss (Raw)": 2.102414608001709, "Pretrain/Step": 1449, "Pretrain/Step Time": 8.060622999444604} +{"Pretrain/Learning Rate": 4.807213778711722e-05, "Pretrain/Loss": 2.1371564865112305, "Pretrain/Loss (Raw)": 2.0791611671447754, "Pretrain/Step": 1450, "Pretrain/Step Time": 8.065115462988615} +{"Pretrain/Learning Rate": 4.8068867223552384e-05, "Pretrain/Loss": 2.1367099285125732, "Pretrain/Loss (Raw)": 2.0250442028045654, "Pretrain/Step": 1451, "Pretrain/Step Time": 8.061493076384068} +{"Pretrain/Learning Rate": 4.8065593999577086e-05, "Pretrain/Loss": 2.138723850250244, "Pretrain/Loss (Raw)": 2.179370164871216, "Pretrain/Step": 1452, "Pretrain/Step Time": 8.062907982617617} +{"Pretrain/Learning Rate": 4.806231811556879e-05, "Pretrain/Loss": 2.1397554874420166, "Pretrain/Loss (Raw)": 2.1433587074279785, "Pretrain/Step": 1453, "Pretrain/Step Time": 8.052877398207784} +{"Pretrain/Learning Rate": 4.80590395719053e-05, "Pretrain/Loss": 2.138495922088623, "Pretrain/Loss (Raw)": 1.990938425064087, "Pretrain/Step": 1454, "Pretrain/Step Time": 8.059602342545986} +{"Pretrain/Learning Rate": 4.805575836896471e-05, "Pretrain/Loss": 2.1379966735839844, "Pretrain/Loss (Raw)": 2.053938150405884, "Pretrain/Step": 1455, "Pretrain/Step Time": 8.055857291445136} +{"Pretrain/Learning Rate": 4.805247450712542e-05, "Pretrain/Loss": 2.1375577449798584, "Pretrain/Loss (Raw)": 2.138357162475586, "Pretrain/Step": 1456, "Pretrain/Step Time": 8.056603560224175} +{"Pretrain/Learning Rate": 4.804918798676614e-05, "Pretrain/Loss": 2.13724422454834, "Pretrain/Loss (Raw)": 2.1480023860931396, "Pretrain/Step": 1457, "Pretrain/Step Time": 8.057910731062293} +{"Pretrain/Learning Rate": 4.804589880826589e-05, "Pretrain/Loss": 2.1378955841064453, "Pretrain/Loss (Raw)": 2.0583841800689697, "Pretrain/Step": 1458, "Pretrain/Step Time": 8.044729048386216} +{"Pretrain/Learning Rate": 4.8042606972004e-05, "Pretrain/Loss": 2.137291669845581, "Pretrain/Loss (Raw)": 2.059727668762207, "Pretrain/Step": 1459, "Pretrain/Step Time": 8.049198642373085} +{"Pretrain/Learning Rate": 4.803931247836009e-05, "Pretrain/Loss": 2.1375985145568848, "Pretrain/Loss (Raw)": 2.215632438659668, "Pretrain/Step": 1460, "Pretrain/Step Time": 8.053959159180522} +{"Pretrain/Learning Rate": 4.80360153277141e-05, "Pretrain/Loss": 2.1368660926818848, "Pretrain/Loss (Raw)": 2.126164436340332, "Pretrain/Step": 1461, "Pretrain/Step Time": 8.048766728490591} +{"Pretrain/Learning Rate": 4.8032715520446275e-05, "Pretrain/Loss": 2.134275436401367, "Pretrain/Loss (Raw)": 1.964242935180664, "Pretrain/Step": 1462, "Pretrain/Step Time": 8.052028004080057} +{"Pretrain/Learning Rate": 4.802941305693716e-05, "Pretrain/Loss": 2.134904146194458, "Pretrain/Loss (Raw)": 2.1769790649414062, "Pretrain/Step": 1463, "Pretrain/Step Time": 8.049513710662723} +{"Pretrain/Learning Rate": 4.802610793756761e-05, "Pretrain/Loss": 2.1351118087768555, "Pretrain/Loss (Raw)": 2.145167112350464, "Pretrain/Step": 1464, "Pretrain/Step Time": 8.05780921690166} +{"Pretrain/Learning Rate": 4.8022800162718794e-05, "Pretrain/Loss": 2.1345338821411133, "Pretrain/Loss (Raw)": 2.0955872535705566, "Pretrain/Step": 1465, "Pretrain/Step Time": 8.057962369173765} +{"Pretrain/Learning Rate": 4.801948973277218e-05, "Pretrain/Loss": 2.1358485221862793, "Pretrain/Loss (Raw)": 2.1960458755493164, "Pretrain/Step": 1466, "Pretrain/Step Time": 8.053916852921247} +{"Pretrain/Learning Rate": 4.8016176648109534e-05, "Pretrain/Loss": 2.133545398712158, "Pretrain/Loss (Raw)": 2.0299198627471924, "Pretrain/Step": 1467, "Pretrain/Step Time": 8.057982198894024} +{"Pretrain/Learning Rate": 4.801286090911295e-05, "Pretrain/Loss": 2.1320667266845703, "Pretrain/Loss (Raw)": 1.9441826343536377, "Pretrain/Step": 1468, "Pretrain/Step Time": 8.049796698614955} +{"Pretrain/Learning Rate": 4.80095425161648e-05, "Pretrain/Loss": 2.132214069366455, "Pretrain/Loss (Raw)": 2.1791341304779053, "Pretrain/Step": 1469, "Pretrain/Step Time": 8.05834910646081} +{"Pretrain/Learning Rate": 4.800622146964777e-05, "Pretrain/Loss": 2.1321496963500977, "Pretrain/Loss (Raw)": 2.1405434608459473, "Pretrain/Step": 1470, "Pretrain/Step Time": 8.049822259694338} +{"Pretrain/Learning Rate": 4.8002897769944885e-05, "Pretrain/Loss": 2.131103038787842, "Pretrain/Loss (Raw)": 2.0546443462371826, "Pretrain/Step": 1471, "Pretrain/Step Time": 8.052343802526593} +{"Pretrain/Learning Rate": 4.799957141743944e-05, "Pretrain/Loss": 2.1313767433166504, "Pretrain/Loss (Raw)": 2.1335232257843018, "Pretrain/Step": 1472, "Pretrain/Step Time": 8.043525384739041} +{"Pretrain/Learning Rate": 4.799624241251502e-05, "Pretrain/Loss": 2.130396604537964, "Pretrain/Loss (Raw)": 1.9880436658859253, "Pretrain/Step": 1473, "Pretrain/Step Time": 8.050649492070079} +{"Pretrain/Learning Rate": 4.7992910755555584e-05, "Pretrain/Loss": 2.130026340484619, "Pretrain/Loss (Raw)": 2.044172763824463, "Pretrain/Step": 1474, "Pretrain/Step Time": 8.055702537298203} +{"Pretrain/Learning Rate": 4.798957644694533e-05, "Pretrain/Loss": 2.129624128341675, "Pretrain/Loss (Raw)": 2.0853450298309326, "Pretrain/Step": 1475, "Pretrain/Step Time": 8.049128578975797} +{"Pretrain/Learning Rate": 4.7986239487068785e-05, "Pretrain/Loss": 2.1296191215515137, "Pretrain/Loss (Raw)": 2.124530076980591, "Pretrain/Step": 1476, "Pretrain/Step Time": 8.053921166807413} +{"Pretrain/Learning Rate": 4.798289987631079e-05, "Pretrain/Loss": 2.12973952293396, "Pretrain/Loss (Raw)": 2.061082363128662, "Pretrain/Step": 1477, "Pretrain/Step Time": 8.046619113534689} +{"Pretrain/Learning Rate": 4.797955761505648e-05, "Pretrain/Loss": 2.130725860595703, "Pretrain/Loss (Raw)": 2.1998391151428223, "Pretrain/Step": 1478, "Pretrain/Step Time": 8.051492603495717} +{"Pretrain/Learning Rate": 4.7976212703691306e-05, "Pretrain/Loss": 2.1281495094299316, "Pretrain/Loss (Raw)": 2.1182289123535156, "Pretrain/Step": 1479, "Pretrain/Step Time": 8.052375419065356} +{"Pretrain/Learning Rate": 4.797286514260101e-05, "Pretrain/Loss": 2.1279256343841553, "Pretrain/Loss (Raw)": 2.117058277130127, "Pretrain/Step": 1480, "Pretrain/Step Time": 8.047594830393791} +{"Pretrain/Learning Rate": 4.7969514932171665e-05, "Pretrain/Loss": 2.1281580924987793, "Pretrain/Loss (Raw)": 2.1047699451446533, "Pretrain/Step": 1481, "Pretrain/Step Time": 8.055498827248812} +{"Pretrain/Learning Rate": 4.796616207278961e-05, "Pretrain/Loss": 2.1281514167785645, "Pretrain/Loss (Raw)": 2.021857500076294, "Pretrain/Step": 1482, "Pretrain/Step Time": 8.048336260020733} +{"Pretrain/Learning Rate": 4.796280656484153e-05, "Pretrain/Loss": 2.129016876220703, "Pretrain/Loss (Raw)": 2.207958459854126, "Pretrain/Step": 1483, "Pretrain/Step Time": 8.056370278820395} +{"Pretrain/Learning Rate": 4.795944840871439e-05, "Pretrain/Loss": 2.1288001537323, "Pretrain/Loss (Raw)": 2.088374614715576, "Pretrain/Step": 1484, "Pretrain/Step Time": 8.058346504345536} +{"Pretrain/Learning Rate": 4.7956087604795474e-05, "Pretrain/Loss": 2.128035068511963, "Pretrain/Loss (Raw)": 2.132969379425049, "Pretrain/Step": 1485, "Pretrain/Step Time": 8.055936180055141} +{"Pretrain/Learning Rate": 4.7952724153472366e-05, "Pretrain/Loss": 2.1296000480651855, "Pretrain/Loss (Raw)": 2.3471133708953857, "Pretrain/Step": 1486, "Pretrain/Step Time": 8.06273352354765} +{"Pretrain/Learning Rate": 4.7949358055132945e-05, "Pretrain/Loss": 2.129453659057617, "Pretrain/Loss (Raw)": 2.0712192058563232, "Pretrain/Step": 1487, "Pretrain/Step Time": 8.062015717849135} +{"Pretrain/Learning Rate": 4.7945989310165415e-05, "Pretrain/Loss": 2.130580425262451, "Pretrain/Loss (Raw)": 2.3263027667999268, "Pretrain/Step": 1488, "Pretrain/Step Time": 8.06701303459704} +{"Pretrain/Learning Rate": 4.794261791895828e-05, "Pretrain/Loss": 2.128743886947632, "Pretrain/Loss (Raw)": 1.9837404489517212, "Pretrain/Step": 1489, "Pretrain/Step Time": 8.061966508626938} +{"Pretrain/Learning Rate": 4.793924388190033e-05, "Pretrain/Loss": 2.130345344543457, "Pretrain/Loss (Raw)": 2.2563531398773193, "Pretrain/Step": 1490, "Pretrain/Step Time": 8.062320128083229} +{"Pretrain/Learning Rate": 4.793586719938068e-05, "Pretrain/Loss": 2.130183696746826, "Pretrain/Loss (Raw)": 2.1869192123413086, "Pretrain/Step": 1491, "Pretrain/Step Time": 8.054612942039967} +{"Pretrain/Learning Rate": 4.7932487871788746e-05, "Pretrain/Loss": 2.1307034492492676, "Pretrain/Loss (Raw)": 2.141775131225586, "Pretrain/Step": 1492, "Pretrain/Step Time": 8.061765464022756} +{"Pretrain/Learning Rate": 1.7482517482517484e-07, "Pretrain/Loss": 2.875234842300415, "Pretrain/Loss (Raw)": 2.875234842300415, "Pretrain/Step": 1, "Pretrain/Step Time": 12.501804113388062} +{"Pretrain/Learning Rate": 3.496503496503497e-07, "Pretrain/Loss": 2.9566798210144043, "Pretrain/Loss (Raw)": 3.0381250381469727, "Pretrain/Step": 2, "Pretrain/Step Time": 10.234309673309326} +{"Pretrain/Learning Rate": 5.244755244755246e-07, "Pretrain/Loss": 3.3331334590911865, "Pretrain/Loss (Raw)": 4.086040496826172, "Pretrain/Step": 3, "Pretrain/Step Time": 9.575958569844564} +{"Pretrain/Learning Rate": 6.993006993006994e-07, "Pretrain/Loss": 3.4034674167633057, "Pretrain/Loss (Raw)": 3.614469528198242, "Pretrain/Step": 4, "Pretrain/Step Time": 9.253808379173279} +{"Pretrain/Learning Rate": 8.741258741258743e-07, "Pretrain/Loss": 3.595816135406494, "Pretrain/Loss (Raw)": 4.365209102630615, "Pretrain/Step": 5, "Pretrain/Step Time": 9.029268884658814} +{"Pretrain/Learning Rate": 1.0489510489510491e-06, "Pretrain/Loss": 3.646848678588867, "Pretrain/Loss (Raw)": 3.9020118713378906, "Pretrain/Step": 6, "Pretrain/Step Time": 8.860156416893005} +{"Pretrain/Learning Rate": 1.2237762237762238e-06, "Pretrain/Loss": 3.6192939281463623, "Pretrain/Loss (Raw)": 3.4539647102355957, "Pretrain/Step": 7, "Pretrain/Step Time": 8.73090866633824} +{"Pretrain/Learning Rate": 1.3986013986013987e-06, "Pretrain/Loss": 3.5375852584838867, "Pretrain/Loss (Raw)": 2.965627431869507, "Pretrain/Step": 8, "Pretrain/Step Time": 8.658568382263184} +{"Pretrain/Learning Rate": 1.5734265734265736e-06, "Pretrain/Loss": 3.4894349575042725, "Pretrain/Loss (Raw)": 3.1042308807373047, "Pretrain/Step": 9, "Pretrain/Step Time": 8.591733243730333} +{"Pretrain/Learning Rate": 1.7482517482517485e-06, "Pretrain/Loss": 3.472484588623047, "Pretrain/Loss (Raw)": 3.319931745529175, "Pretrain/Step": 10, "Pretrain/Step Time": 8.535490560531617} +{"Pretrain/Learning Rate": 1.9230769230769234e-06, "Pretrain/Loss": 3.4624600410461426, "Pretrain/Loss (Raw)": 3.3622121810913086, "Pretrain/Step": 11, "Pretrain/Step Time": 8.507929563522339} +{"Pretrain/Learning Rate": 2.0979020979020983e-06, "Pretrain/Loss": 3.508485794067383, "Pretrain/Loss (Raw)": 4.014769554138184, "Pretrain/Step": 12, "Pretrain/Step Time": 8.495926996072134} +{"Pretrain/Learning Rate": 2.2727272727272728e-06, "Pretrain/Loss": 3.463073253631592, "Pretrain/Loss (Raw)": 2.9181244373321533, "Pretrain/Step": 13, "Pretrain/Step Time": 8.465177939488338} +{"Pretrain/Learning Rate": 2.4475524475524477e-06, "Pretrain/Loss": 3.4529001712799072, "Pretrain/Loss (Raw)": 3.320645570755005, "Pretrain/Step": 14, "Pretrain/Step Time": 8.426200764519828} +{"Pretrain/Learning Rate": 2.6223776223776225e-06, "Pretrain/Loss": 3.43780255317688, "Pretrain/Loss (Raw)": 3.226438522338867, "Pretrain/Step": 15, "Pretrain/Step Time": 8.430219570795694} +{"Pretrain/Learning Rate": 2.7972027972027974e-06, "Pretrain/Loss": 3.4063823223114014, "Pretrain/Loss (Raw)": 2.935081720352173, "Pretrain/Step": 16, "Pretrain/Step Time": 8.409840866923332} +{"Pretrain/Learning Rate": 2.9720279720279723e-06, "Pretrain/Loss": 3.377972364425659, "Pretrain/Loss (Raw)": 2.9234092235565186, "Pretrain/Step": 17, "Pretrain/Step Time": 8.480078627081479} +{"Pretrain/Learning Rate": 3.1468531468531472e-06, "Pretrain/Loss": 3.329549551010132, "Pretrain/Loss (Raw)": 2.5063657760620117, "Pretrain/Step": 18, "Pretrain/Step Time": 8.455479529168871} +{"Pretrain/Learning Rate": 3.3216783216783217e-06, "Pretrain/Loss": 3.2916674613952637, "Pretrain/Loss (Raw)": 2.609787940979004, "Pretrain/Step": 19, "Pretrain/Step Time": 8.449550578468724} +{"Pretrain/Learning Rate": 3.496503496503497e-06, "Pretrain/Loss": 3.270766496658325, "Pretrain/Loss (Raw)": 2.873647928237915, "Pretrain/Step": 20, "Pretrain/Step Time": 8.425109493732453} +{"Pretrain/Learning Rate": 3.6713286713286715e-06, "Pretrain/Loss": 3.2441632747650146, "Pretrain/Loss (Raw)": 2.7120935916900635, "Pretrain/Step": 21, "Pretrain/Step Time": 8.404021660486857} +{"Pretrain/Learning Rate": 3.846153846153847e-06, "Pretrain/Loss": 3.228785514831543, "Pretrain/Loss (Raw)": 2.9058568477630615, "Pretrain/Step": 22, "Pretrain/Step Time": 8.390849330208518} +{"Pretrain/Learning Rate": 4.020979020979021e-06, "Pretrain/Loss": 3.215786933898926, "Pretrain/Loss (Raw)": 2.9298157691955566, "Pretrain/Step": 23, "Pretrain/Step Time": 8.373302138370017} +{"Pretrain/Learning Rate": 4.195804195804197e-06, "Pretrain/Loss": 3.1799755096435547, "Pretrain/Loss (Raw)": 2.356316089630127, "Pretrain/Step": 24, "Pretrain/Step Time": 8.352062612771988} +{"Pretrain/Learning Rate": 4.370629370629371e-06, "Pretrain/Loss": 3.1631875038146973, "Pretrain/Loss (Raw)": 2.7602803707122803, "Pretrain/Step": 25, "Pretrain/Step Time": 8.344635457992554} +{"Pretrain/Learning Rate": 4.5454545454545455e-06, "Pretrain/Loss": 3.127854108810425, "Pretrain/Loss (Raw)": 2.2445080280303955, "Pretrain/Step": 26, "Pretrain/Step Time": 8.327202778596144} +{"Pretrain/Learning Rate": 4.72027972027972e-06, "Pretrain/Loss": 3.116415500640869, "Pretrain/Loss (Raw)": 2.819014549255371, "Pretrain/Step": 27, "Pretrain/Step Time": 8.328329571971187} +{"Pretrain/Learning Rate": 4.895104895104895e-06, "Pretrain/Loss": 3.08772611618042, "Pretrain/Loss (Raw)": 2.3131160736083984, "Pretrain/Step": 28, "Pretrain/Step Time": 8.311330156666893} +{"Pretrain/Learning Rate": 5.06993006993007e-06, "Pretrain/Loss": 3.0643835067749023, "Pretrain/Loss (Raw)": 2.4107871055603027, "Pretrain/Step": 29, "Pretrain/Step Time": 8.303225451502307} +{"Pretrain/Learning Rate": 5.244755244755245e-06, "Pretrain/Loss": 3.036118745803833, "Pretrain/Loss (Raw)": 2.2164440155029297, "Pretrain/Step": 30, "Pretrain/Step Time": 8.297056762377421} +{"Pretrain/Learning Rate": 5.419580419580419e-06, "Pretrain/Loss": 3.0140788555145264, "Pretrain/Loss (Raw)": 2.352886199951172, "Pretrain/Step": 31, "Pretrain/Step Time": 8.293898051784884} +{"Pretrain/Learning Rate": 5.594405594405595e-06, "Pretrain/Loss": 2.9959442615509033, "Pretrain/Loss (Raw)": 2.433769702911377, "Pretrain/Step": 32, "Pretrain/Step Time": 8.279911361634731} +{"Pretrain/Learning Rate": 5.76923076923077e-06, "Pretrain/Loss": 2.977586507797241, "Pretrain/Loss (Raw)": 2.390134572982788, "Pretrain/Step": 33, "Pretrain/Step Time": 8.274643226103349} +{"Pretrain/Learning Rate": 5.944055944055945e-06, "Pretrain/Loss": 2.970039129257202, "Pretrain/Loss (Raw)": 2.720978260040283, "Pretrain/Step": 34, "Pretrain/Step Time": 8.282150563071756} +{"Pretrain/Learning Rate": 6.1188811188811196e-06, "Pretrain/Loss": 2.94897723197937, "Pretrain/Loss (Raw)": 2.2328763008117676, "Pretrain/Step": 35, "Pretrain/Step Time": 8.283417442866734} +{"Pretrain/Learning Rate": 6.2937062937062944e-06, "Pretrain/Loss": 2.943577289581299, "Pretrain/Loss (Raw)": 2.7545745372772217, "Pretrain/Step": 36, "Pretrain/Step Time": 8.291588803132376} +{"Pretrain/Learning Rate": 6.468531468531469e-06, "Pretrain/Loss": 2.9221596717834473, "Pretrain/Loss (Raw)": 2.1511216163635254, "Pretrain/Step": 37, "Pretrain/Step Time": 8.312177477656183} +{"Pretrain/Learning Rate": 6.643356643356643e-06, "Pretrain/Loss": 2.9172890186309814, "Pretrain/Loss (Raw)": 2.737077236175537, "Pretrain/Step": 38, "Pretrain/Step Time": 8.303546554163882} +{"Pretrain/Learning Rate": 6.818181818181818e-06, "Pretrain/Loss": 2.897656202316284, "Pretrain/Loss (Raw)": 2.1516125202178955, "Pretrain/Step": 39, "Pretrain/Step Time": 8.290617582125542} +{"Pretrain/Learning Rate": 6.993006993006994e-06, "Pretrain/Loss": 2.878488540649414, "Pretrain/Loss (Raw)": 2.1309497356414795, "Pretrain/Step": 40, "Pretrain/Step Time": 8.287254571914673} +{"Pretrain/Learning Rate": 7.167832167832168e-06, "Pretrain/Loss": 2.868990898132324, "Pretrain/Loss (Raw)": 2.4890856742858887, "Pretrain/Step": 41, "Pretrain/Step Time": 8.280069653580828} +{"Pretrain/Learning Rate": 7.342657342657343e-06, "Pretrain/Loss": 2.863844156265259, "Pretrain/Loss (Raw)": 2.6528189182281494, "Pretrain/Step": 42, "Pretrain/Step Time": 8.272526706968035} +{"Pretrain/Learning Rate": 7.517482517482517e-06, "Pretrain/Loss": 2.8514199256896973, "Pretrain/Loss (Raw)": 2.3296151161193848, "Pretrain/Step": 43, "Pretrain/Step Time": 8.271021194236223} +{"Pretrain/Learning Rate": 7.692307692307694e-06, "Pretrain/Loss": 2.8371474742889404, "Pretrain/Loss (Raw)": 2.2234296798706055, "Pretrain/Step": 44, "Pretrain/Step Time": 8.273217900232835} +{"Pretrain/Learning Rate": 7.867132867132867e-06, "Pretrain/Loss": 2.824056386947632, "Pretrain/Loss (Raw)": 2.2480454444885254, "Pretrain/Step": 45, "Pretrain/Step Time": 8.266705735524495} +{"Pretrain/Learning Rate": 8.041958041958042e-06, "Pretrain/Loss": 2.811825752258301, "Pretrain/Loss (Raw)": 2.2614409923553467, "Pretrain/Step": 46, "Pretrain/Step Time": 8.263343966525534} +{"Pretrain/Learning Rate": 8.216783216783217e-06, "Pretrain/Loss": 2.807101249694824, "Pretrain/Loss (Raw)": 2.5897762775421143, "Pretrain/Step": 47, "Pretrain/Step Time": 8.257158299709888} +{"Pretrain/Learning Rate": 8.391608391608393e-06, "Pretrain/Loss": 2.7993218898773193, "Pretrain/Loss (Raw)": 2.433694839477539, "Pretrain/Step": 48, "Pretrain/Step Time": 8.251250877976418} +{"Pretrain/Learning Rate": 8.566433566433566e-06, "Pretrain/Loss": 2.790766954421997, "Pretrain/Loss (Raw)": 2.3801543712615967, "Pretrain/Step": 49, "Pretrain/Step Time": 8.247530752298783} +{"Pretrain/Learning Rate": 8.741258741258741e-06, "Pretrain/Loss": 2.784116506576538, "Pretrain/Loss (Raw)": 2.458226442337036, "Pretrain/Step": 50, "Pretrain/Step Time": 8.241068677902222} +{"Pretrain/Learning Rate": 8.916083916083918e-06, "Pretrain/Loss": 2.7733962535858154, "Pretrain/Loss (Raw)": 2.2373905181884766, "Pretrain/Step": 51, "Pretrain/Step Time": 8.239445508695116} +{"Pretrain/Learning Rate": 9.090909090909091e-06, "Pretrain/Loss": 2.759373664855957, "Pretrain/Loss (Raw)": 2.0442049503326416, "Pretrain/Step": 52, "Pretrain/Step Time": 8.237464712216305} +{"Pretrain/Learning Rate": 9.265734265734266e-06, "Pretrain/Loss": 2.7529263496398926, "Pretrain/Loss (Raw)": 2.417681932449341, "Pretrain/Step": 53, "Pretrain/Step Time": 8.250497111734354} +{"Pretrain/Learning Rate": 9.44055944055944e-06, "Pretrain/Loss": 2.741006374359131, "Pretrain/Loss (Raw)": 2.1092514991760254, "Pretrain/Step": 54, "Pretrain/Step Time": 8.247150050269234} +{"Pretrain/Learning Rate": 9.615384615384616e-06, "Pretrain/Loss": 2.7335469722747803, "Pretrain/Loss (Raw)": 2.3307394981384277, "Pretrain/Step": 55, "Pretrain/Step Time": 8.257515933296897} +{"Pretrain/Learning Rate": 9.79020979020979e-06, "Pretrain/Loss": 2.728847026824951, "Pretrain/Loss (Raw)": 2.4703311920166016, "Pretrain/Step": 56, "Pretrain/Step Time": 8.25353976232665} +{"Pretrain/Learning Rate": 9.965034965034966e-06, "Pretrain/Loss": 2.7181081771850586, "Pretrain/Loss (Raw)": 2.1167263984680176, "Pretrain/Step": 57, "Pretrain/Step Time": 8.255316437336436} +{"Pretrain/Learning Rate": 1.013986013986014e-05, "Pretrain/Loss": 2.712589979171753, "Pretrain/Loss (Raw)": 2.3980660438537598, "Pretrain/Step": 58, "Pretrain/Step Time": 8.248588105727887} +{"Pretrain/Learning Rate": 1.0314685314685315e-05, "Pretrain/Loss": 2.7143633365631104, "Pretrain/Loss (Raw)": 2.817214012145996, "Pretrain/Step": 59, "Pretrain/Step Time": 8.253849340697466} +{"Pretrain/Learning Rate": 1.048951048951049e-05, "Pretrain/Loss": 2.7065765857696533, "Pretrain/Loss (Raw)": 2.2471718788146973, "Pretrain/Step": 60, "Pretrain/Step Time": 8.249278628826142} +{"Pretrain/Learning Rate": 1.0664335664335665e-05, "Pretrain/Loss": 2.7030434608459473, "Pretrain/Loss (Raw)": 2.4910616874694824, "Pretrain/Step": 61, "Pretrain/Step Time": 8.243470735237247} +{"Pretrain/Learning Rate": 1.0839160839160838e-05, "Pretrain/Loss": 2.6973161697387695, "Pretrain/Loss (Raw)": 2.3479409217834473, "Pretrain/Step": 62, "Pretrain/Step Time": 8.237666487693787} +{"Pretrain/Learning Rate": 1.1013986013986015e-05, "Pretrain/Loss": 2.6895911693573, "Pretrain/Loss (Raw)": 2.2106196880340576, "Pretrain/Step": 63, "Pretrain/Step Time": 8.233880830189538} +{"Pretrain/Learning Rate": 1.118881118881119e-05, "Pretrain/Loss": 2.67983078956604, "Pretrain/Loss (Raw)": 2.0649473667144775, "Pretrain/Step": 64, "Pretrain/Step Time": 8.234169077128172} +{"Pretrain/Learning Rate": 1.1363636363636365e-05, "Pretrain/Loss": 2.678873300552368, "Pretrain/Loss (Raw)": 2.617596387863159, "Pretrain/Step": 65, "Pretrain/Step Time": 8.229615097779494} +{"Pretrain/Learning Rate": 1.153846153846154e-05, "Pretrain/Loss": 2.674724817276001, "Pretrain/Loss (Raw)": 2.4050545692443848, "Pretrain/Step": 66, "Pretrain/Step Time": 8.226632421666926} +{"Pretrain/Learning Rate": 1.1713286713286714e-05, "Pretrain/Loss": 2.66876482963562, "Pretrain/Loss (Raw)": 2.2754323482513428, "Pretrain/Step": 67, "Pretrain/Step Time": 8.22236761762135} +{"Pretrain/Learning Rate": 1.188811188811189e-05, "Pretrain/Loss": 2.6638245582580566, "Pretrain/Loss (Raw)": 2.3328168392181396, "Pretrain/Step": 68, "Pretrain/Step Time": 8.221324082683115} +{"Pretrain/Learning Rate": 1.2062937062937063e-05, "Pretrain/Loss": 2.660764694213867, "Pretrain/Loss (Raw)": 2.4526777267456055, "Pretrain/Step": 69, "Pretrain/Step Time": 8.218235351037288} +{"Pretrain/Learning Rate": 1.2237762237762239e-05, "Pretrain/Loss": 2.653960943222046, "Pretrain/Loss (Raw)": 2.1845109462738037, "Pretrain/Step": 70, "Pretrain/Step Time": 8.218977172034128} +{"Pretrain/Learning Rate": 1.2412587412587414e-05, "Pretrain/Loss": 2.6504266262054443, "Pretrain/Loss (Raw)": 2.403027057647705, "Pretrain/Step": 71, "Pretrain/Step Time": 8.220419544569204} +{"Pretrain/Learning Rate": 1.2587412587412589e-05, "Pretrain/Loss": 2.64512300491333, "Pretrain/Loss (Raw)": 2.2685673236846924, "Pretrain/Step": 72, "Pretrain/Step Time": 8.215861337052452} +{"Pretrain/Learning Rate": 1.2762237762237764e-05, "Pretrain/Loss": 2.63737416267395, "Pretrain/Loss (Raw)": 2.079472780227661, "Pretrain/Step": 73, "Pretrain/Step Time": 8.224828089753242} +{"Pretrain/Learning Rate": 1.2937062937062939e-05, "Pretrain/Loss": 2.6345343589782715, "Pretrain/Loss (Raw)": 2.427196979522705, "Pretrain/Step": 74, "Pretrain/Step Time": 8.29052331963101} +{"Pretrain/Learning Rate": 1.3111888111888112e-05, "Pretrain/Loss": 2.628520965576172, "Pretrain/Loss (Raw)": 2.183540105819702, "Pretrain/Step": 75, "Pretrain/Step Time": 8.302039213180542} +{"Pretrain/Learning Rate": 1.3286713286713287e-05, "Pretrain/Loss": 2.6257121562957764, "Pretrain/Loss (Raw)": 2.41506290435791, "Pretrain/Step": 76, "Pretrain/Step Time": 8.300287108672293} +{"Pretrain/Learning Rate": 1.3461538461538462e-05, "Pretrain/Loss": 2.62099552154541, "Pretrain/Loss (Raw)": 2.2625157833099365, "Pretrain/Step": 77, "Pretrain/Step Time": 8.31087174044027} +{"Pretrain/Learning Rate": 1.3636363636363637e-05, "Pretrain/Loss": 2.618145704269409, "Pretrain/Loss (Raw)": 2.3987200260162354, "Pretrain/Step": 78, "Pretrain/Step Time": 8.3227640634928} +{"Pretrain/Learning Rate": 1.381118881118881e-05, "Pretrain/Loss": 2.6140623092651367, "Pretrain/Loss (Raw)": 2.2955470085144043, "Pretrain/Step": 79, "Pretrain/Step Time": 8.325032566167131} +{"Pretrain/Learning Rate": 1.3986013986013988e-05, "Pretrain/Loss": 2.61930513381958, "Pretrain/Loss (Raw)": 3.033492088317871, "Pretrain/Step": 80, "Pretrain/Step Time": 8.323383849859237} +{"Pretrain/Learning Rate": 1.4160839160839163e-05, "Pretrain/Loss": 2.617669105529785, "Pretrain/Loss (Raw)": 2.4867796897888184, "Pretrain/Step": 81, "Pretrain/Step Time": 8.321788808445872} +{"Pretrain/Learning Rate": 1.4335664335664336e-05, "Pretrain/Loss": 2.6098382472991943, "Pretrain/Loss (Raw)": 1.9755582809448242, "Pretrain/Step": 82, "Pretrain/Step Time": 8.333538136831145} +{"Pretrain/Learning Rate": 1.4510489510489511e-05, "Pretrain/Loss": 2.604992389678955, "Pretrain/Loss (Raw)": 2.207653045654297, "Pretrain/Step": 83, "Pretrain/Step Time": 8.334801251629749} +{"Pretrain/Learning Rate": 1.4685314685314686e-05, "Pretrain/Loss": 2.6026241779327393, "Pretrain/Loss (Raw)": 2.4060332775115967, "Pretrain/Step": 84, "Pretrain/Step Time": 8.330692983808971} +{"Pretrain/Learning Rate": 1.486013986013986e-05, "Pretrain/Loss": 2.599299192428589, "Pretrain/Loss (Raw)": 2.3200137615203857, "Pretrain/Step": 85, "Pretrain/Step Time": 8.329283568438361} +{"Pretrain/Learning Rate": 1.5034965034965034e-05, "Pretrain/Loss": 2.593914031982422, "Pretrain/Loss (Raw)": 2.13617205619812, "Pretrain/Step": 86, "Pretrain/Step Time": 8.32554761476295} +{"Pretrain/Learning Rate": 1.5209790209790212e-05, "Pretrain/Loss": 2.5903453826904297, "Pretrain/Loss (Raw)": 2.283440589904785, "Pretrain/Step": 87, "Pretrain/Step Time": 8.33502547220252} +{"Pretrain/Learning Rate": 1.5384615384615387e-05, "Pretrain/Loss": 2.5858657360076904, "Pretrain/Loss (Raw)": 2.196120023727417, "Pretrain/Step": 88, "Pretrain/Step Time": 8.347127112475308} +{"Pretrain/Learning Rate": 1.555944055944056e-05, "Pretrain/Loss": 2.5813400745391846, "Pretrain/Loss (Raw)": 2.1830999851226807, "Pretrain/Step": 89, "Pretrain/Step Time": 8.342797394548908} +{"Pretrain/Learning Rate": 1.5734265734265734e-05, "Pretrain/Loss": 2.575986862182617, "Pretrain/Loss (Raw)": 2.099550485610962, "Pretrain/Step": 90, "Pretrain/Step Time": 8.342475239435831} +{"Pretrain/Learning Rate": 1.590909090909091e-05, "Pretrain/Loss": 2.571683645248413, "Pretrain/Loss (Raw)": 2.1843831539154053, "Pretrain/Step": 91, "Pretrain/Step Time": 8.343686195520254} +{"Pretrain/Learning Rate": 1.6083916083916083e-05, "Pretrain/Loss": 2.567110538482666, "Pretrain/Loss (Raw)": 2.150949001312256, "Pretrain/Step": 92, "Pretrain/Step Time": 8.349983917630237} +{"Pretrain/Learning Rate": 1.625874125874126e-05, "Pretrain/Loss": 2.5649473667144775, "Pretrain/Loss (Raw)": 2.3659422397613525, "Pretrain/Step": 93, "Pretrain/Step Time": 8.36204574185033} +{"Pretrain/Learning Rate": 1.6433566433566433e-05, "Pretrain/Loss": 2.5618491172790527, "Pretrain/Loss (Raw)": 2.273729085922241, "Pretrain/Step": 94, "Pretrain/Step Time": 8.3644412375511} +{"Pretrain/Learning Rate": 1.660839160839161e-05, "Pretrain/Loss": 2.556087017059326, "Pretrain/Loss (Raw)": 2.014437437057495, "Pretrain/Step": 95, "Pretrain/Step Time": 8.360871844542654} +{"Pretrain/Learning Rate": 1.6783216783216786e-05, "Pretrain/Loss": 2.554065704345703, "Pretrain/Loss (Raw)": 2.3620493412017822, "Pretrain/Step": 96, "Pretrain/Step Time": 8.35705258945624} +{"Pretrain/Learning Rate": 1.695804195804196e-05, "Pretrain/Loss": 2.5508012771606445, "Pretrain/Loss (Raw)": 2.2374255657196045, "Pretrain/Step": 97, "Pretrain/Step Time": 8.376652201426397} +{"Pretrain/Learning Rate": 1.7132867132867133e-05, "Pretrain/Loss": 2.549647569656372, "Pretrain/Loss (Raw)": 2.4377312660217285, "Pretrain/Step": 98, "Pretrain/Step Time": 8.374706149101257} +{"Pretrain/Learning Rate": 1.730769230769231e-05, "Pretrain/Loss": 2.5473482608795166, "Pretrain/Loss (Raw)": 2.3219873905181885, "Pretrain/Step": 99, "Pretrain/Step Time": 8.37477778906774} +{"Pretrain/Learning Rate": 1.7482517482517483e-05, "Pretrain/Loss": 2.544846534729004, "Pretrain/Loss (Raw)": 2.297201633453369, "Pretrain/Step": 100, "Pretrain/Step Time": 8.369432764053345} +{"Pretrain/Learning Rate": 1.7657342657342656e-05, "Pretrain/Loss": 2.542060136795044, "Pretrain/Loss (Raw)": 2.2634153366088867, "Pretrain/Step": 101, "Pretrain/Step Time": 8.385721966771797} +{"Pretrain/Learning Rate": 1.7832167832167836e-05, "Pretrain/Loss": 2.542602300643921, "Pretrain/Loss (Raw)": 2.5973517894744873, "Pretrain/Step": 102, "Pretrain/Step Time": 8.383021109244403} +{"Pretrain/Learning Rate": 1.800699300699301e-05, "Pretrain/Loss": 2.5433759689331055, "Pretrain/Loss (Raw)": 2.6222832202911377, "Pretrain/Step": 103, "Pretrain/Step Time": 8.378442171707894} +{"Pretrain/Learning Rate": 1.8181818181818182e-05, "Pretrain/Loss": 2.5400872230529785, "Pretrain/Loss (Raw)": 2.2013607025146484, "Pretrain/Step": 104, "Pretrain/Step Time": 8.377714466590147} +{"Pretrain/Learning Rate": 1.835664335664336e-05, "Pretrain/Loss": 2.5362861156463623, "Pretrain/Loss (Raw)": 2.1409661769866943, "Pretrain/Step": 105, "Pretrain/Step Time": 8.381966243471417} +{"Pretrain/Learning Rate": 1.8531468531468532e-05, "Pretrain/Loss": 2.5339574813842773, "Pretrain/Loss (Raw)": 2.2894575595855713, "Pretrain/Step": 106, "Pretrain/Step Time": 8.385945891434291} +{"Pretrain/Learning Rate": 1.8706293706293705e-05, "Pretrain/Loss": 2.53403639793396, "Pretrain/Loss (Raw)": 2.54239559173584, "Pretrain/Step": 107, "Pretrain/Step Time": 8.382626176994538} +{"Pretrain/Learning Rate": 1.888111888111888e-05, "Pretrain/Loss": 2.5305492877960205, "Pretrain/Loss (Raw)": 2.157430410385132, "Pretrain/Step": 108, "Pretrain/Step Time": 8.379716707600487} +{"Pretrain/Learning Rate": 1.9055944055944055e-05, "Pretrain/Loss": 2.529029607772827, "Pretrain/Loss (Raw)": 2.3649394512176514, "Pretrain/Step": 109, "Pretrain/Step Time": 8.380802611692236} +{"Pretrain/Learning Rate": 1.923076923076923e-05, "Pretrain/Loss": 2.5263640880584717, "Pretrain/Loss (Raw)": 2.235806703567505, "Pretrain/Step": 110, "Pretrain/Step Time": 8.383255672454833} +{"Pretrain/Learning Rate": 1.9405594405594408e-05, "Pretrain/Loss": 2.5242176055908203, "Pretrain/Loss (Raw)": 2.2880654335021973, "Pretrain/Step": 111, "Pretrain/Step Time": 8.395082774463} +{"Pretrain/Learning Rate": 1.958041958041958e-05, "Pretrain/Loss": 2.5232815742492676, "Pretrain/Loss (Raw)": 2.4193718433380127, "Pretrain/Step": 112, "Pretrain/Step Time": 8.400364254202161} +{"Pretrain/Learning Rate": 1.9755244755244758e-05, "Pretrain/Loss": 2.520169258117676, "Pretrain/Loss (Raw)": 2.171611785888672, "Pretrain/Step": 113, "Pretrain/Step Time": 8.397632773998565} +{"Pretrain/Learning Rate": 1.993006993006993e-05, "Pretrain/Loss": 2.5186758041381836, "Pretrain/Loss (Raw)": 2.3499269485473633, "Pretrain/Step": 114, "Pretrain/Step Time": 8.39900463505795} +{"Pretrain/Learning Rate": 2.0104895104895104e-05, "Pretrain/Loss": 2.5160272121429443, "Pretrain/Loss (Raw)": 2.2140908241271973, "Pretrain/Step": 115, "Pretrain/Step Time": 8.399335747179778} +{"Pretrain/Learning Rate": 2.027972027972028e-05, "Pretrain/Loss": 2.517258644104004, "Pretrain/Loss (Raw)": 2.658865213394165, "Pretrain/Step": 116, "Pretrain/Step Time": 8.412999722464331} +{"Pretrain/Learning Rate": 2.0454545454545457e-05, "Pretrain/Loss": 2.5197207927703857, "Pretrain/Loss (Raw)": 2.8053088188171387, "Pretrain/Step": 117, "Pretrain/Step Time": 8.41328852197044} +{"Pretrain/Learning Rate": 2.062937062937063e-05, "Pretrain/Loss": 2.5209310054779053, "Pretrain/Loss (Raw)": 2.6625304222106934, "Pretrain/Step": 118, "Pretrain/Step Time": 8.410579869302653} +{"Pretrain/Learning Rate": 2.0804195804195807e-05, "Pretrain/Loss": 2.5173451900482178, "Pretrain/Loss (Raw)": 2.0942180156707764, "Pretrain/Step": 119, "Pretrain/Step Time": 8.4111369177073} +{"Pretrain/Learning Rate": 2.097902097902098e-05, "Pretrain/Loss": 2.515573740005493, "Pretrain/Loss (Raw)": 2.3047897815704346, "Pretrain/Step": 120, "Pretrain/Step Time": 8.421268757184347} +{"Pretrain/Learning Rate": 2.1153846153846154e-05, "Pretrain/Loss": 2.512232542037964, "Pretrain/Loss (Raw)": 2.1113202571868896, "Pretrain/Step": 121, "Pretrain/Step Time": 8.415829236842384} +{"Pretrain/Learning Rate": 2.132867132867133e-05, "Pretrain/Loss": 2.5088462829589844, "Pretrain/Loss (Raw)": 2.0990819931030273, "Pretrain/Step": 122, "Pretrain/Step Time": 8.414495089015023} +{"Pretrain/Learning Rate": 2.1503496503496503e-05, "Pretrain/Loss": 2.5046887397766113, "Pretrain/Loss (Raw)": 1.9974483251571655, "Pretrain/Step": 123, "Pretrain/Step Time": 8.411952491698226} +{"Pretrain/Learning Rate": 2.1678321678321677e-05, "Pretrain/Loss": 2.5018630027770996, "Pretrain/Loss (Raw)": 2.154301643371582, "Pretrain/Step": 124, "Pretrain/Step Time": 8.409864842891693} +{"Pretrain/Learning Rate": 2.1853146853146857e-05, "Pretrain/Loss": 2.4998083114624023, "Pretrain/Loss (Raw)": 2.2450129985809326, "Pretrain/Step": 125, "Pretrain/Step Time": 8.413026494979858} +{"Pretrain/Learning Rate": 2.202797202797203e-05, "Pretrain/Loss": 2.4981329441070557, "Pretrain/Loss (Raw)": 2.288723945617676, "Pretrain/Step": 126, "Pretrain/Step Time": 8.413829608569069} +{"Pretrain/Learning Rate": 2.2202797202797203e-05, "Pretrain/Loss": 2.496293067932129, "Pretrain/Loss (Raw)": 2.264507532119751, "Pretrain/Step": 127, "Pretrain/Step Time": 8.411070960713184} +{"Pretrain/Learning Rate": 2.237762237762238e-05, "Pretrain/Loss": 2.4964847564697266, "Pretrain/Loss (Raw)": 2.520775079727173, "Pretrain/Step": 128, "Pretrain/Step Time": 8.412554528564215} +{"Pretrain/Learning Rate": 2.2552447552447553e-05, "Pretrain/Loss": 2.492036819458008, "Pretrain/Loss (Raw)": 2.305929660797119, "Pretrain/Step": 129, "Pretrain/Step Time": 8.381741281598806} +{"Pretrain/Learning Rate": 2.272727272727273e-05, "Pretrain/Loss": 2.487330675125122, "Pretrain/Loss (Raw)": 2.4357247352600098, "Pretrain/Step": 130, "Pretrain/Step Time": 8.400370324030519} +{"Pretrain/Learning Rate": 2.2902097902097902e-05, "Pretrain/Loss": 2.4740452766418457, "Pretrain/Loss (Raw)": 2.385507345199585, "Pretrain/Step": 131, "Pretrain/Step Time": 8.401836270466447} +{"Pretrain/Learning Rate": 2.307692307692308e-05, "Pretrain/Loss": 2.4639930725097656, "Pretrain/Loss (Raw)": 2.327786445617676, "Pretrain/Step": 132, "Pretrain/Step Time": 8.401551365852356} +{"Pretrain/Learning Rate": 2.3251748251748252e-05, "Pretrain/Loss": 2.4492900371551514, "Pretrain/Loss (Raw)": 2.483215093612671, "Pretrain/Step": 133, "Pretrain/Step Time": 8.410167120397091} +{"Pretrain/Learning Rate": 2.342657342657343e-05, "Pretrain/Loss": 2.4384143352508545, "Pretrain/Loss (Raw)": 2.509929895401001, "Pretrain/Step": 134, "Pretrain/Step Time": 8.414232093840837} +{"Pretrain/Learning Rate": 2.3601398601398602e-05, "Pretrain/Loss": 2.431112289428711, "Pretrain/Loss (Raw)": 2.5193259716033936, "Pretrain/Step": 135, "Pretrain/Step Time": 8.420932436361909} +{"Pretrain/Learning Rate": 2.377622377622378e-05, "Pretrain/Loss": 2.4259581565856934, "Pretrain/Loss (Raw)": 2.305889368057251, "Pretrain/Step": 136, "Pretrain/Step Time": 8.421467578038573} +{"Pretrain/Learning Rate": 2.3951048951048952e-05, "Pretrain/Loss": 2.419154644012451, "Pretrain/Loss (Raw)": 2.2333693504333496, "Pretrain/Step": 137, "Pretrain/Step Time": 8.421254511922598} +{"Pretrain/Learning Rate": 2.4125874125874125e-05, "Pretrain/Loss": 2.4109601974487305, "Pretrain/Loss (Raw)": 2.2710607051849365, "Pretrain/Step": 138, "Pretrain/Step Time": 8.431103188544512} +{"Pretrain/Learning Rate": 2.43006993006993e-05, "Pretrain/Loss": 2.402578353881836, "Pretrain/Loss (Raw)": 2.2893340587615967, "Pretrain/Step": 139, "Pretrain/Step Time": 8.428739434108138} +{"Pretrain/Learning Rate": 2.4475524475524478e-05, "Pretrain/Loss": 2.3906044960021973, "Pretrain/Loss (Raw)": 2.4821248054504395, "Pretrain/Step": 140, "Pretrain/Step Time": 8.428353844210505} +{"Pretrain/Learning Rate": 2.465034965034965e-05, "Pretrain/Loss": 2.3863508701324463, "Pretrain/Loss (Raw)": 2.373619318008423, "Pretrain/Step": 141, "Pretrain/Step Time": 8.430073276162148} +{"Pretrain/Learning Rate": 2.4825174825174828e-05, "Pretrain/Loss": 2.375192165374756, "Pretrain/Loss (Raw)": 1.8923733234405518, "Pretrain/Step": 142, "Pretrain/Step Time": 8.431812612339854} +{"Pretrain/Learning Rate": 2.5e-05, "Pretrain/Loss": 2.3671507835388184, "Pretrain/Loss (Raw)": 2.197117328643799, "Pretrain/Step": 143, "Pretrain/Step Time": 8.43251653201878} +{"Pretrain/Learning Rate": 2.5174825174825178e-05, "Pretrain/Loss": 2.361621856689453, "Pretrain/Loss (Raw)": 2.2273762226104736, "Pretrain/Step": 144, "Pretrain/Step Time": 8.430614488199353} +{"Pretrain/Learning Rate": 2.534965034965035e-05, "Pretrain/Loss": 2.3559226989746094, "Pretrain/Loss (Raw)": 2.193927764892578, "Pretrain/Step": 145, "Pretrain/Step Time": 8.419528793543577} +{"Pretrain/Learning Rate": 2.5524475524475528e-05, "Pretrain/Loss": 2.3511500358581543, "Pretrain/Loss (Raw)": 1.895451307296753, "Pretrain/Step": 146, "Pretrain/Step Time": 8.421221965923905} +{"Pretrain/Learning Rate": 2.5699300699300697e-05, "Pretrain/Loss": 2.34898042678833, "Pretrain/Loss (Raw)": 2.3321008682250977, "Pretrain/Step": 147, "Pretrain/Step Time": 8.42227766290307} +{"Pretrain/Learning Rate": 2.5874125874125877e-05, "Pretrain/Loss": 2.342280149459839, "Pretrain/Loss (Raw)": 2.0160043239593506, "Pretrain/Step": 148, "Pretrain/Step Time": 8.432599235326052} +{"Pretrain/Learning Rate": 2.6048951048951047e-05, "Pretrain/Loss": 2.339963436126709, "Pretrain/Loss (Raw)": 2.41552996635437, "Pretrain/Step": 149, "Pretrain/Step Time": 8.432980664074421} +{"Pretrain/Learning Rate": 2.6223776223776224e-05, "Pretrain/Loss": 2.3343544006347656, "Pretrain/Loss (Raw)": 2.1879336833953857, "Pretrain/Step": 150, "Pretrain/Step Time": 8.439595511183143} +{"Pretrain/Learning Rate": 2.6398601398601404e-05, "Pretrain/Loss": 2.328248977661133, "Pretrain/Loss (Raw)": 2.148289918899536, "Pretrain/Step": 151, "Pretrain/Step Time": 8.441729994490743} +{"Pretrain/Learning Rate": 2.6573426573426574e-05, "Pretrain/Loss": 2.3281731605529785, "Pretrain/Loss (Raw)": 2.346637487411499, "Pretrain/Step": 152, "Pretrain/Step Time": 8.44597421772778} +{"Pretrain/Learning Rate": 2.674825174825175e-05, "Pretrain/Loss": 2.324988842010498, "Pretrain/Loss (Raw)": 2.352694511413574, "Pretrain/Step": 153, "Pretrain/Step Time": 8.445690631866455} +{"Pretrain/Learning Rate": 2.6923076923076923e-05, "Pretrain/Loss": 2.3265156745910645, "Pretrain/Loss (Raw)": 2.439927339553833, "Pretrain/Step": 154, "Pretrain/Step Time": 8.453783741220832} +{"Pretrain/Learning Rate": 2.70979020979021e-05, "Pretrain/Loss": 2.3215088844299316, "Pretrain/Loss (Raw)": 2.1781632900238037, "Pretrain/Step": 155, "Pretrain/Step Time": 8.46333252824843} +{"Pretrain/Learning Rate": 2.7272727272727273e-05, "Pretrain/Loss": 2.3212356567382812, "Pretrain/Loss (Raw)": 2.2781131267547607, "Pretrain/Step": 156, "Pretrain/Step Time": 8.46464404463768} +{"Pretrain/Learning Rate": 2.744755244755245e-05, "Pretrain/Loss": 2.3188066482543945, "Pretrain/Loss (Raw)": 2.0998826026916504, "Pretrain/Step": 157, "Pretrain/Step Time": 8.464798966422677} +{"Pretrain/Learning Rate": 2.762237762237762e-05, "Pretrain/Loss": 2.3191702365875244, "Pretrain/Loss (Raw)": 2.2629897594451904, "Pretrain/Step": 158, "Pretrain/Step Time": 8.465565467253327} +{"Pretrain/Learning Rate": 2.77972027972028e-05, "Pretrain/Loss": 2.317267656326294, "Pretrain/Loss (Raw)": 2.1093571186065674, "Pretrain/Step": 159, "Pretrain/Step Time": 8.464971596375108} +{"Pretrain/Learning Rate": 2.7972027972027976e-05, "Pretrain/Loss": 2.313209056854248, "Pretrain/Loss (Raw)": 1.9142556190490723, "Pretrain/Step": 160, "Pretrain/Step Time": 8.476837513968349} +{"Pretrain/Learning Rate": 2.8146853146853146e-05, "Pretrain/Loss": 2.312074899673462, "Pretrain/Loss (Raw)": 2.2449772357940674, "Pretrain/Step": 161, "Pretrain/Step Time": 8.475420147180557} +{"Pretrain/Learning Rate": 2.8321678321678326e-05, "Pretrain/Loss": 2.306380033493042, "Pretrain/Loss (Raw)": 1.992032527923584, "Pretrain/Step": 162, "Pretrain/Step Time": 8.473532682284713} +{"Pretrain/Learning Rate": 2.8496503496503496e-05, "Pretrain/Loss": 2.307614803314209, "Pretrain/Loss (Raw)": 2.3909246921539307, "Pretrain/Step": 163, "Pretrain/Step Time": 8.47515395283699} +{"Pretrain/Learning Rate": 2.8671328671328672e-05, "Pretrain/Loss": 2.303835868835449, "Pretrain/Loss (Raw)": 2.270862340927124, "Pretrain/Step": 164, "Pretrain/Step Time": 8.475426750257611} +{"Pretrain/Learning Rate": 2.8846153846153845e-05, "Pretrain/Loss": 2.304980993270874, "Pretrain/Loss (Raw)": 2.2977139949798584, "Pretrain/Step": 165, "Pretrain/Step Time": 8.467193583026528} +{"Pretrain/Learning Rate": 2.9020979020979022e-05, "Pretrain/Loss": 2.30128812789917, "Pretrain/Loss (Raw)": 2.2643916606903076, "Pretrain/Step": 166, "Pretrain/Step Time": 8.48266677558422} +{"Pretrain/Learning Rate": 2.91958041958042e-05, "Pretrain/Loss": 2.3007264137268066, "Pretrain/Loss (Raw)": 2.079709529876709, "Pretrain/Step": 167, "Pretrain/Step Time": 8.485150368884206} +{"Pretrain/Learning Rate": 2.9370629370629372e-05, "Pretrain/Loss": 2.3029112815856934, "Pretrain/Loss (Raw)": 2.4105992317199707, "Pretrain/Step": 168, "Pretrain/Step Time": 8.486380012705922} +{"Pretrain/Learning Rate": 2.954545454545455e-05, "Pretrain/Loss": 2.3016741275787354, "Pretrain/Loss (Raw)": 2.330735445022583, "Pretrain/Step": 169, "Pretrain/Step Time": 8.491383949294686} +{"Pretrain/Learning Rate": 2.972027972027972e-05, "Pretrain/Loss": 2.297555923461914, "Pretrain/Loss (Raw)": 2.125697135925293, "Pretrain/Step": 170, "Pretrain/Step Time": 8.493447368964553} +{"Pretrain/Learning Rate": 2.9895104895104898e-05, "Pretrain/Loss": 2.29716420173645, "Pretrain/Loss (Raw)": 2.279475212097168, "Pretrain/Step": 171, "Pretrain/Step Time": 8.494901597499847} +{"Pretrain/Learning Rate": 3.0069930069930068e-05, "Pretrain/Loss": 2.2975540161132812, "Pretrain/Loss (Raw)": 2.273315668106079, "Pretrain/Step": 172, "Pretrain/Step Time": 8.49110198020935} +{"Pretrain/Learning Rate": 3.0244755244755245e-05, "Pretrain/Loss": 2.2965633869171143, "Pretrain/Loss (Raw)": 2.1212575435638428, "Pretrain/Step": 173, "Pretrain/Step Time": 8.5051507987082} +{"Pretrain/Learning Rate": 3.0419580419580425e-05, "Pretrain/Loss": 2.2980611324310303, "Pretrain/Loss (Raw)": 2.453132152557373, "Pretrain/Step": 174, "Pretrain/Step Time": 8.50441981293261} +{"Pretrain/Learning Rate": 3.0594405594405594e-05, "Pretrain/Loss": 2.2966670989990234, "Pretrain/Loss (Raw)": 2.4113569259643555, "Pretrain/Step": 175, "Pretrain/Step Time": 8.504154635593295} +{"Pretrain/Learning Rate": 3.0769230769230774e-05, "Pretrain/Loss": 2.29567813873291, "Pretrain/Loss (Raw)": 2.307100296020508, "Pretrain/Step": 176, "Pretrain/Step Time": 8.504850469529629} +{"Pretrain/Learning Rate": 3.094405594405594e-05, "Pretrain/Loss": 2.296130895614624, "Pretrain/Loss (Raw)": 2.4381208419799805, "Pretrain/Step": 177, "Pretrain/Step Time": 8.504536433145404} +{"Pretrain/Learning Rate": 3.111888111888112e-05, "Pretrain/Loss": 2.293525218963623, "Pretrain/Loss (Raw)": 2.1246771812438965, "Pretrain/Step": 178, "Pretrain/Step Time": 8.515034914016724} +{"Pretrain/Learning Rate": 3.1293706293706294e-05, "Pretrain/Loss": 2.293426036834717, "Pretrain/Loss (Raw)": 2.224728584289551, "Pretrain/Step": 179, "Pretrain/Step Time": 8.515455896034837} +{"Pretrain/Learning Rate": 3.146853146853147e-05, "Pretrain/Loss": 2.2960312366485596, "Pretrain/Loss (Raw)": 2.377654552459717, "Pretrain/Step": 180, "Pretrain/Step Time": 8.520031303167343} +{"Pretrain/Learning Rate": 3.164335664335665e-05, "Pretrain/Loss": 2.292383909225464, "Pretrain/Loss (Raw)": 1.9508330821990967, "Pretrain/Step": 181, "Pretrain/Step Time": 8.514181084930897} +{"Pretrain/Learning Rate": 3.181818181818182e-05, "Pretrain/Loss": 2.293520212173462, "Pretrain/Loss (Raw)": 2.25467848777771, "Pretrain/Step": 182, "Pretrain/Step Time": 8.51618048734963} +{"Pretrain/Learning Rate": 3.1993006993006994e-05, "Pretrain/Loss": 2.2915210723876953, "Pretrain/Loss (Raw)": 2.0748677253723145, "Pretrain/Step": 183, "Pretrain/Step Time": 8.508079811930656} +{"Pretrain/Learning Rate": 3.216783216783217e-05, "Pretrain/Loss": 2.290057420730591, "Pretrain/Loss (Raw)": 2.2829744815826416, "Pretrain/Step": 184, "Pretrain/Step Time": 8.514357915148139} +{"Pretrain/Learning Rate": 3.234265734265735e-05, "Pretrain/Loss": 2.290118932723999, "Pretrain/Loss (Raw)": 2.1246042251586914, "Pretrain/Step": 185, "Pretrain/Step Time": 8.527208721265197} +{"Pretrain/Learning Rate": 3.251748251748252e-05, "Pretrain/Loss": 2.2909512519836426, "Pretrain/Loss (Raw)": 2.504605293273926, "Pretrain/Step": 186, "Pretrain/Step Time": 8.534195274114609} +{"Pretrain/Learning Rate": 3.269230769230769e-05, "Pretrain/Loss": 2.285538911819458, "Pretrain/Loss (Raw)": 2.1244277954101562, "Pretrain/Step": 187, "Pretrain/Step Time": 8.533054476603866} +{"Pretrain/Learning Rate": 3.2867132867132866e-05, "Pretrain/Loss": 2.283836841583252, "Pretrain/Loss (Raw)": 2.0293099880218506, "Pretrain/Step": 188, "Pretrain/Step Time": 8.53533411026001} +{"Pretrain/Learning Rate": 3.3041958041958046e-05, "Pretrain/Loss": 2.2805628776550293, "Pretrain/Loss (Raw)": 2.071988344192505, "Pretrain/Step": 189, "Pretrain/Step Time": 8.536856681108475} +{"Pretrain/Learning Rate": 3.321678321678322e-05, "Pretrain/Loss": 2.2803163528442383, "Pretrain/Loss (Raw)": 2.3163609504699707, "Pretrain/Step": 190, "Pretrain/Step Time": 8.544000374153256} +{"Pretrain/Learning Rate": 3.339160839160839e-05, "Pretrain/Loss": 2.2794408798217773, "Pretrain/Loss (Raw)": 2.0985701084136963, "Pretrain/Step": 191, "Pretrain/Step Time": 8.549707811325788} +{"Pretrain/Learning Rate": 3.356643356643357e-05, "Pretrain/Loss": 2.2808635234832764, "Pretrain/Loss (Raw)": 2.2470662593841553, "Pretrain/Step": 192, "Pretrain/Step Time": 8.558862058445811} +{"Pretrain/Learning Rate": 3.374125874125874e-05, "Pretrain/Loss": 2.278440237045288, "Pretrain/Loss (Raw)": 2.307424306869507, "Pretrain/Step": 193, "Pretrain/Step Time": 8.561765672639012} +{"Pretrain/Learning Rate": 3.391608391608392e-05, "Pretrain/Loss": 2.27944016456604, "Pretrain/Loss (Raw)": 2.5330450534820557, "Pretrain/Step": 194, "Pretrain/Step Time": 8.56517574377358} +{"Pretrain/Learning Rate": 3.409090909090909e-05, "Pretrain/Loss": 2.279768943786621, "Pretrain/Loss (Raw)": 2.3174822330474854, "Pretrain/Step": 195, "Pretrain/Step Time": 8.56767993234098} +{"Pretrain/Learning Rate": 3.4265734265734265e-05, "Pretrain/Loss": 2.2786636352539062, "Pretrain/Loss (Raw)": 2.191366195678711, "Pretrain/Step": 196, "Pretrain/Step Time": 8.567567057907581} +{"Pretrain/Learning Rate": 3.4440559440559445e-05, "Pretrain/Loss": 2.2760815620422363, "Pretrain/Loss (Raw)": 2.1221890449523926, "Pretrain/Step": 197, "Pretrain/Step Time": 8.573151810094714} +{"Pretrain/Learning Rate": 3.461538461538462e-05, "Pretrain/Loss": 2.2759947776794434, "Pretrain/Loss (Raw)": 2.1733858585357666, "Pretrain/Step": 198, "Pretrain/Step Time": 8.577472103759646} +{"Pretrain/Learning Rate": 3.479020979020979e-05, "Pretrain/Loss": 2.27424955368042, "Pretrain/Loss (Raw)": 2.1796133518218994, "Pretrain/Step": 199, "Pretrain/Step Time": 8.576240584254265} +{"Pretrain/Learning Rate": 3.4965034965034965e-05, "Pretrain/Loss": 2.274782180786133, "Pretrain/Loss (Raw)": 2.336786985397339, "Pretrain/Step": 200, "Pretrain/Step Time": 8.57833387516439} +{"Pretrain/Learning Rate": 3.5139860139860145e-05, "Pretrain/Loss": 2.275719404220581, "Pretrain/Loss (Raw)": 2.1994099617004395, "Pretrain/Step": 201, "Pretrain/Step Time": 8.572940392419696} +{"Pretrain/Learning Rate": 3.531468531468531e-05, "Pretrain/Loss": 2.273247241973877, "Pretrain/Loss (Raw)": 2.1107840538024902, "Pretrain/Step": 202, "Pretrain/Step Time": 8.53332339413464} +{"Pretrain/Learning Rate": 3.548951048951049e-05, "Pretrain/Loss": 2.2732598781585693, "Pretrain/Loss (Raw)": 2.185131311416626, "Pretrain/Step": 203, "Pretrain/Step Time": 8.531424779444933} +{"Pretrain/Learning Rate": 3.566433566433567e-05, "Pretrain/Loss": 2.2723608016967773, "Pretrain/Loss (Raw)": 2.299997329711914, "Pretrain/Step": 204, "Pretrain/Step Time": 8.537597944959998} +{"Pretrain/Learning Rate": 3.583916083916084e-05, "Pretrain/Loss": 2.2713871002197266, "Pretrain/Loss (Raw)": 2.1378722190856934, "Pretrain/Step": 205, "Pretrain/Step Time": 8.543589431792498} +{"Pretrain/Learning Rate": 3.601398601398602e-05, "Pretrain/Loss": 2.2702949047088623, "Pretrain/Loss (Raw)": 2.2589070796966553, "Pretrain/Step": 206, "Pretrain/Step Time": 8.537757439538836} +{"Pretrain/Learning Rate": 3.618881118881119e-05, "Pretrain/Loss": 2.268500566482544, "Pretrain/Loss (Raw)": 2.0658681392669678, "Pretrain/Step": 207, "Pretrain/Step Time": 8.538732873275876} +{"Pretrain/Learning Rate": 3.6363636363636364e-05, "Pretrain/Loss": 2.2615272998809814, "Pretrain/Loss (Raw)": 2.1409332752227783, "Pretrain/Step": 208, "Pretrain/Step Time": 8.538024488836527} +{"Pretrain/Learning Rate": 3.653846153846154e-05, "Pretrain/Loss": 2.2597341537475586, "Pretrain/Loss (Raw)": 2.257244348526001, "Pretrain/Step": 209, "Pretrain/Step Time": 8.548327395692468} +{"Pretrain/Learning Rate": 3.671328671328672e-05, "Pretrain/Loss": 2.2618532180786133, "Pretrain/Loss (Raw)": 2.2467947006225586, "Pretrain/Step": 210, "Pretrain/Step Time": 8.545601956546307} +{"Pretrain/Learning Rate": 3.688811188811189e-05, "Pretrain/Loss": 2.2608394622802734, "Pretrain/Loss (Raw)": 2.0779097080230713, "Pretrain/Step": 211, "Pretrain/Step Time": 8.548078201711178} +{"Pretrain/Learning Rate": 3.7062937062937064e-05, "Pretrain/Loss": 2.2562835216522217, "Pretrain/Loss (Raw)": 1.8228685855865479, "Pretrain/Step": 212, "Pretrain/Step Time": 8.550512189045548} +{"Pretrain/Learning Rate": 3.7237762237762244e-05, "Pretrain/Loss": 2.2579565048217773, "Pretrain/Loss (Raw)": 2.5341672897338867, "Pretrain/Step": 213, "Pretrain/Step Time": 8.549291610717773} +{"Pretrain/Learning Rate": 3.741258741258741e-05, "Pretrain/Loss": 2.257683753967285, "Pretrain/Loss (Raw)": 2.1012375354766846, "Pretrain/Step": 214, "Pretrain/Step Time": 8.550894249230623} +{"Pretrain/Learning Rate": 3.758741258741259e-05, "Pretrain/Loss": 2.257966995239258, "Pretrain/Loss (Raw)": 2.3196935653686523, "Pretrain/Step": 215, "Pretrain/Step Time": 8.550641678273678} +{"Pretrain/Learning Rate": 3.776223776223776e-05, "Pretrain/Loss": 2.259049654006958, "Pretrain/Loss (Raw)": 2.334731101989746, "Pretrain/Step": 216, "Pretrain/Step Time": 8.542855625972152} +{"Pretrain/Learning Rate": 3.7937062937062936e-05, "Pretrain/Loss": 2.2609658241271973, "Pretrain/Loss (Raw)": 2.428332805633545, "Pretrain/Step": 217, "Pretrain/Step Time": 8.543187053874135} +{"Pretrain/Learning Rate": 3.811188811188811e-05, "Pretrain/Loss": 2.263340473175049, "Pretrain/Loss (Raw)": 2.403498888015747, "Pretrain/Step": 218, "Pretrain/Step Time": 8.544059814885259} +{"Pretrain/Learning Rate": 3.828671328671329e-05, "Pretrain/Loss": 2.2643697261810303, "Pretrain/Loss (Raw)": 2.3161418437957764, "Pretrain/Step": 219, "Pretrain/Step Time": 8.539791278541088} +{"Pretrain/Learning Rate": 3.846153846153846e-05, "Pretrain/Loss": 2.265031337738037, "Pretrain/Loss (Raw)": 2.2356343269348145, "Pretrain/Step": 220, "Pretrain/Step Time": 8.538095140829682} +{"Pretrain/Learning Rate": 3.8636363636363636e-05, "Pretrain/Loss": 2.263819694519043, "Pretrain/Loss (Raw)": 2.210885524749756, "Pretrain/Step": 221, "Pretrain/Step Time": 8.53692626208067} +{"Pretrain/Learning Rate": 3.8811188811188816e-05, "Pretrain/Loss": 2.2629313468933105, "Pretrain/Loss (Raw)": 2.160012722015381, "Pretrain/Step": 222, "Pretrain/Step Time": 8.534507060423493} +{"Pretrain/Learning Rate": 3.898601398601399e-05, "Pretrain/Loss": 2.263575315475464, "Pretrain/Loss (Raw)": 2.096834421157837, "Pretrain/Step": 223, "Pretrain/Step Time": 8.53983067162335} +{"Pretrain/Learning Rate": 3.916083916083916e-05, "Pretrain/Loss": 2.2625679969787598, "Pretrain/Loss (Raw)": 2.2331008911132812, "Pretrain/Step": 224, "Pretrain/Step Time": 8.54301555454731} +{"Pretrain/Learning Rate": 3.9335664335664336e-05, "Pretrain/Loss": 2.2647640705108643, "Pretrain/Loss (Raw)": 2.5185489654541016, "Pretrain/Step": 225, "Pretrain/Step Time": 8.525471979752183} +{"Pretrain/Learning Rate": 3.9510489510489516e-05, "Pretrain/Loss": 2.261539936065674, "Pretrain/Loss (Raw)": 2.0250415802001953, "Pretrain/Step": 226, "Pretrain/Step Time": 8.528700098395348} +{"Pretrain/Learning Rate": 3.968531468531469e-05, "Pretrain/Loss": 2.260039806365967, "Pretrain/Loss (Raw)": 2.129978656768799, "Pretrain/Step": 227, "Pretrain/Step Time": 8.533298663794994} +{"Pretrain/Learning Rate": 3.986013986013986e-05, "Pretrain/Loss": 2.2587337493896484, "Pretrain/Loss (Raw)": 2.1300301551818848, "Pretrain/Step": 228, "Pretrain/Step Time": 8.536443810909986} +{"Pretrain/Learning Rate": 4.0034965034965035e-05, "Pretrain/Loss": 2.257650852203369, "Pretrain/Loss (Raw)": 2.124823808670044, "Pretrain/Step": 229, "Pretrain/Step Time": 8.522286722436547} +{"Pretrain/Learning Rate": 4.020979020979021e-05, "Pretrain/Loss": 2.2516398429870605, "Pretrain/Loss (Raw)": 1.8278961181640625, "Pretrain/Step": 230, "Pretrain/Step Time": 8.52200029976666} +{"Pretrain/Learning Rate": 4.038461538461539e-05, "Pretrain/Loss": 2.2497174739837646, "Pretrain/Loss (Raw)": 2.376225233078003, "Pretrain/Step": 231, "Pretrain/Step Time": 8.526700485497713} +{"Pretrain/Learning Rate": 4.055944055944056e-05, "Pretrain/Loss": 2.2486438751220703, "Pretrain/Loss (Raw)": 2.0639448165893555, "Pretrain/Step": 232, "Pretrain/Step Time": 8.534330397844315} +{"Pretrain/Learning Rate": 4.0734265734265735e-05, "Pretrain/Loss": 2.249490737915039, "Pretrain/Loss (Raw)": 2.249351739883423, "Pretrain/Step": 233, "Pretrain/Step Time": 8.526990042999387} +{"Pretrain/Learning Rate": 4.0909090909090915e-05, "Pretrain/Loss": 2.247775077819824, "Pretrain/Loss (Raw)": 2.069835662841797, "Pretrain/Step": 234, "Pretrain/Step Time": 8.527087613940239} +{"Pretrain/Learning Rate": 4.108391608391609e-05, "Pretrain/Loss": 2.244424343109131, "Pretrain/Loss (Raw)": 2.1135165691375732, "Pretrain/Step": 235, "Pretrain/Step Time": 8.528192279860377} +{"Pretrain/Learning Rate": 4.125874125874126e-05, "Pretrain/Loss": 2.2441511154174805, "Pretrain/Loss (Raw)": 2.122466802597046, "Pretrain/Step": 236, "Pretrain/Step Time": 8.534846600145102} +{"Pretrain/Learning Rate": 4.1433566433566434e-05, "Pretrain/Loss": 2.2442102432250977, "Pretrain/Loss (Raw)": 2.3725337982177734, "Pretrain/Step": 237, "Pretrain/Step Time": 8.534499196335673} +{"Pretrain/Learning Rate": 4.1608391608391614e-05, "Pretrain/Loss": 2.244046688079834, "Pretrain/Loss (Raw)": 2.2148525714874268, "Pretrain/Step": 238, "Pretrain/Step Time": 8.53599439561367} +{"Pretrain/Learning Rate": 4.178321678321678e-05, "Pretrain/Loss": 2.242213249206543, "Pretrain/Loss (Raw)": 2.053377628326416, "Pretrain/Step": 239, "Pretrain/Step Time": 8.530968587845564} +{"Pretrain/Learning Rate": 4.195804195804196e-05, "Pretrain/Loss": 2.241461992263794, "Pretrain/Loss (Raw)": 2.323214530944824, "Pretrain/Step": 240, "Pretrain/Step Time": 8.52428911998868} +{"Pretrain/Learning Rate": 4.213286713286714e-05, "Pretrain/Loss": 2.2411458492279053, "Pretrain/Loss (Raw)": 2.1311581134796143, "Pretrain/Step": 241, "Pretrain/Step Time": 8.524774020537734} +{"Pretrain/Learning Rate": 4.230769230769231e-05, "Pretrain/Loss": 2.2394330501556396, "Pretrain/Loss (Raw)": 2.1306655406951904, "Pretrain/Step": 242, "Pretrain/Step Time": 8.523789277300239} +{"Pretrain/Learning Rate": 4.248251748251749e-05, "Pretrain/Loss": 2.238809823989868, "Pretrain/Loss (Raw)": 2.134343385696411, "Pretrain/Step": 243, "Pretrain/Step Time": 8.52448259294033} +{"Pretrain/Learning Rate": 4.265734265734266e-05, "Pretrain/Loss": 2.2358434200286865, "Pretrain/Loss (Raw)": 2.2791686058044434, "Pretrain/Step": 244, "Pretrain/Step Time": 8.516385607421398} +{"Pretrain/Learning Rate": 4.2832167832167833e-05, "Pretrain/Loss": 2.230746269226074, "Pretrain/Loss (Raw)": 2.152853488922119, "Pretrain/Step": 245, "Pretrain/Step Time": 8.513027114793658} +{"Pretrain/Learning Rate": 4.300699300699301e-05, "Pretrain/Loss": 2.227736473083496, "Pretrain/Loss (Raw)": 2.27725887298584, "Pretrain/Step": 246, "Pretrain/Step Time": 8.522129852324724} +{"Pretrain/Learning Rate": 4.318181818181819e-05, "Pretrain/Loss": 2.229646682739258, "Pretrain/Loss (Raw)": 2.3387646675109863, "Pretrain/Step": 247, "Pretrain/Step Time": 8.519371941685677} +{"Pretrain/Learning Rate": 4.335664335664335e-05, "Pretrain/Loss": 2.230745792388916, "Pretrain/Loss (Raw)": 2.4454550743103027, "Pretrain/Step": 248, "Pretrain/Step Time": 8.509510627016425} +{"Pretrain/Learning Rate": 4.353146853146853e-05, "Pretrain/Loss": 2.2313122749328613, "Pretrain/Loss (Raw)": 2.183842182159424, "Pretrain/Step": 249, "Pretrain/Step Time": 8.518675377592444} +{"Pretrain/Learning Rate": 4.370629370629371e-05, "Pretrain/Loss": 2.2362780570983887, "Pretrain/Loss (Raw)": 2.734666585922241, "Pretrain/Step": 250, "Pretrain/Step Time": 8.520887920632958} +{"Pretrain/Learning Rate": 4.388111888111888e-05, "Pretrain/Loss": 2.239297866821289, "Pretrain/Loss (Raw)": 2.384031295776367, "Pretrain/Step": 251, "Pretrain/Step Time": 8.521580940112472} +{"Pretrain/Learning Rate": 4.405594405594406e-05, "Pretrain/Loss": 2.239954948425293, "Pretrain/Loss (Raw)": 2.2383620738983154, "Pretrain/Step": 252, "Pretrain/Step Time": 8.522713908925653} +{"Pretrain/Learning Rate": 4.423076923076923e-05, "Pretrain/Loss": 2.2406725883483887, "Pretrain/Loss (Raw)": 2.33689546585083, "Pretrain/Step": 253, "Pretrain/Step Time": 8.520536102354527} +{"Pretrain/Learning Rate": 4.4405594405594406e-05, "Pretrain/Loss": 2.241328239440918, "Pretrain/Loss (Raw)": 2.372619390487671, "Pretrain/Step": 254, "Pretrain/Step Time": 8.515554206445813} +{"Pretrain/Learning Rate": 4.458041958041958e-05, "Pretrain/Loss": 2.2410531044006348, "Pretrain/Loss (Raw)": 2.229344129562378, "Pretrain/Step": 255, "Pretrain/Step Time": 8.51662116497755} +{"Pretrain/Learning Rate": 4.475524475524476e-05, "Pretrain/Loss": 2.236703634262085, "Pretrain/Loss (Raw)": 1.9640319347381592, "Pretrain/Step": 256, "Pretrain/Step Time": 8.525511760264635} +{"Pretrain/Learning Rate": 4.493006993006993e-05, "Pretrain/Loss": 2.236633777618408, "Pretrain/Loss (Raw)": 2.296992301940918, "Pretrain/Step": 257, "Pretrain/Step Time": 8.520820019766688} +{"Pretrain/Learning Rate": 4.5104895104895105e-05, "Pretrain/Loss": 2.235137939453125, "Pretrain/Loss (Raw)": 2.2442233562469482, "Pretrain/Step": 258, "Pretrain/Step Time": 8.502062229439616} +{"Pretrain/Learning Rate": 4.5279720279720285e-05, "Pretrain/Loss": 2.2388663291931152, "Pretrain/Loss (Raw)": 2.8627724647521973, "Pretrain/Step": 259, "Pretrain/Step Time": 8.504323413595557} +{"Pretrain/Learning Rate": 4.545454545454546e-05, "Pretrain/Loss": 2.2377123832702637, "Pretrain/Loss (Raw)": 2.180091381072998, "Pretrain/Step": 260, "Pretrain/Step Time": 8.506159896031022} +{"Pretrain/Learning Rate": 4.562937062937063e-05, "Pretrain/Loss": 2.2356743812561035, "Pretrain/Loss (Raw)": 2.222316265106201, "Pretrain/Step": 261, "Pretrain/Step Time": 8.496226727962494} +{"Pretrain/Learning Rate": 4.5804195804195805e-05, "Pretrain/Loss": 2.2318689823150635, "Pretrain/Loss (Raw)": 2.0228378772735596, "Pretrain/Step": 262, "Pretrain/Step Time": 8.504818681627512} +{"Pretrain/Learning Rate": 4.597902097902098e-05, "Pretrain/Loss": 2.2307443618774414, "Pretrain/Loss (Raw)": 2.3753745555877686, "Pretrain/Step": 263, "Pretrain/Step Time": 8.499307135120034} +{"Pretrain/Learning Rate": 4.615384615384616e-05, "Pretrain/Loss": 2.2304468154907227, "Pretrain/Loss (Raw)": 2.267829179763794, "Pretrain/Step": 264, "Pretrain/Step Time": 8.499853217974305} +{"Pretrain/Learning Rate": 4.632867132867133e-05, "Pretrain/Loss": 2.231328010559082, "Pretrain/Loss (Raw)": 2.3461363315582275, "Pretrain/Step": 265, "Pretrain/Step Time": 8.501476226374507} +{"Pretrain/Learning Rate": 4.6503496503496505e-05, "Pretrain/Loss": 2.2333486080169678, "Pretrain/Loss (Raw)": 2.5296990871429443, "Pretrain/Step": 266, "Pretrain/Step Time": 8.494988773018122} +{"Pretrain/Learning Rate": 4.667832167832168e-05, "Pretrain/Loss": 2.231208324432373, "Pretrain/Loss (Raw)": 2.0153958797454834, "Pretrain/Step": 267, "Pretrain/Step Time": 8.496274564415216} +{"Pretrain/Learning Rate": 4.685314685314686e-05, "Pretrain/Loss": 2.2299842834472656, "Pretrain/Loss (Raw)": 2.325410842895508, "Pretrain/Step": 268, "Pretrain/Step Time": 8.499972043558955} +{"Pretrain/Learning Rate": 4.702797202797203e-05, "Pretrain/Loss": 2.2270827293395996, "Pretrain/Loss (Raw)": 2.0022706985473633, "Pretrain/Step": 269, "Pretrain/Step Time": 8.4999197460711} +{"Pretrain/Learning Rate": 4.7202797202797204e-05, "Pretrain/Loss": 2.228968620300293, "Pretrain/Loss (Raw)": 2.1337220668792725, "Pretrain/Step": 270, "Pretrain/Step Time": 8.50369019061327} +{"Pretrain/Learning Rate": 4.7377622377622384e-05, "Pretrain/Loss": 2.230743408203125, "Pretrain/Loss (Raw)": 2.4243123531341553, "Pretrain/Step": 271, "Pretrain/Step Time": 8.501289770007133} +{"Pretrain/Learning Rate": 4.755244755244756e-05, "Pretrain/Loss": 2.232253074645996, "Pretrain/Loss (Raw)": 2.4206109046936035, "Pretrain/Step": 272, "Pretrain/Step Time": 8.502022529020905} +{"Pretrain/Learning Rate": 4.772727272727273e-05, "Pretrain/Loss": 2.231991767883301, "Pretrain/Loss (Raw)": 2.1604971885681152, "Pretrain/Step": 273, "Pretrain/Step Time": 8.508008955046535} +{"Pretrain/Learning Rate": 4.7902097902097904e-05, "Pretrain/Loss": 2.2352347373962402, "Pretrain/Loss (Raw)": 2.310519218444824, "Pretrain/Step": 274, "Pretrain/Step Time": 8.510546082630754} +{"Pretrain/Learning Rate": 4.8076923076923084e-05, "Pretrain/Loss": 2.233349323272705, "Pretrain/Loss (Raw)": 2.090789794921875, "Pretrain/Step": 275, "Pretrain/Step Time": 8.50841816328466} +{"Pretrain/Learning Rate": 4.825174825174825e-05, "Pretrain/Loss": 2.236074924468994, "Pretrain/Loss (Raw)": 2.3648483753204346, "Pretrain/Step": 276, "Pretrain/Step Time": 8.500918230041862} +{"Pretrain/Learning Rate": 4.842657342657343e-05, "Pretrain/Loss": 2.234558582305908, "Pretrain/Loss (Raw)": 2.2214603424072266, "Pretrain/Step": 277, "Pretrain/Step Time": 8.500384898856282} +{"Pretrain/Learning Rate": 4.86013986013986e-05, "Pretrain/Loss": 2.234992504119873, "Pretrain/Loss (Raw)": 2.2434873580932617, "Pretrain/Step": 278, "Pretrain/Step Time": 8.496662087738514} +{"Pretrain/Learning Rate": 4.8776223776223776e-05, "Pretrain/Loss": 2.234066963195801, "Pretrain/Loss (Raw)": 2.029846429824829, "Pretrain/Step": 279, "Pretrain/Step Time": 8.50108139961958} +{"Pretrain/Learning Rate": 4.8951048951048956e-05, "Pretrain/Loss": 2.232913017272949, "Pretrain/Loss (Raw)": 2.1989216804504395, "Pretrain/Step": 280, "Pretrain/Step Time": 8.508386462926865} +{"Pretrain/Learning Rate": 4.912587412587413e-05, "Pretrain/Loss": 2.2327651977539062, "Pretrain/Loss (Raw)": 2.333752155303955, "Pretrain/Step": 281, "Pretrain/Step Time": 8.518818262964487} +{"Pretrain/Learning Rate": 4.93006993006993e-05, "Pretrain/Loss": 2.2304883003234863, "Pretrain/Loss (Raw)": 2.14850115776062, "Pretrain/Step": 282, "Pretrain/Step Time": 8.516837293282151} +{"Pretrain/Learning Rate": 4.9475524475524476e-05, "Pretrain/Loss": 2.2311151027679443, "Pretrain/Loss (Raw)": 2.2583835124969482, "Pretrain/Step": 283, "Pretrain/Step Time": 8.51331221498549} +{"Pretrain/Learning Rate": 4.9650349650349656e-05, "Pretrain/Loss": 2.230978488922119, "Pretrain/Loss (Raw)": 2.260643243789673, "Pretrain/Step": 284, "Pretrain/Step Time": 8.514778282493353} +{"Pretrain/Learning Rate": 4.982517482517482e-05, "Pretrain/Loss": 2.232870578765869, "Pretrain/Loss (Raw)": 2.3420417308807373, "Pretrain/Step": 285, "Pretrain/Step Time": 8.514235066249967} +{"Pretrain/Learning Rate": 5e-05, "Pretrain/Loss": 2.2308249473571777, "Pretrain/Loss (Raw)": 2.0011751651763916, "Pretrain/Step": 286, "Pretrain/Step Time": 8.5172367002815} +{"Pretrain/Learning Rate": 4.9999998558441094e-05, "Pretrain/Loss": 2.232273817062378, "Pretrain/Loss (Raw)": 2.2947885990142822, "Pretrain/Step": 287, "Pretrain/Step Time": 8.525084421038628} +{"Pretrain/Learning Rate": 4.999999423376456e-05, "Pretrain/Loss": 2.235240936279297, "Pretrain/Loss (Raw)": 2.2940690517425537, "Pretrain/Step": 288, "Pretrain/Step Time": 8.518302150070667} +{"Pretrain/Learning Rate": 4.9999987025970884e-05, "Pretrain/Loss": 2.2382965087890625, "Pretrain/Loss (Raw)": 2.6360955238342285, "Pretrain/Step": 289, "Pretrain/Step Time": 8.522453159093857} +{"Pretrain/Learning Rate": 4.99999769350609e-05, "Pretrain/Loss": 2.2378244400024414, "Pretrain/Loss (Raw)": 1.9315779209136963, "Pretrain/Step": 290, "Pretrain/Step Time": 8.51753156259656} +{"Pretrain/Learning Rate": 4.999996396103577e-05, "Pretrain/Loss": 2.2355239391326904, "Pretrain/Loss (Raw)": 2.096473217010498, "Pretrain/Step": 291, "Pretrain/Step Time": 8.516043182462454} +{"Pretrain/Learning Rate": 4.999994810389699e-05, "Pretrain/Loss": 2.2344930171966553, "Pretrain/Loss (Raw)": 2.138883352279663, "Pretrain/Step": 292, "Pretrain/Step Time": 8.516525277867913} +{"Pretrain/Learning Rate": 4.999992936364639e-05, "Pretrain/Loss": 2.2355878353118896, "Pretrain/Loss (Raw)": 2.437866449356079, "Pretrain/Step": 293, "Pretrain/Step Time": 8.530577706173062} +{"Pretrain/Learning Rate": 4.9999907740286136e-05, "Pretrain/Loss": 2.233956813812256, "Pretrain/Loss (Raw)": 2.055640935897827, "Pretrain/Step": 294, "Pretrain/Step Time": 8.518194211646914} +{"Pretrain/Learning Rate": 4.9999883233818724e-05, "Pretrain/Loss": 2.233388662338257, "Pretrain/Loss (Raw)": 2.0069849491119385, "Pretrain/Step": 295, "Pretrain/Step Time": 8.517660081386566} +{"Pretrain/Learning Rate": 4.999985584424696e-05, "Pretrain/Loss": 2.230229139328003, "Pretrain/Loss (Raw)": 2.0061800479888916, "Pretrain/Step": 296, "Pretrain/Step Time": 8.514724891632795} +{"Pretrain/Learning Rate": 4.999982557157403e-05, "Pretrain/Loss": 2.229767322540283, "Pretrain/Loss (Raw)": 2.2715792655944824, "Pretrain/Step": 297, "Pretrain/Step Time": 8.516965009272099} +{"Pretrain/Learning Rate": 4.9999792415803405e-05, "Pretrain/Loss": 2.231161594390869, "Pretrain/Loss (Raw)": 2.304180383682251, "Pretrain/Step": 298, "Pretrain/Step Time": 8.52153491973877} +{"Pretrain/Learning Rate": 4.999975637693892e-05, "Pretrain/Loss": 2.230349540710449, "Pretrain/Loss (Raw)": 2.175532817840576, "Pretrain/Step": 299, "Pretrain/Step Time": 8.531828239560127} +{"Pretrain/Learning Rate": 4.999971745498472e-05, "Pretrain/Loss": 2.2289016246795654, "Pretrain/Loss (Raw)": 2.087996244430542, "Pretrain/Step": 300, "Pretrain/Step Time": 8.537003502249718} +{"Pretrain/Learning Rate": 4.999967564994531e-05, "Pretrain/Loss": 2.2303073406219482, "Pretrain/Loss (Raw)": 2.3011739253997803, "Pretrain/Step": 301, "Pretrain/Step Time": 8.524767702445388} +{"Pretrain/Learning Rate": 4.999963096182549e-05, "Pretrain/Loss": 2.228701591491699, "Pretrain/Loss (Raw)": 2.2476255893707275, "Pretrain/Step": 302, "Pretrain/Step Time": 8.529292555525899} +{"Pretrain/Learning Rate": 4.9999583390630435e-05, "Pretrain/Loss": 2.2271010875701904, "Pretrain/Loss (Raw)": 2.2064921855926514, "Pretrain/Step": 303, "Pretrain/Step Time": 8.529834471642971} +{"Pretrain/Learning Rate": 4.999953293636562e-05, "Pretrain/Loss": 2.2253313064575195, "Pretrain/Loss (Raw)": 2.080531358718872, "Pretrain/Step": 304, "Pretrain/Step Time": 8.535580474883318} +{"Pretrain/Learning Rate": 4.9999479599036856e-05, "Pretrain/Loss": 2.2251553535461426, "Pretrain/Loss (Raw)": 2.415611982345581, "Pretrain/Step": 305, "Pretrain/Step Time": 8.53821543045342} +{"Pretrain/Learning Rate": 4.9999423378650315e-05, "Pretrain/Loss": 2.2259674072265625, "Pretrain/Loss (Raw)": 2.2286267280578613, "Pretrain/Step": 306, "Pretrain/Step Time": 8.53084889613092} +{"Pretrain/Learning Rate": 4.9999364275212466e-05, "Pretrain/Loss": 2.226977586746216, "Pretrain/Loss (Raw)": 2.3540420532226562, "Pretrain/Step": 307, "Pretrain/Step Time": 8.52930479682982} +{"Pretrain/Learning Rate": 4.9999302288730126e-05, "Pretrain/Loss": 2.224444627761841, "Pretrain/Loss (Raw)": 2.0534284114837646, "Pretrain/Step": 308, "Pretrain/Step Time": 8.524120571091771} +{"Pretrain/Learning Rate": 4.9999237419210445e-05, "Pretrain/Loss": 2.225635528564453, "Pretrain/Loss (Raw)": 2.1032516956329346, "Pretrain/Step": 309, "Pretrain/Step Time": 8.524169746786356} +{"Pretrain/Learning Rate": 4.99991696666609e-05, "Pretrain/Loss": 2.225402355194092, "Pretrain/Loss (Raw)": 2.2248215675354004, "Pretrain/Step": 310, "Pretrain/Step Time": 8.526545377448201} +{"Pretrain/Learning Rate": 4.999909903108932e-05, "Pretrain/Loss": 2.224175214767456, "Pretrain/Loss (Raw)": 1.9178340435028076, "Pretrain/Step": 311, "Pretrain/Step Time": 8.536070086061954} +{"Pretrain/Learning Rate": 4.999902551250384e-05, "Pretrain/Loss": 2.221620559692383, "Pretrain/Loss (Raw)": 1.9559787511825562, "Pretrain/Step": 312, "Pretrain/Step Time": 8.536196468397975} +{"Pretrain/Learning Rate": 4.999894911091293e-05, "Pretrain/Loss": 2.2219061851501465, "Pretrain/Loss (Raw)": 2.161132335662842, "Pretrain/Step": 313, "Pretrain/Step Time": 8.520334908738732} +{"Pretrain/Learning Rate": 4.999886982632541e-05, "Pretrain/Loss": 2.2193493843078613, "Pretrain/Loss (Raw)": 2.1773598194122314, "Pretrain/Step": 314, "Pretrain/Step Time": 8.513929223641753} +{"Pretrain/Learning Rate": 4.999878765875042e-05, "Pretrain/Loss": 2.2222037315368652, "Pretrain/Loss (Raw)": 2.4897477626800537, "Pretrain/Step": 315, "Pretrain/Step Time": 8.51618822477758} +{"Pretrain/Learning Rate": 4.999870260819745e-05, "Pretrain/Loss": 2.2236993312835693, "Pretrain/Loss (Raw)": 2.2207791805267334, "Pretrain/Step": 316, "Pretrain/Step Time": 8.520781906321645} +{"Pretrain/Learning Rate": 4.999861467467629e-05, "Pretrain/Loss": 2.2236857414245605, "Pretrain/Loss (Raw)": 2.070237636566162, "Pretrain/Step": 317, "Pretrain/Step Time": 8.52478913962841} +{"Pretrain/Learning Rate": 4.9998523858197094e-05, "Pretrain/Loss": 2.221651077270508, "Pretrain/Loss (Raw)": 2.0559380054473877, "Pretrain/Step": 318, "Pretrain/Step Time": 8.529072104021907} +{"Pretrain/Learning Rate": 4.999843015877032e-05, "Pretrain/Loss": 2.2244420051574707, "Pretrain/Loss (Raw)": 2.455819845199585, "Pretrain/Step": 319, "Pretrain/Step Time": 8.528332088142633} +{"Pretrain/Learning Rate": 4.99983335764068e-05, "Pretrain/Loss": 2.224581003189087, "Pretrain/Loss (Raw)": 2.2648329734802246, "Pretrain/Step": 320, "Pretrain/Step Time": 8.51884163916111} +{"Pretrain/Learning Rate": 4.999823411111765e-05, "Pretrain/Loss": 2.223513603210449, "Pretrain/Loss (Raw)": 2.170825719833374, "Pretrain/Step": 321, "Pretrain/Step Time": 8.516988089308143} +{"Pretrain/Learning Rate": 4.999813176291433e-05, "Pretrain/Loss": 2.2195816040039062, "Pretrain/Loss (Raw)": 2.0297374725341797, "Pretrain/Step": 322, "Pretrain/Step Time": 8.524462742730975} +{"Pretrain/Learning Rate": 4.999802653180868e-05, "Pretrain/Loss": 2.218559980392456, "Pretrain/Loss (Raw)": 2.186717987060547, "Pretrain/Step": 323, "Pretrain/Step Time": 8.534315908327699} +{"Pretrain/Learning Rate": 4.9997918417812805e-05, "Pretrain/Loss": 2.217747688293457, "Pretrain/Loss (Raw)": 2.087379217147827, "Pretrain/Step": 324, "Pretrain/Step Time": 8.537636393681169} +{"Pretrain/Learning Rate": 4.999780742093919e-05, "Pretrain/Loss": 2.216632843017578, "Pretrain/Loss (Raw)": 1.9794840812683105, "Pretrain/Step": 325, "Pretrain/Step Time": 8.531910372897983} +{"Pretrain/Learning Rate": 4.999769354120063e-05, "Pretrain/Loss": 2.2169103622436523, "Pretrain/Loss (Raw)": 2.2089033126831055, "Pretrain/Step": 326, "Pretrain/Step Time": 8.525603957474232} +{"Pretrain/Learning Rate": 4.9997576778610254e-05, "Pretrain/Loss": 2.216689348220825, "Pretrain/Loss (Raw)": 2.151345729827881, "Pretrain/Step": 327, "Pretrain/Step Time": 8.531209859997034} +{"Pretrain/Learning Rate": 4.999745713318154e-05, "Pretrain/Loss": 2.215658187866211, "Pretrain/Loss (Raw)": 2.2047955989837646, "Pretrain/Step": 328, "Pretrain/Step Time": 8.53825474344194} +{"Pretrain/Learning Rate": 4.999733460492826e-05, "Pretrain/Loss": 2.22151780128479, "Pretrain/Loss (Raw)": 2.9494404792785645, "Pretrain/Step": 329, "Pretrain/Step Time": 8.54033600538969} +{"Pretrain/Learning Rate": 4.999720919386457e-05, "Pretrain/Loss": 2.2222847938537598, "Pretrain/Loss (Raw)": 2.20896053314209, "Pretrain/Step": 330, "Pretrain/Step Time": 8.542187541723251} +{"Pretrain/Learning Rate": 4.999708090000493e-05, "Pretrain/Loss": 2.2215168476104736, "Pretrain/Loss (Raw)": 2.086829423904419, "Pretrain/Step": 331, "Pretrain/Step Time": 8.539356170222163} +{"Pretrain/Learning Rate": 4.999694972336413e-05, "Pretrain/Loss": 2.221794843673706, "Pretrain/Loss (Raw)": 2.3355844020843506, "Pretrain/Step": 332, "Pretrain/Step Time": 8.537721717730165} +{"Pretrain/Learning Rate": 4.9996815663957296e-05, "Pretrain/Loss": 2.2221057415008545, "Pretrain/Loss (Raw)": 2.17765474319458, "Pretrain/Step": 333, "Pretrain/Step Time": 8.52695200778544} +{"Pretrain/Learning Rate": 4.9996678721799893e-05, "Pretrain/Loss": 2.222278118133545, "Pretrain/Loss (Raw)": 2.280959129333496, "Pretrain/Step": 334, "Pretrain/Step Time": 8.531141387298703} +{"Pretrain/Learning Rate": 4.999653889690771e-05, "Pretrain/Loss": 2.222160577774048, "Pretrain/Loss (Raw)": 2.050855875015259, "Pretrain/Step": 335, "Pretrain/Step Time": 8.5293089132756} +{"Pretrain/Learning Rate": 4.9996396189296865e-05, "Pretrain/Loss": 2.221686840057373, "Pretrain/Loss (Raw)": 2.080282211303711, "Pretrain/Step": 336, "Pretrain/Step Time": 8.528979565948248} +{"Pretrain/Learning Rate": 4.999625059898384e-05, "Pretrain/Loss": 2.220355749130249, "Pretrain/Loss (Raw)": 2.086853265762329, "Pretrain/Step": 337, "Pretrain/Step Time": 8.524821048602462} +{"Pretrain/Learning Rate": 4.99961021259854e-05, "Pretrain/Loss": 2.2199089527130127, "Pretrain/Loss (Raw)": 2.1896157264709473, "Pretrain/Step": 338, "Pretrain/Step Time": 8.517666276544333} +{"Pretrain/Learning Rate": 4.999595077031868e-05, "Pretrain/Loss": 2.2204031944274902, "Pretrain/Loss (Raw)": 2.141164541244507, "Pretrain/Step": 339, "Pretrain/Step Time": 8.518499011173844} +{"Pretrain/Learning Rate": 4.9995796532001136e-05, "Pretrain/Loss": 2.2248902320861816, "Pretrain/Loss (Raw)": 2.397240400314331, "Pretrain/Step": 340, "Pretrain/Step Time": 8.520911222323775} +{"Pretrain/Learning Rate": 4.999563941105054e-05, "Pretrain/Loss": 2.222562789916992, "Pretrain/Loss (Raw)": 2.23622465133667, "Pretrain/Step": 341, "Pretrain/Step Time": 8.52302386239171} +{"Pretrain/Learning Rate": 4.9995479407485035e-05, "Pretrain/Loss": 2.2227959632873535, "Pretrain/Loss (Raw)": 2.131101608276367, "Pretrain/Step": 342, "Pretrain/Step Time": 8.524770786985755} +{"Pretrain/Learning Rate": 4.9995316521323066e-05, "Pretrain/Loss": 2.2247276306152344, "Pretrain/Loss (Raw)": 2.566924810409546, "Pretrain/Step": 343, "Pretrain/Step Time": 8.517000894993544} +{"Pretrain/Learning Rate": 4.99951507525834e-05, "Pretrain/Loss": 2.2244529724121094, "Pretrain/Loss (Raw)": 2.299582004547119, "Pretrain/Step": 344, "Pretrain/Step Time": 8.52255348674953} +{"Pretrain/Learning Rate": 4.999498210128518e-05, "Pretrain/Loss": 2.222527503967285, "Pretrain/Loss (Raw)": 2.1818647384643555, "Pretrain/Step": 345, "Pretrain/Step Time": 8.52845330350101} +{"Pretrain/Learning Rate": 4.9994810567447834e-05, "Pretrain/Loss": 2.219681739807129, "Pretrain/Loss (Raw)": 2.0392680168151855, "Pretrain/Step": 346, "Pretrain/Step Time": 8.523359071463346} +{"Pretrain/Learning Rate": 4.9994636151091165e-05, "Pretrain/Loss": 2.2181007862091064, "Pretrain/Loss (Raw)": 2.113776445388794, "Pretrain/Step": 347, "Pretrain/Step Time": 8.52530987933278} +{"Pretrain/Learning Rate": 4.999445885223527e-05, "Pretrain/Loss": 2.216805934906006, "Pretrain/Loss (Raw)": 2.0698702335357666, "Pretrain/Step": 348, "Pretrain/Step Time": 8.520856387913227} +{"Pretrain/Learning Rate": 4.99942786709006e-05, "Pretrain/Loss": 2.216413974761963, "Pretrain/Loss (Raw)": 2.160719156265259, "Pretrain/Step": 349, "Pretrain/Step Time": 8.510871268808842} +{"Pretrain/Learning Rate": 4.999409560710794e-05, "Pretrain/Loss": 2.215191125869751, "Pretrain/Loss (Raw)": 2.0034866333007812, "Pretrain/Step": 350, "Pretrain/Step Time": 8.511756557971239} +{"Pretrain/Learning Rate": 4.99939096608784e-05, "Pretrain/Loss": 2.217069387435913, "Pretrain/Loss (Raw)": 2.3372762203216553, "Pretrain/Step": 351, "Pretrain/Step Time": 8.516851658001542} +{"Pretrain/Learning Rate": 4.999372083223343e-05, "Pretrain/Loss": 2.2163641452789307, "Pretrain/Loss (Raw)": 2.142794370651245, "Pretrain/Step": 352, "Pretrain/Step Time": 8.513399792835116} +{"Pretrain/Learning Rate": 4.999352912119478e-05, "Pretrain/Loss": 2.2099783420562744, "Pretrain/Loss (Raw)": 1.7011799812316895, "Pretrain/Step": 353, "Pretrain/Step Time": 8.514916565269232} +{"Pretrain/Learning Rate": 4.999333452778459e-05, "Pretrain/Loss": 2.211646556854248, "Pretrain/Loss (Raw)": 2.238556385040283, "Pretrain/Step": 354, "Pretrain/Step Time": 8.51435223966837} +{"Pretrain/Learning Rate": 4.999313705202529e-05, "Pretrain/Loss": 2.2129478454589844, "Pretrain/Loss (Raw)": 2.296562433242798, "Pretrain/Step": 355, "Pretrain/Step Time": 8.507484903559089} +{"Pretrain/Learning Rate": 4.999293669393965e-05, "Pretrain/Loss": 2.2134575843811035, "Pretrain/Loss (Raw)": 2.195277690887451, "Pretrain/Step": 356, "Pretrain/Step Time": 8.51224859803915} +{"Pretrain/Learning Rate": 4.999273345355078e-05, "Pretrain/Loss": 2.2186241149902344, "Pretrain/Loss (Raw)": 2.7861368656158447, "Pretrain/Step": 357, "Pretrain/Step Time": 8.519861424341798} +{"Pretrain/Learning Rate": 4.9992527330882125e-05, "Pretrain/Loss": 2.221710681915283, "Pretrain/Loss (Raw)": 2.2229723930358887, "Pretrain/Step": 358, "Pretrain/Step Time": 8.523679221048951} +{"Pretrain/Learning Rate": 4.999231832595744e-05, "Pretrain/Loss": 2.22019100189209, "Pretrain/Loss (Raw)": 2.1817383766174316, "Pretrain/Step": 359, "Pretrain/Step Time": 8.526002321392298} +{"Pretrain/Learning Rate": 4.9992106438800846e-05, "Pretrain/Loss": 2.2203369140625, "Pretrain/Loss (Raw)": 2.0826070308685303, "Pretrain/Step": 360, "Pretrain/Step Time": 8.519648557528853} +{"Pretrain/Learning Rate": 4.999189166943677e-05, "Pretrain/Loss": 2.2215240001678467, "Pretrain/Loss (Raw)": 2.4012928009033203, "Pretrain/Step": 361, "Pretrain/Step Time": 8.521597784012556} +{"Pretrain/Learning Rate": 4.999167401788998e-05, "Pretrain/Loss": 2.2212605476379395, "Pretrain/Loss (Raw)": 2.0361108779907227, "Pretrain/Step": 362, "Pretrain/Step Time": 8.516293661668897} +{"Pretrain/Learning Rate": 4.9991453484185577e-05, "Pretrain/Loss": 2.22176456451416, "Pretrain/Loss (Raw)": 2.1780359745025635, "Pretrain/Step": 363, "Pretrain/Step Time": 8.526009250432253} +{"Pretrain/Learning Rate": 4.999123006834899e-05, "Pretrain/Loss": 2.22530460357666, "Pretrain/Loss (Raw)": 2.5755622386932373, "Pretrain/Step": 364, "Pretrain/Step Time": 8.520811202004552} +{"Pretrain/Learning Rate": 4.9991003770405994e-05, "Pretrain/Loss": 2.223473072052002, "Pretrain/Loss (Raw)": 2.138120174407959, "Pretrain/Step": 365, "Pretrain/Step Time": 8.521363412961364} +{"Pretrain/Learning Rate": 4.999077459038268e-05, "Pretrain/Loss": 2.223419189453125, "Pretrain/Loss (Raw)": 2.2079434394836426, "Pretrain/Step": 366, "Pretrain/Step Time": 8.516209261491895} +{"Pretrain/Learning Rate": 4.9990542528305484e-05, "Pretrain/Loss": 2.2233335971832275, "Pretrain/Loss (Raw)": 2.042449712753296, "Pretrain/Step": 367, "Pretrain/Step Time": 8.508514227345586} +{"Pretrain/Learning Rate": 4.999030758420116e-05, "Pretrain/Loss": 2.2226667404174805, "Pretrain/Loss (Raw)": 2.2378365993499756, "Pretrain/Step": 368, "Pretrain/Step Time": 8.507201729342341} +{"Pretrain/Learning Rate": 4.999006975809681e-05, "Pretrain/Loss": 2.222228527069092, "Pretrain/Loss (Raw)": 2.075072765350342, "Pretrain/Step": 369, "Pretrain/Step Time": 8.512178869917989} +{"Pretrain/Learning Rate": 4.998982905001986e-05, "Pretrain/Loss": 2.22306227684021, "Pretrain/Loss (Raw)": 2.237367630004883, "Pretrain/Step": 370, "Pretrain/Step Time": 8.52092550508678} +{"Pretrain/Learning Rate": 4.998958545999806e-05, "Pretrain/Loss": 2.2230758666992188, "Pretrain/Loss (Raw)": 2.136096477508545, "Pretrain/Step": 371, "Pretrain/Step Time": 8.519506704062223} +{"Pretrain/Learning Rate": 4.998933898805951e-05, "Pretrain/Loss": 2.2233712673187256, "Pretrain/Loss (Raw)": 2.316972494125366, "Pretrain/Step": 372, "Pretrain/Step Time": 8.515132527798414} +{"Pretrain/Learning Rate": 4.9989089634232645e-05, "Pretrain/Loss": 2.222189426422119, "Pretrain/Loss (Raw)": 2.0015790462493896, "Pretrain/Step": 373, "Pretrain/Step Time": 8.515467254444957} +{"Pretrain/Learning Rate": 4.9988837398546206e-05, "Pretrain/Loss": 2.22194242477417, "Pretrain/Loss (Raw)": 2.245628595352173, "Pretrain/Step": 374, "Pretrain/Step Time": 8.507514448836446} +{"Pretrain/Learning Rate": 4.9988582281029284e-05, "Pretrain/Loss": 2.2195422649383545, "Pretrain/Loss (Raw)": 2.0315592288970947, "Pretrain/Step": 375, "Pretrain/Step Time": 8.509704500436783} +{"Pretrain/Learning Rate": 4.998832428171131e-05, "Pretrain/Loss": 2.2179369926452637, "Pretrain/Loss (Raw)": 2.2399864196777344, "Pretrain/Step": 376, "Pretrain/Step Time": 8.52289916574955} +{"Pretrain/Learning Rate": 4.998806340062202e-05, "Pretrain/Loss": 2.2175798416137695, "Pretrain/Loss (Raw)": 2.1381309032440186, "Pretrain/Step": 377, "Pretrain/Step Time": 8.51730634830892} +{"Pretrain/Learning Rate": 4.998779963779152e-05, "Pretrain/Loss": 2.214264154434204, "Pretrain/Loss (Raw)": 2.3102269172668457, "Pretrain/Step": 378, "Pretrain/Step Time": 8.516412882134318} +{"Pretrain/Learning Rate": 4.998753299325021e-05, "Pretrain/Loss": 2.2124805450439453, "Pretrain/Loss (Raw)": 2.155762195587158, "Pretrain/Step": 379, "Pretrain/Step Time": 8.520640028640628} +{"Pretrain/Learning Rate": 4.998726346702886e-05, "Pretrain/Loss": 2.2122344970703125, "Pretrain/Loss (Raw)": 2.2068443298339844, "Pretrain/Step": 380, "Pretrain/Step Time": 8.521637085825205} +{"Pretrain/Learning Rate": 4.998699105915854e-05, "Pretrain/Loss": 2.2117011547088623, "Pretrain/Loss (Raw)": 2.268638849258423, "Pretrain/Step": 381, "Pretrain/Step Time": 8.522263741120696} +{"Pretrain/Learning Rate": 4.9986715769670665e-05, "Pretrain/Loss": 2.2120001316070557, "Pretrain/Loss (Raw)": 2.4108810424804688, "Pretrain/Step": 382, "Pretrain/Step Time": 8.52272674255073} +{"Pretrain/Learning Rate": 4.998643759859699e-05, "Pretrain/Loss": 2.21254825592041, "Pretrain/Loss (Raw)": 2.2995314598083496, "Pretrain/Step": 383, "Pretrain/Step Time": 8.523957321420312} +{"Pretrain/Learning Rate": 4.998615654596959e-05, "Pretrain/Loss": 2.2142293453216553, "Pretrain/Loss (Raw)": 2.179178476333618, "Pretrain/Step": 384, "Pretrain/Step Time": 8.5125387404114} +{"Pretrain/Learning Rate": 4.9985872611820885e-05, "Pretrain/Loss": 2.2147908210754395, "Pretrain/Loss (Raw)": 2.3688817024230957, "Pretrain/Step": 385, "Pretrain/Step Time": 8.513954598456621} +{"Pretrain/Learning Rate": 4.9985585796183605e-05, "Pretrain/Loss": 2.2134573459625244, "Pretrain/Loss (Raw)": 2.073521137237549, "Pretrain/Step": 386, "Pretrain/Step Time": 8.514914708212018} +{"Pretrain/Learning Rate": 4.998529609909084e-05, "Pretrain/Loss": 2.2078206539154053, "Pretrain/Loss (Raw)": 2.141265630722046, "Pretrain/Step": 387, "Pretrain/Step Time": 8.521895026788116} +{"Pretrain/Learning Rate": 4.998500352057599e-05, "Pretrain/Loss": 2.2087011337280273, "Pretrain/Loss (Raw)": 2.2928266525268555, "Pretrain/Step": 388, "Pretrain/Step Time": 8.518337665125728} +{"Pretrain/Learning Rate": 4.9984708060672805e-05, "Pretrain/Loss": 2.207122802734375, "Pretrain/Loss (Raw)": 2.0202643871307373, "Pretrain/Step": 389, "Pretrain/Step Time": 8.520318910479546} +{"Pretrain/Learning Rate": 4.9984409719415345e-05, "Pretrain/Loss": 2.2097692489624023, "Pretrain/Loss (Raw)": 2.3615753650665283, "Pretrain/Step": 390, "Pretrain/Step Time": 8.51201532408595} +{"Pretrain/Learning Rate": 4.9984108496838034e-05, "Pretrain/Loss": 2.208949089050293, "Pretrain/Loss (Raw)": 2.2704107761383057, "Pretrain/Step": 391, "Pretrain/Step Time": 8.513597887009382} +{"Pretrain/Learning Rate": 4.99838043929756e-05, "Pretrain/Loss": 2.208812713623047, "Pretrain/Loss (Raw)": 2.250380754470825, "Pretrain/Step": 392, "Pretrain/Step Time": 8.511982083320618} +{"Pretrain/Learning Rate": 4.9983497407863114e-05, "Pretrain/Loss": 2.2073965072631836, "Pretrain/Loss (Raw)": 2.1648902893066406, "Pretrain/Step": 393, "Pretrain/Step Time": 8.51852821558714} +{"Pretrain/Learning Rate": 4.9983187541535984e-05, "Pretrain/Loss": 2.205531358718872, "Pretrain/Loss (Raw)": 2.2909209728240967, "Pretrain/Step": 394, "Pretrain/Step Time": 8.517409682273865} +{"Pretrain/Learning Rate": 4.998287479402994e-05, "Pretrain/Loss": 2.20656156539917, "Pretrain/Loss (Raw)": 2.147265911102295, "Pretrain/Step": 395, "Pretrain/Step Time": 8.528645433485508} +{"Pretrain/Learning Rate": 4.998255916538106e-05, "Pretrain/Loss": 2.2068939208984375, "Pretrain/Loss (Raw)": 2.3679723739624023, "Pretrain/Step": 396, "Pretrain/Step Time": 8.529863975942135} +{"Pretrain/Learning Rate": 4.998224065562572e-05, "Pretrain/Loss": 2.205624580383301, "Pretrain/Loss (Raw)": 1.8397990465164185, "Pretrain/Step": 397, "Pretrain/Step Time": 8.533278213813901} +{"Pretrain/Learning Rate": 4.998191926480068e-05, "Pretrain/Loss": 2.2066268920898438, "Pretrain/Loss (Raw)": 2.262010335922241, "Pretrain/Step": 398, "Pretrain/Step Time": 8.529869178310037} +{"Pretrain/Learning Rate": 4.998159499294299e-05, "Pretrain/Loss": 2.204232692718506, "Pretrain/Loss (Raw)": 2.1178231239318848, "Pretrain/Step": 399, "Pretrain/Step Time": 8.529632730409503} +{"Pretrain/Learning Rate": 4.998126784009005e-05, "Pretrain/Loss": 2.2034263610839844, "Pretrain/Loss (Raw)": 2.317408323287964, "Pretrain/Step": 400, "Pretrain/Step Time": 8.540296038612723} +{"Pretrain/Learning Rate": 4.998093780627958e-05, "Pretrain/Loss": 2.2031047344207764, "Pretrain/Loss (Raw)": 2.1193478107452393, "Pretrain/Step": 401, "Pretrain/Step Time": 8.536532880738378} +{"Pretrain/Learning Rate": 4.9980604891549656e-05, "Pretrain/Loss": 2.200596809387207, "Pretrain/Loss (Raw)": 1.989488959312439, "Pretrain/Step": 402, "Pretrain/Step Time": 8.534700281918049} +{"Pretrain/Learning Rate": 4.998026909593865e-05, "Pretrain/Loss": 2.2002110481262207, "Pretrain/Loss (Raw)": 2.041411876678467, "Pretrain/Step": 403, "Pretrain/Step Time": 8.531603924930096} +{"Pretrain/Learning Rate": 4.997993041948531e-05, "Pretrain/Loss": 2.1978323459625244, "Pretrain/Loss (Raw)": 2.0603814125061035, "Pretrain/Step": 404, "Pretrain/Step Time": 8.530981667339802} +{"Pretrain/Learning Rate": 4.997958886222869e-05, "Pretrain/Loss": 2.1989188194274902, "Pretrain/Loss (Raw)": 2.360546827316284, "Pretrain/Step": 405, "Pretrain/Step Time": 8.533463152125478} +{"Pretrain/Learning Rate": 4.9979244424208165e-05, "Pretrain/Loss": 2.198391914367676, "Pretrain/Loss (Raw)": 2.176051139831543, "Pretrain/Step": 406, "Pretrain/Step Time": 8.532586500048637} +{"Pretrain/Learning Rate": 4.997889710546347e-05, "Pretrain/Loss": 2.1979832649230957, "Pretrain/Loss (Raw)": 1.9775084257125854, "Pretrain/Step": 407, "Pretrain/Step Time": 8.538772251456976} +{"Pretrain/Learning Rate": 4.9978546906034655e-05, "Pretrain/Loss": 2.19827938079834, "Pretrain/Loss (Raw)": 2.236844539642334, "Pretrain/Step": 408, "Pretrain/Step Time": 8.532697521150112} +{"Pretrain/Learning Rate": 4.997819382596212e-05, "Pretrain/Loss": 2.1978187561035156, "Pretrain/Loss (Raw)": 2.27480149269104, "Pretrain/Step": 409, "Pretrain/Step Time": 8.521423671394587} +{"Pretrain/Learning Rate": 4.997783786528656e-05, "Pretrain/Loss": 2.197788715362549, "Pretrain/Loss (Raw)": 2.144660711288452, "Pretrain/Step": 410, "Pretrain/Step Time": 8.516896246001124} +{"Pretrain/Learning Rate": 4.997747902404904e-05, "Pretrain/Loss": 2.198181629180908, "Pretrain/Loss (Raw)": 2.308659076690674, "Pretrain/Step": 411, "Pretrain/Step Time": 8.509394012391567} +{"Pretrain/Learning Rate": 4.997711730229094e-05, "Pretrain/Loss": 2.197438955307007, "Pretrain/Loss (Raw)": 2.1655662059783936, "Pretrain/Step": 412, "Pretrain/Step Time": 8.512684009969234} +{"Pretrain/Learning Rate": 4.9976752700053975e-05, "Pretrain/Loss": 2.198817729949951, "Pretrain/Loss (Raw)": 2.5185365676879883, "Pretrain/Step": 413, "Pretrain/Step Time": 8.526214692741632} +{"Pretrain/Learning Rate": 4.9976385217380195e-05, "Pretrain/Loss": 2.1997475624084473, "Pretrain/Loss (Raw)": 2.120211601257324, "Pretrain/Step": 414, "Pretrain/Step Time": 8.52679057046771} +{"Pretrain/Learning Rate": 4.997601485431198e-05, "Pretrain/Loss": 2.2006096839904785, "Pretrain/Loss (Raw)": 2.4051320552825928, "Pretrain/Step": 415, "Pretrain/Step Time": 8.520083855837584} +{"Pretrain/Learning Rate": 4.997564161089204e-05, "Pretrain/Loss": 2.2014386653900146, "Pretrain/Loss (Raw)": 2.4001681804656982, "Pretrain/Step": 416, "Pretrain/Step Time": 8.519527539610863} +{"Pretrain/Learning Rate": 4.9975265487163424e-05, "Pretrain/Loss": 2.1968724727630615, "Pretrain/Loss (Raw)": 2.051605701446533, "Pretrain/Step": 417, "Pretrain/Step Time": 8.521359462291002} +{"Pretrain/Learning Rate": 4.997488648316951e-05, "Pretrain/Loss": 2.2004642486572266, "Pretrain/Loss (Raw)": 2.3913280963897705, "Pretrain/Step": 418, "Pretrain/Step Time": 8.530617151409388} +{"Pretrain/Learning Rate": 4.997450459895399e-05, "Pretrain/Loss": 2.201357841491699, "Pretrain/Loss (Raw)": 2.210860252380371, "Pretrain/Step": 419, "Pretrain/Step Time": 8.531093949452043} +{"Pretrain/Learning Rate": 4.997411983456092e-05, "Pretrain/Loss": 2.202921152114868, "Pretrain/Loss (Raw)": 2.3389840126037598, "Pretrain/Step": 420, "Pretrain/Step Time": 8.527203729376197} +{"Pretrain/Learning Rate": 4.9973732190034674e-05, "Pretrain/Loss": 2.2025558948516846, "Pretrain/Loss (Raw)": 2.3911190032958984, "Pretrain/Step": 421, "Pretrain/Step Time": 8.514423625543714} +{"Pretrain/Learning Rate": 4.9973341665419946e-05, "Pretrain/Loss": 2.2055444717407227, "Pretrain/Loss (Raw)": 2.4381957054138184, "Pretrain/Step": 422, "Pretrain/Step Time": 8.511383086442947} +{"Pretrain/Learning Rate": 4.997294826076178e-05, "Pretrain/Loss": 2.206691265106201, "Pretrain/Loss (Raw)": 2.153740167617798, "Pretrain/Step": 423, "Pretrain/Step Time": 8.513216257095337} +{"Pretrain/Learning Rate": 4.9972551976105545e-05, "Pretrain/Loss": 2.2107949256896973, "Pretrain/Loss (Raw)": 2.531493902206421, "Pretrain/Step": 424, "Pretrain/Step Time": 8.523685870692134} +{"Pretrain/Learning Rate": 4.9972152811496945e-05, "Pretrain/Loss": 2.2103328704833984, "Pretrain/Loss (Raw)": 2.212380886077881, "Pretrain/Step": 425, "Pretrain/Step Time": 8.517702696844935} +{"Pretrain/Learning Rate": 4.9971750766982e-05, "Pretrain/Loss": 2.2099075317382812, "Pretrain/Loss (Raw)": 2.24977970123291, "Pretrain/Step": 426, "Pretrain/Step Time": 8.51266311109066} +{"Pretrain/Learning Rate": 4.9971345842607095e-05, "Pretrain/Loss": 2.2105393409729004, "Pretrain/Loss (Raw)": 2.2563986778259277, "Pretrain/Step": 427, "Pretrain/Step Time": 8.502013949677348} +{"Pretrain/Learning Rate": 4.997093803841891e-05, "Pretrain/Loss": 2.2117114067077637, "Pretrain/Loss (Raw)": 2.2380168437957764, "Pretrain/Step": 428, "Pretrain/Step Time": 8.501365639269352} +{"Pretrain/Learning Rate": 4.997052735446449e-05, "Pretrain/Loss": 2.215888500213623, "Pretrain/Loss (Raw)": 2.835829019546509, "Pretrain/Step": 429, "Pretrain/Step Time": 8.507528590038419} +{"Pretrain/Learning Rate": 4.997011379079119e-05, "Pretrain/Loss": 2.214311361312866, "Pretrain/Loss (Raw)": 2.0457632541656494, "Pretrain/Step": 430, "Pretrain/Step Time": 8.50498989596963} +{"Pretrain/Learning Rate": 4.996969734744671e-05, "Pretrain/Loss": 2.2142820358276367, "Pretrain/Loss (Raw)": 2.2027156352996826, "Pretrain/Step": 431, "Pretrain/Step Time": 8.51257761195302} +{"Pretrain/Learning Rate": 4.996927802447906e-05, "Pretrain/Loss": 2.215005874633789, "Pretrain/Loss (Raw)": 2.1732118129730225, "Pretrain/Step": 432, "Pretrain/Step Time": 8.509743705391884} +{"Pretrain/Learning Rate": 4.9968855821936613e-05, "Pretrain/Loss": 2.2144641876220703, "Pretrain/Loss (Raw)": 2.346264362335205, "Pretrain/Step": 433, "Pretrain/Step Time": 8.509568138048053} +{"Pretrain/Learning Rate": 4.9968430739868056e-05, "Pretrain/Loss": 2.2135820388793945, "Pretrain/Loss (Raw)": 2.1157102584838867, "Pretrain/Step": 434, "Pretrain/Step Time": 8.509998785331845} +{"Pretrain/Learning Rate": 4.9968002778322406e-05, "Pretrain/Loss": 2.212273120880127, "Pretrain/Loss (Raw)": 2.1865108013153076, "Pretrain/Step": 435, "Pretrain/Step Time": 8.517270779237151} +{"Pretrain/Learning Rate": 4.9967571937349034e-05, "Pretrain/Loss": 2.2117419242858887, "Pretrain/Loss (Raw)": 1.9854094982147217, "Pretrain/Step": 436, "Pretrain/Step Time": 8.521810360252857} +{"Pretrain/Learning Rate": 4.996713821699761e-05, "Pretrain/Loss": 2.2137932777404785, "Pretrain/Loss (Raw)": 2.3658485412597656, "Pretrain/Step": 437, "Pretrain/Step Time": 8.523141095414758} +{"Pretrain/Learning Rate": 4.9966701617318154e-05, "Pretrain/Loss": 2.213454246520996, "Pretrain/Loss (Raw)": 2.1814346313476562, "Pretrain/Step": 438, "Pretrain/Step Time": 8.518501983955503} +{"Pretrain/Learning Rate": 4.996626213836103e-05, "Pretrain/Loss": 2.21645188331604, "Pretrain/Loss (Raw)": 2.3015098571777344, "Pretrain/Step": 439, "Pretrain/Step Time": 8.51144740730524} +{"Pretrain/Learning Rate": 4.99658197801769e-05, "Pretrain/Loss": 2.219022750854492, "Pretrain/Loss (Raw)": 2.2850685119628906, "Pretrain/Step": 440, "Pretrain/Step Time": 8.508801896125078} +{"Pretrain/Learning Rate": 4.99653745428168e-05, "Pretrain/Loss": 2.2193477153778076, "Pretrain/Loss (Raw)": 2.202702522277832, "Pretrain/Step": 441, "Pretrain/Step Time": 8.518667941913009} +{"Pretrain/Learning Rate": 4.9964926426332056e-05, "Pretrain/Loss": 2.2195959091186523, "Pretrain/Loss (Raw)": 2.2091798782348633, "Pretrain/Step": 442, "Pretrain/Step Time": 8.521098582074046} +{"Pretrain/Learning Rate": 4.9964475430774364e-05, "Pretrain/Loss": 2.2166481018066406, "Pretrain/Loss (Raw)": 2.112396240234375, "Pretrain/Step": 443, "Pretrain/Step Time": 8.518784515559673} +{"Pretrain/Learning Rate": 4.996402155619573e-05, "Pretrain/Loss": 2.214851140975952, "Pretrain/Loss (Raw)": 1.9907667636871338, "Pretrain/Step": 444, "Pretrain/Step Time": 8.511586526408792} +{"Pretrain/Learning Rate": 4.9963564802648494e-05, "Pretrain/Loss": 2.222075939178467, "Pretrain/Loss (Raw)": 2.995030403137207, "Pretrain/Step": 445, "Pretrain/Step Time": 8.507800620049238} +{"Pretrain/Learning Rate": 4.9963105170185334e-05, "Pretrain/Loss": 2.2209582328796387, "Pretrain/Loss (Raw)": 1.9128400087356567, "Pretrain/Step": 446, "Pretrain/Step Time": 8.509281508624554} +{"Pretrain/Learning Rate": 4.9962642658859255e-05, "Pretrain/Loss": 2.2181906700134277, "Pretrain/Loss (Raw)": 2.101571559906006, "Pretrain/Step": 447, "Pretrain/Step Time": 8.508948573842645} +{"Pretrain/Learning Rate": 4.99621772687236e-05, "Pretrain/Loss": 2.220017433166504, "Pretrain/Loss (Raw)": 2.49869966506958, "Pretrain/Step": 448, "Pretrain/Step Time": 8.511190885677934} +{"Pretrain/Learning Rate": 4.996170899983203e-05, "Pretrain/Loss": 2.220015525817871, "Pretrain/Loss (Raw)": 2.1705758571624756, "Pretrain/Step": 449, "Pretrain/Step Time": 8.515552844852209} +{"Pretrain/Learning Rate": 4.9961237852238554e-05, "Pretrain/Loss": 2.2188384532928467, "Pretrain/Loss (Raw)": 1.8790507316589355, "Pretrain/Step": 450, "Pretrain/Step Time": 8.506932264193892} +{"Pretrain/Learning Rate": 4.996076382599752e-05, "Pretrain/Loss": 2.220917224884033, "Pretrain/Loss (Raw)": 2.4528160095214844, "Pretrain/Step": 451, "Pretrain/Step Time": 8.500190390273929} +{"Pretrain/Learning Rate": 4.996028692116357e-05, "Pretrain/Loss": 2.222404956817627, "Pretrain/Loss (Raw)": 2.277815580368042, "Pretrain/Step": 452, "Pretrain/Step Time": 8.499708469957113} +{"Pretrain/Learning Rate": 4.995980713779172e-05, "Pretrain/Loss": 2.2240090370178223, "Pretrain/Loss (Raw)": 2.1847763061523438, "Pretrain/Step": 453, "Pretrain/Step Time": 8.511873474344611} +{"Pretrain/Learning Rate": 4.9959324475937297e-05, "Pretrain/Loss": 2.221595287322998, "Pretrain/Loss (Raw)": 1.899963617324829, "Pretrain/Step": 454, "Pretrain/Step Time": 8.514304732903838} +{"Pretrain/Learning Rate": 4.995883893565596e-05, "Pretrain/Loss": 2.221421241760254, "Pretrain/Loss (Raw)": 2.129037618637085, "Pretrain/Step": 455, "Pretrain/Step Time": 8.50886663980782} +{"Pretrain/Learning Rate": 4.995835051700371e-05, "Pretrain/Loss": 2.2217140197753906, "Pretrain/Loss (Raw)": 2.242326498031616, "Pretrain/Step": 456, "Pretrain/Step Time": 8.501399787142873} +{"Pretrain/Learning Rate": 4.995785922003687e-05, "Pretrain/Loss": 2.2169675827026367, "Pretrain/Loss (Raw)": 2.3418502807617188, "Pretrain/Step": 457, "Pretrain/Step Time": 8.50006378814578} +{"Pretrain/Learning Rate": 4.9957365044812097e-05, "Pretrain/Loss": 2.215662956237793, "Pretrain/Loss (Raw)": 2.0420048236846924, "Pretrain/Step": 458, "Pretrain/Step Time": 8.502063052728772} +{"Pretrain/Learning Rate": 4.995686799138639e-05, "Pretrain/Loss": 2.217278480529785, "Pretrain/Loss (Raw)": 2.2936031818389893, "Pretrain/Step": 459, "Pretrain/Step Time": 8.504836717620492} +{"Pretrain/Learning Rate": 4.995636805981706e-05, "Pretrain/Loss": 2.215742349624634, "Pretrain/Loss (Raw)": 2.1389503479003906, "Pretrain/Step": 460, "Pretrain/Step Time": 8.502275712788105} +{"Pretrain/Learning Rate": 4.9955865250161774e-05, "Pretrain/Loss": 2.215097427368164, "Pretrain/Loss (Raw)": 2.0951268672943115, "Pretrain/Step": 461, "Pretrain/Step Time": 8.498922131955624} +{"Pretrain/Learning Rate": 4.9955359562478504e-05, "Pretrain/Loss": 2.2136306762695312, "Pretrain/Loss (Raw)": 2.0931994915008545, "Pretrain/Step": 462, "Pretrain/Step Time": 8.496093152090907} +{"Pretrain/Learning Rate": 4.995485099682558e-05, "Pretrain/Loss": 2.2154057025909424, "Pretrain/Loss (Raw)": 2.27803111076355, "Pretrain/Step": 463, "Pretrain/Step Time": 8.494464129209518} +{"Pretrain/Learning Rate": 4.995433955326165e-05, "Pretrain/Loss": 2.2159061431884766, "Pretrain/Loss (Raw)": 2.1443569660186768, "Pretrain/Step": 464, "Pretrain/Step Time": 8.501359978690743} +{"Pretrain/Learning Rate": 4.995382523184569e-05, "Pretrain/Loss": 2.2158656120300293, "Pretrain/Loss (Raw)": 2.0816633701324463, "Pretrain/Step": 465, "Pretrain/Step Time": 8.500013921409845} +{"Pretrain/Learning Rate": 4.9953308032637016e-05, "Pretrain/Loss": 2.215853691101074, "Pretrain/Loss (Raw)": 2.188093900680542, "Pretrain/Step": 466, "Pretrain/Step Time": 8.499275958165526} +{"Pretrain/Learning Rate": 4.995278795569528e-05, "Pretrain/Loss": 2.2154760360717773, "Pretrain/Loss (Raw)": 2.0928258895874023, "Pretrain/Step": 467, "Pretrain/Step Time": 8.498659556731582} +{"Pretrain/Learning Rate": 4.995226500108046e-05, "Pretrain/Loss": 2.212545394897461, "Pretrain/Loss (Raw)": 2.022139549255371, "Pretrain/Step": 468, "Pretrain/Step Time": 8.494572116062045} +{"Pretrain/Learning Rate": 4.995173916885285e-05, "Pretrain/Loss": 2.2093515396118164, "Pretrain/Loss (Raw)": 1.8273884057998657, "Pretrain/Step": 469, "Pretrain/Step Time": 8.492174917832017} +{"Pretrain/Learning Rate": 4.9951210459073105e-05, "Pretrain/Loss": 2.2068285942077637, "Pretrain/Loss (Raw)": 1.808180809020996, "Pretrain/Step": 470, "Pretrain/Step Time": 8.494457522407174} +{"Pretrain/Learning Rate": 4.99506788718022e-05, "Pretrain/Loss": 2.2024917602539062, "Pretrain/Loss (Raw)": 2.0117740631103516, "Pretrain/Step": 471, "Pretrain/Step Time": 8.509263480082154} +{"Pretrain/Learning Rate": 4.995014440710144e-05, "Pretrain/Loss": 2.2004737854003906, "Pretrain/Loss (Raw)": 2.0413260459899902, "Pretrain/Step": 472, "Pretrain/Step Time": 8.499929375946522} +{"Pretrain/Learning Rate": 4.9949607065032445e-05, "Pretrain/Loss": 2.200695037841797, "Pretrain/Loss (Raw)": 2.210153102874756, "Pretrain/Step": 473, "Pretrain/Step Time": 8.503108916804194} +{"Pretrain/Learning Rate": 4.99490668456572e-05, "Pretrain/Loss": 2.2009763717651367, "Pretrain/Loss (Raw)": 2.0752670764923096, "Pretrain/Step": 474, "Pretrain/Step Time": 8.507823949679732} +{"Pretrain/Learning Rate": 4.994852374903801e-05, "Pretrain/Loss": 2.2022693157196045, "Pretrain/Loss (Raw)": 2.2792954444885254, "Pretrain/Step": 475, "Pretrain/Step Time": 8.506407706066966} +{"Pretrain/Learning Rate": 4.99479777752375e-05, "Pretrain/Loss": 2.203615188598633, "Pretrain/Loss (Raw)": 2.2421531677246094, "Pretrain/Step": 476, "Pretrain/Step Time": 8.518684247508645} +{"Pretrain/Learning Rate": 4.994742892431863e-05, "Pretrain/Loss": 2.202495574951172, "Pretrain/Loss (Raw)": 2.01735782623291, "Pretrain/Step": 477, "Pretrain/Step Time": 8.519088946282864} +{"Pretrain/Learning Rate": 4.99468771963447e-05, "Pretrain/Loss": 2.2048397064208984, "Pretrain/Loss (Raw)": 2.3035523891448975, "Pretrain/Step": 478, "Pretrain/Step Time": 8.514870909973979} +{"Pretrain/Learning Rate": 4.994632259137935e-05, "Pretrain/Loss": 2.2034921646118164, "Pretrain/Loss (Raw)": 2.164801597595215, "Pretrain/Step": 479, "Pretrain/Step Time": 8.507211150601506} +{"Pretrain/Learning Rate": 4.9945765109486506e-05, "Pretrain/Loss": 2.204218626022339, "Pretrain/Loss (Raw)": 2.2357921600341797, "Pretrain/Step": 480, "Pretrain/Step Time": 8.508238414302468} +{"Pretrain/Learning Rate": 4.99452047507305e-05, "Pretrain/Loss": 2.207155227661133, "Pretrain/Loss (Raw)": 2.0770556926727295, "Pretrain/Step": 481, "Pretrain/Step Time": 8.506079973652959} +{"Pretrain/Learning Rate": 4.994464151517593e-05, "Pretrain/Loss": 2.206683397293091, "Pretrain/Loss (Raw)": 2.1781790256500244, "Pretrain/Step": 482, "Pretrain/Step Time": 8.513740299269557} +{"Pretrain/Learning Rate": 4.994407540288775e-05, "Pretrain/Loss": 2.2037291526794434, "Pretrain/Loss (Raw)": 1.9183881282806396, "Pretrain/Step": 483, "Pretrain/Step Time": 8.518720798194408} +{"Pretrain/Learning Rate": 4.994350641393126e-05, "Pretrain/Loss": 2.2029433250427246, "Pretrain/Loss (Raw)": 2.0947046279907227, "Pretrain/Step": 484, "Pretrain/Step Time": 8.517262617126107} +{"Pretrain/Learning Rate": 4.9942934548372077e-05, "Pretrain/Loss": 2.1976048946380615, "Pretrain/Loss (Raw)": 2.102829933166504, "Pretrain/Step": 485, "Pretrain/Step Time": 8.509929422289133} +{"Pretrain/Learning Rate": 4.994235980627614e-05, "Pretrain/Loss": 2.196770191192627, "Pretrain/Loss (Raw)": 2.1161422729492188, "Pretrain/Step": 486, "Pretrain/Step Time": 8.508641317486763} +{"Pretrain/Learning Rate": 4.9941782187709746e-05, "Pretrain/Loss": 2.196507215499878, "Pretrain/Loss (Raw)": 2.148066997528076, "Pretrain/Step": 487, "Pretrain/Step Time": 8.503730203956366} +{"Pretrain/Learning Rate": 4.994120169273949e-05, "Pretrain/Loss": 2.200547695159912, "Pretrain/Loss (Raw)": 2.5997989177703857, "Pretrain/Step": 488, "Pretrain/Step Time": 8.509208969771862} +{"Pretrain/Learning Rate": 4.9940618321432344e-05, "Pretrain/Loss": 2.197917938232422, "Pretrain/Loss (Raw)": 2.0646681785583496, "Pretrain/Step": 489, "Pretrain/Step Time": 8.519383622333407} +{"Pretrain/Learning Rate": 4.994003207385556e-05, "Pretrain/Loss": 2.197537660598755, "Pretrain/Loss (Raw)": 1.9874244928359985, "Pretrain/Step": 490, "Pretrain/Step Time": 8.523669531568885} +{"Pretrain/Learning Rate": 4.9939442950076755e-05, "Pretrain/Loss": 2.1960840225219727, "Pretrain/Loss (Raw)": 1.9919747114181519, "Pretrain/Step": 491, "Pretrain/Step Time": 8.514900233596563} +{"Pretrain/Learning Rate": 4.9938850950163864e-05, "Pretrain/Loss": 2.1925814151763916, "Pretrain/Loss (Raw)": 2.1272358894348145, "Pretrain/Step": 492, "Pretrain/Step Time": 8.51323170401156} +{"Pretrain/Learning Rate": 4.9938256074185174e-05, "Pretrain/Loss": 2.1938140392303467, "Pretrain/Loss (Raw)": 2.295867919921875, "Pretrain/Step": 493, "Pretrain/Step Time": 8.508703337982297} +{"Pretrain/Learning Rate": 4.993765832220928e-05, "Pretrain/Loss": 2.1941404342651367, "Pretrain/Loss (Raw)": 2.2497506141662598, "Pretrain/Step": 494, "Pretrain/Step Time": 8.510889889672399} +{"Pretrain/Learning Rate": 4.993705769430511e-05, "Pretrain/Loss": 2.1952288150787354, "Pretrain/Loss (Raw)": 2.1817708015441895, "Pretrain/Step": 495, "Pretrain/Step Time": 8.518059268593788} +{"Pretrain/Learning Rate": 4.9936454190541945e-05, "Pretrain/Loss": 2.194040536880493, "Pretrain/Loss (Raw)": 2.0857293605804443, "Pretrain/Step": 496, "Pretrain/Step Time": 8.523745069280267} +{"Pretrain/Learning Rate": 4.993584781098939e-05, "Pretrain/Loss": 2.196082592010498, "Pretrain/Loss (Raw)": 2.336459159851074, "Pretrain/Step": 497, "Pretrain/Step Time": 8.518694512546062} +{"Pretrain/Learning Rate": 4.993523855571735e-05, "Pretrain/Loss": 2.195382833480835, "Pretrain/Loss (Raw)": 2.1477909088134766, "Pretrain/Step": 498, "Pretrain/Step Time": 8.505855739116669} +{"Pretrain/Learning Rate": 4.99346264247961e-05, "Pretrain/Loss": 2.196953296661377, "Pretrain/Loss (Raw)": 2.337083578109741, "Pretrain/Step": 499, "Pretrain/Step Time": 8.50887449644506} +{"Pretrain/Learning Rate": 4.993401141829625e-05, "Pretrain/Loss": 2.1961052417755127, "Pretrain/Loss (Raw)": 2.2084460258483887, "Pretrain/Step": 500, "Pretrain/Step Time": 8.516174810007215} +{"Pretrain/Learning Rate": 4.99333935362887e-05, "Pretrain/Loss": 2.1989026069641113, "Pretrain/Loss (Raw)": 2.359635353088379, "Pretrain/Step": 501, "Pretrain/Step Time": 8.522573176771402} +{"Pretrain/Learning Rate": 4.993277277884471e-05, "Pretrain/Loss": 2.195767402648926, "Pretrain/Loss (Raw)": 1.8443374633789062, "Pretrain/Step": 502, "Pretrain/Step Time": 8.522639639675617} +{"Pretrain/Learning Rate": 4.993214914603588e-05, "Pretrain/Loss": 2.1965267658233643, "Pretrain/Loss (Raw)": 2.1287620067596436, "Pretrain/Step": 503, "Pretrain/Step Time": 8.523641465231776} +{"Pretrain/Learning Rate": 4.993152263793414e-05, "Pretrain/Loss": 2.1958131790161133, "Pretrain/Loss (Raw)": 2.148664712905884, "Pretrain/Step": 504, "Pretrain/Step Time": 8.507569294422865} +{"Pretrain/Learning Rate": 4.993089325461171e-05, "Pretrain/Loss": 2.1952743530273438, "Pretrain/Loss (Raw)": 2.0691332817077637, "Pretrain/Step": 505, "Pretrain/Step Time": 8.510460337623954} +{"Pretrain/Learning Rate": 4.99302609961412e-05, "Pretrain/Loss": 2.1944973468780518, "Pretrain/Loss (Raw)": 2.2107696533203125, "Pretrain/Step": 506, "Pretrain/Step Time": 8.51622749492526} +{"Pretrain/Learning Rate": 4.9929625862595516e-05, "Pretrain/Loss": 2.1950714588165283, "Pretrain/Loss (Raw)": 2.229257583618164, "Pretrain/Step": 507, "Pretrain/Step Time": 8.510992491617799} +{"Pretrain/Learning Rate": 4.9928987854047905e-05, "Pretrain/Loss": 2.194889783859253, "Pretrain/Loss (Raw)": 2.183580160140991, "Pretrain/Step": 508, "Pretrain/Step Time": 8.509304052218795} +{"Pretrain/Learning Rate": 4.992834697057195e-05, "Pretrain/Loss": 2.192045211791992, "Pretrain/Loss (Raw)": 1.9045381546020508, "Pretrain/Step": 509, "Pretrain/Step Time": 8.51121199131012} +{"Pretrain/Learning Rate": 4.992770321224155e-05, "Pretrain/Loss": 2.1916160583496094, "Pretrain/Loss (Raw)": 2.355968713760376, "Pretrain/Step": 510, "Pretrain/Step Time": 8.512130314484239} +{"Pretrain/Learning Rate": 4.992705657913095e-05, "Pretrain/Loss": 2.189866065979004, "Pretrain/Loss (Raw)": 2.0755465030670166, "Pretrain/Step": 511, "Pretrain/Step Time": 8.51775555498898} +{"Pretrain/Learning Rate": 4.9926407071314736e-05, "Pretrain/Loss": 2.1885080337524414, "Pretrain/Loss (Raw)": 2.0053153038024902, "Pretrain/Step": 512, "Pretrain/Step Time": 8.521872436627746} +{"Pretrain/Learning Rate": 4.9925754688867796e-05, "Pretrain/Loss": 2.1869564056396484, "Pretrain/Loss (Raw)": 2.1702606678009033, "Pretrain/Step": 513, "Pretrain/Step Time": 8.519552627578378} +{"Pretrain/Learning Rate": 4.992509943186537e-05, "Pretrain/Loss": 2.1877331733703613, "Pretrain/Loss (Raw)": 2.1729555130004883, "Pretrain/Step": 514, "Pretrain/Step Time": 8.520195286720991} +{"Pretrain/Learning Rate": 4.992444130038302e-05, "Pretrain/Loss": 2.186757802963257, "Pretrain/Loss (Raw)": 2.0164124965667725, "Pretrain/Step": 515, "Pretrain/Step Time": 8.508878847584128} +{"Pretrain/Learning Rate": 4.992378029449666e-05, "Pretrain/Loss": 2.1867051124572754, "Pretrain/Loss (Raw)": 2.2860898971557617, "Pretrain/Step": 516, "Pretrain/Step Time": 8.50757403485477} +{"Pretrain/Learning Rate": 4.9923116414282514e-05, "Pretrain/Loss": 2.1895546913146973, "Pretrain/Loss (Raw)": 2.3850409984588623, "Pretrain/Step": 517, "Pretrain/Step Time": 8.508181352168322} +{"Pretrain/Learning Rate": 4.992244965981714e-05, "Pretrain/Loss": 2.187289237976074, "Pretrain/Loss (Raw)": 2.071545362472534, "Pretrain/Step": 518, "Pretrain/Step Time": 8.513352576643229} +{"Pretrain/Learning Rate": 4.9921780031177425e-05, "Pretrain/Loss": 2.186391830444336, "Pretrain/Loss (Raw)": 2.1555871963500977, "Pretrain/Step": 519, "Pretrain/Step Time": 8.512448947876692} +{"Pretrain/Learning Rate": 4.992110752844061e-05, "Pretrain/Loss": 2.1861984729766846, "Pretrain/Loss (Raw)": 2.2256288528442383, "Pretrain/Step": 520, "Pretrain/Step Time": 8.514208475127816} +{"Pretrain/Learning Rate": 4.992043215168424e-05, "Pretrain/Loss": 2.1867482662200928, "Pretrain/Loss (Raw)": 2.2352521419525146, "Pretrain/Step": 521, "Pretrain/Step Time": 8.505837326869369} +{"Pretrain/Learning Rate": 4.99197539009862e-05, "Pretrain/Loss": 2.1847646236419678, "Pretrain/Loss (Raw)": 2.037006378173828, "Pretrain/Step": 522, "Pretrain/Step Time": 8.504907861351967} +{"Pretrain/Learning Rate": 4.9919072776424726e-05, "Pretrain/Loss": 2.1839637756347656, "Pretrain/Loss (Raw)": 2.044761896133423, "Pretrain/Step": 523, "Pretrain/Step Time": 8.506598701700568} +{"Pretrain/Learning Rate": 4.9918388778078347e-05, "Pretrain/Loss": 2.1821653842926025, "Pretrain/Loss (Raw)": 2.137777328491211, "Pretrain/Step": 524, "Pretrain/Step Time": 8.505550047382712} +{"Pretrain/Learning Rate": 4.991770190602596e-05, "Pretrain/Loss": 2.1846890449523926, "Pretrain/Loss (Raw)": 2.1628360748291016, "Pretrain/Step": 525, "Pretrain/Step Time": 8.506166065111756} +{"Pretrain/Learning Rate": 4.991701216034677e-05, "Pretrain/Loss": 2.184464931488037, "Pretrain/Loss (Raw)": 2.23329758644104, "Pretrain/Step": 526, "Pretrain/Step Time": 8.514200510457158} +{"Pretrain/Learning Rate": 4.9916319541120324e-05, "Pretrain/Loss": 2.1844863891601562, "Pretrain/Loss (Raw)": 2.1206090450286865, "Pretrain/Step": 527, "Pretrain/Step Time": 8.514080392196774} +{"Pretrain/Learning Rate": 4.99156240484265e-05, "Pretrain/Loss": 2.181600332260132, "Pretrain/Loss (Raw)": 1.9479869604110718, "Pretrain/Step": 528, "Pretrain/Step Time": 8.508094266057014} +{"Pretrain/Learning Rate": 4.9914925682345504e-05, "Pretrain/Loss": 2.180293083190918, "Pretrain/Loss (Raw)": 1.951987385749817, "Pretrain/Step": 529, "Pretrain/Step Time": 8.51306239515543} +{"Pretrain/Learning Rate": 4.991422444295788e-05, "Pretrain/Loss": 2.181436061859131, "Pretrain/Loss (Raw)": 2.1358158588409424, "Pretrain/Step": 530, "Pretrain/Step Time": 8.514154940843582} +{"Pretrain/Learning Rate": 4.9913520330344486e-05, "Pretrain/Loss": 2.181928873062134, "Pretrain/Loss (Raw)": 2.1044907569885254, "Pretrain/Step": 531, "Pretrain/Step Time": 8.529253348708153} +{"Pretrain/Learning Rate": 4.991281334458654e-05, "Pretrain/Loss": 2.1818935871124268, "Pretrain/Loss (Raw)": 2.0558557510375977, "Pretrain/Step": 532, "Pretrain/Step Time": 8.52920027077198} +{"Pretrain/Learning Rate": 4.991210348576556e-05, "Pretrain/Loss": 2.181710958480835, "Pretrain/Loss (Raw)": 2.3371870517730713, "Pretrain/Step": 533, "Pretrain/Step Time": 8.52652451954782} +{"Pretrain/Learning Rate": 4.991139075396342e-05, "Pretrain/Loss": 2.18257999420166, "Pretrain/Loss (Raw)": 2.287294864654541, "Pretrain/Step": 534, "Pretrain/Step Time": 8.525859545916319} +{"Pretrain/Learning Rate": 4.991067514926231e-05, "Pretrain/Loss": 2.18568754196167, "Pretrain/Loss (Raw)": 2.375260829925537, "Pretrain/Step": 535, "Pretrain/Step Time": 8.519618460908532} +{"Pretrain/Learning Rate": 4.990995667174476e-05, "Pretrain/Loss": 2.1840996742248535, "Pretrain/Loss (Raw)": 2.033581018447876, "Pretrain/Step": 536, "Pretrain/Step Time": 8.519670253619552} +{"Pretrain/Learning Rate": 4.990923532149362e-05, "Pretrain/Loss": 2.1836163997650146, "Pretrain/Loss (Raw)": 2.212942123413086, "Pretrain/Step": 537, "Pretrain/Step Time": 8.526479486376047} +{"Pretrain/Learning Rate": 4.990851109859209e-05, "Pretrain/Loss": 2.183124542236328, "Pretrain/Loss (Raw)": 2.081721544265747, "Pretrain/Step": 538, "Pretrain/Step Time": 8.524640725925565} +{"Pretrain/Learning Rate": 4.9907784003123695e-05, "Pretrain/Loss": 2.1823225021362305, "Pretrain/Loss (Raw)": 2.205970048904419, "Pretrain/Step": 539, "Pretrain/Step Time": 8.529316572472453} +{"Pretrain/Learning Rate": 4.9907054035172273e-05, "Pretrain/Loss": 2.182589530944824, "Pretrain/Loss (Raw)": 2.1997692584991455, "Pretrain/Step": 540, "Pretrain/Step Time": 8.52551088295877} +{"Pretrain/Learning Rate": 4.9906321194822014e-05, "Pretrain/Loss": 2.178903102874756, "Pretrain/Loss (Raw)": 2.0466806888580322, "Pretrain/Step": 541, "Pretrain/Step Time": 8.516722708940506} +{"Pretrain/Learning Rate": 4.9905585482157436e-05, "Pretrain/Loss": 2.1794466972351074, "Pretrain/Loss (Raw)": 2.189776659011841, "Pretrain/Step": 542, "Pretrain/Step Time": 8.521079391241074} +{"Pretrain/Learning Rate": 4.990484689726338e-05, "Pretrain/Loss": 2.1793673038482666, "Pretrain/Loss (Raw)": 2.3949737548828125, "Pretrain/Step": 543, "Pretrain/Step Time": 8.517497764900327} +{"Pretrain/Learning Rate": 4.990410544022502e-05, "Pretrain/Loss": 2.17903733253479, "Pretrain/Loss (Raw)": 2.357940196990967, "Pretrain/Step": 544, "Pretrain/Step Time": 8.521788157522678} +{"Pretrain/Learning Rate": 4.9903361111127864e-05, "Pretrain/Loss": 2.1813621520996094, "Pretrain/Loss (Raw)": 2.349146604537964, "Pretrain/Step": 545, "Pretrain/Step Time": 8.518180565908551} +{"Pretrain/Learning Rate": 4.990261391005777e-05, "Pretrain/Loss": 2.1792678833007812, "Pretrain/Loss (Raw)": 2.1232962608337402, "Pretrain/Step": 546, "Pretrain/Step Time": 8.513877045363188} +{"Pretrain/Learning Rate": 4.9901863837100886e-05, "Pretrain/Loss": 2.1794843673706055, "Pretrain/Loss (Raw)": 2.238565444946289, "Pretrain/Step": 547, "Pretrain/Step Time": 8.51896844431758} +{"Pretrain/Learning Rate": 4.9901110892343724e-05, "Pretrain/Loss": 2.1766254901885986, "Pretrain/Loss (Raw)": 1.9730616807937622, "Pretrain/Step": 548, "Pretrain/Step Time": 8.525071756914258} +{"Pretrain/Learning Rate": 4.9900355075873116e-05, "Pretrain/Loss": 2.1754298210144043, "Pretrain/Loss (Raw)": 2.238070011138916, "Pretrain/Step": 549, "Pretrain/Step Time": 8.525656646117568} +{"Pretrain/Learning Rate": 4.989959638777623e-05, "Pretrain/Loss": 2.1711323261260986, "Pretrain/Loss (Raw)": 1.8881030082702637, "Pretrain/Step": 550, "Pretrain/Step Time": 8.526857692748308} +{"Pretrain/Learning Rate": 4.989883482814056e-05, "Pretrain/Loss": 2.1693010330200195, "Pretrain/Loss (Raw)": 1.9193518161773682, "Pretrain/Step": 551, "Pretrain/Step Time": 8.527533641085029} +{"Pretrain/Learning Rate": 4.989807039705392e-05, "Pretrain/Loss": 2.1666412353515625, "Pretrain/Loss (Raw)": 2.1910200119018555, "Pretrain/Step": 552, "Pretrain/Step Time": 8.516056347638369} +{"Pretrain/Learning Rate": 4.989730309460449e-05, "Pretrain/Loss": 2.165349006652832, "Pretrain/Loss (Raw)": 2.0469510555267334, "Pretrain/Step": 553, "Pretrain/Step Time": 8.5179103333503} +{"Pretrain/Learning Rate": 4.989653292088074e-05, "Pretrain/Loss": 2.16496205329895, "Pretrain/Loss (Raw)": 2.200286626815796, "Pretrain/Step": 554, "Pretrain/Step Time": 8.525949945673347} +{"Pretrain/Learning Rate": 4.9895759875971495e-05, "Pretrain/Loss": 2.1648192405700684, "Pretrain/Loss (Raw)": 2.2380869388580322, "Pretrain/Step": 555, "Pretrain/Step Time": 8.527444805949926} +{"Pretrain/Learning Rate": 4.9894983959965915e-05, "Pretrain/Loss": 2.1640431880950928, "Pretrain/Loss (Raw)": 2.138697624206543, "Pretrain/Step": 556, "Pretrain/Step Time": 8.523155445232987} +{"Pretrain/Learning Rate": 4.989420517295347e-05, "Pretrain/Loss": 2.1581461429595947, "Pretrain/Loss (Raw)": 2.0810158252716064, "Pretrain/Step": 557, "Pretrain/Step Time": 8.51901352033019} +{"Pretrain/Learning Rate": 4.9893423515023986e-05, "Pretrain/Loss": 2.1582276821136475, "Pretrain/Loss (Raw)": 2.0562033653259277, "Pretrain/Step": 558, "Pretrain/Step Time": 8.520977716892958} +{"Pretrain/Learning Rate": 4.9892638986267594e-05, "Pretrain/Loss": 2.157573699951172, "Pretrain/Loss (Raw)": 2.1189889907836914, "Pretrain/Step": 559, "Pretrain/Step Time": 8.515430942177773} +{"Pretrain/Learning Rate": 4.989185158677478e-05, "Pretrain/Loss": 2.158780813217163, "Pretrain/Loss (Raw)": 2.3277406692504883, "Pretrain/Step": 560, "Pretrain/Step Time": 8.521530639380217} +{"Pretrain/Learning Rate": 4.9891061316636346e-05, "Pretrain/Loss": 2.156477928161621, "Pretrain/Loss (Raw)": 2.051494836807251, "Pretrain/Step": 561, "Pretrain/Step Time": 8.520015578716993} +{"Pretrain/Learning Rate": 4.9890268175943425e-05, "Pretrain/Loss": 2.155698299407959, "Pretrain/Loss (Raw)": 2.0159130096435547, "Pretrain/Step": 562, "Pretrain/Step Time": 8.521231386810541} +{"Pretrain/Learning Rate": 4.9889472164787496e-05, "Pretrain/Loss": 2.15714168548584, "Pretrain/Loss (Raw)": 2.3712692260742188, "Pretrain/Step": 563, "Pretrain/Step Time": 8.517711265012622} +{"Pretrain/Learning Rate": 4.9888673283260355e-05, "Pretrain/Loss": 2.159029245376587, "Pretrain/Loss (Raw)": 2.2270188331604004, "Pretrain/Step": 564, "Pretrain/Step Time": 8.513375436887145} +{"Pretrain/Learning Rate": 4.9887871531454134e-05, "Pretrain/Loss": 2.156728744506836, "Pretrain/Loss (Raw)": 2.07137131690979, "Pretrain/Step": 565, "Pretrain/Step Time": 8.516872948035598} +{"Pretrain/Learning Rate": 4.988706690946129e-05, "Pretrain/Loss": 2.1575305461883545, "Pretrain/Loss (Raw)": 2.2840538024902344, "Pretrain/Step": 566, "Pretrain/Step Time": 8.528762936592102} +{"Pretrain/Learning Rate": 4.9886259417374616e-05, "Pretrain/Loss": 2.1586480140686035, "Pretrain/Loss (Raw)": 2.4445674419403076, "Pretrain/Step": 567, "Pretrain/Step Time": 8.529197253286839} +{"Pretrain/Learning Rate": 4.988544905528724e-05, "Pretrain/Loss": 2.155611038208008, "Pretrain/Loss (Raw)": 1.8963297605514526, "Pretrain/Step": 568, "Pretrain/Step Time": 8.529041104018688} +{"Pretrain/Learning Rate": 4.9884635823292615e-05, "Pretrain/Loss": 2.156160831451416, "Pretrain/Loss (Raw)": 2.2730798721313477, "Pretrain/Step": 569, "Pretrain/Step Time": 8.518995003774762} +{"Pretrain/Learning Rate": 4.988381972148452e-05, "Pretrain/Loss": 2.1555328369140625, "Pretrain/Loss (Raw)": 2.1287949085235596, "Pretrain/Step": 570, "Pretrain/Step Time": 8.518737241625786} +{"Pretrain/Learning Rate": 4.9883000749957086e-05, "Pretrain/Loss": 2.155224084854126, "Pretrain/Loss (Raw)": 2.0728697776794434, "Pretrain/Step": 571, "Pretrain/Step Time": 8.51671320386231} +{"Pretrain/Learning Rate": 4.988217890880475e-05, "Pretrain/Loss": 2.1569652557373047, "Pretrain/Loss (Raw)": 2.2136318683624268, "Pretrain/Step": 572, "Pretrain/Step Time": 8.523299979045987} +{"Pretrain/Learning Rate": 4.98813541981223e-05, "Pretrain/Loss": 2.150927782058716, "Pretrain/Loss (Raw)": 2.2222440242767334, "Pretrain/Step": 573, "Pretrain/Step Time": 8.527080295607448} +{"Pretrain/Learning Rate": 4.988052661800483e-05, "Pretrain/Loss": 2.1530981063842773, "Pretrain/Loss (Raw)": 2.190662145614624, "Pretrain/Step": 574, "Pretrain/Step Time": 8.515504855662584} +{"Pretrain/Learning Rate": 4.98796961685478e-05, "Pretrain/Loss": 2.152937889099121, "Pretrain/Loss (Raw)": 2.0810294151306152, "Pretrain/Step": 575, "Pretrain/Step Time": 8.512095630168915} +{"Pretrain/Learning Rate": 4.987886284984695e-05, "Pretrain/Loss": 2.1516036987304688, "Pretrain/Loss (Raw)": 2.327960252761841, "Pretrain/Step": 576, "Pretrain/Step Time": 8.511311125010252} +{"Pretrain/Learning Rate": 4.987802666199842e-05, "Pretrain/Loss": 2.1555395126342773, "Pretrain/Loss (Raw)": 2.674320936203003, "Pretrain/Step": 577, "Pretrain/Step Time": 8.513149408623576} +{"Pretrain/Learning Rate": 4.987718760509863e-05, "Pretrain/Loss": 2.157693386077881, "Pretrain/Loss (Raw)": 2.1547629833221436, "Pretrain/Step": 578, "Pretrain/Step Time": 8.520369866862893} +{"Pretrain/Learning Rate": 4.987634567924433e-05, "Pretrain/Loss": 2.1561241149902344, "Pretrain/Loss (Raw)": 2.2519311904907227, "Pretrain/Step": 579, "Pretrain/Step Time": 8.519205121323466} +{"Pretrain/Learning Rate": 4.9875500884532634e-05, "Pretrain/Loss": 2.154872179031372, "Pretrain/Loss (Raw)": 2.1175756454467773, "Pretrain/Step": 580, "Pretrain/Step Time": 8.51609406620264} +{"Pretrain/Learning Rate": 4.987465322106095e-05, "Pretrain/Loss": 2.155120372772217, "Pretrain/Loss (Raw)": 2.216533899307251, "Pretrain/Step": 581, "Pretrain/Step Time": 8.50612262263894} +{"Pretrain/Learning Rate": 4.987380268892705e-05, "Pretrain/Loss": 2.1573076248168945, "Pretrain/Loss (Raw)": 2.179957628250122, "Pretrain/Step": 582, "Pretrain/Step Time": 8.507313385605812} +{"Pretrain/Learning Rate": 4.987294928822901e-05, "Pretrain/Loss": 2.1581263542175293, "Pretrain/Loss (Raw)": 2.233813524246216, "Pretrain/Step": 583, "Pretrain/Step Time": 8.516418553888798} +{"Pretrain/Learning Rate": 4.9872093019065255e-05, "Pretrain/Loss": 2.1588592529296875, "Pretrain/Loss (Raw)": 2.336169719696045, "Pretrain/Step": 584, "Pretrain/Step Time": 8.522917781025171} +{"Pretrain/Learning Rate": 4.987123388153453e-05, "Pretrain/Loss": 2.15775990486145, "Pretrain/Loss (Raw)": 2.2011168003082275, "Pretrain/Step": 585, "Pretrain/Step Time": 8.531387686729431} +{"Pretrain/Learning Rate": 4.9870371875735916e-05, "Pretrain/Loss": 2.1583762168884277, "Pretrain/Loss (Raw)": 2.1209099292755127, "Pretrain/Step": 586, "Pretrain/Step Time": 8.528463846072555} +{"Pretrain/Learning Rate": 4.986950700176882e-05, "Pretrain/Loss": 2.156301498413086, "Pretrain/Loss (Raw)": 2.0280189514160156, "Pretrain/Step": 587, "Pretrain/Step Time": 8.523541335016489} +{"Pretrain/Learning Rate": 4.9868639259732996e-05, "Pretrain/Loss": 2.1571943759918213, "Pretrain/Loss (Raw)": 2.253239154815674, "Pretrain/Step": 588, "Pretrain/Step Time": 8.523497520014644} +{"Pretrain/Learning Rate": 4.986776864972851e-05, "Pretrain/Loss": 2.157862663269043, "Pretrain/Loss (Raw)": 2.1806414127349854, "Pretrain/Step": 589, "Pretrain/Step Time": 8.52815935201943} +{"Pretrain/Learning Rate": 4.9866895171855756e-05, "Pretrain/Loss": 2.1558170318603516, "Pretrain/Loss (Raw)": 1.8313658237457275, "Pretrain/Step": 590, "Pretrain/Step Time": 8.52317263931036} +{"Pretrain/Learning Rate": 4.9866018826215475e-05, "Pretrain/Loss": 2.1551506519317627, "Pretrain/Loss (Raw)": 2.192767381668091, "Pretrain/Step": 591, "Pretrain/Step Time": 8.52041251398623} +{"Pretrain/Learning Rate": 4.9865139612908736e-05, "Pretrain/Loss": 2.156704902648926, "Pretrain/Loss (Raw)": 2.3433070182800293, "Pretrain/Step": 592, "Pretrain/Step Time": 8.518393954262137} +{"Pretrain/Learning Rate": 4.9864257532036924e-05, "Pretrain/Loss": 2.156785249710083, "Pretrain/Loss (Raw)": 2.091913938522339, "Pretrain/Step": 593, "Pretrain/Step Time": 8.5126943718642} +{"Pretrain/Learning Rate": 4.9863372583701765e-05, "Pretrain/Loss": 2.1561312675476074, "Pretrain/Loss (Raw)": 2.104412078857422, "Pretrain/Step": 594, "Pretrain/Step Time": 8.51535626128316} +{"Pretrain/Learning Rate": 4.9862484768005324e-05, "Pretrain/Loss": 2.155714750289917, "Pretrain/Loss (Raw)": 2.039494037628174, "Pretrain/Step": 595, "Pretrain/Step Time": 8.516007546335459} +{"Pretrain/Learning Rate": 4.986159408504999e-05, "Pretrain/Loss": 2.15609073638916, "Pretrain/Loss (Raw)": 2.070268392562866, "Pretrain/Step": 596, "Pretrain/Step Time": 8.523755611851811} +{"Pretrain/Learning Rate": 4.986070053493846e-05, "Pretrain/Loss": 2.157834529876709, "Pretrain/Loss (Raw)": 2.05060076713562, "Pretrain/Step": 597, "Pretrain/Step Time": 8.526204444468021} +{"Pretrain/Learning Rate": 4.985980411777381e-05, "Pretrain/Loss": 2.1602110862731934, "Pretrain/Loss (Raw)": 2.112387180328369, "Pretrain/Step": 598, "Pretrain/Step Time": 8.520686572417617} +{"Pretrain/Learning Rate": 4.9858904833659404e-05, "Pretrain/Loss": 2.160935878753662, "Pretrain/Loss (Raw)": 2.10455584526062, "Pretrain/Step": 599, "Pretrain/Step Time": 8.504977276548743} +{"Pretrain/Learning Rate": 4.985800268269895e-05, "Pretrain/Loss": 2.162109375, "Pretrain/Loss (Raw)": 2.191514492034912, "Pretrain/Step": 600, "Pretrain/Step Time": 8.509085731580853} +{"Pretrain/Learning Rate": 4.9857097664996486e-05, "Pretrain/Loss": 2.161129951477051, "Pretrain/Loss (Raw)": 2.0847890377044678, "Pretrain/Step": 601, "Pretrain/Step Time": 8.508791761472821} +{"Pretrain/Learning Rate": 4.98561897806564e-05, "Pretrain/Loss": 2.162358283996582, "Pretrain/Loss (Raw)": 2.23248028755188, "Pretrain/Step": 602, "Pretrain/Step Time": 8.506326468661427} +{"Pretrain/Learning Rate": 4.985527902978337e-05, "Pretrain/Loss": 2.160567283630371, "Pretrain/Loss (Raw)": 2.050046682357788, "Pretrain/Step": 603, "Pretrain/Step Time": 8.522598734125495} +{"Pretrain/Learning Rate": 4.985436541248245e-05, "Pretrain/Loss": 2.159979820251465, "Pretrain/Loss (Raw)": 2.166954755783081, "Pretrain/Step": 604, "Pretrain/Step Time": 8.515815438702703} +{"Pretrain/Learning Rate": 4.985344892885899e-05, "Pretrain/Loss": 2.1609158515930176, "Pretrain/Loss (Raw)": 2.1371641159057617, "Pretrain/Step": 605, "Pretrain/Step Time": 8.513917738571763} +{"Pretrain/Learning Rate": 4.985252957901869e-05, "Pretrain/Loss": 2.159451961517334, "Pretrain/Loss (Raw)": 2.1162006855010986, "Pretrain/Step": 606, "Pretrain/Step Time": 8.516361519694328} +{"Pretrain/Learning Rate": 4.985160736306756e-05, "Pretrain/Loss": 2.1589503288269043, "Pretrain/Loss (Raw)": 2.1005914211273193, "Pretrain/Step": 607, "Pretrain/Step Time": 8.516955759376287} +{"Pretrain/Learning Rate": 4.985068228111198e-05, "Pretrain/Loss": 2.1586389541625977, "Pretrain/Loss (Raw)": 2.195936441421509, "Pretrain/Step": 608, "Pretrain/Step Time": 8.525957342237234} +{"Pretrain/Learning Rate": 4.984975433325861e-05, "Pretrain/Loss": 2.1592917442321777, "Pretrain/Loss (Raw)": 2.1606147289276123, "Pretrain/Step": 609, "Pretrain/Step Time": 8.530751699581742} +{"Pretrain/Learning Rate": 4.9848823519614475e-05, "Pretrain/Loss": 2.1590261459350586, "Pretrain/Loss (Raw)": 2.1441657543182373, "Pretrain/Step": 610, "Pretrain/Step Time": 8.520091580227017} +{"Pretrain/Learning Rate": 4.9847889840286924e-05, "Pretrain/Loss": 2.1618525981903076, "Pretrain/Loss (Raw)": 2.280177354812622, "Pretrain/Step": 611, "Pretrain/Step Time": 8.514488676562905} +{"Pretrain/Learning Rate": 4.984695329538362e-05, "Pretrain/Loss": 2.163118362426758, "Pretrain/Loss (Raw)": 2.256721258163452, "Pretrain/Step": 612, "Pretrain/Step Time": 8.511080369353294} +{"Pretrain/Learning Rate": 4.984601388501258e-05, "Pretrain/Loss": 2.163760185241699, "Pretrain/Loss (Raw)": 2.1850032806396484, "Pretrain/Step": 613, "Pretrain/Step Time": 8.51186710037291} +{"Pretrain/Learning Rate": 4.9845071609282145e-05, "Pretrain/Loss": 2.1644651889801025, "Pretrain/Loss (Raw)": 2.2063515186309814, "Pretrain/Step": 614, "Pretrain/Step Time": 8.515370845794678} +{"Pretrain/Learning Rate": 4.984412646830098e-05, "Pretrain/Loss": 2.164172887802124, "Pretrain/Loss (Raw)": 2.1106667518615723, "Pretrain/Step": 615, "Pretrain/Step Time": 8.526843328028917} +{"Pretrain/Learning Rate": 4.9843178462178084e-05, "Pretrain/Loss": 2.1607863903045654, "Pretrain/Loss (Raw)": 2.1663384437561035, "Pretrain/Step": 616, "Pretrain/Step Time": 8.523048017174006} +{"Pretrain/Learning Rate": 4.984222759102277e-05, "Pretrain/Loss": 2.1649508476257324, "Pretrain/Loss (Raw)": 2.5977344512939453, "Pretrain/Step": 617, "Pretrain/Step Time": 8.51171457581222} +{"Pretrain/Learning Rate": 4.984127385494472e-05, "Pretrain/Loss": 2.164862632751465, "Pretrain/Loss (Raw)": 1.9760818481445312, "Pretrain/Step": 618, "Pretrain/Step Time": 8.506130956113338} +{"Pretrain/Learning Rate": 4.984031725405392e-05, "Pretrain/Loss": 2.1663942337036133, "Pretrain/Loss (Raw)": 2.188044548034668, "Pretrain/Step": 619, "Pretrain/Step Time": 8.511113226413727} +{"Pretrain/Learning Rate": 4.983935778846067e-05, "Pretrain/Loss": 2.166901111602783, "Pretrain/Loss (Raw)": 2.192128896713257, "Pretrain/Step": 620, "Pretrain/Step Time": 8.52004843018949} +{"Pretrain/Learning Rate": 4.9838395458275636e-05, "Pretrain/Loss": 2.165236711502075, "Pretrain/Loss (Raw)": 2.082820415496826, "Pretrain/Step": 621, "Pretrain/Step Time": 8.523691331967711} +{"Pretrain/Learning Rate": 4.98374302636098e-05, "Pretrain/Loss": 2.164140462875366, "Pretrain/Loss (Raw)": 2.1094181537628174, "Pretrain/Step": 622, "Pretrain/Step Time": 8.52538039907813} +{"Pretrain/Learning Rate": 4.983646220457446e-05, "Pretrain/Loss": 2.164126396179199, "Pretrain/Loss (Raw)": 2.1799705028533936, "Pretrain/Step": 623, "Pretrain/Step Time": 8.519178269430995} +{"Pretrain/Learning Rate": 4.9835491281281274e-05, "Pretrain/Loss": 2.1651418209075928, "Pretrain/Loss (Raw)": 2.215719699859619, "Pretrain/Step": 624, "Pretrain/Step Time": 8.511936895549297} +{"Pretrain/Learning Rate": 4.9834517493842196e-05, "Pretrain/Loss": 2.1636269092559814, "Pretrain/Loss (Raw)": 2.1425580978393555, "Pretrain/Step": 625, "Pretrain/Step Time": 8.51723425835371} +{"Pretrain/Learning Rate": 4.983354084236954e-05, "Pretrain/Loss": 2.163242816925049, "Pretrain/Loss (Raw)": 2.0985875129699707, "Pretrain/Step": 626, "Pretrain/Step Time": 8.524807728827} +{"Pretrain/Learning Rate": 4.983256132697594e-05, "Pretrain/Loss": 2.159554958343506, "Pretrain/Loss (Raw)": 1.865068793296814, "Pretrain/Step": 627, "Pretrain/Step Time": 8.521563919261098} +{"Pretrain/Learning Rate": 4.983157894777435e-05, "Pretrain/Loss": 2.159008741378784, "Pretrain/Loss (Raw)": 2.1385180950164795, "Pretrain/Step": 628, "Pretrain/Step Time": 8.514143327251077} +{"Pretrain/Learning Rate": 4.983059370487806e-05, "Pretrain/Loss": 2.15665340423584, "Pretrain/Loss (Raw)": 2.058173179626465, "Pretrain/Step": 629, "Pretrain/Step Time": 8.510152207687497} +{"Pretrain/Learning Rate": 4.9829605598400705e-05, "Pretrain/Loss": 2.1593899726867676, "Pretrain/Loss (Raw)": 2.194600820541382, "Pretrain/Step": 630, "Pretrain/Step Time": 8.511700950562954} +{"Pretrain/Learning Rate": 4.982861462845623e-05, "Pretrain/Loss": 2.159844160079956, "Pretrain/Loss (Raw)": 2.1868977546691895, "Pretrain/Step": 631, "Pretrain/Step Time": 8.512968517839909} +{"Pretrain/Learning Rate": 4.982762079515892e-05, "Pretrain/Loss": 2.159219980239868, "Pretrain/Loss (Raw)": 2.0687735080718994, "Pretrain/Step": 632, "Pretrain/Step Time": 8.516907263547182} +{"Pretrain/Learning Rate": 4.982662409862339e-05, "Pretrain/Loss": 2.1604089736938477, "Pretrain/Loss (Raw)": 2.2213516235351562, "Pretrain/Step": 633, "Pretrain/Step Time": 8.513480318710208} +{"Pretrain/Learning Rate": 4.9825624538964576e-05, "Pretrain/Loss": 2.1589231491088867, "Pretrain/Loss (Raw)": 2.020549774169922, "Pretrain/Step": 634, "Pretrain/Step Time": 8.506378067657351} +{"Pretrain/Learning Rate": 4.982462211629776e-05, "Pretrain/Loss": 2.1588551998138428, "Pretrain/Loss (Raw)": 2.220553159713745, "Pretrain/Step": 635, "Pretrain/Step Time": 8.508465809747577} +{"Pretrain/Learning Rate": 4.9823616830738546e-05, "Pretrain/Loss": 2.1596221923828125, "Pretrain/Loss (Raw)": 2.2817935943603516, "Pretrain/Step": 636, "Pretrain/Step Time": 8.512817615643144} +{"Pretrain/Learning Rate": 4.9822608682402866e-05, "Pretrain/Loss": 2.1616671085357666, "Pretrain/Loss (Raw)": 2.1662604808807373, "Pretrain/Step": 637, "Pretrain/Step Time": 8.512011110782623} +{"Pretrain/Learning Rate": 4.9821597671406984e-05, "Pretrain/Loss": 2.1598873138427734, "Pretrain/Loss (Raw)": 2.128143787384033, "Pretrain/Step": 638, "Pretrain/Step Time": 8.518962191417813} +{"Pretrain/Learning Rate": 4.982058379786749e-05, "Pretrain/Loss": 2.16011643409729, "Pretrain/Loss (Raw)": 2.1048758029937744, "Pretrain/Step": 639, "Pretrain/Step Time": 8.51790146715939} +{"Pretrain/Learning Rate": 4.9819567061901327e-05, "Pretrain/Loss": 2.161440849304199, "Pretrain/Loss (Raw)": 2.1748406887054443, "Pretrain/Step": 640, "Pretrain/Step Time": 8.514440206810832} +{"Pretrain/Learning Rate": 4.981854746362573e-05, "Pretrain/Loss": 2.1622390747070312, "Pretrain/Loss (Raw)": 2.272468328475952, "Pretrain/Step": 641, "Pretrain/Step Time": 8.519481951370835} +{"Pretrain/Learning Rate": 4.981752500315829e-05, "Pretrain/Loss": 2.1622602939605713, "Pretrain/Loss (Raw)": 2.1756560802459717, "Pretrain/Step": 642, "Pretrain/Step Time": 8.526318371295929} +{"Pretrain/Learning Rate": 4.981649968061692e-05, "Pretrain/Loss": 2.1642441749572754, "Pretrain/Loss (Raw)": 2.2703535556793213, "Pretrain/Step": 643, "Pretrain/Step Time": 8.527706012129784} +{"Pretrain/Learning Rate": 4.981547149611987e-05, "Pretrain/Loss": 2.1637401580810547, "Pretrain/Loss (Raw)": 2.2215588092803955, "Pretrain/Step": 644, "Pretrain/Step Time": 8.537137208506465} +{"Pretrain/Learning Rate": 4.9814440449785715e-05, "Pretrain/Loss": 2.162041664123535, "Pretrain/Loss (Raw)": 2.167647361755371, "Pretrain/Step": 645, "Pretrain/Step Time": 8.534398801624775} +{"Pretrain/Learning Rate": 4.9813406541733355e-05, "Pretrain/Loss": 2.1615123748779297, "Pretrain/Loss (Raw)": 2.00376296043396, "Pretrain/Step": 646, "Pretrain/Step Time": 8.52586443722248} +{"Pretrain/Learning Rate": 4.981236977208203e-05, "Pretrain/Loss": 2.1616322994232178, "Pretrain/Loss (Raw)": 2.1709775924682617, "Pretrain/Step": 647, "Pretrain/Step Time": 8.523817021399736} +{"Pretrain/Learning Rate": 4.98113301409513e-05, "Pretrain/Loss": 2.1605939865112305, "Pretrain/Loss (Raw)": 2.0926895141601562, "Pretrain/Step": 648, "Pretrain/Step Time": 8.524839410558343} +{"Pretrain/Learning Rate": 4.981028764846106e-05, "Pretrain/Loss": 2.1584181785583496, "Pretrain/Loss (Raw)": 1.9567621946334839, "Pretrain/Step": 649, "Pretrain/Step Time": 8.532888274639845} +{"Pretrain/Learning Rate": 4.980924229473155e-05, "Pretrain/Loss": 2.1592326164245605, "Pretrain/Loss (Raw)": 2.1412618160247803, "Pretrain/Step": 650, "Pretrain/Step Time": 8.533561566844583} +{"Pretrain/Learning Rate": 4.980819407988331e-05, "Pretrain/Loss": 2.160244941711426, "Pretrain/Loss (Raw)": 2.1743340492248535, "Pretrain/Step": 651, "Pretrain/Step Time": 8.521830812096596} +{"Pretrain/Learning Rate": 4.980714300403723e-05, "Pretrain/Loss": 2.1598029136657715, "Pretrain/Loss (Raw)": 2.08121657371521, "Pretrain/Step": 652, "Pretrain/Step Time": 8.520187115296721} +{"Pretrain/Learning Rate": 4.9806089067314515e-05, "Pretrain/Loss": 2.1591334342956543, "Pretrain/Loss (Raw)": 2.0771429538726807, "Pretrain/Step": 653, "Pretrain/Step Time": 8.513028793036938} +{"Pretrain/Learning Rate": 4.980503226983673e-05, "Pretrain/Loss": 2.158785820007324, "Pretrain/Loss (Raw)": 2.188783884048462, "Pretrain/Step": 654, "Pretrain/Step Time": 8.507768822833896} +{"Pretrain/Learning Rate": 4.980397261172573e-05, "Pretrain/Loss": 2.1595635414123535, "Pretrain/Loss (Raw)": 2.22015643119812, "Pretrain/Step": 655, "Pretrain/Step Time": 8.5118528008461} +{"Pretrain/Learning Rate": 4.9802910093103725e-05, "Pretrain/Loss": 2.159700870513916, "Pretrain/Loss (Raw)": 1.9655448198318481, "Pretrain/Step": 656, "Pretrain/Step Time": 8.512039480730891} +{"Pretrain/Learning Rate": 4.980184471409326e-05, "Pretrain/Loss": 2.1601438522338867, "Pretrain/Loss (Raw)": 2.0086991786956787, "Pretrain/Step": 657, "Pretrain/Step Time": 8.51311231404543} +{"Pretrain/Learning Rate": 4.980077647481719e-05, "Pretrain/Loss": 2.1602983474731445, "Pretrain/Loss (Raw)": 2.1556084156036377, "Pretrain/Step": 658, "Pretrain/Step Time": 8.510655065998435} +{"Pretrain/Learning Rate": 4.979970537539871e-05, "Pretrain/Loss": 2.160785675048828, "Pretrain/Loss (Raw)": 2.166872262954712, "Pretrain/Step": 659, "Pretrain/Step Time": 8.501208819448948} +{"Pretrain/Learning Rate": 4.979863141596135e-05, "Pretrain/Loss": 2.160421848297119, "Pretrain/Loss (Raw)": 2.0092885494232178, "Pretrain/Step": 660, "Pretrain/Step Time": 8.502635085955262} +{"Pretrain/Learning Rate": 4.979755459662896e-05, "Pretrain/Loss": 2.1578774452209473, "Pretrain/Loss (Raw)": 2.0115065574645996, "Pretrain/Step": 661, "Pretrain/Step Time": 8.510142300277948} +{"Pretrain/Learning Rate": 4.979647491752572e-05, "Pretrain/Loss": 2.156430244445801, "Pretrain/Loss (Raw)": 2.1020359992980957, "Pretrain/Step": 662, "Pretrain/Step Time": 8.512291252613068} +{"Pretrain/Learning Rate": 4.979539237877615e-05, "Pretrain/Loss": 2.1537184715270996, "Pretrain/Loss (Raw)": 2.0281589031219482, "Pretrain/Step": 663, "Pretrain/Step Time": 8.508002435788512} +{"Pretrain/Learning Rate": 4.979430698050509e-05, "Pretrain/Loss": 2.1537699699401855, "Pretrain/Loss (Raw)": 2.0401554107666016, "Pretrain/Step": 664, "Pretrain/Step Time": 8.503813162446022} +{"Pretrain/Learning Rate": 4.979321872283772e-05, "Pretrain/Loss": 2.1547842025756836, "Pretrain/Loss (Raw)": 2.3427953720092773, "Pretrain/Step": 665, "Pretrain/Step Time": 8.496937520802021} +{"Pretrain/Learning Rate": 4.979212760589953e-05, "Pretrain/Loss": 2.157153844833374, "Pretrain/Loss (Raw)": 2.3850274085998535, "Pretrain/Step": 666, "Pretrain/Step Time": 8.499566303566098} +{"Pretrain/Learning Rate": 4.9791033629816364e-05, "Pretrain/Loss": 2.1571731567382812, "Pretrain/Loss (Raw)": 2.2084248065948486, "Pretrain/Step": 667, "Pretrain/Step Time": 8.503054803237319} +{"Pretrain/Learning Rate": 4.978993679471438e-05, "Pretrain/Loss": 2.156892776489258, "Pretrain/Loss (Raw)": 2.1638858318328857, "Pretrain/Step": 668, "Pretrain/Step Time": 8.505853557959199} +{"Pretrain/Learning Rate": 4.978883710072008e-05, "Pretrain/Loss": 2.1562654972076416, "Pretrain/Loss (Raw)": 1.966408610343933, "Pretrain/Step": 669, "Pretrain/Step Time": 8.504635531455278} +{"Pretrain/Learning Rate": 4.978773454796026e-05, "Pretrain/Loss": 2.1562676429748535, "Pretrain/Loss (Raw)": 2.1900391578674316, "Pretrain/Step": 670, "Pretrain/Step Time": 8.494625398889184} +{"Pretrain/Learning Rate": 4.9786629136562095e-05, "Pretrain/Loss": 2.154609203338623, "Pretrain/Loss (Raw)": 2.1826980113983154, "Pretrain/Step": 671, "Pretrain/Step Time": 8.502025013789535} +{"Pretrain/Learning Rate": 4.978552086665306e-05, "Pretrain/Loss": 2.153542995452881, "Pretrain/Loss (Raw)": 2.2214691638946533, "Pretrain/Step": 672, "Pretrain/Step Time": 8.50217554345727} +{"Pretrain/Learning Rate": 4.9784409738360973e-05, "Pretrain/Loss": 2.15104603767395, "Pretrain/Loss (Raw)": 2.029536485671997, "Pretrain/Step": 673, "Pretrain/Step Time": 8.50330369360745} +{"Pretrain/Learning Rate": 4.978329575181395e-05, "Pretrain/Loss": 2.149282455444336, "Pretrain/Loss (Raw)": 1.8975666761398315, "Pretrain/Step": 674, "Pretrain/Step Time": 8.505529953166842} +{"Pretrain/Learning Rate": 4.978217890714049e-05, "Pretrain/Loss": 2.150465726852417, "Pretrain/Loss (Raw)": 2.3899986743927, "Pretrain/Step": 675, "Pretrain/Step Time": 8.498871630057693} +{"Pretrain/Learning Rate": 4.978105920446938e-05, "Pretrain/Loss": 2.150698184967041, "Pretrain/Loss (Raw)": 2.002855062484741, "Pretrain/Step": 676, "Pretrain/Step Time": 8.493494130671024} +{"Pretrain/Learning Rate": 4.977993664392975e-05, "Pretrain/Loss": 2.148844003677368, "Pretrain/Loss (Raw)": 2.000697612762451, "Pretrain/Step": 677, "Pretrain/Step Time": 8.491919633001089} +{"Pretrain/Learning Rate": 4.9778811225651056e-05, "Pretrain/Loss": 2.1505377292633057, "Pretrain/Loss (Raw)": 2.104910135269165, "Pretrain/Step": 678, "Pretrain/Step Time": 8.505663145333529} +{"Pretrain/Learning Rate": 4.9777682949763096e-05, "Pretrain/Loss": 2.152717113494873, "Pretrain/Loss (Raw)": 2.198293685913086, "Pretrain/Step": 679, "Pretrain/Step Time": 8.505769727751613} +{"Pretrain/Learning Rate": 4.9776551816395975e-05, "Pretrain/Loss": 2.1528306007385254, "Pretrain/Loss (Raw)": 2.205583333969116, "Pretrain/Step": 680, "Pretrain/Step Time": 8.512325379997492} +{"Pretrain/Learning Rate": 4.977541782568015e-05, "Pretrain/Loss": 2.1534011363983154, "Pretrain/Loss (Raw)": 2.119964838027954, "Pretrain/Step": 681, "Pretrain/Step Time": 8.510431127622724} +{"Pretrain/Learning Rate": 4.97742809777464e-05, "Pretrain/Loss": 2.1531035900115967, "Pretrain/Loss (Raw)": 2.16221284866333, "Pretrain/Step": 682, "Pretrain/Step Time": 8.50040645711124} +{"Pretrain/Learning Rate": 4.9773141272725824e-05, "Pretrain/Loss": 2.1528449058532715, "Pretrain/Loss (Raw)": 2.2049758434295654, "Pretrain/Step": 683, "Pretrain/Step Time": 8.502521947026253} +{"Pretrain/Learning Rate": 4.9771998710749864e-05, "Pretrain/Loss": 2.1516847610473633, "Pretrain/Loss (Raw)": 1.9901676177978516, "Pretrain/Step": 684, "Pretrain/Step Time": 8.510450590401888} +{"Pretrain/Learning Rate": 4.977085329195028e-05, "Pretrain/Loss": 2.151644468307495, "Pretrain/Loss (Raw)": 2.075869083404541, "Pretrain/Step": 685, "Pretrain/Step Time": 8.510218182578683} +{"Pretrain/Learning Rate": 4.9769705016459164e-05, "Pretrain/Loss": 2.1526007652282715, "Pretrain/Loss (Raw)": 2.1786000728607178, "Pretrain/Step": 686, "Pretrain/Step Time": 8.509594647213817} +{"Pretrain/Learning Rate": 4.976855388440896e-05, "Pretrain/Loss": 2.152684211730957, "Pretrain/Loss (Raw)": 2.1297032833099365, "Pretrain/Step": 687, "Pretrain/Step Time": 8.507430206984282} +{"Pretrain/Learning Rate": 4.97673998959324e-05, "Pretrain/Loss": 2.150834560394287, "Pretrain/Loss (Raw)": 2.0909881591796875, "Pretrain/Step": 688, "Pretrain/Step Time": 8.499460807070136} +{"Pretrain/Learning Rate": 4.976624305116259e-05, "Pretrain/Loss": 2.152440309524536, "Pretrain/Loss (Raw)": 2.257011890411377, "Pretrain/Step": 689, "Pretrain/Step Time": 8.497047021985054} +{"Pretrain/Learning Rate": 4.9765083350232913e-05, "Pretrain/Loss": 2.1527884006500244, "Pretrain/Loss (Raw)": 2.0604724884033203, "Pretrain/Step": 690, "Pretrain/Step Time": 8.504931461066008} +{"Pretrain/Learning Rate": 4.976392079327713e-05, "Pretrain/Loss": 2.1511800289154053, "Pretrain/Loss (Raw)": 2.1653881072998047, "Pretrain/Step": 691, "Pretrain/Step Time": 8.511315759271383} +{"Pretrain/Learning Rate": 4.976275538042932e-05, "Pretrain/Loss": 2.150351047515869, "Pretrain/Loss (Raw)": 2.120943069458008, "Pretrain/Step": 692, "Pretrain/Step Time": 8.513092443346977} +{"Pretrain/Learning Rate": 4.976158711182386e-05, "Pretrain/Loss": 2.1510133743286133, "Pretrain/Loss (Raw)": 2.156108856201172, "Pretrain/Step": 693, "Pretrain/Step Time": 8.50789332203567} +{"Pretrain/Learning Rate": 4.9760415987595496e-05, "Pretrain/Loss": 2.149656295776367, "Pretrain/Loss (Raw)": 2.1103320121765137, "Pretrain/Step": 694, "Pretrain/Step Time": 8.498443480581045} +{"Pretrain/Learning Rate": 4.9759242007879295e-05, "Pretrain/Loss": 2.1512393951416016, "Pretrain/Loss (Raw)": 2.647223711013794, "Pretrain/Step": 695, "Pretrain/Step Time": 8.49835243448615} +{"Pretrain/Learning Rate": 4.975806517281062e-05, "Pretrain/Loss": 2.153010368347168, "Pretrain/Loss (Raw)": 2.123044967651367, "Pretrain/Step": 696, "Pretrain/Step Time": 8.502261318266392} +{"Pretrain/Learning Rate": 4.975688548252522e-05, "Pretrain/Loss": 2.152614116668701, "Pretrain/Loss (Raw)": 2.2223503589630127, "Pretrain/Step": 697, "Pretrain/Step Time": 8.508583122864366} +{"Pretrain/Learning Rate": 4.9755702937159124e-05, "Pretrain/Loss": 2.1525068283081055, "Pretrain/Loss (Raw)": 2.1150307655334473, "Pretrain/Step": 698, "Pretrain/Step Time": 8.520265243947506} +{"Pretrain/Learning Rate": 4.975451753684871e-05, "Pretrain/Loss": 2.1528849601745605, "Pretrain/Loss (Raw)": 2.1212964057922363, "Pretrain/Step": 699, "Pretrain/Step Time": 8.520516693592072} +{"Pretrain/Learning Rate": 4.975332928173069e-05, "Pretrain/Loss": 2.152240753173828, "Pretrain/Loss (Raw)": 2.13114857673645, "Pretrain/Step": 700, "Pretrain/Step Time": 8.513415886089206} +{"Pretrain/Learning Rate": 4.975213817194209e-05, "Pretrain/Loss": 2.1514534950256348, "Pretrain/Loss (Raw)": 2.121497631072998, "Pretrain/Step": 701, "Pretrain/Step Time": 8.510415552183986} +{"Pretrain/Learning Rate": 4.975094420762029e-05, "Pretrain/Loss": 2.1505789756774902, "Pretrain/Loss (Raw)": 2.0787110328674316, "Pretrain/Step": 702, "Pretrain/Step Time": 8.519346833229065} +{"Pretrain/Learning Rate": 4.9749747388902964e-05, "Pretrain/Loss": 2.15085506439209, "Pretrain/Loss (Raw)": 2.1163814067840576, "Pretrain/Step": 703, "Pretrain/Step Time": 8.520676987245679} +{"Pretrain/Learning Rate": 4.974854771592815e-05, "Pretrain/Loss": 2.1484534740448, "Pretrain/Loss (Raw)": 2.0205330848693848, "Pretrain/Step": 704, "Pretrain/Step Time": 8.522015722468495} +{"Pretrain/Learning Rate": 4.974734518883419e-05, "Pretrain/Loss": 2.1472465991973877, "Pretrain/Loss (Raw)": 2.5198416709899902, "Pretrain/Step": 705, "Pretrain/Step Time": 8.513703672215343} +{"Pretrain/Learning Rate": 4.974613980775977e-05, "Pretrain/Loss": 2.145331859588623, "Pretrain/Loss (Raw)": 1.9096671342849731, "Pretrain/Step": 706, "Pretrain/Step Time": 8.507642963901162} +{"Pretrain/Learning Rate": 4.974493157284391e-05, "Pretrain/Loss": 2.1448311805725098, "Pretrain/Loss (Raw)": 2.1878764629364014, "Pretrain/Step": 707, "Pretrain/Step Time": 8.508485725149512} +{"Pretrain/Learning Rate": 4.974372048422593e-05, "Pretrain/Loss": 2.144120693206787, "Pretrain/Loss (Raw)": 2.0266315937042236, "Pretrain/Step": 708, "Pretrain/Step Time": 8.517332166433334} +{"Pretrain/Learning Rate": 4.974250654204551e-05, "Pretrain/Loss": 2.1458635330200195, "Pretrain/Loss (Raw)": 2.4395883083343506, "Pretrain/Step": 709, "Pretrain/Step Time": 8.518390694633126} +{"Pretrain/Learning Rate": 4.974128974644264e-05, "Pretrain/Loss": 2.1457624435424805, "Pretrain/Loss (Raw)": 2.167022705078125, "Pretrain/Step": 710, "Pretrain/Step Time": 8.520139077678323} +{"Pretrain/Learning Rate": 4.9740070097557656e-05, "Pretrain/Loss": 2.144949197769165, "Pretrain/Loss (Raw)": 2.1297221183776855, "Pretrain/Step": 711, "Pretrain/Step Time": 8.512881584465504} +{"Pretrain/Learning Rate": 4.973884759553121e-05, "Pretrain/Loss": 2.1442229747772217, "Pretrain/Loss (Raw)": 2.2432315349578857, "Pretrain/Step": 712, "Pretrain/Step Time": 8.508525602519512} +{"Pretrain/Learning Rate": 4.973762224050428e-05, "Pretrain/Loss": 2.143673896789551, "Pretrain/Loss (Raw)": 2.1308205127716064, "Pretrain/Step": 713, "Pretrain/Step Time": 8.497678944841027} +{"Pretrain/Learning Rate": 4.973639403261819e-05, "Pretrain/Loss": 2.143472671508789, "Pretrain/Loss (Raw)": 2.095170497894287, "Pretrain/Step": 714, "Pretrain/Step Time": 8.505440726876259} +{"Pretrain/Learning Rate": 4.9735162972014584e-05, "Pretrain/Loss": 2.143948554992676, "Pretrain/Loss (Raw)": 2.088940143585205, "Pretrain/Step": 715, "Pretrain/Step Time": 8.503326211124659} +{"Pretrain/Learning Rate": 4.9733929058835425e-05, "Pretrain/Loss": 2.142923355102539, "Pretrain/Loss (Raw)": 2.1219706535339355, "Pretrain/Step": 716, "Pretrain/Step Time": 8.515828307718039} +{"Pretrain/Learning Rate": 4.973269229322301e-05, "Pretrain/Loss": 2.143486499786377, "Pretrain/Loss (Raw)": 2.252723217010498, "Pretrain/Step": 717, "Pretrain/Step Time": 8.513215474784374} +{"Pretrain/Learning Rate": 4.973145267531998e-05, "Pretrain/Loss": 2.1456828117370605, "Pretrain/Loss (Raw)": 2.112516403198242, "Pretrain/Step": 718, "Pretrain/Step Time": 8.515024188905954} +{"Pretrain/Learning Rate": 4.973021020526929e-05, "Pretrain/Loss": 2.1459274291992188, "Pretrain/Loss (Raw)": 2.2240703105926514, "Pretrain/Step": 719, "Pretrain/Step Time": 8.519639460369945} +{"Pretrain/Learning Rate": 4.972896488321422e-05, "Pretrain/Loss": 2.144416093826294, "Pretrain/Loss (Raw)": 2.149855375289917, "Pretrain/Step": 720, "Pretrain/Step Time": 8.52146078273654} +{"Pretrain/Learning Rate": 4.97277167092984e-05, "Pretrain/Loss": 2.142608165740967, "Pretrain/Loss (Raw)": 1.8604836463928223, "Pretrain/Step": 721, "Pretrain/Step Time": 8.51991605386138} +{"Pretrain/Learning Rate": 4.972646568366577e-05, "Pretrain/Loss": 2.1439640522003174, "Pretrain/Loss (Raw)": 2.2779757976531982, "Pretrain/Step": 722, "Pretrain/Step Time": 8.521265782415867} +{"Pretrain/Learning Rate": 4.9725211806460604e-05, "Pretrain/Loss": 2.1442697048187256, "Pretrain/Loss (Raw)": 2.078629493713379, "Pretrain/Step": 723, "Pretrain/Step Time": 8.513755640015006} +{"Pretrain/Learning Rate": 4.97239550778275e-05, "Pretrain/Loss": 2.146536350250244, "Pretrain/Loss (Raw)": 2.360398292541504, "Pretrain/Step": 724, "Pretrain/Step Time": 8.50632955506444} +{"Pretrain/Learning Rate": 4.972269549791139e-05, "Pretrain/Loss": 2.1480846405029297, "Pretrain/Loss (Raw)": 2.2487757205963135, "Pretrain/Step": 725, "Pretrain/Step Time": 8.513350604102015} +{"Pretrain/Learning Rate": 4.9721433066857535e-05, "Pretrain/Loss": 2.148362159729004, "Pretrain/Loss (Raw)": 2.147914409637451, "Pretrain/Step": 726, "Pretrain/Step Time": 8.515141332522035} +{"Pretrain/Learning Rate": 4.9720167784811535e-05, "Pretrain/Loss": 2.1476874351501465, "Pretrain/Loss (Raw)": 2.018172264099121, "Pretrain/Step": 727, "Pretrain/Step Time": 8.51833514496684} +{"Pretrain/Learning Rate": 4.97188996519193e-05, "Pretrain/Loss": 2.148463487625122, "Pretrain/Loss (Raw)": 2.2908825874328613, "Pretrain/Step": 728, "Pretrain/Step Time": 8.51881786994636} +{"Pretrain/Learning Rate": 4.971762866832708e-05, "Pretrain/Loss": 2.1484506130218506, "Pretrain/Loss (Raw)": 2.0831148624420166, "Pretrain/Step": 729, "Pretrain/Step Time": 8.514176052063704} +{"Pretrain/Learning Rate": 4.971635483418144e-05, "Pretrain/Loss": 2.1469359397888184, "Pretrain/Loss (Raw)": 2.038611650466919, "Pretrain/Step": 730, "Pretrain/Step Time": 8.519518813118339} +{"Pretrain/Learning Rate": 4.97150781496293e-05, "Pretrain/Loss": 2.1481382846832275, "Pretrain/Loss (Raw)": 2.203948736190796, "Pretrain/Step": 731, "Pretrain/Step Time": 8.505079317837954} +{"Pretrain/Learning Rate": 4.971379861481789e-05, "Pretrain/Loss": 2.1473708152770996, "Pretrain/Loss (Raw)": 2.068739175796509, "Pretrain/Step": 732, "Pretrain/Step Time": 8.511030921712518} +{"Pretrain/Learning Rate": 4.9712516229894756e-05, "Pretrain/Loss": 2.147233247756958, "Pretrain/Loss (Raw)": 2.1195361614227295, "Pretrain/Step": 733, "Pretrain/Step Time": 8.51333081535995} +{"Pretrain/Learning Rate": 4.971123099500781e-05, "Pretrain/Loss": 2.148313522338867, "Pretrain/Loss (Raw)": 2.2544708251953125, "Pretrain/Step": 734, "Pretrain/Step Time": 8.514977131038904} +{"Pretrain/Learning Rate": 4.970994291030526e-05, "Pretrain/Loss": 2.1493163108825684, "Pretrain/Loss (Raw)": 2.228965997695923, "Pretrain/Step": 735, "Pretrain/Step Time": 8.512083554640412} +{"Pretrain/Learning Rate": 4.970865197593566e-05, "Pretrain/Loss": 2.148804187774658, "Pretrain/Loss (Raw)": 2.1303789615631104, "Pretrain/Step": 736, "Pretrain/Step Time": 8.503832938149571} +{"Pretrain/Learning Rate": 4.9707358192047885e-05, "Pretrain/Loss": 2.1492528915405273, "Pretrain/Loss (Raw)": 2.218038558959961, "Pretrain/Step": 737, "Pretrain/Step Time": 8.51283217407763} +{"Pretrain/Learning Rate": 4.970606155879113e-05, "Pretrain/Loss": 2.147151231765747, "Pretrain/Loss (Raw)": 1.875144124031067, "Pretrain/Step": 738, "Pretrain/Step Time": 8.511959109455347} +{"Pretrain/Learning Rate": 4.970476207631494e-05, "Pretrain/Loss": 2.14530873298645, "Pretrain/Loss (Raw)": 2.044356346130371, "Pretrain/Step": 739, "Pretrain/Step Time": 8.512888886034489} +{"Pretrain/Learning Rate": 4.970345974476918e-05, "Pretrain/Loss": 2.144362449645996, "Pretrain/Loss (Raw)": 2.135607957839966, "Pretrain/Step": 740, "Pretrain/Step Time": 8.515549093484879} +{"Pretrain/Learning Rate": 4.970215456430403e-05, "Pretrain/Loss": 2.143425464630127, "Pretrain/Loss (Raw)": 2.0650362968444824, "Pretrain/Step": 741, "Pretrain/Step Time": 8.514110121876001} +{"Pretrain/Learning Rate": 4.970084653507001e-05, "Pretrain/Loss": 2.1451053619384766, "Pretrain/Loss (Raw)": 2.4213969707489014, "Pretrain/Step": 742, "Pretrain/Step Time": 8.507462289184332} +{"Pretrain/Learning Rate": 4.969953565721799e-05, "Pretrain/Loss": 2.144252300262451, "Pretrain/Loss (Raw)": 2.0015110969543457, "Pretrain/Step": 743, "Pretrain/Step Time": 8.502794532105327} +{"Pretrain/Learning Rate": 4.969822193089911e-05, "Pretrain/Loss": 2.1442809104919434, "Pretrain/Loss (Raw)": 2.1699790954589844, "Pretrain/Step": 744, "Pretrain/Step Time": 8.502289881929755} +{"Pretrain/Learning Rate": 4.969690535626491e-05, "Pretrain/Loss": 2.140075445175171, "Pretrain/Loss (Raw)": 2.0594334602355957, "Pretrain/Step": 745, "Pretrain/Step Time": 8.507552240043879} +{"Pretrain/Learning Rate": 4.96955859334672e-05, "Pretrain/Loss": 2.1402173042297363, "Pretrain/Loss (Raw)": 1.9942294359207153, "Pretrain/Step": 746, "Pretrain/Step Time": 8.511821925640106} +{"Pretrain/Learning Rate": 4.9694263662658156e-05, "Pretrain/Loss": 2.1395583152770996, "Pretrain/Loss (Raw)": 2.1036698818206787, "Pretrain/Step": 747, "Pretrain/Step Time": 8.507034204900265} +{"Pretrain/Learning Rate": 4.9692938543990265e-05, "Pretrain/Loss": 2.139984130859375, "Pretrain/Loss (Raw)": 2.246645927429199, "Pretrain/Step": 748, "Pretrain/Step Time": 8.502151906490326} +{"Pretrain/Learning Rate": 4.969161057761634e-05, "Pretrain/Loss": 2.139249324798584, "Pretrain/Loss (Raw)": 1.9887843132019043, "Pretrain/Step": 749, "Pretrain/Step Time": 8.503156125545502} +{"Pretrain/Learning Rate": 4.969027976368954e-05, "Pretrain/Loss": 2.140655040740967, "Pretrain/Loss (Raw)": 2.289337158203125, "Pretrain/Step": 750, "Pretrain/Step Time": 8.501369124278426} +{"Pretrain/Learning Rate": 4.968894610236332e-05, "Pretrain/Loss": 2.1402530670166016, "Pretrain/Loss (Raw)": 2.1285200119018555, "Pretrain/Step": 751, "Pretrain/Step Time": 8.504943398758769} +{"Pretrain/Learning Rate": 4.968760959379151e-05, "Pretrain/Loss": 2.1409616470336914, "Pretrain/Loss (Raw)": 2.306410312652588, "Pretrain/Step": 752, "Pretrain/Step Time": 8.510349662974477} +{"Pretrain/Learning Rate": 4.968627023812822e-05, "Pretrain/Loss": 2.1406681537628174, "Pretrain/Loss (Raw)": 2.104994058609009, "Pretrain/Step": 753, "Pretrain/Step Time": 8.506611581891775} +{"Pretrain/Learning Rate": 4.968492803552793e-05, "Pretrain/Loss": 2.14087176322937, "Pretrain/Loss (Raw)": 2.1246442794799805, "Pretrain/Step": 754, "Pretrain/Step Time": 8.503620196133852} +{"Pretrain/Learning Rate": 4.968358298614541e-05, "Pretrain/Loss": 2.142319679260254, "Pretrain/Loss (Raw)": 2.050396203994751, "Pretrain/Step": 755, "Pretrain/Step Time": 8.510158859193325} +{"Pretrain/Learning Rate": 4.968223509013579e-05, "Pretrain/Loss": 2.1435863971710205, "Pretrain/Loss (Raw)": 2.3006699085235596, "Pretrain/Step": 756, "Pretrain/Step Time": 8.508131574839354} +{"Pretrain/Learning Rate": 4.968088434765452e-05, "Pretrain/Loss": 2.144087314605713, "Pretrain/Loss (Raw)": 2.122272253036499, "Pretrain/Step": 757, "Pretrain/Step Time": 8.50750993564725} +{"Pretrain/Learning Rate": 4.967953075885736e-05, "Pretrain/Loss": 2.142792224884033, "Pretrain/Loss (Raw)": 2.0288259983062744, "Pretrain/Step": 758, "Pretrain/Step Time": 8.503815209493041} +{"Pretrain/Learning Rate": 4.9678174323900415e-05, "Pretrain/Loss": 2.1435413360595703, "Pretrain/Loss (Raw)": 2.2828171253204346, "Pretrain/Step": 759, "Pretrain/Step Time": 8.499390698969364} +{"Pretrain/Learning Rate": 4.9676815042940125e-05, "Pretrain/Loss": 2.144197940826416, "Pretrain/Loss (Raw)": 2.152817487716675, "Pretrain/Step": 760, "Pretrain/Step Time": 8.503820739686489} +{"Pretrain/Learning Rate": 4.967545291613325e-05, "Pretrain/Loss": 2.1438000202178955, "Pretrain/Loss (Raw)": 2.170424222946167, "Pretrain/Step": 761, "Pretrain/Step Time": 8.50892791710794} +{"Pretrain/Learning Rate": 4.967408794363686e-05, "Pretrain/Loss": 2.144672393798828, "Pretrain/Loss (Raw)": 2.1321749687194824, "Pretrain/Step": 762, "Pretrain/Step Time": 8.510518254712224} +{"Pretrain/Learning Rate": 4.9672720125608384e-05, "Pretrain/Loss": 2.145314931869507, "Pretrain/Loss (Raw)": 2.3028087615966797, "Pretrain/Step": 763, "Pretrain/Step Time": 8.512829627841711} +{"Pretrain/Learning Rate": 4.9671349462205565e-05, "Pretrain/Loss": 2.1441099643707275, "Pretrain/Loss (Raw)": 2.1275711059570312, "Pretrain/Step": 764, "Pretrain/Step Time": 8.50631944835186} +{"Pretrain/Learning Rate": 4.966997595358647e-05, "Pretrain/Loss": 2.143805980682373, "Pretrain/Loss (Raw)": 2.1273486614227295, "Pretrain/Step": 765, "Pretrain/Step Time": 8.506596187129617} +{"Pretrain/Learning Rate": 4.966859959990949e-05, "Pretrain/Loss": 2.144561767578125, "Pretrain/Loss (Raw)": 2.224897623062134, "Pretrain/Step": 766, "Pretrain/Step Time": 8.505010344088078} +{"Pretrain/Learning Rate": 4.966722040133337e-05, "Pretrain/Loss": 2.1447319984436035, "Pretrain/Loss (Raw)": 2.1266887187957764, "Pretrain/Step": 767, "Pretrain/Step Time": 8.503550665453076} +{"Pretrain/Learning Rate": 4.9665838358017156e-05, "Pretrain/Loss": 2.143850803375244, "Pretrain/Loss (Raw)": 2.0619871616363525, "Pretrain/Step": 768, "Pretrain/Step Time": 8.503589833155274} +{"Pretrain/Learning Rate": 4.966445347012023e-05, "Pretrain/Loss": 2.1430885791778564, "Pretrain/Loss (Raw)": 2.174923896789551, "Pretrain/Step": 769, "Pretrain/Step Time": 8.507150145247579} +{"Pretrain/Learning Rate": 4.9663065737802316e-05, "Pretrain/Loss": 2.1426806449890137, "Pretrain/Loss (Raw)": 2.1234426498413086, "Pretrain/Step": 770, "Pretrain/Step Time": 8.498807130381465} +{"Pretrain/Learning Rate": 4.9661675161223435e-05, "Pretrain/Loss": 2.141279697418213, "Pretrain/Loss (Raw)": 2.0910561084747314, "Pretrain/Step": 771, "Pretrain/Step Time": 8.500307193025947} +{"Pretrain/Learning Rate": 4.966028174054397e-05, "Pretrain/Loss": 2.139497995376587, "Pretrain/Loss (Raw)": 1.9934617280960083, "Pretrain/Step": 772, "Pretrain/Step Time": 8.493729505687952} +{"Pretrain/Learning Rate": 4.965888547592461e-05, "Pretrain/Loss": 2.1406426429748535, "Pretrain/Loss (Raw)": 2.3141584396362305, "Pretrain/Step": 773, "Pretrain/Step Time": 8.503223551437259} +{"Pretrain/Learning Rate": 4.965748636752638e-05, "Pretrain/Loss": 2.1423325538635254, "Pretrain/Loss (Raw)": 2.220099925994873, "Pretrain/Step": 774, "Pretrain/Step Time": 8.506590956822038} +{"Pretrain/Learning Rate": 4.965608441551063e-05, "Pretrain/Loss": 2.141566753387451, "Pretrain/Loss (Raw)": 2.072935104370117, "Pretrain/Step": 775, "Pretrain/Step Time": 8.511251095682383} +{"Pretrain/Learning Rate": 4.965467962003905e-05, "Pretrain/Loss": 2.140578508377075, "Pretrain/Loss (Raw)": 1.96620774269104, "Pretrain/Step": 776, "Pretrain/Step Time": 8.506704442203045} +{"Pretrain/Learning Rate": 4.965327198127363e-05, "Pretrain/Loss": 2.1434054374694824, "Pretrain/Loss (Raw)": 2.318601369857788, "Pretrain/Step": 777, "Pretrain/Step Time": 8.496337676420808} +{"Pretrain/Learning Rate": 4.965186149937672e-05, "Pretrain/Loss": 2.1426844596862793, "Pretrain/Loss (Raw)": 2.04897403717041, "Pretrain/Step": 778, "Pretrain/Step Time": 8.498807735741138} +{"Pretrain/Learning Rate": 4.9650448174510986e-05, "Pretrain/Loss": 2.1427502632141113, "Pretrain/Loss (Raw)": 2.182744026184082, "Pretrain/Step": 779, "Pretrain/Step Time": 8.505539817735553} +{"Pretrain/Learning Rate": 4.9649032006839404e-05, "Pretrain/Loss": 2.1431946754455566, "Pretrain/Loss (Raw)": 2.1381280422210693, "Pretrain/Step": 780, "Pretrain/Step Time": 8.506198288872838} +{"Pretrain/Learning Rate": 4.964761299652529e-05, "Pretrain/Loss": 2.1413230895996094, "Pretrain/Loss (Raw)": 1.837586760520935, "Pretrain/Step": 781, "Pretrain/Step Time": 8.514621371403337} +{"Pretrain/Learning Rate": 4.9646191143732324e-05, "Pretrain/Loss": 2.1417016983032227, "Pretrain/Loss (Raw)": 2.237227439880371, "Pretrain/Step": 782, "Pretrain/Step Time": 8.512668250128627} +{"Pretrain/Learning Rate": 4.9644766448624444e-05, "Pretrain/Loss": 2.1395421028137207, "Pretrain/Loss (Raw)": 1.9437363147735596, "Pretrain/Step": 783, "Pretrain/Step Time": 8.507436195388436} +{"Pretrain/Learning Rate": 4.9643338911365964e-05, "Pretrain/Loss": 2.1398911476135254, "Pretrain/Loss (Raw)": 2.0102379322052, "Pretrain/Step": 784, "Pretrain/Step Time": 8.508726323023438} +{"Pretrain/Learning Rate": 4.9641908532121525e-05, "Pretrain/Loss": 2.141078472137451, "Pretrain/Loss (Raw)": 2.1606686115264893, "Pretrain/Step": 785, "Pretrain/Step Time": 8.504909140989184} +{"Pretrain/Learning Rate": 4.964047531105608e-05, "Pretrain/Loss": 2.141190528869629, "Pretrain/Loss (Raw)": 2.1699626445770264, "Pretrain/Step": 786, "Pretrain/Step Time": 8.51034166291356} +{"Pretrain/Learning Rate": 4.963903924833491e-05, "Pretrain/Loss": 2.139615058898926, "Pretrain/Loss (Raw)": 1.9652185440063477, "Pretrain/Step": 787, "Pretrain/Step Time": 8.504793837666512} +{"Pretrain/Learning Rate": 4.963760034412363e-05, "Pretrain/Loss": 2.141552448272705, "Pretrain/Loss (Raw)": 2.2572429180145264, "Pretrain/Step": 788, "Pretrain/Step Time": 8.505364693701267} +{"Pretrain/Learning Rate": 4.9636158598588185e-05, "Pretrain/Loss": 2.1436991691589355, "Pretrain/Loss (Raw)": 2.2862956523895264, "Pretrain/Step": 789, "Pretrain/Step Time": 8.502573430538177} +{"Pretrain/Learning Rate": 4.9634714011894836e-05, "Pretrain/Loss": 2.1450212001800537, "Pretrain/Loss (Raw)": 2.2712597846984863, "Pretrain/Step": 790, "Pretrain/Step Time": 8.497747270390391} +{"Pretrain/Learning Rate": 4.963326658421019e-05, "Pretrain/Loss": 2.1471452713012695, "Pretrain/Loss (Raw)": 2.300041437149048, "Pretrain/Step": 791, "Pretrain/Step Time": 8.50714193098247} +{"Pretrain/Learning Rate": 4.9631816315701165e-05, "Pretrain/Loss": 2.1489546298980713, "Pretrain/Loss (Raw)": 2.271744966506958, "Pretrain/Step": 792, "Pretrain/Step Time": 8.511459885165095} +{"Pretrain/Learning Rate": 4.9630363206535e-05, "Pretrain/Loss": 2.143789291381836, "Pretrain/Loss (Raw)": 1.6816520690917969, "Pretrain/Step": 793, "Pretrain/Step Time": 8.519225340336561} +{"Pretrain/Learning Rate": 4.962890725687931e-05, "Pretrain/Loss": 2.1406962871551514, "Pretrain/Loss (Raw)": 1.9891119003295898, "Pretrain/Step": 794, "Pretrain/Step Time": 8.519883142784238} +{"Pretrain/Learning Rate": 4.962744846690196e-05, "Pretrain/Loss": 2.1396074295043945, "Pretrain/Loss (Raw)": 2.069027900695801, "Pretrain/Step": 795, "Pretrain/Step Time": 8.511869840323925} +{"Pretrain/Learning Rate": 4.962598683677122e-05, "Pretrain/Loss": 2.1401703357696533, "Pretrain/Loss (Raw)": 2.235948324203491, "Pretrain/Step": 796, "Pretrain/Step Time": 8.510709187015891} +{"Pretrain/Learning Rate": 4.9624522366655625e-05, "Pretrain/Loss": 2.1404178142547607, "Pretrain/Loss (Raw)": 1.998094081878662, "Pretrain/Step": 797, "Pretrain/Step Time": 8.513509595766664} +{"Pretrain/Learning Rate": 4.962305505672408e-05, "Pretrain/Loss": 2.142106056213379, "Pretrain/Loss (Raw)": 2.4061107635498047, "Pretrain/Step": 798, "Pretrain/Step Time": 8.517401196062565} +{"Pretrain/Learning Rate": 4.96215849071458e-05, "Pretrain/Loss": 2.141073226928711, "Pretrain/Loss (Raw)": 2.0505025386810303, "Pretrain/Step": 799, "Pretrain/Step Time": 8.514004398137331} +{"Pretrain/Learning Rate": 4.962011191809033e-05, "Pretrain/Loss": 2.140772819519043, "Pretrain/Loss (Raw)": 2.183049201965332, "Pretrain/Step": 800, "Pretrain/Step Time": 8.506172895431519} +{"Pretrain/Learning Rate": 4.961863608972753e-05, "Pretrain/Loss": 2.1407315731048584, "Pretrain/Loss (Raw)": 2.024242639541626, "Pretrain/Step": 801, "Pretrain/Step Time": 8.504743434488773} +{"Pretrain/Learning Rate": 4.961715742222762e-05, "Pretrain/Loss": 2.142603874206543, "Pretrain/Loss (Raw)": 2.137216329574585, "Pretrain/Step": 802, "Pretrain/Step Time": 8.506992576643825} +{"Pretrain/Learning Rate": 4.961567591576112e-05, "Pretrain/Loss": 2.138714551925659, "Pretrain/Loss (Raw)": 1.8921767473220825, "Pretrain/Step": 803, "Pretrain/Step Time": 8.51540000922978} +{"Pretrain/Learning Rate": 4.961419157049887e-05, "Pretrain/Loss": 2.1397862434387207, "Pretrain/Loss (Raw)": 2.1400153636932373, "Pretrain/Step": 804, "Pretrain/Step Time": 8.516409907490015} +{"Pretrain/Learning Rate": 4.9612704386612066e-05, "Pretrain/Loss": 2.1424150466918945, "Pretrain/Loss (Raw)": 2.337218999862671, "Pretrain/Step": 805, "Pretrain/Step Time": 8.51868375390768} +{"Pretrain/Learning Rate": 4.9611214364272206e-05, "Pretrain/Loss": 2.1432580947875977, "Pretrain/Loss (Raw)": 2.212784767150879, "Pretrain/Step": 806, "Pretrain/Step Time": 8.504129104316235} +{"Pretrain/Learning Rate": 4.960972150365114e-05, "Pretrain/Loss": 2.142982006072998, "Pretrain/Loss (Raw)": 2.1629698276519775, "Pretrain/Step": 807, "Pretrain/Step Time": 8.505156731233} +{"Pretrain/Learning Rate": 4.960822580492103e-05, "Pretrain/Loss": 2.141996145248413, "Pretrain/Loss (Raw)": 2.0793910026550293, "Pretrain/Step": 808, "Pretrain/Step Time": 8.50631882995367} +{"Pretrain/Learning Rate": 4.960672726825436e-05, "Pretrain/Loss": 2.142983913421631, "Pretrain/Loss (Raw)": 2.2463760375976562, "Pretrain/Step": 809, "Pretrain/Step Time": 8.513080295175314} +{"Pretrain/Learning Rate": 4.960522589382395e-05, "Pretrain/Loss": 2.1443581581115723, "Pretrain/Loss (Raw)": 2.3381314277648926, "Pretrain/Step": 810, "Pretrain/Step Time": 8.519224043935537} +{"Pretrain/Learning Rate": 4.960372168180294e-05, "Pretrain/Loss": 2.144418716430664, "Pretrain/Loss (Raw)": 2.2127106189727783, "Pretrain/Step": 811, "Pretrain/Step Time": 8.515154510736465} +{"Pretrain/Learning Rate": 4.9602214632364816e-05, "Pretrain/Loss": 2.146685838699341, "Pretrain/Loss (Raw)": 2.280388832092285, "Pretrain/Step": 812, "Pretrain/Step Time": 8.50856515020132} +{"Pretrain/Learning Rate": 4.9600704745683367e-05, "Pretrain/Loss": 2.147543430328369, "Pretrain/Loss (Raw)": 2.1856017112731934, "Pretrain/Step": 813, "Pretrain/Step Time": 8.510877838358283} +{"Pretrain/Learning Rate": 4.959919202193273e-05, "Pretrain/Loss": 2.1466641426086426, "Pretrain/Loss (Raw)": 2.06609845161438, "Pretrain/Step": 814, "Pretrain/Step Time": 8.51160342618823} +{"Pretrain/Learning Rate": 4.959767646128735e-05, "Pretrain/Loss": 2.146526575088501, "Pretrain/Loss (Raw)": 2.112074136734009, "Pretrain/Step": 815, "Pretrain/Step Time": 8.51321535371244} +{"Pretrain/Learning Rate": 4.959615806392201e-05, "Pretrain/Loss": 2.1468777656555176, "Pretrain/Loss (Raw)": 2.1359381675720215, "Pretrain/Step": 816, "Pretrain/Step Time": 8.517104435712099} +{"Pretrain/Learning Rate": 4.959463683001182e-05, "Pretrain/Loss": 2.144955635070801, "Pretrain/Loss (Raw)": 2.0109927654266357, "Pretrain/Step": 817, "Pretrain/Step Time": 8.518643053248525} +{"Pretrain/Learning Rate": 4.959311275973223e-05, "Pretrain/Loss": 2.1443405151367188, "Pretrain/Loss (Raw)": 1.9817394018173218, "Pretrain/Step": 818, "Pretrain/Step Time": 8.50573742389679} +{"Pretrain/Learning Rate": 4.959158585325898e-05, "Pretrain/Loss": 2.143343210220337, "Pretrain/Loss (Raw)": 2.037717580795288, "Pretrain/Step": 819, "Pretrain/Step Time": 8.498160680755973} +{"Pretrain/Learning Rate": 4.959005611076817e-05, "Pretrain/Loss": 2.1432876586914062, "Pretrain/Loss (Raw)": 2.1138362884521484, "Pretrain/Step": 820, "Pretrain/Step Time": 8.507164219394326} +{"Pretrain/Learning Rate": 4.9588523532436214e-05, "Pretrain/Loss": 2.143514394760132, "Pretrain/Loss (Raw)": 2.1851308345794678, "Pretrain/Step": 821, "Pretrain/Step Time": 8.51042341068387} +{"Pretrain/Learning Rate": 4.9586988118439863e-05, "Pretrain/Loss": 2.1446869373321533, "Pretrain/Loss (Raw)": 2.2604308128356934, "Pretrain/Step": 822, "Pretrain/Step Time": 8.5133286267519} +{"Pretrain/Learning Rate": 4.958544986895619e-05, "Pretrain/Loss": 2.1435811519622803, "Pretrain/Loss (Raw)": 2.5056726932525635, "Pretrain/Step": 823, "Pretrain/Step Time": 8.515643700957298} +{"Pretrain/Learning Rate": 4.958390878416258e-05, "Pretrain/Loss": 2.1443190574645996, "Pretrain/Loss (Raw)": 2.2175004482269287, "Pretrain/Step": 824, "Pretrain/Step Time": 8.509163912385702} +{"Pretrain/Learning Rate": 4.9582364864236765e-05, "Pretrain/Loss": 2.1438093185424805, "Pretrain/Loss (Raw)": 2.1570968627929688, "Pretrain/Step": 825, "Pretrain/Step Time": 8.50591298379004} +{"Pretrain/Learning Rate": 4.95808181093568e-05, "Pretrain/Loss": 2.143179178237915, "Pretrain/Loss (Raw)": 2.034360885620117, "Pretrain/Step": 826, "Pretrain/Step Time": 8.501659432426095} +{"Pretrain/Learning Rate": 4.9579268519701063e-05, "Pretrain/Loss": 2.143674373626709, "Pretrain/Loss (Raw)": 2.184685230255127, "Pretrain/Step": 827, "Pretrain/Step Time": 8.503542095422745} +{"Pretrain/Learning Rate": 4.957771609544826e-05, "Pretrain/Loss": 2.143671989440918, "Pretrain/Loss (Raw)": 2.130868434906006, "Pretrain/Step": 828, "Pretrain/Step Time": 8.508290361613035} +{"Pretrain/Learning Rate": 4.957616083677742e-05, "Pretrain/Loss": 2.1440916061401367, "Pretrain/Loss (Raw)": 2.175194501876831, "Pretrain/Step": 829, "Pretrain/Step Time": 8.514464352279902} +{"Pretrain/Learning Rate": 4.9574602743867916e-05, "Pretrain/Loss": 2.1450035572052, "Pretrain/Loss (Raw)": 2.195444345474243, "Pretrain/Step": 830, "Pretrain/Step Time": 8.507574750110507} +{"Pretrain/Learning Rate": 4.957304181689941e-05, "Pretrain/Loss": 2.1443674564361572, "Pretrain/Loss (Raw)": 2.034942865371704, "Pretrain/Step": 831, "Pretrain/Step Time": 8.509876327589154} +{"Pretrain/Learning Rate": 4.957147805605194e-05, "Pretrain/Loss": 2.1459875106811523, "Pretrain/Loss (Raw)": 2.227917194366455, "Pretrain/Step": 832, "Pretrain/Step Time": 8.513815874233842} +{"Pretrain/Learning Rate": 4.956991146150583e-05, "Pretrain/Loss": 2.1414523124694824, "Pretrain/Loss (Raw)": 1.9393140077590942, "Pretrain/Step": 833, "Pretrain/Step Time": 8.515157092362642} +{"Pretrain/Learning Rate": 4.9568342033441755e-05, "Pretrain/Loss": 2.1433498859405518, "Pretrain/Loss (Raw)": 2.152573585510254, "Pretrain/Step": 834, "Pretrain/Step Time": 8.515401331707835} +{"Pretrain/Learning Rate": 4.956676977204071e-05, "Pretrain/Loss": 2.143805742263794, "Pretrain/Loss (Raw)": 2.2462170124053955, "Pretrain/Step": 835, "Pretrain/Step Time": 8.51102327555418} +{"Pretrain/Learning Rate": 4.9565194677484e-05, "Pretrain/Loss": 2.1451988220214844, "Pretrain/Loss (Raw)": 2.2049601078033447, "Pretrain/Step": 836, "Pretrain/Step Time": 8.502131706103683} +{"Pretrain/Learning Rate": 4.95636167499533e-05, "Pretrain/Loss": 2.143031597137451, "Pretrain/Loss (Raw)": 2.162179946899414, "Pretrain/Step": 837, "Pretrain/Step Time": 8.504550710320473} +{"Pretrain/Learning Rate": 4.9562035989630564e-05, "Pretrain/Loss": 2.1411211490631104, "Pretrain/Loss (Raw)": 1.9224945306777954, "Pretrain/Step": 838, "Pretrain/Step Time": 8.510808924213052} +{"Pretrain/Learning Rate": 4.95604523966981e-05, "Pretrain/Loss": 2.1409833431243896, "Pretrain/Loss (Raw)": 2.112086296081543, "Pretrain/Step": 839, "Pretrain/Step Time": 8.51053785905242} +{"Pretrain/Learning Rate": 4.9558865971338524e-05, "Pretrain/Loss": 2.1400980949401855, "Pretrain/Loss (Raw)": 2.129927635192871, "Pretrain/Step": 840, "Pretrain/Step Time": 8.508805917575955} +{"Pretrain/Learning Rate": 4.9557276713734805e-05, "Pretrain/Loss": 2.1405694484710693, "Pretrain/Loss (Raw)": 2.191134214401245, "Pretrain/Step": 841, "Pretrain/Step Time": 8.513050435110927} +{"Pretrain/Learning Rate": 4.955568462407022e-05, "Pretrain/Loss": 2.138153076171875, "Pretrain/Loss (Raw)": 1.7858582735061646, "Pretrain/Step": 842, "Pretrain/Step Time": 8.504744613543153} +{"Pretrain/Learning Rate": 4.955408970252837e-05, "Pretrain/Loss": 2.1401314735412598, "Pretrain/Loss (Raw)": 2.342210054397583, "Pretrain/Step": 843, "Pretrain/Step Time": 8.506734419614077} +{"Pretrain/Learning Rate": 4.955249194929319e-05, "Pretrain/Loss": 2.1411123275756836, "Pretrain/Loss (Raw)": 2.247520685195923, "Pretrain/Step": 844, "Pretrain/Step Time": 8.504449307918549} +{"Pretrain/Learning Rate": 4.955089136454895e-05, "Pretrain/Loss": 2.140213966369629, "Pretrain/Loss (Raw)": 2.1377172470092773, "Pretrain/Step": 845, "Pretrain/Step Time": 8.503170888870955} +{"Pretrain/Learning Rate": 4.954928794848023e-05, "Pretrain/Loss": 2.140716552734375, "Pretrain/Loss (Raw)": 2.176844358444214, "Pretrain/Step": 846, "Pretrain/Step Time": 8.506312746554613} +{"Pretrain/Learning Rate": 4.954768170127194e-05, "Pretrain/Loss": 2.140468120574951, "Pretrain/Loss (Raw)": 2.192284107208252, "Pretrain/Step": 847, "Pretrain/Step Time": 8.506050609052181} +{"Pretrain/Learning Rate": 4.9546072623109325e-05, "Pretrain/Loss": 2.1395537853240967, "Pretrain/Loss (Raw)": 2.032811164855957, "Pretrain/Step": 848, "Pretrain/Step Time": 8.49884857609868} +{"Pretrain/Learning Rate": 4.954446071417795e-05, "Pretrain/Loss": 2.1415891647338867, "Pretrain/Loss (Raw)": 2.1210086345672607, "Pretrain/Step": 849, "Pretrain/Step Time": 8.509951749816537} +{"Pretrain/Learning Rate": 4.954284597466371e-05, "Pretrain/Loss": 2.139702320098877, "Pretrain/Loss (Raw)": 2.036440849304199, "Pretrain/Step": 850, "Pretrain/Step Time": 8.510960331186652} +{"Pretrain/Learning Rate": 4.954122840475281e-05, "Pretrain/Loss": 2.1377663612365723, "Pretrain/Loss (Raw)": 1.830836534500122, "Pretrain/Step": 851, "Pretrain/Step Time": 8.518092174082994} +{"Pretrain/Learning Rate": 4.9539608004631825e-05, "Pretrain/Loss": 2.136568307876587, "Pretrain/Loss (Raw)": 2.2070562839508057, "Pretrain/Step": 852, "Pretrain/Step Time": 8.51705121435225} +{"Pretrain/Learning Rate": 4.9537984774487606e-05, "Pretrain/Loss": 2.1366913318634033, "Pretrain/Loss (Raw)": 2.2645115852355957, "Pretrain/Step": 853, "Pretrain/Step Time": 8.508914466947317} +{"Pretrain/Learning Rate": 4.953635871450736e-05, "Pretrain/Loss": 2.137345314025879, "Pretrain/Loss (Raw)": 2.231633424758911, "Pretrain/Step": 854, "Pretrain/Step Time": 8.507471887394786} +{"Pretrain/Learning Rate": 4.95347298248786e-05, "Pretrain/Loss": 2.137648820877075, "Pretrain/Loss (Raw)": 2.057033061981201, "Pretrain/Step": 855, "Pretrain/Step Time": 8.507179433479905} +{"Pretrain/Learning Rate": 4.953309810578918e-05, "Pretrain/Loss": 2.134549140930176, "Pretrain/Loss (Raw)": 1.894127607345581, "Pretrain/Step": 856, "Pretrain/Step Time": 8.511437522247434} +{"Pretrain/Learning Rate": 4.953146355742729e-05, "Pretrain/Loss": 2.132874011993408, "Pretrain/Loss (Raw)": 1.86869215965271, "Pretrain/Step": 857, "Pretrain/Step Time": 8.507758783176541} +{"Pretrain/Learning Rate": 4.952982617998143e-05, "Pretrain/Loss": 2.1346147060394287, "Pretrain/Loss (Raw)": 2.2614104747772217, "Pretrain/Step": 858, "Pretrain/Step Time": 8.506220145151019} +{"Pretrain/Learning Rate": 4.952818597364043e-05, "Pretrain/Loss": 2.134568691253662, "Pretrain/Loss (Raw)": 2.1980576515197754, "Pretrain/Step": 859, "Pretrain/Step Time": 8.506622379645705} +{"Pretrain/Learning Rate": 4.952654293859344e-05, "Pretrain/Loss": 2.135087490081787, "Pretrain/Loss (Raw)": 2.135146379470825, "Pretrain/Step": 860, "Pretrain/Step Time": 8.49261817894876} +{"Pretrain/Learning Rate": 4.952489707502993e-05, "Pretrain/Loss": 2.13517427444458, "Pretrain/Loss (Raw)": 2.1306703090667725, "Pretrain/Step": 861, "Pretrain/Step Time": 8.497133819386363} +{"Pretrain/Learning Rate": 4.952324838313974e-05, "Pretrain/Loss": 2.1386117935180664, "Pretrain/Loss (Raw)": 2.694436550140381, "Pretrain/Step": 862, "Pretrain/Step Time": 8.505246667191386} +{"Pretrain/Learning Rate": 4.9521596863112986e-05, "Pretrain/Loss": 2.1392006874084473, "Pretrain/Loss (Raw)": 2.30435848236084, "Pretrain/Step": 863, "Pretrain/Step Time": 8.511526122689247} +{"Pretrain/Learning Rate": 4.951994251514013e-05, "Pretrain/Loss": 2.139507293701172, "Pretrain/Loss (Raw)": 2.1696364879608154, "Pretrain/Step": 864, "Pretrain/Step Time": 8.51146569289267} +{"Pretrain/Learning Rate": 4.9518285339411966e-05, "Pretrain/Loss": 2.137871742248535, "Pretrain/Loss (Raw)": 2.0086669921875, "Pretrain/Step": 865, "Pretrain/Step Time": 8.5027697365731} +{"Pretrain/Learning Rate": 4.9516625336119595e-05, "Pretrain/Loss": 2.1407949924468994, "Pretrain/Loss (Raw)": 2.2493274211883545, "Pretrain/Step": 866, "Pretrain/Step Time": 8.504980528727174} +{"Pretrain/Learning Rate": 4.951496250545446e-05, "Pretrain/Loss": 2.1403698921203613, "Pretrain/Loss (Raw)": 1.9899275302886963, "Pretrain/Step": 867, "Pretrain/Step Time": 8.514170281589031} +{"Pretrain/Learning Rate": 4.951329684760835e-05, "Pretrain/Loss": 2.1402931213378906, "Pretrain/Loss (Raw)": 2.1258130073547363, "Pretrain/Step": 868, "Pretrain/Step Time": 8.520485829561949} +{"Pretrain/Learning Rate": 4.951162836277332e-05, "Pretrain/Loss": 2.1399049758911133, "Pretrain/Loss (Raw)": 2.0153307914733887, "Pretrain/Step": 869, "Pretrain/Step Time": 8.518881237134337} +{"Pretrain/Learning Rate": 4.950995705114182e-05, "Pretrain/Loss": 2.1373910903930664, "Pretrain/Loss (Raw)": 2.0996439456939697, "Pretrain/Step": 870, "Pretrain/Step Time": 8.523646438494325} +{"Pretrain/Learning Rate": 4.950828291290656e-05, "Pretrain/Loss": 2.138361692428589, "Pretrain/Loss (Raw)": 2.125749349594116, "Pretrain/Step": 871, "Pretrain/Step Time": 8.515378002077341} +{"Pretrain/Learning Rate": 4.950660594826064e-05, "Pretrain/Loss": 2.13999080657959, "Pretrain/Loss (Raw)": 2.378467082977295, "Pretrain/Step": 872, "Pretrain/Step Time": 8.510838814079762} +{"Pretrain/Learning Rate": 4.9504926157397436e-05, "Pretrain/Loss": 2.139146566390991, "Pretrain/Loss (Raw)": 1.9513976573944092, "Pretrain/Step": 873, "Pretrain/Step Time": 8.509133487939835} +{"Pretrain/Learning Rate": 4.950324354051068e-05, "Pretrain/Loss": 2.1399102210998535, "Pretrain/Loss (Raw)": 2.091977834701538, "Pretrain/Step": 874, "Pretrain/Step Time": 8.512509057298303} +{"Pretrain/Learning Rate": 4.950155809779442e-05, "Pretrain/Loss": 2.138392925262451, "Pretrain/Loss (Raw)": 1.9094552993774414, "Pretrain/Step": 875, "Pretrain/Step Time": 8.516076561063528} +{"Pretrain/Learning Rate": 4.9499869829443026e-05, "Pretrain/Loss": 2.136655330657959, "Pretrain/Loss (Raw)": 2.0242104530334473, "Pretrain/Step": 876, "Pretrain/Step Time": 8.514728009700775} +{"Pretrain/Learning Rate": 4.9498178735651184e-05, "Pretrain/Loss": 2.1389782428741455, "Pretrain/Loss (Raw)": 2.286132335662842, "Pretrain/Step": 877, "Pretrain/Step Time": 8.511359088122845} +{"Pretrain/Learning Rate": 4.949648481661394e-05, "Pretrain/Loss": 2.1375880241394043, "Pretrain/Loss (Raw)": 2.111395835876465, "Pretrain/Step": 878, "Pretrain/Step Time": 8.507580796256661} +{"Pretrain/Learning Rate": 4.949478807252663e-05, "Pretrain/Loss": 2.1370086669921875, "Pretrain/Loss (Raw)": 2.0543458461761475, "Pretrain/Step": 879, "Pretrain/Step Time": 8.511769374832511} +{"Pretrain/Learning Rate": 4.949308850358494e-05, "Pretrain/Loss": 2.1357884407043457, "Pretrain/Loss (Raw)": 2.1502535343170166, "Pretrain/Step": 880, "Pretrain/Step Time": 8.510872974991798} +{"Pretrain/Learning Rate": 4.949138610998487e-05, "Pretrain/Loss": 2.1356914043426514, "Pretrain/Loss (Raw)": 2.092561721801758, "Pretrain/Step": 881, "Pretrain/Step Time": 8.511964403092861} +{"Pretrain/Learning Rate": 4.9489680891922746e-05, "Pretrain/Loss": 2.1354475021362305, "Pretrain/Loss (Raw)": 2.093430280685425, "Pretrain/Step": 882, "Pretrain/Step Time": 8.512967564165592} +{"Pretrain/Learning Rate": 4.948797284959522e-05, "Pretrain/Loss": 2.137176036834717, "Pretrain/Loss (Raw)": 2.271620035171509, "Pretrain/Step": 883, "Pretrain/Step Time": 8.504966620355844} +{"Pretrain/Learning Rate": 4.948626198319928e-05, "Pretrain/Loss": 2.1351044178009033, "Pretrain/Loss (Raw)": 2.0355114936828613, "Pretrain/Step": 884, "Pretrain/Step Time": 8.504845693707466} +{"Pretrain/Learning Rate": 4.948454829293222e-05, "Pretrain/Loss": 2.134683609008789, "Pretrain/Loss (Raw)": 2.068392515182495, "Pretrain/Step": 885, "Pretrain/Step Time": 8.511761780828238} +{"Pretrain/Learning Rate": 4.9482831778991676e-05, "Pretrain/Loss": 2.137209892272949, "Pretrain/Loss (Raw)": 2.3522157669067383, "Pretrain/Step": 886, "Pretrain/Step Time": 8.515962084755301} +{"Pretrain/Learning Rate": 4.9481112441575605e-05, "Pretrain/Loss": 2.1355020999908447, "Pretrain/Loss (Raw)": 2.0642311573028564, "Pretrain/Step": 887, "Pretrain/Step Time": 8.51976465061307} +{"Pretrain/Learning Rate": 4.947939028088229e-05, "Pretrain/Loss": 2.133939743041992, "Pretrain/Loss (Raw)": 1.9527920484542847, "Pretrain/Step": 888, "Pretrain/Step Time": 8.516850067302585} +{"Pretrain/Learning Rate": 4.947766529711033e-05, "Pretrain/Loss": 2.133453845977783, "Pretrain/Loss (Raw)": 2.1082370281219482, "Pretrain/Step": 889, "Pretrain/Step Time": 8.513551751151681} +{"Pretrain/Learning Rate": 4.947593749045867e-05, "Pretrain/Loss": 2.1341917514801025, "Pretrain/Loss (Raw)": 2.226646661758423, "Pretrain/Step": 890, "Pretrain/Step Time": 8.513794794678688} +{"Pretrain/Learning Rate": 4.947420686112657e-05, "Pretrain/Loss": 2.131507396697998, "Pretrain/Loss (Raw)": 1.959230899810791, "Pretrain/Step": 891, "Pretrain/Step Time": 8.514069905504584} +{"Pretrain/Learning Rate": 4.9472473409313605e-05, "Pretrain/Loss": 2.1311886310577393, "Pretrain/Loss (Raw)": 2.0867466926574707, "Pretrain/Step": 892, "Pretrain/Step Time": 8.51472127251327} +{"Pretrain/Learning Rate": 4.947073713521968e-05, "Pretrain/Loss": 2.1311583518981934, "Pretrain/Loss (Raw)": 2.123472213745117, "Pretrain/Step": 893, "Pretrain/Step Time": 8.513542536646128} +{"Pretrain/Learning Rate": 4.9468998039045046e-05, "Pretrain/Loss": 2.1273159980773926, "Pretrain/Loss (Raw)": 1.7330877780914307, "Pretrain/Step": 894, "Pretrain/Step Time": 8.51256244070828} +{"Pretrain/Learning Rate": 4.946725612099026e-05, "Pretrain/Loss": 2.126793146133423, "Pretrain/Loss (Raw)": 2.0597498416900635, "Pretrain/Step": 895, "Pretrain/Step Time": 8.508391985669732} +{"Pretrain/Learning Rate": 4.9465511381256204e-05, "Pretrain/Loss": 2.1271023750305176, "Pretrain/Loss (Raw)": 2.1015520095825195, "Pretrain/Step": 896, "Pretrain/Step Time": 8.504968898370862} +{"Pretrain/Learning Rate": 4.946376382004408e-05, "Pretrain/Loss": 2.1261110305786133, "Pretrain/Loss (Raw)": 2.0480563640594482, "Pretrain/Step": 897, "Pretrain/Step Time": 8.501976739615202} +{"Pretrain/Learning Rate": 4.9462013437555446e-05, "Pretrain/Loss": 2.1264843940734863, "Pretrain/Loss (Raw)": 2.171247720718384, "Pretrain/Step": 898, "Pretrain/Step Time": 8.510589743033051} +{"Pretrain/Learning Rate": 4.946026023399215e-05, "Pretrain/Loss": 2.1279423236846924, "Pretrain/Loss (Raw)": 2.2776498794555664, "Pretrain/Step": 899, "Pretrain/Step Time": 8.509440030902624} +{"Pretrain/Learning Rate": 4.9458504209556377e-05, "Pretrain/Loss": 2.127376079559326, "Pretrain/Loss (Raw)": 1.9209938049316406, "Pretrain/Step": 900, "Pretrain/Step Time": 8.50761222280562} +{"Pretrain/Learning Rate": 4.945674536445065e-05, "Pretrain/Loss": 2.1290526390075684, "Pretrain/Loss (Raw)": 2.5287258625030518, "Pretrain/Step": 901, "Pretrain/Step Time": 8.501532565802336} +{"Pretrain/Learning Rate": 4.945498369887781e-05, "Pretrain/Loss": 2.130354881286621, "Pretrain/Loss (Raw)": 2.3867850303649902, "Pretrain/Step": 902, "Pretrain/Step Time": 8.498111544176936} +{"Pretrain/Learning Rate": 4.945321921304101e-05, "Pretrain/Loss": 2.132068157196045, "Pretrain/Loss (Raw)": 2.29227352142334, "Pretrain/Step": 903, "Pretrain/Step Time": 8.502441992983222} +{"Pretrain/Learning Rate": 4.945145190714374e-05, "Pretrain/Loss": 2.1334619522094727, "Pretrain/Loss (Raw)": 2.1446022987365723, "Pretrain/Step": 904, "Pretrain/Step Time": 8.509031008929014} +{"Pretrain/Learning Rate": 4.944968178138982e-05, "Pretrain/Loss": 2.1318392753601074, "Pretrain/Loss (Raw)": 2.1109087467193604, "Pretrain/Step": 905, "Pretrain/Step Time": 8.51859175041318} +{"Pretrain/Learning Rate": 4.944790883598339e-05, "Pretrain/Loss": 2.1328485012054443, "Pretrain/Loss (Raw)": 2.1781458854675293, "Pretrain/Step": 906, "Pretrain/Step Time": 8.514993535354733} +{"Pretrain/Learning Rate": 4.9446133071128905e-05, "Pretrain/Loss": 2.1345701217651367, "Pretrain/Loss (Raw)": 2.4031176567077637, "Pretrain/Step": 907, "Pretrain/Step Time": 8.513661585748196} +{"Pretrain/Learning Rate": 4.944435448703116e-05, "Pretrain/Loss": 2.13556170463562, "Pretrain/Loss (Raw)": 2.265042781829834, "Pretrain/Step": 908, "Pretrain/Step Time": 8.50687482394278} +{"Pretrain/Learning Rate": 4.944257308389528e-05, "Pretrain/Loss": 2.136727809906006, "Pretrain/Loss (Raw)": 1.9868264198303223, "Pretrain/Step": 909, "Pretrain/Step Time": 8.508701862767339} +{"Pretrain/Learning Rate": 4.944078886192668e-05, "Pretrain/Loss": 2.1363635063171387, "Pretrain/Loss (Raw)": 2.1906135082244873, "Pretrain/Step": 910, "Pretrain/Step Time": 8.510969491675496} +{"Pretrain/Learning Rate": 4.943900182133116e-05, "Pretrain/Loss": 2.1362099647521973, "Pretrain/Loss (Raw)": 1.9240963459014893, "Pretrain/Step": 911, "Pretrain/Step Time": 8.514667877927423} +{"Pretrain/Learning Rate": 4.943721196231477e-05, "Pretrain/Loss": 2.136934518814087, "Pretrain/Loss (Raw)": 2.1029539108276367, "Pretrain/Step": 912, "Pretrain/Step Time": 8.508940072730184} +{"Pretrain/Learning Rate": 4.943541928508395e-05, "Pretrain/Loss": 2.1359572410583496, "Pretrain/Loss (Raw)": 2.03560733795166, "Pretrain/Step": 913, "Pretrain/Step Time": 8.50778536312282} +{"Pretrain/Learning Rate": 4.9433623789845426e-05, "Pretrain/Loss": 2.134472370147705, "Pretrain/Loss (Raw)": 1.979866623878479, "Pretrain/Step": 914, "Pretrain/Step Time": 8.500885613262653} +{"Pretrain/Learning Rate": 4.943182547680629e-05, "Pretrain/Loss": 2.1368868350982666, "Pretrain/Loss (Raw)": 2.274287223815918, "Pretrain/Step": 915, "Pretrain/Step Time": 8.509301884099841} +{"Pretrain/Learning Rate": 4.94300243461739e-05, "Pretrain/Loss": 2.1348414421081543, "Pretrain/Loss (Raw)": 1.9954510927200317, "Pretrain/Step": 916, "Pretrain/Step Time": 8.5138501804322} +{"Pretrain/Learning Rate": 4.9428220398155986e-05, "Pretrain/Loss": 2.1350150108337402, "Pretrain/Loss (Raw)": 2.308518886566162, "Pretrain/Step": 917, "Pretrain/Step Time": 8.514472229406238} +{"Pretrain/Learning Rate": 4.94264136329606e-05, "Pretrain/Loss": 2.1339616775512695, "Pretrain/Loss (Raw)": 2.136399745941162, "Pretrain/Step": 918, "Pretrain/Step Time": 8.516234751790762} +{"Pretrain/Learning Rate": 4.942460405079608e-05, "Pretrain/Loss": 2.1314172744750977, "Pretrain/Loss (Raw)": 1.974363923072815, "Pretrain/Step": 919, "Pretrain/Step Time": 8.50681466422975} +{"Pretrain/Learning Rate": 4.942279165187113e-05, "Pretrain/Loss": 2.1307430267333984, "Pretrain/Loss (Raw)": 2.1854376792907715, "Pretrain/Step": 920, "Pretrain/Step Time": 8.50248490087688} +{"Pretrain/Learning Rate": 4.9420976436394764e-05, "Pretrain/Loss": 2.1348438262939453, "Pretrain/Loss (Raw)": 2.2065773010253906, "Pretrain/Step": 921, "Pretrain/Step Time": 8.500686654821038} +{"Pretrain/Learning Rate": 4.941915840457632e-05, "Pretrain/Loss": 2.1359658241271973, "Pretrain/Loss (Raw)": 2.1327221393585205, "Pretrain/Step": 922, "Pretrain/Step Time": 8.509089155122638} +{"Pretrain/Learning Rate": 4.941733755662545e-05, "Pretrain/Loss": 2.137545585632324, "Pretrain/Loss (Raw)": 2.271252393722534, "Pretrain/Step": 923, "Pretrain/Step Time": 8.51370957121253} +{"Pretrain/Learning Rate": 4.941551389275217e-05, "Pretrain/Loss": 2.1374926567077637, "Pretrain/Loss (Raw)": 2.229156494140625, "Pretrain/Step": 924, "Pretrain/Step Time": 8.513213887810707} +{"Pretrain/Learning Rate": 4.9413687413166777e-05, "Pretrain/Loss": 2.13803768157959, "Pretrain/Loss (Raw)": 2.0678369998931885, "Pretrain/Step": 925, "Pretrain/Step Time": 8.507971560582519} +{"Pretrain/Learning Rate": 4.94118581180799e-05, "Pretrain/Loss": 2.134608268737793, "Pretrain/Loss (Raw)": 1.9671807289123535, "Pretrain/Step": 926, "Pretrain/Step Time": 8.514346977695823} +{"Pretrain/Learning Rate": 4.9410026007702525e-05, "Pretrain/Loss": 2.135741949081421, "Pretrain/Loss (Raw)": 2.1955864429473877, "Pretrain/Step": 927, "Pretrain/Step Time": 8.518831174820662} +{"Pretrain/Learning Rate": 4.940819108224592e-05, "Pretrain/Loss": 2.135404586791992, "Pretrain/Loss (Raw)": 2.1398627758026123, "Pretrain/Step": 928, "Pretrain/Step Time": 8.520540939643979} +{"Pretrain/Learning Rate": 4.940635334192171e-05, "Pretrain/Loss": 2.1362619400024414, "Pretrain/Loss (Raw)": 2.133981466293335, "Pretrain/Step": 929, "Pretrain/Step Time": 8.521881140768528} +{"Pretrain/Learning Rate": 4.940451278694181e-05, "Pretrain/Loss": 2.134451150894165, "Pretrain/Loss (Raw)": 1.905446171760559, "Pretrain/Step": 930, "Pretrain/Step Time": 8.514668919146061} +{"Pretrain/Learning Rate": 4.9402669417518514e-05, "Pretrain/Loss": 2.135989189147949, "Pretrain/Loss (Raw)": 2.0890300273895264, "Pretrain/Step": 931, "Pretrain/Step Time": 8.506254183128476} +{"Pretrain/Learning Rate": 4.940082323386439e-05, "Pretrain/Loss": 2.1344361305236816, "Pretrain/Loss (Raw)": 1.9412596225738525, "Pretrain/Step": 932, "Pretrain/Step Time": 8.509847663342953} +{"Pretrain/Learning Rate": 4.939897423619234e-05, "Pretrain/Loss": 2.133406639099121, "Pretrain/Loss (Raw)": 2.2054262161254883, "Pretrain/Step": 933, "Pretrain/Step Time": 8.513601263985038} +{"Pretrain/Learning Rate": 4.9397122424715624e-05, "Pretrain/Loss": 2.1334691047668457, "Pretrain/Loss (Raw)": 2.2208030223846436, "Pretrain/Step": 934, "Pretrain/Step Time": 8.517423123121262} +{"Pretrain/Learning Rate": 4.939526779964778e-05, "Pretrain/Loss": 2.1329212188720703, "Pretrain/Loss (Raw)": 2.0928025245666504, "Pretrain/Step": 935, "Pretrain/Step Time": 8.515703674405813} +{"Pretrain/Learning Rate": 4.9393410361202694e-05, "Pretrain/Loss": 2.13448429107666, "Pretrain/Loss (Raw)": 2.2794885635375977, "Pretrain/Step": 936, "Pretrain/Step Time": 8.510678626596928} +{"Pretrain/Learning Rate": 4.9391550109594584e-05, "Pretrain/Loss": 2.136134147644043, "Pretrain/Loss (Raw)": 2.457547903060913, "Pretrain/Step": 937, "Pretrain/Step Time": 8.503823935985565} +{"Pretrain/Learning Rate": 4.938968704503798e-05, "Pretrain/Loss": 2.1348483562469482, "Pretrain/Loss (Raw)": 2.1735715866088867, "Pretrain/Step": 938, "Pretrain/Step Time": 8.497594805434346} +{"Pretrain/Learning Rate": 4.938782116774774e-05, "Pretrain/Loss": 2.138028621673584, "Pretrain/Loss (Raw)": 2.6197803020477295, "Pretrain/Step": 939, "Pretrain/Step Time": 8.50001822412014} +{"Pretrain/Learning Rate": 4.938595247793903e-05, "Pretrain/Loss": 2.1364879608154297, "Pretrain/Loss (Raw)": 2.0831594467163086, "Pretrain/Step": 940, "Pretrain/Step Time": 8.509008111432195} +{"Pretrain/Learning Rate": 4.938408097582738e-05, "Pretrain/Loss": 2.1367249488830566, "Pretrain/Loss (Raw)": 2.2159202098846436, "Pretrain/Step": 941, "Pretrain/Step Time": 8.513206945732236} +{"Pretrain/Learning Rate": 4.9382206661628615e-05, "Pretrain/Loss": 2.136056423187256, "Pretrain/Loss (Raw)": 1.9805611371994019, "Pretrain/Step": 942, "Pretrain/Step Time": 8.50952017493546} +{"Pretrain/Learning Rate": 4.9380329535558887e-05, "Pretrain/Loss": 2.135242223739624, "Pretrain/Loss (Raw)": 2.0078399181365967, "Pretrain/Step": 943, "Pretrain/Step Time": 8.511573527008295} +{"Pretrain/Learning Rate": 4.9378449597834664e-05, "Pretrain/Loss": 2.136043071746826, "Pretrain/Loss (Raw)": 2.2384581565856934, "Pretrain/Step": 944, "Pretrain/Step Time": 8.510018981993198} +{"Pretrain/Learning Rate": 4.937656684867276e-05, "Pretrain/Loss": 2.138103485107422, "Pretrain/Loss (Raw)": 2.274733066558838, "Pretrain/Step": 945, "Pretrain/Step Time": 8.519239749759436} +{"Pretrain/Learning Rate": 4.93746812882903e-05, "Pretrain/Loss": 2.139910936355591, "Pretrain/Loss (Raw)": 2.213087797164917, "Pretrain/Step": 946, "Pretrain/Step Time": 8.521941998973489} +{"Pretrain/Learning Rate": 4.937279291690474e-05, "Pretrain/Loss": 2.140925884246826, "Pretrain/Loss (Raw)": 2.167614698410034, "Pretrain/Step": 947, "Pretrain/Step Time": 8.522955184802413} +{"Pretrain/Learning Rate": 4.9370901734733856e-05, "Pretrain/Loss": 2.1418557167053223, "Pretrain/Loss (Raw)": 2.23286771774292, "Pretrain/Step": 948, "Pretrain/Step Time": 8.51475015282631} +{"Pretrain/Learning Rate": 4.936900774199573e-05, "Pretrain/Loss": 2.142253875732422, "Pretrain/Loss (Raw)": 2.2360899448394775, "Pretrain/Step": 949, "Pretrain/Step Time": 8.509478701278567} +{"Pretrain/Learning Rate": 4.936711093890881e-05, "Pretrain/Loss": 2.1431455612182617, "Pretrain/Loss (Raw)": 2.3745615482330322, "Pretrain/Step": 950, "Pretrain/Step Time": 8.509314876049757} +{"Pretrain/Learning Rate": 4.936521132569184e-05, "Pretrain/Loss": 2.138578176498413, "Pretrain/Loss (Raw)": 1.9210432767868042, "Pretrain/Step": 951, "Pretrain/Step Time": 8.51105192489922} +{"Pretrain/Learning Rate": 4.936330890256388e-05, "Pretrain/Loss": 2.13799786567688, "Pretrain/Loss (Raw)": 2.143247365951538, "Pretrain/Step": 952, "Pretrain/Step Time": 8.513573929667473} +{"Pretrain/Learning Rate": 4.9361403669744336e-05, "Pretrain/Loss": 2.1371359825134277, "Pretrain/Loss (Raw)": 2.0467498302459717, "Pretrain/Step": 953, "Pretrain/Step Time": 8.513562520965934} +{"Pretrain/Learning Rate": 4.935949562745293e-05, "Pretrain/Loss": 2.1406891345977783, "Pretrain/Loss (Raw)": 2.4891767501831055, "Pretrain/Step": 954, "Pretrain/Step Time": 8.507956640794873} +{"Pretrain/Learning Rate": 4.93575847759097e-05, "Pretrain/Loss": 2.1404776573181152, "Pretrain/Loss (Raw)": 2.1576244831085205, "Pretrain/Step": 955, "Pretrain/Step Time": 8.507522651925683} +{"Pretrain/Learning Rate": 4.9355671115335015e-05, "Pretrain/Loss": 2.140085458755493, "Pretrain/Loss (Raw)": 2.0806725025177, "Pretrain/Step": 956, "Pretrain/Step Time": 8.509669369086623} +{"Pretrain/Learning Rate": 4.935375464594957e-05, "Pretrain/Loss": 2.1395885944366455, "Pretrain/Loss (Raw)": 2.111560106277466, "Pretrain/Step": 957, "Pretrain/Step Time": 8.509459633380175} +{"Pretrain/Learning Rate": 4.9351835367974375e-05, "Pretrain/Loss": 2.1402196884155273, "Pretrain/Loss (Raw)": 2.2762370109558105, "Pretrain/Step": 958, "Pretrain/Step Time": 8.509590780362487} +{"Pretrain/Learning Rate": 4.9349913281630786e-05, "Pretrain/Loss": 2.1408352851867676, "Pretrain/Loss (Raw)": 2.1137216091156006, "Pretrain/Step": 959, "Pretrain/Step Time": 8.50685253366828} +{"Pretrain/Learning Rate": 4.934798838714045e-05, "Pretrain/Loss": 2.141585111618042, "Pretrain/Loss (Raw)": 2.3239288330078125, "Pretrain/Step": 960, "Pretrain/Step Time": 8.501228909939528} +{"Pretrain/Learning Rate": 4.9346060684725364e-05, "Pretrain/Loss": 2.1419386863708496, "Pretrain/Loss (Raw)": 1.9845788478851318, "Pretrain/Step": 961, "Pretrain/Step Time": 8.50317818671465} +{"Pretrain/Learning Rate": 4.934413017460784e-05, "Pretrain/Loss": 2.1414289474487305, "Pretrain/Loss (Raw)": 2.087333917617798, "Pretrain/Step": 962, "Pretrain/Step Time": 8.508645059540868} +{"Pretrain/Learning Rate": 4.93421968570105e-05, "Pretrain/Loss": 2.1407153606414795, "Pretrain/Loss (Raw)": 2.154853105545044, "Pretrain/Step": 963, "Pretrain/Step Time": 8.515329556539655} +{"Pretrain/Learning Rate": 4.934026073215633e-05, "Pretrain/Loss": 2.1396188735961914, "Pretrain/Loss (Raw)": 2.0646257400512695, "Pretrain/Step": 964, "Pretrain/Step Time": 8.521630255505443} +{"Pretrain/Learning Rate": 4.933832180026858e-05, "Pretrain/Loss": 2.13887882232666, "Pretrain/Loss (Raw)": 2.0674586296081543, "Pretrain/Step": 965, "Pretrain/Step Time": 8.515406098216772} +{"Pretrain/Learning Rate": 4.933638006157089e-05, "Pretrain/Loss": 2.141719341278076, "Pretrain/Loss (Raw)": 2.2860703468322754, "Pretrain/Step": 966, "Pretrain/Step Time": 8.504308674484491} +{"Pretrain/Learning Rate": 4.933443551628717e-05, "Pretrain/Loss": 2.140305280685425, "Pretrain/Loss (Raw)": 1.931066632270813, "Pretrain/Step": 967, "Pretrain/Step Time": 8.504543581977487} +{"Pretrain/Learning Rate": 4.933248816464168e-05, "Pretrain/Loss": 2.139371395111084, "Pretrain/Loss (Raw)": 2.010390043258667, "Pretrain/Step": 968, "Pretrain/Step Time": 8.511292172595859} +{"Pretrain/Learning Rate": 4.933053800685899e-05, "Pretrain/Loss": 2.1402945518493652, "Pretrain/Loss (Raw)": 2.3093037605285645, "Pretrain/Step": 969, "Pretrain/Step Time": 8.510687349364161} +{"Pretrain/Learning Rate": 4.932858504316401e-05, "Pretrain/Loss": 2.143918514251709, "Pretrain/Loss (Raw)": 2.2497222423553467, "Pretrain/Step": 970, "Pretrain/Step Time": 8.508307946845889} +{"Pretrain/Learning Rate": 4.932662927378196e-05, "Pretrain/Loss": 2.143263339996338, "Pretrain/Loss (Raw)": 2.2583794593811035, "Pretrain/Step": 971, "Pretrain/Step Time": 8.51031007617712} +{"Pretrain/Learning Rate": 4.93246706989384e-05, "Pretrain/Loss": 2.1413121223449707, "Pretrain/Loss (Raw)": 1.9977425336837769, "Pretrain/Step": 972, "Pretrain/Step Time": 8.498127842321992} +{"Pretrain/Learning Rate": 4.932270931885918e-05, "Pretrain/Loss": 2.141843318939209, "Pretrain/Loss (Raw)": 2.2056784629821777, "Pretrain/Step": 973, "Pretrain/Step Time": 8.50064406171441} +{"Pretrain/Learning Rate": 4.9320745133770524e-05, "Pretrain/Loss": 2.141187906265259, "Pretrain/Loss (Raw)": 2.0929768085479736, "Pretrain/Step": 974, "Pretrain/Step Time": 8.502981707453728} +{"Pretrain/Learning Rate": 4.931877814389893e-05, "Pretrain/Loss": 2.1403121948242188, "Pretrain/Loss (Raw)": 2.0801751613616943, "Pretrain/Step": 975, "Pretrain/Step Time": 8.503715498372912} +{"Pretrain/Learning Rate": 4.931680834947124e-05, "Pretrain/Loss": 2.1397805213928223, "Pretrain/Loss (Raw)": 1.964779019355774, "Pretrain/Step": 976, "Pretrain/Step Time": 8.507800403982401} +{"Pretrain/Learning Rate": 4.9314835750714635e-05, "Pretrain/Loss": 2.137969732284546, "Pretrain/Loss (Raw)": 1.8892377614974976, "Pretrain/Step": 977, "Pretrain/Step Time": 8.499148709699512} +{"Pretrain/Learning Rate": 4.9312860347856595e-05, "Pretrain/Loss": 2.1393728256225586, "Pretrain/Loss (Raw)": 2.216015577316284, "Pretrain/Step": 978, "Pretrain/Step Time": 8.496299095451832} +{"Pretrain/Learning Rate": 4.931088214112494e-05, "Pretrain/Loss": 2.1421284675598145, "Pretrain/Loss (Raw)": 2.183561325073242, "Pretrain/Step": 979, "Pretrain/Step Time": 8.491905646398664} +{"Pretrain/Learning Rate": 4.930890113074779e-05, "Pretrain/Loss": 2.1429874897003174, "Pretrain/Loss (Raw)": 2.3170151710510254, "Pretrain/Step": 980, "Pretrain/Step Time": 8.498359847813845} +{"Pretrain/Learning Rate": 4.930691731695362e-05, "Pretrain/Loss": 2.1414971351623535, "Pretrain/Loss (Raw)": 2.0737416744232178, "Pretrain/Step": 981, "Pretrain/Step Time": 8.502334138378501} +{"Pretrain/Learning Rate": 4.9304930699971194e-05, "Pretrain/Loss": 2.1401782035827637, "Pretrain/Loss (Raw)": 2.062814712524414, "Pretrain/Step": 982, "Pretrain/Step Time": 8.509986456483603} +{"Pretrain/Learning Rate": 4.9302941280029645e-05, "Pretrain/Loss": 2.140934467315674, "Pretrain/Loss (Raw)": 2.1538360118865967, "Pretrain/Step": 983, "Pretrain/Step Time": 8.511701820418239} +{"Pretrain/Learning Rate": 4.930094905735838e-05, "Pretrain/Loss": 2.142754554748535, "Pretrain/Loss (Raw)": 2.1271228790283203, "Pretrain/Step": 984, "Pretrain/Step Time": 8.50602643750608} +{"Pretrain/Learning Rate": 4.929895403218717e-05, "Pretrain/Loss": 2.1440815925598145, "Pretrain/Loss (Raw)": 2.038541078567505, "Pretrain/Step": 985, "Pretrain/Step Time": 8.508916553109884} +{"Pretrain/Learning Rate": 4.929695620474607e-05, "Pretrain/Loss": 2.1431941986083984, "Pretrain/Loss (Raw)": 2.147824287414551, "Pretrain/Step": 986, "Pretrain/Step Time": 8.513371277600527} +{"Pretrain/Learning Rate": 4.9294955575265494e-05, "Pretrain/Loss": 2.1446409225463867, "Pretrain/Loss (Raw)": 2.383232355117798, "Pretrain/Step": 987, "Pretrain/Step Time": 8.513704055920243} +{"Pretrain/Learning Rate": 4.929295214397616e-05, "Pretrain/Loss": 2.143609046936035, "Pretrain/Loss (Raw)": 2.0030765533447266, "Pretrain/Step": 988, "Pretrain/Step Time": 8.516528222709894} +{"Pretrain/Learning Rate": 4.929094591110911e-05, "Pretrain/Loss": 2.14339017868042, "Pretrain/Loss (Raw)": 2.1026337146759033, "Pretrain/Step": 989, "Pretrain/Step Time": 8.513960441574454} +{"Pretrain/Learning Rate": 4.928893687689572e-05, "Pretrain/Loss": 2.139008045196533, "Pretrain/Loss (Raw)": 2.133546829223633, "Pretrain/Step": 990, "Pretrain/Step Time": 8.502454340457916} +{"Pretrain/Learning Rate": 4.928692504156767e-05, "Pretrain/Loss": 2.1375324726104736, "Pretrain/Loss (Raw)": 2.1154654026031494, "Pretrain/Step": 991, "Pretrain/Step Time": 8.50052004121244} +{"Pretrain/Learning Rate": 4.928491040535699e-05, "Pretrain/Loss": 2.13662052154541, "Pretrain/Loss (Raw)": 2.0529184341430664, "Pretrain/Step": 992, "Pretrain/Step Time": 8.510439472272992} +{"Pretrain/Learning Rate": 4.9282892968495995e-05, "Pretrain/Loss": 2.1372528076171875, "Pretrain/Loss (Raw)": 2.0895981788635254, "Pretrain/Step": 993, "Pretrain/Step Time": 8.508711891248822} +{"Pretrain/Learning Rate": 4.928087273121737e-05, "Pretrain/Loss": 2.1353464126586914, "Pretrain/Loss (Raw)": 2.005324363708496, "Pretrain/Step": 994, "Pretrain/Step Time": 8.509489592164755} +{"Pretrain/Learning Rate": 4.9278849693754076e-05, "Pretrain/Loss": 2.1365878582000732, "Pretrain/Loss (Raw)": 2.1488113403320312, "Pretrain/Step": 995, "Pretrain/Step Time": 8.50100514665246} +{"Pretrain/Learning Rate": 4.927682385633944e-05, "Pretrain/Loss": 2.137573719024658, "Pretrain/Loss (Raw)": 2.2519795894622803, "Pretrain/Step": 996, "Pretrain/Step Time": 8.492796033620834} +{"Pretrain/Learning Rate": 4.927479521920707e-05, "Pretrain/Loss": 2.138958215713501, "Pretrain/Loss (Raw)": 2.1925747394561768, "Pretrain/Step": 997, "Pretrain/Step Time": 8.495206901803613} +{"Pretrain/Learning Rate": 4.927276378259094e-05, "Pretrain/Loss": 2.1389288902282715, "Pretrain/Loss (Raw)": 2.095871925354004, "Pretrain/Step": 998, "Pretrain/Step Time": 8.503012416884303} +{"Pretrain/Learning Rate": 4.9270729546725305e-05, "Pretrain/Loss": 2.1409380435943604, "Pretrain/Loss (Raw)": 2.382930278778076, "Pretrain/Step": 999, "Pretrain/Step Time": 8.507368590682745} +{"Pretrain/Learning Rate": 4.9268692511844774e-05, "Pretrain/Loss": 2.1380186080932617, "Pretrain/Loss (Raw)": 2.0048165321350098, "Pretrain/Step": 1000, "Pretrain/Step Time": 8.512724820524454} +{"Pretrain/Learning Rate": 4.926665267818426e-05, "Pretrain/Loss": 2.140780448913574, "Pretrain/Loss (Raw)": 2.30489182472229, "Pretrain/Step": 1001, "Pretrain/Step Time": 8.512259928509593} +{"Pretrain/Learning Rate": 4.926461004597901e-05, "Pretrain/Loss": 2.1415963172912598, "Pretrain/Loss (Raw)": 2.1964237689971924, "Pretrain/Step": 1002, "Pretrain/Step Time": 8.50651046819985} +{"Pretrain/Learning Rate": 4.92625646154646e-05, "Pretrain/Loss": 2.1426634788513184, "Pretrain/Loss (Raw)": 2.0460174083709717, "Pretrain/Step": 1003, "Pretrain/Step Time": 8.50700230896473} +{"Pretrain/Learning Rate": 4.926051638687691e-05, "Pretrain/Loss": 2.142148971557617, "Pretrain/Loss (Raw)": 1.9583592414855957, "Pretrain/Step": 1004, "Pretrain/Step Time": 8.508435787633061} +{"Pretrain/Learning Rate": 4.925846536045215e-05, "Pretrain/Loss": 2.1412036418914795, "Pretrain/Loss (Raw)": 2.165149211883545, "Pretrain/Step": 1005, "Pretrain/Step Time": 8.511817304417491} +{"Pretrain/Learning Rate": 4.925641153642684e-05, "Pretrain/Loss": 2.1414151191711426, "Pretrain/Loss (Raw)": 2.13844633102417, "Pretrain/Step": 1006, "Pretrain/Step Time": 8.514970254153013} +{"Pretrain/Learning Rate": 4.925435491503787e-05, "Pretrain/Loss": 2.140817165374756, "Pretrain/Loss (Raw)": 1.9777922630310059, "Pretrain/Step": 1007, "Pretrain/Step Time": 8.509012922644615} +{"Pretrain/Learning Rate": 4.9252295496522395e-05, "Pretrain/Loss": 2.140958070755005, "Pretrain/Loss (Raw)": 2.168320655822754, "Pretrain/Step": 1008, "Pretrain/Step Time": 8.506661619991064} +{"Pretrain/Learning Rate": 4.925023328111792e-05, "Pretrain/Loss": 2.1397383213043213, "Pretrain/Loss (Raw)": 1.9364362955093384, "Pretrain/Step": 1009, "Pretrain/Step Time": 8.511834252625704} +{"Pretrain/Learning Rate": 4.924816826906227e-05, "Pretrain/Loss": 2.141695976257324, "Pretrain/Loss (Raw)": 2.343984842300415, "Pretrain/Step": 1010, "Pretrain/Step Time": 8.506682964041829} +{"Pretrain/Learning Rate": 4.92461004605936e-05, "Pretrain/Loss": 2.141932249069214, "Pretrain/Loss (Raw)": 2.3018765449523926, "Pretrain/Step": 1011, "Pretrain/Step Time": 8.513322860002518} +{"Pretrain/Learning Rate": 4.924402985595037e-05, "Pretrain/Loss": 2.1429548263549805, "Pretrain/Loss (Raw)": 2.166375160217285, "Pretrain/Step": 1012, "Pretrain/Step Time": 8.51420765556395} +{"Pretrain/Learning Rate": 4.924195645537138e-05, "Pretrain/Loss": 2.142759084701538, "Pretrain/Loss (Raw)": 2.0433619022369385, "Pretrain/Step": 1013, "Pretrain/Step Time": 8.505742320790887} +{"Pretrain/Learning Rate": 4.923988025909574e-05, "Pretrain/Loss": 2.144629716873169, "Pretrain/Loss (Raw)": 2.591656446456909, "Pretrain/Step": 1014, "Pretrain/Step Time": 8.503352330997586} +{"Pretrain/Learning Rate": 4.923780126736288e-05, "Pretrain/Loss": 2.1464030742645264, "Pretrain/Loss (Raw)": 2.2912099361419678, "Pretrain/Step": 1015, "Pretrain/Step Time": 8.502830633893609} +{"Pretrain/Learning Rate": 4.923571948041257e-05, "Pretrain/Loss": 2.1468682289123535, "Pretrain/Loss (Raw)": 2.0123562812805176, "Pretrain/Step": 1016, "Pretrain/Step Time": 8.507290232926607} +{"Pretrain/Learning Rate": 4.923363489848489e-05, "Pretrain/Loss": 2.148489236831665, "Pretrain/Loss (Raw)": 2.3157169818878174, "Pretrain/Step": 1017, "Pretrain/Step Time": 8.507702890783548} +{"Pretrain/Learning Rate": 4.923154752182023e-05, "Pretrain/Loss": 2.14723539352417, "Pretrain/Loss (Raw)": 2.066157817840576, "Pretrain/Step": 1018, "Pretrain/Step Time": 8.508465068414807} +{"Pretrain/Learning Rate": 4.922945735065934e-05, "Pretrain/Loss": 2.1482067108154297, "Pretrain/Loss (Raw)": 2.083575963973999, "Pretrain/Step": 1019, "Pretrain/Step Time": 8.504134574905038} +{"Pretrain/Learning Rate": 4.9227364385243246e-05, "Pretrain/Loss": 2.1477670669555664, "Pretrain/Loss (Raw)": 2.030437469482422, "Pretrain/Step": 1020, "Pretrain/Step Time": 8.506199577823281} +{"Pretrain/Learning Rate": 4.922526862581333e-05, "Pretrain/Loss": 2.1469645500183105, "Pretrain/Loss (Raw)": 2.0207767486572266, "Pretrain/Step": 1021, "Pretrain/Step Time": 8.506109073758125} +{"Pretrain/Learning Rate": 4.922317007261129e-05, "Pretrain/Loss": 2.150322437286377, "Pretrain/Loss (Raw)": 2.1628808975219727, "Pretrain/Step": 1022, "Pretrain/Step Time": 8.50584571249783} +{"Pretrain/Learning Rate": 4.922106872587913e-05, "Pretrain/Loss": 2.1487510204315186, "Pretrain/Loss (Raw)": 1.8586151599884033, "Pretrain/Step": 1023, "Pretrain/Step Time": 8.509846322238445} +{"Pretrain/Learning Rate": 4.921896458585919e-05, "Pretrain/Loss": 2.1495513916015625, "Pretrain/Loss (Raw)": 2.203997850418091, "Pretrain/Step": 1024, "Pretrain/Step Time": 8.515694478526711} +{"Pretrain/Learning Rate": 4.9216857652794125e-05, "Pretrain/Loss": 2.1513431072235107, "Pretrain/Loss (Raw)": 2.277418375015259, "Pretrain/Step": 1025, "Pretrain/Step Time": 8.508809100836515} +{"Pretrain/Learning Rate": 4.921474792692692e-05, "Pretrain/Loss": 2.1517627239227295, "Pretrain/Loss (Raw)": 2.224932909011841, "Pretrain/Step": 1026, "Pretrain/Step Time": 8.500676654279232} +{"Pretrain/Learning Rate": 4.921263540850089e-05, "Pretrain/Loss": 2.150712728500366, "Pretrain/Loss (Raw)": 2.1432721614837646, "Pretrain/Step": 1027, "Pretrain/Step Time": 8.505863811820745} +{"Pretrain/Learning Rate": 4.921052009775965e-05, "Pretrain/Loss": 2.1521263122558594, "Pretrain/Loss (Raw)": 2.101893424987793, "Pretrain/Step": 1028, "Pretrain/Step Time": 8.510994512587786} +{"Pretrain/Learning Rate": 4.9208401994947144e-05, "Pretrain/Loss": 2.148954391479492, "Pretrain/Loss (Raw)": 2.12273907661438, "Pretrain/Step": 1029, "Pretrain/Step Time": 8.516643261536956} +{"Pretrain/Learning Rate": 4.920628110030765e-05, "Pretrain/Loss": 2.1456761360168457, "Pretrain/Loss (Raw)": 1.9671591520309448, "Pretrain/Step": 1030, "Pretrain/Step Time": 8.519116006791592} +{"Pretrain/Learning Rate": 4.920415741408575e-05, "Pretrain/Loss": 2.1432971954345703, "Pretrain/Loss (Raw)": 1.9877930879592896, "Pretrain/Step": 1031, "Pretrain/Step Time": 8.51115646213293} +{"Pretrain/Learning Rate": 4.920203093652637e-05, "Pretrain/Loss": 2.1432766914367676, "Pretrain/Loss (Raw)": 2.141936779022217, "Pretrain/Step": 1032, "Pretrain/Step Time": 8.511384362354875} +{"Pretrain/Learning Rate": 4.919990166787474e-05, "Pretrain/Loss": 2.144132375717163, "Pretrain/Loss (Raw)": 2.2204504013061523, "Pretrain/Step": 1033, "Pretrain/Step Time": 8.506014304235578} +{"Pretrain/Learning Rate": 4.919776960837641e-05, "Pretrain/Loss": 2.143272638320923, "Pretrain/Loss (Raw)": 2.068108558654785, "Pretrain/Step": 1034, "Pretrain/Step Time": 8.504563143476844} +{"Pretrain/Learning Rate": 4.9195634758277264e-05, "Pretrain/Loss": 2.1406984329223633, "Pretrain/Loss (Raw)": 2.073643207550049, "Pretrain/Step": 1035, "Pretrain/Step Time": 8.512593964114785} +{"Pretrain/Learning Rate": 4.919349711782351e-05, "Pretrain/Loss": 2.138302803039551, "Pretrain/Loss (Raw)": 1.9583731889724731, "Pretrain/Step": 1036, "Pretrain/Step Time": 8.518003510311246} +{"Pretrain/Learning Rate": 4.919135668726167e-05, "Pretrain/Loss": 2.1387500762939453, "Pretrain/Loss (Raw)": 2.044102430343628, "Pretrain/Step": 1037, "Pretrain/Step Time": 8.50808048248291} +{"Pretrain/Learning Rate": 4.9189213466838565e-05, "Pretrain/Loss": 2.138373851776123, "Pretrain/Loss (Raw)": 2.142423152923584, "Pretrain/Step": 1038, "Pretrain/Step Time": 8.50567827001214} +{"Pretrain/Learning Rate": 4.91870674568014e-05, "Pretrain/Loss": 2.1411972045898438, "Pretrain/Loss (Raw)": 2.2854838371276855, "Pretrain/Step": 1039, "Pretrain/Step Time": 8.508327424526215} +{"Pretrain/Learning Rate": 4.9184918657397625e-05, "Pretrain/Loss": 2.1418771743774414, "Pretrain/Loss (Raw)": 2.1900181770324707, "Pretrain/Step": 1040, "Pretrain/Step Time": 8.5153139680624} +{"Pretrain/Learning Rate": 4.918276706887508e-05, "Pretrain/Loss": 2.1417131423950195, "Pretrain/Loss (Raw)": 2.0146026611328125, "Pretrain/Step": 1041, "Pretrain/Step Time": 8.516552492976189} +{"Pretrain/Learning Rate": 4.918061269148187e-05, "Pretrain/Loss": 2.1427998542785645, "Pretrain/Loss (Raw)": 2.118969440460205, "Pretrain/Step": 1042, "Pretrain/Step Time": 8.51960650831461} +{"Pretrain/Learning Rate": 4.9178455525466484e-05, "Pretrain/Loss": 2.140313148498535, "Pretrain/Loss (Raw)": 1.9559987783432007, "Pretrain/Step": 1043, "Pretrain/Step Time": 8.5129265319556} +{"Pretrain/Learning Rate": 4.9176295571077655e-05, "Pretrain/Loss": 2.141648769378662, "Pretrain/Loss (Raw)": 2.1663899421691895, "Pretrain/Step": 1044, "Pretrain/Step Time": 8.507731158286333} +{"Pretrain/Learning Rate": 4.917413282856451e-05, "Pretrain/Loss": 2.1395199298858643, "Pretrain/Loss (Raw)": 2.0360214710235596, "Pretrain/Step": 1045, "Pretrain/Step Time": 8.51333206705749} +{"Pretrain/Learning Rate": 4.917196729817645e-05, "Pretrain/Loss": 2.1376919746398926, "Pretrain/Loss (Raw)": 1.902398705482483, "Pretrain/Step": 1046, "Pretrain/Step Time": 8.511281860992312} +{"Pretrain/Learning Rate": 4.9169798980163215e-05, "Pretrain/Loss": 2.139812469482422, "Pretrain/Loss (Raw)": 2.2458393573760986, "Pretrain/Step": 1047, "Pretrain/Step Time": 8.510190287604928} +{"Pretrain/Learning Rate": 4.916762787477487e-05, "Pretrain/Loss": 2.138657569885254, "Pretrain/Loss (Raw)": 2.0375747680664062, "Pretrain/Step": 1048, "Pretrain/Step Time": 8.509433617815375} +{"Pretrain/Learning Rate": 4.91654539822618e-05, "Pretrain/Loss": 2.1384990215301514, "Pretrain/Loss (Raw)": 2.1862974166870117, "Pretrain/Step": 1049, "Pretrain/Step Time": 8.504999868571758} +{"Pretrain/Learning Rate": 4.916327730287471e-05, "Pretrain/Loss": 2.137700319290161, "Pretrain/Loss (Raw)": 2.0304927825927734, "Pretrain/Step": 1050, "Pretrain/Step Time": 8.501804497092962} +{"Pretrain/Learning Rate": 4.916109783686461e-05, "Pretrain/Loss": 2.134293556213379, "Pretrain/Loss (Raw)": 1.835193395614624, "Pretrain/Step": 1051, "Pretrain/Step Time": 8.500073444098234} +{"Pretrain/Learning Rate": 4.915891558448287e-05, "Pretrain/Loss": 2.1325604915618896, "Pretrain/Loss (Raw)": 2.0073230266571045, "Pretrain/Step": 1052, "Pretrain/Step Time": 8.504101507365704} +{"Pretrain/Learning Rate": 4.915673054598113e-05, "Pretrain/Loss": 2.1342246532440186, "Pretrain/Loss (Raw)": 2.2808516025543213, "Pretrain/Step": 1053, "Pretrain/Step Time": 8.50693653896451} +{"Pretrain/Learning Rate": 4.91545427216114e-05, "Pretrain/Loss": 2.134211540222168, "Pretrain/Loss (Raw)": 1.9654864072799683, "Pretrain/Step": 1054, "Pretrain/Step Time": 8.497121335938573} +{"Pretrain/Learning Rate": 4.915235211162599e-05, "Pretrain/Loss": 2.1343774795532227, "Pretrain/Loss (Raw)": 2.2168142795562744, "Pretrain/Step": 1055, "Pretrain/Step Time": 8.489176779985428} +{"Pretrain/Learning Rate": 4.9150158716277516e-05, "Pretrain/Loss": 2.131981134414673, "Pretrain/Loss (Raw)": 1.8331587314605713, "Pretrain/Step": 1056, "Pretrain/Step Time": 8.494891438633204} +{"Pretrain/Learning Rate": 4.9147962535818935e-05, "Pretrain/Loss": 2.131927251815796, "Pretrain/Loss (Raw)": 2.1270523071289062, "Pretrain/Step": 1057, "Pretrain/Step Time": 8.499143309891224} +{"Pretrain/Learning Rate": 4.9145763570503536e-05, "Pretrain/Loss": 2.133211135864258, "Pretrain/Loss (Raw)": 2.0697946548461914, "Pretrain/Step": 1058, "Pretrain/Step Time": 8.503116412088275} +{"Pretrain/Learning Rate": 4.914356182058491e-05, "Pretrain/Loss": 2.1328253746032715, "Pretrain/Loss (Raw)": 2.039668560028076, "Pretrain/Step": 1059, "Pretrain/Step Time": 8.504677752032876} +{"Pretrain/Learning Rate": 4.914135728631695e-05, "Pretrain/Loss": 2.1343817710876465, "Pretrain/Loss (Raw)": 2.1404683589935303, "Pretrain/Step": 1060, "Pretrain/Step Time": 8.50311435200274} +{"Pretrain/Learning Rate": 4.913914996795391e-05, "Pretrain/Loss": 2.134096145629883, "Pretrain/Loss (Raw)": 2.168851613998413, "Pretrain/Step": 1061, "Pretrain/Step Time": 8.497596245259047} +{"Pretrain/Learning Rate": 4.9136939865750357e-05, "Pretrain/Loss": 2.1323561668395996, "Pretrain/Loss (Raw)": 1.998090147972107, "Pretrain/Step": 1062, "Pretrain/Step Time": 8.50051949173212} +{"Pretrain/Learning Rate": 4.913472697996116e-05, "Pretrain/Loss": 2.132561445236206, "Pretrain/Loss (Raw)": 2.1190919876098633, "Pretrain/Step": 1063, "Pretrain/Step Time": 8.511881809681654} +{"Pretrain/Learning Rate": 4.913251131084152e-05, "Pretrain/Loss": 2.129760980606079, "Pretrain/Loss (Raw)": 1.9210373163223267, "Pretrain/Step": 1064, "Pretrain/Step Time": 8.511855531483889} +{"Pretrain/Learning Rate": 4.9130292858646966e-05, "Pretrain/Loss": 2.129582166671753, "Pretrain/Loss (Raw)": 2.434661388397217, "Pretrain/Step": 1065, "Pretrain/Step Time": 8.515032822266221} +{"Pretrain/Learning Rate": 4.912807162363332e-05, "Pretrain/Loss": 2.1284072399139404, "Pretrain/Loss (Raw)": 2.0231666564941406, "Pretrain/Step": 1066, "Pretrain/Step Time": 8.5191222243011} +{"Pretrain/Learning Rate": 4.912584760605677e-05, "Pretrain/Loss": 2.1248679161071777, "Pretrain/Loss (Raw)": 2.1667568683624268, "Pretrain/Step": 1067, "Pretrain/Step Time": 8.514564797282219} +{"Pretrain/Learning Rate": 4.9123620806173785e-05, "Pretrain/Loss": 2.124528408050537, "Pretrain/Loss (Raw)": 2.0397002696990967, "Pretrain/Step": 1068, "Pretrain/Step Time": 8.512015368789434} +{"Pretrain/Learning Rate": 4.9121391224241174e-05, "Pretrain/Loss": 2.1236228942871094, "Pretrain/Loss (Raw)": 2.100022315979004, "Pretrain/Step": 1069, "Pretrain/Step Time": 8.510068286210299} +{"Pretrain/Learning Rate": 4.9119158860516066e-05, "Pretrain/Loss": 2.1236157417297363, "Pretrain/Loss (Raw)": 1.9796439409255981, "Pretrain/Step": 1070, "Pretrain/Step Time": 8.511356493458152} +{"Pretrain/Learning Rate": 4.9116923715255905e-05, "Pretrain/Loss": 2.124269485473633, "Pretrain/Loss (Raw)": 2.0914883613586426, "Pretrain/Step": 1071, "Pretrain/Step Time": 8.511177904903889} +{"Pretrain/Learning Rate": 4.9114685788718454e-05, "Pretrain/Loss": 2.1237564086914062, "Pretrain/Loss (Raw)": 2.172804594039917, "Pretrain/Step": 1072, "Pretrain/Step Time": 8.510902086272836} +{"Pretrain/Learning Rate": 4.9112445081161813e-05, "Pretrain/Loss": 2.1217997074127197, "Pretrain/Loss (Raw)": 2.0242574214935303, "Pretrain/Step": 1073, "Pretrain/Step Time": 8.499625887721777} +{"Pretrain/Learning Rate": 4.9110201592844376e-05, "Pretrain/Loss": 2.1189494132995605, "Pretrain/Loss (Raw)": 1.8482588529586792, "Pretrain/Step": 1074, "Pretrain/Step Time": 8.504972832277417} +{"Pretrain/Learning Rate": 4.910795532402489e-05, "Pretrain/Loss": 2.1181371212005615, "Pretrain/Loss (Raw)": 2.063645362854004, "Pretrain/Step": 1075, "Pretrain/Step Time": 8.511760551482439} +{"Pretrain/Learning Rate": 4.910570627496239e-05, "Pretrain/Loss": 2.117715835571289, "Pretrain/Loss (Raw)": 2.178933620452881, "Pretrain/Step": 1076, "Pretrain/Step Time": 8.5109180547297} +{"Pretrain/Learning Rate": 4.9103454445916256e-05, "Pretrain/Loss": 2.1159074306488037, "Pretrain/Loss (Raw)": 2.0046215057373047, "Pretrain/Step": 1077, "Pretrain/Step Time": 8.51548882201314} +{"Pretrain/Learning Rate": 4.910119983714616e-05, "Pretrain/Loss": 2.1146903038024902, "Pretrain/Loss (Raw)": 2.218785047531128, "Pretrain/Step": 1078, "Pretrain/Step Time": 8.512176560238004} +{"Pretrain/Learning Rate": 4.909894244891214e-05, "Pretrain/Loss": 2.1171727180480957, "Pretrain/Loss (Raw)": 2.238783121109009, "Pretrain/Step": 1079, "Pretrain/Step Time": 8.50838795863092} +{"Pretrain/Learning Rate": 4.909668228147453e-05, "Pretrain/Loss": 2.118079662322998, "Pretrain/Loss (Raw)": 2.2593421936035156, "Pretrain/Step": 1080, "Pretrain/Step Time": 8.50744721479714} +{"Pretrain/Learning Rate": 4.9094419335093966e-05, "Pretrain/Loss": 2.118108034133911, "Pretrain/Loss (Raw)": 2.0503852367401123, "Pretrain/Step": 1081, "Pretrain/Step Time": 8.510681932792068} +{"Pretrain/Learning Rate": 4.909215361003142e-05, "Pretrain/Loss": 2.1149044036865234, "Pretrain/Loss (Raw)": 2.0791172981262207, "Pretrain/Step": 1082, "Pretrain/Step Time": 8.514771591871977} +{"Pretrain/Learning Rate": 4.90898851065482e-05, "Pretrain/Loss": 2.11448335647583, "Pretrain/Loss (Raw)": 2.10371732711792, "Pretrain/Step": 1083, "Pretrain/Step Time": 8.512391043826938} +{"Pretrain/Learning Rate": 4.908761382490591e-05, "Pretrain/Loss": 2.113638401031494, "Pretrain/Loss (Raw)": 1.9725207090377808, "Pretrain/Step": 1084, "Pretrain/Step Time": 8.50740173831582} +{"Pretrain/Learning Rate": 4.908533976536649e-05, "Pretrain/Loss": 2.1145689487457275, "Pretrain/Loss (Raw)": 2.230668067932129, "Pretrain/Step": 1085, "Pretrain/Step Time": 8.50279145874083} +{"Pretrain/Learning Rate": 4.90830629281922e-05, "Pretrain/Loss": 2.113501787185669, "Pretrain/Loss (Raw)": 2.1396570205688477, "Pretrain/Step": 1086, "Pretrain/Step Time": 8.503868447616696} +{"Pretrain/Learning Rate": 4.908078331364561e-05, "Pretrain/Loss": 2.1137773990631104, "Pretrain/Loss (Raw)": 2.148972511291504, "Pretrain/Step": 1087, "Pretrain/Step Time": 8.512758664786816} +{"Pretrain/Learning Rate": 4.907850092198961e-05, "Pretrain/Loss": 2.1130025386810303, "Pretrain/Loss (Raw)": 2.224749803543091, "Pretrain/Step": 1088, "Pretrain/Step Time": 8.51908527687192} +{"Pretrain/Learning Rate": 4.9076215753487425e-05, "Pretrain/Loss": 2.114243507385254, "Pretrain/Loss (Raw)": 2.1434218883514404, "Pretrain/Step": 1089, "Pretrain/Step Time": 8.518277989700437} +{"Pretrain/Learning Rate": 4.9073927808402585e-05, "Pretrain/Loss": 2.1153149604797363, "Pretrain/Loss (Raw)": 2.224489212036133, "Pretrain/Step": 1090, "Pretrain/Step Time": 8.51434007845819} +{"Pretrain/Learning Rate": 4.907163708699896e-05, "Pretrain/Loss": 2.114347457885742, "Pretrain/Loss (Raw)": 2.031013250350952, "Pretrain/Step": 1091, "Pretrain/Step Time": 8.507595300674438} +{"Pretrain/Learning Rate": 4.9069343589540704e-05, "Pretrain/Loss": 2.115797281265259, "Pretrain/Loss (Raw)": 2.2501912117004395, "Pretrain/Step": 1092, "Pretrain/Step Time": 8.505880307406187} +{"Pretrain/Learning Rate": 4.906704731629233e-05, "Pretrain/Loss": 2.115288734436035, "Pretrain/Loss (Raw)": 2.002387762069702, "Pretrain/Step": 1093, "Pretrain/Step Time": 8.513063356280327} +{"Pretrain/Learning Rate": 4.9064748267518656e-05, "Pretrain/Loss": 2.1163718700408936, "Pretrain/Loss (Raw)": 2.424703598022461, "Pretrain/Step": 1094, "Pretrain/Step Time": 8.515050370246172} +{"Pretrain/Learning Rate": 4.9062446443484813e-05, "Pretrain/Loss": 2.1182031631469727, "Pretrain/Loss (Raw)": 2.1654698848724365, "Pretrain/Step": 1095, "Pretrain/Step Time": 8.513255713507533} +{"Pretrain/Learning Rate": 4.9060141844456267e-05, "Pretrain/Loss": 2.1197662353515625, "Pretrain/Loss (Raw)": 2.210465908050537, "Pretrain/Step": 1096, "Pretrain/Step Time": 8.50815256498754} +{"Pretrain/Learning Rate": 4.905783447069878e-05, "Pretrain/Loss": 2.1168925762176514, "Pretrain/Loss (Raw)": 1.9414737224578857, "Pretrain/Step": 1097, "Pretrain/Step Time": 8.509035950526595} +{"Pretrain/Learning Rate": 4.905552432247846e-05, "Pretrain/Loss": 2.115604877471924, "Pretrain/Loss (Raw)": 2.0848944187164307, "Pretrain/Step": 1098, "Pretrain/Step Time": 8.516352340579033} +{"Pretrain/Learning Rate": 4.905321140006172e-05, "Pretrain/Loss": 2.115417003631592, "Pretrain/Loss (Raw)": 2.234325647354126, "Pretrain/Step": 1099, "Pretrain/Step Time": 8.51210468634963} +{"Pretrain/Learning Rate": 4.90508957037153e-05, "Pretrain/Loss": 2.117947578430176, "Pretrain/Loss (Raw)": 2.3216605186462402, "Pretrain/Step": 1100, "Pretrain/Step Time": 8.518373450264335} +{"Pretrain/Learning Rate": 4.9048577233706264e-05, "Pretrain/Loss": 2.118105411529541, "Pretrain/Loss (Raw)": 2.2258899211883545, "Pretrain/Step": 1101, "Pretrain/Step Time": 8.516153655946255} +{"Pretrain/Learning Rate": 4.9046255990301965e-05, "Pretrain/Loss": 2.1184983253479004, "Pretrain/Loss (Raw)": 2.1432859897613525, "Pretrain/Step": 1102, "Pretrain/Step Time": 8.507691053673625} +{"Pretrain/Learning Rate": 4.904393197377012e-05, "Pretrain/Loss": 2.118987560272217, "Pretrain/Loss (Raw)": 2.1427574157714844, "Pretrain/Step": 1103, "Pretrain/Step Time": 8.510017929598689} +{"Pretrain/Learning Rate": 4.9041605184378746e-05, "Pretrain/Loss": 2.120913028717041, "Pretrain/Loss (Raw)": 2.2112457752227783, "Pretrain/Step": 1104, "Pretrain/Step Time": 8.513107782229781} +{"Pretrain/Learning Rate": 4.903927562239617e-05, "Pretrain/Loss": 2.123059034347534, "Pretrain/Loss (Raw)": 2.163935899734497, "Pretrain/Step": 1105, "Pretrain/Step Time": 8.519851634278893} +{"Pretrain/Learning Rate": 4.9036943288091066e-05, "Pretrain/Loss": 2.1229801177978516, "Pretrain/Loss (Raw)": 2.2059035301208496, "Pretrain/Step": 1106, "Pretrain/Step Time": 8.520840333774686} +{"Pretrain/Learning Rate": 4.903460818173238e-05, "Pretrain/Loss": 2.1212692260742188, "Pretrain/Loss (Raw)": 1.964612364768982, "Pretrain/Step": 1107, "Pretrain/Step Time": 8.519917218014598} +{"Pretrain/Learning Rate": 4.9032270303589435e-05, "Pretrain/Loss": 2.118826389312744, "Pretrain/Loss (Raw)": 2.004323959350586, "Pretrain/Step": 1108, "Pretrain/Step Time": 8.514689171686769} +{"Pretrain/Learning Rate": 4.9029929653931826e-05, "Pretrain/Loss": 2.1178524494171143, "Pretrain/Loss (Raw)": 1.9490540027618408, "Pretrain/Step": 1109, "Pretrain/Step Time": 8.513795899227262} +{"Pretrain/Learning Rate": 4.90275862330295e-05, "Pretrain/Loss": 2.1172914505004883, "Pretrain/Loss (Raw)": 1.9910038709640503, "Pretrain/Step": 1110, "Pretrain/Step Time": 8.509478213265538} +{"Pretrain/Learning Rate": 4.902524004115271e-05, "Pretrain/Loss": 2.115845203399658, "Pretrain/Loss (Raw)": 1.9687094688415527, "Pretrain/Step": 1111, "Pretrain/Step Time": 8.515601022168994} +{"Pretrain/Learning Rate": 4.902289107857202e-05, "Pretrain/Loss": 2.1146957874298096, "Pretrain/Loss (Raw)": 1.9800026416778564, "Pretrain/Step": 1112, "Pretrain/Step Time": 8.517102118581533} +{"Pretrain/Learning Rate": 4.9020539345558335e-05, "Pretrain/Loss": 2.114288806915283, "Pretrain/Loss (Raw)": 1.9864410161972046, "Pretrain/Step": 1113, "Pretrain/Step Time": 8.517589190974832} +{"Pretrain/Learning Rate": 4.9018184842382866e-05, "Pretrain/Loss": 2.1132099628448486, "Pretrain/Loss (Raw)": 2.009737014770508, "Pretrain/Step": 1114, "Pretrain/Step Time": 8.509618086740375} +{"Pretrain/Learning Rate": 4.901582756931715e-05, "Pretrain/Loss": 2.1106812953948975, "Pretrain/Loss (Raw)": 2.059565544128418, "Pretrain/Step": 1115, "Pretrain/Step Time": 8.507944069802761} +{"Pretrain/Learning Rate": 4.901346752663302e-05, "Pretrain/Loss": 2.1121268272399902, "Pretrain/Loss (Raw)": 2.1881344318389893, "Pretrain/Step": 1116, "Pretrain/Step Time": 8.515688439831138} +{"Pretrain/Learning Rate": 4.9011104714602666e-05, "Pretrain/Loss": 2.112186908721924, "Pretrain/Loss (Raw)": 2.110276937484741, "Pretrain/Step": 1117, "Pretrain/Step Time": 8.521610725671053} +{"Pretrain/Learning Rate": 4.900873913349857e-05, "Pretrain/Loss": 2.1161177158355713, "Pretrain/Loss (Raw)": 2.636706829071045, "Pretrain/Step": 1118, "Pretrain/Step Time": 8.52685696259141} +{"Pretrain/Learning Rate": 4.9006370783593544e-05, "Pretrain/Loss": 2.11584734916687, "Pretrain/Loss (Raw)": 2.080859422683716, "Pretrain/Step": 1119, "Pretrain/Step Time": 8.524966314435005} +{"Pretrain/Learning Rate": 4.900399966516073e-05, "Pretrain/Loss": 2.1159443855285645, "Pretrain/Loss (Raw)": 2.0653505325317383, "Pretrain/Step": 1120, "Pretrain/Step Time": 8.514818856492639} +{"Pretrain/Learning Rate": 4.900162577847355e-05, "Pretrain/Loss": 2.116971254348755, "Pretrain/Loss (Raw)": 2.221021890640259, "Pretrain/Step": 1121, "Pretrain/Step Time": 8.519604099914432} +{"Pretrain/Learning Rate": 4.899924912380579e-05, "Pretrain/Loss": 2.116337299346924, "Pretrain/Loss (Raw)": 1.9241596460342407, "Pretrain/Step": 1122, "Pretrain/Step Time": 8.525350274518132} +{"Pretrain/Learning Rate": 4.899686970143153e-05, "Pretrain/Loss": 2.117464542388916, "Pretrain/Loss (Raw)": 2.293104410171509, "Pretrain/Step": 1123, "Pretrain/Step Time": 8.525258155539632} +{"Pretrain/Learning Rate": 4.8994487511625184e-05, "Pretrain/Loss": 2.1149239540100098, "Pretrain/Loss (Raw)": 1.9267784357070923, "Pretrain/Step": 1124, "Pretrain/Step Time": 8.52212617918849} +{"Pretrain/Learning Rate": 4.899210255466147e-05, "Pretrain/Loss": 2.114452362060547, "Pretrain/Loss (Raw)": 2.1322195529937744, "Pretrain/Step": 1125, "Pretrain/Step Time": 8.524712443351746} +{"Pretrain/Learning Rate": 4.898971483081543e-05, "Pretrain/Loss": 2.115285873413086, "Pretrain/Loss (Raw)": 2.202566385269165, "Pretrain/Step": 1126, "Pretrain/Step Time": 8.513915473595262} +{"Pretrain/Learning Rate": 4.898732434036244e-05, "Pretrain/Loss": 2.1142959594726562, "Pretrain/Loss (Raw)": 2.2562146186828613, "Pretrain/Step": 1127, "Pretrain/Step Time": 8.512328919023275} +{"Pretrain/Learning Rate": 4.898493108357817e-05, "Pretrain/Loss": 2.114696741104126, "Pretrain/Loss (Raw)": 2.0561275482177734, "Pretrain/Step": 1128, "Pretrain/Step Time": 8.516724791377783} +{"Pretrain/Learning Rate": 4.898253506073863e-05, "Pretrain/Loss": 2.1119346618652344, "Pretrain/Loss (Raw)": 1.9513516426086426, "Pretrain/Step": 1129, "Pretrain/Step Time": 8.519008323550224} +{"Pretrain/Learning Rate": 4.8980136272120136e-05, "Pretrain/Loss": 2.1109988689422607, "Pretrain/Loss (Raw)": 2.0766489505767822, "Pretrain/Step": 1130, "Pretrain/Step Time": 8.519260125234723} +{"Pretrain/Learning Rate": 4.8977734717999326e-05, "Pretrain/Loss": 2.1115198135375977, "Pretrain/Loss (Raw)": 2.1126794815063477, "Pretrain/Step": 1131, "Pretrain/Step Time": 8.517201105132699} +{"Pretrain/Learning Rate": 4.8975330398653164e-05, "Pretrain/Loss": 2.11326265335083, "Pretrain/Loss (Raw)": 2.1814475059509277, "Pretrain/Step": 1132, "Pretrain/Step Time": 8.515827460214496} +{"Pretrain/Learning Rate": 4.8972923314358934e-05, "Pretrain/Loss": 2.112140655517578, "Pretrain/Loss (Raw)": 2.021543025970459, "Pretrain/Step": 1133, "Pretrain/Step Time": 8.514786647632718} +{"Pretrain/Learning Rate": 4.8970513465394206e-05, "Pretrain/Loss": 2.1120946407318115, "Pretrain/Loss (Raw)": 2.132554054260254, "Pretrain/Step": 1134, "Pretrain/Step Time": 8.521434513852} +{"Pretrain/Learning Rate": 4.896810085203692e-05, "Pretrain/Loss": 2.1126129627227783, "Pretrain/Loss (Raw)": 2.0441296100616455, "Pretrain/Step": 1135, "Pretrain/Step Time": 8.5173668731004} +{"Pretrain/Learning Rate": 4.896568547456531e-05, "Pretrain/Loss": 2.11098575592041, "Pretrain/Loss (Raw)": 1.9600533246994019, "Pretrain/Step": 1136, "Pretrain/Step Time": 8.519463919103146} +{"Pretrain/Learning Rate": 4.896326733325791e-05, "Pretrain/Loss": 2.1117758750915527, "Pretrain/Loss (Raw)": 2.0375688076019287, "Pretrain/Step": 1137, "Pretrain/Step Time": 8.511167034506798} +{"Pretrain/Learning Rate": 4.8960846428393615e-05, "Pretrain/Loss": 2.1089024543762207, "Pretrain/Loss (Raw)": 1.9761618375778198, "Pretrain/Step": 1138, "Pretrain/Step Time": 8.513053741306067} +{"Pretrain/Learning Rate": 4.8958422760251585e-05, "Pretrain/Loss": 2.1066012382507324, "Pretrain/Loss (Raw)": 2.007333993911743, "Pretrain/Step": 1139, "Pretrain/Step Time": 8.508927488699555} +{"Pretrain/Learning Rate": 4.8955996329111364e-05, "Pretrain/Loss": 2.1066110134124756, "Pretrain/Loss (Raw)": 2.167626142501831, "Pretrain/Step": 1140, "Pretrain/Step Time": 8.512738358229399} +{"Pretrain/Learning Rate": 4.895356713525275e-05, "Pretrain/Loss": 2.1067094802856445, "Pretrain/Loss (Raw)": 2.0559496879577637, "Pretrain/Step": 1141, "Pretrain/Step Time": 8.517247270792723} +{"Pretrain/Learning Rate": 4.895113517895591e-05, "Pretrain/Loss": 2.103858470916748, "Pretrain/Loss (Raw)": 2.2267327308654785, "Pretrain/Step": 1142, "Pretrain/Step Time": 8.520068060606718} +{"Pretrain/Learning Rate": 4.8948700460501294e-05, "Pretrain/Loss": 2.1021945476531982, "Pretrain/Loss (Raw)": 2.0782487392425537, "Pretrain/Step": 1143, "Pretrain/Step Time": 8.51635811664164} +{"Pretrain/Learning Rate": 4.8946262980169686e-05, "Pretrain/Loss": 2.10318660736084, "Pretrain/Loss (Raw)": 2.139331579208374, "Pretrain/Step": 1144, "Pretrain/Step Time": 8.509781807661057} +{"Pretrain/Learning Rate": 4.894382273824221e-05, "Pretrain/Loss": 2.1024770736694336, "Pretrain/Loss (Raw)": 2.224881410598755, "Pretrain/Step": 1145, "Pretrain/Step Time": 8.511127846315503} +{"Pretrain/Learning Rate": 4.894137973500025e-05, "Pretrain/Loss": 2.1009068489074707, "Pretrain/Loss (Raw)": 1.8651882410049438, "Pretrain/Step": 1146, "Pretrain/Step Time": 8.515945438295603} +{"Pretrain/Learning Rate": 4.893893397072558e-05, "Pretrain/Loss": 2.10088849067688, "Pretrain/Loss (Raw)": 2.0812137126922607, "Pretrain/Step": 1147, "Pretrain/Step Time": 8.517335746437311} +{"Pretrain/Learning Rate": 4.893648544570022e-05, "Pretrain/Loss": 2.100564956665039, "Pretrain/Loss (Raw)": 1.9890280961990356, "Pretrain/Step": 1148, "Pretrain/Step Time": 8.518908208236098} +{"Pretrain/Learning Rate": 4.893403416020658e-05, "Pretrain/Loss": 2.1005916595458984, "Pretrain/Loss (Raw)": 2.0242159366607666, "Pretrain/Step": 1149, "Pretrain/Step Time": 8.51556969806552} +{"Pretrain/Learning Rate": 4.893158011452734e-05, "Pretrain/Loss": 2.097731590270996, "Pretrain/Loss (Raw)": 1.7967753410339355, "Pretrain/Step": 1150, "Pretrain/Step Time": 8.511858209967613} +{"Pretrain/Learning Rate": 4.8929123308945505e-05, "Pretrain/Loss": 2.100013256072998, "Pretrain/Loss (Raw)": 2.150683879852295, "Pretrain/Step": 1151, "Pretrain/Step Time": 8.518858088180423} +{"Pretrain/Learning Rate": 4.8926663743744414e-05, "Pretrain/Loss": 2.09779953956604, "Pretrain/Loss (Raw)": 1.9206289052963257, "Pretrain/Step": 1152, "Pretrain/Step Time": 8.513731550425291} +{"Pretrain/Learning Rate": 4.892420141920772e-05, "Pretrain/Loss": 2.0952582359313965, "Pretrain/Loss (Raw)": 1.9521070718765259, "Pretrain/Step": 1153, "Pretrain/Step Time": 8.518933216109872} +{"Pretrain/Learning Rate": 4.8921736335619385e-05, "Pretrain/Loss": 2.0950465202331543, "Pretrain/Loss (Raw)": 2.197859287261963, "Pretrain/Step": 1154, "Pretrain/Step Time": 8.521171094849706} +{"Pretrain/Learning Rate": 4.8919268493263684e-05, "Pretrain/Loss": 2.0941929817199707, "Pretrain/Loss (Raw)": 2.0340001583099365, "Pretrain/Step": 1155, "Pretrain/Step Time": 8.517956105992198} +{"Pretrain/Learning Rate": 4.891679789242524e-05, "Pretrain/Loss": 2.096123456954956, "Pretrain/Loss (Raw)": 2.3490264415740967, "Pretrain/Step": 1156, "Pretrain/Step Time": 8.513165248557925} +{"Pretrain/Learning Rate": 4.891432453338895e-05, "Pretrain/Loss": 2.0956549644470215, "Pretrain/Loss (Raw)": 2.0627474784851074, "Pretrain/Step": 1157, "Pretrain/Step Time": 8.50917018018663} +{"Pretrain/Learning Rate": 4.8911848416440075e-05, "Pretrain/Loss": 2.0965704917907715, "Pretrain/Loss (Raw)": 2.0843372344970703, "Pretrain/Step": 1158, "Pretrain/Step Time": 8.514545314013958} +{"Pretrain/Learning Rate": 4.890936954186416e-05, "Pretrain/Loss": 2.09796404838562, "Pretrain/Loss (Raw)": 2.1662089824676514, "Pretrain/Step": 1159, "Pretrain/Step Time": 8.516147140413523} +{"Pretrain/Learning Rate": 4.890688790994709e-05, "Pretrain/Loss": 2.0977020263671875, "Pretrain/Loss (Raw)": 2.108362913131714, "Pretrain/Step": 1160, "Pretrain/Step Time": 8.517040874809027} +{"Pretrain/Learning Rate": 4.890440352097505e-05, "Pretrain/Loss": 2.0965542793273926, "Pretrain/Loss (Raw)": 2.0735769271850586, "Pretrain/Step": 1161, "Pretrain/Step Time": 8.51390734128654} +{"Pretrain/Learning Rate": 4.8901916375234556e-05, "Pretrain/Loss": 2.095705032348633, "Pretrain/Loss (Raw)": 1.9593970775604248, "Pretrain/Step": 1162, "Pretrain/Step Time": 8.517251003533602} +{"Pretrain/Learning Rate": 4.889942647301243e-05, "Pretrain/Loss": 2.0958266258239746, "Pretrain/Loss (Raw)": 2.0891802310943604, "Pretrain/Step": 1163, "Pretrain/Step Time": 8.506947731599212} +{"Pretrain/Learning Rate": 4.8896933814595834e-05, "Pretrain/Loss": 2.097095012664795, "Pretrain/Loss (Raw)": 2.120743989944458, "Pretrain/Step": 1164, "Pretrain/Step Time": 8.508531453087926} +{"Pretrain/Learning Rate": 4.8894438400272224e-05, "Pretrain/Loss": 2.097451686859131, "Pretrain/Loss (Raw)": 2.0897727012634277, "Pretrain/Step": 1165, "Pretrain/Step Time": 8.516957640647888} +{"Pretrain/Learning Rate": 4.889194023032938e-05, "Pretrain/Loss": 2.0975279808044434, "Pretrain/Loss (Raw)": 2.152165412902832, "Pretrain/Step": 1166, "Pretrain/Step Time": 8.520011017099023} +{"Pretrain/Learning Rate": 4.8889439305055406e-05, "Pretrain/Loss": 2.0954713821411133, "Pretrain/Loss (Raw)": 2.0222315788269043, "Pretrain/Step": 1167, "Pretrain/Step Time": 8.511511093005538} +{"Pretrain/Learning Rate": 4.8886935624738715e-05, "Pretrain/Loss": 2.0943946838378906, "Pretrain/Loss (Raw)": 2.0522217750549316, "Pretrain/Step": 1168, "Pretrain/Step Time": 8.50573942065239} +{"Pretrain/Learning Rate": 4.888442918966806e-05, "Pretrain/Loss": 2.0968711376190186, "Pretrain/Loss (Raw)": 2.331575870513916, "Pretrain/Step": 1169, "Pretrain/Step Time": 8.5076863206923} +{"Pretrain/Learning Rate": 4.888192000013248e-05, "Pretrain/Loss": 2.097994804382324, "Pretrain/Loss (Raw)": 2.2628023624420166, "Pretrain/Step": 1170, "Pretrain/Step Time": 8.511211056262255} +{"Pretrain/Learning Rate": 4.887940805642135e-05, "Pretrain/Loss": 2.0989151000976562, "Pretrain/Loss (Raw)": 2.0737802982330322, "Pretrain/Step": 1171, "Pretrain/Step Time": 8.513966083526611} +{"Pretrain/Learning Rate": 4.887689335882436e-05, "Pretrain/Loss": 2.0975005626678467, "Pretrain/Loss (Raw)": 1.9853488206863403, "Pretrain/Step": 1172, "Pretrain/Step Time": 8.511605093255639} +{"Pretrain/Learning Rate": 4.8874375907631506e-05, "Pretrain/Loss": 2.10025954246521, "Pretrain/Loss (Raw)": 2.389183759689331, "Pretrain/Step": 1173, "Pretrain/Step Time": 8.505899639800191} +{"Pretrain/Learning Rate": 4.887185570313314e-05, "Pretrain/Loss": 2.101806163787842, "Pretrain/Loss (Raw)": 2.100358009338379, "Pretrain/Step": 1174, "Pretrain/Step Time": 8.509114488959312} +{"Pretrain/Learning Rate": 4.886933274561988e-05, "Pretrain/Loss": 2.0992746353149414, "Pretrain/Loss (Raw)": 1.9217936992645264, "Pretrain/Step": 1175, "Pretrain/Step Time": 8.512411169707775} +{"Pretrain/Learning Rate": 4.886680703538269e-05, "Pretrain/Loss": 2.0994694232940674, "Pretrain/Loss (Raw)": 2.0625205039978027, "Pretrain/Step": 1176, "Pretrain/Step Time": 8.515202017500997} +{"Pretrain/Learning Rate": 4.886427857271284e-05, "Pretrain/Loss": 2.0995635986328125, "Pretrain/Loss (Raw)": 2.1983439922332764, "Pretrain/Step": 1177, "Pretrain/Step Time": 8.518491256982088} +{"Pretrain/Learning Rate": 4.886174735790194e-05, "Pretrain/Loss": 2.099841594696045, "Pretrain/Loss (Raw)": 2.06606388092041, "Pretrain/Step": 1178, "Pretrain/Step Time": 8.51763223297894} +{"Pretrain/Learning Rate": 4.88592133912419e-05, "Pretrain/Loss": 2.102682590484619, "Pretrain/Loss (Raw)": 2.1988449096679688, "Pretrain/Step": 1179, "Pretrain/Step Time": 8.51443942822516} +{"Pretrain/Learning Rate": 4.885667667302494e-05, "Pretrain/Loss": 2.103555679321289, "Pretrain/Loss (Raw)": 2.1190919876098633, "Pretrain/Step": 1180, "Pretrain/Step Time": 8.506966318935156} +{"Pretrain/Learning Rate": 4.88541372035436e-05, "Pretrain/Loss": 2.102815628051758, "Pretrain/Loss (Raw)": 2.1861283779144287, "Pretrain/Step": 1181, "Pretrain/Step Time": 8.513323176652193} +{"Pretrain/Learning Rate": 4.885159498309077e-05, "Pretrain/Loss": 2.1056864261627197, "Pretrain/Loss (Raw)": 2.332932949066162, "Pretrain/Step": 1182, "Pretrain/Step Time": 8.516009701415896} +{"Pretrain/Learning Rate": 4.884905001195961e-05, "Pretrain/Loss": 2.1087143421173096, "Pretrain/Loss (Raw)": 2.6043930053710938, "Pretrain/Step": 1183, "Pretrain/Step Time": 8.525442836806178} +{"Pretrain/Learning Rate": 4.884650229044361e-05, "Pretrain/Loss": 2.110527276992798, "Pretrain/Loss (Raw)": 2.065221071243286, "Pretrain/Step": 1184, "Pretrain/Step Time": 8.521713623777032} +{"Pretrain/Learning Rate": 4.884395181883661e-05, "Pretrain/Loss": 2.110896587371826, "Pretrain/Loss (Raw)": 2.1743083000183105, "Pretrain/Step": 1185, "Pretrain/Step Time": 8.513563647866249} +{"Pretrain/Learning Rate": 4.8841398597432725e-05, "Pretrain/Loss": 2.110332489013672, "Pretrain/Loss (Raw)": 1.9976056814193726, "Pretrain/Step": 1186, "Pretrain/Step Time": 8.511399064213037} +{"Pretrain/Learning Rate": 4.883884262652641e-05, "Pretrain/Loss": 2.111173391342163, "Pretrain/Loss (Raw)": 2.14729380607605, "Pretrain/Step": 1187, "Pretrain/Step Time": 8.516288163140416} +{"Pretrain/Learning Rate": 4.883628390641243e-05, "Pretrain/Loss": 2.1072771549224854, "Pretrain/Loss (Raw)": 1.6417455673217773, "Pretrain/Step": 1188, "Pretrain/Step Time": 8.521230457350612} +{"Pretrain/Learning Rate": 4.883372243738588e-05, "Pretrain/Loss": 2.108132839202881, "Pretrain/Loss (Raw)": 2.2784135341644287, "Pretrain/Step": 1189, "Pretrain/Step Time": 8.52528777346015} +{"Pretrain/Learning Rate": 4.883115821974213e-05, "Pretrain/Loss": 2.1055688858032227, "Pretrain/Loss (Raw)": 1.6698963642120361, "Pretrain/Step": 1190, "Pretrain/Step Time": 8.522247985005379} +{"Pretrain/Learning Rate": 4.8828591253776937e-05, "Pretrain/Loss": 2.1047348976135254, "Pretrain/Loss (Raw)": 2.012319803237915, "Pretrain/Step": 1191, "Pretrain/Step Time": 8.507983913645148} +{"Pretrain/Learning Rate": 4.88260215397863e-05, "Pretrain/Loss": 2.106489658355713, "Pretrain/Loss (Raw)": 2.145681619644165, "Pretrain/Step": 1192, "Pretrain/Step Time": 8.508656395599246} +{"Pretrain/Learning Rate": 4.882344907806659e-05, "Pretrain/Loss": 2.102780342102051, "Pretrain/Loss (Raw)": 1.9598629474639893, "Pretrain/Step": 1193, "Pretrain/Step Time": 8.507231695577502} +{"Pretrain/Learning Rate": 4.882087386891448e-05, "Pretrain/Loss": 2.103039264678955, "Pretrain/Loss (Raw)": 2.0563008785247803, "Pretrain/Step": 1194, "Pretrain/Step Time": 8.519152389839292} +{"Pretrain/Learning Rate": 4.8818295912626955e-05, "Pretrain/Loss": 2.102599620819092, "Pretrain/Loss (Raw)": 2.110485315322876, "Pretrain/Step": 1195, "Pretrain/Step Time": 8.522971956059337} +{"Pretrain/Learning Rate": 4.88157152095013e-05, "Pretrain/Loss": 2.101405620574951, "Pretrain/Loss (Raw)": 1.8868401050567627, "Pretrain/Step": 1196, "Pretrain/Step Time": 8.518379304558039} +{"Pretrain/Learning Rate": 4.881313175983515e-05, "Pretrain/Loss": 2.1061534881591797, "Pretrain/Loss (Raw)": 2.707751989364624, "Pretrain/Step": 1197, "Pretrain/Step Time": 8.51240867562592} +{"Pretrain/Learning Rate": 4.881054556392642e-05, "Pretrain/Loss": 2.106776714324951, "Pretrain/Loss (Raw)": 2.0594000816345215, "Pretrain/Step": 1198, "Pretrain/Step Time": 8.511384854093194} +{"Pretrain/Learning Rate": 4.8807956622073394e-05, "Pretrain/Loss": 2.11006760597229, "Pretrain/Loss (Raw)": 2.512739896774292, "Pretrain/Step": 1199, "Pretrain/Step Time": 8.510655926540494} +{"Pretrain/Learning Rate": 4.880536493457461e-05, "Pretrain/Loss": 2.110044240951538, "Pretrain/Loss (Raw)": 2.1698179244995117, "Pretrain/Step": 1200, "Pretrain/Step Time": 8.514119066298008} +{"Pretrain/Learning Rate": 4.880277050172897e-05, "Pretrain/Loss": 2.1089744567871094, "Pretrain/Loss (Raw)": 1.8873158693313599, "Pretrain/Step": 1201, "Pretrain/Step Time": 8.523329405114055} +{"Pretrain/Learning Rate": 4.880017332383567e-05, "Pretrain/Loss": 2.1113290786743164, "Pretrain/Loss (Raw)": 2.1496503353118896, "Pretrain/Step": 1202, "Pretrain/Step Time": 8.521701704710722} +{"Pretrain/Learning Rate": 4.879757340119425e-05, "Pretrain/Loss": 2.1116321086883545, "Pretrain/Loss (Raw)": 2.1024415493011475, "Pretrain/Step": 1203, "Pretrain/Step Time": 8.516230883076787} +{"Pretrain/Learning Rate": 4.879497073410451e-05, "Pretrain/Loss": 2.111189365386963, "Pretrain/Loss (Raw)": 2.122244119644165, "Pretrain/Step": 1204, "Pretrain/Step Time": 8.514066418632865} +{"Pretrain/Learning Rate": 4.8792365322866626e-05, "Pretrain/Loss": 2.112247943878174, "Pretrain/Loss (Raw)": 2.1401219367980957, "Pretrain/Step": 1205, "Pretrain/Step Time": 8.513569323346019} +{"Pretrain/Learning Rate": 4.878975716778106e-05, "Pretrain/Loss": 2.1122748851776123, "Pretrain/Loss (Raw)": 2.2222506999969482, "Pretrain/Step": 1206, "Pretrain/Step Time": 8.519278187304735} +{"Pretrain/Learning Rate": 4.878714626914859e-05, "Pretrain/Loss": 2.111945629119873, "Pretrain/Loss (Raw)": 2.1966135501861572, "Pretrain/Step": 1207, "Pretrain/Step Time": 8.521663641557097} +{"Pretrain/Learning Rate": 4.878453262727033e-05, "Pretrain/Loss": 2.1106414794921875, "Pretrain/Loss (Raw)": 2.0924410820007324, "Pretrain/Step": 1208, "Pretrain/Step Time": 8.521659454330802} +{"Pretrain/Learning Rate": 4.878191624244769e-05, "Pretrain/Loss": 2.1122591495513916, "Pretrain/Loss (Raw)": 2.2574527263641357, "Pretrain/Step": 1209, "Pretrain/Step Time": 8.517591772601008} +{"Pretrain/Learning Rate": 4.8779297114982406e-05, "Pretrain/Loss": 2.112832546234131, "Pretrain/Loss (Raw)": 2.1524853706359863, "Pretrain/Step": 1210, "Pretrain/Step Time": 8.50991227477789} +{"Pretrain/Learning Rate": 4.877667524517652e-05, "Pretrain/Loss": 2.113333225250244, "Pretrain/Loss (Raw)": 2.167839288711548, "Pretrain/Step": 1211, "Pretrain/Step Time": 8.517888281494379} +{"Pretrain/Learning Rate": 4.877405063333241e-05, "Pretrain/Loss": 2.114494800567627, "Pretrain/Loss (Raw)": 2.1211695671081543, "Pretrain/Step": 1212, "Pretrain/Step Time": 8.518019398674369} +{"Pretrain/Learning Rate": 4.877142327975276e-05, "Pretrain/Loss": 2.113332986831665, "Pretrain/Loss (Raw)": 2.0819621086120605, "Pretrain/Step": 1213, "Pretrain/Step Time": 8.520978216081858} +{"Pretrain/Learning Rate": 4.8768793184740556e-05, "Pretrain/Loss": 2.1128854751586914, "Pretrain/Loss (Raw)": 2.0823748111724854, "Pretrain/Step": 1214, "Pretrain/Step Time": 8.518070008605719} +{"Pretrain/Learning Rate": 4.8766160348599125e-05, "Pretrain/Loss": 2.112966775894165, "Pretrain/Loss (Raw)": 2.1593875885009766, "Pretrain/Step": 1215, "Pretrain/Step Time": 8.508385283872485} +{"Pretrain/Learning Rate": 4.876352477163209e-05, "Pretrain/Loss": 2.109990119934082, "Pretrain/Loss (Raw)": 1.8437371253967285, "Pretrain/Step": 1216, "Pretrain/Step Time": 8.501111960038543} +{"Pretrain/Learning Rate": 4.8760886454143394e-05, "Pretrain/Loss": 2.1099538803100586, "Pretrain/Loss (Raw)": 2.1387970447540283, "Pretrain/Step": 1217, "Pretrain/Step Time": 8.50889266654849} +{"Pretrain/Learning Rate": 4.875824539643731e-05, "Pretrain/Loss": 2.1098432540893555, "Pretrain/Loss (Raw)": 2.210285186767578, "Pretrain/Step": 1218, "Pretrain/Step Time": 8.50721101090312} +{"Pretrain/Learning Rate": 4.8755601598818427e-05, "Pretrain/Loss": 2.1102612018585205, "Pretrain/Loss (Raw)": 2.0845394134521484, "Pretrain/Step": 1219, "Pretrain/Step Time": 8.509796384721994} +{"Pretrain/Learning Rate": 4.875295506159161e-05, "Pretrain/Loss": 2.109175205230713, "Pretrain/Loss (Raw)": 2.111175775527954, "Pretrain/Step": 1220, "Pretrain/Step Time": 8.511339221149683} +{"Pretrain/Learning Rate": 4.87503057850621e-05, "Pretrain/Loss": 2.1096415519714355, "Pretrain/Loss (Raw)": 2.0620763301849365, "Pretrain/Step": 1221, "Pretrain/Step Time": 8.504426762461662} +{"Pretrain/Learning Rate": 4.874765376953541e-05, "Pretrain/Loss": 2.1065032482147217, "Pretrain/Loss (Raw)": 2.0230143070220947, "Pretrain/Step": 1222, "Pretrain/Step Time": 8.502905694767833} +{"Pretrain/Learning Rate": 4.874499901531737e-05, "Pretrain/Loss": 2.106398105621338, "Pretrain/Loss (Raw)": 2.152019739151001, "Pretrain/Step": 1223, "Pretrain/Step Time": 8.51501401886344} +{"Pretrain/Learning Rate": 4.874234152271418e-05, "Pretrain/Loss": 2.105983257293701, "Pretrain/Loss (Raw)": 2.157341957092285, "Pretrain/Step": 1224, "Pretrain/Step Time": 8.515544731169939} +{"Pretrain/Learning Rate": 4.8739681292032266e-05, "Pretrain/Loss": 2.1085433959960938, "Pretrain/Loss (Raw)": 2.2692041397094727, "Pretrain/Step": 1225, "Pretrain/Step Time": 8.512489339336753} +{"Pretrain/Learning Rate": 4.8737018323578445e-05, "Pretrain/Loss": 2.1092681884765625, "Pretrain/Loss (Raw)": 2.177659273147583, "Pretrain/Step": 1226, "Pretrain/Step Time": 8.50838765874505} +{"Pretrain/Learning Rate": 4.873435261765982e-05, "Pretrain/Loss": 2.108471393585205, "Pretrain/Loss (Raw)": 2.1323161125183105, "Pretrain/Step": 1227, "Pretrain/Step Time": 8.51093484647572} +{"Pretrain/Learning Rate": 4.873168417458381e-05, "Pretrain/Loss": 2.1059796810150146, "Pretrain/Loss (Raw)": 2.0027449131011963, "Pretrain/Step": 1228, "Pretrain/Step Time": 8.510374944657087} +{"Pretrain/Learning Rate": 4.8729012994658166e-05, "Pretrain/Loss": 2.1055991649627686, "Pretrain/Loss (Raw)": 2.1771650314331055, "Pretrain/Step": 1229, "Pretrain/Step Time": 8.51381897367537} +{"Pretrain/Learning Rate": 4.8726339078190914e-05, "Pretrain/Loss": 2.106326103210449, "Pretrain/Loss (Raw)": 2.2363452911376953, "Pretrain/Step": 1230, "Pretrain/Step Time": 8.521092122420669} +{"Pretrain/Learning Rate": 4.872366242549044e-05, "Pretrain/Loss": 2.106132984161377, "Pretrain/Loss (Raw)": 2.118042230606079, "Pretrain/Step": 1231, "Pretrain/Step Time": 8.515654722228646} +{"Pretrain/Learning Rate": 4.872098303686543e-05, "Pretrain/Loss": 2.1033177375793457, "Pretrain/Loss (Raw)": 1.8508950471878052, "Pretrain/Step": 1232, "Pretrain/Step Time": 8.512072106823325} +{"Pretrain/Learning Rate": 4.871830091262488e-05, "Pretrain/Loss": 2.102196216583252, "Pretrain/Loss (Raw)": 2.0203824043273926, "Pretrain/Step": 1233, "Pretrain/Step Time": 8.504391364753246} +{"Pretrain/Learning Rate": 4.8715616053078095e-05, "Pretrain/Loss": 2.1024363040924072, "Pretrain/Loss (Raw)": 2.2366137504577637, "Pretrain/Step": 1234, "Pretrain/Step Time": 8.509143212810159} +{"Pretrain/Learning Rate": 4.871292845853472e-05, "Pretrain/Loss": 2.1049270629882812, "Pretrain/Loss (Raw)": 2.283407211303711, "Pretrain/Step": 1235, "Pretrain/Step Time": 8.51391188800335} +{"Pretrain/Learning Rate": 4.87102381293047e-05, "Pretrain/Loss": 2.1065032482147217, "Pretrain/Loss (Raw)": 2.206099033355713, "Pretrain/Step": 1236, "Pretrain/Step Time": 8.51357471011579} +{"Pretrain/Learning Rate": 4.870754506569829e-05, "Pretrain/Loss": 2.1065220832824707, "Pretrain/Loss (Raw)": 1.9514946937561035, "Pretrain/Step": 1237, "Pretrain/Step Time": 8.513706089928746} +{"Pretrain/Learning Rate": 4.870484926802606e-05, "Pretrain/Loss": 2.1087400913238525, "Pretrain/Loss (Raw)": 2.274902582168579, "Pretrain/Step": 1238, "Pretrain/Step Time": 8.513641877099872} +{"Pretrain/Learning Rate": 4.8702150736598925e-05, "Pretrain/Loss": 2.109984874725342, "Pretrain/Loss (Raw)": 2.128028631210327, "Pretrain/Step": 1239, "Pretrain/Step Time": 8.505414070561528} +{"Pretrain/Learning Rate": 4.8699449471728075e-05, "Pretrain/Loss": 2.109039306640625, "Pretrain/Loss (Raw)": 1.858965516090393, "Pretrain/Step": 1240, "Pretrain/Step Time": 8.500681765377522} +{"Pretrain/Learning Rate": 4.869674547372504e-05, "Pretrain/Loss": 2.1102395057678223, "Pretrain/Loss (Raw)": 2.1400816440582275, "Pretrain/Step": 1241, "Pretrain/Step Time": 8.512697417289019} +{"Pretrain/Learning Rate": 4.8694038742901646e-05, "Pretrain/Loss": 2.1097989082336426, "Pretrain/Loss (Raw)": 1.9533518552780151, "Pretrain/Step": 1242, "Pretrain/Step Time": 8.51325642876327} +{"Pretrain/Learning Rate": 4.869132927957007e-05, "Pretrain/Loss": 2.1119513511657715, "Pretrain/Loss (Raw)": 2.335069417953491, "Pretrain/Step": 1243, "Pretrain/Step Time": 8.514142964035273} +{"Pretrain/Learning Rate": 4.868861708404275e-05, "Pretrain/Loss": 2.111884593963623, "Pretrain/Loss (Raw)": 2.1795835494995117, "Pretrain/Step": 1244, "Pretrain/Step Time": 8.508693126961589} +{"Pretrain/Learning Rate": 4.868590215663248e-05, "Pretrain/Loss": 2.1121327877044678, "Pretrain/Loss (Raw)": 2.14202880859375, "Pretrain/Step": 1245, "Pretrain/Step Time": 8.502082698047161} +{"Pretrain/Learning Rate": 4.8683184497652366e-05, "Pretrain/Loss": 2.1072170734405518, "Pretrain/Loss (Raw)": 2.0075058937072754, "Pretrain/Step": 1246, "Pretrain/Step Time": 8.504387769848108} +{"Pretrain/Learning Rate": 4.868046410741582e-05, "Pretrain/Loss": 2.106241464614868, "Pretrain/Loss (Raw)": 1.9559663534164429, "Pretrain/Step": 1247, "Pretrain/Step Time": 8.504165928810835} +{"Pretrain/Learning Rate": 4.867774098623657e-05, "Pretrain/Loss": 2.1071319580078125, "Pretrain/Loss (Raw)": 2.179366111755371, "Pretrain/Step": 1248, "Pretrain/Step Time": 8.508910043165088} +{"Pretrain/Learning Rate": 4.8675015134428654e-05, "Pretrain/Loss": 2.1062161922454834, "Pretrain/Loss (Raw)": 2.1037890911102295, "Pretrain/Step": 1249, "Pretrain/Step Time": 8.502832178026438} +{"Pretrain/Learning Rate": 4.867228655230643e-05, "Pretrain/Loss": 2.1077566146850586, "Pretrain/Loss (Raw)": 2.1213231086730957, "Pretrain/Step": 1250, "Pretrain/Step Time": 8.496524130925536} +{"Pretrain/Learning Rate": 4.866955524018457e-05, "Pretrain/Loss": 2.1051244735717773, "Pretrain/Loss (Raw)": 1.956196665763855, "Pretrain/Step": 1251, "Pretrain/Step Time": 8.495489165186882} +{"Pretrain/Learning Rate": 4.866682119837807e-05, "Pretrain/Loss": 2.106123447418213, "Pretrain/Loss (Raw)": 2.0546183586120605, "Pretrain/Step": 1252, "Pretrain/Step Time": 8.504251202568412} +{"Pretrain/Learning Rate": 4.866408442720223e-05, "Pretrain/Loss": 2.1062331199645996, "Pretrain/Loss (Raw)": 2.1462929248809814, "Pretrain/Step": 1253, "Pretrain/Step Time": 8.507023867219687} +{"Pretrain/Learning Rate": 4.8661344926972666e-05, "Pretrain/Loss": 2.105628252029419, "Pretrain/Loss (Raw)": 2.1251413822174072, "Pretrain/Step": 1254, "Pretrain/Step Time": 8.507603146135807} +{"Pretrain/Learning Rate": 4.8658602698005294e-05, "Pretrain/Loss": 2.1041955947875977, "Pretrain/Loss (Raw)": 2.07281231880188, "Pretrain/Step": 1255, "Pretrain/Step Time": 8.507549814879894} +{"Pretrain/Learning Rate": 4.8655857740616395e-05, "Pretrain/Loss": 2.104145050048828, "Pretrain/Loss (Raw)": 2.0496551990509033, "Pretrain/Step": 1256, "Pretrain/Step Time": 8.498358642682433} +{"Pretrain/Learning Rate": 4.8653110055122496e-05, "Pretrain/Loss": 2.104403018951416, "Pretrain/Loss (Raw)": 1.9843826293945312, "Pretrain/Step": 1257, "Pretrain/Step Time": 8.494487533345819} +{"Pretrain/Learning Rate": 4.8650359641840495e-05, "Pretrain/Loss": 2.10440731048584, "Pretrain/Loss (Raw)": 2.0772039890289307, "Pretrain/Step": 1258, "Pretrain/Step Time": 8.501342356204987} +{"Pretrain/Learning Rate": 4.864760650108758e-05, "Pretrain/Loss": 2.1046359539031982, "Pretrain/Loss (Raw)": 2.1419568061828613, "Pretrain/Step": 1259, "Pretrain/Step Time": 8.50034206174314} +{"Pretrain/Learning Rate": 4.864485063318125e-05, "Pretrain/Loss": 2.104177951812744, "Pretrain/Loss (Raw)": 2.122797966003418, "Pretrain/Step": 1260, "Pretrain/Step Time": 8.50112940184772} +{"Pretrain/Learning Rate": 4.864209203843932e-05, "Pretrain/Loss": 2.1027722358703613, "Pretrain/Loss (Raw)": 1.8416378498077393, "Pretrain/Step": 1261, "Pretrain/Step Time": 8.500475835055113} +{"Pretrain/Learning Rate": 4.8639330717179946e-05, "Pretrain/Loss": 2.1029834747314453, "Pretrain/Loss (Raw)": 2.1596004962921143, "Pretrain/Step": 1262, "Pretrain/Step Time": 8.493307692930102} +{"Pretrain/Learning Rate": 4.863656666972154e-05, "Pretrain/Loss": 2.1023478507995605, "Pretrain/Loss (Raw)": 1.9627398252487183, "Pretrain/Step": 1263, "Pretrain/Step Time": 8.495242336764932} +{"Pretrain/Learning Rate": 4.86337998963829e-05, "Pretrain/Loss": 2.1039223670959473, "Pretrain/Loss (Raw)": 2.161606788635254, "Pretrain/Step": 1264, "Pretrain/Step Time": 8.498696975409985} +{"Pretrain/Learning Rate": 4.863103039748309e-05, "Pretrain/Loss": 2.1044678688049316, "Pretrain/Loss (Raw)": 2.107412338256836, "Pretrain/Step": 1265, "Pretrain/Step Time": 8.506632393226027} +{"Pretrain/Learning Rate": 4.86282581733415e-05, "Pretrain/Loss": 2.1061878204345703, "Pretrain/Loss (Raw)": 2.196279287338257, "Pretrain/Step": 1266, "Pretrain/Step Time": 8.508557071909308} +{"Pretrain/Learning Rate": 4.8625483224277835e-05, "Pretrain/Loss": 2.107693672180176, "Pretrain/Loss (Raw)": 2.2000787258148193, "Pretrain/Step": 1267, "Pretrain/Step Time": 8.50981061346829} +{"Pretrain/Learning Rate": 4.8622705550612126e-05, "Pretrain/Loss": 2.1067471504211426, "Pretrain/Loss (Raw)": 2.046476125717163, "Pretrain/Step": 1268, "Pretrain/Step Time": 8.505819834768772} +{"Pretrain/Learning Rate": 4.861992515266469e-05, "Pretrain/Loss": 2.106127977371216, "Pretrain/Loss (Raw)": 1.9767060279846191, "Pretrain/Step": 1269, "Pretrain/Step Time": 8.49972864612937} +{"Pretrain/Learning Rate": 4.8617142030756194e-05, "Pretrain/Loss": 2.103954315185547, "Pretrain/Loss (Raw)": 1.9484866857528687, "Pretrain/Step": 1270, "Pretrain/Step Time": 8.510588120669127} +{"Pretrain/Learning Rate": 4.8614356185207575e-05, "Pretrain/Loss": 2.103383779525757, "Pretrain/Loss (Raw)": 2.0052363872528076, "Pretrain/Step": 1271, "Pretrain/Step Time": 8.511258849874139} +{"Pretrain/Learning Rate": 4.861156761634014e-05, "Pretrain/Loss": 2.1036500930786133, "Pretrain/Loss (Raw)": 2.1734306812286377, "Pretrain/Step": 1272, "Pretrain/Step Time": 8.513290433213115} +{"Pretrain/Learning Rate": 4.860877632447546e-05, "Pretrain/Loss": 2.1036217212677, "Pretrain/Loss (Raw)": 2.2212462425231934, "Pretrain/Step": 1273, "Pretrain/Step Time": 8.511342067271471} +{"Pretrain/Learning Rate": 4.8605982309935446e-05, "Pretrain/Loss": 2.1046221256256104, "Pretrain/Loss (Raw)": 1.993251919746399, "Pretrain/Step": 1274, "Pretrain/Step Time": 8.504590164870024} +{"Pretrain/Learning Rate": 4.860318557304232e-05, "Pretrain/Loss": 2.1052255630493164, "Pretrain/Loss (Raw)": 2.1584274768829346, "Pretrain/Step": 1275, "Pretrain/Step Time": 8.502819133922458} +{"Pretrain/Learning Rate": 4.860038611411861e-05, "Pretrain/Loss": 2.1062841415405273, "Pretrain/Loss (Raw)": 2.1245412826538086, "Pretrain/Step": 1276, "Pretrain/Step Time": 8.50782303698361} +{"Pretrain/Learning Rate": 4.8597583933487165e-05, "Pretrain/Loss": 2.1085124015808105, "Pretrain/Loss (Raw)": 2.309404134750366, "Pretrain/Step": 1277, "Pretrain/Step Time": 8.51502926275134} +{"Pretrain/Learning Rate": 4.859477903147115e-05, "Pretrain/Loss": 2.1102030277252197, "Pretrain/Loss (Raw)": 2.013211727142334, "Pretrain/Step": 1278, "Pretrain/Step Time": 8.514596071094275} +{"Pretrain/Learning Rate": 4.8591971408394034e-05, "Pretrain/Loss": 2.1095972061157227, "Pretrain/Loss (Raw)": 2.0731353759765625, "Pretrain/Step": 1279, "Pretrain/Step Time": 8.505974657833576} +{"Pretrain/Learning Rate": 4.85891610645796e-05, "Pretrain/Loss": 2.1123135089874268, "Pretrain/Loss (Raw)": 2.26831316947937, "Pretrain/Step": 1280, "Pretrain/Step Time": 8.506786974146962} +{"Pretrain/Learning Rate": 4.8586348000351956e-05, "Pretrain/Loss": 2.113483428955078, "Pretrain/Loss (Raw)": 2.1018640995025635, "Pretrain/Step": 1281, "Pretrain/Step Time": 8.504469271749258} +{"Pretrain/Learning Rate": 4.8583532216035524e-05, "Pretrain/Loss": 2.1137592792510986, "Pretrain/Loss (Raw)": 2.233147382736206, "Pretrain/Step": 1282, "Pretrain/Step Time": 8.509766023606062} +{"Pretrain/Learning Rate": 4.858071371195502e-05, "Pretrain/Loss": 2.114621639251709, "Pretrain/Loss (Raw)": 2.1443636417388916, "Pretrain/Step": 1283, "Pretrain/Step Time": 8.511373177170753} +{"Pretrain/Learning Rate": 4.8577892488435504e-05, "Pretrain/Loss": 2.1107943058013916, "Pretrain/Loss (Raw)": 1.8591721057891846, "Pretrain/Step": 1284, "Pretrain/Step Time": 8.51732386648655} +{"Pretrain/Learning Rate": 4.8575068545802316e-05, "Pretrain/Loss": 2.110882520675659, "Pretrain/Loss (Raw)": 2.0740063190460205, "Pretrain/Step": 1285, "Pretrain/Step Time": 8.514360714703798} +{"Pretrain/Learning Rate": 4.8572241884381145e-05, "Pretrain/Loss": 2.1107282638549805, "Pretrain/Loss (Raw)": 2.064588785171509, "Pretrain/Step": 1286, "Pretrain/Step Time": 8.505216471850872} +{"Pretrain/Learning Rate": 4.856941250449795e-05, "Pretrain/Loss": 2.113161087036133, "Pretrain/Loss (Raw)": 2.4776415824890137, "Pretrain/Step": 1287, "Pretrain/Step Time": 8.507914705201983} +{"Pretrain/Learning Rate": 4.8566580406479045e-05, "Pretrain/Loss": 2.1149749755859375, "Pretrain/Loss (Raw)": 2.3405354022979736, "Pretrain/Step": 1288, "Pretrain/Step Time": 8.507369503378868} +{"Pretrain/Learning Rate": 4.856374559065104e-05, "Pretrain/Loss": 2.114910840988159, "Pretrain/Loss (Raw)": 2.0653557777404785, "Pretrain/Step": 1289, "Pretrain/Step Time": 8.511388685554266} +{"Pretrain/Learning Rate": 4.856090805734086e-05, "Pretrain/Loss": 2.116891860961914, "Pretrain/Loss (Raw)": 2.212979793548584, "Pretrain/Step": 1290, "Pretrain/Step Time": 8.513109249994159} +{"Pretrain/Learning Rate": 4.855806780687574e-05, "Pretrain/Loss": 2.117499828338623, "Pretrain/Loss (Raw)": 2.166975498199463, "Pretrain/Step": 1291, "Pretrain/Step Time": 8.508769009262323} +{"Pretrain/Learning Rate": 4.8555224839583236e-05, "Pretrain/Loss": 2.118191719055176, "Pretrain/Loss (Raw)": 2.209352731704712, "Pretrain/Step": 1292, "Pretrain/Step Time": 8.504706904292107} +{"Pretrain/Learning Rate": 4.8552379155791194e-05, "Pretrain/Loss": 2.1175169944763184, "Pretrain/Loss (Raw)": 2.0033488273620605, "Pretrain/Step": 1293, "Pretrain/Step Time": 8.504132622852921} +{"Pretrain/Learning Rate": 4.854953075582782e-05, "Pretrain/Loss": 2.1165223121643066, "Pretrain/Loss (Raw)": 2.0249032974243164, "Pretrain/Step": 1294, "Pretrain/Step Time": 8.49809193983674} +{"Pretrain/Learning Rate": 4.854667964002158e-05, "Pretrain/Loss": 2.1159486770629883, "Pretrain/Loss (Raw)": 1.9487512111663818, "Pretrain/Step": 1295, "Pretrain/Step Time": 8.513483241200447} +{"Pretrain/Learning Rate": 4.8543825808701294e-05, "Pretrain/Loss": 2.1168293952941895, "Pretrain/Loss (Raw)": 2.1649765968322754, "Pretrain/Step": 1296, "Pretrain/Step Time": 8.520331455394626} +{"Pretrain/Learning Rate": 4.854096926219607e-05, "Pretrain/Loss": 2.1150825023651123, "Pretrain/Loss (Raw)": 2.1079752445220947, "Pretrain/Step": 1297, "Pretrain/Step Time": 8.516907874494791} +{"Pretrain/Learning Rate": 4.853811000083535e-05, "Pretrain/Loss": 2.1137285232543945, "Pretrain/Loss (Raw)": 2.0894834995269775, "Pretrain/Step": 1298, "Pretrain/Step Time": 8.510722320526838} +{"Pretrain/Learning Rate": 4.8535248024948854e-05, "Pretrain/Loss": 2.1131558418273926, "Pretrain/Loss (Raw)": 2.000490665435791, "Pretrain/Step": 1299, "Pretrain/Step Time": 8.509929107502103} +{"Pretrain/Learning Rate": 4.853238333486666e-05, "Pretrain/Loss": 2.114875555038452, "Pretrain/Loss (Raw)": 2.205484628677368, "Pretrain/Step": 1300, "Pretrain/Step Time": 8.516725201159716} +{"Pretrain/Learning Rate": 4.852951593091914e-05, "Pretrain/Loss": 2.1104729175567627, "Pretrain/Loss (Raw)": 1.8256149291992188, "Pretrain/Step": 1301, "Pretrain/Step Time": 8.514583135023713} +{"Pretrain/Learning Rate": 4.852664581343696e-05, "Pretrain/Loss": 2.1097326278686523, "Pretrain/Loss (Raw)": 2.005621910095215, "Pretrain/Step": 1302, "Pretrain/Step Time": 8.514752961695194} +{"Pretrain/Learning Rate": 4.852377298275113e-05, "Pretrain/Loss": 2.111100196838379, "Pretrain/Loss (Raw)": 2.09684681892395, "Pretrain/Step": 1303, "Pretrain/Step Time": 8.514474200084805} +{"Pretrain/Learning Rate": 4.852089743919295e-05, "Pretrain/Loss": 2.112185478210449, "Pretrain/Loss (Raw)": 2.2014260292053223, "Pretrain/Step": 1304, "Pretrain/Step Time": 8.513189436867833} +{"Pretrain/Learning Rate": 4.851801918309403e-05, "Pretrain/Loss": 2.1131484508514404, "Pretrain/Loss (Raw)": 2.3215909004211426, "Pretrain/Step": 1305, "Pretrain/Step Time": 8.513581644743681} +{"Pretrain/Learning Rate": 4.8515138214786335e-05, "Pretrain/Loss": 2.114183187484741, "Pretrain/Loss (Raw)": 2.1985318660736084, "Pretrain/Step": 1306, "Pretrain/Step Time": 8.517031893134117} +{"Pretrain/Learning Rate": 4.851225453460209e-05, "Pretrain/Loss": 2.113597869873047, "Pretrain/Loss (Raw)": 2.123908519744873, "Pretrain/Step": 1307, "Pretrain/Step Time": 8.518383216112852} +{"Pretrain/Learning Rate": 4.850936814287386e-05, "Pretrain/Loss": 2.1148526668548584, "Pretrain/Loss (Raw)": 2.2797367572784424, "Pretrain/Step": 1308, "Pretrain/Step Time": 8.524888413026929} +{"Pretrain/Learning Rate": 4.85064790399345e-05, "Pretrain/Loss": 2.114799976348877, "Pretrain/Loss (Raw)": 2.1793553829193115, "Pretrain/Step": 1309, "Pretrain/Step Time": 8.518036974593997} +{"Pretrain/Learning Rate": 4.850358722611723e-05, "Pretrain/Loss": 2.1126327514648438, "Pretrain/Loss (Raw)": 2.055555582046509, "Pretrain/Step": 1310, "Pretrain/Step Time": 8.517356179654598} +{"Pretrain/Learning Rate": 4.850069270175552e-05, "Pretrain/Loss": 2.1091508865356445, "Pretrain/Loss (Raw)": 2.158696174621582, "Pretrain/Step": 1311, "Pretrain/Step Time": 8.516028992831707} +{"Pretrain/Learning Rate": 4.849779546718319e-05, "Pretrain/Loss": 2.1084675788879395, "Pretrain/Loss (Raw)": 1.977731704711914, "Pretrain/Step": 1312, "Pretrain/Step Time": 8.520469294860959} +{"Pretrain/Learning Rate": 4.8494895522734364e-05, "Pretrain/Loss": 2.106978416442871, "Pretrain/Loss (Raw)": 1.9837087392807007, "Pretrain/Step": 1313, "Pretrain/Step Time": 8.524962842464447} +{"Pretrain/Learning Rate": 4.849199286874347e-05, "Pretrain/Loss": 2.1100199222564697, "Pretrain/Loss (Raw)": 2.386931896209717, "Pretrain/Step": 1314, "Pretrain/Step Time": 8.523715550079942} +{"Pretrain/Learning Rate": 4.8489087505545266e-05, "Pretrain/Loss": 2.108927011489868, "Pretrain/Loss (Raw)": 2.0073986053466797, "Pretrain/Step": 1315, "Pretrain/Step Time": 8.51899453997612} +{"Pretrain/Learning Rate": 4.84861794334748e-05, "Pretrain/Loss": 2.1147918701171875, "Pretrain/Loss (Raw)": 2.392443895339966, "Pretrain/Step": 1316, "Pretrain/Step Time": 8.508338678628206} +{"Pretrain/Learning Rate": 4.848326865286746e-05, "Pretrain/Loss": 2.113920211791992, "Pretrain/Loss (Raw)": 2.1668448448181152, "Pretrain/Step": 1317, "Pretrain/Step Time": 8.509147292003036} +{"Pretrain/Learning Rate": 4.848035516405892e-05, "Pretrain/Loss": 2.118086576461792, "Pretrain/Loss (Raw)": 2.203193426132202, "Pretrain/Step": 1318, "Pretrain/Step Time": 8.51083329692483} +{"Pretrain/Learning Rate": 4.847743896738517e-05, "Pretrain/Loss": 2.1187684535980225, "Pretrain/Loss (Raw)": 2.099592447280884, "Pretrain/Step": 1319, "Pretrain/Step Time": 8.51501426845789} +{"Pretrain/Learning Rate": 4.847452006318254e-05, "Pretrain/Loss": 2.120107650756836, "Pretrain/Loss (Raw)": 2.3170790672302246, "Pretrain/Step": 1320, "Pretrain/Step Time": 8.51410337164998} +{"Pretrain/Learning Rate": 4.8471598451787635e-05, "Pretrain/Loss": 2.120549201965332, "Pretrain/Loss (Raw)": 2.0163776874542236, "Pretrain/Step": 1321, "Pretrain/Step Time": 8.514146415516734} +{"Pretrain/Learning Rate": 4.8468674133537395e-05, "Pretrain/Loss": 2.1221203804016113, "Pretrain/Loss (Raw)": 2.257439374923706, "Pretrain/Step": 1322, "Pretrain/Step Time": 8.498982233926654} +{"Pretrain/Learning Rate": 4.846574710876907e-05, "Pretrain/Loss": 2.122032403945923, "Pretrain/Loss (Raw)": 2.099212884902954, "Pretrain/Step": 1323, "Pretrain/Step Time": 8.501366013661027} +{"Pretrain/Learning Rate": 4.846281737782021e-05, "Pretrain/Loss": 2.120793104171753, "Pretrain/Loss (Raw)": 1.7282370328903198, "Pretrain/Step": 1324, "Pretrain/Step Time": 8.508035635575652} +{"Pretrain/Learning Rate": 4.845988494102869e-05, "Pretrain/Loss": 2.115598678588867, "Pretrain/Loss (Raw)": 2.0428383350372314, "Pretrain/Step": 1325, "Pretrain/Step Time": 8.509067637845874} +{"Pretrain/Learning Rate": 4.845694979873269e-05, "Pretrain/Loss": 2.1135387420654297, "Pretrain/Loss (Raw)": 1.795737385749817, "Pretrain/Step": 1326, "Pretrain/Step Time": 8.510106047615409} +{"Pretrain/Learning Rate": 4.845401195127071e-05, "Pretrain/Loss": 2.111626148223877, "Pretrain/Loss (Raw)": 2.2679529190063477, "Pretrain/Step": 1327, "Pretrain/Step Time": 8.51541681587696} +{"Pretrain/Learning Rate": 4.845107139898155e-05, "Pretrain/Loss": 2.1098458766937256, "Pretrain/Loss (Raw)": 1.941893219947815, "Pretrain/Step": 1328, "Pretrain/Step Time": 8.510073851794004} +{"Pretrain/Learning Rate": 4.8448128142204334e-05, "Pretrain/Loss": 2.1121737957000732, "Pretrain/Loss (Raw)": 2.1852996349334717, "Pretrain/Step": 1329, "Pretrain/Step Time": 8.500320328399539} +{"Pretrain/Learning Rate": 4.8445182181278494e-05, "Pretrain/Loss": 2.1125659942626953, "Pretrain/Loss (Raw)": 2.199862480163574, "Pretrain/Step": 1330, "Pretrain/Step Time": 8.505497446283698} +{"Pretrain/Learning Rate": 4.8442233516543756e-05, "Pretrain/Loss": 2.1112194061279297, "Pretrain/Loss (Raw)": 1.9300930500030518, "Pretrain/Step": 1331, "Pretrain/Step Time": 8.503604600206017} +{"Pretrain/Learning Rate": 4.8439282148340195e-05, "Pretrain/Loss": 2.11240553855896, "Pretrain/Loss (Raw)": 2.2740395069122314, "Pretrain/Step": 1332, "Pretrain/Step Time": 8.509959118440747} +{"Pretrain/Learning Rate": 4.843632807700816e-05, "Pretrain/Loss": 2.1127805709838867, "Pretrain/Loss (Raw)": 2.1881401538848877, "Pretrain/Step": 1333, "Pretrain/Step Time": 8.506830539554358} +{"Pretrain/Learning Rate": 4.843337130288834e-05, "Pretrain/Loss": 2.112098217010498, "Pretrain/Loss (Raw)": 2.134913921356201, "Pretrain/Step": 1334, "Pretrain/Step Time": 8.500873686745763} +{"Pretrain/Learning Rate": 4.843041182632172e-05, "Pretrain/Loss": 2.1118505001068115, "Pretrain/Loss (Raw)": 2.1648967266082764, "Pretrain/Step": 1335, "Pretrain/Step Time": 8.500201031565666} +{"Pretrain/Learning Rate": 4.84274496476496e-05, "Pretrain/Loss": 2.1126298904418945, "Pretrain/Loss (Raw)": 2.1922264099121094, "Pretrain/Step": 1336, "Pretrain/Step Time": 8.501941218972206} +{"Pretrain/Learning Rate": 4.84244847672136e-05, "Pretrain/Loss": 2.1122190952301025, "Pretrain/Loss (Raw)": 2.204857587814331, "Pretrain/Step": 1337, "Pretrain/Step Time": 8.506996855139732} +{"Pretrain/Learning Rate": 4.842151718535563e-05, "Pretrain/Loss": 2.110731601715088, "Pretrain/Loss (Raw)": 1.962093710899353, "Pretrain/Step": 1338, "Pretrain/Step Time": 8.511726086959243} +{"Pretrain/Learning Rate": 4.841854690241793e-05, "Pretrain/Loss": 2.109804630279541, "Pretrain/Loss (Raw)": 2.049180030822754, "Pretrain/Step": 1339, "Pretrain/Step Time": 8.504349432885647} +{"Pretrain/Learning Rate": 4.841557391874304e-05, "Pretrain/Loss": 2.109114646911621, "Pretrain/Loss (Raw)": 2.032837390899658, "Pretrain/Step": 1340, "Pretrain/Step Time": 8.505498023703694} +{"Pretrain/Learning Rate": 4.8412598234673845e-05, "Pretrain/Loss": 2.1078386306762695, "Pretrain/Loss (Raw)": 1.9186456203460693, "Pretrain/Step": 1341, "Pretrain/Step Time": 8.507794616743922} +{"Pretrain/Learning Rate": 4.840961985055349e-05, "Pretrain/Loss": 2.1076297760009766, "Pretrain/Loss (Raw)": 2.0556321144104004, "Pretrain/Step": 1342, "Pretrain/Step Time": 8.511318014934659} +{"Pretrain/Learning Rate": 4.8406638766725464e-05, "Pretrain/Loss": 2.106720447540283, "Pretrain/Loss (Raw)": 2.0430095195770264, "Pretrain/Step": 1343, "Pretrain/Step Time": 8.514493618160486} +{"Pretrain/Learning Rate": 4.840365498353357e-05, "Pretrain/Loss": 2.107680559158325, "Pretrain/Loss (Raw)": 1.9666005373001099, "Pretrain/Step": 1344, "Pretrain/Step Time": 8.515618208795786} +{"Pretrain/Learning Rate": 4.840066850132189e-05, "Pretrain/Loss": 2.1061506271362305, "Pretrain/Loss (Raw)": 1.9429727792739868, "Pretrain/Step": 1345, "Pretrain/Step Time": 8.510652473196387} +{"Pretrain/Learning Rate": 4.839767932043485e-05, "Pretrain/Loss": 2.105098247528076, "Pretrain/Loss (Raw)": 2.0755887031555176, "Pretrain/Step": 1346, "Pretrain/Step Time": 8.507951948791742} +{"Pretrain/Learning Rate": 4.839468744121718e-05, "Pretrain/Loss": 2.105794906616211, "Pretrain/Loss (Raw)": 2.173712730407715, "Pretrain/Step": 1347, "Pretrain/Step Time": 8.505971297621727} +{"Pretrain/Learning Rate": 4.8391692864013916e-05, "Pretrain/Loss": 2.105057716369629, "Pretrain/Loss (Raw)": 2.016796350479126, "Pretrain/Step": 1348, "Pretrain/Step Time": 8.50797450169921} +{"Pretrain/Learning Rate": 4.838869558917041e-05, "Pretrain/Loss": 2.104383945465088, "Pretrain/Loss (Raw)": 1.9758325815200806, "Pretrain/Step": 1349, "Pretrain/Step Time": 8.513814132660627} +{"Pretrain/Learning Rate": 4.838569561703231e-05, "Pretrain/Loss": 2.1048271656036377, "Pretrain/Loss (Raw)": 2.079768180847168, "Pretrain/Step": 1350, "Pretrain/Step Time": 8.515557006001472} +{"Pretrain/Learning Rate": 4.83826929479456e-05, "Pretrain/Loss": 2.105116844177246, "Pretrain/Loss (Raw)": 2.1891019344329834, "Pretrain/Step": 1351, "Pretrain/Step Time": 8.504694383591413} +{"Pretrain/Learning Rate": 4.837968758225655e-05, "Pretrain/Loss": 2.1056432723999023, "Pretrain/Loss (Raw)": 2.2247347831726074, "Pretrain/Step": 1352, "Pretrain/Step Time": 8.509249968454242} +{"Pretrain/Learning Rate": 4.837667952031176e-05, "Pretrain/Loss": 2.1044394969940186, "Pretrain/Loss (Raw)": 2.115116834640503, "Pretrain/Step": 1353, "Pretrain/Step Time": 8.512617990374565} +{"Pretrain/Learning Rate": 4.8373668762458144e-05, "Pretrain/Loss": 2.103755474090576, "Pretrain/Loss (Raw)": 2.090095043182373, "Pretrain/Step": 1354, "Pretrain/Step Time": 8.514731891453266} +{"Pretrain/Learning Rate": 4.8370655309042896e-05, "Pretrain/Loss": 2.1049280166625977, "Pretrain/Loss (Raw)": 2.2823989391326904, "Pretrain/Step": 1355, "Pretrain/Step Time": 8.517279364168644} +{"Pretrain/Learning Rate": 4.8367639160413553e-05, "Pretrain/Loss": 2.1053452491760254, "Pretrain/Loss (Raw)": 2.056138277053833, "Pretrain/Step": 1356, "Pretrain/Step Time": 8.511710777878761} +{"Pretrain/Learning Rate": 4.8364620316917956e-05, "Pretrain/Loss": 2.10477352142334, "Pretrain/Loss (Raw)": 2.1040031909942627, "Pretrain/Step": 1357, "Pretrain/Step Time": 8.506626630201936} +{"Pretrain/Learning Rate": 4.836159877890424e-05, "Pretrain/Loss": 2.103188991546631, "Pretrain/Loss (Raw)": 2.0335114002227783, "Pretrain/Step": 1358, "Pretrain/Step Time": 8.50171273574233} +{"Pretrain/Learning Rate": 4.835857454672087e-05, "Pretrain/Loss": 2.1018528938293457, "Pretrain/Loss (Raw)": 1.9470348358154297, "Pretrain/Step": 1359, "Pretrain/Step Time": 8.514317920431495} +{"Pretrain/Learning Rate": 4.835554762071661e-05, "Pretrain/Loss": 2.1040360927581787, "Pretrain/Loss (Raw)": 2.130342721939087, "Pretrain/Step": 1360, "Pretrain/Step Time": 8.512895310297608} +{"Pretrain/Learning Rate": 4.8352518001240555e-05, "Pretrain/Loss": 2.1045265197753906, "Pretrain/Loss (Raw)": 2.0831527709960938, "Pretrain/Step": 1361, "Pretrain/Step Time": 8.5174699742347} +{"Pretrain/Learning Rate": 4.834948568864207e-05, "Pretrain/Loss": 2.103458881378174, "Pretrain/Loss (Raw)": 2.0999608039855957, "Pretrain/Step": 1362, "Pretrain/Step Time": 8.512306747958064} +{"Pretrain/Learning Rate": 4.8346450683270875e-05, "Pretrain/Loss": 2.1027212142944336, "Pretrain/Loss (Raw)": 2.1889805793762207, "Pretrain/Step": 1363, "Pretrain/Step Time": 8.505713827908039} +{"Pretrain/Learning Rate": 4.8343412985476974e-05, "Pretrain/Loss": 2.1020593643188477, "Pretrain/Loss (Raw)": 2.121396780014038, "Pretrain/Step": 1364, "Pretrain/Step Time": 8.509400859475136} +{"Pretrain/Learning Rate": 4.83403725956107e-05, "Pretrain/Loss": 2.1034083366394043, "Pretrain/Loss (Raw)": 2.124150514602661, "Pretrain/Step": 1365, "Pretrain/Step Time": 8.515411235392094} +{"Pretrain/Learning Rate": 4.8337329514022664e-05, "Pretrain/Loss": 2.1031274795532227, "Pretrain/Loss (Raw)": 2.238982677459717, "Pretrain/Step": 1366, "Pretrain/Step Time": 8.513564229011536} +{"Pretrain/Learning Rate": 4.833428374106382e-05, "Pretrain/Loss": 2.1033499240875244, "Pretrain/Loss (Raw)": 2.1564948558807373, "Pretrain/Step": 1367, "Pretrain/Step Time": 8.513110853731632} +{"Pretrain/Learning Rate": 4.833123527708542e-05, "Pretrain/Loss": 2.105949878692627, "Pretrain/Loss (Raw)": 2.1917564868927, "Pretrain/Step": 1368, "Pretrain/Step Time": 8.516815155744553} +{"Pretrain/Learning Rate": 4.832818412243904e-05, "Pretrain/Loss": 2.1050305366516113, "Pretrain/Loss (Raw)": 2.0223758220672607, "Pretrain/Step": 1369, "Pretrain/Step Time": 8.502573011443019} +{"Pretrain/Learning Rate": 4.8325130277476526e-05, "Pretrain/Loss": 2.106123208999634, "Pretrain/Loss (Raw)": 2.0932369232177734, "Pretrain/Step": 1370, "Pretrain/Step Time": 8.504422284662724} +{"Pretrain/Learning Rate": 4.832207374255008e-05, "Pretrain/Loss": 2.1038880348205566, "Pretrain/Loss (Raw)": 2.04897141456604, "Pretrain/Step": 1371, "Pretrain/Step Time": 8.516200073063374} +{"Pretrain/Learning Rate": 4.8319014518012195e-05, "Pretrain/Loss": 2.102836847305298, "Pretrain/Loss (Raw)": 2.045003890991211, "Pretrain/Step": 1372, "Pretrain/Step Time": 8.516515554860234} +{"Pretrain/Learning Rate": 4.831595260421567e-05, "Pretrain/Loss": 2.1023752689361572, "Pretrain/Loss (Raw)": 2.08297061920166, "Pretrain/Step": 1373, "Pretrain/Step Time": 8.5157425776124} +{"Pretrain/Learning Rate": 4.8312888001513624e-05, "Pretrain/Loss": 2.104644298553467, "Pretrain/Loss (Raw)": 2.2979159355163574, "Pretrain/Step": 1374, "Pretrain/Step Time": 8.510186452418566} +{"Pretrain/Learning Rate": 4.830982071025948e-05, "Pretrain/Loss": 2.105215549468994, "Pretrain/Loss (Raw)": 2.0291247367858887, "Pretrain/Step": 1375, "Pretrain/Step Time": 8.510006004944444} +{"Pretrain/Learning Rate": 4.830675073080697e-05, "Pretrain/Loss": 2.1042165756225586, "Pretrain/Loss (Raw)": 2.0514841079711914, "Pretrain/Step": 1376, "Pretrain/Step Time": 8.505710469558835} +{"Pretrain/Learning Rate": 4.830367806351015e-05, "Pretrain/Loss": 2.103349208831787, "Pretrain/Loss (Raw)": 1.9927698373794556, "Pretrain/Step": 1377, "Pretrain/Step Time": 8.511894108727574} +{"Pretrain/Learning Rate": 4.830060270872335e-05, "Pretrain/Loss": 2.102020025253296, "Pretrain/Loss (Raw)": 1.9511713981628418, "Pretrain/Step": 1378, "Pretrain/Step Time": 8.512302177026868} +{"Pretrain/Learning Rate": 4.8297524666801265e-05, "Pretrain/Loss": 2.102679967880249, "Pretrain/Loss (Raw)": 2.0406789779663086, "Pretrain/Step": 1379, "Pretrain/Step Time": 8.519165782257915} +{"Pretrain/Learning Rate": 4.829444393809884e-05, "Pretrain/Loss": 2.1020896434783936, "Pretrain/Loss (Raw)": 1.9790451526641846, "Pretrain/Step": 1380, "Pretrain/Step Time": 8.51117211394012} +{"Pretrain/Learning Rate": 4.829136052297138e-05, "Pretrain/Loss": 2.1028831005096436, "Pretrain/Loss (Raw)": 2.2478761672973633, "Pretrain/Step": 1381, "Pretrain/Step Time": 8.502639601007104} +{"Pretrain/Learning Rate": 4.828827442177447e-05, "Pretrain/Loss": 2.102201223373413, "Pretrain/Loss (Raw)": 2.037843942642212, "Pretrain/Step": 1382, "Pretrain/Step Time": 8.502726316452026} +{"Pretrain/Learning Rate": 4.8285185634864024e-05, "Pretrain/Loss": 2.10150146484375, "Pretrain/Loss (Raw)": 1.983259916305542, "Pretrain/Step": 1383, "Pretrain/Step Time": 8.511895086616278} +{"Pretrain/Learning Rate": 4.8282094162596235e-05, "Pretrain/Loss": 2.0996336936950684, "Pretrain/Loss (Raw)": 1.8105510473251343, "Pretrain/Step": 1384, "Pretrain/Step Time": 8.521713845431805} +{"Pretrain/Learning Rate": 4.8279000005327644e-05, "Pretrain/Loss": 2.0992226600646973, "Pretrain/Loss (Raw)": 1.931795358657837, "Pretrain/Step": 1385, "Pretrain/Step Time": 8.523621182888746} +{"Pretrain/Learning Rate": 4.827590316341508e-05, "Pretrain/Loss": 2.0965347290039062, "Pretrain/Loss (Raw)": 1.7331522703170776, "Pretrain/Step": 1386, "Pretrain/Step Time": 8.517399992793798} +{"Pretrain/Learning Rate": 4.827280363721568e-05, "Pretrain/Loss": 2.096947193145752, "Pretrain/Loss (Raw)": 2.1947455406188965, "Pretrain/Step": 1387, "Pretrain/Step Time": 8.514957841485739} +{"Pretrain/Learning Rate": 4.82697014270869e-05, "Pretrain/Loss": 2.0954232215881348, "Pretrain/Loss (Raw)": 1.927710771560669, "Pretrain/Step": 1388, "Pretrain/Step Time": 8.514640513807535} +{"Pretrain/Learning Rate": 4.8266596533386505e-05, "Pretrain/Loss": 2.096816301345825, "Pretrain/Loss (Raw)": 2.0199694633483887, "Pretrain/Step": 1389, "Pretrain/Step Time": 8.523375734686852} +{"Pretrain/Learning Rate": 4.8263488956472555e-05, "Pretrain/Loss": 2.098997116088867, "Pretrain/Loss (Raw)": 2.4387357234954834, "Pretrain/Step": 1390, "Pretrain/Step Time": 8.52247709967196} +{"Pretrain/Learning Rate": 4.826037869670345e-05, "Pretrain/Loss": 2.098722457885742, "Pretrain/Loss (Raw)": 1.9275885820388794, "Pretrain/Step": 1391, "Pretrain/Step Time": 8.524308145046234} +{"Pretrain/Learning Rate": 4.8257265754437854e-05, "Pretrain/Loss": 2.0983352661132812, "Pretrain/Loss (Raw)": 2.112046003341675, "Pretrain/Step": 1392, "Pretrain/Step Time": 8.521366972476244} +{"Pretrain/Learning Rate": 4.825415013003478e-05, "Pretrain/Loss": 2.098830461502075, "Pretrain/Loss (Raw)": 2.17079758644104, "Pretrain/Step": 1393, "Pretrain/Step Time": 8.513374876230955} +{"Pretrain/Learning Rate": 4.8251031823853546e-05, "Pretrain/Loss": 2.0965609550476074, "Pretrain/Loss (Raw)": 1.9057872295379639, "Pretrain/Step": 1394, "Pretrain/Step Time": 8.51016778498888} +{"Pretrain/Learning Rate": 4.824791083625375e-05, "Pretrain/Loss": 2.094407320022583, "Pretrain/Loss (Raw)": 1.9244142770767212, "Pretrain/Step": 1395, "Pretrain/Step Time": 8.519493447616696} +{"Pretrain/Learning Rate": 4.8244787167595335e-05, "Pretrain/Loss": 2.0950417518615723, "Pretrain/Loss (Raw)": 2.127692699432373, "Pretrain/Step": 1396, "Pretrain/Step Time": 8.519270932301879} +{"Pretrain/Learning Rate": 4.824166081823853e-05, "Pretrain/Loss": 2.0957376956939697, "Pretrain/Loss (Raw)": 2.065784215927124, "Pretrain/Step": 1397, "Pretrain/Step Time": 8.521053425967693} +{"Pretrain/Learning Rate": 4.823853178854387e-05, "Pretrain/Loss": 2.096282482147217, "Pretrain/Loss (Raw)": 2.018185615539551, "Pretrain/Step": 1398, "Pretrain/Step Time": 8.508846638724208} +{"Pretrain/Learning Rate": 4.8235400078872234e-05, "Pretrain/Loss": 2.0975427627563477, "Pretrain/Loss (Raw)": 2.1665921211242676, "Pretrain/Step": 1399, "Pretrain/Step Time": 8.508538829162717} +{"Pretrain/Learning Rate": 4.823226568958477e-05, "Pretrain/Loss": 2.09879207611084, "Pretrain/Loss (Raw)": 2.3333377838134766, "Pretrain/Step": 1400, "Pretrain/Step Time": 8.508927514776587} +{"Pretrain/Learning Rate": 4.822912862104295e-05, "Pretrain/Loss": 2.0977096557617188, "Pretrain/Loss (Raw)": 2.0826849937438965, "Pretrain/Step": 1401, "Pretrain/Step Time": 8.51851967908442} +{"Pretrain/Learning Rate": 4.8225988873608554e-05, "Pretrain/Loss": 2.098909854888916, "Pretrain/Loss (Raw)": 2.146876573562622, "Pretrain/Step": 1402, "Pretrain/Step Time": 8.516517108306289} +{"Pretrain/Learning Rate": 4.8222846447643686e-05, "Pretrain/Loss": 2.099738597869873, "Pretrain/Loss (Raw)": 2.2645297050476074, "Pretrain/Step": 1403, "Pretrain/Step Time": 8.519155042245984} +{"Pretrain/Learning Rate": 4.8219701343510727e-05, "Pretrain/Loss": 2.0996246337890625, "Pretrain/Loss (Raw)": 2.109938859939575, "Pretrain/Step": 1404, "Pretrain/Step Time": 8.510184112936258} +{"Pretrain/Learning Rate": 4.8216553561572395e-05, "Pretrain/Loss": 2.0979652404785156, "Pretrain/Loss (Raw)": 2.097007989883423, "Pretrain/Step": 1405, "Pretrain/Step Time": 8.505946351215243} +{"Pretrain/Learning Rate": 4.821340310219171e-05, "Pretrain/Loss": 2.0997533798217773, "Pretrain/Loss (Raw)": 2.2420780658721924, "Pretrain/Step": 1406, "Pretrain/Step Time": 8.512525953352451} +{"Pretrain/Learning Rate": 4.8210249965732e-05, "Pretrain/Loss": 2.1005752086639404, "Pretrain/Loss (Raw)": 2.1783478260040283, "Pretrain/Step": 1407, "Pretrain/Step Time": 8.516962369903922} +{"Pretrain/Learning Rate": 4.8207094152556886e-05, "Pretrain/Loss": 2.0999596118927, "Pretrain/Loss (Raw)": 2.1894872188568115, "Pretrain/Step": 1408, "Pretrain/Step Time": 8.51684202812612} +{"Pretrain/Learning Rate": 4.820393566303032e-05, "Pretrain/Loss": 2.1006319522857666, "Pretrain/Loss (Raw)": 2.187925338745117, "Pretrain/Step": 1409, "Pretrain/Step Time": 8.517852937802672} +{"Pretrain/Learning Rate": 4.8200774497516555e-05, "Pretrain/Loss": 2.1001768112182617, "Pretrain/Loss (Raw)": 2.1749048233032227, "Pretrain/Step": 1410, "Pretrain/Step Time": 8.51400738954544} +{"Pretrain/Learning Rate": 4.8197610656380144e-05, "Pretrain/Loss": 2.100480556488037, "Pretrain/Loss (Raw)": 2.1832351684570312, "Pretrain/Step": 1411, "Pretrain/Step Time": 8.508728351444006} +{"Pretrain/Learning Rate": 4.8194444139985965e-05, "Pretrain/Loss": 2.10357666015625, "Pretrain/Loss (Raw)": 2.255493640899658, "Pretrain/Step": 1412, "Pretrain/Step Time": 8.510102339088917} +{"Pretrain/Learning Rate": 4.81912749486992e-05, "Pretrain/Loss": 2.1050238609313965, "Pretrain/Loss (Raw)": 2.259216785430908, "Pretrain/Step": 1413, "Pretrain/Step Time": 8.514785271137953} +{"Pretrain/Learning Rate": 4.818810308288531e-05, "Pretrain/Loss": 2.1054155826568604, "Pretrain/Loss (Raw)": 2.114739418029785, "Pretrain/Step": 1414, "Pretrain/Step Time": 8.516204867511988} +{"Pretrain/Learning Rate": 4.818492854291012e-05, "Pretrain/Loss": 2.1016736030578613, "Pretrain/Loss (Raw)": 1.998663306236267, "Pretrain/Step": 1415, "Pretrain/Step Time": 8.517141183838248} +{"Pretrain/Learning Rate": 4.818175132913971e-05, "Pretrain/Loss": 2.0987064838409424, "Pretrain/Loss (Raw)": 1.9607644081115723, "Pretrain/Step": 1416, "Pretrain/Step Time": 8.510353788733482} +{"Pretrain/Learning Rate": 4.817857144194051e-05, "Pretrain/Loss": 2.1001529693603516, "Pretrain/Loss (Raw)": 2.250493049621582, "Pretrain/Step": 1417, "Pretrain/Step Time": 8.508383532986045} +{"Pretrain/Learning Rate": 4.817538888167923e-05, "Pretrain/Loss": 2.0978925228118896, "Pretrain/Loss (Raw)": 1.923653483390808, "Pretrain/Step": 1418, "Pretrain/Step Time": 8.513463914394379} +{"Pretrain/Learning Rate": 4.817220364872289e-05, "Pretrain/Loss": 2.0993547439575195, "Pretrain/Loss (Raw)": 2.3541407585144043, "Pretrain/Step": 1419, "Pretrain/Step Time": 8.518276821821928} +{"Pretrain/Learning Rate": 4.816901574343884e-05, "Pretrain/Loss": 2.0970263481140137, "Pretrain/Loss (Raw)": 1.911321997642517, "Pretrain/Step": 1420, "Pretrain/Step Time": 8.520456595346332} +{"Pretrain/Learning Rate": 4.816582516619471e-05, "Pretrain/Loss": 2.0984063148498535, "Pretrain/Loss (Raw)": 2.179986000061035, "Pretrain/Step": 1421, "Pretrain/Step Time": 8.515472369268537} +{"Pretrain/Learning Rate": 4.816263191735847e-05, "Pretrain/Loss": 2.099456548690796, "Pretrain/Loss (Raw)": 2.1593246459960938, "Pretrain/Step": 1422, "Pretrain/Step Time": 8.519038274884224} +{"Pretrain/Learning Rate": 4.8159435997298375e-05, "Pretrain/Loss": 2.1015946865081787, "Pretrain/Loss (Raw)": 2.222426414489746, "Pretrain/Step": 1423, "Pretrain/Step Time": 8.503471534699202} +{"Pretrain/Learning Rate": 4.8156237406382975e-05, "Pretrain/Loss": 2.1013474464416504, "Pretrain/Loss (Raw)": 2.133331537246704, "Pretrain/Step": 1424, "Pretrain/Step Time": 8.504952682182193} +{"Pretrain/Learning Rate": 4.815303614498118e-05, "Pretrain/Loss": 2.1005921363830566, "Pretrain/Loss (Raw)": 2.011301040649414, "Pretrain/Step": 1425, "Pretrain/Step Time": 8.50848876312375} +{"Pretrain/Learning Rate": 4.814983221346214e-05, "Pretrain/Loss": 2.0996174812316895, "Pretrain/Loss (Raw)": 1.9647462368011475, "Pretrain/Step": 1426, "Pretrain/Step Time": 8.51298119686544} +{"Pretrain/Learning Rate": 4.814662561219537e-05, "Pretrain/Loss": 2.10038423538208, "Pretrain/Loss (Raw)": 2.0986084938049316, "Pretrain/Step": 1427, "Pretrain/Step Time": 8.511620946228504} +{"Pretrain/Learning Rate": 4.814341634155066e-05, "Pretrain/Loss": 2.1007819175720215, "Pretrain/Loss (Raw)": 2.2564125061035156, "Pretrain/Step": 1428, "Pretrain/Step Time": 8.507311856374145} +{"Pretrain/Learning Rate": 4.8140204401898134e-05, "Pretrain/Loss": 2.110358715057373, "Pretrain/Loss (Raw)": 3.0514161586761475, "Pretrain/Step": 1429, "Pretrain/Step Time": 8.504168838262558} +{"Pretrain/Learning Rate": 4.813698979360819e-05, "Pretrain/Loss": 2.1116714477539062, "Pretrain/Loss (Raw)": 2.1736786365509033, "Pretrain/Step": 1430, "Pretrain/Step Time": 8.506886655464768} +{"Pretrain/Learning Rate": 4.813377251705156e-05, "Pretrain/Loss": 2.1130268573760986, "Pretrain/Loss (Raw)": 2.2703146934509277, "Pretrain/Step": 1431, "Pretrain/Step Time": 8.50653493963182} +{"Pretrain/Learning Rate": 4.8130552572599265e-05, "Pretrain/Loss": 2.1125288009643555, "Pretrain/Loss (Raw)": 2.137709617614746, "Pretrain/Step": 1432, "Pretrain/Step Time": 8.510335570201278} +{"Pretrain/Learning Rate": 4.8127329960622656e-05, "Pretrain/Loss": 2.111137866973877, "Pretrain/Loss (Raw)": 2.1435210704803467, "Pretrain/Step": 1433, "Pretrain/Step Time": 8.504518194124103} +{"Pretrain/Learning Rate": 4.8124104681493375e-05, "Pretrain/Loss": 2.1087610721588135, "Pretrain/Loss (Raw)": 1.8942948579788208, "Pretrain/Step": 1434, "Pretrain/Step Time": 8.497271928936243} +{"Pretrain/Learning Rate": 4.8120876735583384e-05, "Pretrain/Loss": 2.1081507205963135, "Pretrain/Loss (Raw)": 2.0457823276519775, "Pretrain/Step": 1435, "Pretrain/Step Time": 8.498319160193205} +{"Pretrain/Learning Rate": 4.811764612326493e-05, "Pretrain/Loss": 2.1054811477661133, "Pretrain/Loss (Raw)": 1.938059687614441, "Pretrain/Step": 1436, "Pretrain/Step Time": 8.50388896651566} +{"Pretrain/Learning Rate": 4.8114412844910595e-05, "Pretrain/Loss": 2.106715202331543, "Pretrain/Loss (Raw)": 2.337296962738037, "Pretrain/Step": 1437, "Pretrain/Step Time": 8.50196243263781} +{"Pretrain/Learning Rate": 4.8111176900893254e-05, "Pretrain/Loss": 2.1073153018951416, "Pretrain/Loss (Raw)": 2.132378578186035, "Pretrain/Step": 1438, "Pretrain/Step Time": 8.507981296628714} +{"Pretrain/Learning Rate": 4.810793829158609e-05, "Pretrain/Loss": 2.1058080196380615, "Pretrain/Loss (Raw)": 1.9657446146011353, "Pretrain/Step": 1439, "Pretrain/Step Time": 8.50105207040906} +{"Pretrain/Learning Rate": 4.8104697017362595e-05, "Pretrain/Loss": 2.106935977935791, "Pretrain/Loss (Raw)": 2.1221303939819336, "Pretrain/Step": 1440, "Pretrain/Step Time": 8.495040783658624} +{"Pretrain/Learning Rate": 4.8101453078596565e-05, "Pretrain/Loss": 2.1046910285949707, "Pretrain/Loss (Raw)": 1.6963164806365967, "Pretrain/Step": 1441, "Pretrain/Step Time": 8.495268691331148} +{"Pretrain/Learning Rate": 4.809820647566211e-05, "Pretrain/Loss": 2.1000194549560547, "Pretrain/Loss (Raw)": 1.789006233215332, "Pretrain/Step": 1442, "Pretrain/Step Time": 8.49638456106186} +{"Pretrain/Learning Rate": 4.8094957208933635e-05, "Pretrain/Loss": 2.1011085510253906, "Pretrain/Loss (Raw)": 2.1468095779418945, "Pretrain/Step": 1443, "Pretrain/Step Time": 8.499297358095646} +{"Pretrain/Learning Rate": 4.809170527878587e-05, "Pretrain/Loss": 2.09830379486084, "Pretrain/Loss (Raw)": 2.03341007232666, "Pretrain/Step": 1444, "Pretrain/Step Time": 8.507181534543633} +{"Pretrain/Learning Rate": 4.808845068559384e-05, "Pretrain/Loss": 2.0992941856384277, "Pretrain/Loss (Raw)": 2.2936055660247803, "Pretrain/Step": 1445, "Pretrain/Step Time": 8.502360494807363} +{"Pretrain/Learning Rate": 4.808519342973289e-05, "Pretrain/Loss": 2.0979976654052734, "Pretrain/Loss (Raw)": 2.0372700691223145, "Pretrain/Step": 1446, "Pretrain/Step Time": 8.497997971251607} +{"Pretrain/Learning Rate": 4.808193351157865e-05, "Pretrain/Loss": 2.098874568939209, "Pretrain/Loss (Raw)": 2.2117958068847656, "Pretrain/Step": 1447, "Pretrain/Step Time": 8.503551816567779} +{"Pretrain/Learning Rate": 4.8078670931507064e-05, "Pretrain/Loss": 2.0973167419433594, "Pretrain/Loss (Raw)": 2.117723226547241, "Pretrain/Step": 1448, "Pretrain/Step Time": 8.506924144923687} +{"Pretrain/Learning Rate": 4.80754056898944e-05, "Pretrain/Loss": 2.0985777378082275, "Pretrain/Loss (Raw)": 2.1777708530426025, "Pretrain/Step": 1449, "Pretrain/Step Time": 8.506672002375126} +{"Pretrain/Learning Rate": 4.807213778711722e-05, "Pretrain/Loss": 2.098304271697998, "Pretrain/Loss (Raw)": 2.222439765930176, "Pretrain/Step": 1450, "Pretrain/Step Time": 8.513434447348118} +{"Pretrain/Learning Rate": 4.8068867223552384e-05, "Pretrain/Loss": 2.097445487976074, "Pretrain/Loss (Raw)": 1.989263653755188, "Pretrain/Step": 1451, "Pretrain/Step Time": 8.510325102135539} +{"Pretrain/Learning Rate": 4.8065593999577086e-05, "Pretrain/Loss": 2.0997300148010254, "Pretrain/Loss (Raw)": 2.0206613540649414, "Pretrain/Step": 1452, "Pretrain/Step Time": 8.50074490904808} +{"Pretrain/Learning Rate": 4.806231811556879e-05, "Pretrain/Loss": 2.0976545810699463, "Pretrain/Loss (Raw)": 1.7771810293197632, "Pretrain/Step": 1453, "Pretrain/Step Time": 8.504091132432222} +{"Pretrain/Learning Rate": 4.80590395719053e-05, "Pretrain/Loss": 2.098677158355713, "Pretrain/Loss (Raw)": 1.9266538619995117, "Pretrain/Step": 1454, "Pretrain/Step Time": 8.507650030776858} +{"Pretrain/Learning Rate": 4.805575836896471e-05, "Pretrain/Loss": 2.098933458328247, "Pretrain/Loss (Raw)": 2.30075740814209, "Pretrain/Step": 1455, "Pretrain/Step Time": 8.503383383154869} +{"Pretrain/Learning Rate": 4.805247450712542e-05, "Pretrain/Loss": 2.1005795001983643, "Pretrain/Loss (Raw)": 2.152578830718994, "Pretrain/Step": 1456, "Pretrain/Step Time": 8.508850324898958} +{"Pretrain/Learning Rate": 4.804918798676614e-05, "Pretrain/Loss": 2.0999908447265625, "Pretrain/Loss (Raw)": 2.1099252700805664, "Pretrain/Step": 1457, "Pretrain/Step Time": 8.512883001938462} +{"Pretrain/Learning Rate": 4.804589880826589e-05, "Pretrain/Loss": 2.0988857746124268, "Pretrain/Loss (Raw)": 2.058429002761841, "Pretrain/Step": 1458, "Pretrain/Step Time": 8.502463135868311} +{"Pretrain/Learning Rate": 4.8042606972004e-05, "Pretrain/Loss": 2.099458694458008, "Pretrain/Loss (Raw)": 2.003432035446167, "Pretrain/Step": 1459, "Pretrain/Step Time": 8.501144289970398} +{"Pretrain/Learning Rate": 4.803931247836009e-05, "Pretrain/Loss": 2.099428653717041, "Pretrain/Loss (Raw)": 2.270217180252075, "Pretrain/Step": 1460, "Pretrain/Step Time": 8.497944684699178} +{"Pretrain/Learning Rate": 4.80360153277141e-05, "Pretrain/Loss": 2.0988247394561768, "Pretrain/Loss (Raw)": 2.110805034637451, "Pretrain/Step": 1461, "Pretrain/Step Time": 8.50955124385655} +{"Pretrain/Learning Rate": 4.8032715520446275e-05, "Pretrain/Loss": 2.0968852043151855, "Pretrain/Loss (Raw)": 1.8866838216781616, "Pretrain/Step": 1462, "Pretrain/Step Time": 8.514044841751456} +{"Pretrain/Learning Rate": 4.802941305693716e-05, "Pretrain/Loss": 2.095376968383789, "Pretrain/Loss (Raw)": 1.9718235731124878, "Pretrain/Step": 1463, "Pretrain/Step Time": 8.513048468157649} +{"Pretrain/Learning Rate": 4.802610793756761e-05, "Pretrain/Loss": 2.0942583084106445, "Pretrain/Loss (Raw)": 2.0490310192108154, "Pretrain/Step": 1464, "Pretrain/Step Time": 8.512173781171441} +{"Pretrain/Learning Rate": 4.8022800162718794e-05, "Pretrain/Loss": 2.094275951385498, "Pretrain/Loss (Raw)": 2.2071425914764404, "Pretrain/Step": 1465, "Pretrain/Step Time": 8.51081845909357} +{"Pretrain/Learning Rate": 4.801948973277218e-05, "Pretrain/Loss": 2.0953283309936523, "Pretrain/Loss (Raw)": 2.096776008605957, "Pretrain/Step": 1466, "Pretrain/Step Time": 8.512170108035207} +{"Pretrain/Learning Rate": 4.8016176648109534e-05, "Pretrain/Loss": 2.094303607940674, "Pretrain/Loss (Raw)": 1.9180397987365723, "Pretrain/Step": 1467, "Pretrain/Step Time": 8.512576567009091} +{"Pretrain/Learning Rate": 4.801286090911295e-05, "Pretrain/Loss": 2.095134735107422, "Pretrain/Loss (Raw)": 2.1392037868499756, "Pretrain/Step": 1468, "Pretrain/Step Time": 8.515707824379206} +{"Pretrain/Learning Rate": 4.80095425161648e-05, "Pretrain/Loss": 2.093622922897339, "Pretrain/Loss (Raw)": 1.7251224517822266, "Pretrain/Step": 1469, "Pretrain/Step Time": 8.509817423298955} +{"Pretrain/Learning Rate": 4.800622146964777e-05, "Pretrain/Loss": 2.093019485473633, "Pretrain/Loss (Raw)": 1.9784071445465088, "Pretrain/Step": 1470, "Pretrain/Step Time": 8.50683917477727} +{"Pretrain/Learning Rate": 4.8002897769944885e-05, "Pretrain/Loss": 2.0939459800720215, "Pretrain/Loss (Raw)": 2.161585807800293, "Pretrain/Step": 1471, "Pretrain/Step Time": 8.508080629631877} +{"Pretrain/Learning Rate": 4.799957141743944e-05, "Pretrain/Loss": 2.0952653884887695, "Pretrain/Loss (Raw)": 2.1354825496673584, "Pretrain/Step": 1472, "Pretrain/Step Time": 8.51110977306962} +{"Pretrain/Learning Rate": 4.799624241251502e-05, "Pretrain/Loss": 2.0981178283691406, "Pretrain/Loss (Raw)": 2.308096170425415, "Pretrain/Step": 1473, "Pretrain/Step Time": 8.510619634762406} +{"Pretrain/Learning Rate": 4.7992910755555584e-05, "Pretrain/Loss": 2.1002047061920166, "Pretrain/Loss (Raw)": 2.342695951461792, "Pretrain/Step": 1474, "Pretrain/Step Time": 8.514312770217657} +{"Pretrain/Learning Rate": 4.798957644694533e-05, "Pretrain/Loss": 2.0998711585998535, "Pretrain/Loss (Raw)": 2.1310298442840576, "Pretrain/Step": 1475, "Pretrain/Step Time": 8.51774975284934} +{"Pretrain/Learning Rate": 4.7986239487068785e-05, "Pretrain/Loss": 2.098583698272705, "Pretrain/Loss (Raw)": 1.851993203163147, "Pretrain/Step": 1476, "Pretrain/Step Time": 8.509073071181774} +{"Pretrain/Learning Rate": 4.798289987631079e-05, "Pretrain/Loss": 2.098526954650879, "Pretrain/Loss (Raw)": 1.968559980392456, "Pretrain/Step": 1477, "Pretrain/Step Time": 8.507634803652763} +{"Pretrain/Learning Rate": 4.797955761505648e-05, "Pretrain/Loss": 2.098262071609497, "Pretrain/Loss (Raw)": 2.045889377593994, "Pretrain/Step": 1478, "Pretrain/Step Time": 8.51862526871264} +{"Pretrain/Learning Rate": 4.7976212703691306e-05, "Pretrain/Loss": 2.0976274013519287, "Pretrain/Loss (Raw)": 2.1078412532806396, "Pretrain/Step": 1479, "Pretrain/Step Time": 8.518850645050406} +{"Pretrain/Learning Rate": 4.797286514260101e-05, "Pretrain/Loss": 2.0977678298950195, "Pretrain/Loss (Raw)": 2.2427399158477783, "Pretrain/Step": 1480, "Pretrain/Step Time": 8.513305870816112} +{"Pretrain/Learning Rate": 4.7969514932171665e-05, "Pretrain/Loss": 2.0965158939361572, "Pretrain/Loss (Raw)": 1.9548569917678833, "Pretrain/Step": 1481, "Pretrain/Step Time": 8.51358682103455} +{"Pretrain/Learning Rate": 4.796616207278961e-05, "Pretrain/Loss": 2.0965871810913086, "Pretrain/Loss (Raw)": 2.09919810295105, "Pretrain/Step": 1482, "Pretrain/Step Time": 8.511464377865195} +{"Pretrain/Learning Rate": 4.796280656484153e-05, "Pretrain/Loss": 2.0962600708007812, "Pretrain/Loss (Raw)": 2.2405588626861572, "Pretrain/Step": 1483, "Pretrain/Step Time": 8.514777455478907} +{"Pretrain/Learning Rate": 4.795944840871439e-05, "Pretrain/Loss": 2.097102165222168, "Pretrain/Loss (Raw)": 2.1639273166656494, "Pretrain/Step": 1484, "Pretrain/Step Time": 8.5237419269979} +{"Pretrain/Learning Rate": 4.7956087604795474e-05, "Pretrain/Loss": 2.0958123207092285, "Pretrain/Loss (Raw)": 1.9388885498046875, "Pretrain/Step": 1485, "Pretrain/Step Time": 8.525092149153352} +{"Pretrain/Learning Rate": 4.7952724153472366e-05, "Pretrain/Loss": 2.0957107543945312, "Pretrain/Loss (Raw)": 2.0205209255218506, "Pretrain/Step": 1486, "Pretrain/Step Time": 8.522997507825494} +{"Pretrain/Learning Rate": 4.7949358055132945e-05, "Pretrain/Loss": 2.096245288848877, "Pretrain/Loss (Raw)": 2.0154104232788086, "Pretrain/Step": 1487, "Pretrain/Step Time": 8.51194249279797} +{"Pretrain/Learning Rate": 4.7945989310165415e-05, "Pretrain/Loss": 2.0951151847839355, "Pretrain/Loss (Raw)": 1.9857133626937866, "Pretrain/Step": 1488, "Pretrain/Step Time": 8.509335787966847} +{"Pretrain/Learning Rate": 4.794261791895828e-05, "Pretrain/Loss": 2.095053195953369, "Pretrain/Loss (Raw)": 2.0752172470092773, "Pretrain/Step": 1489, "Pretrain/Step Time": 8.503222269937396} +{"Pretrain/Learning Rate": 4.793924388190033e-05, "Pretrain/Loss": 2.0946459770202637, "Pretrain/Loss (Raw)": 2.0478365421295166, "Pretrain/Step": 1490, "Pretrain/Step Time": 8.512429602444172} +{"Pretrain/Learning Rate": 4.793586719938068e-05, "Pretrain/Loss": 2.0943806171417236, "Pretrain/Loss (Raw)": 2.1550211906433105, "Pretrain/Step": 1491, "Pretrain/Step Time": 8.515579411759973} +{"Pretrain/Learning Rate": 4.7932487871788746e-05, "Pretrain/Loss": 2.0943515300750732, "Pretrain/Loss (Raw)": 2.117687225341797, "Pretrain/Step": 1492, "Pretrain/Step Time": 8.514883860945702} +{"Pretrain/Learning Rate": 4.792910589951426e-05, "Pretrain/Loss": 2.093177318572998, "Pretrain/Loss (Raw)": 1.9738192558288574, "Pretrain/Step": 1493, "Pretrain/Step Time": 8.505781814455986} +{"Pretrain/Learning Rate": 4.792572128294722e-05, "Pretrain/Loss": 2.091571569442749, "Pretrain/Loss (Raw)": 2.033468008041382, "Pretrain/Step": 1494, "Pretrain/Step Time": 8.506887074559927} +{"Pretrain/Learning Rate": 4.792233402247799e-05, "Pretrain/Loss": 2.094024658203125, "Pretrain/Loss (Raw)": 2.4704513549804688, "Pretrain/Step": 1495, "Pretrain/Step Time": 8.509686693549156} +{"Pretrain/Learning Rate": 4.791894411849718e-05, "Pretrain/Loss": 2.093069076538086, "Pretrain/Loss (Raw)": 2.0694704055786133, "Pretrain/Step": 1496, "Pretrain/Step Time": 8.5158312600106} +{"Pretrain/Learning Rate": 4.7915551571395726e-05, "Pretrain/Loss": 2.093364715576172, "Pretrain/Loss (Raw)": 2.0602338314056396, "Pretrain/Step": 1497, "Pretrain/Step Time": 8.518147122114897} +{"Pretrain/Learning Rate": 4.79121563815649e-05, "Pretrain/Loss": 2.09299635887146, "Pretrain/Loss (Raw)": 2.0460853576660156, "Pretrain/Step": 1498, "Pretrain/Step Time": 8.517641508951783} +{"Pretrain/Learning Rate": 4.790875854939622e-05, "Pretrain/Loss": 2.0942325592041016, "Pretrain/Loss (Raw)": 2.20719575881958, "Pretrain/Step": 1499, "Pretrain/Step Time": 8.504003506153822} +{"Pretrain/Learning Rate": 4.790535807528156e-05, "Pretrain/Loss": 2.0941903591156006, "Pretrain/Loss (Raw)": 2.039620876312256, "Pretrain/Step": 1500, "Pretrain/Step Time": 8.503934243693948} +{"Pretrain/Learning Rate": 4.7901954959613076e-05, "Pretrain/Loss": 2.0943431854248047, "Pretrain/Loss (Raw)": 2.1025266647338867, "Pretrain/Step": 1501, "Pretrain/Step Time": 8.512327056378126} +{"Pretrain/Learning Rate": 4.789854920278323e-05, "Pretrain/Loss": 2.092872142791748, "Pretrain/Loss (Raw)": 2.109618902206421, "Pretrain/Step": 1502, "Pretrain/Step Time": 8.51609656214714} +{"Pretrain/Learning Rate": 4.789514080518478e-05, "Pretrain/Loss": 2.092991352081299, "Pretrain/Loss (Raw)": 2.0443508625030518, "Pretrain/Step": 1503, "Pretrain/Step Time": 8.51390803232789} +{"Pretrain/Learning Rate": 4.789172976721081e-05, "Pretrain/Loss": 2.0922672748565674, "Pretrain/Loss (Raw)": 1.9588367938995361, "Pretrain/Step": 1504, "Pretrain/Step Time": 8.515519518405199} +{"Pretrain/Learning Rate": 4.7888316089254705e-05, "Pretrain/Loss": 2.0925328731536865, "Pretrain/Loss (Raw)": 2.0267653465270996, "Pretrain/Step": 1505, "Pretrain/Step Time": 8.50959737971425} +{"Pretrain/Learning Rate": 4.7884899771710126e-05, "Pretrain/Loss": 2.0944817066192627, "Pretrain/Loss (Raw)": 2.2006077766418457, "Pretrain/Step": 1506, "Pretrain/Step Time": 8.509904013946652} +{"Pretrain/Learning Rate": 4.788148081497106e-05, "Pretrain/Loss": 2.0949721336364746, "Pretrain/Loss (Raw)": 2.103454351425171, "Pretrain/Step": 1507, "Pretrain/Step Time": 8.516794435679913} +{"Pretrain/Learning Rate": 4.787805921943181e-05, "Pretrain/Loss": 2.0961780548095703, "Pretrain/Loss (Raw)": 2.133415937423706, "Pretrain/Step": 1508, "Pretrain/Step Time": 8.5151854660362} +{"Pretrain/Learning Rate": 4.787463498548698e-05, "Pretrain/Loss": 2.094306468963623, "Pretrain/Loss (Raw)": 2.0083134174346924, "Pretrain/Step": 1509, "Pretrain/Step Time": 8.518777953460813} +{"Pretrain/Learning Rate": 4.787120811353144e-05, "Pretrain/Loss": 2.0948567390441895, "Pretrain/Loss (Raw)": 2.108262300491333, "Pretrain/Step": 1510, "Pretrain/Step Time": 8.521220114082098} +{"Pretrain/Learning Rate": 4.786777860396041e-05, "Pretrain/Loss": 2.0963242053985596, "Pretrain/Loss (Raw)": 2.171107769012451, "Pretrain/Step": 1511, "Pretrain/Step Time": 8.511353051289916} +{"Pretrain/Learning Rate": 4.78643464571694e-05, "Pretrain/Loss": 2.098733901977539, "Pretrain/Loss (Raw)": 2.1189794540405273, "Pretrain/Step": 1512, "Pretrain/Step Time": 8.509095929563046} +{"Pretrain/Learning Rate": 4.786091167355421e-05, "Pretrain/Loss": 2.097405433654785, "Pretrain/Loss (Raw)": 1.761784553527832, "Pretrain/Step": 1513, "Pretrain/Step Time": 8.51472820341587} +{"Pretrain/Learning Rate": 4.785747425351097e-05, "Pretrain/Loss": 2.099684238433838, "Pretrain/Loss (Raw)": 2.0248334407806396, "Pretrain/Step": 1514, "Pretrain/Step Time": 8.514273397624493} +{"Pretrain/Learning Rate": 4.785403419743608e-05, "Pretrain/Loss": 2.0965638160705566, "Pretrain/Loss (Raw)": 1.7953159809112549, "Pretrain/Step": 1515, "Pretrain/Step Time": 8.512887753546238} +{"Pretrain/Learning Rate": 4.785059150572628e-05, "Pretrain/Loss": 2.0978152751922607, "Pretrain/Loss (Raw)": 2.0878992080688477, "Pretrain/Step": 1516, "Pretrain/Step Time": 8.513196034356952} +{"Pretrain/Learning Rate": 4.784714617877859e-05, "Pretrain/Loss": 2.0974924564361572, "Pretrain/Loss (Raw)": 1.9786502122879028, "Pretrain/Step": 1517, "Pretrain/Step Time": 8.5027666259557} +{"Pretrain/Learning Rate": 4.784369821699035e-05, "Pretrain/Loss": 2.093576431274414, "Pretrain/Loss (Raw)": 1.937492847442627, "Pretrain/Step": 1518, "Pretrain/Step Time": 8.502114163711667} +{"Pretrain/Learning Rate": 4.784024762075918e-05, "Pretrain/Loss": 2.093410015106201, "Pretrain/Loss (Raw)": 1.9062588214874268, "Pretrain/Step": 1519, "Pretrain/Step Time": 8.510145273059607} +{"Pretrain/Learning Rate": 4.7836794390483035e-05, "Pretrain/Loss": 2.0915169715881348, "Pretrain/Loss (Raw)": 1.8697655200958252, "Pretrain/Step": 1520, "Pretrain/Step Time": 8.508090810850263} +{"Pretrain/Learning Rate": 4.7833338526560145e-05, "Pretrain/Loss": 2.0891902446746826, "Pretrain/Loss (Raw)": 1.8729661703109741, "Pretrain/Step": 1521, "Pretrain/Step Time": 8.51317104510963} +{"Pretrain/Learning Rate": 4.782988002938907e-05, "Pretrain/Loss": 2.0903000831604004, "Pretrain/Loss (Raw)": 2.0478463172912598, "Pretrain/Step": 1522, "Pretrain/Step Time": 8.513644680380821} +{"Pretrain/Learning Rate": 4.782641889936864e-05, "Pretrain/Loss": 2.089859962463379, "Pretrain/Loss (Raw)": 1.8680821657180786, "Pretrain/Step": 1523, "Pretrain/Step Time": 8.501771679148078} +{"Pretrain/Learning Rate": 4.782295513689803e-05, "Pretrain/Loss": 2.089747905731201, "Pretrain/Loss (Raw)": 2.1133573055267334, "Pretrain/Step": 1524, "Pretrain/Step Time": 8.504917031154037} +{"Pretrain/Learning Rate": 4.7819488742376686e-05, "Pretrain/Loss": 2.0883193016052246, "Pretrain/Loss (Raw)": 1.882910966873169, "Pretrain/Step": 1525, "Pretrain/Step Time": 8.513507302850485} +{"Pretrain/Learning Rate": 4.7816019716204375e-05, "Pretrain/Loss": 2.0870323181152344, "Pretrain/Loss (Raw)": 1.853436827659607, "Pretrain/Step": 1526, "Pretrain/Step Time": 8.511020012199879} +{"Pretrain/Learning Rate": 4.781254805878115e-05, "Pretrain/Loss": 2.0885300636291504, "Pretrain/Loss (Raw)": 2.358311653137207, "Pretrain/Step": 1527, "Pretrain/Step Time": 8.509869806468487} +{"Pretrain/Learning Rate": 4.780907377050739e-05, "Pretrain/Loss": 2.086036205291748, "Pretrain/Loss (Raw)": 2.0141007900238037, "Pretrain/Step": 1528, "Pretrain/Step Time": 8.505605414509773} +{"Pretrain/Learning Rate": 4.780559685178376e-05, "Pretrain/Loss": 2.0852770805358887, "Pretrain/Loss (Raw)": 1.985556960105896, "Pretrain/Step": 1529, "Pretrain/Step Time": 8.495434144511819} +{"Pretrain/Learning Rate": 4.780211730301124e-05, "Pretrain/Loss": 2.084951162338257, "Pretrain/Loss (Raw)": 2.1051621437072754, "Pretrain/Step": 1530, "Pretrain/Step Time": 8.505268527194858} +{"Pretrain/Learning Rate": 4.779863512459111e-05, "Pretrain/Loss": 2.0834248065948486, "Pretrain/Loss (Raw)": 2.069122314453125, "Pretrain/Step": 1531, "Pretrain/Step Time": 8.507662391290069} +{"Pretrain/Learning Rate": 4.779515031692494e-05, "Pretrain/Loss": 2.084113121032715, "Pretrain/Loss (Raw)": 2.1980395317077637, "Pretrain/Step": 1532, "Pretrain/Step Time": 8.510919565334916} +{"Pretrain/Learning Rate": 4.7791662880414625e-05, "Pretrain/Loss": 2.0824904441833496, "Pretrain/Loss (Raw)": 1.889327883720398, "Pretrain/Step": 1533, "Pretrain/Step Time": 8.507508497685194} +{"Pretrain/Learning Rate": 4.778817281546235e-05, "Pretrain/Loss": 2.0811119079589844, "Pretrain/Loss (Raw)": 2.065609931945801, "Pretrain/Step": 1534, "Pretrain/Step Time": 8.499804504215717} +{"Pretrain/Learning Rate": 4.7784680122470605e-05, "Pretrain/Loss": 2.082765579223633, "Pretrain/Loss (Raw)": 2.390004873275757, "Pretrain/Step": 1535, "Pretrain/Step Time": 8.495140604674816} +{"Pretrain/Learning Rate": 4.778118480184218e-05, "Pretrain/Loss": 2.083707571029663, "Pretrain/Loss (Raw)": 2.3100857734680176, "Pretrain/Step": 1536, "Pretrain/Step Time": 8.49689650349319} +{"Pretrain/Learning Rate": 4.777768685398017e-05, "Pretrain/Loss": 2.0792250633239746, "Pretrain/Loss (Raw)": 1.6141821146011353, "Pretrain/Step": 1537, "Pretrain/Step Time": 8.504307717084885} +{"Pretrain/Learning Rate": 4.777418627928799e-05, "Pretrain/Loss": 2.0805463790893555, "Pretrain/Loss (Raw)": 2.344027519226074, "Pretrain/Step": 1538, "Pretrain/Step Time": 8.507040299475193} +{"Pretrain/Learning Rate": 4.777068307816932e-05, "Pretrain/Loss": 2.080704927444458, "Pretrain/Loss (Raw)": 2.203514575958252, "Pretrain/Step": 1539, "Pretrain/Step Time": 8.507593328133225} +{"Pretrain/Learning Rate": 4.776717725102819e-05, "Pretrain/Loss": 2.0803632736206055, "Pretrain/Loss (Raw)": 2.211740255355835, "Pretrain/Step": 1540, "Pretrain/Step Time": 8.505541918799281} +{"Pretrain/Learning Rate": 4.77636687982689e-05, "Pretrain/Loss": 2.07828950881958, "Pretrain/Loss (Raw)": 1.9938013553619385, "Pretrain/Step": 1541, "Pretrain/Step Time": 8.49855574592948} +{"Pretrain/Learning Rate": 4.776015772029605e-05, "Pretrain/Loss": 2.078667163848877, "Pretrain/Loss (Raw)": 2.163086175918579, "Pretrain/Step": 1542, "Pretrain/Step Time": 8.50346746854484} +{"Pretrain/Learning Rate": 4.7756644017514564e-05, "Pretrain/Loss": 2.0788869857788086, "Pretrain/Loss (Raw)": 2.026766538619995, "Pretrain/Step": 1543, "Pretrain/Step Time": 8.507749294862151} +{"Pretrain/Learning Rate": 4.775312769032966e-05, "Pretrain/Loss": 2.0798139572143555, "Pretrain/Loss (Raw)": 2.0794522762298584, "Pretrain/Step": 1544, "Pretrain/Step Time": 8.51350879482925} +{"Pretrain/Learning Rate": 4.774960873914685e-05, "Pretrain/Loss": 2.0778539180755615, "Pretrain/Loss (Raw)": 1.9996066093444824, "Pretrain/Step": 1545, "Pretrain/Step Time": 8.513237224891782} +{"Pretrain/Learning Rate": 4.774608716437196e-05, "Pretrain/Loss": 2.0781984329223633, "Pretrain/Loss (Raw)": 1.9677456617355347, "Pretrain/Step": 1546, "Pretrain/Step Time": 8.504580026492476} +{"Pretrain/Learning Rate": 4.7742562966411117e-05, "Pretrain/Loss": 2.0750458240509033, "Pretrain/Loss (Raw)": 1.9505927562713623, "Pretrain/Step": 1547, "Pretrain/Step Time": 8.501462450250983} +{"Pretrain/Learning Rate": 4.7739036145670744e-05, "Pretrain/Loss": 2.07722544670105, "Pretrain/Loss (Raw)": 2.1903083324432373, "Pretrain/Step": 1548, "Pretrain/Step Time": 8.50349548831582} +{"Pretrain/Learning Rate": 4.773550670255758e-05, "Pretrain/Loss": 2.076956272125244, "Pretrain/Loss (Raw)": 2.145537853240967, "Pretrain/Step": 1549, "Pretrain/Step Time": 8.515342386439443} +{"Pretrain/Learning Rate": 4.773197463747865e-05, "Pretrain/Loss": 2.077510356903076, "Pretrain/Loss (Raw)": 2.230245590209961, "Pretrain/Step": 1550, "Pretrain/Step Time": 8.513814995065331} +{"Pretrain/Learning Rate": 4.772843995084128e-05, "Pretrain/Loss": 2.0771398544311523, "Pretrain/Loss (Raw)": 2.175015687942505, "Pretrain/Step": 1551, "Pretrain/Step Time": 8.52041676454246} +{"Pretrain/Learning Rate": 4.7724902643053116e-05, "Pretrain/Loss": 2.0769259929656982, "Pretrain/Loss (Raw)": 2.105944871902466, "Pretrain/Step": 1552, "Pretrain/Step Time": 8.508487451821566} +{"Pretrain/Learning Rate": 4.77213627145221e-05, "Pretrain/Loss": 2.079555034637451, "Pretrain/Loss (Raw)": 2.3478524684906006, "Pretrain/Step": 1553, "Pretrain/Step Time": 8.501860050484538} +{"Pretrain/Learning Rate": 4.771782016565647e-05, "Pretrain/Loss": 2.079954147338867, "Pretrain/Loss (Raw)": 2.0158064365386963, "Pretrain/Step": 1554, "Pretrain/Step Time": 8.501704767346382} +{"Pretrain/Learning Rate": 4.771427499686477e-05, "Pretrain/Loss": 2.079092502593994, "Pretrain/Loss (Raw)": 1.988338589668274, "Pretrain/Step": 1555, "Pretrain/Step Time": 8.510860929265618} +{"Pretrain/Learning Rate": 4.771072720855584e-05, "Pretrain/Loss": 2.077688217163086, "Pretrain/Loss (Raw)": 2.0766265392303467, "Pretrain/Step": 1556, "Pretrain/Step Time": 8.511207215487957} +{"Pretrain/Learning Rate": 4.770717680113883e-05, "Pretrain/Loss": 2.0711116790771484, "Pretrain/Loss (Raw)": 2.209649085998535, "Pretrain/Step": 1557, "Pretrain/Step Time": 8.520120730623603} +{"Pretrain/Learning Rate": 4.770362377502319e-05, "Pretrain/Loss": 2.070439338684082, "Pretrain/Loss (Raw)": 2.087606430053711, "Pretrain/Step": 1558, "Pretrain/Step Time": 8.519105236977339} +{"Pretrain/Learning Rate": 4.770006813061868e-05, "Pretrain/Loss": 2.06870174407959, "Pretrain/Loss (Raw)": 2.047903299331665, "Pretrain/Step": 1559, "Pretrain/Step Time": 8.516807010397315} +{"Pretrain/Learning Rate": 4.769650986833535e-05, "Pretrain/Loss": 2.068535089492798, "Pretrain/Loss (Raw)": 2.1163864135742188, "Pretrain/Step": 1560, "Pretrain/Step Time": 8.516170272603631} +{"Pretrain/Learning Rate": 4.769294898858354e-05, "Pretrain/Loss": 2.0681416988372803, "Pretrain/Loss (Raw)": 2.093160629272461, "Pretrain/Step": 1561, "Pretrain/Step Time": 8.523914139717817} +{"Pretrain/Learning Rate": 4.768938549177393e-05, "Pretrain/Loss": 2.0665223598480225, "Pretrain/Loss (Raw)": 1.6870275735855103, "Pretrain/Step": 1562, "Pretrain/Step Time": 8.524300830438733} +{"Pretrain/Learning Rate": 4.768581937831746e-05, "Pretrain/Loss": 2.0680956840515137, "Pretrain/Loss (Raw)": 2.2471463680267334, "Pretrain/Step": 1563, "Pretrain/Step Time": 8.52493466064334} +{"Pretrain/Learning Rate": 4.768225064862541e-05, "Pretrain/Loss": 2.069411516189575, "Pretrain/Loss (Raw)": 2.1065073013305664, "Pretrain/Step": 1564, "Pretrain/Step Time": 8.512393048033118} +{"Pretrain/Learning Rate": 4.767867930310933e-05, "Pretrain/Loss": 2.067146062850952, "Pretrain/Loss (Raw)": 2.047314167022705, "Pretrain/Step": 1565, "Pretrain/Step Time": 8.513347556814551} +{"Pretrain/Learning Rate": 4.7675105342181084e-05, "Pretrain/Loss": 2.0666842460632324, "Pretrain/Loss (Raw)": 2.073251724243164, "Pretrain/Step": 1566, "Pretrain/Step Time": 8.50976893119514} +{"Pretrain/Learning Rate": 4.767152876625285e-05, "Pretrain/Loss": 2.0677542686462402, "Pretrain/Loss (Raw)": 2.1027450561523438, "Pretrain/Step": 1567, "Pretrain/Step Time": 8.517414571717381} +{"Pretrain/Learning Rate": 4.766794957573708e-05, "Pretrain/Loss": 2.0665807723999023, "Pretrain/Loss (Raw)": 1.9719072580337524, "Pretrain/Step": 1568, "Pretrain/Step Time": 8.522750452160835} +{"Pretrain/Learning Rate": 4.766436777104655e-05, "Pretrain/Loss": 2.0701639652252197, "Pretrain/Loss (Raw)": 2.154968738555908, "Pretrain/Step": 1569, "Pretrain/Step Time": 8.519976157695055} +{"Pretrain/Learning Rate": 4.766078335259433e-05, "Pretrain/Loss": 2.071667432785034, "Pretrain/Loss (Raw)": 1.9814293384552002, "Pretrain/Step": 1570, "Pretrain/Step Time": 8.52243579365313} +{"Pretrain/Learning Rate": 4.76571963207938e-05, "Pretrain/Loss": 2.0716543197631836, "Pretrain/Loss (Raw)": 2.145148277282715, "Pretrain/Step": 1571, "Pretrain/Step Time": 8.516215585172176} +{"Pretrain/Learning Rate": 4.765360667605861e-05, "Pretrain/Loss": 2.072483539581299, "Pretrain/Loss (Raw)": 2.1395514011383057, "Pretrain/Step": 1572, "Pretrain/Step Time": 8.51605393178761} +{"Pretrain/Learning Rate": 4.765001441880276e-05, "Pretrain/Loss": 2.0707554817199707, "Pretrain/Loss (Raw)": 2.07239031791687, "Pretrain/Step": 1573, "Pretrain/Step Time": 8.527754733338952} +{"Pretrain/Learning Rate": 4.764641954944052e-05, "Pretrain/Loss": 2.0704128742218018, "Pretrain/Loss (Raw)": 1.9934170246124268, "Pretrain/Step": 1574, "Pretrain/Step Time": 8.527634656056762} +{"Pretrain/Learning Rate": 4.764282206838646e-05, "Pretrain/Loss": 2.0677549839019775, "Pretrain/Loss (Raw)": 1.8716081380844116, "Pretrain/Step": 1575, "Pretrain/Step Time": 8.522552384063601} +{"Pretrain/Learning Rate": 4.763922197605547e-05, "Pretrain/Loss": 2.0672008991241455, "Pretrain/Loss (Raw)": 2.046799659729004, "Pretrain/Step": 1576, "Pretrain/Step Time": 8.52085518464446} +{"Pretrain/Learning Rate": 4.763561927286271e-05, "Pretrain/Loss": 2.066631317138672, "Pretrain/Loss (Raw)": 2.1048452854156494, "Pretrain/Step": 1577, "Pretrain/Step Time": 8.519597796723247} +{"Pretrain/Learning Rate": 4.7632013959223684e-05, "Pretrain/Loss": 2.066286087036133, "Pretrain/Loss (Raw)": 2.1782712936401367, "Pretrain/Step": 1578, "Pretrain/Step Time": 8.516518548130989} +{"Pretrain/Learning Rate": 4.7628406035554156e-05, "Pretrain/Loss": 2.068211555480957, "Pretrain/Loss (Raw)": 2.2357287406921387, "Pretrain/Step": 1579, "Pretrain/Step Time": 8.526422843337059} +{"Pretrain/Learning Rate": 4.762479550227022e-05, "Pretrain/Loss": 2.0725479125976562, "Pretrain/Loss (Raw)": 2.575705051422119, "Pretrain/Step": 1580, "Pretrain/Step Time": 8.527868837118149} +{"Pretrain/Learning Rate": 4.762118235978825e-05, "Pretrain/Loss": 2.0748143196105957, "Pretrain/Loss (Raw)": 2.0673043727874756, "Pretrain/Step": 1581, "Pretrain/Step Time": 8.522488137707114} +{"Pretrain/Learning Rate": 4.7617566608524946e-05, "Pretrain/Loss": 2.0759072303771973, "Pretrain/Loss (Raw)": 2.0665342807769775, "Pretrain/Step": 1582, "Pretrain/Step Time": 8.52053557895124} +{"Pretrain/Learning Rate": 4.761394824889727e-05, "Pretrain/Loss": 2.075596332550049, "Pretrain/Loss (Raw)": 2.2609620094299316, "Pretrain/Step": 1583, "Pretrain/Step Time": 8.516171107068658} +{"Pretrain/Learning Rate": 4.761032728132253e-05, "Pretrain/Loss": 2.075019359588623, "Pretrain/Loss (Raw)": 2.0787343978881836, "Pretrain/Step": 1584, "Pretrain/Step Time": 8.513392586261034} +{"Pretrain/Learning Rate": 4.76067037062183e-05, "Pretrain/Loss": 2.075662136077881, "Pretrain/Loss (Raw)": 2.192190170288086, "Pretrain/Step": 1585, "Pretrain/Step Time": 8.521172063425183} +{"Pretrain/Learning Rate": 4.7603077524002474e-05, "Pretrain/Loss": 2.076301097869873, "Pretrain/Loss (Raw)": 2.1402056217193604, "Pretrain/Step": 1586, "Pretrain/Step Time": 8.528573175892234} +{"Pretrain/Learning Rate": 4.759944873509324e-05, "Pretrain/Loss": 2.076134204864502, "Pretrain/Loss (Raw)": 1.9820822477340698, "Pretrain/Step": 1587, "Pretrain/Step Time": 8.527198972180486} +{"Pretrain/Learning Rate": 4.7595817339909086e-05, "Pretrain/Loss": 2.074751615524292, "Pretrain/Loss (Raw)": 2.093245506286621, "Pretrain/Step": 1588, "Pretrain/Step Time": 8.524944089353085} +{"Pretrain/Learning Rate": 4.75921833388688e-05, "Pretrain/Loss": 2.074249505996704, "Pretrain/Loss (Raw)": 2.0465214252471924, "Pretrain/Step": 1589, "Pretrain/Step Time": 8.511535834521055} +{"Pretrain/Learning Rate": 4.758854673239147e-05, "Pretrain/Loss": 2.0750792026519775, "Pretrain/Loss (Raw)": 1.9928885698318481, "Pretrain/Step": 1590, "Pretrain/Step Time": 8.512311479076743} +{"Pretrain/Learning Rate": 4.7584907520896495e-05, "Pretrain/Loss": 2.073990821838379, "Pretrain/Loss (Raw)": 1.8325209617614746, "Pretrain/Step": 1591, "Pretrain/Step Time": 8.515851113945246} +{"Pretrain/Learning Rate": 4.7581265704803554e-05, "Pretrain/Loss": 2.0747172832489014, "Pretrain/Loss (Raw)": 2.1420254707336426, "Pretrain/Step": 1592, "Pretrain/Step Time": 8.514712957665324} +{"Pretrain/Learning Rate": 4.757762128453266e-05, "Pretrain/Loss": 2.0723330974578857, "Pretrain/Loss (Raw)": 1.9019436836242676, "Pretrain/Step": 1593, "Pretrain/Step Time": 8.514722073450685} +{"Pretrain/Learning Rate": 4.757397426050408e-05, "Pretrain/Loss": 2.0727477073669434, "Pretrain/Loss (Raw)": 2.149837017059326, "Pretrain/Step": 1594, "Pretrain/Step Time": 8.508357441052794} +{"Pretrain/Learning Rate": 4.757032463313842e-05, "Pretrain/Loss": 2.0736160278320312, "Pretrain/Loss (Raw)": 2.0292015075683594, "Pretrain/Step": 1595, "Pretrain/Step Time": 8.510850230231881} +{"Pretrain/Learning Rate": 4.756667240285656e-05, "Pretrain/Loss": 2.0735599994659424, "Pretrain/Loss (Raw)": 2.1320278644561768, "Pretrain/Step": 1596, "Pretrain/Step Time": 8.513459011912346} +{"Pretrain/Learning Rate": 4.756301757007971e-05, "Pretrain/Loss": 2.0772545337677, "Pretrain/Loss (Raw)": 2.1980297565460205, "Pretrain/Step": 1597, "Pretrain/Step Time": 8.514630489051342} +{"Pretrain/Learning Rate": 4.755936013522935e-05, "Pretrain/Loss": 2.077514410018921, "Pretrain/Loss (Raw)": 2.0116631984710693, "Pretrain/Step": 1598, "Pretrain/Step Time": 8.517025841400027} +{"Pretrain/Learning Rate": 4.7555700098727276e-05, "Pretrain/Loss": 2.077425003051758, "Pretrain/Loss (Raw)": 2.1501502990722656, "Pretrain/Step": 1599, "Pretrain/Step Time": 8.51374239102006} +{"Pretrain/Learning Rate": 4.755203746099558e-05, "Pretrain/Loss": 2.0769994258880615, "Pretrain/Loss (Raw)": 2.0810258388519287, "Pretrain/Step": 1600, "Pretrain/Step Time": 8.507459864020348} +{"Pretrain/Learning Rate": 4.754837222245666e-05, "Pretrain/Loss": 2.076050281524658, "Pretrain/Loss (Raw)": 2.186614990234375, "Pretrain/Step": 1601, "Pretrain/Step Time": 8.506671188399196} +{"Pretrain/Learning Rate": 4.75447043835332e-05, "Pretrain/Loss": 2.07405424118042, "Pretrain/Loss (Raw)": 2.087164878845215, "Pretrain/Step": 1602, "Pretrain/Step Time": 8.514234226197004} +{"Pretrain/Learning Rate": 4.75410339446482e-05, "Pretrain/Loss": 2.0741920471191406, "Pretrain/Loss (Raw)": 2.1486804485321045, "Pretrain/Step": 1603, "Pretrain/Step Time": 8.510886019095778} +{"Pretrain/Learning Rate": 4.753736090622494e-05, "Pretrain/Loss": 2.076267719268799, "Pretrain/Loss (Raw)": 2.117678642272949, "Pretrain/Step": 1604, "Pretrain/Step Time": 8.512797549366951} +{"Pretrain/Learning Rate": 4.753368526868703e-05, "Pretrain/Loss": 2.075378894805908, "Pretrain/Loss (Raw)": 1.8547875881195068, "Pretrain/Step": 1605, "Pretrain/Step Time": 8.511641446501017} +{"Pretrain/Learning Rate": 4.753000703245834e-05, "Pretrain/Loss": 2.0760672092437744, "Pretrain/Loss (Raw)": 2.1339986324310303, "Pretrain/Step": 1606, "Pretrain/Step Time": 8.500436328351498} +{"Pretrain/Learning Rate": 4.752632619796309e-05, "Pretrain/Loss": 2.076850414276123, "Pretrain/Loss (Raw)": 2.208081007003784, "Pretrain/Step": 1607, "Pretrain/Step Time": 8.504743043333292} +{"Pretrain/Learning Rate": 4.752264276562575e-05, "Pretrain/Loss": 2.076713800430298, "Pretrain/Loss (Raw)": 2.225282669067383, "Pretrain/Step": 1608, "Pretrain/Step Time": 8.502722157165408} +{"Pretrain/Learning Rate": 4.751895673587111e-05, "Pretrain/Loss": 2.0778603553771973, "Pretrain/Loss (Raw)": 2.1015918254852295, "Pretrain/Step": 1609, "Pretrain/Step Time": 8.50397614389658} +{"Pretrain/Learning Rate": 4.751526810912427e-05, "Pretrain/Loss": 2.0771989822387695, "Pretrain/Loss (Raw)": 2.014528751373291, "Pretrain/Step": 1610, "Pretrain/Step Time": 8.503100564703345} +{"Pretrain/Learning Rate": 4.751157688581062e-05, "Pretrain/Loss": 2.0751113891601562, "Pretrain/Loss (Raw)": 1.9733351469039917, "Pretrain/Step": 1611, "Pretrain/Step Time": 8.499403279274702} +{"Pretrain/Learning Rate": 4.750788306635584e-05, "Pretrain/Loss": 2.0745010375976562, "Pretrain/Loss (Raw)": 2.085838556289673, "Pretrain/Step": 1612, "Pretrain/Step Time": 8.490998828783631} +{"Pretrain/Learning Rate": 4.7504186651185926e-05, "Pretrain/Loss": 2.0762014389038086, "Pretrain/Loss (Raw)": 2.1565399169921875, "Pretrain/Step": 1613, "Pretrain/Step Time": 8.491869071498513} +{"Pretrain/Learning Rate": 4.7500487640727165e-05, "Pretrain/Loss": 2.0758395195007324, "Pretrain/Loss (Raw)": 1.9741929769515991, "Pretrain/Step": 1614, "Pretrain/Step Time": 8.508965861052275} +{"Pretrain/Learning Rate": 4.7496786035406144e-05, "Pretrain/Loss": 2.076380729675293, "Pretrain/Loss (Raw)": 2.0846593379974365, "Pretrain/Step": 1615, "Pretrain/Step Time": 8.506332758814096} +{"Pretrain/Learning Rate": 4.749308183564974e-05, "Pretrain/Loss": 2.0763661861419678, "Pretrain/Loss (Raw)": 1.983898639678955, "Pretrain/Step": 1616, "Pretrain/Step Time": 8.507894612848759} +{"Pretrain/Learning Rate": 4.748937504188517e-05, "Pretrain/Loss": 2.0768051147460938, "Pretrain/Loss (Raw)": 2.13136887550354, "Pretrain/Step": 1617, "Pretrain/Step Time": 8.513928577303886} +{"Pretrain/Learning Rate": 4.748566565453988e-05, "Pretrain/Loss": 2.0747628211975098, "Pretrain/Loss (Raw)": 1.7864316701889038, "Pretrain/Step": 1618, "Pretrain/Step Time": 8.503188295289874} +{"Pretrain/Learning Rate": 4.748195367404167e-05, "Pretrain/Loss": 2.072841167449951, "Pretrain/Loss (Raw)": 1.9090481996536255, "Pretrain/Step": 1619, "Pretrain/Step Time": 8.503779169172049} +{"Pretrain/Learning Rate": 4.747823910081863e-05, "Pretrain/Loss": 2.0732293128967285, "Pretrain/Loss (Raw)": 2.1673855781555176, "Pretrain/Step": 1620, "Pretrain/Step Time": 8.50333402492106} +{"Pretrain/Learning Rate": 4.747452193529913e-05, "Pretrain/Loss": 2.0743231773376465, "Pretrain/Loss (Raw)": 2.113823175430298, "Pretrain/Step": 1621, "Pretrain/Step Time": 8.513459092006087} +{"Pretrain/Learning Rate": 4.747080217791187e-05, "Pretrain/Loss": 2.073652982711792, "Pretrain/Loss (Raw)": 1.9476603269577026, "Pretrain/Step": 1622, "Pretrain/Step Time": 8.511468786746264} +{"Pretrain/Learning Rate": 4.7467079829085804e-05, "Pretrain/Loss": 2.0717244148254395, "Pretrain/Loss (Raw)": 2.223632335662842, "Pretrain/Step": 1623, "Pretrain/Step Time": 8.508902063593268} +{"Pretrain/Learning Rate": 4.746335488925022e-05, "Pretrain/Loss": 2.0726354122161865, "Pretrain/Loss (Raw)": 2.1860756874084473, "Pretrain/Step": 1624, "Pretrain/Step Time": 8.4992965888232} +{"Pretrain/Learning Rate": 4.7459627358834716e-05, "Pretrain/Loss": 2.073315143585205, "Pretrain/Loss (Raw)": 2.147221803665161, "Pretrain/Step": 1625, "Pretrain/Step Time": 8.50562559068203} +{"Pretrain/Learning Rate": 4.7455897238269134e-05, "Pretrain/Loss": 2.073866605758667, "Pretrain/Loss (Raw)": 2.1166741847991943, "Pretrain/Step": 1626, "Pretrain/Step Time": 8.50982329621911} +{"Pretrain/Learning Rate": 4.745216452798368e-05, "Pretrain/Loss": 2.0728044509887695, "Pretrain/Loss (Raw)": 2.0712392330169678, "Pretrain/Step": 1627, "Pretrain/Step Time": 8.51118510775268} +{"Pretrain/Learning Rate": 4.744842922840881e-05, "Pretrain/Loss": 2.073434352874756, "Pretrain/Loss (Raw)": 2.120256185531616, "Pretrain/Step": 1628, "Pretrain/Step Time": 8.510911216959357} +{"Pretrain/Learning Rate": 4.74446913399753e-05, "Pretrain/Loss": 2.073744297027588, "Pretrain/Loss (Raw)": 2.1421988010406494, "Pretrain/Step": 1629, "Pretrain/Step Time": 8.500476205721498} +{"Pretrain/Learning Rate": 4.744095086311422e-05, "Pretrain/Loss": 2.07366681098938, "Pretrain/Loss (Raw)": 2.0996804237365723, "Pretrain/Step": 1630, "Pretrain/Step Time": 8.495867758989334} +{"Pretrain/Learning Rate": 4.743720779825694e-05, "Pretrain/Loss": 2.0722339153289795, "Pretrain/Loss (Raw)": 1.860935926437378, "Pretrain/Step": 1631, "Pretrain/Step Time": 8.499547133222222} +{"Pretrain/Learning Rate": 4.743346214583514e-05, "Pretrain/Loss": 2.071383237838745, "Pretrain/Loss (Raw)": 1.8499888181686401, "Pretrain/Step": 1632, "Pretrain/Step Time": 8.507831234484911} +{"Pretrain/Learning Rate": 4.742971390628076e-05, "Pretrain/Loss": 2.0711278915405273, "Pretrain/Loss (Raw)": 1.9940341711044312, "Pretrain/Step": 1633, "Pretrain/Step Time": 8.512813795357943} +{"Pretrain/Learning Rate": 4.742596308002609e-05, "Pretrain/Loss": 2.0708866119384766, "Pretrain/Loss (Raw)": 2.1697731018066406, "Pretrain/Step": 1634, "Pretrain/Step Time": 8.515184780582786} +{"Pretrain/Learning Rate": 4.742220966750368e-05, "Pretrain/Loss": 2.0704894065856934, "Pretrain/Loss (Raw)": 2.052572727203369, "Pretrain/Step": 1635, "Pretrain/Step Time": 8.500769030302763} +{"Pretrain/Learning Rate": 4.7418453669146404e-05, "Pretrain/Loss": 2.07102108001709, "Pretrain/Loss (Raw)": 2.2014715671539307, "Pretrain/Step": 1636, "Pretrain/Step Time": 8.501804335042834} +{"Pretrain/Learning Rate": 4.74146950853874e-05, "Pretrain/Loss": 2.0700864791870117, "Pretrain/Loss (Raw)": 1.888681411743164, "Pretrain/Step": 1637, "Pretrain/Step Time": 8.506476175040007} +{"Pretrain/Learning Rate": 4.741093391666014e-05, "Pretrain/Loss": 2.0701546669006348, "Pretrain/Loss (Raw)": 2.1170005798339844, "Pretrain/Step": 1638, "Pretrain/Step Time": 8.512041963636875} +{"Pretrain/Learning Rate": 4.7407170163398375e-05, "Pretrain/Loss": 2.0695438385009766, "Pretrain/Loss (Raw)": 2.092924118041992, "Pretrain/Step": 1639, "Pretrain/Step Time": 8.514266716316342} +{"Pretrain/Learning Rate": 4.740340382603616e-05, "Pretrain/Loss": 2.0689823627471924, "Pretrain/Loss (Raw)": 2.047140121459961, "Pretrain/Step": 1640, "Pretrain/Step Time": 8.509859444573522} +{"Pretrain/Learning Rate": 4.739963490500785e-05, "Pretrain/Loss": 2.0708322525024414, "Pretrain/Loss (Raw)": 1.9985545873641968, "Pretrain/Step": 1641, "Pretrain/Step Time": 8.499589636921883} +{"Pretrain/Learning Rate": 4.7395863400748096e-05, "Pretrain/Loss": 2.0714428424835205, "Pretrain/Loss (Raw)": 2.102975845336914, "Pretrain/Step": 1642, "Pretrain/Step Time": 8.501284595578909} +{"Pretrain/Learning Rate": 4.7392089313691835e-05, "Pretrain/Loss": 2.075047492980957, "Pretrain/Loss (Raw)": 2.2567126750946045, "Pretrain/Step": 1643, "Pretrain/Step Time": 8.507623225450516} +{"Pretrain/Learning Rate": 4.738831264427432e-05, "Pretrain/Loss": 2.0758514404296875, "Pretrain/Loss (Raw)": 2.190812587738037, "Pretrain/Step": 1644, "Pretrain/Step Time": 8.511972213163972} +{"Pretrain/Learning Rate": 4.73845333929311e-05, "Pretrain/Loss": 2.0763187408447266, "Pretrain/Loss (Raw)": 2.03845477104187, "Pretrain/Step": 1645, "Pretrain/Step Time": 8.515415597707033} +{"Pretrain/Learning Rate": 4.738075156009801e-05, "Pretrain/Loss": 2.0786542892456055, "Pretrain/Loss (Raw)": 2.2364416122436523, "Pretrain/Step": 1646, "Pretrain/Step Time": 8.517448350787163} +{"Pretrain/Learning Rate": 4.737696714621118e-05, "Pretrain/Loss": 2.081070899963379, "Pretrain/Loss (Raw)": 2.2156131267547607, "Pretrain/Step": 1647, "Pretrain/Step Time": 8.507809611037374} +{"Pretrain/Learning Rate": 4.7373180151707065e-05, "Pretrain/Loss": 2.0823028087615967, "Pretrain/Loss (Raw)": 2.027430534362793, "Pretrain/Step": 1648, "Pretrain/Step Time": 8.50814956985414} +{"Pretrain/Learning Rate": 4.7369390577022385e-05, "Pretrain/Loss": 2.082700729370117, "Pretrain/Loss (Raw)": 1.9238934516906738, "Pretrain/Step": 1649, "Pretrain/Step Time": 8.5105139631778} +{"Pretrain/Learning Rate": 4.736559842259417e-05, "Pretrain/Loss": 2.083693265914917, "Pretrain/Loss (Raw)": 2.1749114990234375, "Pretrain/Step": 1650, "Pretrain/Step Time": 8.519553139805794} +{"Pretrain/Learning Rate": 4.736180368885976e-05, "Pretrain/Loss": 2.08484148979187, "Pretrain/Loss (Raw)": 2.0150513648986816, "Pretrain/Step": 1651, "Pretrain/Step Time": 8.52117583155632} +{"Pretrain/Learning Rate": 4.735800637625678e-05, "Pretrain/Loss": 2.0846071243286133, "Pretrain/Loss (Raw)": 2.0833346843719482, "Pretrain/Step": 1652, "Pretrain/Step Time": 8.522680485621095} +{"Pretrain/Learning Rate": 4.735420648522314e-05, "Pretrain/Loss": 2.0870490074157715, "Pretrain/Loss (Raw)": 2.195467710494995, "Pretrain/Step": 1653, "Pretrain/Step Time": 8.51320731639862} +{"Pretrain/Learning Rate": 4.7350404016197083e-05, "Pretrain/Loss": 2.0914931297302246, "Pretrain/Loss (Raw)": 2.4222960472106934, "Pretrain/Step": 1654, "Pretrain/Step Time": 8.513173619285226} +{"Pretrain/Learning Rate": 4.734659896961711e-05, "Pretrain/Loss": 2.0902023315429688, "Pretrain/Loss (Raw)": 2.1931235790252686, "Pretrain/Step": 1655, "Pretrain/Step Time": 8.519048945978284} +{"Pretrain/Learning Rate": 4.734279134592204e-05, "Pretrain/Loss": 2.0909926891326904, "Pretrain/Loss (Raw)": 2.1152586936950684, "Pretrain/Step": 1656, "Pretrain/Step Time": 8.528817193582654} +{"Pretrain/Learning Rate": 4.7338981145550994e-05, "Pretrain/Loss": 2.091142177581787, "Pretrain/Loss (Raw)": 2.004687547683716, "Pretrain/Step": 1657, "Pretrain/Step Time": 8.526293667033315} +{"Pretrain/Learning Rate": 4.7335168368943374e-05, "Pretrain/Loss": 2.0916621685028076, "Pretrain/Loss (Raw)": 2.171696424484253, "Pretrain/Step": 1658, "Pretrain/Step Time": 8.518584376201034} +{"Pretrain/Learning Rate": 4.733135301653889e-05, "Pretrain/Loss": 2.0905933380126953, "Pretrain/Loss (Raw)": 1.932326078414917, "Pretrain/Step": 1659, "Pretrain/Step Time": 8.519388346001506} +{"Pretrain/Learning Rate": 4.732753508877755e-05, "Pretrain/Loss": 2.0905842781066895, "Pretrain/Loss (Raw)": 2.19686222076416, "Pretrain/Step": 1660, "Pretrain/Step Time": 8.514158867299557} +{"Pretrain/Learning Rate": 4.732371458609966e-05, "Pretrain/Loss": 2.091221809387207, "Pretrain/Loss (Raw)": 1.9709550142288208, "Pretrain/Step": 1661, "Pretrain/Step Time": 8.519379733130336} +{"Pretrain/Learning Rate": 4.73198915089458e-05, "Pretrain/Loss": 2.091372489929199, "Pretrain/Loss (Raw)": 2.0848944187164307, "Pretrain/Step": 1662, "Pretrain/Step Time": 8.530255427584052} +{"Pretrain/Learning Rate": 4.731606585775689e-05, "Pretrain/Loss": 2.088754177093506, "Pretrain/Loss (Raw)": 2.054863929748535, "Pretrain/Step": 1663, "Pretrain/Step Time": 8.530273327603936} +{"Pretrain/Learning Rate": 4.731223763297409e-05, "Pretrain/Loss": 2.086782932281494, "Pretrain/Loss (Raw)": 2.0577445030212402, "Pretrain/Step": 1664, "Pretrain/Step Time": 8.528239818289876} +{"Pretrain/Learning Rate": 4.730840683503892e-05, "Pretrain/Loss": 2.0904102325439453, "Pretrain/Loss (Raw)": 2.0784826278686523, "Pretrain/Step": 1665, "Pretrain/Step Time": 8.52114918269217} +{"Pretrain/Learning Rate": 4.730457346439315e-05, "Pretrain/Loss": 2.0878443717956543, "Pretrain/Loss (Raw)": 2.015622854232788, "Pretrain/Step": 1666, "Pretrain/Step Time": 8.516363952308893} +{"Pretrain/Learning Rate": 4.7300737521478863e-05, "Pretrain/Loss": 2.0872206687927246, "Pretrain/Loss (Raw)": 2.123652935028076, "Pretrain/Step": 1667, "Pretrain/Step Time": 8.517336627468467} +{"Pretrain/Learning Rate": 4.729689900673845e-05, "Pretrain/Loss": 2.085400104522705, "Pretrain/Loss (Raw)": 1.9787076711654663, "Pretrain/Step": 1668, "Pretrain/Step Time": 8.518007155507803} +{"Pretrain/Learning Rate": 4.729305792061457e-05, "Pretrain/Loss": 2.085310935974121, "Pretrain/Loss (Raw)": 1.9823886156082153, "Pretrain/Step": 1669, "Pretrain/Step Time": 8.525781689211726} +{"Pretrain/Learning Rate": 4.72892142635502e-05, "Pretrain/Loss": 2.0837621688842773, "Pretrain/Loss (Raw)": 1.9648234844207764, "Pretrain/Step": 1670, "Pretrain/Step Time": 8.520670706406236} +{"Pretrain/Learning Rate": 4.728536803598862e-05, "Pretrain/Loss": 2.0847859382629395, "Pretrain/Loss (Raw)": 2.1578309535980225, "Pretrain/Step": 1671, "Pretrain/Step Time": 8.51133551262319} +{"Pretrain/Learning Rate": 4.728151923837337e-05, "Pretrain/Loss": 2.0821259021759033, "Pretrain/Loss (Raw)": 1.7389923334121704, "Pretrain/Step": 1672, "Pretrain/Step Time": 8.508720504119992} +{"Pretrain/Learning Rate": 4.727766787114835e-05, "Pretrain/Loss": 2.0825624465942383, "Pretrain/Loss (Raw)": 2.0554840564727783, "Pretrain/Step": 1673, "Pretrain/Step Time": 8.520864300429821} +{"Pretrain/Learning Rate": 4.727381393475767e-05, "Pretrain/Loss": 2.0848207473754883, "Pretrain/Loss (Raw)": 2.2567927837371826, "Pretrain/Step": 1674, "Pretrain/Step Time": 8.520565066486597} +{"Pretrain/Learning Rate": 4.726995742964583e-05, "Pretrain/Loss": 2.085820436477661, "Pretrain/Loss (Raw)": 2.0785372257232666, "Pretrain/Step": 1675, "Pretrain/Step Time": 8.522084683179855} +{"Pretrain/Learning Rate": 4.726609835625755e-05, "Pretrain/Loss": 2.0857653617858887, "Pretrain/Loss (Raw)": 2.1832613945007324, "Pretrain/Step": 1676, "Pretrain/Step Time": 8.518398482352495} +{"Pretrain/Learning Rate": 4.726223671503789e-05, "Pretrain/Loss": 2.085378646850586, "Pretrain/Loss (Raw)": 2.0960733890533447, "Pretrain/Step": 1677, "Pretrain/Step Time": 8.505196142941713} +{"Pretrain/Learning Rate": 4.725837250643218e-05, "Pretrain/Loss": 2.0861620903015137, "Pretrain/Loss (Raw)": 2.330496311187744, "Pretrain/Step": 1678, "Pretrain/Step Time": 8.512023318558931} +{"Pretrain/Learning Rate": 4.7254505730886075e-05, "Pretrain/Loss": 2.084688186645508, "Pretrain/Loss (Raw)": 1.9863756895065308, "Pretrain/Step": 1679, "Pretrain/Step Time": 8.512891443446279} +{"Pretrain/Learning Rate": 4.725063638884551e-05, "Pretrain/Loss": 2.0846943855285645, "Pretrain/Loss (Raw)": 2.1067311763763428, "Pretrain/Step": 1680, "Pretrain/Step Time": 8.514324340969324} +{"Pretrain/Learning Rate": 4.724676448075669e-05, "Pretrain/Loss": 2.082406520843506, "Pretrain/Loss (Raw)": 2.0550031661987305, "Pretrain/Step": 1681, "Pretrain/Step Time": 8.5163599178195} +{"Pretrain/Learning Rate": 4.724289000706617e-05, "Pretrain/Loss": 2.0813064575195312, "Pretrain/Loss (Raw)": 1.8749884366989136, "Pretrain/Step": 1682, "Pretrain/Step Time": 8.512472156435251} +{"Pretrain/Learning Rate": 4.723901296822076e-05, "Pretrain/Loss": 2.081989288330078, "Pretrain/Loss (Raw)": 2.0757429599761963, "Pretrain/Step": 1683, "Pretrain/Step Time": 8.502067303285003} +{"Pretrain/Learning Rate": 4.723513336466759e-05, "Pretrain/Loss": 2.081312894821167, "Pretrain/Loss (Raw)": 1.9900522232055664, "Pretrain/Step": 1684, "Pretrain/Step Time": 8.502876736223698} +{"Pretrain/Learning Rate": 4.723125119685405e-05, "Pretrain/Loss": 2.080186605453491, "Pretrain/Loss (Raw)": 2.0654799938201904, "Pretrain/Step": 1685, "Pretrain/Step Time": 8.501240085810423} +{"Pretrain/Learning Rate": 4.722736646522788e-05, "Pretrain/Loss": 2.080660820007324, "Pretrain/Loss (Raw)": 2.1483311653137207, "Pretrain/Step": 1686, "Pretrain/Step Time": 8.501246927306056} +{"Pretrain/Learning Rate": 4.722347917023706e-05, "Pretrain/Loss": 2.0809779167175293, "Pretrain/Loss (Raw)": 2.0884575843811035, "Pretrain/Step": 1687, "Pretrain/Step Time": 8.506628071889281} +{"Pretrain/Learning Rate": 4.72195893123299e-05, "Pretrain/Loss": 2.079432487487793, "Pretrain/Loss (Raw)": 1.9185774326324463, "Pretrain/Step": 1688, "Pretrain/Step Time": 8.501924760639668} +{"Pretrain/Learning Rate": 4.7215696891955006e-05, "Pretrain/Loss": 2.0795722007751465, "Pretrain/Loss (Raw)": 2.1110572814941406, "Pretrain/Step": 1689, "Pretrain/Step Time": 8.500309580937028} +{"Pretrain/Learning Rate": 4.721180190956126e-05, "Pretrain/Loss": 2.082425355911255, "Pretrain/Loss (Raw)": 2.052213430404663, "Pretrain/Step": 1690, "Pretrain/Step Time": 8.498514795675874} +{"Pretrain/Learning Rate": 4.7207904365597855e-05, "Pretrain/Loss": 2.0815086364746094, "Pretrain/Loss (Raw)": 2.1298067569732666, "Pretrain/Step": 1691, "Pretrain/Step Time": 8.504081977531314} +{"Pretrain/Learning Rate": 4.720400426051427e-05, "Pretrain/Loss": 2.0809874534606934, "Pretrain/Loss (Raw)": 2.039783477783203, "Pretrain/Step": 1692, "Pretrain/Step Time": 8.510757844895124} +{"Pretrain/Learning Rate": 4.720010159476028e-05, "Pretrain/Loss": 2.0790414810180664, "Pretrain/Loss (Raw)": 1.7982558012008667, "Pretrain/Step": 1693, "Pretrain/Step Time": 8.50992538407445} +{"Pretrain/Learning Rate": 4.719619636878597e-05, "Pretrain/Loss": 2.078824996948242, "Pretrain/Loss (Raw)": 2.0455241203308105, "Pretrain/Step": 1694, "Pretrain/Step Time": 8.50522325746715} +{"Pretrain/Learning Rate": 4.71922885830417e-05, "Pretrain/Loss": 2.079378843307495, "Pretrain/Loss (Raw)": 2.1736485958099365, "Pretrain/Step": 1695, "Pretrain/Step Time": 8.499964892864227} +{"Pretrain/Learning Rate": 4.718837823797814e-05, "Pretrain/Loss": 2.0799338817596436, "Pretrain/Loss (Raw)": 2.0429344177246094, "Pretrain/Step": 1696, "Pretrain/Step Time": 8.497845478355885} +{"Pretrain/Learning Rate": 4.7184465334046246e-05, "Pretrain/Loss": 2.077162504196167, "Pretrain/Loss (Raw)": 1.800234317779541, "Pretrain/Step": 1697, "Pretrain/Step Time": 8.505843421444297} +{"Pretrain/Learning Rate": 4.718054987169727e-05, "Pretrain/Loss": 2.077655553817749, "Pretrain/Loss (Raw)": 2.044544219970703, "Pretrain/Step": 1698, "Pretrain/Step Time": 8.503912381827831} +{"Pretrain/Learning Rate": 4.717663185138276e-05, "Pretrain/Loss": 2.0765137672424316, "Pretrain/Loss (Raw)": 1.9990241527557373, "Pretrain/Step": 1699, "Pretrain/Step Time": 8.508418722078204} +{"Pretrain/Learning Rate": 4.7172711273554576e-05, "Pretrain/Loss": 2.0765366554260254, "Pretrain/Loss (Raw)": 2.1424787044525146, "Pretrain/Step": 1700, "Pretrain/Step Time": 8.505287125706673} +{"Pretrain/Learning Rate": 4.7168788138664845e-05, "Pretrain/Loss": 2.0768518447875977, "Pretrain/Loss (Raw)": 2.1126980781555176, "Pretrain/Step": 1701, "Pretrain/Step Time": 8.493645252659917} +{"Pretrain/Learning Rate": 4.7164862447165995e-05, "Pretrain/Loss": 2.076531171798706, "Pretrain/Loss (Raw)": 1.9523875713348389, "Pretrain/Step": 1702, "Pretrain/Step Time": 8.500330984592438} +{"Pretrain/Learning Rate": 4.716093419951077e-05, "Pretrain/Loss": 2.0787558555603027, "Pretrain/Loss (Raw)": 2.1563680171966553, "Pretrain/Step": 1703, "Pretrain/Step Time": 8.499962121248245} +{"Pretrain/Learning Rate": 4.7157003396152184e-05, "Pretrain/Loss": 2.079341411590576, "Pretrain/Loss (Raw)": 2.12172269821167, "Pretrain/Step": 1704, "Pretrain/Step Time": 8.50324185565114} +{"Pretrain/Learning Rate": 4.715307003754356e-05, "Pretrain/Loss": 2.0796098709106445, "Pretrain/Loss (Raw)": 2.1392247676849365, "Pretrain/Step": 1705, "Pretrain/Step Time": 8.502641143277287} +{"Pretrain/Learning Rate": 4.714913412413851e-05, "Pretrain/Loss": 2.079920768737793, "Pretrain/Loss (Raw)": 2.2180771827697754, "Pretrain/Step": 1706, "Pretrain/Step Time": 8.501703659072518} +{"Pretrain/Learning Rate": 4.714519565639095e-05, "Pretrain/Loss": 2.0788450241088867, "Pretrain/Loss (Raw)": 2.098039388656616, "Pretrain/Step": 1707, "Pretrain/Step Time": 8.489604070782661} +{"Pretrain/Learning Rate": 4.714125463475506e-05, "Pretrain/Loss": 2.0752782821655273, "Pretrain/Loss (Raw)": 2.119169235229492, "Pretrain/Step": 1708, "Pretrain/Step Time": 8.495683073997498} +{"Pretrain/Learning Rate": 4.713731105968536e-05, "Pretrain/Loss": 2.077519416809082, "Pretrain/Loss (Raw)": 2.3541574478149414, "Pretrain/Step": 1709, "Pretrain/Step Time": 8.499998638406396} +{"Pretrain/Learning Rate": 4.7133364931636644e-05, "Pretrain/Loss": 2.078535556793213, "Pretrain/Loss (Raw)": 2.196584701538086, "Pretrain/Step": 1710, "Pretrain/Step Time": 8.500164311379194} +{"Pretrain/Learning Rate": 4.712941625106398e-05, "Pretrain/Loss": 2.076939105987549, "Pretrain/Loss (Raw)": 2.056624174118042, "Pretrain/Step": 1711, "Pretrain/Step Time": 8.50517156533897} +{"Pretrain/Learning Rate": 4.7125465018422755e-05, "Pretrain/Loss": 2.076376438140869, "Pretrain/Loss (Raw)": 2.0066916942596436, "Pretrain/Step": 1712, "Pretrain/Step Time": 8.500460287556052} +{"Pretrain/Learning Rate": 4.7121511234168644e-05, "Pretrain/Loss": 2.0757362842559814, "Pretrain/Loss (Raw)": 2.1102640628814697, "Pretrain/Step": 1713, "Pretrain/Step Time": 8.49145695194602} +{"Pretrain/Learning Rate": 4.711755489875762e-05, "Pretrain/Loss": 2.0756654739379883, "Pretrain/Loss (Raw)": 2.1311473846435547, "Pretrain/Step": 1714, "Pretrain/Step Time": 8.49852054938674} +{"Pretrain/Learning Rate": 4.711359601264594e-05, "Pretrain/Loss": 2.0760562419891357, "Pretrain/Loss (Raw)": 2.0321156978607178, "Pretrain/Step": 1715, "Pretrain/Step Time": 8.506407096982002} +{"Pretrain/Learning Rate": 4.7109634576290175e-05, "Pretrain/Loss": 2.0752289295196533, "Pretrain/Loss (Raw)": 1.9873502254486084, "Pretrain/Step": 1716, "Pretrain/Step Time": 8.505390906706452} +{"Pretrain/Learning Rate": 4.710567059014716e-05, "Pretrain/Loss": 2.0758092403411865, "Pretrain/Loss (Raw)": 2.120786666870117, "Pretrain/Step": 1717, "Pretrain/Step Time": 8.510485725477338} +{"Pretrain/Learning Rate": 4.710170405467405e-05, "Pretrain/Loss": 2.0763139724731445, "Pretrain/Loss (Raw)": 2.0574984550476074, "Pretrain/Step": 1718, "Pretrain/Step Time": 8.502564739435911} +{"Pretrain/Learning Rate": 4.709773497032828e-05, "Pretrain/Loss": 2.0794713497161865, "Pretrain/Loss (Raw)": 2.2366507053375244, "Pretrain/Step": 1719, "Pretrain/Step Time": 8.49953737296164} +{"Pretrain/Learning Rate": 4.7093763337567585e-05, "Pretrain/Loss": 2.07975172996521, "Pretrain/Loss (Raw)": 2.1779215335845947, "Pretrain/Step": 1720, "Pretrain/Step Time": 8.500207625329494} +{"Pretrain/Learning Rate": 4.708978915685e-05, "Pretrain/Loss": 2.0828464031219482, "Pretrain/Loss (Raw)": 2.2980639934539795, "Pretrain/Step": 1721, "Pretrain/Step Time": 8.505722973495722} +{"Pretrain/Learning Rate": 4.708581242863382e-05, "Pretrain/Loss": 2.0828771591186523, "Pretrain/Loss (Raw)": 2.153782844543457, "Pretrain/Step": 1722, "Pretrain/Step Time": 8.512058088555932} +{"Pretrain/Learning Rate": 4.7081833153377694e-05, "Pretrain/Loss": 2.0836873054504395, "Pretrain/Loss (Raw)": 2.1329123973846436, "Pretrain/Step": 1723, "Pretrain/Step Time": 8.510868964716792} +{"Pretrain/Learning Rate": 4.707785133154051e-05, "Pretrain/Loss": 2.0824460983276367, "Pretrain/Loss (Raw)": 1.9731489419937134, "Pretrain/Step": 1724, "Pretrain/Step Time": 8.50383461266756} +{"Pretrain/Learning Rate": 4.707386696358148e-05, "Pretrain/Loss": 2.0812954902648926, "Pretrain/Loss (Raw)": 2.0507426261901855, "Pretrain/Step": 1725, "Pretrain/Step Time": 8.500270219519734} +{"Pretrain/Learning Rate": 4.7069880049960104e-05, "Pretrain/Loss": 2.0804481506347656, "Pretrain/Loss (Raw)": 1.9032000303268433, "Pretrain/Step": 1726, "Pretrain/Step Time": 8.505796793848276} +{"Pretrain/Learning Rate": 4.7065890591136154e-05, "Pretrain/Loss": 2.079683780670166, "Pretrain/Loss (Raw)": 2.052325963973999, "Pretrain/Step": 1727, "Pretrain/Step Time": 8.50812910683453} +{"Pretrain/Learning Rate": 4.706189858756972e-05, "Pretrain/Loss": 2.0802724361419678, "Pretrain/Loss (Raw)": 2.15635085105896, "Pretrain/Step": 1728, "Pretrain/Step Time": 8.514481542631984} +{"Pretrain/Learning Rate": 4.705790403972119e-05, "Pretrain/Loss": 2.07781982421875, "Pretrain/Loss (Raw)": 1.8726826906204224, "Pretrain/Step": 1729, "Pretrain/Step Time": 8.51626923494041} +{"Pretrain/Learning Rate": 4.705390694805122e-05, "Pretrain/Loss": 2.0777862071990967, "Pretrain/Loss (Raw)": 2.082888126373291, "Pretrain/Step": 1730, "Pretrain/Step Time": 8.50628349930048} +{"Pretrain/Learning Rate": 4.704990731302078e-05, "Pretrain/Loss": 2.0738275051116943, "Pretrain/Loss (Raw)": 1.6419627666473389, "Pretrain/Step": 1731, "Pretrain/Step Time": 8.50672466121614} +{"Pretrain/Learning Rate": 4.7045905135091126e-05, "Pretrain/Loss": 2.0730438232421875, "Pretrain/Loss (Raw)": 2.0173604488372803, "Pretrain/Step": 1732, "Pretrain/Step Time": 8.509889263659716} +{"Pretrain/Learning Rate": 4.704190041472381e-05, "Pretrain/Loss": 2.075774669647217, "Pretrain/Loss (Raw)": 2.2043235301971436, "Pretrain/Step": 1733, "Pretrain/Step Time": 8.517029229551554} +{"Pretrain/Learning Rate": 4.703789315238067e-05, "Pretrain/Loss": 2.075012445449829, "Pretrain/Loss (Raw)": 2.036454439163208, "Pretrain/Step": 1734, "Pretrain/Step Time": 8.520998645573854} +{"Pretrain/Learning Rate": 4.703388334852385e-05, "Pretrain/Loss": 2.0737648010253906, "Pretrain/Loss (Raw)": 2.048386573791504, "Pretrain/Step": 1735, "Pretrain/Step Time": 8.513792745769024} +{"Pretrain/Learning Rate": 4.7029871003615776e-05, "Pretrain/Loss": 2.0719799995422363, "Pretrain/Loss (Raw)": 1.9968310594558716, "Pretrain/Step": 1736, "Pretrain/Step Time": 8.514234522357583} +{"Pretrain/Learning Rate": 4.7025856118119164e-05, "Pretrain/Loss": 2.0701866149902344, "Pretrain/Loss (Raw)": 1.8720448017120361, "Pretrain/Step": 1737, "Pretrain/Step Time": 8.512388801202178} +{"Pretrain/Learning Rate": 4.7021838692497046e-05, "Pretrain/Loss": 2.0683059692382812, "Pretrain/Loss (Raw)": 1.7737773656845093, "Pretrain/Step": 1738, "Pretrain/Step Time": 8.518103152513504} +{"Pretrain/Learning Rate": 4.70178187272127e-05, "Pretrain/Loss": 2.068669319152832, "Pretrain/Loss (Raw)": 2.0198707580566406, "Pretrain/Step": 1739, "Pretrain/Step Time": 8.521471925079823} +{"Pretrain/Learning Rate": 4.701379622272977e-05, "Pretrain/Loss": 2.0692074298858643, "Pretrain/Loss (Raw)": 2.15468692779541, "Pretrain/Step": 1740, "Pretrain/Step Time": 8.522423474118114} +{"Pretrain/Learning Rate": 4.700977117951211e-05, "Pretrain/Loss": 2.068160057067871, "Pretrain/Loss (Raw)": 2.0225024223327637, "Pretrain/Step": 1741, "Pretrain/Step Time": 8.522705199196935} +{"Pretrain/Learning Rate": 4.700574359802393e-05, "Pretrain/Loss": 2.0673911571502686, "Pretrain/Loss (Raw)": 1.8757522106170654, "Pretrain/Step": 1742, "Pretrain/Step Time": 8.508168192580342} +{"Pretrain/Learning Rate": 4.700171347872971e-05, "Pretrain/Loss": 2.067904472351074, "Pretrain/Loss (Raw)": 2.1503968238830566, "Pretrain/Step": 1743, "Pretrain/Step Time": 8.510682065039873} +{"Pretrain/Learning Rate": 4.699768082209421e-05, "Pretrain/Loss": 2.0691006183624268, "Pretrain/Loss (Raw)": 2.1369752883911133, "Pretrain/Step": 1744, "Pretrain/Step Time": 8.510833332315087} +{"Pretrain/Learning Rate": 4.69936456285825e-05, "Pretrain/Loss": 2.0684690475463867, "Pretrain/Loss (Raw)": 2.050532817840576, "Pretrain/Step": 1745, "Pretrain/Step Time": 8.51735563017428} +{"Pretrain/Learning Rate": 4.698960789865994e-05, "Pretrain/Loss": 2.0705690383911133, "Pretrain/Loss (Raw)": 2.0552284717559814, "Pretrain/Step": 1746, "Pretrain/Step Time": 8.519341237843037} +{"Pretrain/Learning Rate": 4.698556763279218e-05, "Pretrain/Loss": 2.0709121227264404, "Pretrain/Loss (Raw)": 1.952979326248169, "Pretrain/Step": 1747, "Pretrain/Step Time": 8.518305417150259} +{"Pretrain/Learning Rate": 4.698152483144516e-05, "Pretrain/Loss": 2.069549083709717, "Pretrain/Loss (Raw)": 1.992891788482666, "Pretrain/Step": 1748, "Pretrain/Step Time": 8.512358572334051} +{"Pretrain/Learning Rate": 4.697747949508512e-05, "Pretrain/Loss": 2.0699353218078613, "Pretrain/Loss (Raw)": 2.1632587909698486, "Pretrain/Step": 1749, "Pretrain/Step Time": 8.504992006346583} +{"Pretrain/Learning Rate": 4.697343162417858e-05, "Pretrain/Loss": 2.0723659992218018, "Pretrain/Loss (Raw)": 2.2587966918945312, "Pretrain/Step": 1750, "Pretrain/Step Time": 8.513169990852475} +{"Pretrain/Learning Rate": 4.696938121919235e-05, "Pretrain/Loss": 2.070702314376831, "Pretrain/Loss (Raw)": 2.0106935501098633, "Pretrain/Step": 1751, "Pretrain/Step Time": 8.519042583182454} +{"Pretrain/Learning Rate": 4.696532828059358e-05, "Pretrain/Loss": 2.0748651027679443, "Pretrain/Loss (Raw)": 2.7189183235168457, "Pretrain/Step": 1752, "Pretrain/Step Time": 8.521626453846693} +{"Pretrain/Learning Rate": 4.6961272808849634e-05, "Pretrain/Loss": 2.074305534362793, "Pretrain/Loss (Raw)": 2.075590133666992, "Pretrain/Step": 1753, "Pretrain/Step Time": 8.517069734632969} +{"Pretrain/Learning Rate": 4.6957214804428217e-05, "Pretrain/Loss": 2.0751664638519287, "Pretrain/Loss (Raw)": 2.226872205734253, "Pretrain/Step": 1754, "Pretrain/Step Time": 8.507389323785901} +{"Pretrain/Learning Rate": 4.695315426779734e-05, "Pretrain/Loss": 2.07570743560791, "Pretrain/Loss (Raw)": 2.140476703643799, "Pretrain/Step": 1755, "Pretrain/Step Time": 8.517040168866515} +{"Pretrain/Learning Rate": 4.694909119942526e-05, "Pretrain/Loss": 2.0749664306640625, "Pretrain/Loss (Raw)": 2.0253896713256836, "Pretrain/Step": 1756, "Pretrain/Step Time": 8.5186613406986} +{"Pretrain/Learning Rate": 4.694502559978055e-05, "Pretrain/Loss": 2.0778331756591797, "Pretrain/Loss (Raw)": 2.509160041809082, "Pretrain/Step": 1757, "Pretrain/Step Time": 8.520028902217746} +{"Pretrain/Learning Rate": 4.694095746933208e-05, "Pretrain/Loss": 2.076925277709961, "Pretrain/Loss (Raw)": 1.9834831953048706, "Pretrain/Step": 1758, "Pretrain/Step Time": 8.52144330367446} +{"Pretrain/Learning Rate": 4.6936886808549004e-05, "Pretrain/Loss": 2.0790164470672607, "Pretrain/Loss (Raw)": 2.128596067428589, "Pretrain/Step": 1759, "Pretrain/Step Time": 8.520982446148992} +{"Pretrain/Learning Rate": 4.693281361790077e-05, "Pretrain/Loss": 2.0819971561431885, "Pretrain/Loss (Raw)": 2.231534481048584, "Pretrain/Step": 1760, "Pretrain/Step Time": 8.509834066033363} +{"Pretrain/Learning Rate": 4.6928737897857124e-05, "Pretrain/Loss": 2.08412766456604, "Pretrain/Loss (Raw)": 2.2667438983917236, "Pretrain/Step": 1761, "Pretrain/Step Time": 8.506877543404698} +{"Pretrain/Learning Rate": 4.692465964888809e-05, "Pretrain/Loss": 2.084014654159546, "Pretrain/Loss (Raw)": 2.1552796363830566, "Pretrain/Step": 1762, "Pretrain/Step Time": 8.51400669850409} +{"Pretrain/Learning Rate": 4.692057887146399e-05, "Pretrain/Loss": 2.0839757919311523, "Pretrain/Loss (Raw)": 2.0475940704345703, "Pretrain/Step": 1763, "Pretrain/Step Time": 8.517698807641864} +{"Pretrain/Learning Rate": 4.691649556605545e-05, "Pretrain/Loss": 2.0824215412139893, "Pretrain/Loss (Raw)": 2.0025312900543213, "Pretrain/Step": 1764, "Pretrain/Step Time": 8.517646785825491} +{"Pretrain/Learning Rate": 4.691240973313337e-05, "Pretrain/Loss": 2.083554267883301, "Pretrain/Loss (Raw)": 2.0337018966674805, "Pretrain/Step": 1765, "Pretrain/Step Time": 8.51234856620431} +{"Pretrain/Learning Rate": 4.690832137316893e-05, "Pretrain/Loss": 2.083604097366333, "Pretrain/Loss (Raw)": 2.123342752456665, "Pretrain/Step": 1766, "Pretrain/Step Time": 8.504971463233232} +{"Pretrain/Learning Rate": 4.690423048663364e-05, "Pretrain/Loss": 2.084517002105713, "Pretrain/Loss (Raw)": 2.209775686264038, "Pretrain/Step": 1767, "Pretrain/Step Time": 8.507843814790249} +{"Pretrain/Learning Rate": 4.690013707399928e-05, "Pretrain/Loss": 2.0844850540161133, "Pretrain/Loss (Raw)": 2.043067455291748, "Pretrain/Step": 1768, "Pretrain/Step Time": 8.512845236808062} +{"Pretrain/Learning Rate": 4.689604113573791e-05, "Pretrain/Loss": 2.085310459136963, "Pretrain/Loss (Raw)": 2.104222059249878, "Pretrain/Step": 1769, "Pretrain/Step Time": 8.51950910128653} +{"Pretrain/Learning Rate": 4.68919426723219e-05, "Pretrain/Loss": 2.086188316345215, "Pretrain/Loss (Raw)": 2.2153186798095703, "Pretrain/Step": 1770, "Pretrain/Step Time": 8.517469013109803} +{"Pretrain/Learning Rate": 4.6887841684223905e-05, "Pretrain/Loss": 2.086508274078369, "Pretrain/Loss (Raw)": 2.2976601123809814, "Pretrain/Step": 1771, "Pretrain/Step Time": 8.512573041021824} +{"Pretrain/Learning Rate": 4.688373817191687e-05, "Pretrain/Loss": 2.0846104621887207, "Pretrain/Loss (Raw)": 1.9479190111160278, "Pretrain/Step": 1772, "Pretrain/Step Time": 8.504179978743196} +{"Pretrain/Learning Rate": 4.687963213587402e-05, "Pretrain/Loss": 2.088329315185547, "Pretrain/Loss (Raw)": 2.5144753456115723, "Pretrain/Step": 1773, "Pretrain/Step Time": 8.503348441794515} +{"Pretrain/Learning Rate": 4.6875523576568895e-05, "Pretrain/Loss": 2.087618827819824, "Pretrain/Loss (Raw)": 2.1454639434814453, "Pretrain/Step": 1774, "Pretrain/Step Time": 8.505859326571226} +{"Pretrain/Learning Rate": 4.6871412494475316e-05, "Pretrain/Loss": 2.0865609645843506, "Pretrain/Loss (Raw)": 2.080209493637085, "Pretrain/Step": 1775, "Pretrain/Step Time": 8.508319444954395} +{"Pretrain/Learning Rate": 4.6867298890067377e-05, "Pretrain/Loss": 2.0882136821746826, "Pretrain/Loss (Raw)": 2.23899507522583, "Pretrain/Step": 1776, "Pretrain/Step Time": 8.509942699223757} +{"Pretrain/Learning Rate": 4.68631827638195e-05, "Pretrain/Loss": 2.0877532958984375, "Pretrain/Loss (Raw)": 1.8649675846099854, "Pretrain/Step": 1777, "Pretrain/Step Time": 8.503966586664319} +{"Pretrain/Learning Rate": 4.6859064116206356e-05, "Pretrain/Loss": 2.086747646331787, "Pretrain/Loss (Raw)": 2.0461647510528564, "Pretrain/Step": 1778, "Pretrain/Step Time": 8.49601212888956} +{"Pretrain/Learning Rate": 4.685494294770294e-05, "Pretrain/Loss": 2.086777448654175, "Pretrain/Loss (Raw)": 2.0188729763031006, "Pretrain/Step": 1779, "Pretrain/Step Time": 8.491954263299704} +{"Pretrain/Learning Rate": 4.685081925878452e-05, "Pretrain/Loss": 2.0861308574676514, "Pretrain/Loss (Raw)": 2.0005667209625244, "Pretrain/Step": 1780, "Pretrain/Step Time": 8.497588651254773} +{"Pretrain/Learning Rate": 4.684669304992665e-05, "Pretrain/Loss": 2.0854735374450684, "Pretrain/Loss (Raw)": 2.111346960067749, "Pretrain/Step": 1781, "Pretrain/Step Time": 8.503605477511883} +{"Pretrain/Learning Rate": 4.6842564321605196e-05, "Pretrain/Loss": 2.082913398742676, "Pretrain/Loss (Raw)": 2.0945897102355957, "Pretrain/Step": 1782, "Pretrain/Step Time": 8.503873934969306} +{"Pretrain/Learning Rate": 4.683843307429631e-05, "Pretrain/Loss": 2.0819625854492188, "Pretrain/Loss (Raw)": 2.071410655975342, "Pretrain/Step": 1783, "Pretrain/Step Time": 8.498046763241291} +{"Pretrain/Learning Rate": 4.68342993084764e-05, "Pretrain/Loss": 2.0832998752593994, "Pretrain/Loss (Raw)": 2.2864339351654053, "Pretrain/Step": 1784, "Pretrain/Step Time": 8.489889349788427} +{"Pretrain/Learning Rate": 4.683016302462221e-05, "Pretrain/Loss": 2.0837974548339844, "Pretrain/Loss (Raw)": 2.06838059425354, "Pretrain/Step": 1785, "Pretrain/Step Time": 8.49313535168767} +{"Pretrain/Learning Rate": 4.682602422321076e-05, "Pretrain/Loss": 2.0839293003082275, "Pretrain/Loss (Raw)": 2.188570976257324, "Pretrain/Step": 1786, "Pretrain/Step Time": 8.500049576163292} +{"Pretrain/Learning Rate": 4.6821882904719344e-05, "Pretrain/Loss": 2.084662914276123, "Pretrain/Loss (Raw)": 2.0262484550476074, "Pretrain/Step": 1787, "Pretrain/Step Time": 8.499350631609559} +{"Pretrain/Learning Rate": 4.6817739069625563e-05, "Pretrain/Loss": 2.0837693214416504, "Pretrain/Loss (Raw)": 2.08248233795166, "Pretrain/Step": 1788, "Pretrain/Step Time": 8.502039631828666} +{"Pretrain/Learning Rate": 4.681359271840731e-05, "Pretrain/Loss": 2.084442138671875, "Pretrain/Loss (Raw)": 2.0570549964904785, "Pretrain/Step": 1789, "Pretrain/Step Time": 8.496582362800837} +{"Pretrain/Learning Rate": 4.6809443851542744e-05, "Pretrain/Loss": 2.0848636627197266, "Pretrain/Loss (Raw)": 2.1388564109802246, "Pretrain/Step": 1790, "Pretrain/Step Time": 8.49208333529532} +{"Pretrain/Learning Rate": 4.680529246951035e-05, "Pretrain/Loss": 2.0815727710723877, "Pretrain/Loss (Raw)": 1.6336164474487305, "Pretrain/Step": 1791, "Pretrain/Step Time": 8.493747180327773} +{"Pretrain/Learning Rate": 4.6801138572788885e-05, "Pretrain/Loss": 2.082639217376709, "Pretrain/Loss (Raw)": 2.1942617893218994, "Pretrain/Step": 1792, "Pretrain/Step Time": 8.500724697485566} +{"Pretrain/Learning Rate": 4.679698216185738e-05, "Pretrain/Loss": 2.082125663757324, "Pretrain/Loss (Raw)": 2.0127525329589844, "Pretrain/Step": 1793, "Pretrain/Step Time": 8.500493785366416} +{"Pretrain/Learning Rate": 4.6792823237195185e-05, "Pretrain/Loss": 2.082207679748535, "Pretrain/Loss (Raw)": 2.02610182762146, "Pretrain/Step": 1794, "Pretrain/Step Time": 8.499613573774695} +{"Pretrain/Learning Rate": 4.678866179928193e-05, "Pretrain/Loss": 2.0822930335998535, "Pretrain/Loss (Raw)": 2.134610176086426, "Pretrain/Step": 1795, "Pretrain/Step Time": 8.49925508722663} +{"Pretrain/Learning Rate": 4.6784497848597516e-05, "Pretrain/Loss": 2.082653760910034, "Pretrain/Loss (Raw)": 2.0248453617095947, "Pretrain/Step": 1796, "Pretrain/Step Time": 8.495909411460161} +{"Pretrain/Learning Rate": 4.678033138562216e-05, "Pretrain/Loss": 2.0838277339935303, "Pretrain/Loss (Raw)": 2.132688045501709, "Pretrain/Step": 1797, "Pretrain/Step Time": 8.495924828574061} +{"Pretrain/Learning Rate": 4.6776162410836354e-05, "Pretrain/Loss": 2.08396053314209, "Pretrain/Loss (Raw)": 1.9817943572998047, "Pretrain/Step": 1798, "Pretrain/Step Time": 8.507818752899766} +{"Pretrain/Learning Rate": 4.677199092472089e-05, "Pretrain/Loss": 2.0851521492004395, "Pretrain/Loss (Raw)": 2.310361623764038, "Pretrain/Step": 1799, "Pretrain/Step Time": 8.508243098855019} +{"Pretrain/Learning Rate": 4.6767816927756834e-05, "Pretrain/Loss": 2.087721824645996, "Pretrain/Loss (Raw)": 2.0678975582122803, "Pretrain/Step": 1800, "Pretrain/Step Time": 8.510944440960884} +{"Pretrain/Learning Rate": 4.6763640420425566e-05, "Pretrain/Loss": 2.0881996154785156, "Pretrain/Loss (Raw)": 2.1166656017303467, "Pretrain/Step": 1801, "Pretrain/Step Time": 8.496626064181328} +{"Pretrain/Learning Rate": 4.675946140320873e-05, "Pretrain/Loss": 2.085969924926758, "Pretrain/Loss (Raw)": 1.9713671207427979, "Pretrain/Step": 1802, "Pretrain/Step Time": 8.494426429271698} +{"Pretrain/Learning Rate": 4.6755279876588256e-05, "Pretrain/Loss": 2.0854270458221436, "Pretrain/Loss (Raw)": 2.0090854167938232, "Pretrain/Step": 1803, "Pretrain/Step Time": 8.498850233852863} +{"Pretrain/Learning Rate": 4.67510958410464e-05, "Pretrain/Loss": 2.085709810256958, "Pretrain/Loss (Raw)": 2.2194414138793945, "Pretrain/Step": 1804, "Pretrain/Step Time": 8.505360458046198} +{"Pretrain/Learning Rate": 4.6746909297065685e-05, "Pretrain/Loss": 2.0853443145751953, "Pretrain/Loss (Raw)": 2.049318552017212, "Pretrain/Step": 1805, "Pretrain/Step Time": 8.508504731580615} +{"Pretrain/Learning Rate": 4.674272024512891e-05, "Pretrain/Loss": 2.083449602127075, "Pretrain/Loss (Raw)": 2.0879390239715576, "Pretrain/Step": 1806, "Pretrain/Step Time": 8.50253632478416} +{"Pretrain/Learning Rate": 4.6738528685719185e-05, "Pretrain/Loss": 2.084043025970459, "Pretrain/Loss (Raw)": 2.0623247623443604, "Pretrain/Step": 1807, "Pretrain/Step Time": 8.498339602723718} +{"Pretrain/Learning Rate": 4.673433461931989e-05, "Pretrain/Loss": 2.083454132080078, "Pretrain/Loss (Raw)": 2.0313572883605957, "Pretrain/Step": 1808, "Pretrain/Step Time": 8.500036282464862} +{"Pretrain/Learning Rate": 4.6730138046414714e-05, "Pretrain/Loss": 2.0852291584014893, "Pretrain/Loss (Raw)": 2.2822229862213135, "Pretrain/Step": 1809, "Pretrain/Step Time": 8.509063763543963} +{"Pretrain/Learning Rate": 4.672593896748763e-05, "Pretrain/Loss": 2.085984468460083, "Pretrain/Loss (Raw)": 1.9716500043869019, "Pretrain/Step": 1810, "Pretrain/Step Time": 8.517533797770739} +{"Pretrain/Learning Rate": 4.6721737383022876e-05, "Pretrain/Loss": 2.089895248413086, "Pretrain/Loss (Raw)": 2.5763399600982666, "Pretrain/Step": 1811, "Pretrain/Step Time": 8.521584127098322} +{"Pretrain/Learning Rate": 4.671753329350502e-05, "Pretrain/Loss": 2.0898330211639404, "Pretrain/Loss (Raw)": 1.982079029083252, "Pretrain/Step": 1812, "Pretrain/Step Time": 8.522998867556453} +{"Pretrain/Learning Rate": 4.671332669941888e-05, "Pretrain/Loss": 2.0903728008270264, "Pretrain/Loss (Raw)": 2.1345808506011963, "Pretrain/Step": 1813, "Pretrain/Step Time": 8.519332941621542} +{"Pretrain/Learning Rate": 4.6709117601249596e-05, "Pretrain/Loss": 2.090524196624756, "Pretrain/Loss (Raw)": 2.167715072631836, "Pretrain/Step": 1814, "Pretrain/Step Time": 8.515953386202455} +{"Pretrain/Learning Rate": 4.6704905999482575e-05, "Pretrain/Loss": 2.090823173522949, "Pretrain/Loss (Raw)": 2.126727342605591, "Pretrain/Step": 1815, "Pretrain/Step Time": 8.516369637101889} +{"Pretrain/Learning Rate": 4.670069189460351e-05, "Pretrain/Loss": 2.09213924407959, "Pretrain/Loss (Raw)": 2.087036371231079, "Pretrain/Step": 1816, "Pretrain/Step Time": 8.522237081080675} +{"Pretrain/Learning Rate": 4.6696475287098396e-05, "Pretrain/Loss": 2.092092275619507, "Pretrain/Loss (Raw)": 2.1050400733947754, "Pretrain/Step": 1817, "Pretrain/Step Time": 8.520719842985272} +{"Pretrain/Learning Rate": 4.669225617745352e-05, "Pretrain/Loss": 2.0933213233947754, "Pretrain/Loss (Raw)": 2.2094943523406982, "Pretrain/Step": 1818, "Pretrain/Step Time": 8.52563976496458} +{"Pretrain/Learning Rate": 4.668803456615545e-05, "Pretrain/Loss": 2.0935938358306885, "Pretrain/Loss (Raw)": 2.164722204208374, "Pretrain/Step": 1819, "Pretrain/Step Time": 8.520459758117795} +{"Pretrain/Learning Rate": 4.668381045369102e-05, "Pretrain/Loss": 2.0939862728118896, "Pretrain/Loss (Raw)": 2.0900142192840576, "Pretrain/Step": 1820, "Pretrain/Step Time": 8.520538683980703} +{"Pretrain/Learning Rate": 4.6679583840547405e-05, "Pretrain/Loss": 2.096397876739502, "Pretrain/Loss (Raw)": 2.106947898864746, "Pretrain/Step": 1821, "Pretrain/Step Time": 8.524367935955524} +{"Pretrain/Learning Rate": 4.667535472721203e-05, "Pretrain/Loss": 2.0959970951080322, "Pretrain/Loss (Raw)": 1.9942102432250977, "Pretrain/Step": 1822, "Pretrain/Step Time": 8.530812921002507} +{"Pretrain/Learning Rate": 4.66711231141726e-05, "Pretrain/Loss": 2.096497058868408, "Pretrain/Loss (Raw)": 2.2376487255096436, "Pretrain/Step": 1823, "Pretrain/Step Time": 8.530252736061811} +{"Pretrain/Learning Rate": 4.6666889001917136e-05, "Pretrain/Loss": 2.0958757400512695, "Pretrain/Loss (Raw)": 1.9633972644805908, "Pretrain/Step": 1824, "Pretrain/Step Time": 8.527305848896503} +{"Pretrain/Learning Rate": 4.666265239093393e-05, "Pretrain/Loss": 2.0993359088897705, "Pretrain/Loss (Raw)": 2.2431304454803467, "Pretrain/Step": 1825, "Pretrain/Step Time": 8.517301330342889} +{"Pretrain/Learning Rate": 4.665841328171158e-05, "Pretrain/Loss": 2.1017005443573, "Pretrain/Loss (Raw)": 2.3472089767456055, "Pretrain/Step": 1826, "Pretrain/Step Time": 8.51799570582807} +{"Pretrain/Learning Rate": 4.665417167473894e-05, "Pretrain/Loss": 2.1024889945983887, "Pretrain/Loss (Raw)": 2.0999553203582764, "Pretrain/Step": 1827, "Pretrain/Step Time": 8.521963274106383} +{"Pretrain/Learning Rate": 4.66499275705052e-05, "Pretrain/Loss": 2.1027750968933105, "Pretrain/Loss (Raw)": 2.1791086196899414, "Pretrain/Step": 1828, "Pretrain/Step Time": 8.521803699433804} +{"Pretrain/Learning Rate": 4.6645680969499795e-05, "Pretrain/Loss": 2.1014552116394043, "Pretrain/Loss (Raw)": 1.943764567375183, "Pretrain/Step": 1829, "Pretrain/Step Time": 8.525199115276337} +{"Pretrain/Learning Rate": 4.664143187221245e-05, "Pretrain/Loss": 2.1033942699432373, "Pretrain/Loss (Raw)": 2.200580358505249, "Pretrain/Step": 1830, "Pretrain/Step Time": 8.52103908918798} +{"Pretrain/Learning Rate": 4.6637180279133216e-05, "Pretrain/Loss": 2.1030197143554688, "Pretrain/Loss (Raw)": 2.108402729034424, "Pretrain/Step": 1831, "Pretrain/Step Time": 8.51954242400825} +{"Pretrain/Learning Rate": 4.6632926190752385e-05, "Pretrain/Loss": 2.1009175777435303, "Pretrain/Loss (Raw)": 1.8526734113693237, "Pretrain/Step": 1832, "Pretrain/Step Time": 8.520039224997163} +{"Pretrain/Learning Rate": 4.662866960756057e-05, "Pretrain/Loss": 2.101530075073242, "Pretrain/Loss (Raw)": 2.2176120281219482, "Pretrain/Step": 1833, "Pretrain/Step Time": 8.523723548278213} +{"Pretrain/Learning Rate": 4.662441053004866e-05, "Pretrain/Loss": 2.1023213863372803, "Pretrain/Loss (Raw)": 2.3193607330322266, "Pretrain/Step": 1834, "Pretrain/Step Time": 8.525704216212034} +{"Pretrain/Learning Rate": 4.6620148958707833e-05, "Pretrain/Loss": 2.1019997596740723, "Pretrain/Loss (Raw)": 2.056877851486206, "Pretrain/Step": 1835, "Pretrain/Step Time": 8.527931448072195} +{"Pretrain/Learning Rate": 4.661588489402955e-05, "Pretrain/Loss": 2.1005094051361084, "Pretrain/Loss (Raw)": 1.92841637134552, "Pretrain/Step": 1836, "Pretrain/Step Time": 8.52400328218937} +{"Pretrain/Learning Rate": 4.661161833650556e-05, "Pretrain/Loss": 2.096893310546875, "Pretrain/Loss (Raw)": 1.891271948814392, "Pretrain/Step": 1837, "Pretrain/Step Time": 8.52043005824089} +{"Pretrain/Learning Rate": 4.660734928662791e-05, "Pretrain/Loss": 2.097139358520508, "Pretrain/Loss (Raw)": 2.2280683517456055, "Pretrain/Step": 1838, "Pretrain/Step Time": 8.515885153785348} +{"Pretrain/Learning Rate": 4.660307774488892e-05, "Pretrain/Loss": 2.0970077514648438, "Pretrain/Loss (Raw)": 2.03979229927063, "Pretrain/Step": 1839, "Pretrain/Step Time": 8.517902750521898} +{"Pretrain/Learning Rate": 4.65988037117812e-05, "Pretrain/Loss": 2.0971803665161133, "Pretrain/Loss (Raw)": 2.0288145542144775, "Pretrain/Step": 1840, "Pretrain/Step Time": 8.524063726887107} +{"Pretrain/Learning Rate": 4.659452718779768e-05, "Pretrain/Loss": 2.0983848571777344, "Pretrain/Loss (Raw)": 2.2644050121307373, "Pretrain/Step": 1841, "Pretrain/Step Time": 8.528409942984581} +{"Pretrain/Learning Rate": 4.6590248173431505e-05, "Pretrain/Loss": 2.096649646759033, "Pretrain/Loss (Raw)": 1.9090604782104492, "Pretrain/Step": 1842, "Pretrain/Step Time": 8.518094221130013} +{"Pretrain/Learning Rate": 4.6585966669176186e-05, "Pretrain/Loss": 2.0964834690093994, "Pretrain/Loss (Raw)": 2.010831832885742, "Pretrain/Step": 1843, "Pretrain/Step Time": 8.510874580591917} +{"Pretrain/Learning Rate": 4.658168267552547e-05, "Pretrain/Loss": 2.096190929412842, "Pretrain/Loss (Raw)": 1.949931025505066, "Pretrain/Step": 1844, "Pretrain/Step Time": 8.51715767197311} +{"Pretrain/Learning Rate": 4.657739619297342e-05, "Pretrain/Loss": 2.096573829650879, "Pretrain/Loss (Raw)": 2.169799566268921, "Pretrain/Step": 1845, "Pretrain/Step Time": 8.524303581565619} +{"Pretrain/Learning Rate": 4.657310722201436e-05, "Pretrain/Loss": 2.0951783657073975, "Pretrain/Loss (Raw)": 1.8788707256317139, "Pretrain/Step": 1846, "Pretrain/Step Time": 8.526854233816266} +{"Pretrain/Learning Rate": 4.6568815763142914e-05, "Pretrain/Loss": 2.093519449234009, "Pretrain/Loss (Raw)": 2.024290084838867, "Pretrain/Step": 1847, "Pretrain/Step Time": 8.52578472904861} +{"Pretrain/Learning Rate": 4.6564521816854e-05, "Pretrain/Loss": 2.091000556945801, "Pretrain/Loss (Raw)": 1.8555240631103516, "Pretrain/Step": 1848, "Pretrain/Step Time": 8.522028408944607} +{"Pretrain/Learning Rate": 4.656022538364282e-05, "Pretrain/Loss": 2.088183879852295, "Pretrain/Loss (Raw)": 1.9375218152999878, "Pretrain/Step": 1849, "Pretrain/Step Time": 8.515537953004241} +{"Pretrain/Learning Rate": 4.655592646400485e-05, "Pretrain/Loss": 2.08518385887146, "Pretrain/Loss (Raw)": 1.7697596549987793, "Pretrain/Step": 1850, "Pretrain/Step Time": 8.517864100635052} +{"Pretrain/Learning Rate": 4.6551625058435866e-05, "Pretrain/Loss": 2.082611322402954, "Pretrain/Loss (Raw)": 1.803628921508789, "Pretrain/Step": 1851, "Pretrain/Step Time": 8.516451083123684} +{"Pretrain/Learning Rate": 4.654732116743194e-05, "Pretrain/Loss": 2.082855224609375, "Pretrain/Loss (Raw)": 2.004404067993164, "Pretrain/Step": 1852, "Pretrain/Step Time": 8.520563764497638} +{"Pretrain/Learning Rate": 4.654301479148938e-05, "Pretrain/Loss": 2.082559108734131, "Pretrain/Loss (Raw)": 2.012827157974243, "Pretrain/Step": 1853, "Pretrain/Step Time": 8.520958231762052} +{"Pretrain/Learning Rate": 4.653870593110485e-05, "Pretrain/Loss": 2.0845727920532227, "Pretrain/Loss (Raw)": 2.1609365940093994, "Pretrain/Step": 1854, "Pretrain/Step Time": 8.514939786866307} +{"Pretrain/Learning Rate": 4.6534394586775254e-05, "Pretrain/Loss": 2.0840630531311035, "Pretrain/Loss (Raw)": 1.9870926141738892, "Pretrain/Step": 1855, "Pretrain/Step Time": 8.510906631127} +{"Pretrain/Learning Rate": 4.653008075899781e-05, "Pretrain/Loss": 2.082979679107666, "Pretrain/Loss (Raw)": 2.017698287963867, "Pretrain/Step": 1856, "Pretrain/Step Time": 8.514747254550457} +{"Pretrain/Learning Rate": 4.652576444826999e-05, "Pretrain/Loss": 2.0852956771850586, "Pretrain/Loss (Raw)": 2.1691174507141113, "Pretrain/Step": 1857, "Pretrain/Step Time": 8.50958807952702} +{"Pretrain/Learning Rate": 4.652144565508959e-05, "Pretrain/Loss": 2.0853304862976074, "Pretrain/Loss (Raw)": 2.0873615741729736, "Pretrain/Step": 1858, "Pretrain/Step Time": 8.510390689596534} +{"Pretrain/Learning Rate": 4.6517124379954655e-05, "Pretrain/Loss": 2.0888819694519043, "Pretrain/Loss (Raw)": 2.0965001583099365, "Pretrain/Step": 1859, "Pretrain/Step Time": 8.510973269119859} +{"Pretrain/Learning Rate": 4.651280062336355e-05, "Pretrain/Loss": 2.0889101028442383, "Pretrain/Loss (Raw)": 2.020993709564209, "Pretrain/Step": 1860, "Pretrain/Step Time": 8.508570471778512} +{"Pretrain/Learning Rate": 4.65084743858149e-05, "Pretrain/Loss": 2.086963176727295, "Pretrain/Loss (Raw)": 1.955129623413086, "Pretrain/Step": 1861, "Pretrain/Step Time": 8.500986283645034} +{"Pretrain/Learning Rate": 4.6504145667807644e-05, "Pretrain/Loss": 2.0879158973693848, "Pretrain/Loss (Raw)": 2.1583924293518066, "Pretrain/Step": 1862, "Pretrain/Step Time": 8.500590648502111} +{"Pretrain/Learning Rate": 4.649981446984097e-05, "Pretrain/Loss": 2.089266777038574, "Pretrain/Loss (Raw)": 2.2212753295898438, "Pretrain/Step": 1863, "Pretrain/Step Time": 8.50283975712955} +{"Pretrain/Learning Rate": 4.649548079241438e-05, "Pretrain/Loss": 2.0878562927246094, "Pretrain/Loss (Raw)": 1.8163020610809326, "Pretrain/Step": 1864, "Pretrain/Step Time": 8.507168805226684} +{"Pretrain/Learning Rate": 4.649114463602766e-05, "Pretrain/Loss": 2.088118314743042, "Pretrain/Loss (Raw)": 1.9055883884429932, "Pretrain/Step": 1865, "Pretrain/Step Time": 8.504969099536538} +{"Pretrain/Learning Rate": 4.648680600118087e-05, "Pretrain/Loss": 2.0909571647644043, "Pretrain/Loss (Raw)": 2.1371309757232666, "Pretrain/Step": 1866, "Pretrain/Step Time": 8.498407758772373} +{"Pretrain/Learning Rate": 4.6482464888374365e-05, "Pretrain/Loss": 2.091303586959839, "Pretrain/Loss (Raw)": 2.064218282699585, "Pretrain/Step": 1867, "Pretrain/Step Time": 8.497868120670319} +{"Pretrain/Learning Rate": 4.6478121298108776e-05, "Pretrain/Loss": 2.0891597270965576, "Pretrain/Loss (Raw)": 1.8802812099456787, "Pretrain/Step": 1868, "Pretrain/Step Time": 8.502286428585649} +{"Pretrain/Learning Rate": 4.647377523088503e-05, "Pretrain/Loss": 2.0870182514190674, "Pretrain/Loss (Raw)": 1.748395323753357, "Pretrain/Step": 1869, "Pretrain/Step Time": 8.503409745171666} +{"Pretrain/Learning Rate": 4.6469426687204346e-05, "Pretrain/Loss": 2.0878727436065674, "Pretrain/Loss (Raw)": 1.985133409500122, "Pretrain/Step": 1870, "Pretrain/Step Time": 8.504679642617702} +{"Pretrain/Learning Rate": 4.646507566756819e-05, "Pretrain/Loss": 2.0868072509765625, "Pretrain/Loss (Raw)": 2.013996124267578, "Pretrain/Step": 1871, "Pretrain/Step Time": 8.502232139930129} +{"Pretrain/Learning Rate": 4.646072217247838e-05, "Pretrain/Loss": 2.08573317527771, "Pretrain/Loss (Raw)": 1.9994986057281494, "Pretrain/Step": 1872, "Pretrain/Step Time": 8.501958165317774} +{"Pretrain/Learning Rate": 4.645636620243695e-05, "Pretrain/Loss": 2.084163188934326, "Pretrain/Loss (Raw)": 1.8495904207229614, "Pretrain/Step": 1873, "Pretrain/Step Time": 8.503278631716967} +{"Pretrain/Learning Rate": 4.645200775794628e-05, "Pretrain/Loss": 2.084780693054199, "Pretrain/Loss (Raw)": 2.134255886077881, "Pretrain/Step": 1874, "Pretrain/Step Time": 8.506480503827333} +{"Pretrain/Learning Rate": 4.6447646839508975e-05, "Pretrain/Loss": 2.0854086875915527, "Pretrain/Loss (Raw)": 2.033341407775879, "Pretrain/Step": 1875, "Pretrain/Step Time": 8.50811374373734} +{"Pretrain/Learning Rate": 4.6443283447627974e-05, "Pretrain/Loss": 2.0861992835998535, "Pretrain/Loss (Raw)": 2.094118356704712, "Pretrain/Step": 1876, "Pretrain/Step Time": 8.512298174202442} +{"Pretrain/Learning Rate": 4.643891758280649e-05, "Pretrain/Loss": 2.0849947929382324, "Pretrain/Loss (Raw)": 2.0090904235839844, "Pretrain/Step": 1877, "Pretrain/Step Time": 8.509251331910491} +{"Pretrain/Learning Rate": 4.6434549245548e-05, "Pretrain/Loss": 2.083803176879883, "Pretrain/Loss (Raw)": 2.1062638759613037, "Pretrain/Step": 1878, "Pretrain/Step Time": 8.500200496986508} +{"Pretrain/Learning Rate": 4.643017843635629e-05, "Pretrain/Loss": 2.0835049152374268, "Pretrain/Loss (Raw)": 1.9725106954574585, "Pretrain/Step": 1879, "Pretrain/Step Time": 8.500747211277485} +{"Pretrain/Learning Rate": 4.6425805155735416e-05, "Pretrain/Loss": 2.0796585083007812, "Pretrain/Loss (Raw)": 2.2265689373016357, "Pretrain/Step": 1880, "Pretrain/Step Time": 8.498720277100801} +{"Pretrain/Learning Rate": 4.642142940418973e-05, "Pretrain/Loss": 2.0806188583374023, "Pretrain/Loss (Raw)": 2.1985092163085938, "Pretrain/Step": 1881, "Pretrain/Step Time": 8.498605962842703} +{"Pretrain/Learning Rate": 4.641705118222387e-05, "Pretrain/Loss": 2.079227924346924, "Pretrain/Loss (Raw)": 2.048830032348633, "Pretrain/Step": 1882, "Pretrain/Step Time": 8.510445220395923} +{"Pretrain/Learning Rate": 4.6412670490342747e-05, "Pretrain/Loss": 2.080155611038208, "Pretrain/Loss (Raw)": 2.2592368125915527, "Pretrain/Step": 1883, "Pretrain/Step Time": 8.498322350904346} +{"Pretrain/Learning Rate": 4.6408287329051556e-05, "Pretrain/Loss": 2.0806689262390137, "Pretrain/Loss (Raw)": 2.091083288192749, "Pretrain/Step": 1884, "Pretrain/Step Time": 8.496465310454369} +{"Pretrain/Learning Rate": 4.64039016988558e-05, "Pretrain/Loss": 2.0762529373168945, "Pretrain/Loss (Raw)": 1.9439111948013306, "Pretrain/Step": 1885, "Pretrain/Step Time": 8.496235575526953} +{"Pretrain/Learning Rate": 4.639951360026123e-05, "Pretrain/Loss": 2.0765061378479004, "Pretrain/Loss (Raw)": 2.0159220695495605, "Pretrain/Step": 1886, "Pretrain/Step Time": 8.504208529368043} +{"Pretrain/Learning Rate": 4.639512303377393e-05, "Pretrain/Loss": 2.076171875, "Pretrain/Loss (Raw)": 2.0858066082000732, "Pretrain/Step": 1887, "Pretrain/Step Time": 8.505155231803656} +{"Pretrain/Learning Rate": 4.639072999990022e-05, "Pretrain/Loss": 2.075319766998291, "Pretrain/Loss (Raw)": 2.122447967529297, "Pretrain/Step": 1888, "Pretrain/Step Time": 8.514724604785442} +{"Pretrain/Learning Rate": 4.6386334499146724e-05, "Pretrain/Loss": 2.0748467445373535, "Pretrain/Loss (Raw)": 2.206185817718506, "Pretrain/Step": 1889, "Pretrain/Step Time": 8.510017819702625} +{"Pretrain/Learning Rate": 4.638193653202035e-05, "Pretrain/Loss": 2.076268196105957, "Pretrain/Loss (Raw)": 2.3372387886047363, "Pretrain/Step": 1890, "Pretrain/Step Time": 8.501854322850704} +{"Pretrain/Learning Rate": 4.6377536099028315e-05, "Pretrain/Loss": 2.0775184631347656, "Pretrain/Loss (Raw)": 2.2076241970062256, "Pretrain/Step": 1891, "Pretrain/Step Time": 8.499059362336993} +{"Pretrain/Learning Rate": 4.637313320067808e-05, "Pretrain/Loss": 2.0798099040985107, "Pretrain/Loss (Raw)": 2.2958338260650635, "Pretrain/Step": 1892, "Pretrain/Step Time": 8.505124310031533} +{"Pretrain/Learning Rate": 4.636872783747741e-05, "Pretrain/Loss": 2.0801889896392822, "Pretrain/Loss (Raw)": 2.082242727279663, "Pretrain/Step": 1893, "Pretrain/Step Time": 8.504207409918308} +{"Pretrain/Learning Rate": 4.636432000993435e-05, "Pretrain/Loss": 2.0802674293518066, "Pretrain/Loss (Raw)": 2.133392810821533, "Pretrain/Step": 1894, "Pretrain/Step Time": 8.51608519628644} +{"Pretrain/Learning Rate": 4.635990971855724e-05, "Pretrain/Loss": 2.077852964401245, "Pretrain/Loss (Raw)": 1.9007197618484497, "Pretrain/Step": 1895, "Pretrain/Step Time": 8.513310190290213} +{"Pretrain/Learning Rate": 4.6355496963854684e-05, "Pretrain/Loss": 2.0783705711364746, "Pretrain/Loss (Raw)": 2.109318494796753, "Pretrain/Step": 1896, "Pretrain/Step Time": 8.508431265130639} +{"Pretrain/Learning Rate": 4.635108174633559e-05, "Pretrain/Loss": 2.0789995193481445, "Pretrain/Loss (Raw)": 2.1847264766693115, "Pretrain/Step": 1897, "Pretrain/Step Time": 8.502329677343369} +{"Pretrain/Learning Rate": 4.634666406650914e-05, "Pretrain/Loss": 2.07826828956604, "Pretrain/Loss (Raw)": 2.1217100620269775, "Pretrain/Step": 1898, "Pretrain/Step Time": 8.505885269492865} +{"Pretrain/Learning Rate": 4.63422439248848e-05, "Pretrain/Loss": 2.0746617317199707, "Pretrain/Loss (Raw)": 1.8360306024551392, "Pretrain/Step": 1899, "Pretrain/Step Time": 8.514475563541055} +{"Pretrain/Learning Rate": 4.633782132197232e-05, "Pretrain/Loss": 2.073683738708496, "Pretrain/Loss (Raw)": 1.822698950767517, "Pretrain/Step": 1900, "Pretrain/Step Time": 8.52003868110478} +{"Pretrain/Learning Rate": 4.633339625828173e-05, "Pretrain/Loss": 2.069971799850464, "Pretrain/Loss (Raw)": 2.0393707752227783, "Pretrain/Step": 1901, "Pretrain/Step Time": 8.51927724480629} +{"Pretrain/Learning Rate": 4.632896873432338e-05, "Pretrain/Loss": 2.0705673694610596, "Pretrain/Loss (Raw)": 2.2217178344726562, "Pretrain/Step": 1902, "Pretrain/Step Time": 8.513998176902533} +{"Pretrain/Learning Rate": 4.632453875060784e-05, "Pretrain/Loss": 2.070758581161499, "Pretrain/Loss (Raw)": 2.10467267036438, "Pretrain/Step": 1903, "Pretrain/Step Time": 8.512621704488993} +{"Pretrain/Learning Rate": 4.6320106307646e-05, "Pretrain/Loss": 2.067793607711792, "Pretrain/Loss (Raw)": 1.8594732284545898, "Pretrain/Step": 1904, "Pretrain/Step Time": 8.514785710722208} +{"Pretrain/Learning Rate": 4.6315671405949046e-05, "Pretrain/Loss": 2.069594144821167, "Pretrain/Loss (Raw)": 2.0954315662384033, "Pretrain/Step": 1905, "Pretrain/Step Time": 8.525710826739669} +{"Pretrain/Learning Rate": 4.631123404602842e-05, "Pretrain/Loss": 2.070870876312256, "Pretrain/Loss (Raw)": 2.209606885910034, "Pretrain/Step": 1906, "Pretrain/Step Time": 8.524013997986913} +{"Pretrain/Learning Rate": 4.630679422839585e-05, "Pretrain/Loss": 2.070976734161377, "Pretrain/Loss (Raw)": 2.0324132442474365, "Pretrain/Step": 1907, "Pretrain/Step Time": 8.523764874786139} +{"Pretrain/Learning Rate": 4.6302351953563385e-05, "Pretrain/Loss": 2.070869207382202, "Pretrain/Loss (Raw)": 1.9867862462997437, "Pretrain/Step": 1908, "Pretrain/Step Time": 8.514256270602345} +{"Pretrain/Learning Rate": 4.629790722204331e-05, "Pretrain/Loss": 2.0697100162506104, "Pretrain/Loss (Raw)": 1.9629889726638794, "Pretrain/Step": 1909, "Pretrain/Step Time": 8.50859958305955} +{"Pretrain/Learning Rate": 4.629346003434821e-05, "Pretrain/Loss": 2.069594383239746, "Pretrain/Loss (Raw)": 2.079813241958618, "Pretrain/Step": 1910, "Pretrain/Step Time": 8.522920923307538} +{"Pretrain/Learning Rate": 4.628901039099096e-05, "Pretrain/Loss": 2.069735527038574, "Pretrain/Loss (Raw)": 2.089451313018799, "Pretrain/Step": 1911, "Pretrain/Step Time": 8.526819288730621} +{"Pretrain/Learning Rate": 4.6284558292484724e-05, "Pretrain/Loss": 2.0682449340820312, "Pretrain/Loss (Raw)": 2.095613956451416, "Pretrain/Step": 1912, "Pretrain/Step Time": 8.530699586495757} +{"Pretrain/Learning Rate": 4.628010373934292e-05, "Pretrain/Loss": 2.069185256958008, "Pretrain/Loss (Raw)": 2.188765525817871, "Pretrain/Step": 1913, "Pretrain/Step Time": 8.528155347332358} +{"Pretrain/Learning Rate": 4.627564673207928e-05, "Pretrain/Loss": 2.0698704719543457, "Pretrain/Loss (Raw)": 2.2762722969055176, "Pretrain/Step": 1914, "Pretrain/Step Time": 8.51885319314897} +{"Pretrain/Learning Rate": 4.62711872712078e-05, "Pretrain/Loss": 2.069483757019043, "Pretrain/Loss (Raw)": 1.976773738861084, "Pretrain/Step": 1915, "Pretrain/Step Time": 8.51451668329537} +{"Pretrain/Learning Rate": 4.626672535724278e-05, "Pretrain/Loss": 2.070098400115967, "Pretrain/Loss (Raw)": 2.1611127853393555, "Pretrain/Step": 1916, "Pretrain/Step Time": 8.524658218026161} +{"Pretrain/Learning Rate": 4.626226099069878e-05, "Pretrain/Loss": 2.0698482990264893, "Pretrain/Loss (Raw)": 2.0250673294067383, "Pretrain/Step": 1917, "Pretrain/Step Time": 8.529053756967187} +{"Pretrain/Learning Rate": 4.625779417209065e-05, "Pretrain/Loss": 2.070340156555176, "Pretrain/Loss (Raw)": 2.2018120288848877, "Pretrain/Step": 1918, "Pretrain/Step Time": 8.525825332850218} +{"Pretrain/Learning Rate": 4.625332490193352e-05, "Pretrain/Loss": 2.074759006500244, "Pretrain/Loss (Raw)": 2.199251413345337, "Pretrain/Step": 1919, "Pretrain/Step Time": 8.526178495958447} +{"Pretrain/Learning Rate": 4.624885318074282e-05, "Pretrain/Loss": 2.074727773666382, "Pretrain/Loss (Raw)": 2.1902403831481934, "Pretrain/Step": 1920, "Pretrain/Step Time": 8.517860503867269} +{"Pretrain/Learning Rate": 4.624437900903424e-05, "Pretrain/Loss": 2.074939727783203, "Pretrain/Loss (Raw)": 2.0398576259613037, "Pretrain/Step": 1921, "Pretrain/Step Time": 8.519521491602063} +{"Pretrain/Learning Rate": 4.623990238732376e-05, "Pretrain/Loss": 2.0750014781951904, "Pretrain/Loss (Raw)": 2.03403639793396, "Pretrain/Step": 1922, "Pretrain/Step Time": 8.524904562160373} +{"Pretrain/Learning Rate": 4.6235423316127655e-05, "Pretrain/Loss": 2.074373722076416, "Pretrain/Loss (Raw)": 2.0542612075805664, "Pretrain/Step": 1923, "Pretrain/Step Time": 8.528369860723615} +{"Pretrain/Learning Rate": 4.623094179596248e-05, "Pretrain/Loss": 2.0708694458007812, "Pretrain/Loss (Raw)": 1.5762827396392822, "Pretrain/Step": 1924, "Pretrain/Step Time": 8.530248859897256} +{"Pretrain/Learning Rate": 4.622645782734504e-05, "Pretrain/Loss": 2.0708746910095215, "Pretrain/Loss (Raw)": 2.1333727836608887, "Pretrain/Step": 1925, "Pretrain/Step Time": 8.522730337455869} +{"Pretrain/Learning Rate": 4.6221971410792466e-05, "Pretrain/Loss": 2.072190284729004, "Pretrain/Loss (Raw)": 2.1501715183258057, "Pretrain/Step": 1926, "Pretrain/Step Time": 8.510881436988711} +{"Pretrain/Learning Rate": 4.621748254682214e-05, "Pretrain/Loss": 2.069882869720459, "Pretrain/Loss (Raw)": 2.015014886856079, "Pretrain/Step": 1927, "Pretrain/Step Time": 8.520464828237891} +{"Pretrain/Learning Rate": 4.621299123595176e-05, "Pretrain/Loss": 2.0696213245391846, "Pretrain/Loss (Raw)": 2.034421443939209, "Pretrain/Step": 1928, "Pretrain/Step Time": 8.520145151764154} +{"Pretrain/Learning Rate": 4.620849747869926e-05, "Pretrain/Loss": 2.068695306777954, "Pretrain/Loss (Raw)": 1.99812912940979, "Pretrain/Step": 1929, "Pretrain/Step Time": 8.526123490184546} +{"Pretrain/Learning Rate": 4.6204001275582904e-05, "Pretrain/Loss": 2.069744348526001, "Pretrain/Loss (Raw)": 2.1056370735168457, "Pretrain/Step": 1930, "Pretrain/Step Time": 8.529482757672668} +{"Pretrain/Learning Rate": 4.61995026271212e-05, "Pretrain/Loss": 2.070634365081787, "Pretrain/Loss (Raw)": 2.123042345046997, "Pretrain/Step": 1931, "Pretrain/Step Time": 8.524932546541095} +{"Pretrain/Learning Rate": 4.619500153383296e-05, "Pretrain/Loss": 2.069049835205078, "Pretrain/Loss (Raw)": 2.0165927410125732, "Pretrain/Step": 1932, "Pretrain/Step Time": 8.51608138345182} +{"Pretrain/Learning Rate": 4.619049799623726e-05, "Pretrain/Loss": 2.0706088542938232, "Pretrain/Loss (Raw)": 2.248901128768921, "Pretrain/Step": 1933, "Pretrain/Step Time": 8.524402452632785} +{"Pretrain/Learning Rate": 4.618599201485349e-05, "Pretrain/Loss": 2.071685314178467, "Pretrain/Loss (Raw)": 2.2256922721862793, "Pretrain/Step": 1934, "Pretrain/Step Time": 8.521853741258383} +{"Pretrain/Learning Rate": 4.618148359020128e-05, "Pretrain/Loss": 2.0714967250823975, "Pretrain/Loss (Raw)": 2.0382137298583984, "Pretrain/Step": 1935, "Pretrain/Step Time": 8.526504507288337} +{"Pretrain/Learning Rate": 4.617697272280057e-05, "Pretrain/Loss": 2.071314573287964, "Pretrain/Loss (Raw)": 2.008030891418457, "Pretrain/Step": 1936, "Pretrain/Step Time": 8.524996772408485} +{"Pretrain/Learning Rate": 4.6172459413171586e-05, "Pretrain/Loss": 2.0700531005859375, "Pretrain/Loss (Raw)": 2.12074613571167, "Pretrain/Step": 1937, "Pretrain/Step Time": 8.51418637484312} +{"Pretrain/Learning Rate": 4.616794366183481e-05, "Pretrain/Loss": 2.071578025817871, "Pretrain/Loss (Raw)": 2.1668601036071777, "Pretrain/Step": 1938, "Pretrain/Step Time": 8.507231079041958} +{"Pretrain/Learning Rate": 4.616342546931102e-05, "Pretrain/Loss": 2.067628860473633, "Pretrain/Loss (Raw)": 2.070823907852173, "Pretrain/Step": 1939, "Pretrain/Step Time": 8.506733087822795} +{"Pretrain/Learning Rate": 4.6158904836121286e-05, "Pretrain/Loss": 2.0689516067504883, "Pretrain/Loss (Raw)": 2.1514062881469727, "Pretrain/Step": 1940, "Pretrain/Step Time": 8.505510151386261} +{"Pretrain/Learning Rate": 4.6154381762786936e-05, "Pretrain/Loss": 2.0682613849639893, "Pretrain/Loss (Raw)": 2.0462324619293213, "Pretrain/Step": 1941, "Pretrain/Step Time": 8.505624115467072} +{"Pretrain/Learning Rate": 4.6149856249829606e-05, "Pretrain/Loss": 2.0664315223693848, "Pretrain/Loss (Raw)": 1.9334940910339355, "Pretrain/Step": 1942, "Pretrain/Step Time": 8.511954803019762} +{"Pretrain/Learning Rate": 4.6145328297771183e-05, "Pretrain/Loss": 2.0654807090759277, "Pretrain/Loss (Raw)": 2.005026340484619, "Pretrain/Step": 1943, "Pretrain/Step Time": 8.504420230165124} +{"Pretrain/Learning Rate": 4.614079790713387e-05, "Pretrain/Loss": 2.0653114318847656, "Pretrain/Loss (Raw)": 2.065356492996216, "Pretrain/Step": 1944, "Pretrain/Step Time": 8.499994026497006} +{"Pretrain/Learning Rate": 4.613626507844012e-05, "Pretrain/Loss": 2.0653300285339355, "Pretrain/Loss (Raw)": 2.107440710067749, "Pretrain/Step": 1945, "Pretrain/Step Time": 8.501091253012419} +{"Pretrain/Learning Rate": 4.613172981221268e-05, "Pretrain/Loss": 2.0625600814819336, "Pretrain/Loss (Raw)": 1.8549045324325562, "Pretrain/Step": 1946, "Pretrain/Step Time": 8.504816960543394} +{"Pretrain/Learning Rate": 4.612719210897459e-05, "Pretrain/Loss": 2.0623064041137695, "Pretrain/Loss (Raw)": 2.1322836875915527, "Pretrain/Step": 1947, "Pretrain/Step Time": 8.50751255825162} +{"Pretrain/Learning Rate": 4.612265196924914e-05, "Pretrain/Loss": 2.0631206035614014, "Pretrain/Loss (Raw)": 2.1942121982574463, "Pretrain/Step": 1948, "Pretrain/Step Time": 8.50360383093357} +{"Pretrain/Learning Rate": 4.611810939355995e-05, "Pretrain/Loss": 2.0610437393188477, "Pretrain/Loss (Raw)": 1.8411113023757935, "Pretrain/Step": 1949, "Pretrain/Step Time": 8.502647798508406} +{"Pretrain/Learning Rate": 4.611356438243085e-05, "Pretrain/Loss": 2.060152530670166, "Pretrain/Loss (Raw)": 1.8801268339157104, "Pretrain/Step": 1950, "Pretrain/Step Time": 8.497105652466416} +{"Pretrain/Learning Rate": 4.610901693638603e-05, "Pretrain/Loss": 2.059112548828125, "Pretrain/Loss (Raw)": 2.104543924331665, "Pretrain/Step": 1951, "Pretrain/Step Time": 8.505169177427888} +{"Pretrain/Learning Rate": 4.610446705594991e-05, "Pretrain/Loss": 2.0579588413238525, "Pretrain/Loss (Raw)": 1.815721035003662, "Pretrain/Step": 1952, "Pretrain/Step Time": 8.50426472723484} +{"Pretrain/Learning Rate": 4.6099914741647196e-05, "Pretrain/Loss": 2.0582733154296875, "Pretrain/Loss (Raw)": 2.2833685874938965, "Pretrain/Step": 1953, "Pretrain/Step Time": 8.504249893128872} +{"Pretrain/Learning Rate": 4.609535999400289e-05, "Pretrain/Loss": 2.0556769371032715, "Pretrain/Loss (Raw)": 2.0148749351501465, "Pretrain/Step": 1954, "Pretrain/Step Time": 8.503895599395037} +{"Pretrain/Learning Rate": 4.6090802813542255e-05, "Pretrain/Loss": 2.056347131729126, "Pretrain/Loss (Raw)": 2.185758113861084, "Pretrain/Step": 1955, "Pretrain/Step Time": 8.495974063873291} +{"Pretrain/Learning Rate": 4.608624320079087e-05, "Pretrain/Loss": 2.055698871612549, "Pretrain/Loss (Raw)": 2.0961453914642334, "Pretrain/Step": 1956, "Pretrain/Step Time": 8.497085956856608} +{"Pretrain/Learning Rate": 4.608168115627455e-05, "Pretrain/Loss": 2.057960033416748, "Pretrain/Loss (Raw)": 2.233180522918701, "Pretrain/Step": 1957, "Pretrain/Step Time": 8.498727466911077} +{"Pretrain/Learning Rate": 4.607711668051942e-05, "Pretrain/Loss": 2.054624319076538, "Pretrain/Loss (Raw)": 1.7736053466796875, "Pretrain/Step": 1958, "Pretrain/Step Time": 8.502803904935718} +{"Pretrain/Learning Rate": 4.6072549774051874e-05, "Pretrain/Loss": 2.049984931945801, "Pretrain/Loss (Raw)": 1.5145632028579712, "Pretrain/Step": 1959, "Pretrain/Step Time": 8.501453962177038} +{"Pretrain/Learning Rate": 4.60679804373986e-05, "Pretrain/Loss": 2.050985813140869, "Pretrain/Loss (Raw)": 1.9807761907577515, "Pretrain/Step": 1960, "Pretrain/Step Time": 8.49656480550766} +{"Pretrain/Learning Rate": 4.606340867108653e-05, "Pretrain/Loss": 2.0503134727478027, "Pretrain/Loss (Raw)": 2.131547212600708, "Pretrain/Step": 1961, "Pretrain/Step Time": 8.494463777169585} +{"Pretrain/Learning Rate": 4.605883447564293e-05, "Pretrain/Loss": 2.048649549484253, "Pretrain/Loss (Raw)": 2.1063709259033203, "Pretrain/Step": 1962, "Pretrain/Step Time": 8.493657166138291} +{"Pretrain/Learning Rate": 4.6054257851595303e-05, "Pretrain/Loss": 2.0486559867858887, "Pretrain/Loss (Raw)": 2.057742118835449, "Pretrain/Step": 1963, "Pretrain/Step Time": 8.494182910770178} +{"Pretrain/Learning Rate": 4.604967879947145e-05, "Pretrain/Loss": 2.048455238342285, "Pretrain/Loss (Raw)": 1.90269136428833, "Pretrain/Step": 1964, "Pretrain/Step Time": 8.495898012071848} +{"Pretrain/Learning Rate": 4.6045097319799447e-05, "Pretrain/Loss": 2.0479719638824463, "Pretrain/Loss (Raw)": 1.8294326066970825, "Pretrain/Step": 1965, "Pretrain/Step Time": 8.497565310448408} +{"Pretrain/Learning Rate": 4.6040513413107655e-05, "Pretrain/Loss": 2.046447277069092, "Pretrain/Loss (Raw)": 2.032898187637329, "Pretrain/Step": 1966, "Pretrain/Step Time": 8.499245187267661} +{"Pretrain/Learning Rate": 4.603592707992471e-05, "Pretrain/Loss": 2.0470032691955566, "Pretrain/Loss (Raw)": 2.1109445095062256, "Pretrain/Step": 1967, "Pretrain/Step Time": 8.494303399696946} +{"Pretrain/Learning Rate": 4.6031338320779534e-05, "Pretrain/Loss": 2.0470528602600098, "Pretrain/Loss (Raw)": 2.035151958465576, "Pretrain/Step": 1968, "Pretrain/Step Time": 8.49238926358521} +{"Pretrain/Learning Rate": 4.602674713620131e-05, "Pretrain/Loss": 2.0465593338012695, "Pretrain/Loss (Raw)": 2.201245069503784, "Pretrain/Step": 1969, "Pretrain/Step Time": 8.498017601668835} +{"Pretrain/Learning Rate": 4.6022153526719536e-05, "Pretrain/Loss": 2.047630548477173, "Pretrain/Loss (Raw)": 2.046192169189453, "Pretrain/Step": 1970, "Pretrain/Step Time": 8.500056339427829} +{"Pretrain/Learning Rate": 4.601755749286395e-05, "Pretrain/Loss": 2.0479226112365723, "Pretrain/Loss (Raw)": 2.0482017993927, "Pretrain/Step": 1971, "Pretrain/Step Time": 8.5079854875803} +{"Pretrain/Learning Rate": 4.6012959035164596e-05, "Pretrain/Loss": 2.050797462463379, "Pretrain/Loss (Raw)": 2.3179497718811035, "Pretrain/Step": 1972, "Pretrain/Step Time": 8.503907041624188} +{"Pretrain/Learning Rate": 4.6008358154151794e-05, "Pretrain/Loss": 2.051833152770996, "Pretrain/Loss (Raw)": 2.3023629188537598, "Pretrain/Step": 1973, "Pretrain/Step Time": 8.49390641786158} +{"Pretrain/Learning Rate": 4.600375485035613e-05, "Pretrain/Loss": 2.0537960529327393, "Pretrain/Loss (Raw)": 2.1301000118255615, "Pretrain/Step": 1974, "Pretrain/Step Time": 8.493837231770158} +{"Pretrain/Learning Rate": 4.599914912430849e-05, "Pretrain/Loss": 2.0548629760742188, "Pretrain/Loss (Raw)": 2.1608715057373047, "Pretrain/Step": 1975, "Pretrain/Step Time": 8.502245780080557} +{"Pretrain/Learning Rate": 4.5994540976540013e-05, "Pretrain/Loss": 2.055603265762329, "Pretrain/Loss (Raw)": 1.9502685070037842, "Pretrain/Step": 1976, "Pretrain/Step Time": 8.509738735854626} +{"Pretrain/Learning Rate": 4.598993040758215e-05, "Pretrain/Loss": 2.0572633743286133, "Pretrain/Loss (Raw)": 2.1500072479248047, "Pretrain/Step": 1977, "Pretrain/Step Time": 8.509949382394552} +{"Pretrain/Learning Rate": 4.59853174179666e-05, "Pretrain/Loss": 2.0588250160217285, "Pretrain/Loss (Raw)": 1.9696301221847534, "Pretrain/Step": 1978, "Pretrain/Step Time": 8.506121402606368} +{"Pretrain/Learning Rate": 4.5980702008225365e-05, "Pretrain/Loss": 2.0608766078948975, "Pretrain/Loss (Raw)": 2.0662577152252197, "Pretrain/Step": 1979, "Pretrain/Step Time": 8.506376344710588} +{"Pretrain/Learning Rate": 4.59760841788907e-05, "Pretrain/Loss": 2.062026023864746, "Pretrain/Loss (Raw)": 2.151549816131592, "Pretrain/Step": 1980, "Pretrain/Step Time": 8.503225995227695} +{"Pretrain/Learning Rate": 4.597146393049517e-05, "Pretrain/Loss": 2.065335750579834, "Pretrain/Loss (Raw)": 2.4364356994628906, "Pretrain/Step": 1981, "Pretrain/Step Time": 8.5023752450943} +{"Pretrain/Learning Rate": 4.59668412635716e-05, "Pretrain/Loss": 2.0611720085144043, "Pretrain/Loss (Raw)": 1.6280121803283691, "Pretrain/Step": 1982, "Pretrain/Step Time": 8.50372052565217} +{"Pretrain/Learning Rate": 4.5962216178653095e-05, "Pretrain/Loss": 2.0616769790649414, "Pretrain/Loss (Raw)": 2.051741600036621, "Pretrain/Step": 1983, "Pretrain/Step Time": 8.514145171269774} +{"Pretrain/Learning Rate": 4.5957588676273046e-05, "Pretrain/Loss": 2.0639166831970215, "Pretrain/Loss (Raw)": 2.30433988571167, "Pretrain/Step": 1984, "Pretrain/Step Time": 8.505855228751898} +{"Pretrain/Learning Rate": 4.595295875696511e-05, "Pretrain/Loss": 2.0625247955322266, "Pretrain/Loss (Raw)": 1.990970253944397, "Pretrain/Step": 1985, "Pretrain/Step Time": 8.510595606639981} +{"Pretrain/Learning Rate": 4.5948326421263244e-05, "Pretrain/Loss": 2.0618414878845215, "Pretrain/Loss (Raw)": 1.9998703002929688, "Pretrain/Step": 1986, "Pretrain/Step Time": 8.508857741951942} +{"Pretrain/Learning Rate": 4.5943691669701654e-05, "Pretrain/Loss": 2.062145709991455, "Pretrain/Loss (Raw)": 2.135458469390869, "Pretrain/Step": 1987, "Pretrain/Step Time": 8.517206134274602} +{"Pretrain/Learning Rate": 4.593905450281486e-05, "Pretrain/Loss": 2.063018798828125, "Pretrain/Loss (Raw)": 2.1327528953552246, "Pretrain/Step": 1988, "Pretrain/Step Time": 8.519511122256517} +{"Pretrain/Learning Rate": 4.593441492113763e-05, "Pretrain/Loss": 2.0646979808807373, "Pretrain/Loss (Raw)": 2.170088291168213, "Pretrain/Step": 1989, "Pretrain/Step Time": 8.524093436077237} +{"Pretrain/Learning Rate": 4.5929772925205014e-05, "Pretrain/Loss": 2.067387580871582, "Pretrain/Loss (Raw)": 2.502640724182129, "Pretrain/Step": 1990, "Pretrain/Step Time": 8.524052016437054} +{"Pretrain/Learning Rate": 4.592512851555237e-05, "Pretrain/Loss": 2.065979480743408, "Pretrain/Loss (Raw)": 2.041018009185791, "Pretrain/Step": 1991, "Pretrain/Step Time": 8.520186332985759} +{"Pretrain/Learning Rate": 4.592048169271531e-05, "Pretrain/Loss": 2.066617012023926, "Pretrain/Loss (Raw)": 1.897942066192627, "Pretrain/Step": 1992, "Pretrain/Step Time": 8.518518073484302} +{"Pretrain/Learning Rate": 4.591583245722971e-05, "Pretrain/Loss": 2.067514181137085, "Pretrain/Loss (Raw)": 2.020402431488037, "Pretrain/Step": 1993, "Pretrain/Step Time": 8.518253173679113} +{"Pretrain/Learning Rate": 4.591118080963176e-05, "Pretrain/Loss": 2.0662736892700195, "Pretrain/Loss (Raw)": 1.978369951248169, "Pretrain/Step": 1994, "Pretrain/Step Time": 8.524997308850288} +{"Pretrain/Learning Rate": 4.590652675045789e-05, "Pretrain/Loss": 2.0658087730407715, "Pretrain/Loss (Raw)": 2.0046944618225098, "Pretrain/Step": 1995, "Pretrain/Step Time": 8.521433494985104} +{"Pretrain/Learning Rate": 4.5901870280244855e-05, "Pretrain/Loss": 2.0643651485443115, "Pretrain/Loss (Raw)": 1.695502519607544, "Pretrain/Step": 1996, "Pretrain/Step Time": 8.514799179509282} +{"Pretrain/Learning Rate": 4.589721139952964e-05, "Pretrain/Loss": 2.0672969818115234, "Pretrain/Loss (Raw)": 2.1236603260040283, "Pretrain/Step": 1997, "Pretrain/Step Time": 8.51560310460627} +{"Pretrain/Learning Rate": 4.589255010884953e-05, "Pretrain/Loss": 2.0672006607055664, "Pretrain/Loss (Raw)": 1.9728227853775024, "Pretrain/Step": 1998, "Pretrain/Step Time": 8.511312991380692} +{"Pretrain/Learning Rate": 4.58878864087421e-05, "Pretrain/Loss": 2.067193031311035, "Pretrain/Loss (Raw)": 2.013017177581787, "Pretrain/Step": 1999, "Pretrain/Step Time": 8.520696500316262} +{"Pretrain/Learning Rate": 4.5883220299745176e-05, "Pretrain/Loss": 2.0669708251953125, "Pretrain/Loss (Raw)": 1.9710391759872437, "Pretrain/Step": 2000, "Pretrain/Step Time": 8.529710611328483} +{"Pretrain/Learning Rate": 4.587855178239689e-05, "Pretrain/Loss": 2.068777561187744, "Pretrain/Loss (Raw)": 2.080850839614868, "Pretrain/Step": 2001, "Pretrain/Step Time": 8.523381523787975} +{"Pretrain/Learning Rate": 4.587388085723562e-05, "Pretrain/Loss": 2.0691521167755127, "Pretrain/Loss (Raw)": 2.1822001934051514, "Pretrain/Step": 2002, "Pretrain/Step Time": 8.52220544219017} +{"Pretrain/Learning Rate": 4.586920752480006e-05, "Pretrain/Loss": 2.0717482566833496, "Pretrain/Loss (Raw)": 2.3656423091888428, "Pretrain/Step": 2003, "Pretrain/Step Time": 8.52156143821776} +{"Pretrain/Learning Rate": 4.5864531785629136e-05, "Pretrain/Loss": 2.071824550628662, "Pretrain/Loss (Raw)": 2.103886842727661, "Pretrain/Step": 2004, "Pretrain/Step Time": 8.52421996742487} +{"Pretrain/Learning Rate": 4.5859853640262104e-05, "Pretrain/Loss": 2.073090076446533, "Pretrain/Loss (Raw)": 2.1711127758026123, "Pretrain/Step": 2005, "Pretrain/Step Time": 8.527433490380645} +{"Pretrain/Learning Rate": 4.5855173089238445e-05, "Pretrain/Loss": 2.073855400085449, "Pretrain/Loss (Raw)": 2.2042148113250732, "Pretrain/Step": 2006, "Pretrain/Step Time": 8.5363445058465} +{"Pretrain/Learning Rate": 4.5850490133097957e-05, "Pretrain/Loss": 2.0745487213134766, "Pretrain/Loss (Raw)": 2.0612356662750244, "Pretrain/Step": 2007, "Pretrain/Step Time": 8.528745202347636} +{"Pretrain/Learning Rate": 4.584580477238069e-05, "Pretrain/Loss": 2.07163143157959, "Pretrain/Loss (Raw)": 1.8531662225723267, "Pretrain/Step": 2008, "Pretrain/Step Time": 8.533405737951398} +{"Pretrain/Learning Rate": 4.5841117007627e-05, "Pretrain/Loss": 2.0706446170806885, "Pretrain/Loss (Raw)": 2.072183847427368, "Pretrain/Step": 2009, "Pretrain/Step Time": 8.528246691450477} +{"Pretrain/Learning Rate": 4.583642683937748e-05, "Pretrain/Loss": 2.072321653366089, "Pretrain/Loss (Raw)": 2.26348876953125, "Pretrain/Step": 2010, "Pretrain/Step Time": 8.523191392421722} +{"Pretrain/Learning Rate": 4.583173426817304e-05, "Pretrain/Loss": 2.0706138610839844, "Pretrain/Loss (Raw)": 2.040656566619873, "Pretrain/Step": 2011, "Pretrain/Step Time": 8.53564658202231} +{"Pretrain/Learning Rate": 4.5827039294554833e-05, "Pretrain/Loss": 2.070589065551758, "Pretrain/Loss (Raw)": 2.08791184425354, "Pretrain/Step": 2012, "Pretrain/Step Time": 8.533079272136092} +{"Pretrain/Learning Rate": 4.582234191906432e-05, "Pretrain/Loss": 2.070065498352051, "Pretrain/Loss (Raw)": 1.876891851425171, "Pretrain/Step": 2013, "Pretrain/Step Time": 8.532611705362797} +{"Pretrain/Learning Rate": 4.581764214224322e-05, "Pretrain/Loss": 2.0710082054138184, "Pretrain/Loss (Raw)": 2.136594533920288, "Pretrain/Step": 2014, "Pretrain/Step Time": 8.526009790599346} +{"Pretrain/Learning Rate": 4.581293996463353e-05, "Pretrain/Loss": 2.071566581726074, "Pretrain/Loss (Raw)": 2.1572632789611816, "Pretrain/Step": 2015, "Pretrain/Step Time": 8.522256433963776} +{"Pretrain/Learning Rate": 4.580823538677753e-05, "Pretrain/Loss": 2.070051670074463, "Pretrain/Loss (Raw)": 1.9285597801208496, "Pretrain/Step": 2016, "Pretrain/Step Time": 8.515947796404362} +{"Pretrain/Learning Rate": 4.580352840921777e-05, "Pretrain/Loss": 2.0682477951049805, "Pretrain/Loss (Raw)": 1.9752930402755737, "Pretrain/Step": 2017, "Pretrain/Step Time": 8.527633003890514} +{"Pretrain/Learning Rate": 4.579881903249709e-05, "Pretrain/Loss": 2.067012310028076, "Pretrain/Loss (Raw)": 2.179094076156616, "Pretrain/Step": 2018, "Pretrain/Step Time": 8.523389916867018} +{"Pretrain/Learning Rate": 4.5794107257158595e-05, "Pretrain/Loss": 2.065880298614502, "Pretrain/Loss (Raw)": 2.06270432472229, "Pretrain/Step": 2019, "Pretrain/Step Time": 8.523962739855051} +{"Pretrain/Learning Rate": 4.578939308374566e-05, "Pretrain/Loss": 2.0639283657073975, "Pretrain/Loss (Raw)": 2.045994758605957, "Pretrain/Step": 2020, "Pretrain/Step Time": 8.517255021259189} +{"Pretrain/Learning Rate": 4.578467651280195e-05, "Pretrain/Loss": 2.063477039337158, "Pretrain/Loss (Raw)": 2.0244951248168945, "Pretrain/Step": 2021, "Pretrain/Step Time": 8.518401501700282} +{"Pretrain/Learning Rate": 4.57799575448714e-05, "Pretrain/Loss": 2.062842845916748, "Pretrain/Loss (Raw)": 2.052183151245117, "Pretrain/Step": 2022, "Pretrain/Step Time": 8.507024262100458} +{"Pretrain/Learning Rate": 4.5775236180498235e-05, "Pretrain/Loss": 2.0660629272460938, "Pretrain/Loss (Raw)": 2.312889575958252, "Pretrain/Step": 2023, "Pretrain/Step Time": 8.514642808586359} +{"Pretrain/Learning Rate": 4.5770512420226934e-05, "Pretrain/Loss": 2.0662131309509277, "Pretrain/Loss (Raw)": 2.1285386085510254, "Pretrain/Step": 2024, "Pretrain/Step Time": 8.511702548712492} +{"Pretrain/Learning Rate": 4.5765786264602274e-05, "Pretrain/Loss": 2.0657944679260254, "Pretrain/Loss (Raw)": 2.1311306953430176, "Pretrain/Step": 2025, "Pretrain/Step Time": 8.51480096951127} +{"Pretrain/Learning Rate": 4.5761057714169284e-05, "Pretrain/Loss": 2.0676605701446533, "Pretrain/Loss (Raw)": 2.3605737686157227, "Pretrain/Step": 2026, "Pretrain/Step Time": 8.5097640696913} +{"Pretrain/Learning Rate": 4.575632676947329e-05, "Pretrain/Loss": 2.0718884468078613, "Pretrain/Loss (Raw)": 2.3771939277648926, "Pretrain/Step": 2027, "Pretrain/Step Time": 8.501653917133808} +{"Pretrain/Learning Rate": 4.575159343105988e-05, "Pretrain/Loss": 2.0719809532165527, "Pretrain/Loss (Raw)": 1.83455228805542, "Pretrain/Step": 2028, "Pretrain/Step Time": 8.502519901841879} +{"Pretrain/Learning Rate": 4.5746857699474946e-05, "Pretrain/Loss": 2.0729269981384277, "Pretrain/Loss (Raw)": 2.1604907512664795, "Pretrain/Step": 2029, "Pretrain/Step Time": 8.502338519319892} +{"Pretrain/Learning Rate": 4.574211957526461e-05, "Pretrain/Loss": 2.0717592239379883, "Pretrain/Loss (Raw)": 2.0722200870513916, "Pretrain/Step": 2030, "Pretrain/Step Time": 8.5081832613796} +{"Pretrain/Learning Rate": 4.57373790589753e-05, "Pretrain/Loss": 2.071500301361084, "Pretrain/Loss (Raw)": 2.0715420246124268, "Pretrain/Step": 2031, "Pretrain/Step Time": 8.506560280919075} +{"Pretrain/Learning Rate": 4.573263615115372e-05, "Pretrain/Loss": 2.072580337524414, "Pretrain/Loss (Raw)": 1.9977058172225952, "Pretrain/Step": 2032, "Pretrain/Step Time": 8.502360800281167} +{"Pretrain/Learning Rate": 4.572789085234686e-05, "Pretrain/Loss": 2.0718305110931396, "Pretrain/Loss (Raw)": 1.9994583129882812, "Pretrain/Step": 2033, "Pretrain/Step Time": 8.496192872524261} +{"Pretrain/Learning Rate": 4.5723143163101934e-05, "Pretrain/Loss": 2.071244955062866, "Pretrain/Loss (Raw)": 2.1346611976623535, "Pretrain/Step": 2034, "Pretrain/Step Time": 8.50221522897482} +{"Pretrain/Learning Rate": 4.571839308396649e-05, "Pretrain/Loss": 2.07161283493042, "Pretrain/Loss (Raw)": 2.0795068740844727, "Pretrain/Step": 2035, "Pretrain/Step Time": 8.504367968067527} +{"Pretrain/Learning Rate": 4.571364061548834e-05, "Pretrain/Loss": 2.0713229179382324, "Pretrain/Loss (Raw)": 1.949654459953308, "Pretrain/Step": 2036, "Pretrain/Step Time": 8.505868718028069} +{"Pretrain/Learning Rate": 4.5708885758215543e-05, "Pretrain/Loss": 2.0717129707336426, "Pretrain/Loss (Raw)": 2.0129191875457764, "Pretrain/Step": 2037, "Pretrain/Step Time": 8.504419272765517} +{"Pretrain/Learning Rate": 4.570412851269645e-05, "Pretrain/Loss": 2.071157932281494, "Pretrain/Loss (Raw)": 2.008768320083618, "Pretrain/Step": 2038, "Pretrain/Step Time": 8.489900935441256} +{"Pretrain/Learning Rate": 4.56993688794797e-05, "Pretrain/Loss": 2.0692875385284424, "Pretrain/Loss (Raw)": 1.8500422239303589, "Pretrain/Step": 2039, "Pretrain/Step Time": 8.491458782926202} +{"Pretrain/Learning Rate": 4.5694606859114196e-05, "Pretrain/Loss": 2.070402145385742, "Pretrain/Loss (Raw)": 2.238304376602173, "Pretrain/Step": 2040, "Pretrain/Step Time": 8.49044737406075} +{"Pretrain/Learning Rate": 4.5689842452149114e-05, "Pretrain/Loss": 2.071406602859497, "Pretrain/Loss (Raw)": 2.3173234462738037, "Pretrain/Step": 2041, "Pretrain/Step Time": 8.496649455279112} +{"Pretrain/Learning Rate": 4.56850756591339e-05, "Pretrain/Loss": 2.0704355239868164, "Pretrain/Loss (Raw)": 2.151970624923706, "Pretrain/Step": 2042, "Pretrain/Step Time": 8.504217555746436} +{"Pretrain/Learning Rate": 4.56803064806183e-05, "Pretrain/Loss": 2.0717992782592773, "Pretrain/Loss (Raw)": 2.151344060897827, "Pretrain/Step": 2043, "Pretrain/Step Time": 8.50315922871232} +{"Pretrain/Learning Rate": 4.567553491715229e-05, "Pretrain/Loss": 2.069365978240967, "Pretrain/Loss (Raw)": 1.8496272563934326, "Pretrain/Step": 2044, "Pretrain/Step Time": 8.494748391211033} +{"Pretrain/Learning Rate": 4.567076096928618e-05, "Pretrain/Loss": 2.069383144378662, "Pretrain/Loss (Raw)": 2.027285575866699, "Pretrain/Step": 2045, "Pretrain/Step Time": 8.500768147408962} +{"Pretrain/Learning Rate": 4.566598463757051e-05, "Pretrain/Loss": 2.0687313079833984, "Pretrain/Loss (Raw)": 2.1183462142944336, "Pretrain/Step": 2046, "Pretrain/Step Time": 8.506270525977015} +{"Pretrain/Learning Rate": 4.56612059225561e-05, "Pretrain/Loss": 2.0703792572021484, "Pretrain/Loss (Raw)": 2.410208225250244, "Pretrain/Step": 2047, "Pretrain/Step Time": 8.502057703211904} +{"Pretrain/Learning Rate": 4.565642482479408e-05, "Pretrain/Loss": 2.068676471710205, "Pretrain/Loss (Raw)": 1.972304105758667, "Pretrain/Step": 2048, "Pretrain/Step Time": 8.505910288542509} +{"Pretrain/Learning Rate": 4.565164134483581e-05, "Pretrain/Loss": 2.0698957443237305, "Pretrain/Loss (Raw)": 2.1958885192871094, "Pretrain/Step": 2049, "Pretrain/Step Time": 8.505978122353554} +{"Pretrain/Learning Rate": 4.5646855483232935e-05, "Pretrain/Loss": 2.0695548057556152, "Pretrain/Loss (Raw)": 1.9904268980026245, "Pretrain/Step": 2050, "Pretrain/Step Time": 8.502052165567875} +{"Pretrain/Learning Rate": 4.56420672405374e-05, "Pretrain/Loss": 2.070690631866455, "Pretrain/Loss (Raw)": 2.1996381282806396, "Pretrain/Step": 2051, "Pretrain/Step Time": 8.497568313032389} +{"Pretrain/Learning Rate": 4.563727661730141e-05, "Pretrain/Loss": 2.0760974884033203, "Pretrain/Loss (Raw)": 2.268372058868408, "Pretrain/Step": 2052, "Pretrain/Step Time": 8.502786433324218} +{"Pretrain/Learning Rate": 4.563248361407743e-05, "Pretrain/Loss": 2.0756828784942627, "Pretrain/Loss (Raw)": 2.080287456512451, "Pretrain/Step": 2053, "Pretrain/Step Time": 8.507282439619303} +{"Pretrain/Learning Rate": 4.562768823141821e-05, "Pretrain/Loss": 2.075939178466797, "Pretrain/Loss (Raw)": 2.1830012798309326, "Pretrain/Step": 2054, "Pretrain/Step Time": 8.509085228666663} +{"Pretrain/Learning Rate": 4.562289046987679e-05, "Pretrain/Loss": 2.078195333480835, "Pretrain/Loss (Raw)": 2.3037900924682617, "Pretrain/Step": 2055, "Pretrain/Step Time": 8.502556256949902} +{"Pretrain/Learning Rate": 4.561809033000646e-05, "Pretrain/Loss": 2.079470634460449, "Pretrain/Loss (Raw)": 2.197645664215088, "Pretrain/Step": 2056, "Pretrain/Step Time": 8.498046956956387} +{"Pretrain/Learning Rate": 4.5613287812360796e-05, "Pretrain/Loss": 2.079954147338867, "Pretrain/Loss (Raw)": 2.060028314590454, "Pretrain/Step": 2057, "Pretrain/Step Time": 8.499078238382936} +{"Pretrain/Learning Rate": 4.560848291749365e-05, "Pretrain/Loss": 2.0780162811279297, "Pretrain/Loss (Raw)": 1.8575689792633057, "Pretrain/Step": 2058, "Pretrain/Step Time": 8.501485703513026} +{"Pretrain/Learning Rate": 4.560367564595914e-05, "Pretrain/Loss": 2.0779786109924316, "Pretrain/Loss (Raw)": 2.118248701095581, "Pretrain/Step": 2059, "Pretrain/Step Time": 8.50036957114935} +{"Pretrain/Learning Rate": 4.559886599831167e-05, "Pretrain/Loss": 2.077493667602539, "Pretrain/Loss (Raw)": 1.954516887664795, "Pretrain/Step": 2060, "Pretrain/Step Time": 8.510334940627217} +{"Pretrain/Learning Rate": 4.559405397510591e-05, "Pretrain/Loss": 2.0787360668182373, "Pretrain/Loss (Raw)": 2.4079084396362305, "Pretrain/Step": 2061, "Pretrain/Step Time": 8.498512638732791} +{"Pretrain/Learning Rate": 4.55892395768968e-05, "Pretrain/Loss": 2.076974630355835, "Pretrain/Loss (Raw)": 2.0002472400665283, "Pretrain/Step": 2062, "Pretrain/Step Time": 8.500036638230085} +{"Pretrain/Learning Rate": 4.5584422804239566e-05, "Pretrain/Loss": 2.075195789337158, "Pretrain/Loss (Raw)": 1.8105169534683228, "Pretrain/Step": 2063, "Pretrain/Step Time": 8.49524013698101} +{"Pretrain/Learning Rate": 4.55796036576897e-05, "Pretrain/Loss": 2.074981689453125, "Pretrain/Loss (Raw)": 1.9806430339813232, "Pretrain/Step": 2064, "Pretrain/Step Time": 8.5133444853127} +{"Pretrain/Learning Rate": 4.557478213780295e-05, "Pretrain/Loss": 2.0749526023864746, "Pretrain/Loss (Raw)": 2.1170036792755127, "Pretrain/Step": 2065, "Pretrain/Step Time": 8.515639636665583} +{"Pretrain/Learning Rate": 4.556995824513539e-05, "Pretrain/Loss": 2.0714569091796875, "Pretrain/Loss (Raw)": 1.7193830013275146, "Pretrain/Step": 2066, "Pretrain/Step Time": 8.513602413237095} +{"Pretrain/Learning Rate": 4.5565131980243305e-05, "Pretrain/Loss": 2.069922924041748, "Pretrain/Loss (Raw)": 1.8745205402374268, "Pretrain/Step": 2067, "Pretrain/Step Time": 8.51229371316731} +{"Pretrain/Learning Rate": 4.55603033436833e-05, "Pretrain/Loss": 2.06925892829895, "Pretrain/Loss (Raw)": 2.0663936138153076, "Pretrain/Step": 2068, "Pretrain/Step Time": 8.507976522669196} +{"Pretrain/Learning Rate": 4.555547233601223e-05, "Pretrain/Loss": 2.069668769836426, "Pretrain/Loss (Raw)": 2.098705291748047, "Pretrain/Step": 2069, "Pretrain/Step Time": 8.510006494820118} +{"Pretrain/Learning Rate": 4.555063895778723e-05, "Pretrain/Loss": 2.0711140632629395, "Pretrain/Loss (Raw)": 2.1185107231140137, "Pretrain/Step": 2070, "Pretrain/Step Time": 8.509742142632604} +{"Pretrain/Learning Rate": 4.5545803209565704e-05, "Pretrain/Loss": 2.0698163509368896, "Pretrain/Loss (Raw)": 1.8388817310333252, "Pretrain/Step": 2071, "Pretrain/Step Time": 8.513620808720589} +{"Pretrain/Learning Rate": 4.554096509190534e-05, "Pretrain/Loss": 2.071052312850952, "Pretrain/Loss (Raw)": 2.223576784133911, "Pretrain/Step": 2072, "Pretrain/Step Time": 8.518728481605649} +{"Pretrain/Learning Rate": 4.5536124605364085e-05, "Pretrain/Loss": 2.0714311599731445, "Pretrain/Loss (Raw)": 2.1559276580810547, "Pretrain/Step": 2073, "Pretrain/Step Time": 8.513833977282047} +{"Pretrain/Learning Rate": 4.553128175050018e-05, "Pretrain/Loss": 2.072824001312256, "Pretrain/Loss (Raw)": 2.033158302307129, "Pretrain/Step": 2074, "Pretrain/Step Time": 8.503928914666176} +{"Pretrain/Learning Rate": 4.552643652787211e-05, "Pretrain/Loss": 2.0727591514587402, "Pretrain/Loss (Raw)": 2.124025583267212, "Pretrain/Step": 2075, "Pretrain/Step Time": 8.499545898288488} +{"Pretrain/Learning Rate": 4.552158893803865e-05, "Pretrain/Loss": 2.073286533355713, "Pretrain/Loss (Raw)": 2.2617037296295166, "Pretrain/Step": 2076, "Pretrain/Step Time": 8.505608497187495} +{"Pretrain/Learning Rate": 4.551673898155886e-05, "Pretrain/Loss": 2.0721662044525146, "Pretrain/Loss (Raw)": 1.697707176208496, "Pretrain/Step": 2077, "Pretrain/Step Time": 8.50559951364994} +{"Pretrain/Learning Rate": 4.5511886658992055e-05, "Pretrain/Loss": 2.076289653778076, "Pretrain/Loss (Raw)": 2.407951831817627, "Pretrain/Step": 2078, "Pretrain/Step Time": 8.517380770295858} +{"Pretrain/Learning Rate": 4.550703197089782e-05, "Pretrain/Loss": 2.075958728790283, "Pretrain/Loss (Raw)": 2.0621492862701416, "Pretrain/Step": 2079, "Pretrain/Step Time": 8.509048821404576} +{"Pretrain/Learning Rate": 4.550217491783603e-05, "Pretrain/Loss": 2.077280282974243, "Pretrain/Loss (Raw)": 1.984910011291504, "Pretrain/Step": 2080, "Pretrain/Step Time": 8.512379508465528} +{"Pretrain/Learning Rate": 4.549731550036682e-05, "Pretrain/Loss": 2.072899103164673, "Pretrain/Loss (Raw)": 1.7225888967514038, "Pretrain/Step": 2081, "Pretrain/Step Time": 8.513435056433082} +{"Pretrain/Learning Rate": 4.5492453719050596e-05, "Pretrain/Loss": 2.0722298622131348, "Pretrain/Loss (Raw)": 1.9291720390319824, "Pretrain/Step": 2082, "Pretrain/Step Time": 8.518902080133557} +{"Pretrain/Learning Rate": 4.5487589574448046e-05, "Pretrain/Loss": 2.0718681812286377, "Pretrain/Loss (Raw)": 2.1394667625427246, "Pretrain/Step": 2083, "Pretrain/Step Time": 8.52434833906591} +{"Pretrain/Learning Rate": 4.5482723067120124e-05, "Pretrain/Loss": 2.0701684951782227, "Pretrain/Loss (Raw)": 1.8786059617996216, "Pretrain/Step": 2084, "Pretrain/Step Time": 8.527475662529469} +{"Pretrain/Learning Rate": 4.547785419762807e-05, "Pretrain/Loss": 2.0668511390686035, "Pretrain/Loss (Raw)": 1.8085651397705078, "Pretrain/Step": 2085, "Pretrain/Step Time": 8.52462780661881} +{"Pretrain/Learning Rate": 4.547298296653336e-05, "Pretrain/Loss": 2.0684454441070557, "Pretrain/Loss (Raw)": 1.9776555299758911, "Pretrain/Step": 2086, "Pretrain/Step Time": 8.515626473352313} +{"Pretrain/Learning Rate": 4.5468109374397796e-05, "Pretrain/Loss": 2.0727932453155518, "Pretrain/Loss (Raw)": 2.0710806846618652, "Pretrain/Step": 2087, "Pretrain/Step Time": 8.515585927292705} +{"Pretrain/Learning Rate": 4.54632334217834e-05, "Pretrain/Loss": 2.0742430686950684, "Pretrain/Loss (Raw)": 2.16635799407959, "Pretrain/Step": 2088, "Pretrain/Step Time": 8.520529748871922} +{"Pretrain/Learning Rate": 4.545835510925251e-05, "Pretrain/Loss": 2.0737180709838867, "Pretrain/Loss (Raw)": 2.0643646717071533, "Pretrain/Step": 2089, "Pretrain/Step Time": 8.526356115937233} +{"Pretrain/Learning Rate": 4.5453474437367695e-05, "Pretrain/Loss": 2.073096752166748, "Pretrain/Loss (Raw)": 2.0267996788024902, "Pretrain/Step": 2090, "Pretrain/Step Time": 8.527216203510761} +{"Pretrain/Learning Rate": 4.544859140669183e-05, "Pretrain/Loss": 2.072688102722168, "Pretrain/Loss (Raw)": 2.0054595470428467, "Pretrain/Step": 2091, "Pretrain/Step Time": 8.526720067486167} +{"Pretrain/Learning Rate": 4.5443706017788054e-05, "Pretrain/Loss": 2.0779004096984863, "Pretrain/Loss (Raw)": 2.5698647499084473, "Pretrain/Step": 2092, "Pretrain/Step Time": 8.52371571958065} +{"Pretrain/Learning Rate": 4.5438818271219765e-05, "Pretrain/Loss": 2.0787954330444336, "Pretrain/Loss (Raw)": 1.944015622138977, "Pretrain/Step": 2093, "Pretrain/Step Time": 8.526366975158453} +{"Pretrain/Learning Rate": 4.5433928167550634e-05, "Pretrain/Loss": 2.0833349227905273, "Pretrain/Loss (Raw)": 2.613936424255371, "Pretrain/Step": 2094, "Pretrain/Step Time": 8.530864387750626} +{"Pretrain/Learning Rate": 4.542903570734463e-05, "Pretrain/Loss": 2.0836758613586426, "Pretrain/Loss (Raw)": 2.1546027660369873, "Pretrain/Step": 2095, "Pretrain/Step Time": 8.533661296591163} +{"Pretrain/Learning Rate": 4.542414089116595e-05, "Pretrain/Loss": 2.0837042331695557, "Pretrain/Loss (Raw)": 2.0387637615203857, "Pretrain/Step": 2096, "Pretrain/Step Time": 8.530994722619653} +{"Pretrain/Learning Rate": 4.541924371957911e-05, "Pretrain/Loss": 2.083738327026367, "Pretrain/Loss (Raw)": 2.205624580383301, "Pretrain/Step": 2097, "Pretrain/Step Time": 8.523675601929426} +{"Pretrain/Learning Rate": 4.5414344193148866e-05, "Pretrain/Loss": 2.0849437713623047, "Pretrain/Loss (Raw)": 2.200490713119507, "Pretrain/Step": 2098, "Pretrain/Step Time": 8.517541879788041} +{"Pretrain/Learning Rate": 4.540944231244025e-05, "Pretrain/Loss": 2.086087226867676, "Pretrain/Loss (Raw)": 2.1945364475250244, "Pretrain/Step": 2099, "Pretrain/Step Time": 8.519485581666231} +{"Pretrain/Learning Rate": 4.540453807801858e-05, "Pretrain/Loss": 2.0847878456115723, "Pretrain/Loss (Raw)": 2.151660442352295, "Pretrain/Step": 2100, "Pretrain/Step Time": 8.522886600345373} +{"Pretrain/Learning Rate": 4.539963149044943e-05, "Pretrain/Loss": 2.0827038288116455, "Pretrain/Loss (Raw)": 2.0355827808380127, "Pretrain/Step": 2101, "Pretrain/Step Time": 8.525596564635634} +{"Pretrain/Learning Rate": 4.539472255029864e-05, "Pretrain/Loss": 2.081502914428711, "Pretrain/Loss (Raw)": 1.976374626159668, "Pretrain/Step": 2102, "Pretrain/Step Time": 8.527287650853395} +{"Pretrain/Learning Rate": 4.538981125813235e-05, "Pretrain/Loss": 2.0804619789123535, "Pretrain/Loss (Raw)": 2.0276591777801514, "Pretrain/Step": 2103, "Pretrain/Step Time": 8.516917392611504} +{"Pretrain/Learning Rate": 4.538489761451694e-05, "Pretrain/Loss": 2.0806596279144287, "Pretrain/Loss (Raw)": 1.9755582809448242, "Pretrain/Step": 2104, "Pretrain/Step Time": 8.51053954847157} +{"Pretrain/Learning Rate": 4.537998162001909e-05, "Pretrain/Loss": 2.0794436931610107, "Pretrain/Loss (Raw)": 1.9943772554397583, "Pretrain/Step": 2105, "Pretrain/Step Time": 8.5114791020751} +{"Pretrain/Learning Rate": 4.537506327520571e-05, "Pretrain/Loss": 2.080554723739624, "Pretrain/Loss (Raw)": 2.1118359565734863, "Pretrain/Step": 2106, "Pretrain/Step Time": 8.50713212788105} +{"Pretrain/Learning Rate": 4.5370142580644036e-05, "Pretrain/Loss": 2.0805697441101074, "Pretrain/Loss (Raw)": 2.0681698322296143, "Pretrain/Step": 2107, "Pretrain/Step Time": 8.514305640012026} +{"Pretrain/Learning Rate": 4.536521953690153e-05, "Pretrain/Loss": 2.078355073928833, "Pretrain/Loss (Raw)": 1.86808180809021, "Pretrain/Step": 2108, "Pretrain/Step Time": 8.51914750598371} +{"Pretrain/Learning Rate": 4.5360294144545946e-05, "Pretrain/Loss": 2.07604718208313, "Pretrain/Loss (Raw)": 2.141023635864258, "Pretrain/Step": 2109, "Pretrain/Step Time": 8.520560132339597} +{"Pretrain/Learning Rate": 4.5355366404145294e-05, "Pretrain/Loss": 2.0801239013671875, "Pretrain/Loss (Raw)": 2.149819850921631, "Pretrain/Step": 2110, "Pretrain/Step Time": 8.518451297655702} +{"Pretrain/Learning Rate": 4.5350436316267876e-05, "Pretrain/Loss": 2.0806541442871094, "Pretrain/Loss (Raw)": 2.119652509689331, "Pretrain/Step": 2111, "Pretrain/Step Time": 8.515666756778955} +{"Pretrain/Learning Rate": 4.534550388148224e-05, "Pretrain/Loss": 2.079662799835205, "Pretrain/Loss (Raw)": 2.177419424057007, "Pretrain/Step": 2112, "Pretrain/Step Time": 8.512589992955327} +{"Pretrain/Learning Rate": 4.5340569100357235e-05, "Pretrain/Loss": 2.0808980464935303, "Pretrain/Loss (Raw)": 2.1490895748138428, "Pretrain/Step": 2113, "Pretrain/Step Time": 8.51240823045373} +{"Pretrain/Learning Rate": 4.5335631973461944e-05, "Pretrain/Loss": 2.0810294151306152, "Pretrain/Loss (Raw)": 2.0166821479797363, "Pretrain/Step": 2114, "Pretrain/Step Time": 8.513809183612466} +{"Pretrain/Learning Rate": 4.5330692501365755e-05, "Pretrain/Loss": 2.0802016258239746, "Pretrain/Loss (Raw)": 2.029505729675293, "Pretrain/Step": 2115, "Pretrain/Step Time": 8.505000496283174} +{"Pretrain/Learning Rate": 4.532575068463831e-05, "Pretrain/Loss": 2.0804059505462646, "Pretrain/Loss (Raw)": 2.15889310836792, "Pretrain/Step": 2116, "Pretrain/Step Time": 8.500339560210705} +{"Pretrain/Learning Rate": 4.532080652384951e-05, "Pretrain/Loss": 2.0788629055023193, "Pretrain/Loss (Raw)": 1.9725806713104248, "Pretrain/Step": 2117, "Pretrain/Step Time": 8.499331939965487} +{"Pretrain/Learning Rate": 4.5315860019569546e-05, "Pretrain/Loss": 2.076885461807251, "Pretrain/Loss (Raw)": 2.2495296001434326, "Pretrain/Step": 2118, "Pretrain/Step Time": 8.49705271422863} +{"Pretrain/Learning Rate": 4.531091117236888e-05, "Pretrain/Loss": 2.0796611309051514, "Pretrain/Loss (Raw)": 2.3963003158569336, "Pretrain/Step": 2119, "Pretrain/Step Time": 8.505694679915905} +{"Pretrain/Learning Rate": 4.530595998281822e-05, "Pretrain/Loss": 2.0798821449279785, "Pretrain/Loss (Raw)": 1.9262497425079346, "Pretrain/Step": 2120, "Pretrain/Step Time": 8.505787495523691} +{"Pretrain/Learning Rate": 4.530100645148858e-05, "Pretrain/Loss": 2.0785717964172363, "Pretrain/Loss (Raw)": 1.8526766300201416, "Pretrain/Step": 2121, "Pretrain/Step Time": 8.50608105957508} +{"Pretrain/Learning Rate": 4.529605057895121e-05, "Pretrain/Loss": 2.077664375305176, "Pretrain/Loss (Raw)": 1.8622236251831055, "Pretrain/Step": 2122, "Pretrain/Step Time": 8.504177941009402} +{"Pretrain/Learning Rate": 4.529109236577764e-05, "Pretrain/Loss": 2.080099582672119, "Pretrain/Loss (Raw)": 2.3163866996765137, "Pretrain/Step": 2123, "Pretrain/Step Time": 8.506086464971304} +{"Pretrain/Learning Rate": 4.5286131812539704e-05, "Pretrain/Loss": 2.0827701091766357, "Pretrain/Loss (Raw)": 2.0373196601867676, "Pretrain/Step": 2124, "Pretrain/Step Time": 8.508148489519954} +{"Pretrain/Learning Rate": 4.5281168919809444e-05, "Pretrain/Loss": 2.0814120769500732, "Pretrain/Loss (Raw)": 1.9498393535614014, "Pretrain/Step": 2125, "Pretrain/Step Time": 8.509342089295387} +{"Pretrain/Learning Rate": 4.527620368815921e-05, "Pretrain/Loss": 2.08364200592041, "Pretrain/Loss (Raw)": 2.2582693099975586, "Pretrain/Step": 2126, "Pretrain/Step Time": 8.510631911456585} +{"Pretrain/Learning Rate": 4.527123611816163e-05, "Pretrain/Loss": 2.0847365856170654, "Pretrain/Loss (Raw)": 2.15311336517334, "Pretrain/Step": 2127, "Pretrain/Step Time": 8.505263766273856} +{"Pretrain/Learning Rate": 4.526626621038958e-05, "Pretrain/Loss": 2.085442066192627, "Pretrain/Loss (Raw)": 2.061359167098999, "Pretrain/Step": 2128, "Pretrain/Step Time": 8.497031800448895} +{"Pretrain/Learning Rate": 4.526129396541621e-05, "Pretrain/Loss": 2.0845718383789062, "Pretrain/Loss (Raw)": 1.9694408178329468, "Pretrain/Step": 2129, "Pretrain/Step Time": 8.49635843001306} +{"Pretrain/Learning Rate": 4.525631938381495e-05, "Pretrain/Loss": 2.0807065963745117, "Pretrain/Loss (Raw)": 1.687442421913147, "Pretrain/Step": 2130, "Pretrain/Step Time": 8.495801808312535} +{"Pretrain/Learning Rate": 4.5251342466159487e-05, "Pretrain/Loss": 2.0806002616882324, "Pretrain/Loss (Raw)": 2.3520097732543945, "Pretrain/Step": 2131, "Pretrain/Step Time": 8.494547799229622} +{"Pretrain/Learning Rate": 4.524636321302378e-05, "Pretrain/Loss": 2.080368757247925, "Pretrain/Loss (Raw)": 2.0742738246917725, "Pretrain/Step": 2132, "Pretrain/Step Time": 8.494584826752543} +{"Pretrain/Learning Rate": 4.524138162498206e-05, "Pretrain/Loss": 2.079310894012451, "Pretrain/Loss (Raw)": 2.0357277393341064, "Pretrain/Step": 2133, "Pretrain/Step Time": 8.490883074700832} +{"Pretrain/Learning Rate": 4.5236397702608833e-05, "Pretrain/Loss": 2.077850341796875, "Pretrain/Loss (Raw)": 2.0172605514526367, "Pretrain/Step": 2134, "Pretrain/Step Time": 8.484450349584222} +{"Pretrain/Learning Rate": 4.5231411446478865e-05, "Pretrain/Loss": 2.0776565074920654, "Pretrain/Loss (Raw)": 2.0364041328430176, "Pretrain/Step": 2135, "Pretrain/Step Time": 8.488596988841891} +{"Pretrain/Learning Rate": 4.5226422857167207e-05, "Pretrain/Loss": 2.081624984741211, "Pretrain/Loss (Raw)": 2.361135244369507, "Pretrain/Step": 2136, "Pretrain/Step Time": 8.49186029843986} +{"Pretrain/Learning Rate": 4.5221431935249144e-05, "Pretrain/Loss": 2.0808072090148926, "Pretrain/Loss (Raw)": 1.9675105810165405, "Pretrain/Step": 2137, "Pretrain/Step Time": 8.503173857927322} +{"Pretrain/Learning Rate": 4.5216438681300265e-05, "Pretrain/Loss": 2.077652931213379, "Pretrain/Loss (Raw)": 1.8597530126571655, "Pretrain/Step": 2138, "Pretrain/Step Time": 8.502140749245882} +{"Pretrain/Learning Rate": 4.521144309589641e-05, "Pretrain/Loss": 2.0782089233398438, "Pretrain/Loss (Raw)": 2.1118078231811523, "Pretrain/Step": 2139, "Pretrain/Step Time": 8.495130153372884} +{"Pretrain/Learning Rate": 4.520644517961371e-05, "Pretrain/Loss": 2.0780603885650635, "Pretrain/Loss (Raw)": 2.068909168243408, "Pretrain/Step": 2140, "Pretrain/Step Time": 8.496110402047634} +{"Pretrain/Learning Rate": 4.520144493302853e-05, "Pretrain/Loss": 2.0788259506225586, "Pretrain/Loss (Raw)": 1.97490656375885, "Pretrain/Step": 2141, "Pretrain/Step Time": 8.505149643868208} +{"Pretrain/Learning Rate": 4.519644235671752e-05, "Pretrain/Loss": 2.079334259033203, "Pretrain/Loss (Raw)": 2.2016656398773193, "Pretrain/Step": 2142, "Pretrain/Step Time": 8.502549277618527} +{"Pretrain/Learning Rate": 4.519143745125762e-05, "Pretrain/Loss": 2.0798747539520264, "Pretrain/Loss (Raw)": 2.2264115810394287, "Pretrain/Step": 2143, "Pretrain/Step Time": 8.50045508891344} +{"Pretrain/Learning Rate": 4.5186430217226004e-05, "Pretrain/Loss": 2.0819263458251953, "Pretrain/Loss (Raw)": 2.191185235977173, "Pretrain/Step": 2144, "Pretrain/Step Time": 8.498423034325242} +{"Pretrain/Learning Rate": 4.518142065520013e-05, "Pretrain/Loss": 2.082711696624756, "Pretrain/Loss (Raw)": 2.0757737159729004, "Pretrain/Step": 2145, "Pretrain/Step Time": 8.48877976089716} +{"Pretrain/Learning Rate": 4.5176408765757736e-05, "Pretrain/Loss": 2.081743001937866, "Pretrain/Loss (Raw)": 2.0551412105560303, "Pretrain/Step": 2146, "Pretrain/Step Time": 8.494861824437976} +{"Pretrain/Learning Rate": 4.5171394549476794e-05, "Pretrain/Loss": 2.082040548324585, "Pretrain/Loss (Raw)": 2.100766181945801, "Pretrain/Step": 2147, "Pretrain/Step Time": 8.502248257398605} +{"Pretrain/Learning Rate": 4.5166378006935595e-05, "Pretrain/Loss": 2.0816445350646973, "Pretrain/Loss (Raw)": 1.9953203201293945, "Pretrain/Step": 2148, "Pretrain/Step Time": 8.506270546466112} +{"Pretrain/Learning Rate": 4.5161359138712655e-05, "Pretrain/Loss": 2.083186149597168, "Pretrain/Loss (Raw)": 2.2218101024627686, "Pretrain/Step": 2149, "Pretrain/Step Time": 8.506601113826036} +{"Pretrain/Learning Rate": 4.5156337945386775e-05, "Pretrain/Loss": 2.083043336868286, "Pretrain/Loss (Raw)": 2.0339152812957764, "Pretrain/Step": 2150, "Pretrain/Step Time": 8.505429359152913} +{"Pretrain/Learning Rate": 4.515131442753703e-05, "Pretrain/Loss": 2.085129737854004, "Pretrain/Loss (Raw)": 2.5799508094787598, "Pretrain/Step": 2151, "Pretrain/Step Time": 8.492154616862535} +{"Pretrain/Learning Rate": 4.5146288585742737e-05, "Pretrain/Loss": 2.0850257873535156, "Pretrain/Loss (Raw)": 2.115201711654663, "Pretrain/Step": 2152, "Pretrain/Step Time": 8.496984392404556} +{"Pretrain/Learning Rate": 4.514126042058352e-05, "Pretrain/Loss": 2.0843467712402344, "Pretrain/Loss (Raw)": 2.0442328453063965, "Pretrain/Step": 2153, "Pretrain/Step Time": 8.49422357417643} +{"Pretrain/Learning Rate": 4.513622993263924e-05, "Pretrain/Loss": 2.081606149673462, "Pretrain/Loss (Raw)": 2.0097832679748535, "Pretrain/Step": 2154, "Pretrain/Step Time": 8.508427361026406} +{"Pretrain/Learning Rate": 4.5131197122490035e-05, "Pretrain/Loss": 2.0817930698394775, "Pretrain/Loss (Raw)": 2.401108980178833, "Pretrain/Step": 2155, "Pretrain/Step Time": 8.515840236097574} +{"Pretrain/Learning Rate": 4.512616199071632e-05, "Pretrain/Loss": 2.084646224975586, "Pretrain/Loss (Raw)": 2.1997857093811035, "Pretrain/Step": 2156, "Pretrain/Step Time": 8.51385829038918} +{"Pretrain/Learning Rate": 4.512112453789877e-05, "Pretrain/Loss": 2.0855679512023926, "Pretrain/Loss (Raw)": 2.278428316116333, "Pretrain/Step": 2157, "Pretrain/Step Time": 8.510142559185624} +{"Pretrain/Learning Rate": 4.5116084764618325e-05, "Pretrain/Loss": 2.0870513916015625, "Pretrain/Loss (Raw)": 2.2621142864227295, "Pretrain/Step": 2158, "Pretrain/Step Time": 8.510205529630184} +{"Pretrain/Learning Rate": 4.511104267145618e-05, "Pretrain/Loss": 2.087209701538086, "Pretrain/Loss (Raw)": 2.09181547164917, "Pretrain/Step": 2159, "Pretrain/Step Time": 8.521128157153726} +{"Pretrain/Learning Rate": 4.510599825899384e-05, "Pretrain/Loss": 2.0879361629486084, "Pretrain/Loss (Raw)": 2.0907013416290283, "Pretrain/Step": 2160, "Pretrain/Step Time": 8.519510589540005} +{"Pretrain/Learning Rate": 4.510095152781304e-05, "Pretrain/Loss": 2.0893008708953857, "Pretrain/Loss (Raw)": 2.1741256713867188, "Pretrain/Step": 2161, "Pretrain/Step Time": 8.518941700458527} +{"Pretrain/Learning Rate": 4.509590247849579e-05, "Pretrain/Loss": 2.08919620513916, "Pretrain/Loss (Raw)": 2.121256113052368, "Pretrain/Step": 2162, "Pretrain/Step Time": 8.512693567201495} +{"Pretrain/Learning Rate": 4.509085111162437e-05, "Pretrain/Loss": 2.0895488262176514, "Pretrain/Loss (Raw)": 2.1246554851531982, "Pretrain/Step": 2163, "Pretrain/Step Time": 8.512213626876473} +{"Pretrain/Learning Rate": 4.508579742778133e-05, "Pretrain/Loss": 2.090411901473999, "Pretrain/Loss (Raw)": 2.060134172439575, "Pretrain/Step": 2164, "Pretrain/Step Time": 8.512023517861962} +{"Pretrain/Learning Rate": 4.508074142754948e-05, "Pretrain/Loss": 2.089355945587158, "Pretrain/Loss (Raw)": 1.8777494430541992, "Pretrain/Step": 2165, "Pretrain/Step Time": 8.520491011440754} +{"Pretrain/Learning Rate": 4.507568311151191e-05, "Pretrain/Loss": 2.0915470123291016, "Pretrain/Loss (Raw)": 2.289216995239258, "Pretrain/Step": 2166, "Pretrain/Step Time": 8.52916175685823} +{"Pretrain/Learning Rate": 4.5070622480251955e-05, "Pretrain/Loss": 2.0936548709869385, "Pretrain/Loss (Raw)": 2.119849443435669, "Pretrain/Step": 2167, "Pretrain/Step Time": 8.533115949481726} +{"Pretrain/Learning Rate": 4.506555953435324e-05, "Pretrain/Loss": 2.0931620597839355, "Pretrain/Loss (Raw)": 2.1752121448516846, "Pretrain/Step": 2168, "Pretrain/Step Time": 8.527666782960296} +{"Pretrain/Learning Rate": 4.5060494274399654e-05, "Pretrain/Loss": 2.091874361038208, "Pretrain/Loss (Raw)": 2.1525073051452637, "Pretrain/Step": 2169, "Pretrain/Step Time": 8.523026404902339} +{"Pretrain/Learning Rate": 4.505542670097534e-05, "Pretrain/Loss": 2.0909430980682373, "Pretrain/Loss (Raw)": 2.0327653884887695, "Pretrain/Step": 2170, "Pretrain/Step Time": 8.515903435647488} +{"Pretrain/Learning Rate": 4.505035681466472e-05, "Pretrain/Loss": 2.0897274017333984, "Pretrain/Loss (Raw)": 1.9957274198532104, "Pretrain/Step": 2171, "Pretrain/Step Time": 8.518077526241541} +{"Pretrain/Learning Rate": 4.504528461605247e-05, "Pretrain/Loss": 2.092649459838867, "Pretrain/Loss (Raw)": 2.223679304122925, "Pretrain/Step": 2172, "Pretrain/Step Time": 8.52363215945661} +{"Pretrain/Learning Rate": 4.5040210105723525e-05, "Pretrain/Loss": 2.0915236473083496, "Pretrain/Loss (Raw)": 1.8831740617752075, "Pretrain/Step": 2173, "Pretrain/Step Time": 8.521970765665174} +{"Pretrain/Learning Rate": 4.5035133284263134e-05, "Pretrain/Loss": 2.0886101722717285, "Pretrain/Loss (Raw)": 1.7454049587249756, "Pretrain/Step": 2174, "Pretrain/Step Time": 8.516291089355946} +{"Pretrain/Learning Rate": 4.5030054152256756e-05, "Pretrain/Loss": 2.085653781890869, "Pretrain/Loss (Raw)": 2.031801700592041, "Pretrain/Step": 2175, "Pretrain/Step Time": 8.516745178028941} +{"Pretrain/Learning Rate": 4.502497271029015e-05, "Pretrain/Loss": 2.086503028869629, "Pretrain/Loss (Raw)": 2.0810205936431885, "Pretrain/Step": 2176, "Pretrain/Step Time": 8.517893511801958} +{"Pretrain/Learning Rate": 4.501988895894933e-05, "Pretrain/Loss": 2.0866923332214355, "Pretrain/Loss (Raw)": 2.2201297283172607, "Pretrain/Step": 2177, "Pretrain/Step Time": 8.526097325608134} +{"Pretrain/Learning Rate": 4.501480289882058e-05, "Pretrain/Loss": 2.087059497833252, "Pretrain/Loss (Raw)": 2.0374033451080322, "Pretrain/Step": 2178, "Pretrain/Step Time": 8.526794906705618} +{"Pretrain/Learning Rate": 4.5009714530490455e-05, "Pretrain/Loss": 2.086186170578003, "Pretrain/Loss (Raw)": 2.087859869003296, "Pretrain/Step": 2179, "Pretrain/Step Time": 8.525479763746262} +{"Pretrain/Learning Rate": 4.5004623854545746e-05, "Pretrain/Loss": 2.0843513011932373, "Pretrain/Loss (Raw)": 2.033498764038086, "Pretrain/Step": 2180, "Pretrain/Step Time": 8.517174616456032} +{"Pretrain/Learning Rate": 4.4999530871573556e-05, "Pretrain/Loss": 2.08465576171875, "Pretrain/Loss (Raw)": 2.119279384613037, "Pretrain/Step": 2181, "Pretrain/Step Time": 8.512309638783336} +{"Pretrain/Learning Rate": 4.499443558216123e-05, "Pretrain/Loss": 2.0839898586273193, "Pretrain/Loss (Raw)": 2.097748279571533, "Pretrain/Step": 2182, "Pretrain/Step Time": 8.515857124701142} +{"Pretrain/Learning Rate": 4.498933798689638e-05, "Pretrain/Loss": 2.083714008331299, "Pretrain/Loss (Raw)": 2.2684974670410156, "Pretrain/Step": 2183, "Pretrain/Step Time": 8.5203344989568} +{"Pretrain/Learning Rate": 4.498423808636687e-05, "Pretrain/Loss": 2.0817532539367676, "Pretrain/Loss (Raw)": 1.9466685056686401, "Pretrain/Step": 2184, "Pretrain/Step Time": 8.524478221312165} +{"Pretrain/Learning Rate": 4.497913588116085e-05, "Pretrain/Loss": 2.0809407234191895, "Pretrain/Loss (Raw)": 1.9559978246688843, "Pretrain/Step": 2185, "Pretrain/Step Time": 8.520473834127188} +{"Pretrain/Learning Rate": 4.497403137186674e-05, "Pretrain/Loss": 2.0811095237731934, "Pretrain/Loss (Raw)": 1.8791762590408325, "Pretrain/Step": 2186, "Pretrain/Step Time": 8.51732692308724} +{"Pretrain/Learning Rate": 4.496892455907322e-05, "Pretrain/Loss": 2.0805742740631104, "Pretrain/Loss (Raw)": 2.0497469902038574, "Pretrain/Step": 2187, "Pretrain/Step Time": 8.516281425952911} +{"Pretrain/Learning Rate": 4.496381544336922e-05, "Pretrain/Loss": 2.0820322036743164, "Pretrain/Loss (Raw)": 2.1411242485046387, "Pretrain/Step": 2188, "Pretrain/Step Time": 8.51631141640246} +{"Pretrain/Learning Rate": 4.495870402534394e-05, "Pretrain/Loss": 2.078709125518799, "Pretrain/Loss (Raw)": 1.9825680255889893, "Pretrain/Step": 2189, "Pretrain/Step Time": 8.518106523901224} +{"Pretrain/Learning Rate": 4.495359030558688e-05, "Pretrain/Loss": 2.0794448852539062, "Pretrain/Loss (Raw)": 2.0944390296936035, "Pretrain/Step": 2190, "Pretrain/Step Time": 8.516371866688132} +{"Pretrain/Learning Rate": 4.494847428468775e-05, "Pretrain/Loss": 2.0820250511169434, "Pretrain/Loss (Raw)": 2.1407759189605713, "Pretrain/Step": 2191, "Pretrain/Step Time": 8.519616642966866} +{"Pretrain/Learning Rate": 4.494335596323657e-05, "Pretrain/Loss": 2.0815467834472656, "Pretrain/Loss (Raw)": 1.9194022417068481, "Pretrain/Step": 2192, "Pretrain/Step Time": 8.501164665445685} +{"Pretrain/Learning Rate": 4.49382353418236e-05, "Pretrain/Loss": 2.083986282348633, "Pretrain/Loss (Raw)": 2.429267644882202, "Pretrain/Step": 2193, "Pretrain/Step Time": 8.499501759186387} +{"Pretrain/Learning Rate": 4.493311242103938e-05, "Pretrain/Loss": 2.08697247505188, "Pretrain/Loss (Raw)": 2.1016201972961426, "Pretrain/Step": 2194, "Pretrain/Step Time": 8.51160086132586} +{"Pretrain/Learning Rate": 4.4927987201474707e-05, "Pretrain/Loss": 2.088930606842041, "Pretrain/Loss (Raw)": 2.1251602172851562, "Pretrain/Step": 2195, "Pretrain/Step Time": 8.512788793072104} +{"Pretrain/Learning Rate": 4.492285968372065e-05, "Pretrain/Loss": 2.0909438133239746, "Pretrain/Loss (Raw)": 2.324068069458008, "Pretrain/Step": 2196, "Pretrain/Step Time": 8.515225909650326} +{"Pretrain/Learning Rate": 4.491772986836853e-05, "Pretrain/Loss": 2.0894060134887695, "Pretrain/Loss (Raw)": 1.901880145072937, "Pretrain/Step": 2197, "Pretrain/Step Time": 8.513082830235362} +{"Pretrain/Learning Rate": 4.4912597756009946e-05, "Pretrain/Loss": 2.0891149044036865, "Pretrain/Loss (Raw)": 2.0812485218048096, "Pretrain/Step": 2198, "Pretrain/Step Time": 8.506985060870647} +{"Pretrain/Learning Rate": 4.490746334723677e-05, "Pretrain/Loss": 2.090851306915283, "Pretrain/Loss (Raw)": 2.061159372329712, "Pretrain/Step": 2199, "Pretrain/Step Time": 8.507420849055052} +{"Pretrain/Learning Rate": 4.4902326642641095e-05, "Pretrain/Loss": 2.0916056632995605, "Pretrain/Loss (Raw)": 2.320111036300659, "Pretrain/Step": 2200, "Pretrain/Step Time": 8.508624540641904} +{"Pretrain/Learning Rate": 4.489718764281534e-05, "Pretrain/Loss": 2.090146064758301, "Pretrain/Loss (Raw)": 1.9690769910812378, "Pretrain/Step": 2201, "Pretrain/Step Time": 8.513803839683533} +{"Pretrain/Learning Rate": 4.489204634835215e-05, "Pretrain/Loss": 2.0908641815185547, "Pretrain/Loss (Raw)": 2.125091552734375, "Pretrain/Step": 2202, "Pretrain/Step Time": 8.51610946469009} +{"Pretrain/Learning Rate": 4.488690275984443e-05, "Pretrain/Loss": 2.0915956497192383, "Pretrain/Loss (Raw)": 2.217662811279297, "Pretrain/Step": 2203, "Pretrain/Step Time": 8.51241404376924} +{"Pretrain/Learning Rate": 4.488175687788538e-05, "Pretrain/Loss": 2.089094638824463, "Pretrain/Loss (Raw)": 1.9415688514709473, "Pretrain/Step": 2204, "Pretrain/Step Time": 8.507567428052425} +{"Pretrain/Learning Rate": 4.4876608703068434e-05, "Pretrain/Loss": 2.0920372009277344, "Pretrain/Loss (Raw)": 2.0743706226348877, "Pretrain/Step": 2205, "Pretrain/Step Time": 8.514386029914021} +{"Pretrain/Learning Rate": 4.487145823598732e-05, "Pretrain/Loss": 2.0900509357452393, "Pretrain/Loss (Raw)": 2.1537201404571533, "Pretrain/Step": 2206, "Pretrain/Step Time": 8.503259122371674} +{"Pretrain/Learning Rate": 4.4866305477236e-05, "Pretrain/Loss": 2.090480089187622, "Pretrain/Loss (Raw)": 2.117070198059082, "Pretrain/Step": 2207, "Pretrain/Step Time": 8.505507212132215} +{"Pretrain/Learning Rate": 4.486115042740872e-05, "Pretrain/Loss": 2.091838836669922, "Pretrain/Loss (Raw)": 2.1588335037231445, "Pretrain/Step": 2208, "Pretrain/Step Time": 8.500113002955914} +{"Pretrain/Learning Rate": 4.4855993087099984e-05, "Pretrain/Loss": 2.094571590423584, "Pretrain/Loss (Raw)": 2.0723414421081543, "Pretrain/Step": 2209, "Pretrain/Step Time": 8.503738945350051} +{"Pretrain/Learning Rate": 4.485083345690456e-05, "Pretrain/Loss": 2.097792625427246, "Pretrain/Loss (Raw)": 2.3414947986602783, "Pretrain/Step": 2210, "Pretrain/Step Time": 8.495002530515194} +{"Pretrain/Learning Rate": 4.4845671537417486e-05, "Pretrain/Loss": 2.0965709686279297, "Pretrain/Loss (Raw)": 1.9831032752990723, "Pretrain/Step": 2211, "Pretrain/Step Time": 8.49304067529738} +{"Pretrain/Learning Rate": 4.484050732923405e-05, "Pretrain/Loss": 2.0977706909179688, "Pretrain/Loss (Raw)": 2.0321483612060547, "Pretrain/Step": 2212, "Pretrain/Step Time": 8.495861545205116} +{"Pretrain/Learning Rate": 4.483534083294982e-05, "Pretrain/Loss": 2.09800386428833, "Pretrain/Loss (Raw)": 1.8384402990341187, "Pretrain/Step": 2213, "Pretrain/Step Time": 8.498965276405215} +{"Pretrain/Learning Rate": 4.483017204916061e-05, "Pretrain/Loss": 2.098479747772217, "Pretrain/Loss (Raw)": 2.038564920425415, "Pretrain/Step": 2214, "Pretrain/Step Time": 8.504449127241969} +{"Pretrain/Learning Rate": 4.482500097846253e-05, "Pretrain/Loss": 2.0993199348449707, "Pretrain/Loss (Raw)": 2.1786270141601562, "Pretrain/Step": 2215, "Pretrain/Step Time": 8.507550053298473} +{"Pretrain/Learning Rate": 4.4819827621451906e-05, "Pretrain/Loss": 2.0987744331359863, "Pretrain/Loss (Raw)": 2.09653639793396, "Pretrain/Step": 2216, "Pretrain/Step Time": 8.500995799899101} +{"Pretrain/Learning Rate": 4.481465197872538e-05, "Pretrain/Loss": 2.0978331565856934, "Pretrain/Loss (Raw)": 1.9438579082489014, "Pretrain/Step": 2217, "Pretrain/Step Time": 8.497812611982226} +{"Pretrain/Learning Rate": 4.4809474050879806e-05, "Pretrain/Loss": 2.1013026237487793, "Pretrain/Loss (Raw)": 2.4708807468414307, "Pretrain/Step": 2218, "Pretrain/Step Time": 8.497081091627479} +{"Pretrain/Learning Rate": 4.4804293838512346e-05, "Pretrain/Loss": 2.1020426750183105, "Pretrain/Loss (Raw)": 2.1001925468444824, "Pretrain/Step": 2219, "Pretrain/Step Time": 8.501267129555345} +{"Pretrain/Learning Rate": 4.47991113422204e-05, "Pretrain/Loss": 2.096750497817993, "Pretrain/Loss (Raw)": 1.8924717903137207, "Pretrain/Step": 2220, "Pretrain/Step Time": 8.507107073441148} +{"Pretrain/Learning Rate": 4.479392656260163e-05, "Pretrain/Loss": 2.097519874572754, "Pretrain/Loss (Raw)": 2.042506694793701, "Pretrain/Step": 2221, "Pretrain/Step Time": 8.502905843779445} +{"Pretrain/Learning Rate": 4.4788739500253986e-05, "Pretrain/Loss": 2.0926523208618164, "Pretrain/Loss (Raw)": 1.990880012512207, "Pretrain/Step": 2222, "Pretrain/Step Time": 8.500991912558675} +{"Pretrain/Learning Rate": 4.4783550155775647e-05, "Pretrain/Loss": 2.0916409492492676, "Pretrain/Loss (Raw)": 2.02518367767334, "Pretrain/Step": 2223, "Pretrain/Step Time": 8.506258191540837} +{"Pretrain/Learning Rate": 4.4778358529765085e-05, "Pretrain/Loss": 2.0930233001708984, "Pretrain/Loss (Raw)": 2.215651273727417, "Pretrain/Step": 2224, "Pretrain/Step Time": 8.50834614597261} +{"Pretrain/Learning Rate": 4.477316462282102e-05, "Pretrain/Loss": 2.0965328216552734, "Pretrain/Loss (Raw)": 2.6548807621002197, "Pretrain/Step": 2225, "Pretrain/Step Time": 8.509945403784513} +{"Pretrain/Learning Rate": 4.476796843554243e-05, "Pretrain/Loss": 2.0950064659118652, "Pretrain/Loss (Raw)": 2.0051157474517822, "Pretrain/Step": 2226, "Pretrain/Step Time": 8.510490875691175} +{"Pretrain/Learning Rate": 4.4762769968528575e-05, "Pretrain/Loss": 2.0950767993927, "Pretrain/Loss (Raw)": 2.203528642654419, "Pretrain/Step": 2227, "Pretrain/Step Time": 8.501947525888681} +{"Pretrain/Learning Rate": 4.475756922237896e-05, "Pretrain/Loss": 2.094675302505493, "Pretrain/Loss (Raw)": 2.100260019302368, "Pretrain/Step": 2228, "Pretrain/Step Time": 8.496008982881904} +{"Pretrain/Learning Rate": 4.4752366197693365e-05, "Pretrain/Loss": 2.0954275131225586, "Pretrain/Loss (Raw)": 2.131864547729492, "Pretrain/Step": 2229, "Pretrain/Step Time": 8.50001991353929} +{"Pretrain/Learning Rate": 4.474716089507182e-05, "Pretrain/Loss": 2.0963523387908936, "Pretrain/Loss (Raw)": 2.0947632789611816, "Pretrain/Step": 2230, "Pretrain/Step Time": 8.505781687796116} +{"Pretrain/Learning Rate": 4.474195331511464e-05, "Pretrain/Loss": 2.0976667404174805, "Pretrain/Loss (Raw)": 2.1958813667297363, "Pretrain/Step": 2231, "Pretrain/Step Time": 8.511200867593288} +{"Pretrain/Learning Rate": 4.473674345842236e-05, "Pretrain/Loss": 2.098837375640869, "Pretrain/Loss (Raw)": 2.1253933906555176, "Pretrain/Step": 2232, "Pretrain/Step Time": 8.514143539592624} +{"Pretrain/Learning Rate": 4.4731531325595835e-05, "Pretrain/Loss": 2.0989532470703125, "Pretrain/Loss (Raw)": 2.009241819381714, "Pretrain/Step": 2233, "Pretrain/Step Time": 8.509296355769038} +{"Pretrain/Learning Rate": 4.472631691723613e-05, "Pretrain/Loss": 2.098691940307617, "Pretrain/Loss (Raw)": 2.0783607959747314, "Pretrain/Step": 2234, "Pretrain/Step Time": 8.512576511129737} +{"Pretrain/Learning Rate": 4.4721100233944606e-05, "Pretrain/Loss": 2.0974583625793457, "Pretrain/Loss (Raw)": 1.910282015800476, "Pretrain/Step": 2235, "Pretrain/Step Time": 8.508438125252724} +{"Pretrain/Learning Rate": 4.471588127632288e-05, "Pretrain/Loss": 2.0989861488342285, "Pretrain/Loss (Raw)": 2.0636589527130127, "Pretrain/Step": 2236, "Pretrain/Step Time": 8.505886128172278} +{"Pretrain/Learning Rate": 4.471066004497282e-05, "Pretrain/Loss": 2.097839832305908, "Pretrain/Loss (Raw)": 1.9942575693130493, "Pretrain/Step": 2237, "Pretrain/Step Time": 8.506626514717937} +{"Pretrain/Learning Rate": 4.470543654049656e-05, "Pretrain/Loss": 2.095696449279785, "Pretrain/Loss (Raw)": 1.8754829168319702, "Pretrain/Step": 2238, "Pretrain/Step Time": 8.506708359345794} +{"Pretrain/Learning Rate": 4.47002107634965e-05, "Pretrain/Loss": 2.093562364578247, "Pretrain/Loss (Raw)": 1.8465067148208618, "Pretrain/Step": 2239, "Pretrain/Step Time": 8.499150449410081} +{"Pretrain/Learning Rate": 4.469498271457531e-05, "Pretrain/Loss": 2.091609477996826, "Pretrain/Loss (Raw)": 1.9274266958236694, "Pretrain/Step": 2240, "Pretrain/Step Time": 8.504331782460213} +{"Pretrain/Learning Rate": 4.468975239433591e-05, "Pretrain/Loss": 2.0910658836364746, "Pretrain/Loss (Raw)": 2.0795254707336426, "Pretrain/Step": 2241, "Pretrain/Step Time": 8.504770547151566} +{"Pretrain/Learning Rate": 4.468451980338148e-05, "Pretrain/Loss": 2.0916926860809326, "Pretrain/Loss (Raw)": 2.0969204902648926, "Pretrain/Step": 2242, "Pretrain/Step Time": 8.513325709849596} +{"Pretrain/Learning Rate": 4.467928494231547e-05, "Pretrain/Loss": 2.0917911529541016, "Pretrain/Loss (Raw)": 2.0421059131622314, "Pretrain/Step": 2243, "Pretrain/Step Time": 8.51474416255951} +{"Pretrain/Learning Rate": 4.4674047811741585e-05, "Pretrain/Loss": 2.091257095336914, "Pretrain/Loss (Raw)": 2.090543270111084, "Pretrain/Step": 2244, "Pretrain/Step Time": 8.51808725297451} +{"Pretrain/Learning Rate": 4.466880841226381e-05, "Pretrain/Loss": 2.092520236968994, "Pretrain/Loss (Raw)": 2.1342337131500244, "Pretrain/Step": 2245, "Pretrain/Step Time": 8.511024724692106} +{"Pretrain/Learning Rate": 4.466356674448635e-05, "Pretrain/Loss": 2.0908865928649902, "Pretrain/Loss (Raw)": 2.0404515266418457, "Pretrain/Step": 2246, "Pretrain/Step Time": 8.509616043418646} +{"Pretrain/Learning Rate": 4.4658322809013723e-05, "Pretrain/Loss": 2.088869094848633, "Pretrain/Loss (Raw)": 2.138042688369751, "Pretrain/Step": 2247, "Pretrain/Step Time": 8.50415314733982} +{"Pretrain/Learning Rate": 4.465307660645068e-05, "Pretrain/Loss": 2.0891478061676025, "Pretrain/Loss (Raw)": 1.9619255065917969, "Pretrain/Step": 2248, "Pretrain/Step Time": 8.508615422993898} +{"Pretrain/Learning Rate": 4.464782813740223e-05, "Pretrain/Loss": 2.0913760662078857, "Pretrain/Loss (Raw)": 2.1379058361053467, "Pretrain/Step": 2249, "Pretrain/Step Time": 8.516753137111664} +{"Pretrain/Learning Rate": 4.464257740247366e-05, "Pretrain/Loss": 2.092559814453125, "Pretrain/Loss (Raw)": 2.013720750808716, "Pretrain/Step": 2250, "Pretrain/Step Time": 8.519010193645954} +{"Pretrain/Learning Rate": 4.4637324402270495e-05, "Pretrain/Loss": 2.089367389678955, "Pretrain/Loss (Raw)": 1.9077845811843872, "Pretrain/Step": 2251, "Pretrain/Step Time": 8.512913834303617} +{"Pretrain/Learning Rate": 4.463206913739856e-05, "Pretrain/Loss": 2.0893402099609375, "Pretrain/Loss (Raw)": 2.0338289737701416, "Pretrain/Step": 2252, "Pretrain/Step Time": 8.51051645167172} +{"Pretrain/Learning Rate": 4.462681160846389e-05, "Pretrain/Loss": 2.0901882648468018, "Pretrain/Loss (Raw)": 2.0583808422088623, "Pretrain/Step": 2253, "Pretrain/Step Time": 8.509032255038619} +{"Pretrain/Learning Rate": 4.4621551816072835e-05, "Pretrain/Loss": 2.089573860168457, "Pretrain/Loss (Raw)": 2.1796178817749023, "Pretrain/Step": 2254, "Pretrain/Step Time": 8.519815331324935} +{"Pretrain/Learning Rate": 4.4616289760831954e-05, "Pretrain/Loss": 2.0897157192230225, "Pretrain/Loss (Raw)": 2.1712722778320312, "Pretrain/Step": 2255, "Pretrain/Step Time": 8.517315044999123} +{"Pretrain/Learning Rate": 4.46110254433481e-05, "Pretrain/Loss": 2.0896501541137695, "Pretrain/Loss (Raw)": 2.0529916286468506, "Pretrain/Step": 2256, "Pretrain/Step Time": 8.519476059824228} +{"Pretrain/Learning Rate": 4.4605758864228384e-05, "Pretrain/Loss": 2.091305732727051, "Pretrain/Loss (Raw)": 2.1813509464263916, "Pretrain/Step": 2257, "Pretrain/Step Time": 8.515347914770246} +{"Pretrain/Learning Rate": 4.460049002408018e-05, "Pretrain/Loss": 2.0909953117370605, "Pretrain/Loss (Raw)": 1.647681713104248, "Pretrain/Step": 2258, "Pretrain/Step Time": 8.513905514031649} +{"Pretrain/Learning Rate": 4.45952189235111e-05, "Pretrain/Loss": 2.0898470878601074, "Pretrain/Loss (Raw)": 2.2050273418426514, "Pretrain/Step": 2259, "Pretrain/Step Time": 8.524729365482926} +{"Pretrain/Learning Rate": 4.458994556312903e-05, "Pretrain/Loss": 2.0898823738098145, "Pretrain/Loss (Raw)": 2.078800916671753, "Pretrain/Step": 2260, "Pretrain/Step Time": 8.52732558734715} +{"Pretrain/Learning Rate": 4.458466994354214e-05, "Pretrain/Loss": 2.0911788940429688, "Pretrain/Loss (Raw)": 2.20169997215271, "Pretrain/Step": 2261, "Pretrain/Step Time": 8.5298196002841} +{"Pretrain/Learning Rate": 4.457939206535882e-05, "Pretrain/Loss": 2.090640068054199, "Pretrain/Loss (Raw)": 1.9483009576797485, "Pretrain/Step": 2262, "Pretrain/Step Time": 8.527478985488415} +{"Pretrain/Learning Rate": 4.4574111929187744e-05, "Pretrain/Loss": 2.092020034790039, "Pretrain/Loss (Raw)": 2.2130115032196045, "Pretrain/Step": 2263, "Pretrain/Step Time": 8.526562655344605} +{"Pretrain/Learning Rate": 4.4568829535637844e-05, "Pretrain/Loss": 2.088946580886841, "Pretrain/Loss (Raw)": 1.9677549600601196, "Pretrain/Step": 2264, "Pretrain/Step Time": 8.518336473032832} +{"Pretrain/Learning Rate": 4.456354488531832e-05, "Pretrain/Loss": 2.0893537998199463, "Pretrain/Loss (Raw)": 2.01962947845459, "Pretrain/Step": 2265, "Pretrain/Step Time": 8.511709181591868} +{"Pretrain/Learning Rate": 4.4558257978838605e-05, "Pretrain/Loss": 2.092275619506836, "Pretrain/Loss (Raw)": 2.2337164878845215, "Pretrain/Step": 2266, "Pretrain/Step Time": 8.511822624132037} +{"Pretrain/Learning Rate": 4.455296881680842e-05, "Pretrain/Loss": 2.0909996032714844, "Pretrain/Loss (Raw)": 1.9484913349151611, "Pretrain/Step": 2267, "Pretrain/Step Time": 8.514559783041477} +{"Pretrain/Learning Rate": 4.4547677399837726e-05, "Pretrain/Loss": 2.091017723083496, "Pretrain/Loss (Raw)": 2.071204423904419, "Pretrain/Step": 2268, "Pretrain/Step Time": 8.516312105581164} +{"Pretrain/Learning Rate": 4.4542383728536774e-05, "Pretrain/Loss": 2.0915465354919434, "Pretrain/Loss (Raw)": 2.0426366329193115, "Pretrain/Step": 2269, "Pretrain/Step Time": 8.510553658008575} +{"Pretrain/Learning Rate": 4.453708780351604e-05, "Pretrain/Loss": 2.090698480606079, "Pretrain/Loss (Raw)": 2.093096971511841, "Pretrain/Step": 2270, "Pretrain/Step Time": 8.510553861036897} +{"Pretrain/Learning Rate": 4.4531789625386274e-05, "Pretrain/Loss": 2.091437339782715, "Pretrain/Loss (Raw)": 2.320988178253174, "Pretrain/Step": 2271, "Pretrain/Step Time": 8.516646277159452} +{"Pretrain/Learning Rate": 4.45264891947585e-05, "Pretrain/Loss": 2.091221809387207, "Pretrain/Loss (Raw)": 2.1636102199554443, "Pretrain/Step": 2272, "Pretrain/Step Time": 8.517898421734571} +{"Pretrain/Learning Rate": 4.452118651224398e-05, "Pretrain/Loss": 2.0916008949279785, "Pretrain/Loss (Raw)": 2.1242966651916504, "Pretrain/Step": 2273, "Pretrain/Step Time": 8.520757237449288} +{"Pretrain/Learning Rate": 4.451588157845424e-05, "Pretrain/Loss": 2.093484878540039, "Pretrain/Loss (Raw)": 2.2962818145751953, "Pretrain/Step": 2274, "Pretrain/Step Time": 8.517329182475805} +{"Pretrain/Learning Rate": 4.451057439400108e-05, "Pretrain/Loss": 2.0941524505615234, "Pretrain/Loss (Raw)": 2.1862070560455322, "Pretrain/Step": 2275, "Pretrain/Step Time": 8.508423095569015} +{"Pretrain/Learning Rate": 4.450526495949653e-05, "Pretrain/Loss": 2.0947933197021484, "Pretrain/Loss (Raw)": 2.077353000640869, "Pretrain/Step": 2276, "Pretrain/Step Time": 8.511183489114046} +{"Pretrain/Learning Rate": 4.449995327555293e-05, "Pretrain/Loss": 2.0951507091522217, "Pretrain/Loss (Raw)": 2.267561674118042, "Pretrain/Step": 2277, "Pretrain/Step Time": 8.515473978593946} +{"Pretrain/Learning Rate": 4.449463934278282e-05, "Pretrain/Loss": 2.0961506366729736, "Pretrain/Loss (Raw)": 2.16190767288208, "Pretrain/Step": 2278, "Pretrain/Step Time": 8.519600991159678} +{"Pretrain/Learning Rate": 4.4489323161799045e-05, "Pretrain/Loss": 2.0905933380126953, "Pretrain/Loss (Raw)": 1.8686164617538452, "Pretrain/Step": 2279, "Pretrain/Step Time": 8.524273127317429} +{"Pretrain/Learning Rate": 4.4484004733214685e-05, "Pretrain/Loss": 2.0887551307678223, "Pretrain/Loss (Raw)": 1.8799262046813965, "Pretrain/Step": 2280, "Pretrain/Step Time": 8.520619360730052} +{"Pretrain/Learning Rate": 4.447868405764309e-05, "Pretrain/Loss": 2.0880298614501953, "Pretrain/Loss (Raw)": 1.951365351676941, "Pretrain/Step": 2281, "Pretrain/Step Time": 8.521400719881058} +{"Pretrain/Learning Rate": 4.4473361135697856e-05, "Pretrain/Loss": 2.088329315185547, "Pretrain/Loss (Raw)": 2.048097610473633, "Pretrain/Step": 2282, "Pretrain/Step Time": 8.511748753488064} +{"Pretrain/Learning Rate": 4.446803596799286e-05, "Pretrain/Loss": 2.086674690246582, "Pretrain/Loss (Raw)": 2.189326286315918, "Pretrain/Step": 2283, "Pretrain/Step Time": 8.511015923693776} +{"Pretrain/Learning Rate": 4.446270855514222e-05, "Pretrain/Loss": 2.085845947265625, "Pretrain/Loss (Raw)": 2.0937130451202393, "Pretrain/Step": 2284, "Pretrain/Step Time": 8.511389853432775} +{"Pretrain/Learning Rate": 4.445737889776031e-05, "Pretrain/Loss": 2.08489990234375, "Pretrain/Loss (Raw)": 2.1573452949523926, "Pretrain/Step": 2285, "Pretrain/Step Time": 8.513923207297921} +{"Pretrain/Learning Rate": 4.44520469964618e-05, "Pretrain/Loss": 2.0830092430114746, "Pretrain/Loss (Raw)": 2.020129442214966, "Pretrain/Step": 2286, "Pretrain/Step Time": 8.509994603693485} +{"Pretrain/Learning Rate": 4.444671285186155e-05, "Pretrain/Loss": 2.0846078395843506, "Pretrain/Loss (Raw)": 2.2964367866516113, "Pretrain/Step": 2287, "Pretrain/Step Time": 8.500722976401448} +{"Pretrain/Learning Rate": 4.444137646457474e-05, "Pretrain/Loss": 2.086305618286133, "Pretrain/Loss (Raw)": 2.3079824447631836, "Pretrain/Step": 2288, "Pretrain/Step Time": 8.50431102141738} +{"Pretrain/Learning Rate": 4.4436037835216784e-05, "Pretrain/Loss": 2.0858893394470215, "Pretrain/Loss (Raw)": 2.1208596229553223, "Pretrain/Step": 2289, "Pretrain/Step Time": 8.512451754882932} +{"Pretrain/Learning Rate": 4.4430696964403366e-05, "Pretrain/Loss": 2.0859787464141846, "Pretrain/Loss (Raw)": 2.1326959133148193, "Pretrain/Step": 2290, "Pretrain/Step Time": 8.513454334810376} +{"Pretrain/Learning Rate": 4.4425353852750414e-05, "Pretrain/Loss": 2.0862107276916504, "Pretrain/Loss (Raw)": 2.1543571949005127, "Pretrain/Step": 2291, "Pretrain/Step Time": 8.514033922925591} +{"Pretrain/Learning Rate": 4.4420008500874116e-05, "Pretrain/Loss": 2.085824966430664, "Pretrain/Loss (Raw)": 2.010762929916382, "Pretrain/Step": 2292, "Pretrain/Step Time": 8.51413588784635} +{"Pretrain/Learning Rate": 4.441466090939093e-05, "Pretrain/Loss": 2.0880331993103027, "Pretrain/Loss (Raw)": 2.1603875160217285, "Pretrain/Step": 2293, "Pretrain/Step Time": 8.505503825843334} +{"Pretrain/Learning Rate": 4.440931107891756e-05, "Pretrain/Loss": 2.086524248123169, "Pretrain/Loss (Raw)": 2.0960850715637207, "Pretrain/Step": 2294, "Pretrain/Step Time": 8.503296880051494} +{"Pretrain/Learning Rate": 4.440395901007098e-05, "Pretrain/Loss": 2.088805675506592, "Pretrain/Loss (Raw)": 2.411879062652588, "Pretrain/Step": 2295, "Pretrain/Step Time": 8.496543325483799} +{"Pretrain/Learning Rate": 4.4398604703468415e-05, "Pretrain/Loss": 2.0873990058898926, "Pretrain/Loss (Raw)": 1.995147943496704, "Pretrain/Step": 2296, "Pretrain/Step Time": 8.503649089485407} +{"Pretrain/Learning Rate": 4.439324815972734e-05, "Pretrain/Loss": 2.0881028175354004, "Pretrain/Loss (Raw)": 2.2425737380981445, "Pretrain/Step": 2297, "Pretrain/Step Time": 8.509851139038801} +{"Pretrain/Learning Rate": 4.438788937946551e-05, "Pretrain/Loss": 2.0887551307678223, "Pretrain/Loss (Raw)": 2.1162710189819336, "Pretrain/Step": 2298, "Pretrain/Step Time": 8.513188779354095} +{"Pretrain/Learning Rate": 4.4382528363300916e-05, "Pretrain/Loss": 2.088623523712158, "Pretrain/Loss (Raw)": 1.9789087772369385, "Pretrain/Step": 2299, "Pretrain/Step Time": 8.511246606707573} +{"Pretrain/Learning Rate": 4.437716511185181e-05, "Pretrain/Loss": 2.086101531982422, "Pretrain/Loss (Raw)": 1.9008524417877197, "Pretrain/Step": 2300, "Pretrain/Step Time": 8.510404821485281} +{"Pretrain/Learning Rate": 4.437179962573672e-05, "Pretrain/Loss": 2.088064193725586, "Pretrain/Loss (Raw)": 2.1343905925750732, "Pretrain/Step": 2301, "Pretrain/Step Time": 8.504135236144066} +{"Pretrain/Learning Rate": 4.436643190557441e-05, "Pretrain/Loss": 2.091322422027588, "Pretrain/Loss (Raw)": 2.162476062774658, "Pretrain/Step": 2302, "Pretrain/Step Time": 8.504177551716566} +{"Pretrain/Learning Rate": 4.4361061951983925e-05, "Pretrain/Loss": 2.092306137084961, "Pretrain/Loss (Raw)": 2.157712936401367, "Pretrain/Step": 2303, "Pretrain/Step Time": 8.507228963077068} +{"Pretrain/Learning Rate": 4.435568976558454e-05, "Pretrain/Loss": 2.0912885665893555, "Pretrain/Loss (Raw)": 1.9507807493209839, "Pretrain/Step": 2304, "Pretrain/Step Time": 8.505025753751397} +{"Pretrain/Learning Rate": 4.4350315346995804e-05, "Pretrain/Loss": 2.091339111328125, "Pretrain/Loss (Raw)": 2.226567506790161, "Pretrain/Step": 2305, "Pretrain/Step Time": 8.49642120115459} +{"Pretrain/Learning Rate": 4.434493869683752e-05, "Pretrain/Loss": 2.091808557510376, "Pretrain/Loss (Raw)": 2.0975072383880615, "Pretrain/Step": 2306, "Pretrain/Step Time": 8.495190262794495} +{"Pretrain/Learning Rate": 4.4339559815729746e-05, "Pretrain/Loss": 2.091071367263794, "Pretrain/Loss (Raw)": 1.9934910535812378, "Pretrain/Step": 2307, "Pretrain/Step Time": 8.510240433737636} +{"Pretrain/Learning Rate": 4.4334178704292805e-05, "Pretrain/Loss": 2.091026782989502, "Pretrain/Loss (Raw)": 2.0277950763702393, "Pretrain/Step": 2308, "Pretrain/Step Time": 8.50906465947628} +{"Pretrain/Learning Rate": 4.432879536314727e-05, "Pretrain/Loss": 2.090663433074951, "Pretrain/Loss (Raw)": 2.072763681411743, "Pretrain/Step": 2309, "Pretrain/Step Time": 8.511455474421382} +{"Pretrain/Learning Rate": 4.4323409792913974e-05, "Pretrain/Loss": 2.0898237228393555, "Pretrain/Loss (Raw)": 1.990274429321289, "Pretrain/Step": 2310, "Pretrain/Step Time": 8.507404167205095} +{"Pretrain/Learning Rate": 4.431802199421401e-05, "Pretrain/Loss": 2.0884389877319336, "Pretrain/Loss (Raw)": 2.091261625289917, "Pretrain/Step": 2311, "Pretrain/Step Time": 8.501913448795676} +{"Pretrain/Learning Rate": 4.431263196766872e-05, "Pretrain/Loss": 2.0895466804504395, "Pretrain/Loss (Raw)": 2.0884692668914795, "Pretrain/Step": 2312, "Pretrain/Step Time": 8.500823318958282} +{"Pretrain/Learning Rate": 4.43072397138997e-05, "Pretrain/Loss": 2.0895633697509766, "Pretrain/Loss (Raw)": 1.958119511604309, "Pretrain/Step": 2313, "Pretrain/Step Time": 8.510844822973013} +{"Pretrain/Learning Rate": 4.430184523352881e-05, "Pretrain/Loss": 2.091646194458008, "Pretrain/Loss (Raw)": 2.1457712650299072, "Pretrain/Step": 2314, "Pretrain/Step Time": 8.50903376750648} +{"Pretrain/Learning Rate": 4.429644852717819e-05, "Pretrain/Loss": 2.0902793407440186, "Pretrain/Loss (Raw)": 1.8747872114181519, "Pretrain/Step": 2315, "Pretrain/Step Time": 8.50874437764287} +{"Pretrain/Learning Rate": 4.4291049595470193e-05, "Pretrain/Loss": 2.0909547805786133, "Pretrain/Loss (Raw)": 2.227578639984131, "Pretrain/Step": 2316, "Pretrain/Step Time": 8.503887558355927} +{"Pretrain/Learning Rate": 4.428564843902746e-05, "Pretrain/Loss": 2.094200849533081, "Pretrain/Loss (Raw)": 2.398063898086548, "Pretrain/Step": 2317, "Pretrain/Step Time": 8.504050560295582} +{"Pretrain/Learning Rate": 4.4280245058472866e-05, "Pretrain/Loss": 2.09468936920166, "Pretrain/Loss (Raw)": 2.156982898712158, "Pretrain/Step": 2318, "Pretrain/Step Time": 8.51454227231443} +{"Pretrain/Learning Rate": 4.427483945442956e-05, "Pretrain/Loss": 2.0919599533081055, "Pretrain/Loss (Raw)": 1.7913893461227417, "Pretrain/Step": 2319, "Pretrain/Step Time": 8.513768108561635} +{"Pretrain/Learning Rate": 4.426943162752094e-05, "Pretrain/Loss": 2.093813419342041, "Pretrain/Loss (Raw)": 2.1566708087921143, "Pretrain/Step": 2320, "Pretrain/Step Time": 8.51421562768519} +{"Pretrain/Learning Rate": 4.426402157837067e-05, "Pretrain/Loss": 2.0897159576416016, "Pretrain/Loss (Raw)": 1.9047632217407227, "Pretrain/Step": 2321, "Pretrain/Step Time": 8.515852436423302} +{"Pretrain/Learning Rate": 4.425860930760265e-05, "Pretrain/Loss": 2.089843273162842, "Pretrain/Loss (Raw)": 2.117918014526367, "Pretrain/Step": 2322, "Pretrain/Step Time": 8.506397748365998} +{"Pretrain/Learning Rate": 4.4253194815841056e-05, "Pretrain/Loss": 2.089956521987915, "Pretrain/Loss (Raw)": 2.1396422386169434, "Pretrain/Step": 2323, "Pretrain/Step Time": 8.502273868769407} +{"Pretrain/Learning Rate": 4.424777810371032e-05, "Pretrain/Loss": 2.0872745513916016, "Pretrain/Loss (Raw)": 1.98080313205719, "Pretrain/Step": 2324, "Pretrain/Step Time": 8.509337604045868} +{"Pretrain/Learning Rate": 4.424235917183511e-05, "Pretrain/Loss": 2.0884368419647217, "Pretrain/Loss (Raw)": 2.0506420135498047, "Pretrain/Step": 2325, "Pretrain/Step Time": 8.516224035993218} +{"Pretrain/Learning Rate": 4.4236938020840365e-05, "Pretrain/Loss": 2.0885391235351562, "Pretrain/Loss (Raw)": 2.0943524837493896, "Pretrain/Step": 2326, "Pretrain/Step Time": 8.522042678669095} +{"Pretrain/Learning Rate": 4.423151465135128e-05, "Pretrain/Loss": 2.089033842086792, "Pretrain/Loss (Raw)": 2.124483823776245, "Pretrain/Step": 2327, "Pretrain/Step Time": 8.519928358495235} +{"Pretrain/Learning Rate": 4.422608906399331e-05, "Pretrain/Loss": 2.0863285064697266, "Pretrain/Loss (Raw)": 1.973838210105896, "Pretrain/Step": 2328, "Pretrain/Step Time": 8.513200506567955} +{"Pretrain/Learning Rate": 4.4220661259392146e-05, "Pretrain/Loss": 2.084587812423706, "Pretrain/Loss (Raw)": 1.7462469339370728, "Pretrain/Step": 2329, "Pretrain/Step Time": 8.512313034385443} +{"Pretrain/Learning Rate": 4.421523123817376e-05, "Pretrain/Loss": 2.0850257873535156, "Pretrain/Loss (Raw)": 2.1811726093292236, "Pretrain/Step": 2330, "Pretrain/Step Time": 8.510317031294107} +{"Pretrain/Learning Rate": 4.420979900096436e-05, "Pretrain/Loss": 2.0841846466064453, "Pretrain/Loss (Raw)": 2.1099910736083984, "Pretrain/Step": 2331, "Pretrain/Step Time": 8.517310654744506} +{"Pretrain/Learning Rate": 4.420436454839041e-05, "Pretrain/Loss": 2.0850601196289062, "Pretrain/Loss (Raw)": 2.0536458492279053, "Pretrain/Step": 2332, "Pretrain/Step Time": 8.518994368612766} +{"Pretrain/Learning Rate": 4.419892788107865e-05, "Pretrain/Loss": 2.0860719680786133, "Pretrain/Loss (Raw)": 2.2038466930389404, "Pretrain/Step": 2333, "Pretrain/Step Time": 8.509404890239239} +{"Pretrain/Learning Rate": 4.419348899965608e-05, "Pretrain/Loss": 2.0849316120147705, "Pretrain/Loss (Raw)": 2.0077710151672363, "Pretrain/Step": 2334, "Pretrain/Step Time": 8.510574731975794} +{"Pretrain/Learning Rate": 4.4188047904749894e-05, "Pretrain/Loss": 2.0837502479553223, "Pretrain/Loss (Raw)": 1.9658626317977905, "Pretrain/Step": 2335, "Pretrain/Step Time": 8.511983068659902} +{"Pretrain/Learning Rate": 4.418260459698761e-05, "Pretrain/Loss": 2.0843870639801025, "Pretrain/Loss (Raw)": 2.240349054336548, "Pretrain/Step": 2336, "Pretrain/Step Time": 8.518230782821774} +{"Pretrain/Learning Rate": 4.417715907699698e-05, "Pretrain/Loss": 2.0852537155151367, "Pretrain/Loss (Raw)": 2.183278799057007, "Pretrain/Step": 2337, "Pretrain/Step Time": 8.52289648912847} +{"Pretrain/Learning Rate": 4.417171134540599e-05, "Pretrain/Loss": 2.0825886726379395, "Pretrain/Loss (Raw)": 2.000366687774658, "Pretrain/Step": 2338, "Pretrain/Step Time": 8.526717159897089} +{"Pretrain/Learning Rate": 4.416626140284291e-05, "Pretrain/Loss": 2.082620143890381, "Pretrain/Loss (Raw)": 1.9871068000793457, "Pretrain/Step": 2339, "Pretrain/Step Time": 8.521794324740767} +{"Pretrain/Learning Rate": 4.416080924993625e-05, "Pretrain/Loss": 2.083847761154175, "Pretrain/Loss (Raw)": 2.1892895698547363, "Pretrain/Step": 2340, "Pretrain/Step Time": 8.511846328154206} +{"Pretrain/Learning Rate": 4.415535488731478e-05, "Pretrain/Loss": 2.085352659225464, "Pretrain/Loss (Raw)": 2.031066417694092, "Pretrain/Step": 2341, "Pretrain/Step Time": 8.509653428569436} +{"Pretrain/Learning Rate": 4.414989831560753e-05, "Pretrain/Loss": 2.0860214233398438, "Pretrain/Loss (Raw)": 2.1241884231567383, "Pretrain/Step": 2342, "Pretrain/Step Time": 8.513090323656797} +{"Pretrain/Learning Rate": 4.4144439535443763e-05, "Pretrain/Loss": 2.0856704711914062, "Pretrain/Loss (Raw)": 2.133697509765625, "Pretrain/Step": 2343, "Pretrain/Step Time": 8.51423322595656} +{"Pretrain/Learning Rate": 4.413897854745301e-05, "Pretrain/Loss": 2.08516263961792, "Pretrain/Loss (Raw)": 2.031531810760498, "Pretrain/Step": 2344, "Pretrain/Step Time": 8.521178372204304} +{"Pretrain/Learning Rate": 4.413351535226507e-05, "Pretrain/Loss": 2.085921287536621, "Pretrain/Loss (Raw)": 2.040971517562866, "Pretrain/Step": 2345, "Pretrain/Step Time": 8.518931416794658} +{"Pretrain/Learning Rate": 4.4128049950509984e-05, "Pretrain/Loss": 2.0816750526428223, "Pretrain/Loss (Raw)": 1.927377700805664, "Pretrain/Step": 2346, "Pretrain/Step Time": 8.51554836705327} +{"Pretrain/Learning Rate": 4.412258234281804e-05, "Pretrain/Loss": 2.0822010040283203, "Pretrain/Loss (Raw)": 2.1674983501434326, "Pretrain/Step": 2347, "Pretrain/Step Time": 8.508542113006115} +{"Pretrain/Learning Rate": 4.411711252981979e-05, "Pretrain/Loss": 2.0843863487243652, "Pretrain/Loss (Raw)": 2.172177314758301, "Pretrain/Step": 2348, "Pretrain/Step Time": 8.510464595630765} +{"Pretrain/Learning Rate": 4.411164051214603e-05, "Pretrain/Loss": 2.0860533714294434, "Pretrain/Loss (Raw)": 2.2559189796447754, "Pretrain/Step": 2349, "Pretrain/Step Time": 8.512870566919446} +{"Pretrain/Learning Rate": 4.4106166290427846e-05, "Pretrain/Loss": 2.0868778228759766, "Pretrain/Loss (Raw)": 2.096409797668457, "Pretrain/Step": 2350, "Pretrain/Step Time": 8.510928900912404} +{"Pretrain/Learning Rate": 4.410068986529653e-05, "Pretrain/Loss": 2.0878958702087402, "Pretrain/Loss (Raw)": 2.1554818153381348, "Pretrain/Step": 2351, "Pretrain/Step Time": 8.502412458881736} +{"Pretrain/Learning Rate": 4.409521123738365e-05, "Pretrain/Loss": 2.085573196411133, "Pretrain/Loss (Raw)": 1.918316125869751, "Pretrain/Step": 2352, "Pretrain/Step Time": 8.498370563611388} +{"Pretrain/Learning Rate": 4.4089730407321035e-05, "Pretrain/Loss": 2.081599712371826, "Pretrain/Loss (Raw)": 2.1462936401367188, "Pretrain/Step": 2353, "Pretrain/Step Time": 8.499528747051954} +{"Pretrain/Learning Rate": 4.408424737574075e-05, "Pretrain/Loss": 2.0796990394592285, "Pretrain/Loss (Raw)": 1.761817216873169, "Pretrain/Step": 2354, "Pretrain/Step Time": 8.501808226108551} +{"Pretrain/Learning Rate": 4.407876214327513e-05, "Pretrain/Loss": 2.077336311340332, "Pretrain/Loss (Raw)": 1.901124119758606, "Pretrain/Step": 2355, "Pretrain/Step Time": 8.510218221694231} +{"Pretrain/Learning Rate": 4.407327471055677e-05, "Pretrain/Loss": 2.0782148838043213, "Pretrain/Loss (Raw)": 2.212705373764038, "Pretrain/Step": 2356, "Pretrain/Step Time": 8.519117265939713} +{"Pretrain/Learning Rate": 4.406778507821848e-05, "Pretrain/Loss": 2.076833724975586, "Pretrain/Loss (Raw)": 1.955081820487976, "Pretrain/Step": 2357, "Pretrain/Step Time": 8.514190865680575} +{"Pretrain/Learning Rate": 4.4062293246893374e-05, "Pretrain/Loss": 2.078040838241577, "Pretrain/Loss (Raw)": 2.249286413192749, "Pretrain/Step": 2358, "Pretrain/Step Time": 8.504317505285144} +{"Pretrain/Learning Rate": 4.4056799217214774e-05, "Pretrain/Loss": 2.0759692192077637, "Pretrain/Loss (Raw)": 1.9307081699371338, "Pretrain/Step": 2359, "Pretrain/Step Time": 8.500932555645704} +{"Pretrain/Learning Rate": 4.4051302989816304e-05, "Pretrain/Loss": 2.0767650604248047, "Pretrain/Loss (Raw)": 2.227245330810547, "Pretrain/Step": 2360, "Pretrain/Step Time": 8.501461576670408} +{"Pretrain/Learning Rate": 4.404580456533179e-05, "Pretrain/Loss": 2.0764594078063965, "Pretrain/Loss (Raw)": 1.9701042175292969, "Pretrain/Step": 2361, "Pretrain/Step Time": 8.503819426521659} +{"Pretrain/Learning Rate": 4.404030394439535e-05, "Pretrain/Loss": 2.0751781463623047, "Pretrain/Loss (Raw)": 1.9143732786178589, "Pretrain/Step": 2362, "Pretrain/Step Time": 8.50781731493771} +{"Pretrain/Learning Rate": 4.4034801127641336e-05, "Pretrain/Loss": 2.0772125720977783, "Pretrain/Loss (Raw)": 2.1706931591033936, "Pretrain/Step": 2363, "Pretrain/Step Time": 8.503611704334617} +{"Pretrain/Learning Rate": 4.4029296115704366e-05, "Pretrain/Loss": 2.0746798515319824, "Pretrain/Loss (Raw)": 1.7394651174545288, "Pretrain/Step": 2364, "Pretrain/Step Time": 8.504942433908582} +{"Pretrain/Learning Rate": 4.40237889092193e-05, "Pretrain/Loss": 2.076936721801758, "Pretrain/Loss (Raw)": 2.283167839050293, "Pretrain/Step": 2365, "Pretrain/Step Time": 8.510027058422565} +{"Pretrain/Learning Rate": 4.401827950882125e-05, "Pretrain/Loss": 2.079305648803711, "Pretrain/Loss (Raw)": 2.17868709564209, "Pretrain/Step": 2366, "Pretrain/Step Time": 8.516316778957844} +{"Pretrain/Learning Rate": 4.4012767915145594e-05, "Pretrain/Loss": 2.0863475799560547, "Pretrain/Loss (Raw)": 2.747852087020874, "Pretrain/Step": 2367, "Pretrain/Step Time": 8.516814840957522} +{"Pretrain/Learning Rate": 4.400725412882794e-05, "Pretrain/Loss": 2.0857768058776855, "Pretrain/Loss (Raw)": 1.8543716669082642, "Pretrain/Step": 2368, "Pretrain/Step Time": 8.516272876411676} +{"Pretrain/Learning Rate": 4.400173815050418e-05, "Pretrain/Loss": 2.0861012935638428, "Pretrain/Loss (Raw)": 2.12107515335083, "Pretrain/Step": 2369, "Pretrain/Step Time": 8.513613194227219} +{"Pretrain/Learning Rate": 4.399621998081045e-05, "Pretrain/Loss": 2.086538076400757, "Pretrain/Loss (Raw)": 2.1528213024139404, "Pretrain/Step": 2370, "Pretrain/Step Time": 8.502782557159662} +{"Pretrain/Learning Rate": 4.39906996203831e-05, "Pretrain/Loss": 2.0872931480407715, "Pretrain/Loss (Raw)": 2.138745069503784, "Pretrain/Step": 2371, "Pretrain/Step Time": 8.501320894807577} +{"Pretrain/Learning Rate": 4.398517706985879e-05, "Pretrain/Loss": 2.087413787841797, "Pretrain/Loss (Raw)": 2.1060140132904053, "Pretrain/Step": 2372, "Pretrain/Step Time": 8.508391249924898} +{"Pretrain/Learning Rate": 4.39796523298744e-05, "Pretrain/Loss": 2.08601450920105, "Pretrain/Loss (Raw)": 1.9551165103912354, "Pretrain/Step": 2373, "Pretrain/Step Time": 8.515870206058025} +{"Pretrain/Learning Rate": 4.397412540106707e-05, "Pretrain/Loss": 2.085484504699707, "Pretrain/Loss (Raw)": 1.9726073741912842, "Pretrain/Step": 2374, "Pretrain/Step Time": 8.515293972566724} +{"Pretrain/Learning Rate": 4.396859628407418e-05, "Pretrain/Loss": 2.0845632553100586, "Pretrain/Loss (Raw)": 2.020111560821533, "Pretrain/Step": 2375, "Pretrain/Step Time": 8.515208508819342} +{"Pretrain/Learning Rate": 4.39630649795334e-05, "Pretrain/Loss": 2.0860190391540527, "Pretrain/Loss (Raw)": 2.1482667922973633, "Pretrain/Step": 2376, "Pretrain/Step Time": 8.510848762467504} +{"Pretrain/Learning Rate": 4.3957531488082595e-05, "Pretrain/Loss": 2.0848846435546875, "Pretrain/Loss (Raw)": 1.9927006959915161, "Pretrain/Step": 2377, "Pretrain/Step Time": 8.505481623113155} +{"Pretrain/Learning Rate": 4.395199581035994e-05, "Pretrain/Loss": 2.0852174758911133, "Pretrain/Loss (Raw)": 2.0563604831695557, "Pretrain/Step": 2378, "Pretrain/Step Time": 8.508302681148052} +{"Pretrain/Learning Rate": 4.3946457947003813e-05, "Pretrain/Loss": 2.086258888244629, "Pretrain/Loss (Raw)": 2.0410685539245605, "Pretrain/Step": 2379, "Pretrain/Step Time": 8.509456146508455} +{"Pretrain/Learning Rate": 4.394091789865288e-05, "Pretrain/Loss": 2.0873591899871826, "Pretrain/Loss (Raw)": 2.1746408939361572, "Pretrain/Step": 2380, "Pretrain/Step Time": 8.515409205108881} +{"Pretrain/Learning Rate": 4.393537566594605e-05, "Pretrain/Loss": 2.0874099731445312, "Pretrain/Loss (Raw)": 2.064918041229248, "Pretrain/Step": 2381, "Pretrain/Step Time": 8.514676675200462} +{"Pretrain/Learning Rate": 4.392983124952246e-05, "Pretrain/Loss": 2.0854408740997314, "Pretrain/Loss (Raw)": 1.9275580644607544, "Pretrain/Step": 2382, "Pretrain/Step Time": 8.506239822134376} +{"Pretrain/Learning Rate": 4.392428465002154e-05, "Pretrain/Loss": 2.0852980613708496, "Pretrain/Loss (Raw)": 2.1529815196990967, "Pretrain/Step": 2383, "Pretrain/Step Time": 8.514349369332194} +{"Pretrain/Learning Rate": 4.391873586808294e-05, "Pretrain/Loss": 2.0865836143493652, "Pretrain/Loss (Raw)": 2.2175753116607666, "Pretrain/Step": 2384, "Pretrain/Step Time": 8.517869897186756} +{"Pretrain/Learning Rate": 4.391318490434656e-05, "Pretrain/Loss": 2.086008071899414, "Pretrain/Loss (Raw)": 2.1076464653015137, "Pretrain/Step": 2385, "Pretrain/Step Time": 8.51896839775145} +{"Pretrain/Learning Rate": 4.3907631759452584e-05, "Pretrain/Loss": 2.0901856422424316, "Pretrain/Loss (Raw)": 2.1824092864990234, "Pretrain/Step": 2386, "Pretrain/Step Time": 8.519247002899647} +{"Pretrain/Learning Rate": 4.3902076434041416e-05, "Pretrain/Loss": 2.0885729789733887, "Pretrain/Loss (Raw)": 1.9986116886138916, "Pretrain/Step": 2387, "Pretrain/Step Time": 8.506910527125001} +{"Pretrain/Learning Rate": 4.389651892875373e-05, "Pretrain/Loss": 2.090160846710205, "Pretrain/Loss (Raw)": 2.282074213027954, "Pretrain/Step": 2388, "Pretrain/Step Time": 8.501624573022127} +{"Pretrain/Learning Rate": 4.389095924423043e-05, "Pretrain/Loss": 2.087186574935913, "Pretrain/Loss (Raw)": 1.820978045463562, "Pretrain/Step": 2389, "Pretrain/Step Time": 8.50387941673398} +{"Pretrain/Learning Rate": 4.388539738111269e-05, "Pretrain/Loss": 2.0885770320892334, "Pretrain/Loss (Raw)": 2.126267671585083, "Pretrain/Step": 2390, "Pretrain/Step Time": 8.512619081884623} +{"Pretrain/Learning Rate": 4.387983334004194e-05, "Pretrain/Loss": 2.088374376296997, "Pretrain/Loss (Raw)": 2.1870779991149902, "Pretrain/Step": 2391, "Pretrain/Step Time": 8.515314642339945} +{"Pretrain/Learning Rate": 4.387426712165984e-05, "Pretrain/Loss": 2.09059476852417, "Pretrain/Loss (Raw)": 2.251955032348633, "Pretrain/Step": 2392, "Pretrain/Step Time": 8.51432491466403} +{"Pretrain/Learning Rate": 4.3868698726608325e-05, "Pretrain/Loss": 2.090588092803955, "Pretrain/Loss (Raw)": 2.0187957286834717, "Pretrain/Step": 2393, "Pretrain/Step Time": 8.509408419951797} +{"Pretrain/Learning Rate": 4.3863128155529554e-05, "Pretrain/Loss": 2.0913522243499756, "Pretrain/Loss (Raw)": 2.331512689590454, "Pretrain/Step": 2394, "Pretrain/Step Time": 8.50841978751123} +{"Pretrain/Learning Rate": 4.385755540906595e-05, "Pretrain/Loss": 2.092575788497925, "Pretrain/Loss (Raw)": 2.1051132678985596, "Pretrain/Step": 2395, "Pretrain/Step Time": 8.504238605499268} +{"Pretrain/Learning Rate": 4.385198048786021e-05, "Pretrain/Loss": 2.0923736095428467, "Pretrain/Loss (Raw)": 2.045311212539673, "Pretrain/Step": 2396, "Pretrain/Step Time": 8.50589556619525} +{"Pretrain/Learning Rate": 4.384640339255525e-05, "Pretrain/Loss": 2.0926671028137207, "Pretrain/Loss (Raw)": 2.080213785171509, "Pretrain/Step": 2397, "Pretrain/Step Time": 8.507566506043077} +{"Pretrain/Learning Rate": 4.384082412379423e-05, "Pretrain/Loss": 2.095644474029541, "Pretrain/Loss (Raw)": 2.474198579788208, "Pretrain/Step": 2398, "Pretrain/Step Time": 8.513631479814649} +{"Pretrain/Learning Rate": 4.38352426822206e-05, "Pretrain/Loss": 2.092542886734009, "Pretrain/Loss (Raw)": 1.9239944219589233, "Pretrain/Step": 2399, "Pretrain/Step Time": 8.510012028738856} +{"Pretrain/Learning Rate": 4.3829659068478026e-05, "Pretrain/Loss": 2.091315746307373, "Pretrain/Loss (Raw)": 2.0065484046936035, "Pretrain/Step": 2400, "Pretrain/Step Time": 8.508426893502474} +{"Pretrain/Learning Rate": 4.3824073283210445e-05, "Pretrain/Loss": 2.091442108154297, "Pretrain/Loss (Raw)": 2.140425682067871, "Pretrain/Step": 2401, "Pretrain/Step Time": 8.512668928131461} +{"Pretrain/Learning Rate": 4.381848532706202e-05, "Pretrain/Loss": 2.087984561920166, "Pretrain/Loss (Raw)": 1.8537284135818481, "Pretrain/Step": 2402, "Pretrain/Step Time": 8.511605309322476} +{"Pretrain/Learning Rate": 4.38128952006772e-05, "Pretrain/Loss": 2.0850844383239746, "Pretrain/Loss (Raw)": 1.8150287866592407, "Pretrain/Step": 2403, "Pretrain/Step Time": 8.518310168758035} +{"Pretrain/Learning Rate": 4.380730290470065e-05, "Pretrain/Loss": 2.0845541954040527, "Pretrain/Loss (Raw)": 2.009453535079956, "Pretrain/Step": 2404, "Pretrain/Step Time": 8.515069348737597} +{"Pretrain/Learning Rate": 4.380170843977731e-05, "Pretrain/Loss": 2.08257794380188, "Pretrain/Loss (Raw)": 2.0146079063415527, "Pretrain/Step": 2405, "Pretrain/Step Time": 8.509939059615135} +{"Pretrain/Learning Rate": 4.3796111806552364e-05, "Pretrain/Loss": 2.082709312438965, "Pretrain/Loss (Raw)": 2.1787002086639404, "Pretrain/Step": 2406, "Pretrain/Step Time": 8.503142073750496} +{"Pretrain/Learning Rate": 4.379051300567123e-05, "Pretrain/Loss": 2.0839133262634277, "Pretrain/Loss (Raw)": 2.022749662399292, "Pretrain/Step": 2407, "Pretrain/Step Time": 8.505110669881105} +{"Pretrain/Learning Rate": 4.378491203777958e-05, "Pretrain/Loss": 2.085084915161133, "Pretrain/Loss (Raw)": 2.0298798084259033, "Pretrain/Step": 2408, "Pretrain/Step Time": 8.51418380253017} +{"Pretrain/Learning Rate": 4.377930890352337e-05, "Pretrain/Loss": 2.085832118988037, "Pretrain/Loss (Raw)": 2.047029733657837, "Pretrain/Step": 2409, "Pretrain/Step Time": 8.515670403838158} +{"Pretrain/Learning Rate": 4.3773703603548765e-05, "Pretrain/Loss": 2.0873453617095947, "Pretrain/Loss (Raw)": 2.2417702674865723, "Pretrain/Step": 2410, "Pretrain/Step Time": 8.513819195330143} +{"Pretrain/Learning Rate": 4.3768096138502194e-05, "Pretrain/Loss": 2.0875658988952637, "Pretrain/Loss (Raw)": 2.2175557613372803, "Pretrain/Step": 2411, "Pretrain/Step Time": 8.50485259667039} +{"Pretrain/Learning Rate": 4.376248650903033e-05, "Pretrain/Loss": 2.0882039070129395, "Pretrain/Loss (Raw)": 2.1753957271575928, "Pretrain/Step": 2412, "Pretrain/Step Time": 8.506119344383478} +{"Pretrain/Learning Rate": 4.375687471578011e-05, "Pretrain/Loss": 2.0859262943267822, "Pretrain/Loss (Raw)": 1.8658024072647095, "Pretrain/Step": 2413, "Pretrain/Step Time": 8.50483276695013} +{"Pretrain/Learning Rate": 4.375126075939873e-05, "Pretrain/Loss": 2.0859215259552, "Pretrain/Loss (Raw)": 2.019530773162842, "Pretrain/Step": 2414, "Pretrain/Step Time": 8.51090531423688} +{"Pretrain/Learning Rate": 4.374564464053359e-05, "Pretrain/Loss": 2.084726572036743, "Pretrain/Loss (Raw)": 2.1434736251831055, "Pretrain/Step": 2415, "Pretrain/Step Time": 8.51726882532239} +{"Pretrain/Learning Rate": 4.374002635983238e-05, "Pretrain/Loss": 2.0835418701171875, "Pretrain/Loss (Raw)": 2.1563451290130615, "Pretrain/Step": 2416, "Pretrain/Step Time": 8.516406454145908} +{"Pretrain/Learning Rate": 4.373440591794301e-05, "Pretrain/Loss": 2.082672595977783, "Pretrain/Loss (Raw)": 2.0095763206481934, "Pretrain/Step": 2417, "Pretrain/Step Time": 8.50221723690629} +{"Pretrain/Learning Rate": 4.372878331551369e-05, "Pretrain/Loss": 2.081562042236328, "Pretrain/Loss (Raw)": 1.9905461072921753, "Pretrain/Step": 2418, "Pretrain/Step Time": 8.504832154139876} +{"Pretrain/Learning Rate": 4.3723158553192813e-05, "Pretrain/Loss": 2.0813965797424316, "Pretrain/Loss (Raw)": 2.1332037448883057, "Pretrain/Step": 2419, "Pretrain/Step Time": 8.511784542351961} +{"Pretrain/Learning Rate": 4.3717531631629075e-05, "Pretrain/Loss": 2.082479953765869, "Pretrain/Loss (Raw)": 2.149405002593994, "Pretrain/Step": 2420, "Pretrain/Step Time": 8.510108053684235} +{"Pretrain/Learning Rate": 4.371190255147138e-05, "Pretrain/Loss": 2.0825252532958984, "Pretrain/Loss (Raw)": 2.166193962097168, "Pretrain/Step": 2421, "Pretrain/Step Time": 8.519226096570492} +{"Pretrain/Learning Rate": 4.370627131336891e-05, "Pretrain/Loss": 2.0837254524230957, "Pretrain/Loss (Raw)": 2.249703884124756, "Pretrain/Step": 2422, "Pretrain/Step Time": 8.513511426746845} +{"Pretrain/Learning Rate": 4.370063791797109e-05, "Pretrain/Loss": 2.081785202026367, "Pretrain/Loss (Raw)": 2.1635522842407227, "Pretrain/Step": 2423, "Pretrain/Step Time": 8.51059715077281} +{"Pretrain/Learning Rate": 4.3695002365927584e-05, "Pretrain/Loss": 2.082643985748291, "Pretrain/Loss (Raw)": 2.1050477027893066, "Pretrain/Step": 2424, "Pretrain/Step Time": 8.508678557351232} +{"Pretrain/Learning Rate": 4.368936465788831e-05, "Pretrain/Loss": 2.0808918476104736, "Pretrain/Loss (Raw)": 2.0183067321777344, "Pretrain/Step": 2425, "Pretrain/Step Time": 8.508577669039369} +{"Pretrain/Learning Rate": 4.3683724794503436e-05, "Pretrain/Loss": 2.0793721675872803, "Pretrain/Loss (Raw)": 1.921761393547058, "Pretrain/Step": 2426, "Pretrain/Step Time": 8.506371887400746} +{"Pretrain/Learning Rate": 4.367808277642338e-05, "Pretrain/Loss": 2.079806327819824, "Pretrain/Loss (Raw)": 2.0344924926757812, "Pretrain/Step": 2427, "Pretrain/Step Time": 8.50909092091024} +{"Pretrain/Learning Rate": 4.3672438604298806e-05, "Pretrain/Loss": 2.081393003463745, "Pretrain/Loss (Raw)": 2.1039326190948486, "Pretrain/Step": 2428, "Pretrain/Step Time": 8.507547473534942} +{"Pretrain/Learning Rate": 4.3666792278780625e-05, "Pretrain/Loss": 2.0815207958221436, "Pretrain/Loss (Raw)": 2.1507568359375, "Pretrain/Step": 2429, "Pretrain/Step Time": 8.504714358597994} +{"Pretrain/Learning Rate": 4.366114380051999e-05, "Pretrain/Loss": 2.0799598693847656, "Pretrain/Loss (Raw)": 1.9626734256744385, "Pretrain/Step": 2430, "Pretrain/Step Time": 8.503306644037366} +{"Pretrain/Learning Rate": 4.365549317016832e-05, "Pretrain/Loss": 2.0791573524475098, "Pretrain/Loss (Raw)": 2.054988145828247, "Pretrain/Step": 2431, "Pretrain/Step Time": 8.513144185766578} +{"Pretrain/Learning Rate": 4.364984038837727e-05, "Pretrain/Loss": 2.0811729431152344, "Pretrain/Loss (Raw)": 2.208791971206665, "Pretrain/Step": 2432, "Pretrain/Step Time": 8.512103801593184} +{"Pretrain/Learning Rate": 4.364418545579875e-05, "Pretrain/Loss": 2.079756736755371, "Pretrain/Loss (Raw)": 2.045258045196533, "Pretrain/Step": 2433, "Pretrain/Step Time": 8.51149632036686} +{"Pretrain/Learning Rate": 4.363852837308491e-05, "Pretrain/Loss": 2.079357147216797, "Pretrain/Loss (Raw)": 2.046370029449463, "Pretrain/Step": 2434, "Pretrain/Step Time": 8.509622843936086} +{"Pretrain/Learning Rate": 4.3632869140888144e-05, "Pretrain/Loss": 2.0797243118286133, "Pretrain/Loss (Raw)": 2.0405144691467285, "Pretrain/Step": 2435, "Pretrain/Step Time": 8.496779991313815} +{"Pretrain/Learning Rate": 4.362720775986111e-05, "Pretrain/Loss": 2.0780484676361084, "Pretrain/Loss (Raw)": 1.8132654428482056, "Pretrain/Step": 2436, "Pretrain/Step Time": 8.499907774850726} +{"Pretrain/Learning Rate": 4.362154423065671e-05, "Pretrain/Loss": 2.077907085418701, "Pretrain/Loss (Raw)": 2.0546646118164062, "Pretrain/Step": 2437, "Pretrain/Step Time": 8.508005701005459} +{"Pretrain/Learning Rate": 4.361587855392807e-05, "Pretrain/Loss": 2.078812599182129, "Pretrain/Loss (Raw)": 2.106205940246582, "Pretrain/Step": 2438, "Pretrain/Step Time": 8.50939879193902} +{"Pretrain/Learning Rate": 4.3610210730328604e-05, "Pretrain/Loss": 2.0784130096435547, "Pretrain/Loss (Raw)": 2.0401151180267334, "Pretrain/Step": 2439, "Pretrain/Step Time": 8.512342045083642} +{"Pretrain/Learning Rate": 4.3604540760511935e-05, "Pretrain/Loss": 2.0770106315612793, "Pretrain/Loss (Raw)": 1.9089512825012207, "Pretrain/Step": 2440, "Pretrain/Step Time": 8.511162577196956} +{"Pretrain/Learning Rate": 4.3598868645131964e-05, "Pretrain/Loss": 2.0774590969085693, "Pretrain/Loss (Raw)": 2.0155038833618164, "Pretrain/Step": 2441, "Pretrain/Step Time": 8.499016784131527} +{"Pretrain/Learning Rate": 4.359319438484282e-05, "Pretrain/Loss": 2.075645923614502, "Pretrain/Loss (Raw)": 1.9136708974838257, "Pretrain/Step": 2442, "Pretrain/Step Time": 8.509043782949448} +{"Pretrain/Learning Rate": 4.358751798029887e-05, "Pretrain/Loss": 2.0746889114379883, "Pretrain/Loss (Raw)": 1.7523009777069092, "Pretrain/Step": 2443, "Pretrain/Step Time": 8.51559123210609} +{"Pretrain/Learning Rate": 4.358183943215478e-05, "Pretrain/Loss": 2.074389934539795, "Pretrain/Loss (Raw)": 2.1892952919006348, "Pretrain/Step": 2444, "Pretrain/Step Time": 8.51146586239338} +{"Pretrain/Learning Rate": 4.3576158741065395e-05, "Pretrain/Loss": 2.0721399784088135, "Pretrain/Loss (Raw)": 2.1100971698760986, "Pretrain/Step": 2445, "Pretrain/Step Time": 8.511556413024664} +{"Pretrain/Learning Rate": 4.357047590768586e-05, "Pretrain/Loss": 2.0716426372528076, "Pretrain/Loss (Raw)": 2.093311071395874, "Pretrain/Step": 2446, "Pretrain/Step Time": 8.503891974687576} +{"Pretrain/Learning Rate": 4.356479093267153e-05, "Pretrain/Loss": 2.073741912841797, "Pretrain/Loss (Raw)": 2.060122489929199, "Pretrain/Step": 2447, "Pretrain/Step Time": 8.503450063988566} +{"Pretrain/Learning Rate": 4.355910381667803e-05, "Pretrain/Loss": 2.0732429027557373, "Pretrain/Loss (Raw)": 2.092780590057373, "Pretrain/Step": 2448, "Pretrain/Step Time": 8.507558373734355} +{"Pretrain/Learning Rate": 4.355341456036122e-05, "Pretrain/Loss": 2.073183298110962, "Pretrain/Loss (Raw)": 1.8971134424209595, "Pretrain/Step": 2449, "Pretrain/Step Time": 8.511236807331443} +{"Pretrain/Learning Rate": 4.354772316437722e-05, "Pretrain/Loss": 2.073312759399414, "Pretrain/Loss (Raw)": 2.134486436843872, "Pretrain/Step": 2450, "Pretrain/Step Time": 8.514103785157204} +{"Pretrain/Learning Rate": 4.354202962938239e-05, "Pretrain/Loss": 2.071765899658203, "Pretrain/Loss (Raw)": 1.9416744709014893, "Pretrain/Step": 2451, "Pretrain/Step Time": 8.517487615346909} +{"Pretrain/Learning Rate": 4.353633395603332e-05, "Pretrain/Loss": 2.0731117725372314, "Pretrain/Loss (Raw)": 2.1530649662017822, "Pretrain/Step": 2452, "Pretrain/Step Time": 8.508863048627973} +{"Pretrain/Learning Rate": 4.353063614498688e-05, "Pretrain/Loss": 2.073152780532837, "Pretrain/Loss (Raw)": 2.055898427963257, "Pretrain/Step": 2453, "Pretrain/Step Time": 8.497677193954587} +{"Pretrain/Learning Rate": 4.352493619690016e-05, "Pretrain/Loss": 2.0720553398132324, "Pretrain/Loss (Raw)": 1.953863501548767, "Pretrain/Step": 2454, "Pretrain/Step Time": 8.492110257968307} +{"Pretrain/Learning Rate": 4.351923411243049e-05, "Pretrain/Loss": 2.072503089904785, "Pretrain/Loss (Raw)": 2.18180775642395, "Pretrain/Step": 2455, "Pretrain/Step Time": 8.493471747264266} +{"Pretrain/Learning Rate": 4.35135298922355e-05, "Pretrain/Loss": 2.07326602935791, "Pretrain/Loss (Raw)": 2.0715091228485107, "Pretrain/Step": 2456, "Pretrain/Step Time": 8.506617087870836} +{"Pretrain/Learning Rate": 4.350782353697299e-05, "Pretrain/Loss": 2.077282667160034, "Pretrain/Loss (Raw)": 2.260350227355957, "Pretrain/Step": 2457, "Pretrain/Step Time": 8.509817769750953} +{"Pretrain/Learning Rate": 4.350211504730106e-05, "Pretrain/Loss": 2.0769834518432617, "Pretrain/Loss (Raw)": 2.142854928970337, "Pretrain/Step": 2458, "Pretrain/Step Time": 8.509420642629266} +{"Pretrain/Learning Rate": 4.3496404423878045e-05, "Pretrain/Loss": 2.075301170349121, "Pretrain/Loss (Raw)": 1.894667387008667, "Pretrain/Step": 2459, "Pretrain/Step Time": 8.508919335901737} +{"Pretrain/Learning Rate": 4.349069166736251e-05, "Pretrain/Loss": 2.07456111907959, "Pretrain/Loss (Raw)": 1.9589165449142456, "Pretrain/Step": 2460, "Pretrain/Step Time": 8.506416713818908} +{"Pretrain/Learning Rate": 4.348497677841328e-05, "Pretrain/Loss": 2.074601888656616, "Pretrain/Loss (Raw)": 2.209089517593384, "Pretrain/Step": 2461, "Pretrain/Step Time": 8.51446009427309} +{"Pretrain/Learning Rate": 4.3479259757689427e-05, "Pretrain/Loss": 2.0760655403137207, "Pretrain/Loss (Raw)": 2.195111036300659, "Pretrain/Step": 2462, "Pretrain/Step Time": 8.5151455886662} +{"Pretrain/Learning Rate": 4.347354060585026e-05, "Pretrain/Loss": 2.0768871307373047, "Pretrain/Loss (Raw)": 2.0710179805755615, "Pretrain/Step": 2463, "Pretrain/Step Time": 8.516133191064} +{"Pretrain/Learning Rate": 4.346781932355533e-05, "Pretrain/Loss": 2.0778019428253174, "Pretrain/Loss (Raw)": 2.3574612140655518, "Pretrain/Step": 2464, "Pretrain/Step Time": 8.510846124961972} +{"Pretrain/Learning Rate": 4.3462095911464465e-05, "Pretrain/Loss": 2.0776093006134033, "Pretrain/Loss (Raw)": 2.1586060523986816, "Pretrain/Step": 2465, "Pretrain/Step Time": 8.504410030320287} +{"Pretrain/Learning Rate": 4.34563703702377e-05, "Pretrain/Loss": 2.0783958435058594, "Pretrain/Loss (Raw)": 2.1010758876800537, "Pretrain/Step": 2466, "Pretrain/Step Time": 8.512151475995779} +{"Pretrain/Learning Rate": 4.3450642700535335e-05, "Pretrain/Loss": 2.078258752822876, "Pretrain/Loss (Raw)": 1.969538688659668, "Pretrain/Step": 2467, "Pretrain/Step Time": 8.514490215107799} +{"Pretrain/Learning Rate": 4.344491290301791e-05, "Pretrain/Loss": 2.077704906463623, "Pretrain/Loss (Raw)": 2.1183857917785645, "Pretrain/Step": 2468, "Pretrain/Step Time": 8.520168390125036} +{"Pretrain/Learning Rate": 4.3439180978346216e-05, "Pretrain/Loss": 2.077848196029663, "Pretrain/Loss (Raw)": 2.0494210720062256, "Pretrain/Step": 2469, "Pretrain/Step Time": 8.516761934384704} +{"Pretrain/Learning Rate": 4.3433446927181274e-05, "Pretrain/Loss": 2.077998399734497, "Pretrain/Loss (Raw)": 2.143434524536133, "Pretrain/Step": 2470, "Pretrain/Step Time": 8.513475455343723} +{"Pretrain/Learning Rate": 4.342771075018438e-05, "Pretrain/Loss": 2.0785984992980957, "Pretrain/Loss (Raw)": 2.2104947566986084, "Pretrain/Step": 2471, "Pretrain/Step Time": 8.50752235762775} +{"Pretrain/Learning Rate": 4.342197244801705e-05, "Pretrain/Loss": 2.0828802585601807, "Pretrain/Loss (Raw)": 2.5796010494232178, "Pretrain/Step": 2472, "Pretrain/Step Time": 8.503650058060884} +{"Pretrain/Learning Rate": 4.341623202134105e-05, "Pretrain/Loss": 2.0835909843444824, "Pretrain/Loss (Raw)": 2.131910562515259, "Pretrain/Step": 2473, "Pretrain/Step Time": 8.5136455912143} +{"Pretrain/Learning Rate": 4.341048947081839e-05, "Pretrain/Loss": 2.083233118057251, "Pretrain/Loss (Raw)": 1.881608247756958, "Pretrain/Step": 2474, "Pretrain/Step Time": 8.516696082428098} +{"Pretrain/Learning Rate": 4.340474479711133e-05, "Pretrain/Loss": 2.0837185382843018, "Pretrain/Loss (Raw)": 2.229618549346924, "Pretrain/Step": 2475, "Pretrain/Step Time": 8.51453061401844} +{"Pretrain/Learning Rate": 4.3398998000882375e-05, "Pretrain/Loss": 2.083432197570801, "Pretrain/Loss (Raw)": 2.1355249881744385, "Pretrain/Step": 2476, "Pretrain/Step Time": 8.508641935884953} +{"Pretrain/Learning Rate": 4.339324908279427e-05, "Pretrain/Loss": 2.081350326538086, "Pretrain/Loss (Raw)": 1.989452600479126, "Pretrain/Step": 2477, "Pretrain/Step Time": 8.50494789890945} +{"Pretrain/Learning Rate": 4.338749804351001e-05, "Pretrain/Loss": 2.081279754638672, "Pretrain/Loss (Raw)": 2.087374687194824, "Pretrain/Step": 2478, "Pretrain/Step Time": 8.514853373169899} +{"Pretrain/Learning Rate": 4.338174488369283e-05, "Pretrain/Loss": 2.080259323120117, "Pretrain/Loss (Raw)": 2.024848699569702, "Pretrain/Step": 2479, "Pretrain/Step Time": 8.51802073046565} +{"Pretrain/Learning Rate": 4.337598960400622e-05, "Pretrain/Loss": 2.0811820030212402, "Pretrain/Loss (Raw)": 2.0364391803741455, "Pretrain/Step": 2480, "Pretrain/Step Time": 8.518310019746423} +{"Pretrain/Learning Rate": 4.337023220511389e-05, "Pretrain/Loss": 2.079803943634033, "Pretrain/Loss (Raw)": 1.969878911972046, "Pretrain/Step": 2481, "Pretrain/Step Time": 8.516433138400316} +{"Pretrain/Learning Rate": 4.336447268767982e-05, "Pretrain/Loss": 2.083009958267212, "Pretrain/Loss (Raw)": 2.172217845916748, "Pretrain/Step": 2482, "Pretrain/Step Time": 8.51354849524796} +{"Pretrain/Learning Rate": 4.3358711052368224e-05, "Pretrain/Loss": 2.0846917629241943, "Pretrain/Loss (Raw)": 2.1163785457611084, "Pretrain/Step": 2483, "Pretrain/Step Time": 8.504319112747908} +{"Pretrain/Learning Rate": 4.335294729984356e-05, "Pretrain/Loss": 2.0825839042663574, "Pretrain/Loss (Raw)": 1.9428653717041016, "Pretrain/Step": 2484, "Pretrain/Step Time": 8.505221527069807} +{"Pretrain/Learning Rate": 4.334718143077054e-05, "Pretrain/Loss": 2.082418203353882, "Pretrain/Loss (Raw)": 1.933902382850647, "Pretrain/Step": 2485, "Pretrain/Step Time": 8.505762670189142} +{"Pretrain/Learning Rate": 4.334141344581408e-05, "Pretrain/Loss": 2.0765419006347656, "Pretrain/Loss (Raw)": 1.4971375465393066, "Pretrain/Step": 2486, "Pretrain/Step Time": 8.511871701106429} +{"Pretrain/Learning Rate": 4.3335643345639414e-05, "Pretrain/Loss": 2.0796799659729004, "Pretrain/Loss (Raw)": 2.3323655128479004, "Pretrain/Step": 2487, "Pretrain/Step Time": 8.510961715131998} +{"Pretrain/Learning Rate": 4.332987113091195e-05, "Pretrain/Loss": 2.0775203704833984, "Pretrain/Loss (Raw)": 1.9508005380630493, "Pretrain/Step": 2488, "Pretrain/Step Time": 8.512533055618405} +{"Pretrain/Learning Rate": 4.332409680229737e-05, "Pretrain/Loss": 2.0775928497314453, "Pretrain/Loss (Raw)": 1.979374647140503, "Pretrain/Step": 2489, "Pretrain/Step Time": 8.508624223992229} +{"Pretrain/Learning Rate": 4.3318320360461616e-05, "Pretrain/Loss": 2.080970525741577, "Pretrain/Loss (Raw)": 2.3467564582824707, "Pretrain/Step": 2490, "Pretrain/Step Time": 8.509871885180473} +{"Pretrain/Learning Rate": 4.331254180607083e-05, "Pretrain/Loss": 2.080395221710205, "Pretrain/Loss (Raw)": 2.0970375537872314, "Pretrain/Step": 2491, "Pretrain/Step Time": 8.51597986370325} +{"Pretrain/Learning Rate": 4.330676113979143e-05, "Pretrain/Loss": 2.082355499267578, "Pretrain/Loss (Raw)": 1.990385890007019, "Pretrain/Step": 2492, "Pretrain/Step Time": 8.514432305470109} +{"Pretrain/Learning Rate": 4.330097836229007e-05, "Pretrain/Loss": 2.08089280128479, "Pretrain/Loss (Raw)": 2.0959513187408447, "Pretrain/Step": 2493, "Pretrain/Step Time": 8.509974839165807} +{"Pretrain/Learning Rate": 4.3295193474233655e-05, "Pretrain/Loss": 2.0753934383392334, "Pretrain/Loss (Raw)": 1.4747564792633057, "Pretrain/Step": 2494, "Pretrain/Step Time": 8.506241811439395} +{"Pretrain/Learning Rate": 4.328940647628931e-05, "Pretrain/Loss": 2.0691628456115723, "Pretrain/Loss (Raw)": 1.9503083229064941, "Pretrain/Step": 2495, "Pretrain/Step Time": 8.505186269059777} +{"Pretrain/Learning Rate": 4.328361736912443e-05, "Pretrain/Loss": 2.0711798667907715, "Pretrain/Loss (Raw)": 2.112586498260498, "Pretrain/Step": 2496, "Pretrain/Step Time": 8.51331888511777} +{"Pretrain/Learning Rate": 4.3277826153406644e-05, "Pretrain/Loss": 2.071037769317627, "Pretrain/Loss (Raw)": 2.102851152420044, "Pretrain/Step": 2497, "Pretrain/Step Time": 8.515549305826426} +{"Pretrain/Learning Rate": 4.327203282980382e-05, "Pretrain/Loss": 2.069995880126953, "Pretrain/Loss (Raw)": 2.019498825073242, "Pretrain/Step": 2498, "Pretrain/Step Time": 8.517237946391106} +{"Pretrain/Learning Rate": 4.326623739898406e-05, "Pretrain/Loss": 2.0697360038757324, "Pretrain/Loss (Raw)": 2.105478048324585, "Pretrain/Step": 2499, "Pretrain/Step Time": 8.518051788210869} +{"Pretrain/Learning Rate": 4.3260439861615734e-05, "Pretrain/Loss": 2.0680627822875977, "Pretrain/Loss (Raw)": 1.891796588897705, "Pretrain/Step": 2500, "Pretrain/Step Time": 8.509793283417821} +{"Pretrain/Learning Rate": 4.325464021836744e-05, "Pretrain/Loss": 2.068873882293701, "Pretrain/Loss (Raw)": 2.0589547157287598, "Pretrain/Step": 2501, "Pretrain/Step Time": 8.509542293846607} +{"Pretrain/Learning Rate": 4.3248838469908016e-05, "Pretrain/Loss": 2.068445920944214, "Pretrain/Loss (Raw)": 1.9178458452224731, "Pretrain/Step": 2502, "Pretrain/Step Time": 8.512542933225632} +{"Pretrain/Learning Rate": 4.324303461690655e-05, "Pretrain/Loss": 2.0682291984558105, "Pretrain/Loss (Raw)": 1.992344856262207, "Pretrain/Step": 2503, "Pretrain/Step Time": 8.513179942965508} +{"Pretrain/Learning Rate": 4.3237228660032355e-05, "Pretrain/Loss": 2.0676040649414062, "Pretrain/Loss (Raw)": 2.0682830810546875, "Pretrain/Step": 2504, "Pretrain/Step Time": 8.514532448723912} +{"Pretrain/Learning Rate": 4.323142059995503e-05, "Pretrain/Loss": 2.06719970703125, "Pretrain/Loss (Raw)": 1.9409459829330444, "Pretrain/Step": 2505, "Pretrain/Step Time": 8.509996032342315} +{"Pretrain/Learning Rate": 4.3225610437344363e-05, "Pretrain/Loss": 2.0699925422668457, "Pretrain/Loss (Raw)": 2.4138453006744385, "Pretrain/Step": 2506, "Pretrain/Step Time": 8.50293086282909} +{"Pretrain/Learning Rate": 4.321979817287043e-05, "Pretrain/Loss": 2.0697989463806152, "Pretrain/Loss (Raw)": 2.016282558441162, "Pretrain/Step": 2507, "Pretrain/Step Time": 8.50740821287036} +{"Pretrain/Learning Rate": 4.32139838072035e-05, "Pretrain/Loss": 2.070803642272949, "Pretrain/Loss (Raw)": 2.303215503692627, "Pretrain/Step": 2508, "Pretrain/Step Time": 8.511152626946568} +{"Pretrain/Learning Rate": 4.320816734101415e-05, "Pretrain/Loss": 2.0711793899536133, "Pretrain/Loss (Raw)": 2.113032579421997, "Pretrain/Step": 2509, "Pretrain/Step Time": 8.510683115571737} +{"Pretrain/Learning Rate": 4.320234877497313e-05, "Pretrain/Loss": 2.0719218254089355, "Pretrain/Loss (Raw)": 2.0225906372070312, "Pretrain/Step": 2510, "Pretrain/Step Time": 8.51035807095468} +{"Pretrain/Learning Rate": 4.319652810975148e-05, "Pretrain/Loss": 2.0709385871887207, "Pretrain/Loss (Raw)": 2.0271105766296387, "Pretrain/Step": 2511, "Pretrain/Step Time": 8.49990115314722} +{"Pretrain/Learning Rate": 4.319070534602047e-05, "Pretrain/Loss": 2.0700230598449707, "Pretrain/Loss (Raw)": 2.1004116535186768, "Pretrain/Step": 2512, "Pretrain/Step Time": 8.495556252077222} +{"Pretrain/Learning Rate": 4.318488048445158e-05, "Pretrain/Loss": 2.0692267417907715, "Pretrain/Loss (Raw)": 2.0056769847869873, "Pretrain/Step": 2513, "Pretrain/Step Time": 8.498884662985802} +{"Pretrain/Learning Rate": 4.317905352571661e-05, "Pretrain/Loss": 2.0681772232055664, "Pretrain/Loss (Raw)": 2.0481250286102295, "Pretrain/Step": 2514, "Pretrain/Step Time": 8.507866863161325} +{"Pretrain/Learning Rate": 4.317322447048751e-05, "Pretrain/Loss": 2.070568084716797, "Pretrain/Loss (Raw)": 2.3046462535858154, "Pretrain/Step": 2515, "Pretrain/Step Time": 8.511839400976896} +{"Pretrain/Learning Rate": 4.316739331943653e-05, "Pretrain/Loss": 2.069226026535034, "Pretrain/Loss (Raw)": 2.1102585792541504, "Pretrain/Step": 2516, "Pretrain/Step Time": 8.512118162587285} +{"Pretrain/Learning Rate": 4.316156007323614e-05, "Pretrain/Loss": 2.073212146759033, "Pretrain/Loss (Raw)": 2.331210136413574, "Pretrain/Step": 2517, "Pretrain/Step Time": 8.509082632139325} +{"Pretrain/Learning Rate": 4.315572473255908e-05, "Pretrain/Loss": 2.071993589401245, "Pretrain/Loss (Raw)": 1.9702770709991455, "Pretrain/Step": 2518, "Pretrain/Step Time": 8.500875221565366} +{"Pretrain/Learning Rate": 4.3149887298078276e-05, "Pretrain/Loss": 2.072176933288574, "Pretrain/Loss (Raw)": 2.2105448246002197, "Pretrain/Step": 2519, "Pretrain/Step Time": 8.496809154748917} +{"Pretrain/Learning Rate": 4.314404777046694e-05, "Pretrain/Loss": 2.070610761642456, "Pretrain/Loss (Raw)": 2.051490306854248, "Pretrain/Step": 2520, "Pretrain/Step Time": 8.509367395192385} +{"Pretrain/Learning Rate": 4.313820615039853e-05, "Pretrain/Loss": 2.0701608657836914, "Pretrain/Loss (Raw)": 1.9611990451812744, "Pretrain/Step": 2521, "Pretrain/Step Time": 8.513332104310393} +{"Pretrain/Learning Rate": 4.313236243854671e-05, "Pretrain/Loss": 2.0677101612091064, "Pretrain/Loss (Raw)": 2.017855405807495, "Pretrain/Step": 2522, "Pretrain/Step Time": 8.514491254463792} +{"Pretrain/Learning Rate": 4.3126516635585414e-05, "Pretrain/Loss": 2.069380283355713, "Pretrain/Loss (Raw)": 2.318876028060913, "Pretrain/Step": 2523, "Pretrain/Step Time": 8.511753980070353} +{"Pretrain/Learning Rate": 4.312066874218881e-05, "Pretrain/Loss": 2.0688631534576416, "Pretrain/Loss (Raw)": 1.979126214981079, "Pretrain/Step": 2524, "Pretrain/Step Time": 8.505258105695248} +{"Pretrain/Learning Rate": 4.3114818759031284e-05, "Pretrain/Loss": 2.069025993347168, "Pretrain/Loss (Raw)": 2.101048469543457, "Pretrain/Step": 2525, "Pretrain/Step Time": 8.510524651035666} +{"Pretrain/Learning Rate": 4.310896668678751e-05, "Pretrain/Loss": 2.0645322799682617, "Pretrain/Loss (Raw)": 1.8989875316619873, "Pretrain/Step": 2526, "Pretrain/Step Time": 8.509269019588828} +{"Pretrain/Learning Rate": 4.3103112526132364e-05, "Pretrain/Loss": 2.064053535461426, "Pretrain/Loss (Raw)": 1.8627426624298096, "Pretrain/Step": 2527, "Pretrain/Step Time": 8.510100746527314} +{"Pretrain/Learning Rate": 4.3097256277740976e-05, "Pretrain/Loss": 2.066089153289795, "Pretrain/Loss (Raw)": 2.2670915126800537, "Pretrain/Step": 2528, "Pretrain/Step Time": 8.510585812851787} +{"Pretrain/Learning Rate": 4.309139794228871e-05, "Pretrain/Loss": 2.066579580307007, "Pretrain/Loss (Raw)": 2.203193426132202, "Pretrain/Step": 2529, "Pretrain/Step Time": 8.50119636207819} +{"Pretrain/Learning Rate": 4.3085537520451196e-05, "Pretrain/Loss": 2.0687255859375, "Pretrain/Loss (Raw)": 2.128432512283325, "Pretrain/Step": 2530, "Pretrain/Step Time": 8.499747207388282} +{"Pretrain/Learning Rate": 4.307967501290427e-05, "Pretrain/Loss": 2.06964111328125, "Pretrain/Loss (Raw)": 1.9322283267974854, "Pretrain/Step": 2531, "Pretrain/Step Time": 8.500435946509242} +{"Pretrain/Learning Rate": 4.307381042032402e-05, "Pretrain/Loss": 2.0688514709472656, "Pretrain/Loss (Raw)": 1.9083647727966309, "Pretrain/Step": 2532, "Pretrain/Step Time": 8.510578863322735} +{"Pretrain/Learning Rate": 4.3067943743386796e-05, "Pretrain/Loss": 2.0687291622161865, "Pretrain/Loss (Raw)": 1.9989399909973145, "Pretrain/Step": 2533, "Pretrain/Step Time": 8.510113703086972} +{"Pretrain/Learning Rate": 4.3062074982769155e-05, "Pretrain/Loss": 2.0680313110351562, "Pretrain/Loss (Raw)": 2.0893702507019043, "Pretrain/Step": 2534, "Pretrain/Step Time": 8.514095932245255} +{"Pretrain/Learning Rate": 4.305620413914792e-05, "Pretrain/Loss": 2.0679848194122314, "Pretrain/Loss (Raw)": 2.0168163776397705, "Pretrain/Step": 2535, "Pretrain/Step Time": 8.510045114904642} +{"Pretrain/Learning Rate": 4.305033121320013e-05, "Pretrain/Loss": 2.0692968368530273, "Pretrain/Loss (Raw)": 2.197794198989868, "Pretrain/Step": 2536, "Pretrain/Step Time": 8.49690948240459} +{"Pretrain/Learning Rate": 4.30444562056031e-05, "Pretrain/Loss": 2.0684056282043457, "Pretrain/Loss (Raw)": 1.9329888820648193, "Pretrain/Step": 2537, "Pretrain/Step Time": 8.49739002622664} +{"Pretrain/Learning Rate": 4.3038579117034347e-05, "Pretrain/Loss": 2.0666017532348633, "Pretrain/Loss (Raw)": 2.0108447074890137, "Pretrain/Step": 2538, "Pretrain/Step Time": 8.499156912788749} +{"Pretrain/Learning Rate": 4.303269994817165e-05, "Pretrain/Loss": 2.06400728225708, "Pretrain/Loss (Raw)": 1.8854761123657227, "Pretrain/Step": 2539, "Pretrain/Step Time": 8.51177965849638} +{"Pretrain/Learning Rate": 4.302681869969302e-05, "Pretrain/Loss": 2.0650951862335205, "Pretrain/Loss (Raw)": 2.3146538734436035, "Pretrain/Step": 2540, "Pretrain/Step Time": 8.510340888053179} +{"Pretrain/Learning Rate": 4.3020935372276716e-05, "Pretrain/Loss": 2.0660369396209717, "Pretrain/Loss (Raw)": 1.9863523244857788, "Pretrain/Step": 2541, "Pretrain/Step Time": 8.510562416166067} +{"Pretrain/Learning Rate": 4.3015049966601224e-05, "Pretrain/Loss": 2.066178798675537, "Pretrain/Loss (Raw)": 2.037656545639038, "Pretrain/Step": 2542, "Pretrain/Step Time": 8.50327561609447} +{"Pretrain/Learning Rate": 4.3009162483345275e-05, "Pretrain/Loss": 2.0661909580230713, "Pretrain/Loss (Raw)": 2.1450743675231934, "Pretrain/Step": 2543, "Pretrain/Step Time": 8.4998864158988} +{"Pretrain/Learning Rate": 4.300327292318786e-05, "Pretrain/Loss": 2.0652594566345215, "Pretrain/Loss (Raw)": 2.0370988845825195, "Pretrain/Step": 2544, "Pretrain/Step Time": 8.50562265701592} +{"Pretrain/Learning Rate": 4.299738128680817e-05, "Pretrain/Loss": 2.0652530193328857, "Pretrain/Loss (Raw)": 2.0087640285491943, "Pretrain/Step": 2545, "Pretrain/Step Time": 8.512614008039236} +{"Pretrain/Learning Rate": 4.299148757488567e-05, "Pretrain/Loss": 2.0650041103363037, "Pretrain/Loss (Raw)": 1.9586577415466309, "Pretrain/Step": 2546, "Pretrain/Step Time": 8.5132070556283} +{"Pretrain/Learning Rate": 4.298559178810003e-05, "Pretrain/Loss": 2.063769817352295, "Pretrain/Loss (Raw)": 1.975254774093628, "Pretrain/Step": 2547, "Pretrain/Step Time": 8.505054714158177} +{"Pretrain/Learning Rate": 4.297969392713121e-05, "Pretrain/Loss": 2.064605951309204, "Pretrain/Loss (Raw)": 2.2564070224761963, "Pretrain/Step": 2548, "Pretrain/Step Time": 8.503311423584819} +{"Pretrain/Learning Rate": 4.297379399265935e-05, "Pretrain/Loss": 2.0646145343780518, "Pretrain/Loss (Raw)": 2.167299747467041, "Pretrain/Step": 2549, "Pretrain/Step Time": 8.502122178673744} +{"Pretrain/Learning Rate": 4.296789198536488e-05, "Pretrain/Loss": 2.0635979175567627, "Pretrain/Loss (Raw)": 2.119565486907959, "Pretrain/Step": 2550, "Pretrain/Step Time": 8.512297596782446} +{"Pretrain/Learning Rate": 4.296198790592843e-05, "Pretrain/Loss": 2.0630500316619873, "Pretrain/Loss (Raw)": 2.093432903289795, "Pretrain/Step": 2551, "Pretrain/Step Time": 8.519552446901798} +{"Pretrain/Learning Rate": 4.295608175503091e-05, "Pretrain/Loss": 2.0658764839172363, "Pretrain/Loss (Raw)": 2.4667930603027344, "Pretrain/Step": 2552, "Pretrain/Step Time": 8.514561032876372} +{"Pretrain/Learning Rate": 4.295017353335342e-05, "Pretrain/Loss": 2.0648674964904785, "Pretrain/Loss (Raw)": 1.8891977071762085, "Pretrain/Step": 2553, "Pretrain/Step Time": 8.509788639843464} +{"Pretrain/Learning Rate": 4.2944263241577334e-05, "Pretrain/Loss": 2.0643858909606934, "Pretrain/Loss (Raw)": 1.8600993156433105, "Pretrain/Step": 2554, "Pretrain/Step Time": 8.511493934318423} +{"Pretrain/Learning Rate": 4.293835088038425e-05, "Pretrain/Loss": 2.0636825561523438, "Pretrain/Loss (Raw)": 1.9445005655288696, "Pretrain/Step": 2555, "Pretrain/Step Time": 8.512646675109863} +{"Pretrain/Learning Rate": 4.2932436450456025e-05, "Pretrain/Loss": 2.0637664794921875, "Pretrain/Loss (Raw)": 2.11464262008667, "Pretrain/Step": 2556, "Pretrain/Step Time": 8.507840666919947} +{"Pretrain/Learning Rate": 4.292651995247472e-05, "Pretrain/Loss": 2.0618896484375, "Pretrain/Loss (Raw)": 1.9105329513549805, "Pretrain/Step": 2557, "Pretrain/Step Time": 8.515189135447145} +{"Pretrain/Learning Rate": 4.292060138712266e-05, "Pretrain/Loss": 2.0633444786071777, "Pretrain/Loss (Raw)": 2.14886736869812, "Pretrain/Step": 2558, "Pretrain/Step Time": 8.517624646425247} +{"Pretrain/Learning Rate": 4.2914680755082414e-05, "Pretrain/Loss": 2.0643181800842285, "Pretrain/Loss (Raw)": 2.1796629428863525, "Pretrain/Step": 2559, "Pretrain/Step Time": 8.506778363138437} +{"Pretrain/Learning Rate": 4.2908758057036756e-05, "Pretrain/Loss": 2.0633602142333984, "Pretrain/Loss (Raw)": 2.0861423015594482, "Pretrain/Step": 2560, "Pretrain/Step Time": 8.505291508510709} +{"Pretrain/Learning Rate": 4.2902833293668744e-05, "Pretrain/Loss": 2.0624213218688965, "Pretrain/Loss (Raw)": 1.925107479095459, "Pretrain/Step": 2561, "Pretrain/Step Time": 8.509718023240566} +{"Pretrain/Learning Rate": 4.2896906465661623e-05, "Pretrain/Loss": 2.0654804706573486, "Pretrain/Loss (Raw)": 2.437922239303589, "Pretrain/Step": 2562, "Pretrain/Step Time": 8.516701681539416} +{"Pretrain/Learning Rate": 4.289097757369892e-05, "Pretrain/Loss": 2.065621852874756, "Pretrain/Loss (Raw)": 2.0586206912994385, "Pretrain/Step": 2563, "Pretrain/Step Time": 8.518246049061418} +{"Pretrain/Learning Rate": 4.288504661846437e-05, "Pretrain/Loss": 2.0668368339538574, "Pretrain/Loss (Raw)": 1.9687615633010864, "Pretrain/Step": 2564, "Pretrain/Step Time": 8.519210176542401} +{"Pretrain/Learning Rate": 4.2879113600641976e-05, "Pretrain/Loss": 2.0665245056152344, "Pretrain/Loss (Raw)": 2.014693021774292, "Pretrain/Step": 2565, "Pretrain/Step Time": 8.512502348050475} +{"Pretrain/Learning Rate": 4.287317852091595e-05, "Pretrain/Loss": 2.0660147666931152, "Pretrain/Loss (Raw)": 2.040959358215332, "Pretrain/Step": 2566, "Pretrain/Step Time": 8.508234338834882} +{"Pretrain/Learning Rate": 4.2867241379970754e-05, "Pretrain/Loss": 2.0661613941192627, "Pretrain/Loss (Raw)": 2.058893918991089, "Pretrain/Step": 2567, "Pretrain/Step Time": 8.504587009549141} +{"Pretrain/Learning Rate": 4.2861302178491094e-05, "Pretrain/Loss": 2.0687737464904785, "Pretrain/Loss (Raw)": 2.2433204650878906, "Pretrain/Step": 2568, "Pretrain/Step Time": 8.512527648359537} +{"Pretrain/Learning Rate": 4.28553609171619e-05, "Pretrain/Loss": 2.0698604583740234, "Pretrain/Loss (Raw)": 2.1545937061309814, "Pretrain/Step": 2569, "Pretrain/Step Time": 8.517526535317302} +{"Pretrain/Learning Rate": 4.284941759666835e-05, "Pretrain/Loss": 2.070436477661133, "Pretrain/Loss (Raw)": 1.9873906373977661, "Pretrain/Step": 2570, "Pretrain/Step Time": 8.511069413274527} +{"Pretrain/Learning Rate": 4.2843472217695844e-05, "Pretrain/Loss": 2.0738887786865234, "Pretrain/Loss (Raw)": 2.194216728210449, "Pretrain/Step": 2571, "Pretrain/Step Time": 8.50313837453723} +{"Pretrain/Learning Rate": 4.283752478093005e-05, "Pretrain/Loss": 2.0726757049560547, "Pretrain/Loss (Raw)": 2.0340383052825928, "Pretrain/Step": 2572, "Pretrain/Step Time": 8.50217261724174} +{"Pretrain/Learning Rate": 4.283157528705683e-05, "Pretrain/Loss": 2.0705080032348633, "Pretrain/Loss (Raw)": 1.8326431512832642, "Pretrain/Step": 2573, "Pretrain/Step Time": 8.510216852650046} +{"Pretrain/Learning Rate": 4.2825623736762344e-05, "Pretrain/Loss": 2.0705766677856445, "Pretrain/Loss (Raw)": 2.102064371109009, "Pretrain/Step": 2574, "Pretrain/Step Time": 8.514318566769361} +{"Pretrain/Learning Rate": 4.2819670130732926e-05, "Pretrain/Loss": 2.0704054832458496, "Pretrain/Loss (Raw)": 2.0382134914398193, "Pretrain/Step": 2575, "Pretrain/Step Time": 8.513667583465576} +{"Pretrain/Learning Rate": 4.2813714469655176e-05, "Pretrain/Loss": 2.071462631225586, "Pretrain/Loss (Raw)": 2.2281172275543213, "Pretrain/Step": 2576, "Pretrain/Step Time": 8.512463485822082} +{"Pretrain/Learning Rate": 4.280775675421593e-05, "Pretrain/Loss": 2.0742292404174805, "Pretrain/Loss (Raw)": 2.251232624053955, "Pretrain/Step": 2577, "Pretrain/Step Time": 8.5075325332582} +{"Pretrain/Learning Rate": 4.280179698510226e-05, "Pretrain/Loss": 2.0741357803344727, "Pretrain/Loss (Raw)": 2.1225099563598633, "Pretrain/Step": 2578, "Pretrain/Step Time": 8.507247941568494} +{"Pretrain/Learning Rate": 4.279583516300148e-05, "Pretrain/Loss": 2.0747551918029785, "Pretrain/Loss (Raw)": 2.020967960357666, "Pretrain/Step": 2579, "Pretrain/Step Time": 8.511427717283368} +{"Pretrain/Learning Rate": 4.2789871288601136e-05, "Pretrain/Loss": 2.072742462158203, "Pretrain/Loss (Raw)": 1.8954282999038696, "Pretrain/Step": 2580, "Pretrain/Step Time": 8.515029337257147} +{"Pretrain/Learning Rate": 4.2783905362589e-05, "Pretrain/Loss": 2.0728440284729004, "Pretrain/Loss (Raw)": 2.0688936710357666, "Pretrain/Step": 2581, "Pretrain/Step Time": 8.519408240914345} +{"Pretrain/Learning Rate": 4.27779373856531e-05, "Pretrain/Loss": 2.0741119384765625, "Pretrain/Loss (Raw)": 2.116161346435547, "Pretrain/Step": 2582, "Pretrain/Step Time": 8.523388845846057} +{"Pretrain/Learning Rate": 4.277196735848169e-05, "Pretrain/Loss": 2.0736324787139893, "Pretrain/Loss (Raw)": 2.120453119277954, "Pretrain/Step": 2583, "Pretrain/Step Time": 8.52166086435318} +{"Pretrain/Learning Rate": 4.2765995281763263e-05, "Pretrain/Loss": 2.073641300201416, "Pretrain/Loss (Raw)": 2.0726091861724854, "Pretrain/Step": 2584, "Pretrain/Step Time": 8.51639032177627} +{"Pretrain/Learning Rate": 4.2760021156186534e-05, "Pretrain/Loss": 2.0711166858673096, "Pretrain/Loss (Raw)": 1.937225341796875, "Pretrain/Step": 2585, "Pretrain/Step Time": 8.512585723772645} +{"Pretrain/Learning Rate": 4.2754044982440486e-05, "Pretrain/Loss": 2.0712063312530518, "Pretrain/Loss (Raw)": 2.15431809425354, "Pretrain/Step": 2586, "Pretrain/Step Time": 8.515368705615401} +{"Pretrain/Learning Rate": 4.2748066761214305e-05, "Pretrain/Loss": 2.0724072456359863, "Pretrain/Loss (Raw)": 2.0484118461608887, "Pretrain/Step": 2587, "Pretrain/Step Time": 8.514270002022386} +{"Pretrain/Learning Rate": 4.274208649319744e-05, "Pretrain/Loss": 2.0747313499450684, "Pretrain/Loss (Raw)": 2.256396532058716, "Pretrain/Step": 2588, "Pretrain/Step Time": 8.517708441242576} +{"Pretrain/Learning Rate": 4.273610417907955e-05, "Pretrain/Loss": 2.073251724243164, "Pretrain/Loss (Raw)": 2.0196988582611084, "Pretrain/Step": 2589, "Pretrain/Step Time": 8.507722890004516} +{"Pretrain/Learning Rate": 4.2730119819550555e-05, "Pretrain/Loss": 2.071348190307617, "Pretrain/Loss (Raw)": 1.9514297246932983, "Pretrain/Step": 2590, "Pretrain/Step Time": 8.511632207781076} +{"Pretrain/Learning Rate": 4.2724133415300596e-05, "Pretrain/Loss": 2.0718860626220703, "Pretrain/Loss (Raw)": 2.13989520072937, "Pretrain/Step": 2591, "Pretrain/Step Time": 8.512156495824456} +{"Pretrain/Learning Rate": 4.271814496702005e-05, "Pretrain/Loss": 2.068951368331909, "Pretrain/Loss (Raw)": 1.9817835092544556, "Pretrain/Step": 2592, "Pretrain/Step Time": 8.514204604551196} +{"Pretrain/Learning Rate": 4.2712154475399534e-05, "Pretrain/Loss": 2.069693088531494, "Pretrain/Loss (Raw)": 2.2535548210144043, "Pretrain/Step": 2593, "Pretrain/Step Time": 8.513360572978854} +{"Pretrain/Learning Rate": 4.2706161941129906e-05, "Pretrain/Loss": 2.0709757804870605, "Pretrain/Loss (Raw)": 2.265280246734619, "Pretrain/Step": 2594, "Pretrain/Step Time": 8.50561086460948} +{"Pretrain/Learning Rate": 4.270016736490225e-05, "Pretrain/Loss": 2.069650650024414, "Pretrain/Loss (Raw)": 1.7999306917190552, "Pretrain/Step": 2595, "Pretrain/Step Time": 8.503883928060532} +{"Pretrain/Learning Rate": 4.2694170747407886e-05, "Pretrain/Loss": 2.069350481033325, "Pretrain/Loss (Raw)": 2.079944372177124, "Pretrain/Step": 2596, "Pretrain/Step Time": 8.505440974608064} +{"Pretrain/Learning Rate": 4.268817208933837e-05, "Pretrain/Loss": 2.0695080757141113, "Pretrain/Loss (Raw)": 2.069580078125, "Pretrain/Step": 2597, "Pretrain/Step Time": 8.509901138022542} +{"Pretrain/Learning Rate": 4.268217139138551e-05, "Pretrain/Loss": 2.070817708969116, "Pretrain/Loss (Raw)": 2.3110663890838623, "Pretrain/Step": 2598, "Pretrain/Step Time": 8.5098508708179} +{"Pretrain/Learning Rate": 4.267616865424131e-05, "Pretrain/Loss": 2.0708022117614746, "Pretrain/Loss (Raw)": 2.208531618118286, "Pretrain/Step": 2599, "Pretrain/Step Time": 8.512349713593721} +{"Pretrain/Learning Rate": 4.267016387859806e-05, "Pretrain/Loss": 2.0656304359436035, "Pretrain/Loss (Raw)": 1.9176145792007446, "Pretrain/Step": 2600, "Pretrain/Step Time": 8.509476756677032} +{"Pretrain/Learning Rate": 4.266415706514824e-05, "Pretrain/Loss": 2.0636234283447266, "Pretrain/Loss (Raw)": 1.8750215768814087, "Pretrain/Step": 2601, "Pretrain/Step Time": 8.498891172930598} +{"Pretrain/Learning Rate": 4.2658148214584585e-05, "Pretrain/Loss": 2.0646557807922363, "Pretrain/Loss (Raw)": 2.013726234436035, "Pretrain/Step": 2602, "Pretrain/Step Time": 8.499113965779543} +{"Pretrain/Learning Rate": 4.265213732760008e-05, "Pretrain/Loss": 2.06449031829834, "Pretrain/Loss (Raw)": 2.2084479331970215, "Pretrain/Step": 2603, "Pretrain/Step Time": 8.510625902563334} +{"Pretrain/Learning Rate": 4.264612440488791e-05, "Pretrain/Loss": 2.063680648803711, "Pretrain/Loss (Raw)": 2.031904697418213, "Pretrain/Step": 2604, "Pretrain/Step Time": 8.509832294657826} +{"Pretrain/Learning Rate": 4.264010944714153e-05, "Pretrain/Loss": 2.063710927963257, "Pretrain/Loss (Raw)": 1.993314266204834, "Pretrain/Step": 2605, "Pretrain/Step Time": 8.510349422693253} +{"Pretrain/Learning Rate": 4.263409245505461e-05, "Pretrain/Loss": 2.0633411407470703, "Pretrain/Loss (Raw)": 2.0400118827819824, "Pretrain/Step": 2606, "Pretrain/Step Time": 8.504594411700964} +{"Pretrain/Learning Rate": 4.262807342932105e-05, "Pretrain/Loss": 2.062868118286133, "Pretrain/Loss (Raw)": 1.964307188987732, "Pretrain/Step": 2607, "Pretrain/Step Time": 8.502876482903957} +{"Pretrain/Learning Rate": 4.262205237063499e-05, "Pretrain/Loss": 2.0640292167663574, "Pretrain/Loss (Raw)": 2.1850621700286865, "Pretrain/Step": 2608, "Pretrain/Step Time": 8.50971239246428} +{"Pretrain/Learning Rate": 4.2616029279690814e-05, "Pretrain/Loss": 2.0645980834960938, "Pretrain/Loss (Raw)": 2.0427002906799316, "Pretrain/Step": 2609, "Pretrain/Step Time": 8.509671838954091} +{"Pretrain/Learning Rate": 4.261000415718312e-05, "Pretrain/Loss": 2.0626471042633057, "Pretrain/Loss (Raw)": 1.9224896430969238, "Pretrain/Step": 2610, "Pretrain/Step Time": 8.509688900783658} +{"Pretrain/Learning Rate": 4.260397700380679e-05, "Pretrain/Loss": 2.061245918273926, "Pretrain/Loss (Raw)": 1.9370428323745728, "Pretrain/Step": 2611, "Pretrain/Step Time": 8.514105951413512} +{"Pretrain/Learning Rate": 4.259794782025687e-05, "Pretrain/Loss": 2.061882972717285, "Pretrain/Loss (Raw)": 2.024409055709839, "Pretrain/Step": 2612, "Pretrain/Step Time": 8.505494631826878} +{"Pretrain/Learning Rate": 4.2591916607228675e-05, "Pretrain/Loss": 2.063086986541748, "Pretrain/Loss (Raw)": 2.088029384613037, "Pretrain/Step": 2613, "Pretrain/Step Time": 8.505394307896495} +{"Pretrain/Learning Rate": 4.2585883365417774e-05, "Pretrain/Loss": 2.0686612129211426, "Pretrain/Loss (Raw)": 2.2106261253356934, "Pretrain/Step": 2614, "Pretrain/Step Time": 8.508694358170033} +{"Pretrain/Learning Rate": 4.2579848095519926e-05, "Pretrain/Loss": 2.064763069152832, "Pretrain/Loss (Raw)": 1.8334009647369385, "Pretrain/Step": 2615, "Pretrain/Step Time": 8.51747046597302} +{"Pretrain/Learning Rate": 4.257381079823116e-05, "Pretrain/Loss": 2.0647778511047363, "Pretrain/Loss (Raw)": 1.9526913166046143, "Pretrain/Step": 2616, "Pretrain/Step Time": 8.513056114315987} +{"Pretrain/Learning Rate": 4.2567771474247726e-05, "Pretrain/Loss": 2.06494140625, "Pretrain/Loss (Raw)": 2.0002973079681396, "Pretrain/Step": 2617, "Pretrain/Step Time": 8.513010712340474} +{"Pretrain/Learning Rate": 4.2561730124266094e-05, "Pretrain/Loss": 2.0635011196136475, "Pretrain/Loss (Raw)": 2.1623923778533936, "Pretrain/Step": 2618, "Pretrain/Step Time": 8.508365366607904} +{"Pretrain/Learning Rate": 4.255568674898301e-05, "Pretrain/Loss": 2.063558578491211, "Pretrain/Loss (Raw)": 2.104445219039917, "Pretrain/Step": 2619, "Pretrain/Step Time": 8.50302636437118} +{"Pretrain/Learning Rate": 4.254964134909538e-05, "Pretrain/Loss": 2.063055992126465, "Pretrain/Loss (Raw)": 1.9260127544403076, "Pretrain/Step": 2620, "Pretrain/Step Time": 8.505099119618535} +{"Pretrain/Learning Rate": 4.254359392530043e-05, "Pretrain/Loss": 2.0629658699035645, "Pretrain/Loss (Raw)": 2.0844218730926514, "Pretrain/Step": 2621, "Pretrain/Step Time": 8.509913921356201} +{"Pretrain/Learning Rate": 4.2537544478295556e-05, "Pretrain/Loss": 2.066725730895996, "Pretrain/Loss (Raw)": 1.9560354948043823, "Pretrain/Step": 2622, "Pretrain/Step Time": 8.508025705814362} +{"Pretrain/Learning Rate": 4.253149300877841e-05, "Pretrain/Loss": 2.0673766136169434, "Pretrain/Loss (Raw)": 2.0336039066314697, "Pretrain/Step": 2623, "Pretrain/Step Time": 8.509042674675584} +{"Pretrain/Learning Rate": 4.252543951744688e-05, "Pretrain/Loss": 2.0665340423583984, "Pretrain/Loss (Raw)": 2.004734516143799, "Pretrain/Step": 2624, "Pretrain/Step Time": 8.497029168531299} +{"Pretrain/Learning Rate": 4.251938400499909e-05, "Pretrain/Loss": 2.066490650177002, "Pretrain/Loss (Raw)": 2.0973050594329834, "Pretrain/Step": 2625, "Pretrain/Step Time": 8.497139137238264} +{"Pretrain/Learning Rate": 4.251332647213337e-05, "Pretrain/Loss": 2.0671143531799316, "Pretrain/Loss (Raw)": 2.099308729171753, "Pretrain/Step": 2626, "Pretrain/Step Time": 8.506931401789188} +{"Pretrain/Learning Rate": 4.250726691954832e-05, "Pretrain/Loss": 2.066866636276245, "Pretrain/Loss (Raw)": 2.0737884044647217, "Pretrain/Step": 2627, "Pretrain/Step Time": 8.510696806013584} +{"Pretrain/Learning Rate": 4.250120534794275e-05, "Pretrain/Loss": 2.0671682357788086, "Pretrain/Loss (Raw)": 1.9304085969924927, "Pretrain/Step": 2628, "Pretrain/Step Time": 8.514026207849383} +{"Pretrain/Learning Rate": 4.249514175801572e-05, "Pretrain/Loss": 2.0673577785491943, "Pretrain/Loss (Raw)": 2.083218812942505, "Pretrain/Step": 2629, "Pretrain/Step Time": 8.510515319183469} +{"Pretrain/Learning Rate": 4.248907615046649e-05, "Pretrain/Loss": 2.06886625289917, "Pretrain/Loss (Raw)": 2.110933542251587, "Pretrain/Step": 2630, "Pretrain/Step Time": 8.506288394331932} +{"Pretrain/Learning Rate": 4.24830085259946e-05, "Pretrain/Loss": 2.0705509185791016, "Pretrain/Loss (Raw)": 2.2079625129699707, "Pretrain/Step": 2631, "Pretrain/Step Time": 8.504227198660374} +{"Pretrain/Learning Rate": 4.247693888529978e-05, "Pretrain/Loss": 2.0701372623443604, "Pretrain/Loss (Raw)": 2.0153374671936035, "Pretrain/Step": 2632, "Pretrain/Step Time": 8.506139818578959} +{"Pretrain/Learning Rate": 4.247086722908201e-05, "Pretrain/Loss": 2.0687456130981445, "Pretrain/Loss (Raw)": 1.7627992630004883, "Pretrain/Step": 2633, "Pretrain/Step Time": 8.513393972069025} +{"Pretrain/Learning Rate": 4.24647935580415e-05, "Pretrain/Loss": 2.0658397674560547, "Pretrain/Loss (Raw)": 2.0419068336486816, "Pretrain/Step": 2634, "Pretrain/Step Time": 8.516966674476862} +{"Pretrain/Learning Rate": 4.2458717872878715e-05, "Pretrain/Loss": 2.067143678665161, "Pretrain/Loss (Raw)": 2.1832096576690674, "Pretrain/Step": 2635, "Pretrain/Step Time": 8.515009999275208} +{"Pretrain/Learning Rate": 4.245264017429431e-05, "Pretrain/Loss": 2.063876152038574, "Pretrain/Loss (Raw)": 1.8849444389343262, "Pretrain/Step": 2636, "Pretrain/Step Time": 8.50432014837861} +{"Pretrain/Learning Rate": 4.2446560462989203e-05, "Pretrain/Loss": 2.063401222229004, "Pretrain/Loss (Raw)": 2.0522658824920654, "Pretrain/Step": 2637, "Pretrain/Step Time": 8.503000440075994} +{"Pretrain/Learning Rate": 4.244047873966452e-05, "Pretrain/Loss": 2.063244104385376, "Pretrain/Loss (Raw)": 2.0024592876434326, "Pretrain/Step": 2638, "Pretrain/Step Time": 8.512142421677709} +{"Pretrain/Learning Rate": 4.2434395005021666e-05, "Pretrain/Loss": 2.0634496212005615, "Pretrain/Loss (Raw)": 2.0534276962280273, "Pretrain/Step": 2639, "Pretrain/Step Time": 8.516873382031918} +{"Pretrain/Learning Rate": 4.242830925976221e-05, "Pretrain/Loss": 2.063838243484497, "Pretrain/Loss (Raw)": 2.150146484375, "Pretrain/Step": 2640, "Pretrain/Step Time": 8.516802106052637} +{"Pretrain/Learning Rate": 4.2422221504588016e-05, "Pretrain/Loss": 2.065959930419922, "Pretrain/Loss (Raw)": 2.277252435684204, "Pretrain/Step": 2641, "Pretrain/Step Time": 8.510378809645772} +{"Pretrain/Learning Rate": 4.2416131740201134e-05, "Pretrain/Loss": 2.068830966949463, "Pretrain/Loss (Raw)": 2.4156227111816406, "Pretrain/Step": 2642, "Pretrain/Step Time": 8.498954391106963} +{"Pretrain/Learning Rate": 4.241003996730388e-05, "Pretrain/Loss": 2.067004680633545, "Pretrain/Loss (Raw)": 2.070892095565796, "Pretrain/Step": 2643, "Pretrain/Step Time": 8.496574867516756} +{"Pretrain/Learning Rate": 4.240394618659878e-05, "Pretrain/Loss": 2.0675623416900635, "Pretrain/Loss (Raw)": 2.1816189289093018, "Pretrain/Step": 2644, "Pretrain/Step Time": 8.50287632085383} +{"Pretrain/Learning Rate": 4.2397850398788586e-05, "Pretrain/Loss": 2.065767765045166, "Pretrain/Loss (Raw)": 2.1015169620513916, "Pretrain/Step": 2645, "Pretrain/Step Time": 8.506782155483961} +{"Pretrain/Learning Rate": 4.239175260457631e-05, "Pretrain/Loss": 2.06732439994812, "Pretrain/Loss (Raw)": 2.1695165634155273, "Pretrain/Step": 2646, "Pretrain/Step Time": 8.51012628339231} +{"Pretrain/Learning Rate": 4.2385652804665164e-05, "Pretrain/Loss": 2.065152168273926, "Pretrain/Loss (Raw)": 1.9324923753738403, "Pretrain/Step": 2647, "Pretrain/Step Time": 8.513330167159438} +{"Pretrain/Learning Rate": 4.237955099975862e-05, "Pretrain/Loss": 2.064016103744507, "Pretrain/Loss (Raw)": 1.906083345413208, "Pretrain/Step": 2648, "Pretrain/Step Time": 8.502698602154851} +{"Pretrain/Learning Rate": 4.237344719056035e-05, "Pretrain/Loss": 2.0643811225891113, "Pretrain/Loss (Raw)": 2.007899761199951, "Pretrain/Step": 2649, "Pretrain/Step Time": 8.498719613999128} +{"Pretrain/Learning Rate": 4.236734137777429e-05, "Pretrain/Loss": 2.0647454261779785, "Pretrain/Loss (Raw)": 2.06451153755188, "Pretrain/Step": 2650, "Pretrain/Step Time": 8.502576515078545} +{"Pretrain/Learning Rate": 4.236123356210458e-05, "Pretrain/Loss": 2.063075304031372, "Pretrain/Loss (Raw)": 2.10510516166687, "Pretrain/Step": 2651, "Pretrain/Step Time": 8.51074549742043} +{"Pretrain/Learning Rate": 4.235512374425561e-05, "Pretrain/Loss": 2.063005208969116, "Pretrain/Loss (Raw)": 1.9701429605484009, "Pretrain/Step": 2652, "Pretrain/Step Time": 8.515990801155567} +{"Pretrain/Learning Rate": 4.234901192493199e-05, "Pretrain/Loss": 2.0622425079345703, "Pretrain/Loss (Raw)": 2.003446578979492, "Pretrain/Step": 2653, "Pretrain/Step Time": 8.507412943989038} +{"Pretrain/Learning Rate": 4.234289810483857e-05, "Pretrain/Loss": 2.0634522438049316, "Pretrain/Loss (Raw)": 2.0538206100463867, "Pretrain/Step": 2654, "Pretrain/Step Time": 8.500550096854568} +{"Pretrain/Learning Rate": 4.233678228468041e-05, "Pretrain/Loss": 2.067410469055176, "Pretrain/Loss (Raw)": 2.36940860748291, "Pretrain/Step": 2655, "Pretrain/Step Time": 8.50025332532823} +{"Pretrain/Learning Rate": 4.2330664465162826e-05, "Pretrain/Loss": 2.0662007331848145, "Pretrain/Loss (Raw)": 2.1122167110443115, "Pretrain/Step": 2656, "Pretrain/Step Time": 8.5133514162153} +{"Pretrain/Learning Rate": 4.232454464699135e-05, "Pretrain/Loss": 2.06494402885437, "Pretrain/Loss (Raw)": 2.042334794998169, "Pretrain/Step": 2657, "Pretrain/Step Time": 8.521064348518848} +{"Pretrain/Learning Rate": 4.231842283087175e-05, "Pretrain/Loss": 2.0642733573913574, "Pretrain/Loss (Raw)": 2.042621374130249, "Pretrain/Step": 2658, "Pretrain/Step Time": 8.525363905355334} +{"Pretrain/Learning Rate": 4.231229901751002e-05, "Pretrain/Loss": 2.0644822120666504, "Pretrain/Loss (Raw)": 1.958950400352478, "Pretrain/Step": 2659, "Pretrain/Step Time": 8.525040006265044} +{"Pretrain/Learning Rate": 4.2306173207612394e-05, "Pretrain/Loss": 2.067000150680542, "Pretrain/Loss (Raw)": 2.230637311935425, "Pretrain/Step": 2660, "Pretrain/Step Time": 8.513541454449296} +{"Pretrain/Learning Rate": 4.230004540188533e-05, "Pretrain/Loss": 2.0676109790802, "Pretrain/Loss (Raw)": 2.0771234035491943, "Pretrain/Step": 2661, "Pretrain/Step Time": 8.513531476259232} +{"Pretrain/Learning Rate": 4.22939156010355e-05, "Pretrain/Loss": 2.0683069229125977, "Pretrain/Loss (Raw)": 2.1784610748291016, "Pretrain/Step": 2662, "Pretrain/Step Time": 8.518422897905111} +{"Pretrain/Learning Rate": 4.2287783805769824e-05, "Pretrain/Loss": 2.068915367126465, "Pretrain/Loss (Raw)": 2.0946812629699707, "Pretrain/Step": 2663, "Pretrain/Step Time": 8.523986283689737} +{"Pretrain/Learning Rate": 4.2281650016795466e-05, "Pretrain/Loss": 2.0674469470977783, "Pretrain/Loss (Raw)": 2.0098440647125244, "Pretrain/Step": 2664, "Pretrain/Step Time": 8.526113472878933} +{"Pretrain/Learning Rate": 4.227551423481979e-05, "Pretrain/Loss": 2.068871021270752, "Pretrain/Loss (Raw)": 2.1152825355529785, "Pretrain/Step": 2665, "Pretrain/Step Time": 8.529220163822174} +{"Pretrain/Learning Rate": 4.2269376460550414e-05, "Pretrain/Loss": 2.0701863765716553, "Pretrain/Loss (Raw)": 2.1792187690734863, "Pretrain/Step": 2666, "Pretrain/Step Time": 8.524433929473162} +{"Pretrain/Learning Rate": 4.226323669469516e-05, "Pretrain/Loss": 2.071444034576416, "Pretrain/Loss (Raw)": 2.046450138092041, "Pretrain/Step": 2667, "Pretrain/Step Time": 8.515934899449348} +{"Pretrain/Learning Rate": 4.225709493796211e-05, "Pretrain/Loss": 2.0694429874420166, "Pretrain/Loss (Raw)": 2.0585124492645264, "Pretrain/Step": 2668, "Pretrain/Step Time": 8.519541142508388} +{"Pretrain/Learning Rate": 4.225095119105956e-05, "Pretrain/Loss": 2.0669350624084473, "Pretrain/Loss (Raw)": 1.66533362865448, "Pretrain/Step": 2669, "Pretrain/Step Time": 8.522271953523159} +{"Pretrain/Learning Rate": 4.224480545469603e-05, "Pretrain/Loss": 2.0667057037353516, "Pretrain/Loss (Raw)": 2.0082790851593018, "Pretrain/Step": 2670, "Pretrain/Step Time": 8.525407718494534} +{"Pretrain/Learning Rate": 4.223865772958026e-05, "Pretrain/Loss": 2.067295551300049, "Pretrain/Loss (Raw)": 2.220615863800049, "Pretrain/Step": 2671, "Pretrain/Step Time": 8.520413836464286} +{"Pretrain/Learning Rate": 4.223250801642126e-05, "Pretrain/Loss": 2.0678014755249023, "Pretrain/Loss (Raw)": 2.1018474102020264, "Pretrain/Step": 2672, "Pretrain/Step Time": 8.519443720579147} +{"Pretrain/Learning Rate": 4.222635631592823e-05, "Pretrain/Loss": 2.0685975551605225, "Pretrain/Loss (Raw)": 2.1106550693511963, "Pretrain/Step": 2673, "Pretrain/Step Time": 8.515606852248311} +{"Pretrain/Learning Rate": 4.2220202628810614e-05, "Pretrain/Loss": 2.0697455406188965, "Pretrain/Loss (Raw)": 2.105605125427246, "Pretrain/Step": 2674, "Pretrain/Step Time": 8.522392181679606} +{"Pretrain/Learning Rate": 4.2214046955778085e-05, "Pretrain/Loss": 2.0717103481292725, "Pretrain/Loss (Raw)": 2.226745367050171, "Pretrain/Step": 2675, "Pretrain/Step Time": 8.523928066715598} +{"Pretrain/Learning Rate": 4.2207889297540546e-05, "Pretrain/Loss": 2.0704383850097656, "Pretrain/Loss (Raw)": 2.0935919284820557, "Pretrain/Step": 2676, "Pretrain/Step Time": 8.5263865981251} +{"Pretrain/Learning Rate": 4.2201729654808136e-05, "Pretrain/Loss": 2.0705666542053223, "Pretrain/Loss (Raw)": 2.183704137802124, "Pretrain/Step": 2677, "Pretrain/Step Time": 8.522241916507483} +{"Pretrain/Learning Rate": 4.21955680282912e-05, "Pretrain/Loss": 2.0700740814208984, "Pretrain/Loss (Raw)": 2.056546211242676, "Pretrain/Step": 2678, "Pretrain/Step Time": 8.513728713616729} +{"Pretrain/Learning Rate": 4.218940441870033e-05, "Pretrain/Loss": 2.069894313812256, "Pretrain/Loss (Raw)": 2.0704264640808105, "Pretrain/Step": 2679, "Pretrain/Step Time": 8.508389035239816} +{"Pretrain/Learning Rate": 4.218323882674634e-05, "Pretrain/Loss": 2.0670313835144043, "Pretrain/Loss (Raw)": 2.100308895111084, "Pretrain/Step": 2680, "Pretrain/Step Time": 8.518989661708474} +{"Pretrain/Learning Rate": 4.217707125314029e-05, "Pretrain/Loss": 2.0680675506591797, "Pretrain/Loss (Raw)": 2.021829128265381, "Pretrain/Step": 2681, "Pretrain/Step Time": 8.518539791926742} +{"Pretrain/Learning Rate": 4.217090169859343e-05, "Pretrain/Loss": 2.071878433227539, "Pretrain/Loss (Raw)": 2.347907543182373, "Pretrain/Step": 2682, "Pretrain/Step Time": 8.515145976096392} +{"Pretrain/Learning Rate": 4.216473016381728e-05, "Pretrain/Loss": 2.0738260746002197, "Pretrain/Loss (Raw)": 2.1937992572784424, "Pretrain/Step": 2683, "Pretrain/Step Time": 8.516224743798375} +{"Pretrain/Learning Rate": 4.215855664952356e-05, "Pretrain/Loss": 2.0740199089050293, "Pretrain/Loss (Raw)": 2.13946795463562, "Pretrain/Step": 2684, "Pretrain/Step Time": 8.51940925233066} +{"Pretrain/Learning Rate": 4.215238115642424e-05, "Pretrain/Loss": 2.075279474258423, "Pretrain/Loss (Raw)": 2.0717246532440186, "Pretrain/Step": 2685, "Pretrain/Step Time": 8.51398279890418} +{"Pretrain/Learning Rate": 4.2146203685231495e-05, "Pretrain/Loss": 2.074610471725464, "Pretrain/Loss (Raw)": 2.0632481575012207, "Pretrain/Step": 2686, "Pretrain/Step Time": 8.518855173140764} +{"Pretrain/Learning Rate": 4.214002423665775e-05, "Pretrain/Loss": 2.074507713317871, "Pretrain/Loss (Raw)": 2.1665334701538086, "Pretrain/Step": 2687, "Pretrain/Step Time": 8.51685786806047} +{"Pretrain/Learning Rate": 4.213384281141563e-05, "Pretrain/Loss": 2.074521541595459, "Pretrain/Loss (Raw)": 2.087912082672119, "Pretrain/Step": 2688, "Pretrain/Step Time": 8.518304893746972} +{"Pretrain/Learning Rate": 4.212765941021804e-05, "Pretrain/Loss": 2.076545238494873, "Pretrain/Loss (Raw)": 2.1841037273406982, "Pretrain/Step": 2689, "Pretrain/Step Time": 8.512750588357449} +{"Pretrain/Learning Rate": 4.212147403377805e-05, "Pretrain/Loss": 2.074643135070801, "Pretrain/Loss (Raw)": 2.1944689750671387, "Pretrain/Step": 2690, "Pretrain/Step Time": 8.508577361702919} +{"Pretrain/Learning Rate": 4.2115286682808995e-05, "Pretrain/Loss": 2.0750980377197266, "Pretrain/Loss (Raw)": 2.1168508529663086, "Pretrain/Step": 2691, "Pretrain/Step Time": 8.517758635804057} +{"Pretrain/Learning Rate": 4.210909735802442e-05, "Pretrain/Loss": 2.0743839740753174, "Pretrain/Loss (Raw)": 1.8773529529571533, "Pretrain/Step": 2692, "Pretrain/Step Time": 8.513000743463635} +{"Pretrain/Learning Rate": 4.210290606013812e-05, "Pretrain/Loss": 2.0749258995056152, "Pretrain/Loss (Raw)": 2.084083080291748, "Pretrain/Step": 2693, "Pretrain/Step Time": 8.512268235906959} +{"Pretrain/Learning Rate": 4.209671278986412e-05, "Pretrain/Loss": 2.0740723609924316, "Pretrain/Loss (Raw)": 1.9316880702972412, "Pretrain/Step": 2694, "Pretrain/Step Time": 8.513554777950048} +{"Pretrain/Learning Rate": 4.209051754791662e-05, "Pretrain/Loss": 2.0734148025512695, "Pretrain/Loss (Raw)": 1.9747400283813477, "Pretrain/Step": 2695, "Pretrain/Step Time": 8.514180332422256} +{"Pretrain/Learning Rate": 4.208432033501011e-05, "Pretrain/Loss": 2.0695362091064453, "Pretrain/Loss (Raw)": 1.7468421459197998, "Pretrain/Step": 2696, "Pretrain/Step Time": 8.511149354279041} +{"Pretrain/Learning Rate": 4.2078121151859276e-05, "Pretrain/Loss": 2.0699150562286377, "Pretrain/Loss (Raw)": 2.2030954360961914, "Pretrain/Step": 2697, "Pretrain/Step Time": 8.51192394644022} +{"Pretrain/Learning Rate": 4.2071919999179036e-05, "Pretrain/Loss": 2.0697221755981445, "Pretrain/Loss (Raw)": 1.9626917839050293, "Pretrain/Step": 2698, "Pretrain/Step Time": 8.514228293672204} +{"Pretrain/Learning Rate": 4.206571687768454e-05, "Pretrain/Loss": 2.0679850578308105, "Pretrain/Loss (Raw)": 1.9718559980392456, "Pretrain/Step": 2699, "Pretrain/Step Time": 8.517851430922747} +{"Pretrain/Learning Rate": 4.2059511788091146e-05, "Pretrain/Loss": 2.0702545642852783, "Pretrain/Loss (Raw)": 2.324558973312378, "Pretrain/Step": 2700, "Pretrain/Step Time": 8.519836382940412} +{"Pretrain/Learning Rate": 4.205330473111447e-05, "Pretrain/Loss": 2.0743985176086426, "Pretrain/Loss (Raw)": 2.3630595207214355, "Pretrain/Step": 2701, "Pretrain/Step Time": 8.515842663124204} +{"Pretrain/Learning Rate": 4.204709570747034e-05, "Pretrain/Loss": 2.07356595993042, "Pretrain/Loss (Raw)": 1.9955172538757324, "Pretrain/Step": 2702, "Pretrain/Step Time": 8.514626063406467} +{"Pretrain/Learning Rate": 4.2040884717874804e-05, "Pretrain/Loss": 2.0730459690093994, "Pretrain/Loss (Raw)": 1.9716414213180542, "Pretrain/Step": 2703, "Pretrain/Step Time": 8.517205623909831} +{"Pretrain/Learning Rate": 4.203467176304414e-05, "Pretrain/Loss": 2.074887990951538, "Pretrain/Loss (Raw)": 2.4639008045196533, "Pretrain/Step": 2704, "Pretrain/Step Time": 8.515001809224486} +{"Pretrain/Learning Rate": 4.202845684369486e-05, "Pretrain/Loss": 2.073237657546997, "Pretrain/Loss (Raw)": 2.039968729019165, "Pretrain/Step": 2705, "Pretrain/Step Time": 8.51459157280624} +{"Pretrain/Learning Rate": 4.202223996054369e-05, "Pretrain/Loss": 2.072148323059082, "Pretrain/Loss (Raw)": 1.9830658435821533, "Pretrain/Step": 2706, "Pretrain/Step Time": 8.509825143963099} +{"Pretrain/Learning Rate": 4.20160211143076e-05, "Pretrain/Loss": 2.0748379230499268, "Pretrain/Loss (Raw)": 2.3652617931365967, "Pretrain/Step": 2707, "Pretrain/Step Time": 8.502457160502672} +{"Pretrain/Learning Rate": 4.200980030570377e-05, "Pretrain/Loss": 2.0764524936676025, "Pretrain/Loss (Raw)": 2.1020915508270264, "Pretrain/Step": 2708, "Pretrain/Step Time": 8.499343322589993} +{"Pretrain/Learning Rate": 4.2003577535449624e-05, "Pretrain/Loss": 2.0768368244171143, "Pretrain/Loss (Raw)": 2.11808443069458, "Pretrain/Step": 2709, "Pretrain/Step Time": 8.497775632888079} +{"Pretrain/Learning Rate": 4.199735280426279e-05, "Pretrain/Loss": 2.0759503841400146, "Pretrain/Loss (Raw)": 2.002700090408325, "Pretrain/Step": 2710, "Pretrain/Step Time": 8.499815806746483} +{"Pretrain/Learning Rate": 4.199112611286113e-05, "Pretrain/Loss": 2.0774941444396973, "Pretrain/Loss (Raw)": 2.3180646896362305, "Pretrain/Step": 2711, "Pretrain/Step Time": 8.50610527023673} +{"Pretrain/Learning Rate": 4.1984897461962754e-05, "Pretrain/Loss": 2.0791356563568115, "Pretrain/Loss (Raw)": 2.282714605331421, "Pretrain/Step": 2712, "Pretrain/Step Time": 8.497507700696588} +{"Pretrain/Learning Rate": 4.197866685228596e-05, "Pretrain/Loss": 2.0791776180267334, "Pretrain/Loss (Raw)": 1.9425965547561646, "Pretrain/Step": 2713, "Pretrain/Step Time": 8.49318372644484} +{"Pretrain/Learning Rate": 4.19724342845493e-05, "Pretrain/Loss": 2.0774505138397217, "Pretrain/Loss (Raw)": 1.9332367181777954, "Pretrain/Step": 2714, "Pretrain/Step Time": 8.496303781867027} +{"Pretrain/Learning Rate": 4.1966199759471535e-05, "Pretrain/Loss": 2.0783348083496094, "Pretrain/Loss (Raw)": 2.1616313457489014, "Pretrain/Step": 2715, "Pretrain/Step Time": 8.501930300146341} +{"Pretrain/Learning Rate": 4.195996327777167e-05, "Pretrain/Loss": 2.079697370529175, "Pretrain/Loss (Raw)": 2.430799722671509, "Pretrain/Step": 2716, "Pretrain/Step Time": 8.501171225681901} +{"Pretrain/Learning Rate": 4.195372484016893e-05, "Pretrain/Loss": 2.0779881477355957, "Pretrain/Loss (Raw)": 1.8008946180343628, "Pretrain/Step": 2717, "Pretrain/Step Time": 8.502117006108165} +{"Pretrain/Learning Rate": 4.1947484447382746e-05, "Pretrain/Loss": 2.0782556533813477, "Pretrain/Loss (Raw)": 1.9856679439544678, "Pretrain/Step": 2718, "Pretrain/Step Time": 8.493753626942635} +{"Pretrain/Learning Rate": 4.194124210013279e-05, "Pretrain/Loss": 2.0779061317443848, "Pretrain/Loss (Raw)": 2.095181465148926, "Pretrain/Step": 2719, "Pretrain/Step Time": 8.491182630881667} +{"Pretrain/Learning Rate": 4.1934997799138976e-05, "Pretrain/Loss": 2.079660654067993, "Pretrain/Loss (Raw)": 2.206341505050659, "Pretrain/Step": 2720, "Pretrain/Step Time": 8.497093038633466} +{"Pretrain/Learning Rate": 4.192875154512141e-05, "Pretrain/Loss": 2.0788679122924805, "Pretrain/Loss (Raw)": 2.1520838737487793, "Pretrain/Step": 2721, "Pretrain/Step Time": 8.505393221974373} +{"Pretrain/Learning Rate": 4.192250333880045e-05, "Pretrain/Loss": 2.0770702362060547, "Pretrain/Loss (Raw)": 2.03519344329834, "Pretrain/Step": 2722, "Pretrain/Step Time": 8.503265861421824} +{"Pretrain/Learning Rate": 4.191625318089666e-05, "Pretrain/Loss": 2.081087589263916, "Pretrain/Loss (Raw)": 2.31414532661438, "Pretrain/Step": 2723, "Pretrain/Step Time": 8.508855320513248} +{"Pretrain/Learning Rate": 4.191000107213084e-05, "Pretrain/Loss": 2.081144094467163, "Pretrain/Loss (Raw)": 2.0871872901916504, "Pretrain/Step": 2724, "Pretrain/Step Time": 8.501598259434104} +{"Pretrain/Learning Rate": 4.190374701322401e-05, "Pretrain/Loss": 2.0800864696502686, "Pretrain/Loss (Raw)": 1.9341895580291748, "Pretrain/Step": 2725, "Pretrain/Step Time": 8.497926265001297} +{"Pretrain/Learning Rate": 4.1897491004897435e-05, "Pretrain/Loss": 2.0771842002868652, "Pretrain/Loss (Raw)": 1.9395792484283447, "Pretrain/Step": 2726, "Pretrain/Step Time": 8.498407458886504} +{"Pretrain/Learning Rate": 4.189123304787256e-05, "Pretrain/Loss": 2.0757861137390137, "Pretrain/Loss (Raw)": 2.0295703411102295, "Pretrain/Step": 2727, "Pretrain/Step Time": 8.502543464303017} +{"Pretrain/Learning Rate": 4.1884973142871096e-05, "Pretrain/Loss": 2.0747122764587402, "Pretrain/Loss (Raw)": 1.780176043510437, "Pretrain/Step": 2728, "Pretrain/Step Time": 8.506644651293755} +{"Pretrain/Learning Rate": 4.187871129061498e-05, "Pretrain/Loss": 2.0760726928710938, "Pretrain/Loss (Raw)": 2.049166679382324, "Pretrain/Step": 2729, "Pretrain/Step Time": 8.51725877262652} +{"Pretrain/Learning Rate": 4.187244749182633e-05, "Pretrain/Loss": 2.075927734375, "Pretrain/Loss (Raw)": 1.9951527118682861, "Pretrain/Step": 2730, "Pretrain/Step Time": 8.510401824489236} +{"Pretrain/Learning Rate": 4.1866181747227526e-05, "Pretrain/Loss": 2.074249744415283, "Pretrain/Loss (Raw)": 1.9936962127685547, "Pretrain/Step": 2731, "Pretrain/Step Time": 8.503108901903033} +{"Pretrain/Learning Rate": 4.185991405754118e-05, "Pretrain/Loss": 2.0733988285064697, "Pretrain/Loss (Raw)": 1.9229564666748047, "Pretrain/Step": 2732, "Pretrain/Step Time": 8.501413818448782} +{"Pretrain/Learning Rate": 4.185364442349008e-05, "Pretrain/Loss": 2.0727710723876953, "Pretrain/Loss (Raw)": 1.9129835367202759, "Pretrain/Step": 2733, "Pretrain/Step Time": 8.508002130314708} +{"Pretrain/Learning Rate": 4.184737284579731e-05, "Pretrain/Loss": 2.072988748550415, "Pretrain/Loss (Raw)": 2.067857503890991, "Pretrain/Step": 2734, "Pretrain/Step Time": 8.511010430753231} +{"Pretrain/Learning Rate": 4.18410993251861e-05, "Pretrain/Loss": 2.0721335411071777, "Pretrain/Loss (Raw)": 1.854836106300354, "Pretrain/Step": 2735, "Pretrain/Step Time": 8.519162585958838} +{"Pretrain/Learning Rate": 4.183482386237996e-05, "Pretrain/Loss": 2.0706639289855957, "Pretrain/Loss (Raw)": 1.9969556331634521, "Pretrain/Step": 2736, "Pretrain/Step Time": 8.513807015493512} +{"Pretrain/Learning Rate": 4.182854645810261e-05, "Pretrain/Loss": 2.0720906257629395, "Pretrain/Loss (Raw)": 2.2253220081329346, "Pretrain/Step": 2737, "Pretrain/Step Time": 8.511839469894767} +{"Pretrain/Learning Rate": 4.182226711307798e-05, "Pretrain/Loss": 2.0729658603668213, "Pretrain/Loss (Raw)": 2.034518003463745, "Pretrain/Step": 2738, "Pretrain/Step Time": 8.510413138195872} +{"Pretrain/Learning Rate": 4.181598582803024e-05, "Pretrain/Loss": 2.073807716369629, "Pretrain/Loss (Raw)": 2.044795036315918, "Pretrain/Step": 2739, "Pretrain/Step Time": 8.519120581448078} +{"Pretrain/Learning Rate": 4.1809702603683776e-05, "Pretrain/Loss": 2.0730347633361816, "Pretrain/Loss (Raw)": 1.9254809617996216, "Pretrain/Step": 2740, "Pretrain/Step Time": 8.519993469119072} +{"Pretrain/Learning Rate": 4.1803417440763196e-05, "Pretrain/Loss": 2.071850538253784, "Pretrain/Loss (Raw)": 1.9364447593688965, "Pretrain/Step": 2741, "Pretrain/Step Time": 8.521877098828554} +{"Pretrain/Learning Rate": 4.179713033999333e-05, "Pretrain/Loss": 2.069347858428955, "Pretrain/Loss (Raw)": 1.8902989625930786, "Pretrain/Step": 2742, "Pretrain/Step Time": 8.517757266759872} +{"Pretrain/Learning Rate": 4.1790841302099246e-05, "Pretrain/Loss": 2.0715584754943848, "Pretrain/Loss (Raw)": 2.1163530349731445, "Pretrain/Step": 2743, "Pretrain/Step Time": 8.508026596158743} +{"Pretrain/Learning Rate": 4.1784550327806226e-05, "Pretrain/Loss": 2.0715036392211914, "Pretrain/Loss (Raw)": 1.945650339126587, "Pretrain/Step": 2744, "Pretrain/Step Time": 8.50758040882647} +{"Pretrain/Learning Rate": 4.177825741783977e-05, "Pretrain/Loss": 2.0708181858062744, "Pretrain/Loss (Raw)": 1.9125734567642212, "Pretrain/Step": 2745, "Pretrain/Step Time": 8.513052912428975} +{"Pretrain/Learning Rate": 4.1771962572925606e-05, "Pretrain/Loss": 2.0692577362060547, "Pretrain/Loss (Raw)": 1.9626495838165283, "Pretrain/Step": 2746, "Pretrain/Step Time": 8.521265456452966} +{"Pretrain/Learning Rate": 4.176566579378968e-05, "Pretrain/Loss": 2.0692644119262695, "Pretrain/Loss (Raw)": 2.105330467224121, "Pretrain/Step": 2747, "Pretrain/Step Time": 8.525906192138791} +{"Pretrain/Learning Rate": 4.175936708115818e-05, "Pretrain/Loss": 2.0711669921875, "Pretrain/Loss (Raw)": 2.1694936752319336, "Pretrain/Step": 2748, "Pretrain/Step Time": 8.521615510806441} +{"Pretrain/Learning Rate": 4.1753066435757494e-05, "Pretrain/Loss": 2.0701446533203125, "Pretrain/Loss (Raw)": 1.953578233718872, "Pretrain/Step": 2749, "Pretrain/Step Time": 8.517477063462138} +{"Pretrain/Learning Rate": 4.1746763858314244e-05, "Pretrain/Loss": 2.0709309577941895, "Pretrain/Loss (Raw)": 2.0566842555999756, "Pretrain/Step": 2750, "Pretrain/Step Time": 8.51240167953074} +{"Pretrain/Learning Rate": 4.174045934955527e-05, "Pretrain/Loss": 2.0717129707336426, "Pretrain/Loss (Raw)": 2.1337244510650635, "Pretrain/Step": 2751, "Pretrain/Step Time": 8.518580483272672} +{"Pretrain/Learning Rate": 4.173415291020764e-05, "Pretrain/Loss": 2.0717029571533203, "Pretrain/Loss (Raw)": 2.0034193992614746, "Pretrain/Step": 2752, "Pretrain/Step Time": 8.526094725355506} +{"Pretrain/Learning Rate": 4.172784454099865e-05, "Pretrain/Loss": 2.071981430053711, "Pretrain/Loss (Raw)": 2.132984161376953, "Pretrain/Step": 2753, "Pretrain/Step Time": 8.526786083355546} +{"Pretrain/Learning Rate": 4.172153424265579e-05, "Pretrain/Loss": 2.0719261169433594, "Pretrain/Loss (Raw)": 2.0921924114227295, "Pretrain/Step": 2754, "Pretrain/Step Time": 8.516262013465166} +{"Pretrain/Learning Rate": 4.171522201590682e-05, "Pretrain/Loss": 2.071413040161133, "Pretrain/Loss (Raw)": 2.008129835128784, "Pretrain/Step": 2755, "Pretrain/Step Time": 8.511991128325462} +{"Pretrain/Learning Rate": 4.170890786147967e-05, "Pretrain/Loss": 2.073859214782715, "Pretrain/Loss (Raw)": 2.243497133255005, "Pretrain/Step": 2756, "Pretrain/Step Time": 8.506120460107923} +{"Pretrain/Learning Rate": 4.170259178010254e-05, "Pretrain/Loss": 2.074258327484131, "Pretrain/Loss (Raw)": 2.134336471557617, "Pretrain/Step": 2757, "Pretrain/Step Time": 8.51503648236394} +{"Pretrain/Learning Rate": 4.169627377250382e-05, "Pretrain/Loss": 2.07454776763916, "Pretrain/Loss (Raw)": 2.147958278656006, "Pretrain/Step": 2758, "Pretrain/Step Time": 8.519132243469357} +{"Pretrain/Learning Rate": 4.1689953839412124e-05, "Pretrain/Loss": 2.074434280395508, "Pretrain/Loss (Raw)": 2.1934585571289062, "Pretrain/Step": 2759, "Pretrain/Step Time": 8.525897467508912} +{"Pretrain/Learning Rate": 4.1683631981556314e-05, "Pretrain/Loss": 2.075084686279297, "Pretrain/Loss (Raw)": 2.098595380783081, "Pretrain/Step": 2760, "Pretrain/Step Time": 8.520041273906827} +{"Pretrain/Learning Rate": 4.167730819966545e-05, "Pretrain/Loss": 2.077507495880127, "Pretrain/Loss (Raw)": 2.0729217529296875, "Pretrain/Step": 2761, "Pretrain/Step Time": 8.510527124628425} +{"Pretrain/Learning Rate": 4.167098249446881e-05, "Pretrain/Loss": 2.0769073963165283, "Pretrain/Loss (Raw)": 1.9650572538375854, "Pretrain/Step": 2762, "Pretrain/Step Time": 8.506623551249504} +{"Pretrain/Learning Rate": 4.166465486669592e-05, "Pretrain/Loss": 2.0746231079101562, "Pretrain/Loss (Raw)": 1.8908649682998657, "Pretrain/Step": 2763, "Pretrain/Step Time": 8.51176436431706} +{"Pretrain/Learning Rate": 4.16583253170765e-05, "Pretrain/Loss": 2.075995445251465, "Pretrain/Loss (Raw)": 2.0605788230895996, "Pretrain/Step": 2764, "Pretrain/Step Time": 8.516627006232738} +{"Pretrain/Learning Rate": 4.165199384634051e-05, "Pretrain/Loss": 2.0747385025024414, "Pretrain/Loss (Raw)": 1.8913863897323608, "Pretrain/Step": 2765, "Pretrain/Step Time": 8.51485782675445} +{"Pretrain/Learning Rate": 4.164566045521812e-05, "Pretrain/Loss": 2.0754458904266357, "Pretrain/Loss (Raw)": 2.092989921569824, "Pretrain/Step": 2766, "Pretrain/Step Time": 8.507392266765237} +{"Pretrain/Learning Rate": 4.163932514443973e-05, "Pretrain/Loss": 2.0767836570739746, "Pretrain/Loss (Raw)": 2.2246439456939697, "Pretrain/Step": 2767, "Pretrain/Step Time": 8.50338307581842} +{"Pretrain/Learning Rate": 4.163298791473596e-05, "Pretrain/Loss": 2.0761208534240723, "Pretrain/Loss (Raw)": 2.0653114318847656, "Pretrain/Step": 2768, "Pretrain/Step Time": 8.508993580937386} +{"Pretrain/Learning Rate": 4.1626648766837654e-05, "Pretrain/Loss": 2.0741541385650635, "Pretrain/Loss (Raw)": 2.0255239009857178, "Pretrain/Step": 2769, "Pretrain/Step Time": 8.51611521653831} +{"Pretrain/Learning Rate": 4.162030770147585e-05, "Pretrain/Loss": 2.069674015045166, "Pretrain/Loss (Raw)": 1.8421730995178223, "Pretrain/Step": 2770, "Pretrain/Step Time": 8.520032512024045} +{"Pretrain/Learning Rate": 4.161396471938185e-05, "Pretrain/Loss": 2.068680763244629, "Pretrain/Loss (Raw)": 1.9437812566757202, "Pretrain/Step": 2771, "Pretrain/Step Time": 8.520103057846427} +{"Pretrain/Learning Rate": 4.1607619821287154e-05, "Pretrain/Loss": 2.068912982940674, "Pretrain/Loss (Raw)": 2.2113091945648193, "Pretrain/Step": 2772, "Pretrain/Step Time": 8.516362063586712} +{"Pretrain/Learning Rate": 4.160127300792348e-05, "Pretrain/Loss": 2.0692687034606934, "Pretrain/Loss (Raw)": 2.1470556259155273, "Pretrain/Step": 2773, "Pretrain/Step Time": 8.512868370860815} +{"Pretrain/Learning Rate": 4.159492428002277e-05, "Pretrain/Loss": 2.0677196979522705, "Pretrain/Loss (Raw)": 1.9712389707565308, "Pretrain/Step": 2774, "Pretrain/Step Time": 8.511743688955903} +{"Pretrain/Learning Rate": 4.1588573638317195e-05, "Pretrain/Loss": 2.0689144134521484, "Pretrain/Loss (Raw)": 2.085411787033081, "Pretrain/Step": 2775, "Pretrain/Step Time": 8.51362513564527} +{"Pretrain/Learning Rate": 4.158222108353915e-05, "Pretrain/Loss": 2.0702905654907227, "Pretrain/Loss (Raw)": 2.0822250843048096, "Pretrain/Step": 2776, "Pretrain/Step Time": 8.518263442441821} +{"Pretrain/Learning Rate": 4.1575866616421224e-05, "Pretrain/Loss": 2.0714592933654785, "Pretrain/Loss (Raw)": 2.157499074935913, "Pretrain/Step": 2777, "Pretrain/Step Time": 8.521074080839753} +{"Pretrain/Learning Rate": 4.156951023769625e-05, "Pretrain/Loss": 2.071286201477051, "Pretrain/Loss (Raw)": 2.0423343181610107, "Pretrain/Step": 2778, "Pretrain/Step Time": 8.519140165299177} +{"Pretrain/Learning Rate": 4.156315194809728e-05, "Pretrain/Loss": 2.070401906967163, "Pretrain/Loss (Raw)": 1.9919567108154297, "Pretrain/Step": 2779, "Pretrain/Step Time": 8.512132169678807} +{"Pretrain/Learning Rate": 4.1556791748357584e-05, "Pretrain/Loss": 2.0698060989379883, "Pretrain/Loss (Raw)": 1.8938677310943604, "Pretrain/Step": 2780, "Pretrain/Step Time": 8.519379319623113} +{"Pretrain/Learning Rate": 4.155042963921064e-05, "Pretrain/Loss": 2.0709171295166016, "Pretrain/Loss (Raw)": 2.1456501483917236, "Pretrain/Step": 2781, "Pretrain/Step Time": 8.51821673847735} +{"Pretrain/Learning Rate": 4.1544065621390165e-05, "Pretrain/Loss": 2.0711073875427246, "Pretrain/Loss (Raw)": 2.0781867504119873, "Pretrain/Step": 2782, "Pretrain/Step Time": 8.52045625820756} +{"Pretrain/Learning Rate": 4.153769969563008e-05, "Pretrain/Loss": 2.0694832801818848, "Pretrain/Loss (Raw)": 2.1615102291107178, "Pretrain/Step": 2783, "Pretrain/Step Time": 8.520901206880808} +{"Pretrain/Learning Rate": 4.1531331862664545e-05, "Pretrain/Loss": 2.0697717666625977, "Pretrain/Loss (Raw)": 2.149160146713257, "Pretrain/Step": 2784, "Pretrain/Step Time": 8.508184740319848} +{"Pretrain/Learning Rate": 4.1524962123227914e-05, "Pretrain/Loss": 2.070250988006592, "Pretrain/Loss (Raw)": 2.103682279586792, "Pretrain/Step": 2785, "Pretrain/Step Time": 8.505723940208554} +{"Pretrain/Learning Rate": 4.151859047805479e-05, "Pretrain/Loss": 2.0700747966766357, "Pretrain/Loss (Raw)": 2.0200679302215576, "Pretrain/Step": 2786, "Pretrain/Step Time": 8.510902639478445} +{"Pretrain/Learning Rate": 4.151221692787997e-05, "Pretrain/Loss": 2.070221424102783, "Pretrain/Loss (Raw)": 1.97771155834198, "Pretrain/Step": 2787, "Pretrain/Step Time": 8.50514306128025} +{"Pretrain/Learning Rate": 4.1505841473438485e-05, "Pretrain/Loss": 2.069610357284546, "Pretrain/Loss (Raw)": 2.1523945331573486, "Pretrain/Step": 2788, "Pretrain/Step Time": 8.506107989698648} +{"Pretrain/Learning Rate": 4.149946411546558e-05, "Pretrain/Loss": 2.070107936859131, "Pretrain/Loss (Raw)": 2.1408467292785645, "Pretrain/Step": 2789, "Pretrain/Step Time": 8.504268733784556} +{"Pretrain/Learning Rate": 4.1493084854696726e-05, "Pretrain/Loss": 2.069182872772217, "Pretrain/Loss (Raw)": 2.0600435733795166, "Pretrain/Step": 2790, "Pretrain/Step Time": 8.498007552698255} +{"Pretrain/Learning Rate": 4.1486703691867616e-05, "Pretrain/Loss": 2.0708045959472656, "Pretrain/Loss (Raw)": 2.3022501468658447, "Pretrain/Step": 2791, "Pretrain/Step Time": 8.498298963531852} +{"Pretrain/Learning Rate": 4.148032062771414e-05, "Pretrain/Loss": 2.0719821453094482, "Pretrain/Loss (Raw)": 2.160560369491577, "Pretrain/Step": 2792, "Pretrain/Step Time": 8.508389228954911} +{"Pretrain/Learning Rate": 4.147393566297244e-05, "Pretrain/Loss": 2.072828531265259, "Pretrain/Loss (Raw)": 2.223623752593994, "Pretrain/Step": 2793, "Pretrain/Step Time": 8.50336329638958} +{"Pretrain/Learning Rate": 4.1467548798378847e-05, "Pretrain/Loss": 2.0723347663879395, "Pretrain/Loss (Raw)": 2.116046905517578, "Pretrain/Step": 2794, "Pretrain/Step Time": 8.505293322727084} +{"Pretrain/Learning Rate": 4.1461160034669925e-05, "Pretrain/Loss": 2.0706419944763184, "Pretrain/Loss (Raw)": 1.8297533988952637, "Pretrain/Step": 2795, "Pretrain/Step Time": 8.505110826343298} +{"Pretrain/Learning Rate": 4.145476937258247e-05, "Pretrain/Loss": 2.070833683013916, "Pretrain/Loss (Raw)": 2.083038806915283, "Pretrain/Step": 2796, "Pretrain/Step Time": 8.498674351722002} +{"Pretrain/Learning Rate": 4.144837681285346e-05, "Pretrain/Loss": 2.075465202331543, "Pretrain/Loss (Raw)": 2.258187770843506, "Pretrain/Step": 2797, "Pretrain/Step Time": 8.504324596375227} +{"Pretrain/Learning Rate": 4.1441982356220144e-05, "Pretrain/Loss": 2.0747485160827637, "Pretrain/Loss (Raw)": 1.9165397882461548, "Pretrain/Step": 2798, "Pretrain/Step Time": 8.504175143316388} +{"Pretrain/Learning Rate": 4.1435586003419935e-05, "Pretrain/Loss": 2.073986053466797, "Pretrain/Loss (Raw)": 2.12304425239563, "Pretrain/Step": 2799, "Pretrain/Step Time": 8.50442835316062} +{"Pretrain/Learning Rate": 4.1429187755190504e-05, "Pretrain/Loss": 2.0734565258026123, "Pretrain/Loss (Raw)": 2.034048318862915, "Pretrain/Step": 2800, "Pretrain/Step Time": 8.501227332279086} +{"Pretrain/Learning Rate": 4.1422787612269726e-05, "Pretrain/Loss": 2.075183153152466, "Pretrain/Loss (Raw)": 2.3316538333892822, "Pretrain/Step": 2801, "Pretrain/Step Time": 8.497759651392698} +{"Pretrain/Learning Rate": 4.1416385575395686e-05, "Pretrain/Loss": 2.0750064849853516, "Pretrain/Loss (Raw)": 2.083017587661743, "Pretrain/Step": 2802, "Pretrain/Step Time": 8.487218672409654} +{"Pretrain/Learning Rate": 4.140998164530672e-05, "Pretrain/Loss": 2.075326919555664, "Pretrain/Loss (Raw)": 2.2677323818206787, "Pretrain/Step": 2803, "Pretrain/Step Time": 8.49551228247583} +{"Pretrain/Learning Rate": 4.140357582274133e-05, "Pretrain/Loss": 2.075169563293457, "Pretrain/Loss (Raw)": 2.073451042175293, "Pretrain/Step": 2804, "Pretrain/Step Time": 8.501333301886916} +{"Pretrain/Learning Rate": 4.1397168108438286e-05, "Pretrain/Loss": 2.0738484859466553, "Pretrain/Loss (Raw)": 2.0146408081054688, "Pretrain/Step": 2805, "Pretrain/Step Time": 8.499349348247051} +{"Pretrain/Learning Rate": 4.139075850313655e-05, "Pretrain/Loss": 2.0734307765960693, "Pretrain/Loss (Raw)": 2.003051996231079, "Pretrain/Step": 2806, "Pretrain/Step Time": 8.49975730292499} +{"Pretrain/Learning Rate": 4.1384347007575305e-05, "Pretrain/Loss": 2.0719680786132812, "Pretrain/Loss (Raw)": 1.8831892013549805, "Pretrain/Step": 2807, "Pretrain/Step Time": 8.500642063096166} +{"Pretrain/Learning Rate": 4.137793362249396e-05, "Pretrain/Loss": 2.072739362716675, "Pretrain/Loss (Raw)": 2.1990551948547363, "Pretrain/Step": 2808, "Pretrain/Step Time": 8.488847587257624} +{"Pretrain/Learning Rate": 4.137151834863213e-05, "Pretrain/Loss": 2.0722804069519043, "Pretrain/Loss (Raw)": 1.9630751609802246, "Pretrain/Step": 2809, "Pretrain/Step Time": 8.49331177957356} +{"Pretrain/Learning Rate": 4.136510118672966e-05, "Pretrain/Loss": 2.0703070163726807, "Pretrain/Loss (Raw)": 2.0953259468078613, "Pretrain/Step": 2810, "Pretrain/Step Time": 8.501939784735441} +{"Pretrain/Learning Rate": 4.135868213752661e-05, "Pretrain/Loss": 2.0729808807373047, "Pretrain/Loss (Raw)": 2.536027193069458, "Pretrain/Step": 2811, "Pretrain/Step Time": 8.502032682299614} +{"Pretrain/Learning Rate": 4.135226120176325e-05, "Pretrain/Loss": 2.0767648220062256, "Pretrain/Loss (Raw)": 2.6238207817077637, "Pretrain/Step": 2812, "Pretrain/Step Time": 8.504696104675531} +{"Pretrain/Learning Rate": 4.134583838018007e-05, "Pretrain/Loss": 2.0765221118927, "Pretrain/Loss (Raw)": 2.040667772293091, "Pretrain/Step": 2813, "Pretrain/Step Time": 8.50309950299561} +{"Pretrain/Learning Rate": 4.133941367351779e-05, "Pretrain/Loss": 2.0772652626037598, "Pretrain/Loss (Raw)": 2.158374547958374, "Pretrain/Step": 2814, "Pretrain/Step Time": 8.496402971446514} +{"Pretrain/Learning Rate": 4.133298708251733e-05, "Pretrain/Loss": 2.076847553253174, "Pretrain/Loss (Raw)": 2.1130433082580566, "Pretrain/Step": 2815, "Pretrain/Step Time": 8.499214759096503} +{"Pretrain/Learning Rate": 4.132655860791983e-05, "Pretrain/Loss": 2.0746912956237793, "Pretrain/Loss (Raw)": 1.8119196891784668, "Pretrain/Step": 2816, "Pretrain/Step Time": 8.508515888825059} +{"Pretrain/Learning Rate": 4.132012825046666e-05, "Pretrain/Loss": 2.0749294757843018, "Pretrain/Loss (Raw)": 2.2145841121673584, "Pretrain/Step": 2817, "Pretrain/Step Time": 8.509153500199318} +{"Pretrain/Learning Rate": 4.13136960108994e-05, "Pretrain/Loss": 2.074646234512329, "Pretrain/Loss (Raw)": 2.158235788345337, "Pretrain/Step": 2818, "Pretrain/Step Time": 8.510560857132077} +{"Pretrain/Learning Rate": 4.130726188995985e-05, "Pretrain/Loss": 2.076195240020752, "Pretrain/Loss (Raw)": 2.3151321411132812, "Pretrain/Step": 2819, "Pretrain/Step Time": 8.498626345768571} +{"Pretrain/Learning Rate": 4.1300825888390006e-05, "Pretrain/Loss": 2.0768463611602783, "Pretrain/Loss (Raw)": 1.9606890678405762, "Pretrain/Step": 2820, "Pretrain/Step Time": 8.501501526683569} +{"Pretrain/Learning Rate": 4.1294388006932114e-05, "Pretrain/Loss": 2.074958086013794, "Pretrain/Loss (Raw)": 1.8423972129821777, "Pretrain/Step": 2821, "Pretrain/Step Time": 8.501468462869525} +{"Pretrain/Learning Rate": 4.128794824632861e-05, "Pretrain/Loss": 2.0739238262176514, "Pretrain/Loss (Raw)": 1.7992844581604004, "Pretrain/Step": 2822, "Pretrain/Step Time": 8.51202874071896} +{"Pretrain/Learning Rate": 4.1281506607322167e-05, "Pretrain/Loss": 2.0747599601745605, "Pretrain/Loss (Raw)": 2.0817618370056152, "Pretrain/Step": 2823, "Pretrain/Step Time": 8.51457990333438} +{"Pretrain/Learning Rate": 4.1275063090655666e-05, "Pretrain/Loss": 2.0760679244995117, "Pretrain/Loss (Raw)": 1.9142767190933228, "Pretrain/Step": 2824, "Pretrain/Step Time": 8.511433089151978} +{"Pretrain/Learning Rate": 4.126861769707219e-05, "Pretrain/Loss": 2.075230836868286, "Pretrain/Loss (Raw)": 2.095930337905884, "Pretrain/Step": 2825, "Pretrain/Step Time": 8.506875526160002} +{"Pretrain/Learning Rate": 4.126217042731507e-05, "Pretrain/Loss": 2.07554030418396, "Pretrain/Loss (Raw)": 2.0023179054260254, "Pretrain/Step": 2826, "Pretrain/Step Time": 8.506676947697997} +{"Pretrain/Learning Rate": 4.125572128212781e-05, "Pretrain/Loss": 2.0761046409606934, "Pretrain/Loss (Raw)": 2.0440714359283447, "Pretrain/Step": 2827, "Pretrain/Step Time": 8.50502872094512} +{"Pretrain/Learning Rate": 4.124927026225419e-05, "Pretrain/Loss": 2.0741806030273438, "Pretrain/Loss (Raw)": 2.0782835483551025, "Pretrain/Step": 2828, "Pretrain/Step Time": 8.504519244655967} +{"Pretrain/Learning Rate": 4.124281736843815e-05, "Pretrain/Loss": 2.071641206741333, "Pretrain/Loss (Raw)": 2.038022041320801, "Pretrain/Step": 2829, "Pretrain/Step Time": 8.50325520709157} +{"Pretrain/Learning Rate": 4.1236362601423865e-05, "Pretrain/Loss": 2.0733394622802734, "Pretrain/Loss (Raw)": 2.212880849838257, "Pretrain/Step": 2830, "Pretrain/Step Time": 8.50446679070592} +{"Pretrain/Learning Rate": 4.122990596195574e-05, "Pretrain/Loss": 2.075538158416748, "Pretrain/Loss (Raw)": 2.253086566925049, "Pretrain/Step": 2831, "Pretrain/Step Time": 8.499858744442463} +{"Pretrain/Learning Rate": 4.122344745077838e-05, "Pretrain/Loss": 2.07124662399292, "Pretrain/Loss (Raw)": 1.91457998752594, "Pretrain/Step": 2832, "Pretrain/Step Time": 8.502583665773273} +{"Pretrain/Learning Rate": 4.121698706863662e-05, "Pretrain/Loss": 2.0717899799346924, "Pretrain/Loss (Raw)": 2.109516143798828, "Pretrain/Step": 2833, "Pretrain/Step Time": 8.507666332647204} +{"Pretrain/Learning Rate": 4.121052481627549e-05, "Pretrain/Loss": 2.073903799057007, "Pretrain/Loss (Raw)": 2.2536370754241943, "Pretrain/Step": 2834, "Pretrain/Step Time": 8.514847572892904} +{"Pretrain/Learning Rate": 4.120406069444025e-05, "Pretrain/Loss": 2.0706639289855957, "Pretrain/Loss (Raw)": 1.9505629539489746, "Pretrain/Step": 2835, "Pretrain/Step Time": 8.516144335269928} +{"Pretrain/Learning Rate": 4.119759470387637e-05, "Pretrain/Loss": 2.071241617202759, "Pretrain/Loss (Raw)": 2.1760475635528564, "Pretrain/Step": 2836, "Pretrain/Step Time": 8.52217667736113} +{"Pretrain/Learning Rate": 4.1191126845329554e-05, "Pretrain/Loss": 2.0709099769592285, "Pretrain/Loss (Raw)": 2.075650930404663, "Pretrain/Step": 2837, "Pretrain/Step Time": 8.520409731194377} +{"Pretrain/Learning Rate": 4.118465711954569e-05, "Pretrain/Loss": 2.0721895694732666, "Pretrain/Loss (Raw)": 2.1664702892303467, "Pretrain/Step": 2838, "Pretrain/Step Time": 8.513037947937846} +{"Pretrain/Learning Rate": 4.1178185527270905e-05, "Pretrain/Loss": 2.0700976848602295, "Pretrain/Loss (Raw)": 2.0502824783325195, "Pretrain/Step": 2839, "Pretrain/Step Time": 8.515332570299506} +{"Pretrain/Learning Rate": 4.1171712069251534e-05, "Pretrain/Loss": 2.0687124729156494, "Pretrain/Loss (Raw)": 2.105421781539917, "Pretrain/Step": 2840, "Pretrain/Step Time": 8.520685017108917} +{"Pretrain/Learning Rate": 4.116523674623412e-05, "Pretrain/Loss": 2.0713114738464355, "Pretrain/Loss (Raw)": 2.2752439975738525, "Pretrain/Step": 2841, "Pretrain/Step Time": 8.523919524624944} +{"Pretrain/Learning Rate": 4.115875955896543e-05, "Pretrain/Loss": 2.0718061923980713, "Pretrain/Loss (Raw)": 1.9965934753417969, "Pretrain/Step": 2842, "Pretrain/Step Time": 8.522924594581127} +{"Pretrain/Learning Rate": 4.115228050819244e-05, "Pretrain/Loss": 2.071537494659424, "Pretrain/Loss (Raw)": 2.127232551574707, "Pretrain/Step": 2843, "Pretrain/Step Time": 8.513710899278522} +{"Pretrain/Learning Rate": 4.114579959466235e-05, "Pretrain/Loss": 2.068492889404297, "Pretrain/Loss (Raw)": 2.041090488433838, "Pretrain/Step": 2844, "Pretrain/Step Time": 8.509088836610317} +{"Pretrain/Learning Rate": 4.113931681912257e-05, "Pretrain/Loss": 2.0713934898376465, "Pretrain/Loss (Raw)": 2.1721715927124023, "Pretrain/Step": 2845, "Pretrain/Step Time": 8.51626993343234} +{"Pretrain/Learning Rate": 4.113283218232073e-05, "Pretrain/Loss": 2.0700528621673584, "Pretrain/Loss (Raw)": 1.8140676021575928, "Pretrain/Step": 2846, "Pretrain/Step Time": 8.527365708723664} +{"Pretrain/Learning Rate": 4.112634568500466e-05, "Pretrain/Loss": 2.069653034210205, "Pretrain/Loss (Raw)": 2.0439836978912354, "Pretrain/Step": 2847, "Pretrain/Step Time": 8.524742282927036} +{"Pretrain/Learning Rate": 4.111985732792242e-05, "Pretrain/Loss": 2.068571090698242, "Pretrain/Loss (Raw)": 2.0678763389587402, "Pretrain/Step": 2848, "Pretrain/Step Time": 8.52224550768733} +{"Pretrain/Learning Rate": 4.111336711182226e-05, "Pretrain/Loss": 2.0681464672088623, "Pretrain/Loss (Raw)": 2.097720146179199, "Pretrain/Step": 2849, "Pretrain/Step Time": 8.513685395941138} +{"Pretrain/Learning Rate": 4.110687503745269e-05, "Pretrain/Loss": 2.0669918060302734, "Pretrain/Loss (Raw)": 1.8874155282974243, "Pretrain/Step": 2850, "Pretrain/Step Time": 8.516846794635057} +{"Pretrain/Learning Rate": 4.1100381105562394e-05, "Pretrain/Loss": 2.0646164417266846, "Pretrain/Loss (Raw)": 2.0100672245025635, "Pretrain/Step": 2851, "Pretrain/Step Time": 8.515960706397891} +{"Pretrain/Learning Rate": 4.109388531690027e-05, "Pretrain/Loss": 2.0637266635894775, "Pretrain/Loss (Raw)": 1.9733003377914429, "Pretrain/Step": 2852, "Pretrain/Step Time": 8.521117137745023} +{"Pretrain/Learning Rate": 4.108738767221546e-05, "Pretrain/Loss": 2.0642566680908203, "Pretrain/Loss (Raw)": 2.0020575523376465, "Pretrain/Step": 2853, "Pretrain/Step Time": 8.526098879054189} +{"Pretrain/Learning Rate": 4.108088817225729e-05, "Pretrain/Loss": 2.0665645599365234, "Pretrain/Loss (Raw)": 2.2349777221679688, "Pretrain/Step": 2854, "Pretrain/Step Time": 8.522816523909569} +{"Pretrain/Learning Rate": 4.1074386817775334e-05, "Pretrain/Loss": 2.0692567825317383, "Pretrain/Loss (Raw)": 2.3741719722747803, "Pretrain/Step": 2855, "Pretrain/Step Time": 8.520451821386814} +{"Pretrain/Learning Rate": 4.106788360951934e-05, "Pretrain/Loss": 2.071084976196289, "Pretrain/Loss (Raw)": 2.0141797065734863, "Pretrain/Step": 2856, "Pretrain/Step Time": 8.514718549326062} +{"Pretrain/Learning Rate": 4.106137854823929e-05, "Pretrain/Loss": 2.071242332458496, "Pretrain/Loss (Raw)": 2.0693182945251465, "Pretrain/Step": 2857, "Pretrain/Step Time": 8.506365580484271} +{"Pretrain/Learning Rate": 4.1054871634685385e-05, "Pretrain/Loss": 2.0712320804595947, "Pretrain/Loss (Raw)": 1.9938380718231201, "Pretrain/Step": 2858, "Pretrain/Step Time": 8.516544507816434} +{"Pretrain/Learning Rate": 4.104836286960802e-05, "Pretrain/Loss": 2.0725581645965576, "Pretrain/Loss (Raw)": 2.163422107696533, "Pretrain/Step": 2859, "Pretrain/Step Time": 8.51869216375053} +{"Pretrain/Learning Rate": 4.1041852253757836e-05, "Pretrain/Loss": 2.0737924575805664, "Pretrain/Loss (Raw)": 2.0809457302093506, "Pretrain/Step": 2860, "Pretrain/Step Time": 8.520765528082848} +{"Pretrain/Learning Rate": 4.103533978788566e-05, "Pretrain/Loss": 2.074921131134033, "Pretrain/Loss (Raw)": 2.057466506958008, "Pretrain/Step": 2861, "Pretrain/Step Time": 8.514662561938167} +{"Pretrain/Learning Rate": 4.1028825472742536e-05, "Pretrain/Loss": 2.075580358505249, "Pretrain/Loss (Raw)": 2.1522281169891357, "Pretrain/Step": 2862, "Pretrain/Step Time": 8.506427774205804} +{"Pretrain/Learning Rate": 4.1022309309079734e-05, "Pretrain/Loss": 2.07596755027771, "Pretrain/Loss (Raw)": 1.9043998718261719, "Pretrain/Step": 2863, "Pretrain/Step Time": 8.497543660923839} +{"Pretrain/Learning Rate": 4.1015791297648716e-05, "Pretrain/Loss": 2.075169801712036, "Pretrain/Loss (Raw)": 1.8948534727096558, "Pretrain/Step": 2864, "Pretrain/Step Time": 8.505687339231372} +{"Pretrain/Learning Rate": 4.100927143920118e-05, "Pretrain/Loss": 2.0729329586029053, "Pretrain/Loss (Raw)": 1.9389867782592773, "Pretrain/Step": 2865, "Pretrain/Step Time": 8.512046901509166} +{"Pretrain/Learning Rate": 4.100274973448902e-05, "Pretrain/Loss": 2.0722122192382812, "Pretrain/Loss (Raw)": 1.9422601461410522, "Pretrain/Step": 2866, "Pretrain/Step Time": 8.512977881357074} +{"Pretrain/Learning Rate": 4.099622618426436e-05, "Pretrain/Loss": 2.071688652038574, "Pretrain/Loss (Raw)": 1.9777755737304688, "Pretrain/Step": 2867, "Pretrain/Step Time": 8.503397721797228} +{"Pretrain/Learning Rate": 4.098970078927951e-05, "Pretrain/Loss": 2.070729970932007, "Pretrain/Loss (Raw)": 1.8027745485305786, "Pretrain/Step": 2868, "Pretrain/Step Time": 8.50717892870307} +{"Pretrain/Learning Rate": 4.0983173550287026e-05, "Pretrain/Loss": 2.0725858211517334, "Pretrain/Loss (Raw)": 2.1740057468414307, "Pretrain/Step": 2869, "Pretrain/Step Time": 8.510469989851117} +{"Pretrain/Learning Rate": 4.0976644468039646e-05, "Pretrain/Loss": 2.0749123096466064, "Pretrain/Loss (Raw)": 2.188076972961426, "Pretrain/Step": 2870, "Pretrain/Step Time": 8.509551223367453} +{"Pretrain/Learning Rate": 4.097011354329035e-05, "Pretrain/Loss": 2.0731170177459717, "Pretrain/Loss (Raw)": 1.8865618705749512, "Pretrain/Step": 2871, "Pretrain/Step Time": 8.509907873347402} +{"Pretrain/Learning Rate": 4.096358077679231e-05, "Pretrain/Loss": 2.074946880340576, "Pretrain/Loss (Raw)": 2.179861545562744, "Pretrain/Step": 2872, "Pretrain/Step Time": 8.512234939262271} +{"Pretrain/Learning Rate": 4.0957046169298895e-05, "Pretrain/Loss": 2.075404167175293, "Pretrain/Loss (Raw)": 1.9711012840270996, "Pretrain/Step": 2873, "Pretrain/Step Time": 8.509061057120562} +{"Pretrain/Learning Rate": 4.095050972156374e-05, "Pretrain/Loss": 2.0732007026672363, "Pretrain/Loss (Raw)": 1.680627465248108, "Pretrain/Step": 2874, "Pretrain/Step Time": 8.502205923199654} +{"Pretrain/Learning Rate": 4.0943971434340633e-05, "Pretrain/Loss": 2.0742812156677246, "Pretrain/Loss (Raw)": 2.2436141967773438, "Pretrain/Step": 2875, "Pretrain/Step Time": 8.50042618624866} +{"Pretrain/Learning Rate": 4.093743130838361e-05, "Pretrain/Loss": 2.072096824645996, "Pretrain/Loss (Raw)": 1.8899202346801758, "Pretrain/Step": 2876, "Pretrain/Step Time": 8.501254808157682} +{"Pretrain/Learning Rate": 4.093088934444692e-05, "Pretrain/Loss": 2.0736379623413086, "Pretrain/Loss (Raw)": 2.1508290767669678, "Pretrain/Step": 2877, "Pretrain/Step Time": 8.501224514096975} +{"Pretrain/Learning Rate": 4.092434554328499e-05, "Pretrain/Loss": 2.073289155960083, "Pretrain/Loss (Raw)": 2.0120339393615723, "Pretrain/Step": 2878, "Pretrain/Step Time": 8.502702966332436} +{"Pretrain/Learning Rate": 4.09177999056525e-05, "Pretrain/Loss": 2.071197986602783, "Pretrain/Loss (Raw)": 1.866089940071106, "Pretrain/Step": 2879, "Pretrain/Step Time": 8.496637735515833} +{"Pretrain/Learning Rate": 4.0911252432304316e-05, "Pretrain/Loss": 2.0703396797180176, "Pretrain/Loss (Raw)": 1.8935121297836304, "Pretrain/Step": 2880, "Pretrain/Step Time": 8.493063079193234} +{"Pretrain/Learning Rate": 4.0904703123995516e-05, "Pretrain/Loss": 2.068108558654785, "Pretrain/Loss (Raw)": 1.8474093675613403, "Pretrain/Step": 2881, "Pretrain/Step Time": 8.496260298416018} +{"Pretrain/Learning Rate": 4.0898151981481416e-05, "Pretrain/Loss": 2.06770396232605, "Pretrain/Loss (Raw)": 2.040409803390503, "Pretrain/Step": 2882, "Pretrain/Step Time": 8.499396592378616} +{"Pretrain/Learning Rate": 4.089159900551752e-05, "Pretrain/Loss": 2.068594455718994, "Pretrain/Loss (Raw)": 2.122114419937134, "Pretrain/Step": 2883, "Pretrain/Step Time": 8.500468147918582} +{"Pretrain/Learning Rate": 4.0885044196859537e-05, "Pretrain/Loss": 2.067875385284424, "Pretrain/Loss (Raw)": 2.1514575481414795, "Pretrain/Step": 2884, "Pretrain/Step Time": 8.50234173797071} +{"Pretrain/Learning Rate": 4.08784875562634e-05, "Pretrain/Loss": 2.0668787956237793, "Pretrain/Loss (Raw)": 2.006774425506592, "Pretrain/Step": 2885, "Pretrain/Step Time": 8.490115331485868} +{"Pretrain/Learning Rate": 4.087192908448526e-05, "Pretrain/Loss": 2.066620111465454, "Pretrain/Loss (Raw)": 2.114835500717163, "Pretrain/Step": 2886, "Pretrain/Step Time": 8.49230351112783} +{"Pretrain/Learning Rate": 4.086536878228147e-05, "Pretrain/Loss": 2.0670559406280518, "Pretrain/Loss (Raw)": 2.249272584915161, "Pretrain/Step": 2887, "Pretrain/Step Time": 8.49667789414525} +{"Pretrain/Learning Rate": 4.0858806650408586e-05, "Pretrain/Loss": 2.0651698112487793, "Pretrain/Loss (Raw)": 1.857147455215454, "Pretrain/Step": 2888, "Pretrain/Step Time": 8.499472571536899} +{"Pretrain/Learning Rate": 4.08522426896234e-05, "Pretrain/Loss": 2.0641937255859375, "Pretrain/Loss (Raw)": 1.9479906558990479, "Pretrain/Step": 2889, "Pretrain/Step Time": 8.50187005288899} +{"Pretrain/Learning Rate": 4.0845676900682884e-05, "Pretrain/Loss": 2.064311981201172, "Pretrain/Loss (Raw)": 1.9801751375198364, "Pretrain/Step": 2890, "Pretrain/Step Time": 8.498882301151752} +{"Pretrain/Learning Rate": 4.0839109284344235e-05, "Pretrain/Loss": 2.0658864974975586, "Pretrain/Loss (Raw)": 2.0924530029296875, "Pretrain/Step": 2891, "Pretrain/Step Time": 8.49272465147078} +{"Pretrain/Learning Rate": 4.083253984136487e-05, "Pretrain/Loss": 2.065580129623413, "Pretrain/Loss (Raw)": 2.0213422775268555, "Pretrain/Step": 2892, "Pretrain/Step Time": 8.496333802118897} +{"Pretrain/Learning Rate": 4.0825968572502404e-05, "Pretrain/Loss": 2.067155599594116, "Pretrain/Loss (Raw)": 2.093050003051758, "Pretrain/Step": 2893, "Pretrain/Step Time": 8.506693424656987} +{"Pretrain/Learning Rate": 4.081939547851467e-05, "Pretrain/Loss": 2.0649538040161133, "Pretrain/Loss (Raw)": 1.8111361265182495, "Pretrain/Step": 2894, "Pretrain/Step Time": 8.504161193966866} +{"Pretrain/Learning Rate": 4.0812820560159705e-05, "Pretrain/Loss": 2.0625579357147217, "Pretrain/Loss (Raw)": 1.918014407157898, "Pretrain/Step": 2895, "Pretrain/Step Time": 8.51192974485457} +{"Pretrain/Learning Rate": 4.0806243818195765e-05, "Pretrain/Loss": 2.0631628036499023, "Pretrain/Loss (Raw)": 2.142709732055664, "Pretrain/Step": 2896, "Pretrain/Step Time": 8.501971438527107} +{"Pretrain/Learning Rate": 4.07996652533813e-05, "Pretrain/Loss": 2.064749002456665, "Pretrain/Loss (Raw)": 2.2285642623901367, "Pretrain/Step": 2897, "Pretrain/Step Time": 8.497956600040197} +{"Pretrain/Learning Rate": 4.0793084866474986e-05, "Pretrain/Loss": 2.065645933151245, "Pretrain/Loss (Raw)": 1.9569599628448486, "Pretrain/Step": 2898, "Pretrain/Step Time": 8.500285683199763} +{"Pretrain/Learning Rate": 4.078650265823571e-05, "Pretrain/Loss": 2.0701699256896973, "Pretrain/Loss (Raw)": 2.522901773452759, "Pretrain/Step": 2899, "Pretrain/Step Time": 8.50578386709094} +{"Pretrain/Learning Rate": 4.077991862942256e-05, "Pretrain/Loss": 2.0703182220458984, "Pretrain/Loss (Raw)": 2.230268716812134, "Pretrain/Step": 2900, "Pretrain/Step Time": 8.505700036883354} +{"Pretrain/Learning Rate": 4.0773332780794834e-05, "Pretrain/Loss": 2.069774627685547, "Pretrain/Loss (Raw)": 2.0774829387664795, "Pretrain/Step": 2901, "Pretrain/Step Time": 8.505010675638914} +{"Pretrain/Learning Rate": 4.076674511311205e-05, "Pretrain/Loss": 2.0696115493774414, "Pretrain/Loss (Raw)": 1.9503144025802612, "Pretrain/Step": 2902, "Pretrain/Step Time": 8.505134284496307} +{"Pretrain/Learning Rate": 4.0760155627133924e-05, "Pretrain/Loss": 2.069490671157837, "Pretrain/Loss (Raw)": 2.0699844360351562, "Pretrain/Step": 2903, "Pretrain/Step Time": 8.501260286197066} +{"Pretrain/Learning Rate": 4.075356432362037e-05, "Pretrain/Loss": 2.0701751708984375, "Pretrain/Loss (Raw)": 2.1698334217071533, "Pretrain/Step": 2904, "Pretrain/Step Time": 8.50175779685378} +{"Pretrain/Learning Rate": 4.074697120333156e-05, "Pretrain/Loss": 2.06965970993042, "Pretrain/Loss (Raw)": 2.091545820236206, "Pretrain/Step": 2905, "Pretrain/Step Time": 8.511796975508332} +{"Pretrain/Learning Rate": 4.0740376267027836e-05, "Pretrain/Loss": 2.0693724155426025, "Pretrain/Loss (Raw)": 2.005519390106201, "Pretrain/Step": 2906, "Pretrain/Step Time": 8.508268728852272} +{"Pretrain/Learning Rate": 4.0733779515469736e-05, "Pretrain/Loss": 2.0700395107269287, "Pretrain/Loss (Raw)": 2.0773634910583496, "Pretrain/Step": 2907, "Pretrain/Step Time": 8.509269759058952} +{"Pretrain/Learning Rate": 4.072718094941805e-05, "Pretrain/Loss": 2.072422504425049, "Pretrain/Loss (Raw)": 2.198880434036255, "Pretrain/Step": 2908, "Pretrain/Step Time": 8.498371183872223} +{"Pretrain/Learning Rate": 4.0720580569633746e-05, "Pretrain/Loss": 2.070772409439087, "Pretrain/Loss (Raw)": 1.9344563484191895, "Pretrain/Step": 2909, "Pretrain/Step Time": 8.501780373975635} +{"Pretrain/Learning Rate": 4.0713978376878016e-05, "Pretrain/Loss": 2.0704100131988525, "Pretrain/Loss (Raw)": 2.031759262084961, "Pretrain/Step": 2910, "Pretrain/Step Time": 8.506246211007237} +{"Pretrain/Learning Rate": 4.070737437191224e-05, "Pretrain/Loss": 2.070369005203247, "Pretrain/Loss (Raw)": 2.156301975250244, "Pretrain/Step": 2911, "Pretrain/Step Time": 8.513591211289167} +{"Pretrain/Learning Rate": 4.0700768555498045e-05, "Pretrain/Loss": 2.070922613143921, "Pretrain/Loss (Raw)": 2.220003604888916, "Pretrain/Step": 2912, "Pretrain/Step Time": 8.512863844633102} +{"Pretrain/Learning Rate": 4.069416092839724e-05, "Pretrain/Loss": 2.0710256099700928, "Pretrain/Loss (Raw)": 2.1168763637542725, "Pretrain/Step": 2913, "Pretrain/Step Time": 8.510460048913956} +{"Pretrain/Learning Rate": 4.068755149137184e-05, "Pretrain/Loss": 2.073072910308838, "Pretrain/Loss (Raw)": 2.2821288108825684, "Pretrain/Step": 2914, "Pretrain/Step Time": 8.502306098118424} +{"Pretrain/Learning Rate": 4.0680940245184076e-05, "Pretrain/Loss": 2.0747694969177246, "Pretrain/Loss (Raw)": 2.1948468685150146, "Pretrain/Step": 2915, "Pretrain/Step Time": 8.50255380757153} +{"Pretrain/Learning Rate": 4.06743271905964e-05, "Pretrain/Loss": 2.075486183166504, "Pretrain/Loss (Raw)": 2.244161367416382, "Pretrain/Step": 2916, "Pretrain/Step Time": 8.508006552234292} +{"Pretrain/Learning Rate": 4.066771232837144e-05, "Pretrain/Loss": 2.0765295028686523, "Pretrain/Loss (Raw)": 2.2744030952453613, "Pretrain/Step": 2917, "Pretrain/Step Time": 8.51615735143423} +{"Pretrain/Learning Rate": 4.066109565927208e-05, "Pretrain/Loss": 2.075883388519287, "Pretrain/Loss (Raw)": 1.977290153503418, "Pretrain/Step": 2918, "Pretrain/Step Time": 8.517017241567373} +{"Pretrain/Learning Rate": 4.0654477184061356e-05, "Pretrain/Loss": 2.0747621059417725, "Pretrain/Loss (Raw)": 2.158743143081665, "Pretrain/Step": 2919, "Pretrain/Step Time": 8.513163954019547} +{"Pretrain/Learning Rate": 4.064785690350257e-05, "Pretrain/Loss": 2.0745973587036133, "Pretrain/Loss (Raw)": 2.139462947845459, "Pretrain/Step": 2920, "Pretrain/Step Time": 8.503729853779078} +{"Pretrain/Learning Rate": 4.064123481835919e-05, "Pretrain/Loss": 2.073076009750366, "Pretrain/Loss (Raw)": 2.0289125442504883, "Pretrain/Step": 2921, "Pretrain/Step Time": 8.50533151999116} +{"Pretrain/Learning Rate": 4.0634610929394893e-05, "Pretrain/Loss": 2.071929693222046, "Pretrain/Loss (Raw)": 1.9693200588226318, "Pretrain/Step": 2922, "Pretrain/Step Time": 8.511665171012282} +{"Pretrain/Learning Rate": 4.06279852373736e-05, "Pretrain/Loss": 2.072310447692871, "Pretrain/Loss (Raw)": 1.8784573078155518, "Pretrain/Step": 2923, "Pretrain/Step Time": 8.515265429392457} +{"Pretrain/Learning Rate": 4.0621357743059415e-05, "Pretrain/Loss": 2.071155548095703, "Pretrain/Loss (Raw)": 1.935226559638977, "Pretrain/Step": 2924, "Pretrain/Step Time": 8.515804167836905} +{"Pretrain/Learning Rate": 4.061472844721664e-05, "Pretrain/Loss": 2.0688953399658203, "Pretrain/Loss (Raw)": 1.9689018726348877, "Pretrain/Step": 2925, "Pretrain/Step Time": 8.511797124519944} +{"Pretrain/Learning Rate": 4.06080973506098e-05, "Pretrain/Loss": 2.0691452026367188, "Pretrain/Loss (Raw)": 1.9485288858413696, "Pretrain/Step": 2926, "Pretrain/Step Time": 8.509700823575258} +{"Pretrain/Learning Rate": 4.0601464454003624e-05, "Pretrain/Loss": 2.0680699348449707, "Pretrain/Loss (Raw)": 1.9853758811950684, "Pretrain/Step": 2927, "Pretrain/Step Time": 8.50856614857912} +{"Pretrain/Learning Rate": 4.059482975816305e-05, "Pretrain/Loss": 2.0689330101013184, "Pretrain/Loss (Raw)": 2.1445493698120117, "Pretrain/Step": 2928, "Pretrain/Step Time": 8.513981902971864} +{"Pretrain/Learning Rate": 4.058819326385322e-05, "Pretrain/Loss": 2.0665769577026367, "Pretrain/Loss (Raw)": 2.0300827026367188, "Pretrain/Step": 2929, "Pretrain/Step Time": 8.518216952681541} +{"Pretrain/Learning Rate": 4.05815549718395e-05, "Pretrain/Loss": 2.067570447921753, "Pretrain/Loss (Raw)": 2.2101783752441406, "Pretrain/Step": 2930, "Pretrain/Step Time": 8.527932859957218} +{"Pretrain/Learning Rate": 4.057491488288743e-05, "Pretrain/Loss": 2.066319704055786, "Pretrain/Loss (Raw)": 2.1076231002807617, "Pretrain/Step": 2931, "Pretrain/Step Time": 8.519027108326554} +{"Pretrain/Learning Rate": 4.0568272997762785e-05, "Pretrain/Loss": 2.062634229660034, "Pretrain/Loss (Raw)": 1.601714849472046, "Pretrain/Step": 2932, "Pretrain/Step Time": 8.511467630043626} +{"Pretrain/Learning Rate": 4.056162931723154e-05, "Pretrain/Loss": 2.0620999336242676, "Pretrain/Loss (Raw)": 1.9462532997131348, "Pretrain/Step": 2933, "Pretrain/Step Time": 8.515100851655006} +{"Pretrain/Learning Rate": 4.055498384205987e-05, "Pretrain/Loss": 2.0627543926239014, "Pretrain/Loss (Raw)": 2.086824893951416, "Pretrain/Step": 2934, "Pretrain/Step Time": 8.517813770100474} +{"Pretrain/Learning Rate": 4.054833657301417e-05, "Pretrain/Loss": 2.0645828247070312, "Pretrain/Loss (Raw)": 2.1172139644622803, "Pretrain/Step": 2935, "Pretrain/Step Time": 8.519838301464915} +{"Pretrain/Learning Rate": 4.054168751086102e-05, "Pretrain/Loss": 2.0641894340515137, "Pretrain/Loss (Raw)": 2.148683547973633, "Pretrain/Step": 2936, "Pretrain/Step Time": 8.52457202039659} +{"Pretrain/Learning Rate": 4.053503665636724e-05, "Pretrain/Loss": 2.065683364868164, "Pretrain/Loss (Raw)": 2.154329299926758, "Pretrain/Step": 2937, "Pretrain/Step Time": 8.518295839428902} +{"Pretrain/Learning Rate": 4.052838401029984e-05, "Pretrain/Loss": 2.0650696754455566, "Pretrain/Loss (Raw)": 2.016768455505371, "Pretrain/Step": 2938, "Pretrain/Step Time": 8.509685168042779} +{"Pretrain/Learning Rate": 4.0521729573426006e-05, "Pretrain/Loss": 2.06150221824646, "Pretrain/Loss (Raw)": 2.0793874263763428, "Pretrain/Step": 2939, "Pretrain/Step Time": 8.50336898304522} +{"Pretrain/Learning Rate": 4.051507334651318e-05, "Pretrain/Loss": 2.060561180114746, "Pretrain/Loss (Raw)": 2.503394603729248, "Pretrain/Step": 2940, "Pretrain/Step Time": 8.505859108641744} +{"Pretrain/Learning Rate": 4.050841533032899e-05, "Pretrain/Loss": 2.06255841255188, "Pretrain/Loss (Raw)": 2.2962944507598877, "Pretrain/Step": 2941, "Pretrain/Step Time": 8.512166891247034} +{"Pretrain/Learning Rate": 4.050175552564127e-05, "Pretrain/Loss": 2.0614867210388184, "Pretrain/Loss (Raw)": 2.021204948425293, "Pretrain/Step": 2942, "Pretrain/Step Time": 8.518257537856698} +{"Pretrain/Learning Rate": 4.049509393321805e-05, "Pretrain/Loss": 2.0596275329589844, "Pretrain/Loss (Raw)": 1.8750272989273071, "Pretrain/Step": 2943, "Pretrain/Step Time": 8.515990812331438} +{"Pretrain/Learning Rate": 4.0488430553827585e-05, "Pretrain/Loss": 2.0626413822174072, "Pretrain/Loss (Raw)": 2.1977357864379883, "Pretrain/Step": 2944, "Pretrain/Step Time": 8.510197071358562} +{"Pretrain/Learning Rate": 4.0481765388238324e-05, "Pretrain/Loss": 2.06052827835083, "Pretrain/Loss (Raw)": 1.9441192150115967, "Pretrain/Step": 2945, "Pretrain/Step Time": 8.511160602793097} +{"Pretrain/Learning Rate": 4.047509843721893e-05, "Pretrain/Loss": 2.0587706565856934, "Pretrain/Loss (Raw)": 1.9332185983657837, "Pretrain/Step": 2946, "Pretrain/Step Time": 8.514727169647813} +{"Pretrain/Learning Rate": 4.0468429701538253e-05, "Pretrain/Loss": 2.0568792819976807, "Pretrain/Loss (Raw)": 2.0730433464050293, "Pretrain/Step": 2947, "Pretrain/Step Time": 8.514705907553434} +{"Pretrain/Learning Rate": 4.046175918196538e-05, "Pretrain/Loss": 2.0582733154296875, "Pretrain/Loss (Raw)": 2.1391382217407227, "Pretrain/Step": 2948, "Pretrain/Step Time": 8.514899592846632} +{"Pretrain/Learning Rate": 4.045508687926958e-05, "Pretrain/Loss": 2.0601463317871094, "Pretrain/Loss (Raw)": 2.0821444988250732, "Pretrain/Step": 2949, "Pretrain/Step Time": 8.513391183689237} +{"Pretrain/Learning Rate": 4.044841279422034e-05, "Pretrain/Loss": 2.0638785362243652, "Pretrain/Loss (Raw)": 2.27699875831604, "Pretrain/Step": 2950, "Pretrain/Step Time": 8.506128251552582} +{"Pretrain/Learning Rate": 4.044173692758733e-05, "Pretrain/Loss": 2.0636236667633057, "Pretrain/Loss (Raw)": 2.049135208129883, "Pretrain/Step": 2951, "Pretrain/Step Time": 8.505661107599735} +{"Pretrain/Learning Rate": 4.043505928014045e-05, "Pretrain/Loss": 2.0666441917419434, "Pretrain/Loss (Raw)": 2.3008761405944824, "Pretrain/Step": 2952, "Pretrain/Step Time": 8.504160072654486} +{"Pretrain/Learning Rate": 4.0428379852649816e-05, "Pretrain/Loss": 2.0661773681640625, "Pretrain/Loss (Raw)": 2.036203622817993, "Pretrain/Step": 2953, "Pretrain/Step Time": 8.510266961529851} +{"Pretrain/Learning Rate": 4.042169864588571e-05, "Pretrain/Loss": 2.0709667205810547, "Pretrain/Loss (Raw)": 2.615386724472046, "Pretrain/Step": 2954, "Pretrain/Step Time": 8.507884690538049} +{"Pretrain/Learning Rate": 4.041501566061865e-05, "Pretrain/Loss": 2.0729212760925293, "Pretrain/Loss (Raw)": 2.2942099571228027, "Pretrain/Step": 2955, "Pretrain/Step Time": 8.505154106765985} +{"Pretrain/Learning Rate": 4.040833089761934e-05, "Pretrain/Loss": 2.0729222297668457, "Pretrain/Loss (Raw)": 2.0783984661102295, "Pretrain/Step": 2956, "Pretrain/Step Time": 8.511635236442089} +{"Pretrain/Learning Rate": 4.040164435765871e-05, "Pretrain/Loss": 2.073637008666992, "Pretrain/Loss (Raw)": 2.1295371055603027, "Pretrain/Step": 2957, "Pretrain/Step Time": 8.505294824019074} +{"Pretrain/Learning Rate": 4.039495604150787e-05, "Pretrain/Loss": 2.0742685794830322, "Pretrain/Loss (Raw)": 2.293743133544922, "Pretrain/Step": 2958, "Pretrain/Step Time": 8.505677768960595} +{"Pretrain/Learning Rate": 4.0388265949938165e-05, "Pretrain/Loss": 2.0732479095458984, "Pretrain/Loss (Raw)": 2.1224162578582764, "Pretrain/Step": 2959, "Pretrain/Step Time": 8.508845524862409} +{"Pretrain/Learning Rate": 4.038157408372111e-05, "Pretrain/Loss": 2.0749599933624268, "Pretrain/Loss (Raw)": 2.133744955062866, "Pretrain/Step": 2960, "Pretrain/Step Time": 8.513512127101421} +{"Pretrain/Learning Rate": 4.037488044362846e-05, "Pretrain/Loss": 2.073777675628662, "Pretrain/Loss (Raw)": 1.9581794738769531, "Pretrain/Step": 2961, "Pretrain/Step Time": 8.510802825912833} +{"Pretrain/Learning Rate": 4.036818503043214e-05, "Pretrain/Loss": 2.0711755752563477, "Pretrain/Loss (Raw)": 1.9205535650253296, "Pretrain/Step": 2962, "Pretrain/Step Time": 8.510342482477427} +{"Pretrain/Learning Rate": 4.0361487844904314e-05, "Pretrain/Loss": 2.071803092956543, "Pretrain/Loss (Raw)": 2.030883550643921, "Pretrain/Step": 2963, "Pretrain/Step Time": 8.514638151973486} +{"Pretrain/Learning Rate": 4.035478888781732e-05, "Pretrain/Loss": 2.0732054710388184, "Pretrain/Loss (Raw)": 2.355564594268799, "Pretrain/Step": 2964, "Pretrain/Step Time": 8.511908367276192} +{"Pretrain/Learning Rate": 4.034808815994372e-05, "Pretrain/Loss": 2.072880268096924, "Pretrain/Loss (Raw)": 2.0339884757995605, "Pretrain/Step": 2965, "Pretrain/Step Time": 8.515315368771553} +{"Pretrain/Learning Rate": 4.0341385662056265e-05, "Pretrain/Loss": 2.0721256732940674, "Pretrain/Loss (Raw)": 2.0699214935302734, "Pretrain/Step": 2966, "Pretrain/Step Time": 8.519062675535679} +{"Pretrain/Learning Rate": 4.033468139492793e-05, "Pretrain/Loss": 2.071631908416748, "Pretrain/Loss (Raw)": 1.9870597124099731, "Pretrain/Step": 2967, "Pretrain/Step Time": 8.512019304558635} +{"Pretrain/Learning Rate": 4.032797535933187e-05, "Pretrain/Loss": 2.0716471672058105, "Pretrain/Loss (Raw)": 2.107391595840454, "Pretrain/Step": 2968, "Pretrain/Step Time": 8.506045838817954} +{"Pretrain/Learning Rate": 4.032126755604147e-05, "Pretrain/Loss": 2.070274591445923, "Pretrain/Loss (Raw)": 2.099560022354126, "Pretrain/Step": 2969, "Pretrain/Step Time": 8.510545257478952} +{"Pretrain/Learning Rate": 4.03145579858303e-05, "Pretrain/Loss": 2.068551540374756, "Pretrain/Loss (Raw)": 1.7760584354400635, "Pretrain/Step": 2970, "Pretrain/Step Time": 8.50819680467248} +{"Pretrain/Learning Rate": 4.0307846649472134e-05, "Pretrain/Loss": 2.067208766937256, "Pretrain/Loss (Raw)": 1.9553396701812744, "Pretrain/Step": 2971, "Pretrain/Step Time": 8.510556204244494} +{"Pretrain/Learning Rate": 4.030113354774096e-05, "Pretrain/Loss": 2.066551685333252, "Pretrain/Loss (Raw)": 1.9569785594940186, "Pretrain/Step": 2972, "Pretrain/Step Time": 8.514481347054243} +{"Pretrain/Learning Rate": 4.029441868141096e-05, "Pretrain/Loss": 2.0652546882629395, "Pretrain/Loss (Raw)": 2.0061392784118652, "Pretrain/Step": 2973, "Pretrain/Step Time": 8.509475195780396} +{"Pretrain/Learning Rate": 4.0287702051256535e-05, "Pretrain/Loss": 2.0653202533721924, "Pretrain/Loss (Raw)": 1.822481632232666, "Pretrain/Step": 2974, "Pretrain/Step Time": 8.499060722067952} +{"Pretrain/Learning Rate": 4.0280983658052276e-05, "Pretrain/Loss": 2.0672919750213623, "Pretrain/Loss (Raw)": 2.2963578701019287, "Pretrain/Step": 2975, "Pretrain/Step Time": 8.499798515811563} +{"Pretrain/Learning Rate": 4.0274263502572966e-05, "Pretrain/Loss": 2.0672783851623535, "Pretrain/Loss (Raw)": 2.066131114959717, "Pretrain/Step": 2976, "Pretrain/Step Time": 8.498936155810952} +{"Pretrain/Learning Rate": 4.026754158559362e-05, "Pretrain/Loss": 2.066554546356201, "Pretrain/Loss (Raw)": 2.005080461502075, "Pretrain/Step": 2977, "Pretrain/Step Time": 8.505808867514133} +{"Pretrain/Learning Rate": 4.026081790788943e-05, "Pretrain/Loss": 2.0677602291107178, "Pretrain/Loss (Raw)": 2.0417497158050537, "Pretrain/Step": 2978, "Pretrain/Step Time": 8.504488483071327} +{"Pretrain/Learning Rate": 4.025409247023581e-05, "Pretrain/Loss": 2.0687150955200195, "Pretrain/Loss (Raw)": 2.1322762966156006, "Pretrain/Step": 2979, "Pretrain/Step Time": 8.501071395352483} +{"Pretrain/Learning Rate": 4.0247365273408366e-05, "Pretrain/Loss": 2.069026231765747, "Pretrain/Loss (Raw)": 2.0131301879882812, "Pretrain/Step": 2980, "Pretrain/Step Time": 8.499662011861801} +{"Pretrain/Learning Rate": 4.024063631818291e-05, "Pretrain/Loss": 2.068300247192383, "Pretrain/Loss (Raw)": 1.9091359376907349, "Pretrain/Step": 2981, "Pretrain/Step Time": 8.499357597902417} +{"Pretrain/Learning Rate": 4.023390560533546e-05, "Pretrain/Loss": 2.06683087348938, "Pretrain/Loss (Raw)": 2.046919107437134, "Pretrain/Step": 2982, "Pretrain/Step Time": 8.509257793426514} +{"Pretrain/Learning Rate": 4.022717313564223e-05, "Pretrain/Loss": 2.065077781677246, "Pretrain/Loss (Raw)": 2.149721622467041, "Pretrain/Step": 2983, "Pretrain/Step Time": 8.507757583633065} +{"Pretrain/Learning Rate": 4.0220438909879644e-05, "Pretrain/Loss": 2.063995599746704, "Pretrain/Loss (Raw)": 1.8756769895553589, "Pretrain/Step": 2984, "Pretrain/Step Time": 8.511068869382143} +{"Pretrain/Learning Rate": 4.0213702928824315e-05, "Pretrain/Loss": 2.0655016899108887, "Pretrain/Loss (Raw)": 2.262101888656616, "Pretrain/Step": 2985, "Pretrain/Step Time": 8.507937164977193} +{"Pretrain/Learning Rate": 4.0206965193253075e-05, "Pretrain/Loss": 2.0656557083129883, "Pretrain/Loss (Raw)": 2.0135574340820312, "Pretrain/Step": 2986, "Pretrain/Step Time": 8.502013448625803} +{"Pretrain/Learning Rate": 4.0200225703942964e-05, "Pretrain/Loss": 2.064606189727783, "Pretrain/Loss (Raw)": 2.0290987491607666, "Pretrain/Step": 2987, "Pretrain/Step Time": 8.501553013920784} +{"Pretrain/Learning Rate": 4.0193484461671185e-05, "Pretrain/Loss": 2.0653786659240723, "Pretrain/Loss (Raw)": 2.1798179149627686, "Pretrain/Step": 2988, "Pretrain/Step Time": 8.507113950327039} +{"Pretrain/Learning Rate": 4.0186741467215186e-05, "Pretrain/Loss": 2.0652966499328613, "Pretrain/Loss (Raw)": 2.046940803527832, "Pretrain/Step": 2989, "Pretrain/Step Time": 8.510887069627643} +{"Pretrain/Learning Rate": 4.017999672135261e-05, "Pretrain/Loss": 2.0655288696289062, "Pretrain/Loss (Raw)": 2.1819868087768555, "Pretrain/Step": 2990, "Pretrain/Step Time": 8.5124298799783} +{"Pretrain/Learning Rate": 4.017325022486127e-05, "Pretrain/Loss": 2.067251682281494, "Pretrain/Loss (Raw)": 2.124896764755249, "Pretrain/Step": 2991, "Pretrain/Step Time": 8.513288926333189} +{"Pretrain/Learning Rate": 4.0166501978519225e-05, "Pretrain/Loss": 2.0680179595947266, "Pretrain/Loss (Raw)": 1.9929496049880981, "Pretrain/Step": 2992, "Pretrain/Step Time": 8.504586076363921} +{"Pretrain/Learning Rate": 4.015975198310469e-05, "Pretrain/Loss": 2.068721294403076, "Pretrain/Loss (Raw)": 2.029021739959717, "Pretrain/Step": 2993, "Pretrain/Step Time": 8.503434540703893} +{"Pretrain/Learning Rate": 4.0153000239396136e-05, "Pretrain/Loss": 2.0701205730438232, "Pretrain/Loss (Raw)": 2.121375322341919, "Pretrain/Step": 2994, "Pretrain/Step Time": 8.50901060923934} +{"Pretrain/Learning Rate": 4.014624674817218e-05, "Pretrain/Loss": 2.071047306060791, "Pretrain/Loss (Raw)": 2.096356153488159, "Pretrain/Step": 2995, "Pretrain/Step Time": 8.506685560569167} +{"Pretrain/Learning Rate": 4.0139491510211684e-05, "Pretrain/Loss": 2.0713553428649902, "Pretrain/Loss (Raw)": 1.8422348499298096, "Pretrain/Step": 2996, "Pretrain/Step Time": 8.507578995078802} +{"Pretrain/Learning Rate": 4.0132734526293685e-05, "Pretrain/Loss": 2.0702881813049316, "Pretrain/Loss (Raw)": 2.037414789199829, "Pretrain/Step": 2997, "Pretrain/Step Time": 8.498620226979256} +{"Pretrain/Learning Rate": 4.012597579719743e-05, "Pretrain/Loss": 2.069154977798462, "Pretrain/Loss (Raw)": 2.043022632598877, "Pretrain/Step": 2998, "Pretrain/Step Time": 8.497128006070852} +{"Pretrain/Learning Rate": 4.011921532370238e-05, "Pretrain/Loss": 2.070000171661377, "Pretrain/Loss (Raw)": 1.9947067499160767, "Pretrain/Step": 2999, "Pretrain/Step Time": 8.508734006434679} +{"Pretrain/Learning Rate": 4.0112453106588164e-05, "Pretrain/Loss": 2.0680501461029053, "Pretrain/Loss (Raw)": 1.930267095565796, "Pretrain/Step": 3000, "Pretrain/Step Time": 8.510910185053945} +{"Pretrain/Learning Rate": 4.010568914663465e-05, "Pretrain/Loss": 2.067519187927246, "Pretrain/Loss (Raw)": 1.903127908706665, "Pretrain/Step": 3001, "Pretrain/Step Time": 8.51479522511363} +{"Pretrain/Learning Rate": 4.0098923444621885e-05, "Pretrain/Loss": 2.0688281059265137, "Pretrain/Loss (Raw)": 1.848183035850525, "Pretrain/Step": 3002, "Pretrain/Step Time": 8.510264908894897} +{"Pretrain/Learning Rate": 4.0092156001330115e-05, "Pretrain/Loss": 2.0648038387298584, "Pretrain/Loss (Raw)": 1.728531837463379, "Pretrain/Step": 3003, "Pretrain/Step Time": 8.50653176009655} +{"Pretrain/Learning Rate": 4.00853868175398e-05, "Pretrain/Loss": 2.066448926925659, "Pretrain/Loss (Raw)": 2.1004858016967773, "Pretrain/Step": 3004, "Pretrain/Step Time": 8.504763701930642} +{"Pretrain/Learning Rate": 4.007861589403159e-05, "Pretrain/Loss": 2.0646138191223145, "Pretrain/Loss (Raw)": 1.9159103631973267, "Pretrain/Step": 3005, "Pretrain/Step Time": 8.508003858849406} +{"Pretrain/Learning Rate": 4.0071843231586345e-05, "Pretrain/Loss": 2.0657098293304443, "Pretrain/Loss (Raw)": 2.1523489952087402, "Pretrain/Step": 3006, "Pretrain/Step Time": 8.515598209574819} +{"Pretrain/Learning Rate": 4.006506883098512e-05, "Pretrain/Loss": 2.0662102699279785, "Pretrain/Loss (Raw)": 1.930159091949463, "Pretrain/Step": 3007, "Pretrain/Step Time": 8.525101888924837} +{"Pretrain/Learning Rate": 4.005829269300917e-05, "Pretrain/Loss": 2.0662612915039062, "Pretrain/Loss (Raw)": 1.9000117778778076, "Pretrain/Step": 3008, "Pretrain/Step Time": 8.523413209244609} +{"Pretrain/Learning Rate": 4.005151481843994e-05, "Pretrain/Loss": 2.0686144828796387, "Pretrain/Loss (Raw)": 2.1486120223999023, "Pretrain/Step": 3009, "Pretrain/Step Time": 8.517843011766672} +{"Pretrain/Learning Rate": 4.0044735208059104e-05, "Pretrain/Loss": 2.0690598487854004, "Pretrain/Loss (Raw)": 2.097445249557495, "Pretrain/Step": 3010, "Pretrain/Step Time": 8.51789584942162} +{"Pretrain/Learning Rate": 4.0037953862648504e-05, "Pretrain/Loss": 2.068340539932251, "Pretrain/Loss (Raw)": 2.0300111770629883, "Pretrain/Step": 3011, "Pretrain/Step Time": 8.52007881179452} +{"Pretrain/Learning Rate": 4.003117078299021e-05, "Pretrain/Loss": 2.066802978515625, "Pretrain/Loss (Raw)": 1.9546623229980469, "Pretrain/Step": 3012, "Pretrain/Step Time": 8.521528540179133} +{"Pretrain/Learning Rate": 4.002438596986647e-05, "Pretrain/Loss": 2.0687127113342285, "Pretrain/Loss (Raw)": 2.2512271404266357, "Pretrain/Step": 3013, "Pretrain/Step Time": 8.5244224909693} +{"Pretrain/Learning Rate": 4.001759942405974e-05, "Pretrain/Loss": 2.0678205490112305, "Pretrain/Loss (Raw)": 2.0006260871887207, "Pretrain/Step": 3014, "Pretrain/Step Time": 8.519208550453186} +{"Pretrain/Learning Rate": 4.001081114635268e-05, "Pretrain/Loss": 2.0653271675109863, "Pretrain/Loss (Raw)": 1.9301012754440308, "Pretrain/Step": 3015, "Pretrain/Step Time": 8.51234078221023} +{"Pretrain/Learning Rate": 4.000402113752815e-05, "Pretrain/Loss": 2.0677151679992676, "Pretrain/Loss (Raw)": 2.1628456115722656, "Pretrain/Step": 3016, "Pretrain/Step Time": 8.508196994662285} +{"Pretrain/Learning Rate": 3.9997229398369194e-05, "Pretrain/Loss": 2.070009708404541, "Pretrain/Loss (Raw)": 2.241671323776245, "Pretrain/Step": 3017, "Pretrain/Step Time": 8.517757628113031} +{"Pretrain/Learning Rate": 3.999043592965908e-05, "Pretrain/Loss": 2.0717625617980957, "Pretrain/Loss (Raw)": 2.204570770263672, "Pretrain/Step": 3018, "Pretrain/Step Time": 8.526979541406035} +{"Pretrain/Learning Rate": 3.998364073218126e-05, "Pretrain/Loss": 2.0713093280792236, "Pretrain/Loss (Raw)": 2.034433364868164, "Pretrain/Step": 3019, "Pretrain/Step Time": 8.531117796897888} +{"Pretrain/Learning Rate": 3.997684380671938e-05, "Pretrain/Loss": 2.070039749145508, "Pretrain/Loss (Raw)": 1.858827829360962, "Pretrain/Step": 3020, "Pretrain/Step Time": 8.527598654851317} +{"Pretrain/Learning Rate": 3.9970045154057304e-05, "Pretrain/Loss": 2.06964111328125, "Pretrain/Loss (Raw)": 2.0420029163360596, "Pretrain/Step": 3021, "Pretrain/Step Time": 8.519286075606942} +{"Pretrain/Learning Rate": 3.996324477497907e-05, "Pretrain/Loss": 2.0709776878356934, "Pretrain/Loss (Raw)": 1.982262134552002, "Pretrain/Step": 3022, "Pretrain/Step Time": 8.519174559041858} +{"Pretrain/Learning Rate": 3.9956442670268946e-05, "Pretrain/Loss": 2.072301149368286, "Pretrain/Loss (Raw)": 2.087390422821045, "Pretrain/Step": 3023, "Pretrain/Step Time": 8.519405085593462} +{"Pretrain/Learning Rate": 3.9949638840711376e-05, "Pretrain/Loss": 2.070497512817383, "Pretrain/Loss (Raw)": 1.9118762016296387, "Pretrain/Step": 3024, "Pretrain/Step Time": 8.522086737677455} +{"Pretrain/Learning Rate": 3.9942833287091006e-05, "Pretrain/Loss": 2.072150945663452, "Pretrain/Loss (Raw)": 2.4401583671569824, "Pretrain/Step": 3025, "Pretrain/Step Time": 8.521600911393762} +{"Pretrain/Learning Rate": 3.9936026010192696e-05, "Pretrain/Loss": 2.0726675987243652, "Pretrain/Loss (Raw)": 2.023101806640625, "Pretrain/Step": 3026, "Pretrain/Step Time": 8.515019720420241} +{"Pretrain/Learning Rate": 3.9929217010801476e-05, "Pretrain/Loss": 2.0675806999206543, "Pretrain/Loss (Raw)": 1.8717608451843262, "Pretrain/Step": 3027, "Pretrain/Step Time": 8.512235643342137} +{"Pretrain/Learning Rate": 3.992240628970261e-05, "Pretrain/Loss": 2.0689339637756348, "Pretrain/Loss (Raw)": 2.403533697128296, "Pretrain/Step": 3028, "Pretrain/Step Time": 8.511704230681062} +{"Pretrain/Learning Rate": 3.991559384768153e-05, "Pretrain/Loss": 2.0684125423431396, "Pretrain/Loss (Raw)": 2.0107011795043945, "Pretrain/Step": 3029, "Pretrain/Step Time": 8.518227074295282} +{"Pretrain/Learning Rate": 3.9908779685523885e-05, "Pretrain/Loss": 2.0693306922912598, "Pretrain/Loss (Raw)": 2.0678861141204834, "Pretrain/Step": 3030, "Pretrain/Step Time": 8.514991426840425} +{"Pretrain/Learning Rate": 3.9901963804015516e-05, "Pretrain/Loss": 2.069100856781006, "Pretrain/Loss (Raw)": 2.040553092956543, "Pretrain/Step": 3031, "Pretrain/Step Time": 8.511818712577224} +{"Pretrain/Learning Rate": 3.9895146203942457e-05, "Pretrain/Loss": 2.0673484802246094, "Pretrain/Loss (Raw)": 1.945496916770935, "Pretrain/Step": 3032, "Pretrain/Step Time": 8.5057680811733} +{"Pretrain/Learning Rate": 3.988832688609095e-05, "Pretrain/Loss": 2.0669281482696533, "Pretrain/Loss (Raw)": 2.037754535675049, "Pretrain/Step": 3033, "Pretrain/Step Time": 8.495295833796263} +{"Pretrain/Learning Rate": 3.988150585124743e-05, "Pretrain/Loss": 2.0690250396728516, "Pretrain/Loss (Raw)": 2.2739315032958984, "Pretrain/Step": 3034, "Pretrain/Step Time": 8.494463535025716} +{"Pretrain/Learning Rate": 3.987468310019853e-05, "Pretrain/Loss": 2.0700464248657227, "Pretrain/Loss (Raw)": 2.2080984115600586, "Pretrain/Step": 3035, "Pretrain/Step Time": 8.4921231623739} +{"Pretrain/Learning Rate": 3.986785863373109e-05, "Pretrain/Loss": 2.067692279815674, "Pretrain/Loss (Raw)": 1.8975635766983032, "Pretrain/Step": 3036, "Pretrain/Step Time": 8.502678215503693} +{"Pretrain/Learning Rate": 3.9861032452632124e-05, "Pretrain/Loss": 2.067809581756592, "Pretrain/Loss (Raw)": 1.9494335651397705, "Pretrain/Step": 3037, "Pretrain/Step Time": 8.510381370782852} +{"Pretrain/Learning Rate": 3.985420455768887e-05, "Pretrain/Loss": 2.066389799118042, "Pretrain/Loss (Raw)": 1.8500605821609497, "Pretrain/Step": 3038, "Pretrain/Step Time": 8.50954195484519} +{"Pretrain/Learning Rate": 3.9847374949688756e-05, "Pretrain/Loss": 2.066354751586914, "Pretrain/Loss (Raw)": 2.1517679691314697, "Pretrain/Step": 3039, "Pretrain/Step Time": 8.499897023662925} +{"Pretrain/Learning Rate": 3.98405436294194e-05, "Pretrain/Loss": 2.0650317668914795, "Pretrain/Loss (Raw)": 2.0506999492645264, "Pretrain/Step": 3040, "Pretrain/Step Time": 8.50656532868743} +{"Pretrain/Learning Rate": 3.9833710597668614e-05, "Pretrain/Loss": 2.0642154216766357, "Pretrain/Loss (Raw)": 2.012382984161377, "Pretrain/Step": 3041, "Pretrain/Step Time": 8.510037364438176} +{"Pretrain/Learning Rate": 3.9826875855224435e-05, "Pretrain/Loss": 2.0614843368530273, "Pretrain/Loss (Raw)": 1.9325124025344849, "Pretrain/Step": 3042, "Pretrain/Step Time": 8.512770757079124} +{"Pretrain/Learning Rate": 3.9820039402875055e-05, "Pretrain/Loss": 2.0594120025634766, "Pretrain/Loss (Raw)": 1.9296109676361084, "Pretrain/Step": 3043, "Pretrain/Step Time": 8.515806790441275} +{"Pretrain/Learning Rate": 3.98132012414089e-05, "Pretrain/Loss": 2.056410789489746, "Pretrain/Loss (Raw)": 1.8600252866744995, "Pretrain/Step": 3044, "Pretrain/Step Time": 8.509836126118898} +{"Pretrain/Learning Rate": 3.9806361371614576e-05, "Pretrain/Loss": 2.0562615394592285, "Pretrain/Loss (Raw)": 2.2552733421325684, "Pretrain/Step": 3045, "Pretrain/Step Time": 8.50431183166802} +{"Pretrain/Learning Rate": 3.979951979428089e-05, "Pretrain/Loss": 2.057182550430298, "Pretrain/Loss (Raw)": 2.095200300216675, "Pretrain/Step": 3046, "Pretrain/Step Time": 8.50955999828875} +{"Pretrain/Learning Rate": 3.9792676510196835e-05, "Pretrain/Loss": 2.0569210052490234, "Pretrain/Loss (Raw)": 2.125274658203125, "Pretrain/Step": 3047, "Pretrain/Step Time": 8.512208731845021} +{"Pretrain/Learning Rate": 3.978583152015163e-05, "Pretrain/Loss": 2.056046485900879, "Pretrain/Loss (Raw)": 2.027531623840332, "Pretrain/Step": 3048, "Pretrain/Step Time": 8.51429539732635} +{"Pretrain/Learning Rate": 3.977898482493466e-05, "Pretrain/Loss": 2.05672025680542, "Pretrain/Loss (Raw)": 2.1151204109191895, "Pretrain/Step": 3049, "Pretrain/Step Time": 8.513233963400126} +{"Pretrain/Learning Rate": 3.977213642533552e-05, "Pretrain/Loss": 2.0586538314819336, "Pretrain/Loss (Raw)": 2.2168362140655518, "Pretrain/Step": 3050, "Pretrain/Step Time": 8.505781263113022} +{"Pretrain/Learning Rate": 3.976528632214399e-05, "Pretrain/Loss": 2.056989908218384, "Pretrain/Loss (Raw)": 1.665482759475708, "Pretrain/Step": 3051, "Pretrain/Step Time": 8.499580141156912} +{"Pretrain/Learning Rate": 3.975843451615007e-05, "Pretrain/Loss": 2.05885648727417, "Pretrain/Loss (Raw)": 2.1741621494293213, "Pretrain/Step": 3052, "Pretrain/Step Time": 8.503155807033181} +{"Pretrain/Learning Rate": 3.9751581008143946e-05, "Pretrain/Loss": 2.0608420372009277, "Pretrain/Loss (Raw)": 2.223057985305786, "Pretrain/Step": 3053, "Pretrain/Step Time": 8.506412444636226} +{"Pretrain/Learning Rate": 3.9744725798915974e-05, "Pretrain/Loss": 2.061307668685913, "Pretrain/Loss (Raw)": 2.008108615875244, "Pretrain/Step": 3054, "Pretrain/Step Time": 8.508725313469768} +{"Pretrain/Learning Rate": 3.973786888925675e-05, "Pretrain/Loss": 2.061307191848755, "Pretrain/Loss (Raw)": 1.9852937459945679, "Pretrain/Step": 3055, "Pretrain/Step Time": 8.515072328969836} +{"Pretrain/Learning Rate": 3.973101027995704e-05, "Pretrain/Loss": 2.0609378814697266, "Pretrain/Loss (Raw)": 2.097308397293091, "Pretrain/Step": 3056, "Pretrain/Step Time": 8.50483562424779} +{"Pretrain/Learning Rate": 3.9724149971807814e-05, "Pretrain/Loss": 2.0619592666625977, "Pretrain/Loss (Raw)": 2.1608238220214844, "Pretrain/Step": 3057, "Pretrain/Step Time": 8.500481612980366} +{"Pretrain/Learning Rate": 3.9717287965600224e-05, "Pretrain/Loss": 2.0606956481933594, "Pretrain/Loss (Raw)": 2.0483927726745605, "Pretrain/Step": 3058, "Pretrain/Step Time": 8.495693072676659} +{"Pretrain/Learning Rate": 3.971042426212563e-05, "Pretrain/Loss": 2.059844732284546, "Pretrain/Loss (Raw)": 1.9987226724624634, "Pretrain/Step": 3059, "Pretrain/Step Time": 8.509288236498833} +{"Pretrain/Learning Rate": 3.970355886217561e-05, "Pretrain/Loss": 2.0637428760528564, "Pretrain/Loss (Raw)": 2.1006829738616943, "Pretrain/Step": 3060, "Pretrain/Step Time": 8.509667858481407} +{"Pretrain/Learning Rate": 3.9696691766541884e-05, "Pretrain/Loss": 2.0650768280029297, "Pretrain/Loss (Raw)": 2.117001533508301, "Pretrain/Step": 3061, "Pretrain/Step Time": 8.508804861456156} +{"Pretrain/Learning Rate": 3.968982297601641e-05, "Pretrain/Loss": 2.066878318786621, "Pretrain/Loss (Raw)": 2.317390203475952, "Pretrain/Step": 3062, "Pretrain/Step Time": 8.503849705681205} +{"Pretrain/Learning Rate": 3.9682952491391326e-05, "Pretrain/Loss": 2.066164016723633, "Pretrain/Loss (Raw)": 2.0257904529571533, "Pretrain/Step": 3063, "Pretrain/Step Time": 8.50281467474997} +{"Pretrain/Learning Rate": 3.967608031345898e-05, "Pretrain/Loss": 2.065168857574463, "Pretrain/Loss (Raw)": 2.0213186740875244, "Pretrain/Step": 3064, "Pretrain/Step Time": 8.500892754644156} +{"Pretrain/Learning Rate": 3.96692064430119e-05, "Pretrain/Loss": 2.0634655952453613, "Pretrain/Loss (Raw)": 1.9362947940826416, "Pretrain/Step": 3065, "Pretrain/Step Time": 8.507026579231024} +{"Pretrain/Learning Rate": 3.96623308808428e-05, "Pretrain/Loss": 2.0641355514526367, "Pretrain/Loss (Raw)": 2.1025516986846924, "Pretrain/Step": 3066, "Pretrain/Step Time": 8.513881148770452} +{"Pretrain/Learning Rate": 3.965545362774461e-05, "Pretrain/Loss": 2.0678582191467285, "Pretrain/Loss (Raw)": 2.5558700561523438, "Pretrain/Step": 3067, "Pretrain/Step Time": 8.517628414556384} +{"Pretrain/Learning Rate": 3.964857468451045e-05, "Pretrain/Loss": 2.0641345977783203, "Pretrain/Loss (Raw)": 2.026759147644043, "Pretrain/Step": 3068, "Pretrain/Step Time": 8.510706348344684} +{"Pretrain/Learning Rate": 3.9641694051933644e-05, "Pretrain/Loss": 2.060688018798828, "Pretrain/Loss (Raw)": 1.8551568984985352, "Pretrain/Step": 3069, "Pretrain/Step Time": 8.508450966328382} +{"Pretrain/Learning Rate": 3.963481173080767e-05, "Pretrain/Loss": 2.062070369720459, "Pretrain/Loss (Raw)": 2.1981146335601807, "Pretrain/Step": 3070, "Pretrain/Step Time": 8.501665027812123} +{"Pretrain/Learning Rate": 3.962792772192626e-05, "Pretrain/Loss": 2.064281463623047, "Pretrain/Loss (Raw)": 2.1580655574798584, "Pretrain/Step": 3071, "Pretrain/Step Time": 8.506009835749865} +{"Pretrain/Learning Rate": 3.962104202608329e-05, "Pretrain/Loss": 2.0638082027435303, "Pretrain/Loss (Raw)": 2.1371586322784424, "Pretrain/Step": 3072, "Pretrain/Step Time": 8.509710714221} +{"Pretrain/Learning Rate": 3.9614154644072854e-05, "Pretrain/Loss": 2.0635318756103516, "Pretrain/Loss (Raw)": 1.9087417125701904, "Pretrain/Step": 3073, "Pretrain/Step Time": 8.509152565151453} +{"Pretrain/Learning Rate": 3.960726557668924e-05, "Pretrain/Loss": 2.0638532638549805, "Pretrain/Loss (Raw)": 1.9743976593017578, "Pretrain/Step": 3074, "Pretrain/Step Time": 8.501579316332936} +{"Pretrain/Learning Rate": 3.960037482472694e-05, "Pretrain/Loss": 2.06492280960083, "Pretrain/Loss (Raw)": 2.2099111080169678, "Pretrain/Step": 3075, "Pretrain/Step Time": 8.5051439832896} +{"Pretrain/Learning Rate": 3.95934823889806e-05, "Pretrain/Loss": 2.0654406547546387, "Pretrain/Loss (Raw)": 2.2054173946380615, "Pretrain/Step": 3076, "Pretrain/Step Time": 8.51034819893539} +{"Pretrain/Learning Rate": 3.9586588270245115e-05, "Pretrain/Loss": 2.0645978450775146, "Pretrain/Loss (Raw)": 1.9742792844772339, "Pretrain/Step": 3077, "Pretrain/Step Time": 8.511917371302843} +{"Pretrain/Learning Rate": 3.957969246931553e-05, "Pretrain/Loss": 2.0628600120544434, "Pretrain/Loss (Raw)": 2.054555892944336, "Pretrain/Step": 3078, "Pretrain/Step Time": 8.514189302921295} +{"Pretrain/Learning Rate": 3.95727949869871e-05, "Pretrain/Loss": 2.061779022216797, "Pretrain/Loss (Raw)": 1.9107540845870972, "Pretrain/Step": 3079, "Pretrain/Step Time": 8.511780709028244} +{"Pretrain/Learning Rate": 3.95658958240553e-05, "Pretrain/Loss": 2.0598087310791016, "Pretrain/Loss (Raw)": 2.0486762523651123, "Pretrain/Step": 3080, "Pretrain/Step Time": 8.509668342769146} +{"Pretrain/Learning Rate": 3.955899498131575e-05, "Pretrain/Loss": 2.0598270893096924, "Pretrain/Loss (Raw)": 2.0385639667510986, "Pretrain/Step": 3081, "Pretrain/Step Time": 8.502347500994802} +{"Pretrain/Learning Rate": 3.9552092459564294e-05, "Pretrain/Loss": 2.056668758392334, "Pretrain/Loss (Raw)": 2.2111408710479736, "Pretrain/Step": 3082, "Pretrain/Step Time": 8.51438831537962} +{"Pretrain/Learning Rate": 3.9545188259596966e-05, "Pretrain/Loss": 2.0566606521606445, "Pretrain/Loss (Raw)": 2.2931394577026367, "Pretrain/Step": 3083, "Pretrain/Step Time": 8.517870331183076} +{"Pretrain/Learning Rate": 3.953828238220998e-05, "Pretrain/Loss": 2.0568175315856934, "Pretrain/Loss (Raw)": 2.0985093116760254, "Pretrain/Step": 3084, "Pretrain/Step Time": 8.516077687963843} +{"Pretrain/Learning Rate": 3.9531374828199774e-05, "Pretrain/Loss": 2.055751323699951, "Pretrain/Loss (Raw)": 1.9930270910263062, "Pretrain/Step": 3085, "Pretrain/Step Time": 8.519847644492984} +{"Pretrain/Learning Rate": 3.952446559836295e-05, "Pretrain/Loss": 2.053638458251953, "Pretrain/Loss (Raw)": 2.023298740386963, "Pretrain/Step": 3086, "Pretrain/Step Time": 8.514630829915404} +{"Pretrain/Learning Rate": 3.95175546934963e-05, "Pretrain/Loss": 2.0540168285369873, "Pretrain/Loss (Raw)": 2.170863151550293, "Pretrain/Step": 3087, "Pretrain/Step Time": 8.515793263912201} +{"Pretrain/Learning Rate": 3.951064211439684e-05, "Pretrain/Loss": 2.054272174835205, "Pretrain/Loss (Raw)": 2.1664328575134277, "Pretrain/Step": 3088, "Pretrain/Step Time": 8.513511287048459} +{"Pretrain/Learning Rate": 3.9503727861861756e-05, "Pretrain/Loss": 2.0550084114074707, "Pretrain/Loss (Raw)": 2.0523877143859863, "Pretrain/Step": 3089, "Pretrain/Step Time": 8.51168355718255} +{"Pretrain/Learning Rate": 3.9496811936688425e-05, "Pretrain/Loss": 2.0554847717285156, "Pretrain/Loss (Raw)": 1.9815874099731445, "Pretrain/Step": 3090, "Pretrain/Step Time": 8.509903874248266} +{"Pretrain/Learning Rate": 3.9489894339674435e-05, "Pretrain/Loss": 2.0540006160736084, "Pretrain/Loss (Raw)": 1.8408892154693604, "Pretrain/Step": 3091, "Pretrain/Step Time": 8.50861381366849} +{"Pretrain/Learning Rate": 3.948297507161756e-05, "Pretrain/Loss": 2.053065776824951, "Pretrain/Loss (Raw)": 2.235896587371826, "Pretrain/Step": 3092, "Pretrain/Step Time": 8.503843557089567} +{"Pretrain/Learning Rate": 3.947605413331574e-05, "Pretrain/Loss": 2.0528340339660645, "Pretrain/Loss (Raw)": 2.0043044090270996, "Pretrain/Step": 3093, "Pretrain/Step Time": 8.506506549194455} +{"Pretrain/Learning Rate": 3.946913152556715e-05, "Pretrain/Loss": 2.053241014480591, "Pretrain/Loss (Raw)": 2.1220333576202393, "Pretrain/Step": 3094, "Pretrain/Step Time": 8.50622257962823} +{"Pretrain/Learning Rate": 3.946220724917013e-05, "Pretrain/Loss": 2.054089069366455, "Pretrain/Loss (Raw)": 2.0955989360809326, "Pretrain/Step": 3095, "Pretrain/Step Time": 8.51117144152522} +{"Pretrain/Learning Rate": 3.945528130492322e-05, "Pretrain/Loss": 2.0548062324523926, "Pretrain/Loss (Raw)": 2.1992015838623047, "Pretrain/Step": 3096, "Pretrain/Step Time": 8.516244551166892} +{"Pretrain/Learning Rate": 3.944835369362516e-05, "Pretrain/Loss": 2.05424165725708, "Pretrain/Loss (Raw)": 2.0273048877716064, "Pretrain/Step": 3097, "Pretrain/Step Time": 8.514426490291953} +{"Pretrain/Learning Rate": 3.9441424416074866e-05, "Pretrain/Loss": 2.055345058441162, "Pretrain/Loss (Raw)": 1.9172903299331665, "Pretrain/Step": 3098, "Pretrain/Step Time": 8.511901112273335} +{"Pretrain/Learning Rate": 3.9434493473071456e-05, "Pretrain/Loss": 2.056457042694092, "Pretrain/Loss (Raw)": 2.0976686477661133, "Pretrain/Step": 3099, "Pretrain/Step Time": 8.513375826179981} +{"Pretrain/Learning Rate": 3.9427560865414246e-05, "Pretrain/Loss": 2.056896448135376, "Pretrain/Loss (Raw)": 2.0132124423980713, "Pretrain/Step": 3100, "Pretrain/Step Time": 8.51885656453669} +{"Pretrain/Learning Rate": 3.942062659390273e-05, "Pretrain/Loss": 2.056103229522705, "Pretrain/Loss (Raw)": 1.9046217203140259, "Pretrain/Step": 3101, "Pretrain/Step Time": 8.519491255283356} +{"Pretrain/Learning Rate": 3.94136906593366e-05, "Pretrain/Loss": 2.057455062866211, "Pretrain/Loss (Raw)": 1.9955276250839233, "Pretrain/Step": 3102, "Pretrain/Step Time": 8.52305588312447} +{"Pretrain/Learning Rate": 3.940675306251574e-05, "Pretrain/Loss": 2.0547971725463867, "Pretrain/Loss (Raw)": 1.9561083316802979, "Pretrain/Step": 3103, "Pretrain/Step Time": 8.52233194001019} +{"Pretrain/Learning Rate": 3.939981380424024e-05, "Pretrain/Loss": 2.0533928871154785, "Pretrain/Loss (Raw)": 1.8864001035690308, "Pretrain/Step": 3104, "Pretrain/Step Time": 8.52267205901444} +{"Pretrain/Learning Rate": 3.939287288531035e-05, "Pretrain/Loss": 2.053501605987549, "Pretrain/Loss (Raw)": 2.018975019454956, "Pretrain/Step": 3105, "Pretrain/Step Time": 8.522933462634683} +{"Pretrain/Learning Rate": 3.938593030652654e-05, "Pretrain/Loss": 2.0510241985321045, "Pretrain/Loss (Raw)": 1.7246757745742798, "Pretrain/Step": 3106, "Pretrain/Step Time": 8.520829046145082} +{"Pretrain/Learning Rate": 3.937898606868946e-05, "Pretrain/Loss": 2.050211191177368, "Pretrain/Loss (Raw)": 2.028207778930664, "Pretrain/Step": 3107, "Pretrain/Step Time": 8.522649953141809} +{"Pretrain/Learning Rate": 3.9372040172599956e-05, "Pretrain/Loss": 2.049747943878174, "Pretrain/Loss (Raw)": 1.9538482427597046, "Pretrain/Step": 3108, "Pretrain/Step Time": 8.517679804936051} +{"Pretrain/Learning Rate": 3.936509261905905e-05, "Pretrain/Loss": 2.0512630939483643, "Pretrain/Loss (Raw)": 2.103050470352173, "Pretrain/Step": 3109, "Pretrain/Step Time": 8.509993951767683} +{"Pretrain/Learning Rate": 3.935814340886797e-05, "Pretrain/Loss": 2.049290657043457, "Pretrain/Loss (Raw)": 1.7944670915603638, "Pretrain/Step": 3110, "Pretrain/Step Time": 8.501988992094994} +{"Pretrain/Learning Rate": 3.935119254282814e-05, "Pretrain/Loss": 2.04925799369812, "Pretrain/Loss (Raw)": 2.145519495010376, "Pretrain/Step": 3111, "Pretrain/Step Time": 8.50829542055726} +{"Pretrain/Learning Rate": 3.934424002174115e-05, "Pretrain/Loss": 2.051223039627075, "Pretrain/Loss (Raw)": 2.1272146701812744, "Pretrain/Step": 3112, "Pretrain/Step Time": 8.512634159997106} +{"Pretrain/Learning Rate": 3.9337285846408826e-05, "Pretrain/Loss": 2.050605297088623, "Pretrain/Loss (Raw)": 2.1830179691314697, "Pretrain/Step": 3113, "Pretrain/Step Time": 8.516548415645957} +{"Pretrain/Learning Rate": 3.9330330017633126e-05, "Pretrain/Loss": 2.052556037902832, "Pretrain/Loss (Raw)": 2.2632758617401123, "Pretrain/Step": 3114, "Pretrain/Step Time": 8.518778709694743} +{"Pretrain/Learning Rate": 3.932337253621624e-05, "Pretrain/Loss": 2.053490400314331, "Pretrain/Loss (Raw)": 2.1486899852752686, "Pretrain/Step": 3115, "Pretrain/Step Time": 8.515174489468336} +{"Pretrain/Learning Rate": 3.9316413402960553e-05, "Pretrain/Loss": 2.0521864891052246, "Pretrain/Loss (Raw)": 2.012887716293335, "Pretrain/Step": 3116, "Pretrain/Step Time": 8.507143812254071} +{"Pretrain/Learning Rate": 3.93094526186686e-05, "Pretrain/Loss": 2.0531041622161865, "Pretrain/Loss (Raw)": 2.164416790008545, "Pretrain/Step": 3117, "Pretrain/Step Time": 8.503885686397552} +{"Pretrain/Learning Rate": 3.930249018414315e-05, "Pretrain/Loss": 2.055084228515625, "Pretrain/Loss (Raw)": 2.4354355335235596, "Pretrain/Step": 3118, "Pretrain/Step Time": 8.512668941169977} +{"Pretrain/Learning Rate": 3.9295526100187126e-05, "Pretrain/Loss": 2.0546603202819824, "Pretrain/Loss (Raw)": 2.070619821548462, "Pretrain/Step": 3119, "Pretrain/Step Time": 8.520135255530477} +{"Pretrain/Learning Rate": 3.928856036760368e-05, "Pretrain/Loss": 2.0554957389831543, "Pretrain/Loss (Raw)": 2.099898099899292, "Pretrain/Step": 3120, "Pretrain/Step Time": 8.520193284377456} +{"Pretrain/Learning Rate": 3.9281592987196115e-05, "Pretrain/Loss": 2.057589054107666, "Pretrain/Loss (Raw)": 2.29695200920105, "Pretrain/Step": 3121, "Pretrain/Step Time": 8.512403812259436} +{"Pretrain/Learning Rate": 3.9274623959767945e-05, "Pretrain/Loss": 2.057013988494873, "Pretrain/Loss (Raw)": 2.0477778911590576, "Pretrain/Step": 3122, "Pretrain/Step Time": 8.50875560566783} +{"Pretrain/Learning Rate": 3.9267653286122886e-05, "Pretrain/Loss": 2.0570876598358154, "Pretrain/Loss (Raw)": 2.1058061122894287, "Pretrain/Step": 3123, "Pretrain/Step Time": 8.516001284122467} +{"Pretrain/Learning Rate": 3.9260680967064814e-05, "Pretrain/Loss": 2.059138298034668, "Pretrain/Loss (Raw)": 2.1047182083129883, "Pretrain/Step": 3124, "Pretrain/Step Time": 8.513716531917453} +{"Pretrain/Learning Rate": 3.9253707003397814e-05, "Pretrain/Loss": 2.059408187866211, "Pretrain/Loss (Raw)": 2.07194447517395, "Pretrain/Step": 3125, "Pretrain/Step Time": 8.516134021803737} +{"Pretrain/Learning Rate": 3.924673139592616e-05, "Pretrain/Loss": 2.05973744392395, "Pretrain/Loss (Raw)": 2.0851662158966064, "Pretrain/Step": 3126, "Pretrain/Step Time": 8.515661226585507} +{"Pretrain/Learning Rate": 3.9239754145454304e-05, "Pretrain/Loss": 2.0613327026367188, "Pretrain/Loss (Raw)": 2.1988940238952637, "Pretrain/Step": 3127, "Pretrain/Step Time": 8.505886914208531} +{"Pretrain/Learning Rate": 3.92327752527869e-05, "Pretrain/Loss": 2.060106039047241, "Pretrain/Loss (Raw)": 1.7732820510864258, "Pretrain/Step": 3128, "Pretrain/Step Time": 8.502197345718741} +{"Pretrain/Learning Rate": 3.922579471872879e-05, "Pretrain/Loss": 2.0612783432006836, "Pretrain/Loss (Raw)": 2.053163528442383, "Pretrain/Step": 3129, "Pretrain/Step Time": 8.502677142620087} +{"Pretrain/Learning Rate": 3.9218812544085004e-05, "Pretrain/Loss": 2.063607692718506, "Pretrain/Loss (Raw)": 2.146348714828491, "Pretrain/Step": 3130, "Pretrain/Step Time": 8.510618083178997} +{"Pretrain/Learning Rate": 3.921182872966075e-05, "Pretrain/Loss": 2.0642342567443848, "Pretrain/Loss (Raw)": 1.808737874031067, "Pretrain/Step": 3131, "Pretrain/Step Time": 8.511716641485691} +{"Pretrain/Learning Rate": 3.920484327626144e-05, "Pretrain/Loss": 2.063669204711914, "Pretrain/Loss (Raw)": 2.0281388759613037, "Pretrain/Step": 3132, "Pretrain/Step Time": 8.516018064692616} +{"Pretrain/Learning Rate": 3.919785618469266e-05, "Pretrain/Loss": 2.0643749237060547, "Pretrain/Loss (Raw)": 2.006254196166992, "Pretrain/Step": 3133, "Pretrain/Step Time": 8.507742699235678} +{"Pretrain/Learning Rate": 3.9190867455760213e-05, "Pretrain/Loss": 2.0617966651916504, "Pretrain/Loss (Raw)": 1.8223435878753662, "Pretrain/Step": 3134, "Pretrain/Step Time": 8.501240642741323} +{"Pretrain/Learning Rate": 3.918387709027005e-05, "Pretrain/Loss": 2.0643739700317383, "Pretrain/Loss (Raw)": 2.2600507736206055, "Pretrain/Step": 3135, "Pretrain/Step Time": 8.504435550421476} +{"Pretrain/Learning Rate": 3.917688508902835e-05, "Pretrain/Loss": 2.0654361248016357, "Pretrain/Loss (Raw)": 2.0359723567962646, "Pretrain/Step": 3136, "Pretrain/Step Time": 8.503781525418162} +{"Pretrain/Learning Rate": 3.916989145284146e-05, "Pretrain/Loss": 2.062432289123535, "Pretrain/Loss (Raw)": 1.76410973072052, "Pretrain/Step": 3137, "Pretrain/Step Time": 8.506875924766064} +{"Pretrain/Learning Rate": 3.9162896182515915e-05, "Pretrain/Loss": 2.0623981952667236, "Pretrain/Loss (Raw)": 2.09308123588562, "Pretrain/Step": 3138, "Pretrain/Step Time": 8.50630283728242} +{"Pretrain/Learning Rate": 3.9155899278858445e-05, "Pretrain/Loss": 2.0629220008850098, "Pretrain/Loss (Raw)": 2.0970733165740967, "Pretrain/Step": 3139, "Pretrain/Step Time": 8.50229330919683} +{"Pretrain/Learning Rate": 3.914890074267597e-05, "Pretrain/Loss": 2.0629374980926514, "Pretrain/Loss (Raw)": 1.956641674041748, "Pretrain/Step": 3140, "Pretrain/Step Time": 8.498450623825192} +{"Pretrain/Learning Rate": 3.914190057477558e-05, "Pretrain/Loss": 2.060901641845703, "Pretrain/Loss (Raw)": 1.9906325340270996, "Pretrain/Step": 3141, "Pretrain/Step Time": 8.503888346254826} +{"Pretrain/Learning Rate": 3.913489877596458e-05, "Pretrain/Loss": 2.0605008602142334, "Pretrain/Loss (Raw)": 1.9493019580841064, "Pretrain/Step": 3142, "Pretrain/Step Time": 8.509361701086164} +{"Pretrain/Learning Rate": 3.912789534705045e-05, "Pretrain/Loss": 2.06134295463562, "Pretrain/Loss (Raw)": 2.03790545463562, "Pretrain/Step": 3143, "Pretrain/Step Time": 8.50851453654468} +{"Pretrain/Learning Rate": 3.912089028884085e-05, "Pretrain/Loss": 2.060758590698242, "Pretrain/Loss (Raw)": 2.088066577911377, "Pretrain/Step": 3144, "Pretrain/Step Time": 8.511409474536777} +{"Pretrain/Learning Rate": 3.9113883602143645e-05, "Pretrain/Loss": 2.0577847957611084, "Pretrain/Loss (Raw)": 1.8610186576843262, "Pretrain/Step": 3145, "Pretrain/Step Time": 8.503034241497517} +{"Pretrain/Learning Rate": 3.910687528776688e-05, "Pretrain/Loss": 2.0556135177612305, "Pretrain/Loss (Raw)": 1.926648736000061, "Pretrain/Step": 3146, "Pretrain/Step Time": 8.493380343541503} +{"Pretrain/Learning Rate": 3.9099865346518786e-05, "Pretrain/Loss": 2.054917573928833, "Pretrain/Loss (Raw)": 1.9453374147415161, "Pretrain/Step": 3147, "Pretrain/Step Time": 8.497272549197078} +{"Pretrain/Learning Rate": 3.909285377920777e-05, "Pretrain/Loss": 2.056767463684082, "Pretrain/Loss (Raw)": 2.095606565475464, "Pretrain/Step": 3148, "Pretrain/Step Time": 8.500343160703778} +{"Pretrain/Learning Rate": 3.908584058664245e-05, "Pretrain/Loss": 2.0561318397521973, "Pretrain/Loss (Raw)": 1.96066153049469, "Pretrain/Step": 3149, "Pretrain/Step Time": 8.506158525124192} +{"Pretrain/Learning Rate": 3.907882576963162e-05, "Pretrain/Loss": 2.057161808013916, "Pretrain/Loss (Raw)": 2.114095687866211, "Pretrain/Step": 3150, "Pretrain/Step Time": 8.506675507873297} +{"Pretrain/Learning Rate": 3.907180932898427e-05, "Pretrain/Loss": 2.0580668449401855, "Pretrain/Loss (Raw)": 2.203233242034912, "Pretrain/Step": 3151, "Pretrain/Step Time": 8.498978301882744} +{"Pretrain/Learning Rate": 3.9064791265509546e-05, "Pretrain/Loss": 2.058786392211914, "Pretrain/Loss (Raw)": 2.0039784908294678, "Pretrain/Step": 3152, "Pretrain/Step Time": 8.502574222162366} +{"Pretrain/Learning Rate": 3.905777158001682e-05, "Pretrain/Loss": 2.0566978454589844, "Pretrain/Loss (Raw)": 2.1728262901306152, "Pretrain/Step": 3153, "Pretrain/Step Time": 8.500268103554845} +{"Pretrain/Learning Rate": 3.905075027331564e-05, "Pretrain/Loss": 2.054013252258301, "Pretrain/Loss (Raw)": 1.6794425249099731, "Pretrain/Step": 3154, "Pretrain/Step Time": 8.516946708783507} +{"Pretrain/Learning Rate": 3.9043727346215726e-05, "Pretrain/Loss": 2.055445909500122, "Pretrain/Loss (Raw)": 2.0551743507385254, "Pretrain/Step": 3155, "Pretrain/Step Time": 8.515422578901052} +{"Pretrain/Learning Rate": 3.9036702799527e-05, "Pretrain/Loss": 2.0528366565704346, "Pretrain/Loss (Raw)": 2.0695548057556152, "Pretrain/Step": 3156, "Pretrain/Step Time": 8.51311470195651} +{"Pretrain/Learning Rate": 3.902967663405956e-05, "Pretrain/Loss": 2.051640033721924, "Pretrain/Loss (Raw)": 1.8575310707092285, "Pretrain/Step": 3157, "Pretrain/Step Time": 8.50383130274713} +{"Pretrain/Learning Rate": 3.90226488506237e-05, "Pretrain/Loss": 2.0518531799316406, "Pretrain/Loss (Raw)": 2.0951449871063232, "Pretrain/Step": 3158, "Pretrain/Step Time": 8.509347027167678} +{"Pretrain/Learning Rate": 3.9015619450029904e-05, "Pretrain/Loss": 2.051499366760254, "Pretrain/Loss (Raw)": 1.9952654838562012, "Pretrain/Step": 3159, "Pretrain/Step Time": 8.517407773062587} +{"Pretrain/Learning Rate": 3.9008588433088825e-05, "Pretrain/Loss": 2.0533242225646973, "Pretrain/Loss (Raw)": 2.179108142852783, "Pretrain/Step": 3160, "Pretrain/Step Time": 8.523417364805937} +{"Pretrain/Learning Rate": 3.900155580061132e-05, "Pretrain/Loss": 2.051077365875244, "Pretrain/Loss (Raw)": 1.7501475811004639, "Pretrain/Step": 3161, "Pretrain/Step Time": 8.522939307615161} +{"Pretrain/Learning Rate": 3.899452155340842e-05, "Pretrain/Loss": 2.0489110946655273, "Pretrain/Loss (Raw)": 1.9966405630111694, "Pretrain/Step": 3162, "Pretrain/Step Time": 8.52424893155694} +{"Pretrain/Learning Rate": 3.898748569229135e-05, "Pretrain/Loss": 2.0485105514526367, "Pretrain/Loss (Raw)": 2.1568222045898438, "Pretrain/Step": 3163, "Pretrain/Step Time": 8.525488028302789} +{"Pretrain/Learning Rate": 3.898044821807152e-05, "Pretrain/Loss": 2.049985408782959, "Pretrain/Loss (Raw)": 2.0863795280456543, "Pretrain/Step": 3164, "Pretrain/Step Time": 8.516831746324897} +{"Pretrain/Learning Rate": 3.897340913156052e-05, "Pretrain/Loss": 2.051236867904663, "Pretrain/Loss (Raw)": 2.109593391418457, "Pretrain/Step": 3165, "Pretrain/Step Time": 8.511425079777837} +{"Pretrain/Learning Rate": 3.896636843357014e-05, "Pretrain/Loss": 2.0535030364990234, "Pretrain/Loss (Raw)": 2.1401288509368896, "Pretrain/Step": 3166, "Pretrain/Step Time": 8.513903819024563} +{"Pretrain/Learning Rate": 3.895932612491233e-05, "Pretrain/Loss": 2.055201292037964, "Pretrain/Loss (Raw)": 2.36913800239563, "Pretrain/Step": 3167, "Pretrain/Step Time": 8.521533524617553} +{"Pretrain/Learning Rate": 3.895228220639926e-05, "Pretrain/Loss": 2.05470609664917, "Pretrain/Loss (Raw)": 1.9873135089874268, "Pretrain/Step": 3168, "Pretrain/Step Time": 8.514385094866157} +{"Pretrain/Learning Rate": 3.8945236678843266e-05, "Pretrain/Loss": 2.054896831512451, "Pretrain/Loss (Raw)": 2.03682279586792, "Pretrain/Step": 3169, "Pretrain/Step Time": 8.516193006187677} +{"Pretrain/Learning Rate": 3.893818954305686e-05, "Pretrain/Loss": 2.0556228160858154, "Pretrain/Loss (Raw)": 2.0254225730895996, "Pretrain/Step": 3170, "Pretrain/Step Time": 8.51206306554377} +{"Pretrain/Learning Rate": 3.893114079985276e-05, "Pretrain/Loss": 2.0571060180664062, "Pretrain/Loss (Raw)": 2.1194748878479004, "Pretrain/Step": 3171, "Pretrain/Step Time": 8.51404794305563} +{"Pretrain/Learning Rate": 3.892409045004385e-05, "Pretrain/Loss": 2.059610605239868, "Pretrain/Loss (Raw)": 2.1806015968322754, "Pretrain/Step": 3172, "Pretrain/Step Time": 8.522958770394325} +{"Pretrain/Learning Rate": 3.891703849444322e-05, "Pretrain/Loss": 2.0593292713165283, "Pretrain/Loss (Raw)": 2.2192575931549072, "Pretrain/Step": 3173, "Pretrain/Step Time": 8.521967831999063} +{"Pretrain/Learning Rate": 3.890998493386414e-05, "Pretrain/Loss": 2.0584447383880615, "Pretrain/Loss (Raw)": 1.981988787651062, "Pretrain/Step": 3174, "Pretrain/Step Time": 8.519635554403067} +{"Pretrain/Learning Rate": 3.890292976912005e-05, "Pretrain/Loss": 2.059272289276123, "Pretrain/Loss (Raw)": 2.231205463409424, "Pretrain/Step": 3175, "Pretrain/Step Time": 8.515556905418634} +{"Pretrain/Learning Rate": 3.889587300102457e-05, "Pretrain/Loss": 2.063286304473877, "Pretrain/Loss (Raw)": 2.541313409805298, "Pretrain/Step": 3176, "Pretrain/Step Time": 8.515398610383272} +{"Pretrain/Learning Rate": 3.8888814630391556e-05, "Pretrain/Loss": 2.062458038330078, "Pretrain/Loss (Raw)": 2.009099006652832, "Pretrain/Step": 3177, "Pretrain/Step Time": 8.52130332030356} +{"Pretrain/Learning Rate": 3.8881754658034986e-05, "Pretrain/Loss": 2.061530113220215, "Pretrain/Loss (Raw)": 2.0980679988861084, "Pretrain/Step": 3178, "Pretrain/Step Time": 8.52704656124115} +{"Pretrain/Learning Rate": 3.8874693084769055e-05, "Pretrain/Loss": 2.0636448860168457, "Pretrain/Loss (Raw)": 1.9361701011657715, "Pretrain/Step": 3179, "Pretrain/Step Time": 8.530209358781576} +{"Pretrain/Learning Rate": 3.8867629911408135e-05, "Pretrain/Loss": 2.0621752738952637, "Pretrain/Loss (Raw)": 1.986079216003418, "Pretrain/Step": 3180, "Pretrain/Step Time": 8.523812133818865} +{"Pretrain/Learning Rate": 3.886056513876679e-05, "Pretrain/Loss": 2.060929775238037, "Pretrain/Loss (Raw)": 2.063617467880249, "Pretrain/Step": 3181, "Pretrain/Step Time": 8.519008673727512} +{"Pretrain/Learning Rate": 3.885349876765976e-05, "Pretrain/Loss": 2.0613644123077393, "Pretrain/Loss (Raw)": 2.0637221336364746, "Pretrain/Step": 3182, "Pretrain/Step Time": 8.52353453449905} +{"Pretrain/Learning Rate": 3.884643079890197e-05, "Pretrain/Loss": 2.062643051147461, "Pretrain/Loss (Raw)": 2.148972511291504, "Pretrain/Step": 3183, "Pretrain/Step Time": 8.52840630710125} +{"Pretrain/Learning Rate": 3.883936123330853e-05, "Pretrain/Loss": 2.0632452964782715, "Pretrain/Loss (Raw)": 2.1744019985198975, "Pretrain/Step": 3184, "Pretrain/Step Time": 8.53045017272234} +{"Pretrain/Learning Rate": 3.883229007169474e-05, "Pretrain/Loss": 2.061953067779541, "Pretrain/Loss (Raw)": 1.9954122304916382, "Pretrain/Step": 3185, "Pretrain/Step Time": 8.531714173033834} +{"Pretrain/Learning Rate": 3.8825217314876084e-05, "Pretrain/Loss": 2.06150484085083, "Pretrain/Loss (Raw)": 1.9910138845443726, "Pretrain/Step": 3186, "Pretrain/Step Time": 8.530926702544093} +{"Pretrain/Learning Rate": 3.881814296366822e-05, "Pretrain/Loss": 2.0597496032714844, "Pretrain/Loss (Raw)": 1.7740610837936401, "Pretrain/Step": 3187, "Pretrain/Step Time": 8.517444383352995} +{"Pretrain/Learning Rate": 3.881106701888699e-05, "Pretrain/Loss": 2.0584442615509033, "Pretrain/Loss (Raw)": 1.9335790872573853, "Pretrain/Step": 3188, "Pretrain/Step Time": 8.525286367163062} +{"Pretrain/Learning Rate": 3.880398948134845e-05, "Pretrain/Loss": 2.061612367630005, "Pretrain/Loss (Raw)": 2.5225257873535156, "Pretrain/Step": 3189, "Pretrain/Step Time": 8.52886462584138} +{"Pretrain/Learning Rate": 3.879691035186878e-05, "Pretrain/Loss": 2.0609915256500244, "Pretrain/Loss (Raw)": 2.23793888092041, "Pretrain/Step": 3190, "Pretrain/Step Time": 8.528272982686758} +{"Pretrain/Learning Rate": 3.8789829631264394e-05, "Pretrain/Loss": 2.0606913566589355, "Pretrain/Loss (Raw)": 1.9873450994491577, "Pretrain/Step": 3191, "Pretrain/Step Time": 8.529403652995825} +{"Pretrain/Learning Rate": 3.878274732035188e-05, "Pretrain/Loss": 2.061976432800293, "Pretrain/Loss (Raw)": 2.185805559158325, "Pretrain/Step": 3192, "Pretrain/Step Time": 8.529831415042281} +{"Pretrain/Learning Rate": 3.8775663419948e-05, "Pretrain/Loss": 2.062861442565918, "Pretrain/Loss (Raw)": 2.0496044158935547, "Pretrain/Step": 3193, "Pretrain/Step Time": 8.528892330825329} +{"Pretrain/Learning Rate": 3.87685779308697e-05, "Pretrain/Loss": 2.0625061988830566, "Pretrain/Loss (Raw)": 2.057072639465332, "Pretrain/Step": 3194, "Pretrain/Step Time": 8.520399076864123} +{"Pretrain/Learning Rate": 3.8761490853934115e-05, "Pretrain/Loss": 2.0580875873565674, "Pretrain/Loss (Raw)": 1.9902756214141846, "Pretrain/Step": 3195, "Pretrain/Step Time": 8.527652829885483} +{"Pretrain/Learning Rate": 3.875440218995856e-05, "Pretrain/Loss": 2.058574676513672, "Pretrain/Loss (Raw)": 2.0891292095184326, "Pretrain/Step": 3196, "Pretrain/Step Time": 8.5280797239393} +{"Pretrain/Learning Rate": 3.874731193976052e-05, "Pretrain/Loss": 2.063100814819336, "Pretrain/Loss (Raw)": 2.4344868659973145, "Pretrain/Step": 3197, "Pretrain/Step Time": 8.524008678272367} +{"Pretrain/Learning Rate": 3.87402201041577e-05, "Pretrain/Loss": 2.059922456741333, "Pretrain/Loss (Raw)": 1.7912689447402954, "Pretrain/Step": 3198, "Pretrain/Step Time": 8.52568719163537} +{"Pretrain/Learning Rate": 3.8733126683967946e-05, "Pretrain/Loss": 2.059328317642212, "Pretrain/Loss (Raw)": 2.082026958465576, "Pretrain/Step": 3199, "Pretrain/Step Time": 8.521266793832183} +{"Pretrain/Learning Rate": 3.872603168000931e-05, "Pretrain/Loss": 2.058159351348877, "Pretrain/Loss (Raw)": 1.987562894821167, "Pretrain/Step": 3200, "Pretrain/Step Time": 8.523277955129743} +{"Pretrain/Learning Rate": 3.871893509310003e-05, "Pretrain/Loss": 2.059673309326172, "Pretrain/Loss (Raw)": 2.102530002593994, "Pretrain/Step": 3201, "Pretrain/Step Time": 8.519626261666417} +{"Pretrain/Learning Rate": 3.87118369240585e-05, "Pretrain/Loss": 2.0609354972839355, "Pretrain/Loss (Raw)": 2.135913133621216, "Pretrain/Step": 3202, "Pretrain/Step Time": 8.525056393817067} +{"Pretrain/Learning Rate": 3.870473717370333e-05, "Pretrain/Loss": 2.060070514678955, "Pretrain/Loss (Raw)": 2.099210500717163, "Pretrain/Step": 3203, "Pretrain/Step Time": 8.522116415202618} +{"Pretrain/Learning Rate": 3.869763584285328e-05, "Pretrain/Loss": 2.0596189498901367, "Pretrain/Loss (Raw)": 2.147615432739258, "Pretrain/Step": 3204, "Pretrain/Step Time": 8.515100693330169} +{"Pretrain/Learning Rate": 3.869053293232733e-05, "Pretrain/Loss": 2.061232089996338, "Pretrain/Loss (Raw)": 2.1807634830474854, "Pretrain/Step": 3205, "Pretrain/Step Time": 8.514302760362625} +{"Pretrain/Learning Rate": 3.8683428442944604e-05, "Pretrain/Loss": 2.061027765274048, "Pretrain/Loss (Raw)": 2.0283889770507812, "Pretrain/Step": 3206, "Pretrain/Step Time": 8.512633826583624} +{"Pretrain/Learning Rate": 3.8676322375524435e-05, "Pretrain/Loss": 2.0628602504730225, "Pretrain/Loss (Raw)": 2.1453142166137695, "Pretrain/Step": 3207, "Pretrain/Step Time": 8.510500390082598} +{"Pretrain/Learning Rate": 3.866921473088632e-05, "Pretrain/Loss": 2.0628318786621094, "Pretrain/Loss (Raw)": 2.0450589656829834, "Pretrain/Step": 3208, "Pretrain/Step Time": 8.515026062726974} +{"Pretrain/Learning Rate": 3.866210550984996e-05, "Pretrain/Loss": 2.0633721351623535, "Pretrain/Loss (Raw)": 2.1077167987823486, "Pretrain/Step": 3209, "Pretrain/Step Time": 8.52135755494237} +{"Pretrain/Learning Rate": 3.86549947132352e-05, "Pretrain/Loss": 2.062406063079834, "Pretrain/Loss (Raw)": 2.0874645709991455, "Pretrain/Step": 3210, "Pretrain/Step Time": 8.507093515247107} +{"Pretrain/Learning Rate": 3.8647882341862115e-05, "Pretrain/Loss": 2.0610415935516357, "Pretrain/Loss (Raw)": 2.118495464324951, "Pretrain/Step": 3211, "Pretrain/Step Time": 8.510459074750543} +{"Pretrain/Learning Rate": 3.864076839655093e-05, "Pretrain/Loss": 2.0603795051574707, "Pretrain/Loss (Raw)": 2.013761520385742, "Pretrain/Step": 3212, "Pretrain/Step Time": 8.508246885612607} +{"Pretrain/Learning Rate": 3.863365287812205e-05, "Pretrain/Loss": 2.06154727935791, "Pretrain/Loss (Raw)": 2.1425282955169678, "Pretrain/Step": 3213, "Pretrain/Step Time": 8.507764551788568} +{"Pretrain/Learning Rate": 3.862653578739608e-05, "Pretrain/Loss": 2.0615406036376953, "Pretrain/Loss (Raw)": 2.022409200668335, "Pretrain/Step": 3214, "Pretrain/Step Time": 8.512961689382792} +{"Pretrain/Learning Rate": 3.861941712519379e-05, "Pretrain/Loss": 2.0613951683044434, "Pretrain/Loss (Raw)": 2.1522769927978516, "Pretrain/Step": 3215, "Pretrain/Step Time": 8.51026757992804} +{"Pretrain/Learning Rate": 3.8612296892336144e-05, "Pretrain/Loss": 2.0622501373291016, "Pretrain/Loss (Raw)": 2.275857448577881, "Pretrain/Step": 3216, "Pretrain/Step Time": 8.506506925448775} +{"Pretrain/Learning Rate": 3.8605175089644274e-05, "Pretrain/Loss": 2.0621447563171387, "Pretrain/Loss (Raw)": 2.0388870239257812, "Pretrain/Step": 3217, "Pretrain/Step Time": 8.506102837622166} +{"Pretrain/Learning Rate": 3.859805171793951e-05, "Pretrain/Loss": 2.0641133785247803, "Pretrain/Loss (Raw)": 2.233574390411377, "Pretrain/Step": 3218, "Pretrain/Step Time": 8.507369048893452} +{"Pretrain/Learning Rate": 3.8590926778043335e-05, "Pretrain/Loss": 2.0651473999023438, "Pretrain/Loss (Raw)": 1.9732528924942017, "Pretrain/Step": 3219, "Pretrain/Step Time": 8.50479555875063} +{"Pretrain/Learning Rate": 3.858380027077745e-05, "Pretrain/Loss": 2.064486265182495, "Pretrain/Loss (Raw)": 2.1512792110443115, "Pretrain/Step": 3220, "Pretrain/Step Time": 8.510784881189466} +{"Pretrain/Learning Rate": 3.8576672196963705e-05, "Pretrain/Loss": 2.0645132064819336, "Pretrain/Loss (Raw)": 2.0077297687530518, "Pretrain/Step": 3221, "Pretrain/Step Time": 8.506882471963763} +{"Pretrain/Learning Rate": 3.856954255742414e-05, "Pretrain/Loss": 2.0651235580444336, "Pretrain/Loss (Raw)": 2.2001774311065674, "Pretrain/Step": 3222, "Pretrain/Step Time": 8.505101105198264} +{"Pretrain/Learning Rate": 3.8562411352980996e-05, "Pretrain/Loss": 2.065260171890259, "Pretrain/Loss (Raw)": 2.113084316253662, "Pretrain/Step": 3223, "Pretrain/Step Time": 8.497492341324687} +{"Pretrain/Learning Rate": 3.8555278584456664e-05, "Pretrain/Loss": 2.0638675689697266, "Pretrain/Loss (Raw)": 2.0209524631500244, "Pretrain/Step": 3224, "Pretrain/Step Time": 8.49902101419866} +{"Pretrain/Learning Rate": 3.854814425267373e-05, "Pretrain/Loss": 2.068291664123535, "Pretrain/Loss (Raw)": 2.5935728549957275, "Pretrain/Step": 3225, "Pretrain/Step Time": 8.495134476572275} +{"Pretrain/Learning Rate": 3.8541008358454956e-05, "Pretrain/Loss": 2.0690715312957764, "Pretrain/Loss (Raw)": 2.0171287059783936, "Pretrain/Step": 3226, "Pretrain/Step Time": 8.501732893288136} +{"Pretrain/Learning Rate": 3.853387090262329e-05, "Pretrain/Loss": 2.070017099380493, "Pretrain/Loss (Raw)": 2.218684196472168, "Pretrain/Step": 3227, "Pretrain/Step Time": 8.500688510015607} +{"Pretrain/Learning Rate": 3.852673188600187e-05, "Pretrain/Loss": 2.0715041160583496, "Pretrain/Loss (Raw)": 2.203559637069702, "Pretrain/Step": 3228, "Pretrain/Step Time": 8.491188760846853} +{"Pretrain/Learning Rate": 3.851959130941398e-05, "Pretrain/Loss": 2.0728721618652344, "Pretrain/Loss (Raw)": 2.079706907272339, "Pretrain/Step": 3229, "Pretrain/Step Time": 8.489308133721352} +{"Pretrain/Learning Rate": 3.851244917368311e-05, "Pretrain/Loss": 2.0741019248962402, "Pretrain/Loss (Raw)": 2.152972459793091, "Pretrain/Step": 3230, "Pretrain/Step Time": 8.495597554370761} +{"Pretrain/Learning Rate": 3.8505305479632934e-05, "Pretrain/Loss": 2.0753579139709473, "Pretrain/Loss (Raw)": 2.1168625354766846, "Pretrain/Step": 3231, "Pretrain/Step Time": 8.499394746497273} +{"Pretrain/Learning Rate": 3.8498160228087284e-05, "Pretrain/Loss": 2.077669382095337, "Pretrain/Loss (Raw)": 2.182253837585449, "Pretrain/Step": 3232, "Pretrain/Step Time": 8.503761027008295} +{"Pretrain/Learning Rate": 3.8491013419870204e-05, "Pretrain/Loss": 2.077357769012451, "Pretrain/Loss (Raw)": 1.9791107177734375, "Pretrain/Step": 3233, "Pretrain/Step Time": 8.495017411187291} +{"Pretrain/Learning Rate": 3.848386505580588e-05, "Pretrain/Loss": 2.0790553092956543, "Pretrain/Loss (Raw)": 1.9419454336166382, "Pretrain/Step": 3234, "Pretrain/Step Time": 8.499575302004814} +{"Pretrain/Learning Rate": 3.84767151367187e-05, "Pretrain/Loss": 2.07903790473938, "Pretrain/Loss (Raw)": 2.025984287261963, "Pretrain/Step": 3235, "Pretrain/Step Time": 8.499127645045519} +{"Pretrain/Learning Rate": 3.846956366343322e-05, "Pretrain/Loss": 2.0799551010131836, "Pretrain/Loss (Raw)": 2.071255922317505, "Pretrain/Step": 3236, "Pretrain/Step Time": 8.504871267825365} +{"Pretrain/Learning Rate": 3.8462410636774196e-05, "Pretrain/Loss": 2.0800423622131348, "Pretrain/Loss (Raw)": 2.114213466644287, "Pretrain/Step": 3237, "Pretrain/Step Time": 8.513536751270294} +{"Pretrain/Learning Rate": 3.845525605756653e-05, "Pretrain/Loss": 2.082615852355957, "Pretrain/Loss (Raw)": 2.1238534450531006, "Pretrain/Step": 3238, "Pretrain/Step Time": 8.515179699286819} +{"Pretrain/Learning Rate": 3.844809992663534e-05, "Pretrain/Loss": 2.0826125144958496, "Pretrain/Loss (Raw)": 2.1451027393341064, "Pretrain/Step": 3239, "Pretrain/Step Time": 8.510012682527304} +{"Pretrain/Learning Rate": 3.844094224480589e-05, "Pretrain/Loss": 2.082378625869751, "Pretrain/Loss (Raw)": 2.0972700119018555, "Pretrain/Step": 3240, "Pretrain/Step Time": 8.507226729765534} +{"Pretrain/Learning Rate": 3.843378301290366e-05, "Pretrain/Loss": 2.082298994064331, "Pretrain/Loss (Raw)": 2.172830820083618, "Pretrain/Step": 3241, "Pretrain/Step Time": 8.50086148828268} +{"Pretrain/Learning Rate": 3.8426622231754255e-05, "Pretrain/Loss": 2.080461025238037, "Pretrain/Loss (Raw)": 2.028053045272827, "Pretrain/Step": 3242, "Pretrain/Step Time": 8.508543303236365} +{"Pretrain/Learning Rate": 3.8419459902183515e-05, "Pretrain/Loss": 2.0802645683288574, "Pretrain/Loss (Raw)": 2.123521566390991, "Pretrain/Step": 3243, "Pretrain/Step Time": 8.514337785542011} +{"Pretrain/Learning Rate": 3.841229602501742e-05, "Pretrain/Loss": 2.0806772708892822, "Pretrain/Loss (Raw)": 2.0657219886779785, "Pretrain/Step": 3244, "Pretrain/Step Time": 8.52086784131825} +{"Pretrain/Learning Rate": 3.840513060108214e-05, "Pretrain/Loss": 2.079216480255127, "Pretrain/Loss (Raw)": 1.977400541305542, "Pretrain/Step": 3245, "Pretrain/Step Time": 8.520882045850158} +{"Pretrain/Learning Rate": 3.8397963631204046e-05, "Pretrain/Loss": 2.075552225112915, "Pretrain/Loss (Raw)": 1.9664404392242432, "Pretrain/Step": 3246, "Pretrain/Step Time": 8.514521732926369} +{"Pretrain/Learning Rate": 3.8390795116209645e-05, "Pretrain/Loss": 2.0752434730529785, "Pretrain/Loss (Raw)": 2.0310781002044678, "Pretrain/Step": 3247, "Pretrain/Step Time": 8.503407195210457} +{"Pretrain/Learning Rate": 3.8383625056925654e-05, "Pretrain/Loss": 2.0758650302886963, "Pretrain/Loss (Raw)": 2.1794683933258057, "Pretrain/Step": 3248, "Pretrain/Step Time": 8.50990910641849} +{"Pretrain/Learning Rate": 3.837645345417895e-05, "Pretrain/Loss": 2.0738577842712402, "Pretrain/Loss (Raw)": 2.0400333404541016, "Pretrain/Step": 3249, "Pretrain/Step Time": 8.519451072439551} +{"Pretrain/Learning Rate": 3.836928030879661e-05, "Pretrain/Loss": 2.074547290802002, "Pretrain/Loss (Raw)": 2.136047124862671, "Pretrain/Step": 3250, "Pretrain/Step Time": 8.524283764883876} +{"Pretrain/Learning Rate": 3.8362105621605866e-05, "Pretrain/Loss": 2.074049472808838, "Pretrain/Loss (Raw)": 2.0420849323272705, "Pretrain/Step": 3251, "Pretrain/Step Time": 8.514588870108128} +{"Pretrain/Learning Rate": 3.835492939343413e-05, "Pretrain/Loss": 2.0723016262054443, "Pretrain/Loss (Raw)": 1.8809733390808105, "Pretrain/Step": 3252, "Pretrain/Step Time": 8.509963991120458} +{"Pretrain/Learning Rate": 3.834775162510901e-05, "Pretrain/Loss": 2.07171893119812, "Pretrain/Loss (Raw)": 1.9973613023757935, "Pretrain/Step": 3253, "Pretrain/Step Time": 8.516553863883018} +{"Pretrain/Learning Rate": 3.834057231745828e-05, "Pretrain/Loss": 2.0713086128234863, "Pretrain/Loss (Raw)": 2.0326554775238037, "Pretrain/Step": 3254, "Pretrain/Step Time": 8.516004674136639} +{"Pretrain/Learning Rate": 3.8333391471309884e-05, "Pretrain/Loss": 2.0713582038879395, "Pretrain/Loss (Raw)": 2.2052347660064697, "Pretrain/Step": 3255, "Pretrain/Step Time": 8.513088777661324} +{"Pretrain/Learning Rate": 3.8326209087491955e-05, "Pretrain/Loss": 2.0733907222747803, "Pretrain/Loss (Raw)": 2.0334489345550537, "Pretrain/Step": 3256, "Pretrain/Step Time": 8.526138780638576} +{"Pretrain/Learning Rate": 3.8319025166832794e-05, "Pretrain/Loss": 2.0738043785095215, "Pretrain/Loss (Raw)": 2.106105327606201, "Pretrain/Step": 3257, "Pretrain/Step Time": 8.520876314491034} +{"Pretrain/Learning Rate": 3.83118397101609e-05, "Pretrain/Loss": 2.069976329803467, "Pretrain/Loss (Raw)": 1.6563571691513062, "Pretrain/Step": 3258, "Pretrain/Step Time": 8.517849504947662} +{"Pretrain/Learning Rate": 3.830465271830491e-05, "Pretrain/Loss": 2.0697436332702637, "Pretrain/Loss (Raw)": 1.7789568901062012, "Pretrain/Step": 3259, "Pretrain/Step Time": 8.521184612065554} +{"Pretrain/Learning Rate": 3.829746419209369e-05, "Pretrain/Loss": 2.070352554321289, "Pretrain/Loss (Raw)": 2.106096029281616, "Pretrain/Step": 3260, "Pretrain/Step Time": 8.518735343590379} +{"Pretrain/Learning Rate": 3.829027413235623e-05, "Pretrain/Loss": 2.0703372955322266, "Pretrain/Loss (Raw)": 2.00429368019104, "Pretrain/Step": 3261, "Pretrain/Step Time": 8.531566690653563} +{"Pretrain/Learning Rate": 3.8283082539921735e-05, "Pretrain/Loss": 2.0708394050598145, "Pretrain/Loss (Raw)": 1.8866338729858398, "Pretrain/Step": 3262, "Pretrain/Step Time": 8.539496652781963} +{"Pretrain/Learning Rate": 3.827588941561956e-05, "Pretrain/Loss": 2.0687294006347656, "Pretrain/Loss (Raw)": 1.9899327754974365, "Pretrain/Step": 3263, "Pretrain/Step Time": 8.52716681919992} +{"Pretrain/Learning Rate": 3.826869476027927e-05, "Pretrain/Loss": 2.068796157836914, "Pretrain/Loss (Raw)": 2.0445146560668945, "Pretrain/Step": 3264, "Pretrain/Step Time": 8.528937503695488} +{"Pretrain/Learning Rate": 3.826149857473057e-05, "Pretrain/Loss": 2.070099353790283, "Pretrain/Loss (Raw)": 1.930916666984558, "Pretrain/Step": 3265, "Pretrain/Step Time": 8.528519222512841} +{"Pretrain/Learning Rate": 3.825430085980337e-05, "Pretrain/Loss": 2.069016456604004, "Pretrain/Loss (Raw)": 1.9544832706451416, "Pretrain/Step": 3266, "Pretrain/Step Time": 8.53208072297275} +{"Pretrain/Learning Rate": 3.8247101616327726e-05, "Pretrain/Loss": 2.0698394775390625, "Pretrain/Loss (Raw)": 2.202425956726074, "Pretrain/Step": 3267, "Pretrain/Step Time": 8.538950711488724} +{"Pretrain/Learning Rate": 3.823990084513391e-05, "Pretrain/Loss": 2.0698347091674805, "Pretrain/Loss (Raw)": 1.956009030342102, "Pretrain/Step": 3268, "Pretrain/Step Time": 8.544474061578512} +{"Pretrain/Learning Rate": 3.8232698547052345e-05, "Pretrain/Loss": 2.071089267730713, "Pretrain/Loss (Raw)": 2.1512105464935303, "Pretrain/Step": 3269, "Pretrain/Step Time": 8.540495738387108} +{"Pretrain/Learning Rate": 3.8225494722913624e-05, "Pretrain/Loss": 2.0720040798187256, "Pretrain/Loss (Raw)": 2.066444158554077, "Pretrain/Step": 3270, "Pretrain/Step Time": 8.537128921598196} +{"Pretrain/Learning Rate": 3.821828937354853e-05, "Pretrain/Loss": 2.0721449851989746, "Pretrain/Loss (Raw)": 2.0559163093566895, "Pretrain/Step": 3271, "Pretrain/Step Time": 8.533852081745863} +{"Pretrain/Learning Rate": 3.821108249978802e-05, "Pretrain/Loss": 2.0737907886505127, "Pretrain/Loss (Raw)": 2.298741340637207, "Pretrain/Step": 3272, "Pretrain/Step Time": 8.541597420349717} +{"Pretrain/Learning Rate": 3.8203874102463235e-05, "Pretrain/Loss": 2.0750019550323486, "Pretrain/Loss (Raw)": 2.0160255432128906, "Pretrain/Step": 3273, "Pretrain/Step Time": 8.548218382522464} +{"Pretrain/Learning Rate": 3.819666418240545e-05, "Pretrain/Loss": 2.074411153793335, "Pretrain/Loss (Raw)": 1.8510571718215942, "Pretrain/Step": 3274, "Pretrain/Step Time": 8.551269061863422} +{"Pretrain/Learning Rate": 3.818945274044618e-05, "Pretrain/Loss": 2.074289560317993, "Pretrain/Loss (Raw)": 1.9297525882720947, "Pretrain/Step": 3275, "Pretrain/Step Time": 8.541747661307454} +{"Pretrain/Learning Rate": 3.8182239777417066e-05, "Pretrain/Loss": 2.071235179901123, "Pretrain/Loss (Raw)": 1.7046518325805664, "Pretrain/Step": 3276, "Pretrain/Step Time": 8.538765313103795} +{"Pretrain/Learning Rate": 3.817502529414994e-05, "Pretrain/Loss": 2.0707926750183105, "Pretrain/Loss (Raw)": 1.9040201902389526, "Pretrain/Step": 3277, "Pretrain/Step Time": 8.534758415073156} +{"Pretrain/Learning Rate": 3.816780929147682e-05, "Pretrain/Loss": 2.0721325874328613, "Pretrain/Loss (Raw)": 2.285602331161499, "Pretrain/Step": 3278, "Pretrain/Step Time": 8.543215904384851} +{"Pretrain/Learning Rate": 3.816059177022988e-05, "Pretrain/Loss": 2.071878433227539, "Pretrain/Loss (Raw)": 2.1707193851470947, "Pretrain/Step": 3279, "Pretrain/Step Time": 8.544617760926485} +{"Pretrain/Learning Rate": 3.8153372731241486e-05, "Pretrain/Loss": 2.072303533554077, "Pretrain/Loss (Raw)": 2.0583748817443848, "Pretrain/Step": 3280, "Pretrain/Step Time": 8.541241992264986} +{"Pretrain/Learning Rate": 3.814615217534416e-05, "Pretrain/Loss": 2.071321964263916, "Pretrain/Loss (Raw)": 2.047187566757202, "Pretrain/Step": 3281, "Pretrain/Step Time": 8.54162348434329} +{"Pretrain/Learning Rate": 3.813893010337063e-05, "Pretrain/Loss": 2.074150800704956, "Pretrain/Loss (Raw)": 2.0415358543395996, "Pretrain/Step": 3282, "Pretrain/Step Time": 8.524863202124834} +{"Pretrain/Learning Rate": 3.813170651615376e-05, "Pretrain/Loss": 2.074061393737793, "Pretrain/Loss (Raw)": 2.043708562850952, "Pretrain/Step": 3283, "Pretrain/Step Time": 8.527990778908134} +{"Pretrain/Learning Rate": 3.8124481414526613e-05, "Pretrain/Loss": 2.0743110179901123, "Pretrain/Loss (Raw)": 2.101501226425171, "Pretrain/Step": 3284, "Pretrain/Step Time": 8.535011721774936} +{"Pretrain/Learning Rate": 3.811725479932243e-05, "Pretrain/Loss": 2.074765682220459, "Pretrain/Loss (Raw)": 1.915755271911621, "Pretrain/Step": 3285, "Pretrain/Step Time": 8.537088746204972} +{"Pretrain/Learning Rate": 3.8110026671374615e-05, "Pretrain/Loss": 2.0743634700775146, "Pretrain/Loss (Raw)": 2.043668270111084, "Pretrain/Step": 3286, "Pretrain/Step Time": 8.53617032803595} +{"Pretrain/Learning Rate": 3.810279703151674e-05, "Pretrain/Loss": 2.074382781982422, "Pretrain/Loss (Raw)": 1.9977275133132935, "Pretrain/Step": 3287, "Pretrain/Step Time": 8.529255483299494} +{"Pretrain/Learning Rate": 3.809556588058258e-05, "Pretrain/Loss": 2.0737662315368652, "Pretrain/Loss (Raw)": 2.1001908779144287, "Pretrain/Step": 3288, "Pretrain/Step Time": 8.521969744935632} +{"Pretrain/Learning Rate": 3.8088333219406046e-05, "Pretrain/Loss": 2.0764341354370117, "Pretrain/Loss (Raw)": 2.0916295051574707, "Pretrain/Step": 3289, "Pretrain/Step Time": 8.53492833673954} +{"Pretrain/Learning Rate": 3.808109904882126e-05, "Pretrain/Loss": 2.077021837234497, "Pretrain/Loss (Raw)": 2.0718729496002197, "Pretrain/Step": 3290, "Pretrain/Step Time": 8.535325225442648} +{"Pretrain/Learning Rate": 3.807386336966248e-05, "Pretrain/Loss": 2.076354503631592, "Pretrain/Loss (Raw)": 2.0714051723480225, "Pretrain/Step": 3291, "Pretrain/Step Time": 8.538575107231736} +{"Pretrain/Learning Rate": 3.8066626182764174e-05, "Pretrain/Loss": 2.0776078701019287, "Pretrain/Loss (Raw)": 2.246790885925293, "Pretrain/Step": 3292, "Pretrain/Step Time": 8.5386897418648} +{"Pretrain/Learning Rate": 3.805938748896097e-05, "Pretrain/Loss": 2.0776870250701904, "Pretrain/Loss (Raw)": 2.1197612285614014, "Pretrain/Step": 3293, "Pretrain/Step Time": 8.531792281195521} +{"Pretrain/Learning Rate": 3.805214728908765e-05, "Pretrain/Loss": 2.0782370567321777, "Pretrain/Loss (Raw)": 2.2105207443237305, "Pretrain/Step": 3294, "Pretrain/Step Time": 8.526931507512927} +{"Pretrain/Learning Rate": 3.804490558397922e-05, "Pretrain/Loss": 2.0755319595336914, "Pretrain/Loss (Raw)": 2.0228962898254395, "Pretrain/Step": 3295, "Pretrain/Step Time": 8.526797594502568} +{"Pretrain/Learning Rate": 3.803766237447079e-05, "Pretrain/Loss": 2.0773472785949707, "Pretrain/Loss (Raw)": 2.219665765762329, "Pretrain/Step": 3296, "Pretrain/Step Time": 8.52686158195138} +{"Pretrain/Learning Rate": 3.803041766139771e-05, "Pretrain/Loss": 2.077077865600586, "Pretrain/Loss (Raw)": 2.002302646636963, "Pretrain/Step": 3297, "Pretrain/Step Time": 8.52153635956347} +{"Pretrain/Learning Rate": 3.8023171445595464e-05, "Pretrain/Loss": 2.0770668983459473, "Pretrain/Loss (Raw)": 2.024040699005127, "Pretrain/Step": 3298, "Pretrain/Step Time": 8.522437522187829} +{"Pretrain/Learning Rate": 3.8015923727899714e-05, "Pretrain/Loss": 2.0747485160827637, "Pretrain/Loss (Raw)": 1.8227277994155884, "Pretrain/Step": 3299, "Pretrain/Step Time": 8.517277942970395} +{"Pretrain/Learning Rate": 3.8008674509146304e-05, "Pretrain/Loss": 2.0728256702423096, "Pretrain/Loss (Raw)": 1.934471845626831, "Pretrain/Step": 3300, "Pretrain/Step Time": 8.5080781057477} +{"Pretrain/Learning Rate": 3.800142379017127e-05, "Pretrain/Loss": 2.0730557441711426, "Pretrain/Loss (Raw)": 2.2486982345581055, "Pretrain/Step": 3301, "Pretrain/Step Time": 8.517863595858216} +{"Pretrain/Learning Rate": 3.799417157181076e-05, "Pretrain/Loss": 2.0730886459350586, "Pretrain/Loss (Raw)": 1.9862151145935059, "Pretrain/Step": 3302, "Pretrain/Step Time": 8.51360547915101} +{"Pretrain/Learning Rate": 3.798691785490115e-05, "Pretrain/Loss": 2.070455551147461, "Pretrain/Loss (Raw)": 1.8941766023635864, "Pretrain/Step": 3303, "Pretrain/Step Time": 8.513162288814783} +{"Pretrain/Learning Rate": 3.797966264027899e-05, "Pretrain/Loss": 2.0660324096679688, "Pretrain/Loss (Raw)": 1.9751651287078857, "Pretrain/Step": 3304, "Pretrain/Step Time": 8.512062326073647} +{"Pretrain/Learning Rate": 3.7972405928780974e-05, "Pretrain/Loss": 2.065765380859375, "Pretrain/Loss (Raw)": 1.9748904705047607, "Pretrain/Step": 3305, "Pretrain/Step Time": 8.507259014993906} +{"Pretrain/Learning Rate": 3.796514772124396e-05, "Pretrain/Loss": 2.065474033355713, "Pretrain/Loss (Raw)": 2.0607872009277344, "Pretrain/Step": 3306, "Pretrain/Step Time": 8.505376851186156} +{"Pretrain/Learning Rate": 3.795788801850504e-05, "Pretrain/Loss": 2.0658702850341797, "Pretrain/Loss (Raw)": 1.9868860244750977, "Pretrain/Step": 3307, "Pretrain/Step Time": 8.511083114892244} +{"Pretrain/Learning Rate": 3.7950626821401405e-05, "Pretrain/Loss": 2.066274404525757, "Pretrain/Loss (Raw)": 2.0377981662750244, "Pretrain/Step": 3308, "Pretrain/Step Time": 8.515209004282951} +{"Pretrain/Learning Rate": 3.794336413077045e-05, "Pretrain/Loss": 2.067305088043213, "Pretrain/Loss (Raw)": 2.195568323135376, "Pretrain/Step": 3309, "Pretrain/Step Time": 8.51658795401454} +{"Pretrain/Learning Rate": 3.793609994744977e-05, "Pretrain/Loss": 2.070120334625244, "Pretrain/Loss (Raw)": 2.424028158187866, "Pretrain/Step": 3310, "Pretrain/Step Time": 8.50992201268673} +{"Pretrain/Learning Rate": 3.792883427227707e-05, "Pretrain/Loss": 2.068233013153076, "Pretrain/Loss (Raw)": 1.907444953918457, "Pretrain/Step": 3311, "Pretrain/Step Time": 8.498404974117875} +{"Pretrain/Learning Rate": 3.7921567106090297e-05, "Pretrain/Loss": 2.0676560401916504, "Pretrain/Loss (Raw)": 2.1005077362060547, "Pretrain/Step": 3312, "Pretrain/Step Time": 8.506676057353616} +{"Pretrain/Learning Rate": 3.79142984497275e-05, "Pretrain/Loss": 2.0681958198547363, "Pretrain/Loss (Raw)": 2.064517021179199, "Pretrain/Step": 3313, "Pretrain/Step Time": 8.511187575757504} +{"Pretrain/Learning Rate": 3.790702830402696e-05, "Pretrain/Loss": 2.069056987762451, "Pretrain/Loss (Raw)": 2.101250410079956, "Pretrain/Step": 3314, "Pretrain/Step Time": 8.512838212773204} +{"Pretrain/Learning Rate": 3.7899756669827094e-05, "Pretrain/Loss": 2.0720374584198, "Pretrain/Loss (Raw)": 2.1555683612823486, "Pretrain/Step": 3315, "Pretrain/Step Time": 8.514446970075369} +{"Pretrain/Learning Rate": 3.789248354796651e-05, "Pretrain/Loss": 2.0735888481140137, "Pretrain/Loss (Raw)": 2.1321611404418945, "Pretrain/Step": 3316, "Pretrain/Step Time": 8.508794317021966} +{"Pretrain/Learning Rate": 3.788520893928396e-05, "Pretrain/Loss": 2.0693535804748535, "Pretrain/Loss (Raw)": 1.9803972244262695, "Pretrain/Step": 3317, "Pretrain/Step Time": 8.503539830446243} +{"Pretrain/Learning Rate": 3.78779328446184e-05, "Pretrain/Loss": 2.06772518157959, "Pretrain/Loss (Raw)": 2.029489278793335, "Pretrain/Step": 3318, "Pretrain/Step Time": 8.50157810561359} +{"Pretrain/Learning Rate": 3.7870655264808954e-05, "Pretrain/Loss": 2.0672056674957275, "Pretrain/Loss (Raw)": 1.9208738803863525, "Pretrain/Step": 3319, "Pretrain/Step Time": 8.507101384922862} +{"Pretrain/Learning Rate": 3.786337620069488e-05, "Pretrain/Loss": 2.0661778450012207, "Pretrain/Loss (Raw)": 2.0542473793029785, "Pretrain/Step": 3320, "Pretrain/Step Time": 8.51135129481554} +{"Pretrain/Learning Rate": 3.7856095653115655e-05, "Pretrain/Loss": 2.0655877590179443, "Pretrain/Loss (Raw)": 1.9740630388259888, "Pretrain/Step": 3321, "Pretrain/Step Time": 8.514368752017617} +{"Pretrain/Learning Rate": 3.7848813622910894e-05, "Pretrain/Loss": 2.0654406547546387, "Pretrain/Loss (Raw)": 2.038228988647461, "Pretrain/Step": 3322, "Pretrain/Step Time": 8.518110543489456} +{"Pretrain/Learning Rate": 3.784153011092041e-05, "Pretrain/Loss": 2.066512107849121, "Pretrain/Loss (Raw)": 2.127436876296997, "Pretrain/Step": 3323, "Pretrain/Step Time": 8.5099319498986} +{"Pretrain/Learning Rate": 3.7834245117984155e-05, "Pretrain/Loss": 2.0658888816833496, "Pretrain/Loss (Raw)": 2.0093555450439453, "Pretrain/Step": 3324, "Pretrain/Step Time": 8.509484490379691} +{"Pretrain/Learning Rate": 3.782695864494228e-05, "Pretrain/Loss": 2.063462257385254, "Pretrain/Loss (Raw)": 2.1238739490509033, "Pretrain/Step": 3325, "Pretrain/Step Time": 8.516993215307593} +{"Pretrain/Learning Rate": 3.781967069263509e-05, "Pretrain/Loss": 2.0662970542907715, "Pretrain/Loss (Raw)": 2.1541192531585693, "Pretrain/Step": 3326, "Pretrain/Step Time": 8.518857177346945} +{"Pretrain/Learning Rate": 3.781238126190306e-05, "Pretrain/Loss": 2.0661354064941406, "Pretrain/Loss (Raw)": 2.0613701343536377, "Pretrain/Step": 3327, "Pretrain/Step Time": 8.517267271876335} +{"Pretrain/Learning Rate": 3.780509035358686e-05, "Pretrain/Loss": 2.0678281784057617, "Pretrain/Loss (Raw)": 2.2042272090911865, "Pretrain/Step": 3328, "Pretrain/Step Time": 8.509488847106695} +{"Pretrain/Learning Rate": 3.77977979685273e-05, "Pretrain/Loss": 2.0659127235412598, "Pretrain/Loss (Raw)": 1.8573178052902222, "Pretrain/Step": 3329, "Pretrain/Step Time": 8.512035751715302} +{"Pretrain/Learning Rate": 3.7790504107565366e-05, "Pretrain/Loss": 2.0644538402557373, "Pretrain/Loss (Raw)": 1.9492018222808838, "Pretrain/Step": 3330, "Pretrain/Step Time": 8.506253181025386} +{"Pretrain/Learning Rate": 3.7783208771542237e-05, "Pretrain/Loss": 2.066253185272217, "Pretrain/Loss (Raw)": 2.329509973526001, "Pretrain/Step": 3331, "Pretrain/Step Time": 8.50992077589035} +{"Pretrain/Learning Rate": 3.7775911961299225e-05, "Pretrain/Loss": 2.0641918182373047, "Pretrain/Loss (Raw)": 1.8837751150131226, "Pretrain/Step": 3332, "Pretrain/Step Time": 8.512795763090253} +{"Pretrain/Learning Rate": 3.776861367767785e-05, "Pretrain/Loss": 2.063505172729492, "Pretrain/Loss (Raw)": 2.092858076095581, "Pretrain/Step": 3333, "Pretrain/Step Time": 8.511734457686543} +{"Pretrain/Learning Rate": 3.776131392151978e-05, "Pretrain/Loss": 2.063709259033203, "Pretrain/Loss (Raw)": 2.0545406341552734, "Pretrain/Step": 3334, "Pretrain/Step Time": 8.515146747231483} +{"Pretrain/Learning Rate": 3.775401269366685e-05, "Pretrain/Loss": 2.0632247924804688, "Pretrain/Loss (Raw)": 2.0832934379577637, "Pretrain/Step": 3335, "Pretrain/Step Time": 8.515051247552037} +{"Pretrain/Learning Rate": 3.7746709994961085e-05, "Pretrain/Loss": 2.0642848014831543, "Pretrain/Loss (Raw)": 2.1807143688201904, "Pretrain/Step": 3336, "Pretrain/Step Time": 8.511682754382491} +{"Pretrain/Learning Rate": 3.7739405826244645e-05, "Pretrain/Loss": 2.063832998275757, "Pretrain/Loss (Raw)": 2.0498974323272705, "Pretrain/Step": 3337, "Pretrain/Step Time": 8.50749790109694} +{"Pretrain/Learning Rate": 3.773210018835991e-05, "Pretrain/Loss": 2.064384937286377, "Pretrain/Loss (Raw)": 2.158125638961792, "Pretrain/Step": 3338, "Pretrain/Step Time": 8.508211091160774} +{"Pretrain/Learning Rate": 3.772479308214937e-05, "Pretrain/Loss": 2.0635910034179688, "Pretrain/Loss (Raw)": 2.016838312149048, "Pretrain/Step": 3339, "Pretrain/Step Time": 8.508984874933958} +{"Pretrain/Learning Rate": 3.771748450845575e-05, "Pretrain/Loss": 2.0625176429748535, "Pretrain/Loss (Raw)": 1.8763785362243652, "Pretrain/Step": 3340, "Pretrain/Step Time": 8.514078449457884} +{"Pretrain/Learning Rate": 3.771017446812187e-05, "Pretrain/Loss": 2.0629100799560547, "Pretrain/Loss (Raw)": 2.1927645206451416, "Pretrain/Step": 3341, "Pretrain/Step Time": 8.514251738786697} +{"Pretrain/Learning Rate": 3.770286296199079e-05, "Pretrain/Loss": 2.0637245178222656, "Pretrain/Loss (Raw)": 2.1266818046569824, "Pretrain/Step": 3342, "Pretrain/Step Time": 8.50829353928566} +{"Pretrain/Learning Rate": 3.7695549990905694e-05, "Pretrain/Loss": 2.0616464614868164, "Pretrain/Loss (Raw)": 1.8862890005111694, "Pretrain/Step": 3343, "Pretrain/Step Time": 8.509249243885279} +{"Pretrain/Learning Rate": 3.768823555570995e-05, "Pretrain/Loss": 2.059032678604126, "Pretrain/Loss (Raw)": 1.9412744045257568, "Pretrain/Step": 3344, "Pretrain/Step Time": 8.509090960025787} +{"Pretrain/Learning Rate": 3.768091965724709e-05, "Pretrain/Loss": 2.060192584991455, "Pretrain/Loss (Raw)": 2.1873672008514404, "Pretrain/Step": 3345, "Pretrain/Step Time": 8.512451043352485} +{"Pretrain/Learning Rate": 3.767360229636082e-05, "Pretrain/Loss": 2.056307792663574, "Pretrain/Loss (Raw)": 1.7363073825836182, "Pretrain/Step": 3346, "Pretrain/Step Time": 8.520591160282493} +{"Pretrain/Learning Rate": 3.7666283473895014e-05, "Pretrain/Loss": 2.0560567378997803, "Pretrain/Loss (Raw)": 1.9411181211471558, "Pretrain/Step": 3347, "Pretrain/Step Time": 8.519998217001557} +{"Pretrain/Learning Rate": 3.765896319069372e-05, "Pretrain/Loss": 2.0541670322418213, "Pretrain/Loss (Raw)": 1.9093965291976929, "Pretrain/Step": 3348, "Pretrain/Step Time": 8.514994891360402} +{"Pretrain/Learning Rate": 3.7651641447601126e-05, "Pretrain/Loss": 2.054349899291992, "Pretrain/Loss (Raw)": 2.031120777130127, "Pretrain/Step": 3349, "Pretrain/Step Time": 8.514310313388705} +{"Pretrain/Learning Rate": 3.764431824546163e-05, "Pretrain/Loss": 2.0513813495635986, "Pretrain/Loss (Raw)": 1.8202152252197266, "Pretrain/Step": 3350, "Pretrain/Step Time": 8.51234757900238} +{"Pretrain/Learning Rate": 3.7636993585119775e-05, "Pretrain/Loss": 2.0511651039123535, "Pretrain/Loss (Raw)": 2.085419178009033, "Pretrain/Step": 3351, "Pretrain/Step Time": 8.5131273008883} +{"Pretrain/Learning Rate": 3.762966746742027e-05, "Pretrain/Loss": 2.0516457557678223, "Pretrain/Loss (Raw)": 2.0824506282806396, "Pretrain/Step": 3352, "Pretrain/Step Time": 8.51557619124651} +{"Pretrain/Learning Rate": 3.7622339893208e-05, "Pretrain/Loss": 2.0454602241516113, "Pretrain/Loss (Raw)": 1.8018473386764526, "Pretrain/Step": 3353, "Pretrain/Step Time": 8.515441032126546} +{"Pretrain/Learning Rate": 3.761501086332802e-05, "Pretrain/Loss": 2.045779228210449, "Pretrain/Loss (Raw)": 2.0579421520233154, "Pretrain/Step": 3354, "Pretrain/Step Time": 8.507934650406241} +{"Pretrain/Learning Rate": 3.760768037862553e-05, "Pretrain/Loss": 2.0440597534179688, "Pretrain/Loss (Raw)": 1.9985978603363037, "Pretrain/Step": 3355, "Pretrain/Step Time": 8.507442532107234} +{"Pretrain/Learning Rate": 3.760034843994594e-05, "Pretrain/Loss": 2.0439870357513428, "Pretrain/Loss (Raw)": 2.194261312484741, "Pretrain/Step": 3356, "Pretrain/Step Time": 8.512360213324428} +{"Pretrain/Learning Rate": 3.7593015048134794e-05, "Pretrain/Loss": 2.0425491333007812, "Pretrain/Loss (Raw)": 1.8956594467163086, "Pretrain/Step": 3357, "Pretrain/Step Time": 8.515440249815583} +{"Pretrain/Learning Rate": 3.758568020403781e-05, "Pretrain/Loss": 2.0427157878875732, "Pretrain/Loss (Raw)": 2.174311399459839, "Pretrain/Step": 3358, "Pretrain/Step Time": 8.51019754074514} +{"Pretrain/Learning Rate": 3.757834390850088e-05, "Pretrain/Loss": 2.0425286293029785, "Pretrain/Loss (Raw)": 2.0928916931152344, "Pretrain/Step": 3359, "Pretrain/Step Time": 8.508797489106655} +{"Pretrain/Learning Rate": 3.7571006162370056e-05, "Pretrain/Loss": 2.0411784648895264, "Pretrain/Loss (Raw)": 2.009432792663574, "Pretrain/Step": 3360, "Pretrain/Step Time": 8.502820383757353} +{"Pretrain/Learning Rate": 3.7563666966491564e-05, "Pretrain/Loss": 2.0409886837005615, "Pretrain/Loss (Raw)": 1.954803228378296, "Pretrain/Step": 3361, "Pretrain/Step Time": 8.50694677978754} +{"Pretrain/Learning Rate": 3.7556326321711796e-05, "Pretrain/Loss": 2.042802095413208, "Pretrain/Loss (Raw)": 2.174069881439209, "Pretrain/Step": 3362, "Pretrain/Step Time": 8.5050945635885} +{"Pretrain/Learning Rate": 3.7548984228877313e-05, "Pretrain/Loss": 2.0436716079711914, "Pretrain/Loss (Raw)": 2.1372907161712646, "Pretrain/Step": 3363, "Pretrain/Step Time": 8.510684607550502} +{"Pretrain/Learning Rate": 3.754164068883484e-05, "Pretrain/Loss": 2.043931007385254, "Pretrain/Loss (Raw)": 2.1044678688049316, "Pretrain/Step": 3364, "Pretrain/Step Time": 8.506250081583858} +{"Pretrain/Learning Rate": 3.7534295702431254e-05, "Pretrain/Loss": 2.0438454151153564, "Pretrain/Loss (Raw)": 2.1032350063323975, "Pretrain/Step": 3365, "Pretrain/Step Time": 8.502311607822776} +{"Pretrain/Learning Rate": 3.7526949270513635e-05, "Pretrain/Loss": 2.043527126312256, "Pretrain/Loss (Raw)": 2.083134651184082, "Pretrain/Step": 3366, "Pretrain/Step Time": 8.50099011324346} +{"Pretrain/Learning Rate": 3.751960139392919e-05, "Pretrain/Loss": 2.0447723865509033, "Pretrain/Loss (Raw)": 2.3044795989990234, "Pretrain/Step": 3367, "Pretrain/Step Time": 8.497833397239447} +{"Pretrain/Learning Rate": 3.7512252073525325e-05, "Pretrain/Loss": 2.0444254875183105, "Pretrain/Loss (Raw)": 2.052861452102661, "Pretrain/Step": 3368, "Pretrain/Step Time": 8.49686106108129} +{"Pretrain/Learning Rate": 3.7504901310149574e-05, "Pretrain/Loss": 2.0435984134674072, "Pretrain/Loss (Raw)": 2.0669822692871094, "Pretrain/Step": 3369, "Pretrain/Step Time": 8.503148885443807} +{"Pretrain/Learning Rate": 3.74975491046497e-05, "Pretrain/Loss": 2.044063091278076, "Pretrain/Loss (Raw)": 2.0875024795532227, "Pretrain/Step": 3370, "Pretrain/Step Time": 8.493759658187628} +{"Pretrain/Learning Rate": 3.7490195457873555e-05, "Pretrain/Loss": 2.0426788330078125, "Pretrain/Loss (Raw)": 1.9463653564453125, "Pretrain/Step": 3371, "Pretrain/Step Time": 8.488512467592955} +{"Pretrain/Learning Rate": 3.748284037066922e-05, "Pretrain/Loss": 2.0423991680145264, "Pretrain/Loss (Raw)": 2.0299265384674072, "Pretrain/Step": 3372, "Pretrain/Step Time": 8.483456192538142} +{"Pretrain/Learning Rate": 3.7475483843884916e-05, "Pretrain/Loss": 2.041374444961548, "Pretrain/Loss (Raw)": 1.846240758895874, "Pretrain/Step": 3373, "Pretrain/Step Time": 8.484082320705056} +{"Pretrain/Learning Rate": 3.746812587836903e-05, "Pretrain/Loss": 2.042490005493164, "Pretrain/Loss (Raw)": 2.1092238426208496, "Pretrain/Step": 3374, "Pretrain/Step Time": 8.48923210427165} +{"Pretrain/Learning Rate": 3.746076647497011e-05, "Pretrain/Loss": 2.0415706634521484, "Pretrain/Loss (Raw)": 1.9134018421173096, "Pretrain/Step": 3375, "Pretrain/Step Time": 8.492181746289134} +{"Pretrain/Learning Rate": 3.7453405634536894e-05, "Pretrain/Loss": 2.040477752685547, "Pretrain/Loss (Raw)": 2.0395901203155518, "Pretrain/Step": 3376, "Pretrain/Step Time": 8.484803618863225} +{"Pretrain/Learning Rate": 3.744604335791825e-05, "Pretrain/Loss": 2.0420587062835693, "Pretrain/Loss (Raw)": 2.2423744201660156, "Pretrain/Step": 3377, "Pretrain/Step Time": 8.475253090262413} +{"Pretrain/Learning Rate": 3.743867964596324e-05, "Pretrain/Loss": 2.041347026824951, "Pretrain/Loss (Raw)": 2.044975996017456, "Pretrain/Step": 3378, "Pretrain/Step Time": 8.472383068874478} +{"Pretrain/Learning Rate": 3.743131449952107e-05, "Pretrain/Loss": 2.0408079624176025, "Pretrain/Loss (Raw)": 1.9730712175369263, "Pretrain/Step": 3379, "Pretrain/Step Time": 8.478525256738067} +{"Pretrain/Learning Rate": 3.7423947919441147e-05, "Pretrain/Loss": 2.04213809967041, "Pretrain/Loss (Raw)": 2.0512337684631348, "Pretrain/Step": 3380, "Pretrain/Step Time": 8.484661495313048} +{"Pretrain/Learning Rate": 3.7416579906573e-05, "Pretrain/Loss": 2.0428242683410645, "Pretrain/Loss (Raw)": 2.085197925567627, "Pretrain/Step": 3381, "Pretrain/Step Time": 8.476593602448702} +{"Pretrain/Learning Rate": 3.7409210461766355e-05, "Pretrain/Loss": 2.042842388153076, "Pretrain/Loss (Raw)": 2.034993886947632, "Pretrain/Step": 3382, "Pretrain/Step Time": 8.478017289191484} +{"Pretrain/Learning Rate": 3.740183958587108e-05, "Pretrain/Loss": 2.041584014892578, "Pretrain/Loss (Raw)": 2.044144868850708, "Pretrain/Step": 3383, "Pretrain/Step Time": 8.479018228128552} +{"Pretrain/Learning Rate": 3.7394467279737224e-05, "Pretrain/Loss": 2.042128086090088, "Pretrain/Loss (Raw)": 2.103071689605713, "Pretrain/Step": 3384, "Pretrain/Step Time": 8.469993934035301} +{"Pretrain/Learning Rate": 3.7387093544215003e-05, "Pretrain/Loss": 2.0420823097229004, "Pretrain/Loss (Raw)": 2.100231409072876, "Pretrain/Step": 3385, "Pretrain/Step Time": 8.469860522076488} +{"Pretrain/Learning Rate": 3.7379718380154777e-05, "Pretrain/Loss": 2.0451979637145996, "Pretrain/Loss (Raw)": 2.055171251296997, "Pretrain/Step": 3386, "Pretrain/Step Time": 8.46864464879036} +{"Pretrain/Learning Rate": 3.737234178840709e-05, "Pretrain/Loss": 2.0488719940185547, "Pretrain/Loss (Raw)": 2.2492170333862305, "Pretrain/Step": 3387, "Pretrain/Step Time": 8.464650375768542} +{"Pretrain/Learning Rate": 3.736496376982266e-05, "Pretrain/Loss": 2.046933174133301, "Pretrain/Loss (Raw)": 1.8579788208007812, "Pretrain/Step": 3388, "Pretrain/Step Time": 8.467008534818888} +{"Pretrain/Learning Rate": 3.7357584325252336e-05, "Pretrain/Loss": 2.0470969676971436, "Pretrain/Loss (Raw)": 2.0252254009246826, "Pretrain/Step": 3389, "Pretrain/Step Time": 8.459908043965697} +{"Pretrain/Learning Rate": 3.7350203455547155e-05, "Pretrain/Loss": 2.048900842666626, "Pretrain/Loss (Raw)": 2.117546558380127, "Pretrain/Step": 3390, "Pretrain/Step Time": 8.454062765464187} +{"Pretrain/Learning Rate": 3.7342821161558316e-05, "Pretrain/Loss": 2.049379348754883, "Pretrain/Loss (Raw)": 2.0511906147003174, "Pretrain/Step": 3391, "Pretrain/Step Time": 8.454870583489537} +{"Pretrain/Learning Rate": 3.7335437444137175e-05, "Pretrain/Loss": 2.048628807067871, "Pretrain/Loss (Raw)": 1.948439359664917, "Pretrain/Step": 3392, "Pretrain/Step Time": 8.455327555537224} +{"Pretrain/Learning Rate": 3.732805230413527e-05, "Pretrain/Loss": 2.048006534576416, "Pretrain/Loss (Raw)": 1.8512405157089233, "Pretrain/Step": 3393, "Pretrain/Step Time": 8.455383101478219} +{"Pretrain/Learning Rate": 3.732066574240428e-05, "Pretrain/Loss": 2.049492835998535, "Pretrain/Loss (Raw)": 2.1447458267211914, "Pretrain/Step": 3394, "Pretrain/Step Time": 8.452451221644878} +{"Pretrain/Learning Rate": 3.731327775979605e-05, "Pretrain/Loss": 2.046520471572876, "Pretrain/Loss (Raw)": 1.8219668865203857, "Pretrain/Step": 3395, "Pretrain/Step Time": 8.445929311215878} +{"Pretrain/Learning Rate": 3.730588835716262e-05, "Pretrain/Loss": 2.0477309226989746, "Pretrain/Loss (Raw)": 2.1109299659729004, "Pretrain/Step": 3396, "Pretrain/Step Time": 8.444407546892762} +{"Pretrain/Learning Rate": 3.729849753535615e-05, "Pretrain/Loss": 2.0470447540283203, "Pretrain/Loss (Raw)": 2.0634047985076904, "Pretrain/Step": 3397, "Pretrain/Step Time": 8.44546777009964} +{"Pretrain/Learning Rate": 3.7291105295229004e-05, "Pretrain/Loss": 2.0450682640075684, "Pretrain/Loss (Raw)": 1.8134541511535645, "Pretrain/Step": 3398, "Pretrain/Step Time": 8.44874102063477} +{"Pretrain/Learning Rate": 3.728371163763366e-05, "Pretrain/Loss": 2.042287826538086, "Pretrain/Loss (Raw)": 1.7000188827514648, "Pretrain/Step": 3399, "Pretrain/Step Time": 8.449912190437317} +{"Pretrain/Learning Rate": 3.727631656342282e-05, "Pretrain/Loss": 2.039544105529785, "Pretrain/Loss (Raw)": 1.9475340843200684, "Pretrain/Step": 3400, "Pretrain/Step Time": 8.443200122565031} +{"Pretrain/Learning Rate": 3.7268920073449296e-05, "Pretrain/Loss": 2.040057897567749, "Pretrain/Loss (Raw)": 2.0817904472351074, "Pretrain/Step": 3401, "Pretrain/Step Time": 8.439607568085194} +{"Pretrain/Learning Rate": 3.72615221685661e-05, "Pretrain/Loss": 2.0398483276367188, "Pretrain/Loss (Raw)": 1.8242295980453491, "Pretrain/Step": 3402, "Pretrain/Step Time": 8.441258082166314} +{"Pretrain/Learning Rate": 3.725412284962639e-05, "Pretrain/Loss": 2.0410594940185547, "Pretrain/Loss (Raw)": 2.0848114490509033, "Pretrain/Step": 3403, "Pretrain/Step Time": 8.445136666297913} +{"Pretrain/Learning Rate": 3.724672211748349e-05, "Pretrain/Loss": 2.0444631576538086, "Pretrain/Loss (Raw)": 2.1403138637542725, "Pretrain/Step": 3404, "Pretrain/Step Time": 8.448493903502822} +{"Pretrain/Learning Rate": 3.723931997299089e-05, "Pretrain/Loss": 2.046210289001465, "Pretrain/Loss (Raw)": 2.1276466846466064, "Pretrain/Step": 3405, "Pretrain/Step Time": 8.447048135101795} +{"Pretrain/Learning Rate": 3.723191641700223e-05, "Pretrain/Loss": 2.0428810119628906, "Pretrain/Loss (Raw)": 1.8594518899917603, "Pretrain/Step": 3406, "Pretrain/Step Time": 8.440398398786783} +{"Pretrain/Learning Rate": 3.7224511450371334e-05, "Pretrain/Loss": 2.041126251220703, "Pretrain/Loss (Raw)": 1.9461195468902588, "Pretrain/Step": 3407, "Pretrain/Step Time": 8.442036928609014} +{"Pretrain/Learning Rate": 3.721710507395218e-05, "Pretrain/Loss": 2.0397238731384277, "Pretrain/Loss (Raw)": 1.8788565397262573, "Pretrain/Step": 3408, "Pretrain/Step Time": 8.442600172013044} +{"Pretrain/Learning Rate": 3.720969728859889e-05, "Pretrain/Loss": 2.0413570404052734, "Pretrain/Loss (Raw)": 2.2562174797058105, "Pretrain/Step": 3409, "Pretrain/Step Time": 8.4526880197227} +{"Pretrain/Learning Rate": 3.720228809516578e-05, "Pretrain/Loss": 2.0383198261260986, "Pretrain/Loss (Raw)": 1.6527750492095947, "Pretrain/Step": 3410, "Pretrain/Step Time": 8.454217432066798} +{"Pretrain/Learning Rate": 3.719487749450731e-05, "Pretrain/Loss": 2.037010908126831, "Pretrain/Loss (Raw)": 1.8761835098266602, "Pretrain/Step": 3411, "Pretrain/Step Time": 8.447328245267272} +{"Pretrain/Learning Rate": 3.718746548747809e-05, "Pretrain/Loss": 2.0352940559387207, "Pretrain/Loss (Raw)": 1.8817168474197388, "Pretrain/Step": 3412, "Pretrain/Step Time": 8.43745432794094} +{"Pretrain/Learning Rate": 3.7180052074932934e-05, "Pretrain/Loss": 2.036200523376465, "Pretrain/Loss (Raw)": 2.0318028926849365, "Pretrain/Step": 3413, "Pretrain/Step Time": 8.440187709406018} +{"Pretrain/Learning Rate": 3.7172637257726774e-05, "Pretrain/Loss": 2.03714656829834, "Pretrain/Loss (Raw)": 2.164740800857544, "Pretrain/Step": 3414, "Pretrain/Step Time": 8.438039779663086} +{"Pretrain/Learning Rate": 3.716522103671473e-05, "Pretrain/Loss": 2.03674578666687, "Pretrain/Loss (Raw)": 1.9464513063430786, "Pretrain/Step": 3415, "Pretrain/Step Time": 8.449734484776855} +{"Pretrain/Learning Rate": 3.715780341275207e-05, "Pretrain/Loss": 2.036579132080078, "Pretrain/Loss (Raw)": 2.078831195831299, "Pretrain/Step": 3416, "Pretrain/Step Time": 8.452469604089856} +{"Pretrain/Learning Rate": 3.715038438669423e-05, "Pretrain/Loss": 2.037522077560425, "Pretrain/Loss (Raw)": 2.2123632431030273, "Pretrain/Step": 3417, "Pretrain/Step Time": 8.439299616962671} +{"Pretrain/Learning Rate": 3.7142963959396806e-05, "Pretrain/Loss": 2.0378029346466064, "Pretrain/Loss (Raw)": 2.1078035831451416, "Pretrain/Step": 3418, "Pretrain/Step Time": 8.436151968315244} +{"Pretrain/Learning Rate": 3.713554213171556e-05, "Pretrain/Loss": 2.034815788269043, "Pretrain/Loss (Raw)": 1.6890712976455688, "Pretrain/Step": 3419, "Pretrain/Step Time": 8.434970561414957} +{"Pretrain/Learning Rate": 3.712811890450641e-05, "Pretrain/Loss": 2.034024715423584, "Pretrain/Loss (Raw)": 2.145498752593994, "Pretrain/Step": 3420, "Pretrain/Step Time": 8.434784971177578} +{"Pretrain/Learning Rate": 3.712069427862544e-05, "Pretrain/Loss": 2.0333638191223145, "Pretrain/Loss (Raw)": 2.0351815223693848, "Pretrain/Step": 3421, "Pretrain/Step Time": 8.446080001071095} +{"Pretrain/Learning Rate": 3.711326825492889e-05, "Pretrain/Loss": 2.032104253768921, "Pretrain/Loss (Raw)": 2.0492806434631348, "Pretrain/Step": 3422, "Pretrain/Step Time": 8.44582892768085} +{"Pretrain/Learning Rate": 3.7105840834273164e-05, "Pretrain/Loss": 2.0314390659332275, "Pretrain/Loss (Raw)": 1.9377679824829102, "Pretrain/Step": 3423, "Pretrain/Step Time": 8.437635377049446} +{"Pretrain/Learning Rate": 3.7098412017514835e-05, "Pretrain/Loss": 2.033802032470703, "Pretrain/Loss (Raw)": 2.522106647491455, "Pretrain/Step": 3424, "Pretrain/Step Time": 8.43752359971404} +{"Pretrain/Learning Rate": 3.7090981805510615e-05, "Pretrain/Loss": 2.0353379249572754, "Pretrain/Loss (Raw)": 2.198930501937866, "Pretrain/Step": 3425, "Pretrain/Step Time": 8.439237913116813} +{"Pretrain/Learning Rate": 3.7083550199117403e-05, "Pretrain/Loss": 2.034675121307373, "Pretrain/Loss (Raw)": 1.9391844272613525, "Pretrain/Step": 3426, "Pretrain/Step Time": 8.449960248544812} +{"Pretrain/Learning Rate": 3.707611719919224e-05, "Pretrain/Loss": 2.0359418392181396, "Pretrain/Loss (Raw)": 1.9848936796188354, "Pretrain/Step": 3427, "Pretrain/Step Time": 8.44767751544714} +{"Pretrain/Learning Rate": 3.706868280659234e-05, "Pretrain/Loss": 2.0367307662963867, "Pretrain/Loss (Raw)": 2.0354366302490234, "Pretrain/Step": 3428, "Pretrain/Step Time": 8.44883475638926} +{"Pretrain/Learning Rate": 3.7061247022175064e-05, "Pretrain/Loss": 2.033132791519165, "Pretrain/Loss (Raw)": 1.7881618738174438, "Pretrain/Step": 3429, "Pretrain/Step Time": 8.437770517542958} +{"Pretrain/Learning Rate": 3.705380984679795e-05, "Pretrain/Loss": 2.035858154296875, "Pretrain/Loss (Raw)": 2.3350627422332764, "Pretrain/Step": 3430, "Pretrain/Step Time": 8.436827380210161} +{"Pretrain/Learning Rate": 3.704637128131868e-05, "Pretrain/Loss": 2.035593271255493, "Pretrain/Loss (Raw)": 1.8602761030197144, "Pretrain/Step": 3431, "Pretrain/Step Time": 8.437824312597513} +{"Pretrain/Learning Rate": 3.7038931326595115e-05, "Pretrain/Loss": 2.037325859069824, "Pretrain/Loss (Raw)": 2.1969330310821533, "Pretrain/Step": 3432, "Pretrain/Step Time": 8.444678796455264} +{"Pretrain/Learning Rate": 3.703148998348526e-05, "Pretrain/Loss": 2.0381741523742676, "Pretrain/Loss (Raw)": 2.0834763050079346, "Pretrain/Step": 3433, "Pretrain/Step Time": 8.441497894003987} +{"Pretrain/Learning Rate": 3.702404725284728e-05, "Pretrain/Loss": 2.0384156703948975, "Pretrain/Loss (Raw)": 2.091683864593506, "Pretrain/Step": 3434, "Pretrain/Step Time": 8.439685504883528} +{"Pretrain/Learning Rate": 3.7016603135539524e-05, "Pretrain/Loss": 2.039327383041382, "Pretrain/Loss (Raw)": 2.103599786758423, "Pretrain/Step": 3435, "Pretrain/Step Time": 8.433409549295902} +{"Pretrain/Learning Rate": 3.700915763242046e-05, "Pretrain/Loss": 2.038851737976074, "Pretrain/Loss (Raw)": 1.9769062995910645, "Pretrain/Step": 3436, "Pretrain/Step Time": 8.432275995612144} +{"Pretrain/Learning Rate": 3.700171074434876e-05, "Pretrain/Loss": 2.0380754470825195, "Pretrain/Loss (Raw)": 2.0962071418762207, "Pretrain/Step": 3437, "Pretrain/Step Time": 8.433881409466267} +{"Pretrain/Learning Rate": 3.699426247218321e-05, "Pretrain/Loss": 2.0358657836914062, "Pretrain/Loss (Raw)": 2.141164541244507, "Pretrain/Step": 3438, "Pretrain/Step Time": 8.440054804086685} +{"Pretrain/Learning Rate": 3.69868128167828e-05, "Pretrain/Loss": 2.0377357006073, "Pretrain/Loss (Raw)": 2.1468069553375244, "Pretrain/Step": 3439, "Pretrain/Step Time": 8.446224292740226} +{"Pretrain/Learning Rate": 3.697936177900665e-05, "Pretrain/Loss": 2.037224292755127, "Pretrain/Loss (Raw)": 2.0350611209869385, "Pretrain/Step": 3440, "Pretrain/Step Time": 8.440735736861825} +{"Pretrain/Learning Rate": 3.697190935971405e-05, "Pretrain/Loss": 2.0371487140655518, "Pretrain/Loss (Raw)": 2.054856777191162, "Pretrain/Step": 3441, "Pretrain/Step Time": 8.437746591866016} +{"Pretrain/Learning Rate": 3.696445555976445e-05, "Pretrain/Loss": 2.0382492542266846, "Pretrain/Loss (Raw)": 2.242094039916992, "Pretrain/Step": 3442, "Pretrain/Step Time": 8.433342950418591} +{"Pretrain/Learning Rate": 3.695700038001746e-05, "Pretrain/Loss": 2.0371506214141846, "Pretrain/Loss (Raw)": 2.0149643421173096, "Pretrain/Step": 3443, "Pretrain/Step Time": 8.436197025701404} +{"Pretrain/Learning Rate": 3.694954382133284e-05, "Pretrain/Loss": 2.0371592044830322, "Pretrain/Loss (Raw)": 2.1332457065582275, "Pretrain/Step": 3444, "Pretrain/Step Time": 8.432239243760705} +{"Pretrain/Learning Rate": 3.694208588457051e-05, "Pretrain/Loss": 2.036973476409912, "Pretrain/Loss (Raw)": 1.956615924835205, "Pretrain/Step": 3445, "Pretrain/Step Time": 8.432722060009837} +{"Pretrain/Learning Rate": 3.693462657059058e-05, "Pretrain/Loss": 2.033958911895752, "Pretrain/Loss (Raw)": 1.6436141729354858, "Pretrain/Step": 3446, "Pretrain/Step Time": 8.435708260163665} +{"Pretrain/Learning Rate": 3.6927165880253266e-05, "Pretrain/Loss": 2.0352959632873535, "Pretrain/Loss (Raw)": 2.0920403003692627, "Pretrain/Step": 3447, "Pretrain/Step Time": 8.426772905513644} +{"Pretrain/Learning Rate": 3.691970381441898e-05, "Pretrain/Loss": 2.0369534492492676, "Pretrain/Loss (Raw)": 2.2663955688476562, "Pretrain/Step": 3448, "Pretrain/Step Time": 8.427180064842105} +{"Pretrain/Learning Rate": 3.691224037394828e-05, "Pretrain/Loss": 2.0387513637542725, "Pretrain/Loss (Raw)": 2.2042150497436523, "Pretrain/Step": 3449, "Pretrain/Step Time": 8.422936044633389} +{"Pretrain/Learning Rate": 3.69047755597019e-05, "Pretrain/Loss": 2.037374496459961, "Pretrain/Loss (Raw)": 1.8619582653045654, "Pretrain/Step": 3450, "Pretrain/Step Time": 8.422252722084522} +{"Pretrain/Learning Rate": 3.68973093725407e-05, "Pretrain/Loss": 2.0359697341918945, "Pretrain/Loss (Raw)": 1.9476721286773682, "Pretrain/Step": 3451, "Pretrain/Step Time": 8.421259013935924} +{"Pretrain/Learning Rate": 3.688984181332572e-05, "Pretrain/Loss": 2.0384140014648438, "Pretrain/Loss (Raw)": 2.322194814682007, "Pretrain/Step": 3452, "Pretrain/Step Time": 8.421019403263927} +{"Pretrain/Learning Rate": 3.688237288291815e-05, "Pretrain/Loss": 2.037710666656494, "Pretrain/Loss (Raw)": 2.0338666439056396, "Pretrain/Step": 3453, "Pretrain/Step Time": 8.415676414966583} +{"Pretrain/Learning Rate": 3.687490258217935e-05, "Pretrain/Loss": 2.038243293762207, "Pretrain/Loss (Raw)": 2.222273826599121, "Pretrain/Step": 3454, "Pretrain/Step Time": 8.42381507717073} +{"Pretrain/Learning Rate": 3.6867430911970824e-05, "Pretrain/Loss": 2.0377469062805176, "Pretrain/Loss (Raw)": 1.9978495836257935, "Pretrain/Step": 3455, "Pretrain/Step Time": 8.424743067473173} +{"Pretrain/Learning Rate": 3.6859957873154256e-05, "Pretrain/Loss": 2.037126064300537, "Pretrain/Loss (Raw)": 2.124764919281006, "Pretrain/Step": 3456, "Pretrain/Step Time": 8.421339314430952} +{"Pretrain/Learning Rate": 3.6852483466591447e-05, "Pretrain/Loss": 2.0387511253356934, "Pretrain/Loss (Raw)": 2.0653154850006104, "Pretrain/Step": 3457, "Pretrain/Step Time": 8.421085771173239} +{"Pretrain/Learning Rate": 3.6845007693144404e-05, "Pretrain/Loss": 2.0404210090637207, "Pretrain/Loss (Raw)": 2.1629416942596436, "Pretrain/Step": 3458, "Pretrain/Step Time": 8.425148317590356} +{"Pretrain/Learning Rate": 3.683753055367526e-05, "Pretrain/Loss": 2.036802053451538, "Pretrain/Loss (Raw)": 1.866276502609253, "Pretrain/Step": 3459, "Pretrain/Step Time": 8.42744735814631} +{"Pretrain/Learning Rate": 3.68300520490463e-05, "Pretrain/Loss": 2.0389089584350586, "Pretrain/Loss (Raw)": 2.1534438133239746, "Pretrain/Step": 3460, "Pretrain/Step Time": 8.423247914761305} +{"Pretrain/Learning Rate": 3.682257218012e-05, "Pretrain/Loss": 2.0397491455078125, "Pretrain/Loss (Raw)": 2.2004337310791016, "Pretrain/Step": 3461, "Pretrain/Step Time": 8.426852254197001} +{"Pretrain/Learning Rate": 3.6815090947758966e-05, "Pretrain/Loss": 2.0398716926574707, "Pretrain/Loss (Raw)": 2.07023286819458, "Pretrain/Step": 3462, "Pretrain/Step Time": 8.42209899239242} +{"Pretrain/Learning Rate": 3.6807608352825975e-05, "Pretrain/Loss": 2.040259838104248, "Pretrain/Loss (Raw)": 2.132948637008667, "Pretrain/Step": 3463, "Pretrain/Step Time": 8.423263324424624} +{"Pretrain/Learning Rate": 3.680012439618394e-05, "Pretrain/Loss": 2.039952278137207, "Pretrain/Loss (Raw)": 2.1413674354553223, "Pretrain/Step": 3464, "Pretrain/Step Time": 8.422709112986922} +{"Pretrain/Learning Rate": 3.679263907869596e-05, "Pretrain/Loss": 2.04196834564209, "Pretrain/Loss (Raw)": 2.3079638481140137, "Pretrain/Step": 3465, "Pretrain/Step Time": 8.430077092722058} +{"Pretrain/Learning Rate": 3.678515240122527e-05, "Pretrain/Loss": 2.041581630706787, "Pretrain/Loss (Raw)": 2.108603000640869, "Pretrain/Step": 3466, "Pretrain/Step Time": 8.430151268839836} +{"Pretrain/Learning Rate": 3.677766436463527e-05, "Pretrain/Loss": 2.0437397956848145, "Pretrain/Loss (Raw)": 2.2930705547332764, "Pretrain/Step": 3467, "Pretrain/Step Time": 8.426718842238188} +{"Pretrain/Learning Rate": 3.677017496978952e-05, "Pretrain/Loss": 2.0462417602539062, "Pretrain/Loss (Raw)": 2.1966404914855957, "Pretrain/Step": 3468, "Pretrain/Step Time": 8.419630013406277} +{"Pretrain/Learning Rate": 3.6762684217551735e-05, "Pretrain/Loss": 2.047469139099121, "Pretrain/Loss (Raw)": 2.3498997688293457, "Pretrain/Step": 3469, "Pretrain/Step Time": 8.418075988069177} +{"Pretrain/Learning Rate": 3.675519210878577e-05, "Pretrain/Loss": 2.0457704067230225, "Pretrain/Loss (Raw)": 1.9092202186584473, "Pretrain/Step": 3470, "Pretrain/Step Time": 8.42374312877655} +{"Pretrain/Learning Rate": 3.6747698644355664e-05, "Pretrain/Loss": 2.0473828315734863, "Pretrain/Loss (Raw)": 2.092656135559082, "Pretrain/Step": 3471, "Pretrain/Step Time": 8.429085090756416} +{"Pretrain/Learning Rate": 3.674020382512559e-05, "Pretrain/Loss": 2.048499584197998, "Pretrain/Loss (Raw)": 2.0842444896698, "Pretrain/Step": 3472, "Pretrain/Step Time": 8.429869633167982} +{"Pretrain/Learning Rate": 3.673270765195989e-05, "Pretrain/Loss": 2.0466856956481934, "Pretrain/Loss (Raw)": 1.9551712274551392, "Pretrain/Step": 3473, "Pretrain/Step Time": 8.423437686637044} +{"Pretrain/Learning Rate": 3.672521012572307e-05, "Pretrain/Loss": 2.0480446815490723, "Pretrain/Loss (Raw)": 1.9102839231491089, "Pretrain/Step": 3474, "Pretrain/Step Time": 8.41267928108573} +{"Pretrain/Learning Rate": 3.671771124727975e-05, "Pretrain/Loss": 2.0481433868408203, "Pretrain/Loss (Raw)": 1.9537514448165894, "Pretrain/Step": 3475, "Pretrain/Step Time": 8.414465699344873} +{"Pretrain/Learning Rate": 3.671021101749476e-05, "Pretrain/Loss": 2.0481393337249756, "Pretrain/Loss (Raw)": 1.9088523387908936, "Pretrain/Step": 3476, "Pretrain/Step Time": 8.4165881536901} +{"Pretrain/Learning Rate": 3.670270943723305e-05, "Pretrain/Loss": 2.0471019744873047, "Pretrain/Loss (Raw)": 1.898356318473816, "Pretrain/Step": 3477, "Pretrain/Step Time": 8.426498349756002} +{"Pretrain/Learning Rate": 3.669520650735975e-05, "Pretrain/Loss": 2.0502278804779053, "Pretrain/Loss (Raw)": 2.2203352451324463, "Pretrain/Step": 3478, "Pretrain/Step Time": 8.426453597843647} +{"Pretrain/Learning Rate": 3.668770222874012e-05, "Pretrain/Loss": 2.0498247146606445, "Pretrain/Loss (Raw)": 2.033811569213867, "Pretrain/Step": 3479, "Pretrain/Step Time": 8.42682320997119} +{"Pretrain/Learning Rate": 3.6680196602239596e-05, "Pretrain/Loss": 2.050058364868164, "Pretrain/Loss (Raw)": 2.1123721599578857, "Pretrain/Step": 3480, "Pretrain/Step Time": 8.419301582500339} +{"Pretrain/Learning Rate": 3.667268962872376e-05, "Pretrain/Loss": 2.0516765117645264, "Pretrain/Loss (Raw)": 2.0089499950408936, "Pretrain/Step": 3481, "Pretrain/Step Time": 8.42068368382752} +{"Pretrain/Learning Rate": 3.666518130905836e-05, "Pretrain/Loss": 2.052863597869873, "Pretrain/Loss (Raw)": 2.209890127182007, "Pretrain/Step": 3482, "Pretrain/Step Time": 8.424032090231776} +{"Pretrain/Learning Rate": 3.665767164410928e-05, "Pretrain/Loss": 2.0536701679229736, "Pretrain/Loss (Raw)": 2.1018290519714355, "Pretrain/Step": 3483, "Pretrain/Step Time": 8.433587402105331} +{"Pretrain/Learning Rate": 3.665016063474257e-05, "Pretrain/Loss": 2.0532896518707275, "Pretrain/Loss (Raw)": 2.1455585956573486, "Pretrain/Step": 3484, "Pretrain/Step Time": 8.429274894297123} +{"Pretrain/Learning Rate": 3.664264828182444e-05, "Pretrain/Loss": 2.053379535675049, "Pretrain/Loss (Raw)": 1.9071670770645142, "Pretrain/Step": 3485, "Pretrain/Step Time": 8.422751694917679} +{"Pretrain/Learning Rate": 3.663513458622124e-05, "Pretrain/Loss": 2.0517725944519043, "Pretrain/Loss (Raw)": 1.9686204195022583, "Pretrain/Step": 3486, "Pretrain/Step Time": 8.422504175454378} +{"Pretrain/Learning Rate": 3.662761954879951e-05, "Pretrain/Loss": 2.0512712001800537, "Pretrain/Loss (Raw)": 2.0287041664123535, "Pretrain/Step": 3487, "Pretrain/Step Time": 8.419248728081584} +{"Pretrain/Learning Rate": 3.662010317042589e-05, "Pretrain/Loss": 2.052299976348877, "Pretrain/Loss (Raw)": 2.141097068786621, "Pretrain/Step": 3488, "Pretrain/Step Time": 8.424759481102228} +{"Pretrain/Learning Rate": 3.661258545196722e-05, "Pretrain/Loss": 2.052077293395996, "Pretrain/Loss (Raw)": 1.9263211488723755, "Pretrain/Step": 3489, "Pretrain/Step Time": 8.431815098971128} +{"Pretrain/Learning Rate": 3.6605066394290476e-05, "Pretrain/Loss": 2.0497324466705322, "Pretrain/Loss (Raw)": 1.8739585876464844, "Pretrain/Step": 3490, "Pretrain/Step Time": 8.42808428965509} +{"Pretrain/Learning Rate": 3.659754599826279e-05, "Pretrain/Loss": 2.048388957977295, "Pretrain/Loss (Raw)": 1.9653245210647583, "Pretrain/Step": 3491, "Pretrain/Step Time": 8.422267826274037} +{"Pretrain/Learning Rate": 3.659002426475145e-05, "Pretrain/Loss": 2.0455918312072754, "Pretrain/Loss (Raw)": 1.7464187145233154, "Pretrain/Step": 3492, "Pretrain/Step Time": 8.423079036176205} +{"Pretrain/Learning Rate": 3.65825011946239e-05, "Pretrain/Loss": 2.0447349548339844, "Pretrain/Loss (Raw)": 1.993565559387207, "Pretrain/Step": 3493, "Pretrain/Step Time": 8.42801796272397} +{"Pretrain/Learning Rate": 3.6574976788747725e-05, "Pretrain/Loss": 2.041891574859619, "Pretrain/Loss (Raw)": 1.7191715240478516, "Pretrain/Step": 3494, "Pretrain/Step Time": 8.430121954530478} +{"Pretrain/Learning Rate": 3.6567451047990696e-05, "Pretrain/Loss": 2.0385639667510986, "Pretrain/Loss (Raw)": 1.8785618543624878, "Pretrain/Step": 3495, "Pretrain/Step Time": 8.430260630324483} +{"Pretrain/Learning Rate": 3.6559923973220695e-05, "Pretrain/Loss": 2.036956548690796, "Pretrain/Loss (Raw)": 1.8470959663391113, "Pretrain/Step": 3496, "Pretrain/Step Time": 8.434348169714212} +{"Pretrain/Learning Rate": 3.65523955653058e-05, "Pretrain/Loss": 2.0368118286132812, "Pretrain/Loss (Raw)": 2.0484654903411865, "Pretrain/Step": 3497, "Pretrain/Step Time": 8.429095713421702} +{"Pretrain/Learning Rate": 3.65448658251142e-05, "Pretrain/Loss": 2.038033962249756, "Pretrain/Loss (Raw)": 2.243964433670044, "Pretrain/Step": 3498, "Pretrain/Step Time": 8.427836559712887} +{"Pretrain/Learning Rate": 3.653733475351428e-05, "Pretrain/Loss": 2.038381576538086, "Pretrain/Loss (Raw)": 1.9908097982406616, "Pretrain/Step": 3499, "Pretrain/Step Time": 8.428674940019846} +{"Pretrain/Learning Rate": 3.6529802351374545e-05, "Pretrain/Loss": 2.0371687412261963, "Pretrain/Loss (Raw)": 1.8746997117996216, "Pretrain/Step": 3500, "Pretrain/Step Time": 8.435889180749655} +{"Pretrain/Learning Rate": 3.652226861956368e-05, "Pretrain/Loss": 2.040398120880127, "Pretrain/Loss (Raw)": 2.259610414505005, "Pretrain/Step": 3501, "Pretrain/Step Time": 8.431558821350336} +{"Pretrain/Learning Rate": 3.65147335589505e-05, "Pretrain/Loss": 2.0402791500091553, "Pretrain/Loss (Raw)": 2.0939764976501465, "Pretrain/Step": 3502, "Pretrain/Step Time": 8.425951041281223} +{"Pretrain/Learning Rate": 3.650719717040398e-05, "Pretrain/Loss": 2.039811372756958, "Pretrain/Loss (Raw)": 1.8535192012786865, "Pretrain/Step": 3503, "Pretrain/Step Time": 8.424053261056542} +{"Pretrain/Learning Rate": 3.649965945479326e-05, "Pretrain/Loss": 2.0405125617980957, "Pretrain/Loss (Raw)": 2.1293680667877197, "Pretrain/Step": 3504, "Pretrain/Step Time": 8.427728405222297} +{"Pretrain/Learning Rate": 3.649212041298763e-05, "Pretrain/Loss": 2.0363821983337402, "Pretrain/Loss (Raw)": 1.7136811017990112, "Pretrain/Step": 3505, "Pretrain/Step Time": 8.433511916548014} +{"Pretrain/Learning Rate": 3.648458004585652e-05, "Pretrain/Loss": 2.034823417663574, "Pretrain/Loss (Raw)": 1.8454433679580688, "Pretrain/Step": 3506, "Pretrain/Step Time": 8.431294040754437} +{"Pretrain/Learning Rate": 3.647703835426952e-05, "Pretrain/Loss": 2.0336194038391113, "Pretrain/Loss (Raw)": 1.8189396858215332, "Pretrain/Step": 3507, "Pretrain/Step Time": 8.42679731734097} +{"Pretrain/Learning Rate": 3.646949533909637e-05, "Pretrain/Loss": 2.033818483352661, "Pretrain/Loss (Raw)": 2.076733112335205, "Pretrain/Step": 3508, "Pretrain/Step Time": 8.422802107408643} +{"Pretrain/Learning Rate": 3.646195100120698e-05, "Pretrain/Loss": 2.0337960720062256, "Pretrain/Loss (Raw)": 2.082324504852295, "Pretrain/Step": 3509, "Pretrain/Step Time": 8.423102522268891} +{"Pretrain/Learning Rate": 3.645440534147139e-05, "Pretrain/Loss": 2.032841205596924, "Pretrain/Loss (Raw)": 1.9127627611160278, "Pretrain/Step": 3510, "Pretrain/Step Time": 8.424340235069394} +{"Pretrain/Learning Rate": 3.644685836075979e-05, "Pretrain/Loss": 2.0329957008361816, "Pretrain/Loss (Raw)": 2.063934326171875, "Pretrain/Step": 3511, "Pretrain/Step Time": 8.431680733337998} +{"Pretrain/Learning Rate": 3.643931005994255e-05, "Pretrain/Loss": 2.030299425125122, "Pretrain/Loss (Raw)": 1.757956624031067, "Pretrain/Step": 3512, "Pretrain/Step Time": 8.428177209571004} +{"Pretrain/Learning Rate": 3.643176043989018e-05, "Pretrain/Loss": 2.0291337966918945, "Pretrain/Loss (Raw)": 1.9510211944580078, "Pretrain/Step": 3513, "Pretrain/Step Time": 8.429087614640594} +{"Pretrain/Learning Rate": 3.6424209501473314e-05, "Pretrain/Loss": 2.0287866592407227, "Pretrain/Loss (Raw)": 2.0107569694519043, "Pretrain/Step": 3514, "Pretrain/Step Time": 8.427940232679248} +{"Pretrain/Learning Rate": 3.641665724556278e-05, "Pretrain/Loss": 2.026273250579834, "Pretrain/Loss (Raw)": 1.9274754524230957, "Pretrain/Step": 3515, "Pretrain/Step Time": 8.433378828689456} +{"Pretrain/Learning Rate": 3.6409103673029535e-05, "Pretrain/Loss": 2.02579927444458, "Pretrain/Loss (Raw)": 1.7973347902297974, "Pretrain/Step": 3516, "Pretrain/Step Time": 8.431066077202559} +{"Pretrain/Learning Rate": 3.64015487847447e-05, "Pretrain/Loss": 2.0263240337371826, "Pretrain/Loss (Raw)": 2.092376470565796, "Pretrain/Step": 3517, "Pretrain/Step Time": 8.43443926051259} +{"Pretrain/Learning Rate": 3.6393992581579526e-05, "Pretrain/Loss": 2.0251386165618896, "Pretrain/Loss (Raw)": 1.9658151865005493, "Pretrain/Step": 3518, "Pretrain/Step Time": 8.43519394658506} +{"Pretrain/Learning Rate": 3.638643506440544e-05, "Pretrain/Loss": 2.0248818397521973, "Pretrain/Loss (Raw)": 2.0183279514312744, "Pretrain/Step": 3519, "Pretrain/Step Time": 8.433567186817527} +{"Pretrain/Learning Rate": 3.6378876234094014e-05, "Pretrain/Loss": 2.025052547454834, "Pretrain/Loss (Raw)": 1.9703091382980347, "Pretrain/Step": 3520, "Pretrain/Step Time": 8.430662108585238} +{"Pretrain/Learning Rate": 3.6371316091516955e-05, "Pretrain/Loss": 2.025256633758545, "Pretrain/Loss (Raw)": 1.8773349523544312, "Pretrain/Step": 3521, "Pretrain/Step Time": 8.428809707984328} +{"Pretrain/Learning Rate": 3.636375463754614e-05, "Pretrain/Loss": 2.0244803428649902, "Pretrain/Loss (Raw)": 2.0453879833221436, "Pretrain/Step": 3522, "Pretrain/Step Time": 8.437400437891483} +{"Pretrain/Learning Rate": 3.6356191873053594e-05, "Pretrain/Loss": 2.0251412391662598, "Pretrain/Loss (Raw)": 1.9065278768539429, "Pretrain/Step": 3523, "Pretrain/Step Time": 8.437547402456403} +{"Pretrain/Learning Rate": 3.634862779891148e-05, "Pretrain/Loss": 2.0243940353393555, "Pretrain/Loss (Raw)": 2.015305995941162, "Pretrain/Step": 3524, "Pretrain/Step Time": 8.433946454897523} +{"Pretrain/Learning Rate": 3.634106241599215e-05, "Pretrain/Loss": 2.028182029724121, "Pretrain/Loss (Raw)": 2.5482847690582275, "Pretrain/Step": 3525, "Pretrain/Step Time": 8.429881883785129} +{"Pretrain/Learning Rate": 3.633349572516805e-05, "Pretrain/Loss": 2.0306317806243896, "Pretrain/Loss (Raw)": 2.127018928527832, "Pretrain/Step": 3526, "Pretrain/Step Time": 8.424481861293316} +{"Pretrain/Learning Rate": 3.632592772731182e-05, "Pretrain/Loss": 2.032348155975342, "Pretrain/Loss (Raw)": 1.9197300672531128, "Pretrain/Step": 3527, "Pretrain/Step Time": 8.423227317631245} +{"Pretrain/Learning Rate": 3.631835842329624e-05, "Pretrain/Loss": 2.033153772354126, "Pretrain/Loss (Raw)": 2.0506579875946045, "Pretrain/Step": 3528, "Pretrain/Step Time": 8.426660558208823} +{"Pretrain/Learning Rate": 3.6310787813994226e-05, "Pretrain/Loss": 2.0329904556274414, "Pretrain/Loss (Raw)": 2.060854196548462, "Pretrain/Step": 3529, "Pretrain/Step Time": 8.42455730214715} +{"Pretrain/Learning Rate": 3.6303215900278864e-05, "Pretrain/Loss": 2.0348124504089355, "Pretrain/Loss (Raw)": 2.0574562549591064, "Pretrain/Step": 3530, "Pretrain/Step Time": 8.423910828307271} +{"Pretrain/Learning Rate": 3.629564268302338e-05, "Pretrain/Loss": 2.0345561504364014, "Pretrain/Loss (Raw)": 2.05200457572937, "Pretrain/Step": 3531, "Pretrain/Step Time": 8.419940853491426} +{"Pretrain/Learning Rate": 3.6288068163101156e-05, "Pretrain/Loss": 2.0330886840820312, "Pretrain/Loss (Raw)": 1.9524896144866943, "Pretrain/Step": 3532, "Pretrain/Step Time": 8.415723910555243} +{"Pretrain/Learning Rate": 3.628049234138572e-05, "Pretrain/Loss": 2.031528949737549, "Pretrain/Loss (Raw)": 1.9279865026474, "Pretrain/Step": 3533, "Pretrain/Step Time": 8.423196421936154} +{"Pretrain/Learning Rate": 3.6272915218750755e-05, "Pretrain/Loss": 2.0343668460845947, "Pretrain/Loss (Raw)": 2.222721815109253, "Pretrain/Step": 3534, "Pretrain/Step Time": 8.42191942408681} +{"Pretrain/Learning Rate": 3.6265336796070083e-05, "Pretrain/Loss": 2.0343194007873535, "Pretrain/Loss (Raw)": 1.940049171447754, "Pretrain/Step": 3535, "Pretrain/Step Time": 8.422727938741446} +{"Pretrain/Learning Rate": 3.62577570742177e-05, "Pretrain/Loss": 2.035325050354004, "Pretrain/Loss (Raw)": 2.007561206817627, "Pretrain/Step": 3536, "Pretrain/Step Time": 8.423035684973001} +{"Pretrain/Learning Rate": 3.625017605406771e-05, "Pretrain/Loss": 2.033043622970581, "Pretrain/Loss (Raw)": 1.9641913175582886, "Pretrain/Step": 3537, "Pretrain/Step Time": 8.415356008335948} +{"Pretrain/Learning Rate": 3.624259373649441e-05, "Pretrain/Loss": 2.035135507583618, "Pretrain/Loss (Raw)": 1.920552134513855, "Pretrain/Step": 3538, "Pretrain/Step Time": 8.419425930827856} +{"Pretrain/Learning Rate": 3.6235010122372214e-05, "Pretrain/Loss": 2.036574125289917, "Pretrain/Loss (Raw)": 2.0603106021881104, "Pretrain/Step": 3539, "Pretrain/Step Time": 8.42787141352892} +{"Pretrain/Learning Rate": 3.6227425212575725e-05, "Pretrain/Loss": 2.037355661392212, "Pretrain/Loss (Raw)": 1.981758713722229, "Pretrain/Step": 3540, "Pretrain/Step Time": 8.427483100444078} +{"Pretrain/Learning Rate": 3.621983900797964e-05, "Pretrain/Loss": 2.0390830039978027, "Pretrain/Loss (Raw)": 2.252896308898926, "Pretrain/Step": 3541, "Pretrain/Step Time": 8.42568490281701} +{"Pretrain/Learning Rate": 3.621225150945886e-05, "Pretrain/Loss": 2.0367226600646973, "Pretrain/Loss (Raw)": 1.8626081943511963, "Pretrain/Step": 3542, "Pretrain/Step Time": 8.424213411286473} +{"Pretrain/Learning Rate": 3.620466271788841e-05, "Pretrain/Loss": 2.038256883621216, "Pretrain/Loss (Raw)": 2.1428427696228027, "Pretrain/Step": 3543, "Pretrain/Step Time": 8.410827439278364} +{"Pretrain/Learning Rate": 3.6197072634143436e-05, "Pretrain/Loss": 2.037982940673828, "Pretrain/Loss (Raw)": 2.043781280517578, "Pretrain/Step": 3544, "Pretrain/Step Time": 8.414828082546592} +{"Pretrain/Learning Rate": 3.61894812590993e-05, "Pretrain/Loss": 2.036242961883545, "Pretrain/Loss (Raw)": 1.9896124601364136, "Pretrain/Step": 3545, "Pretrain/Step Time": 8.421180181205273} +{"Pretrain/Learning Rate": 3.6181888593631454e-05, "Pretrain/Loss": 2.0356287956237793, "Pretrain/Loss (Raw)": 2.029221534729004, "Pretrain/Step": 3546, "Pretrain/Step Time": 8.420839117839932} +{"Pretrain/Learning Rate": 3.6174294638615524e-05, "Pretrain/Loss": 2.0382699966430664, "Pretrain/Loss (Raw)": 2.0271472930908203, "Pretrain/Step": 3547, "Pretrain/Step Time": 8.420000044628978} +{"Pretrain/Learning Rate": 3.616669939492728e-05, "Pretrain/Loss": 2.037202835083008, "Pretrain/Loss (Raw)": 2.0088839530944824, "Pretrain/Step": 3548, "Pretrain/Step Time": 8.421822791919112} +{"Pretrain/Learning Rate": 3.615910286344265e-05, "Pretrain/Loss": 2.036855697631836, "Pretrain/Loss (Raw)": 1.9907407760620117, "Pretrain/Step": 3549, "Pretrain/Step Time": 8.411028975620866} +{"Pretrain/Learning Rate": 3.615150504503768e-05, "Pretrain/Loss": 2.0372090339660645, "Pretrain/Loss (Raw)": 2.094538688659668, "Pretrain/Step": 3550, "Pretrain/Step Time": 8.419557271525264} +{"Pretrain/Learning Rate": 3.6143905940588616e-05, "Pretrain/Loss": 2.038886547088623, "Pretrain/Loss (Raw)": 2.1524658203125, "Pretrain/Step": 3551, "Pretrain/Step Time": 8.419430764392018} +{"Pretrain/Learning Rate": 3.613630555097179e-05, "Pretrain/Loss": 2.034881353378296, "Pretrain/Loss (Raw)": 2.009464740753174, "Pretrain/Step": 3552, "Pretrain/Step Time": 8.424335969612002} +{"Pretrain/Learning Rate": 3.6128703877063755e-05, "Pretrain/Loss": 2.0313825607299805, "Pretrain/Loss (Raw)": 1.7510559558868408, "Pretrain/Step": 3553, "Pretrain/Step Time": 8.420829199254513} +{"Pretrain/Learning Rate": 3.6121100919741126e-05, "Pretrain/Loss": 2.032128095626831, "Pretrain/Loss (Raw)": 2.034634828567505, "Pretrain/Step": 3554, "Pretrain/Step Time": 8.412467947229743} +{"Pretrain/Learning Rate": 3.611349667988074e-05, "Pretrain/Loss": 2.032576560974121, "Pretrain/Loss (Raw)": 2.0422768592834473, "Pretrain/Step": 3555, "Pretrain/Step Time": 8.412439590319991} +{"Pretrain/Learning Rate": 3.6105891158359563e-05, "Pretrain/Loss": 2.0327394008636475, "Pretrain/Loss (Raw)": 2.056288242340088, "Pretrain/Step": 3556, "Pretrain/Step Time": 8.41849609836936} +{"Pretrain/Learning Rate": 3.6098284356054666e-05, "Pretrain/Loss": 2.0347506999969482, "Pretrain/Loss (Raw)": 2.0456204414367676, "Pretrain/Step": 3557, "Pretrain/Step Time": 8.42129067145288} +{"Pretrain/Learning Rate": 3.609067627384333e-05, "Pretrain/Loss": 2.032658576965332, "Pretrain/Loss (Raw)": 2.067262649536133, "Pretrain/Step": 3558, "Pretrain/Step Time": 8.42364620603621} +{"Pretrain/Learning Rate": 3.608306691260295e-05, "Pretrain/Loss": 2.032217025756836, "Pretrain/Loss (Raw)": 1.8037408590316772, "Pretrain/Step": 3559, "Pretrain/Step Time": 8.424302499741316} +{"Pretrain/Learning Rate": 3.607545627321106e-05, "Pretrain/Loss": 2.0308361053466797, "Pretrain/Loss (Raw)": 2.0201900005340576, "Pretrain/Step": 3560, "Pretrain/Step Time": 8.41633171401918} +{"Pretrain/Learning Rate": 3.606784435654536e-05, "Pretrain/Loss": 2.030911922454834, "Pretrain/Loss (Raw)": 2.0931665897369385, "Pretrain/Step": 3561, "Pretrain/Step Time": 8.423010222613811} +{"Pretrain/Learning Rate": 3.6060231163483704e-05, "Pretrain/Loss": 2.03088641166687, "Pretrain/Loss (Raw)": 2.088433027267456, "Pretrain/Step": 3562, "Pretrain/Step Time": 8.42808254249394} +{"Pretrain/Learning Rate": 3.6052616694904066e-05, "Pretrain/Loss": 2.0313186645507812, "Pretrain/Loss (Raw)": 2.158954381942749, "Pretrain/Step": 3563, "Pretrain/Step Time": 8.424705216661096} +{"Pretrain/Learning Rate": 3.60450009516846e-05, "Pretrain/Loss": 2.0314760208129883, "Pretrain/Loss (Raw)": 1.997045874595642, "Pretrain/Step": 3564, "Pretrain/Step Time": 8.427626134827733} +{"Pretrain/Learning Rate": 3.603738393470357e-05, "Pretrain/Loss": 2.03116512298584, "Pretrain/Loss (Raw)": 2.0563902854919434, "Pretrain/Step": 3565, "Pretrain/Step Time": 8.422870352864265} +{"Pretrain/Learning Rate": 3.6029765644839416e-05, "Pretrain/Loss": 2.0294110774993896, "Pretrain/Loss (Raw)": 1.9166462421417236, "Pretrain/Step": 3566, "Pretrain/Step Time": 8.4156179074198} +{"Pretrain/Learning Rate": 3.602214608297071e-05, "Pretrain/Loss": 2.028597831726074, "Pretrain/Loss (Raw)": 2.042733669281006, "Pretrain/Step": 3567, "Pretrain/Step Time": 8.414104362949729} +{"Pretrain/Learning Rate": 3.601452524997619e-05, "Pretrain/Loss": 2.028364658355713, "Pretrain/Loss (Raw)": 2.0052168369293213, "Pretrain/Step": 3568, "Pretrain/Step Time": 8.416488459333777} +{"Pretrain/Learning Rate": 3.600690314673471e-05, "Pretrain/Loss": 2.028676748275757, "Pretrain/Loss (Raw)": 2.0947678089141846, "Pretrain/Step": 3569, "Pretrain/Step Time": 8.424029560759664} +{"Pretrain/Learning Rate": 3.599927977412529e-05, "Pretrain/Loss": 2.0275866985321045, "Pretrain/Loss (Raw)": 2.1025912761688232, "Pretrain/Step": 3570, "Pretrain/Step Time": 8.421317752450705} +{"Pretrain/Learning Rate": 3.59916551330271e-05, "Pretrain/Loss": 2.0264925956726074, "Pretrain/Loss (Raw)": 1.8748888969421387, "Pretrain/Step": 3571, "Pretrain/Step Time": 8.42109270952642} +{"Pretrain/Learning Rate": 3.598402922431944e-05, "Pretrain/Loss": 2.0255300998687744, "Pretrain/Loss (Raw)": 2.010061740875244, "Pretrain/Step": 3572, "Pretrain/Step Time": 8.422806369140744} +{"Pretrain/Learning Rate": 3.5976402048881786e-05, "Pretrain/Loss": 2.0278143882751465, "Pretrain/Loss (Raw)": 2.2490408420562744, "Pretrain/Step": 3573, "Pretrain/Step Time": 8.429867582395673} +{"Pretrain/Learning Rate": 3.596877360759371e-05, "Pretrain/Loss": 2.030897855758667, "Pretrain/Loss (Raw)": 2.0382635593414307, "Pretrain/Step": 3574, "Pretrain/Step Time": 8.427805490791798} +{"Pretrain/Learning Rate": 3.5961143901334984e-05, "Pretrain/Loss": 2.0302748680114746, "Pretrain/Loss (Raw)": 2.012310028076172, "Pretrain/Step": 3575, "Pretrain/Step Time": 8.428672023117542} +{"Pretrain/Learning Rate": 3.5953512930985486e-05, "Pretrain/Loss": 2.029447317123413, "Pretrain/Loss (Raw)": 2.160449743270874, "Pretrain/Step": 3576, "Pretrain/Step Time": 8.424609247595072} +{"Pretrain/Learning Rate": 3.594588069742527e-05, "Pretrain/Loss": 2.0289158821105957, "Pretrain/Loss (Raw)": 2.136185884475708, "Pretrain/Step": 3577, "Pretrain/Step Time": 8.420663822442293} +{"Pretrain/Learning Rate": 3.5938247201534505e-05, "Pretrain/Loss": 2.0294787883758545, "Pretrain/Loss (Raw)": 1.9340155124664307, "Pretrain/Step": 3578, "Pretrain/Step Time": 8.429405875504017} +{"Pretrain/Learning Rate": 3.5930612444193535e-05, "Pretrain/Loss": 2.030045509338379, "Pretrain/Loss (Raw)": 2.020224094390869, "Pretrain/Step": 3579, "Pretrain/Step Time": 8.431111209094524} +{"Pretrain/Learning Rate": 3.592297642628283e-05, "Pretrain/Loss": 2.027397871017456, "Pretrain/Loss (Raw)": 1.98330557346344, "Pretrain/Step": 3580, "Pretrain/Step Time": 8.431261399760842} +{"Pretrain/Learning Rate": 3.5915339148683005e-05, "Pretrain/Loss": 2.0256447792053223, "Pretrain/Loss (Raw)": 1.8094635009765625, "Pretrain/Step": 3581, "Pretrain/Step Time": 8.428890043869615} +{"Pretrain/Learning Rate": 3.590770061227484e-05, "Pretrain/Loss": 2.024632692337036, "Pretrain/Loss (Raw)": 2.092719793319702, "Pretrain/Step": 3582, "Pretrain/Step Time": 8.418940486386418} +{"Pretrain/Learning Rate": 3.590006081793925e-05, "Pretrain/Loss": 2.0258185863494873, "Pretrain/Loss (Raw)": 2.1496376991271973, "Pretrain/Step": 3583, "Pretrain/Step Time": 8.42293019220233} +{"Pretrain/Learning Rate": 3.589241976655727e-05, "Pretrain/Loss": 2.0249061584472656, "Pretrain/Loss (Raw)": 2.007962703704834, "Pretrain/Step": 3584, "Pretrain/Step Time": 8.428848661482334} +{"Pretrain/Learning Rate": 3.588477745901013e-05, "Pretrain/Loss": 2.023428440093994, "Pretrain/Loss (Raw)": 1.876166820526123, "Pretrain/Step": 3585, "Pretrain/Step Time": 8.42841062322259} +{"Pretrain/Learning Rate": 3.587713389617916e-05, "Pretrain/Loss": 2.0207247734069824, "Pretrain/Loss (Raw)": 1.8168792724609375, "Pretrain/Step": 3586, "Pretrain/Step Time": 8.42538981884718} +{"Pretrain/Learning Rate": 3.5869489078945845e-05, "Pretrain/Loss": 2.022397518157959, "Pretrain/Loss (Raw)": 2.0804097652435303, "Pretrain/Step": 3587, "Pretrain/Step Time": 8.423274187371135} +{"Pretrain/Learning Rate": 3.586184300819184e-05, "Pretrain/Loss": 2.0212342739105225, "Pretrain/Loss (Raw)": 2.004546880722046, "Pretrain/Step": 3588, "Pretrain/Step Time": 8.426821621134877} +{"Pretrain/Learning Rate": 3.585419568479891e-05, "Pretrain/Loss": 2.019960403442383, "Pretrain/Loss (Raw)": 2.037386178970337, "Pretrain/Step": 3589, "Pretrain/Step Time": 8.426207626238465} +{"Pretrain/Learning Rate": 3.584654710964899e-05, "Pretrain/Loss": 2.0196919441223145, "Pretrain/Loss (Raw)": 2.0358500480651855, "Pretrain/Step": 3590, "Pretrain/Step Time": 8.429251598194242} +{"Pretrain/Learning Rate": 3.583889728362414e-05, "Pretrain/Loss": 2.0190510749816895, "Pretrain/Loss (Raw)": 2.0509371757507324, "Pretrain/Step": 3591, "Pretrain/Step Time": 8.434163104742765} +{"Pretrain/Learning Rate": 3.583124620760659e-05, "Pretrain/Loss": 2.0204854011535645, "Pretrain/Loss (Raw)": 2.3249425888061523, "Pretrain/Step": 3592, "Pretrain/Step Time": 8.432766200974584} +{"Pretrain/Learning Rate": 3.582359388247869e-05, "Pretrain/Loss": 2.0185546875, "Pretrain/Loss (Raw)": 2.060844898223877, "Pretrain/Step": 3593, "Pretrain/Step Time": 8.42865958623588} +{"Pretrain/Learning Rate": 3.581594030912294e-05, "Pretrain/Loss": 2.016866683959961, "Pretrain/Loss (Raw)": 1.8925249576568604, "Pretrain/Step": 3594, "Pretrain/Step Time": 8.43133495748043} +{"Pretrain/Learning Rate": 3.580828548842198e-05, "Pretrain/Loss": 2.012889862060547, "Pretrain/Loss (Raw)": 1.784010887145996, "Pretrain/Step": 3595, "Pretrain/Step Time": 8.43041411973536} +{"Pretrain/Learning Rate": 3.5800629421258606e-05, "Pretrain/Loss": 2.011557102203369, "Pretrain/Loss (Raw)": 2.0260891914367676, "Pretrain/Step": 3596, "Pretrain/Step Time": 8.440416041761637} +{"Pretrain/Learning Rate": 3.579297210851576e-05, "Pretrain/Loss": 2.009084701538086, "Pretrain/Loss (Raw)": 2.033433675765991, "Pretrain/Step": 3597, "Pretrain/Step Time": 8.439982952550054} +{"Pretrain/Learning Rate": 3.5785313551076505e-05, "Pretrain/Loss": 2.0097646713256836, "Pretrain/Loss (Raw)": 1.9962390661239624, "Pretrain/Step": 3598, "Pretrain/Step Time": 8.434034124016762} +{"Pretrain/Learning Rate": 3.577765374982408e-05, "Pretrain/Loss": 2.0093421936035156, "Pretrain/Loss (Raw)": 2.038565158843994, "Pretrain/Step": 3599, "Pretrain/Step Time": 8.427186414599419} +{"Pretrain/Learning Rate": 3.576999270564183e-05, "Pretrain/Loss": 2.0100932121276855, "Pretrain/Loss (Raw)": 2.1803832054138184, "Pretrain/Step": 3600, "Pretrain/Step Time": 8.426433935761452} +{"Pretrain/Learning Rate": 3.5762330419413273e-05, "Pretrain/Loss": 2.0090200901031494, "Pretrain/Loss (Raw)": 1.8178166151046753, "Pretrain/Step": 3601, "Pretrain/Step Time": 8.439577803015709} +{"Pretrain/Learning Rate": 3.575466689202206e-05, "Pretrain/Loss": 2.009890556335449, "Pretrain/Loss (Raw)": 2.021709442138672, "Pretrain/Step": 3602, "Pretrain/Step Time": 8.4355151001364} +{"Pretrain/Learning Rate": 3.5747002124351986e-05, "Pretrain/Loss": 2.0108017921447754, "Pretrain/Loss (Raw)": 2.07037091255188, "Pretrain/Step": 3603, "Pretrain/Step Time": 8.433567006140947} +{"Pretrain/Learning Rate": 3.573933611728698e-05, "Pretrain/Loss": 2.0101735591888428, "Pretrain/Loss (Raw)": 1.8284530639648438, "Pretrain/Step": 3604, "Pretrain/Step Time": 8.43022895231843} +{"Pretrain/Learning Rate": 3.573166887171113e-05, "Pretrain/Loss": 2.0123517513275146, "Pretrain/Loss (Raw)": 2.1771793365478516, "Pretrain/Step": 3605, "Pretrain/Step Time": 8.420964626595378} +{"Pretrain/Learning Rate": 3.5724000388508655e-05, "Pretrain/Loss": 2.0090255737304688, "Pretrain/Loss (Raw)": 1.7945529222488403, "Pretrain/Step": 3606, "Pretrain/Step Time": 8.429796384647489} +{"Pretrain/Learning Rate": 3.571633066856392e-05, "Pretrain/Loss": 2.0102767944335938, "Pretrain/Loss (Raw)": 2.194002866744995, "Pretrain/Step": 3607, "Pretrain/Step Time": 8.436222240328789} +{"Pretrain/Learning Rate": 3.570865971276144e-05, "Pretrain/Loss": 2.010554790496826, "Pretrain/Loss (Raw)": 2.1479504108428955, "Pretrain/Step": 3608, "Pretrain/Step Time": 8.435311201959848} +{"Pretrain/Learning Rate": 3.570098752198586e-05, "Pretrain/Loss": 2.0113518238067627, "Pretrain/Loss (Raw)": 2.1109676361083984, "Pretrain/Step": 3609, "Pretrain/Step Time": 8.436062945052981} +{"Pretrain/Learning Rate": 3.569331409712198e-05, "Pretrain/Loss": 2.0091464519500732, "Pretrain/Loss (Raw)": 1.9275953769683838, "Pretrain/Step": 3610, "Pretrain/Step Time": 8.436793439090252} +{"Pretrain/Learning Rate": 3.568563943905472e-05, "Pretrain/Loss": 2.009274959564209, "Pretrain/Loss (Raw)": 2.1182713508605957, "Pretrain/Step": 3611, "Pretrain/Step Time": 8.423737172037363} +{"Pretrain/Learning Rate": 3.5677963548669175e-05, "Pretrain/Loss": 2.0086617469787598, "Pretrain/Loss (Raw)": 2.0670688152313232, "Pretrain/Step": 3612, "Pretrain/Step Time": 8.432313794270158} +{"Pretrain/Learning Rate": 3.567028642685055e-05, "Pretrain/Loss": 2.0091075897216797, "Pretrain/Loss (Raw)": 1.9642369747161865, "Pretrain/Step": 3613, "Pretrain/Step Time": 8.4348808452487} +{"Pretrain/Learning Rate": 3.566260807448422e-05, "Pretrain/Loss": 2.0090999603271484, "Pretrain/Loss (Raw)": 1.967627763748169, "Pretrain/Step": 3614, "Pretrain/Step Time": 8.433320073410869} +{"Pretrain/Learning Rate": 3.565492849245568e-05, "Pretrain/Loss": 2.0086748600006104, "Pretrain/Loss (Raw)": 1.9743189811706543, "Pretrain/Step": 3615, "Pretrain/Step Time": 8.43445509672165} +{"Pretrain/Learning Rate": 3.564724768165058e-05, "Pretrain/Loss": 2.0079922676086426, "Pretrain/Loss (Raw)": 2.0537211894989014, "Pretrain/Step": 3616, "Pretrain/Step Time": 8.429821755737066} +{"Pretrain/Learning Rate": 3.5639565642954705e-05, "Pretrain/Loss": 2.0099964141845703, "Pretrain/Loss (Raw)": 2.1828675270080566, "Pretrain/Step": 3617, "Pretrain/Step Time": 8.420351376757026} +{"Pretrain/Learning Rate": 3.563188237725399e-05, "Pretrain/Loss": 2.0129547119140625, "Pretrain/Loss (Raw)": 2.2525839805603027, "Pretrain/Step": 3618, "Pretrain/Step Time": 8.425947897136211} +{"Pretrain/Learning Rate": 3.562419788543449e-05, "Pretrain/Loss": 2.0176587104797363, "Pretrain/Loss (Raw)": 2.567441701889038, "Pretrain/Step": 3619, "Pretrain/Step Time": 8.427590833976865} +{"Pretrain/Learning Rate": 3.561651216838243e-05, "Pretrain/Loss": 2.0192949771881104, "Pretrain/Loss (Raw)": 1.9558650255203247, "Pretrain/Step": 3620, "Pretrain/Step Time": 8.426827320829034} +{"Pretrain/Learning Rate": 3.560882522698417e-05, "Pretrain/Loss": 2.018183708190918, "Pretrain/Loss (Raw)": 1.8513429164886475, "Pretrain/Step": 3621, "Pretrain/Step Time": 8.42179461941123} +{"Pretrain/Learning Rate": 3.560113706212618e-05, "Pretrain/Loss": 2.021322250366211, "Pretrain/Loss (Raw)": 2.1209189891815186, "Pretrain/Step": 3622, "Pretrain/Step Time": 8.418735543265939} +{"Pretrain/Learning Rate": 3.559344767469512e-05, "Pretrain/Loss": 2.023395538330078, "Pretrain/Loss (Raw)": 2.1439208984375, "Pretrain/Step": 3623, "Pretrain/Step Time": 8.418138857930899} +{"Pretrain/Learning Rate": 3.5585757065577755e-05, "Pretrain/Loss": 2.0246422290802, "Pretrain/Loss (Raw)": 2.006674289703369, "Pretrain/Step": 3624, "Pretrain/Step Time": 8.418690534308553} +{"Pretrain/Learning Rate": 3.557806523566099e-05, "Pretrain/Loss": 2.0243067741394043, "Pretrain/Loss (Raw)": 2.0055270195007324, "Pretrain/Step": 3625, "Pretrain/Step Time": 8.425244104117155} +{"Pretrain/Learning Rate": 3.557037218583191e-05, "Pretrain/Loss": 2.024388551712036, "Pretrain/Loss (Raw)": 2.2544283866882324, "Pretrain/Step": 3626, "Pretrain/Step Time": 8.428889675065875} +{"Pretrain/Learning Rate": 3.5562677916977704e-05, "Pretrain/Loss": 2.0262770652770996, "Pretrain/Loss (Raw)": 2.232542037963867, "Pretrain/Step": 3627, "Pretrain/Step Time": 8.429140899330378} +{"Pretrain/Learning Rate": 3.55549824299857e-05, "Pretrain/Loss": 2.0267796516418457, "Pretrain/Loss (Raw)": 1.9389983415603638, "Pretrain/Step": 3628, "Pretrain/Step Time": 8.425620045512915} +{"Pretrain/Learning Rate": 3.554728572574339e-05, "Pretrain/Loss": 2.0233712196350098, "Pretrain/Loss (Raw)": 1.8233702182769775, "Pretrain/Step": 3629, "Pretrain/Step Time": 8.436147259548306} +{"Pretrain/Learning Rate": 3.5539587805138385e-05, "Pretrain/Loss": 2.0226640701293945, "Pretrain/Loss (Raw)": 2.0034680366516113, "Pretrain/Step": 3630, "Pretrain/Step Time": 8.432895002886653} +{"Pretrain/Learning Rate": 3.5531888669058455e-05, "Pretrain/Loss": 2.0255231857299805, "Pretrain/Loss (Raw)": 2.219494342803955, "Pretrain/Step": 3631, "Pretrain/Step Time": 8.4323890209198} +{"Pretrain/Learning Rate": 3.552418831839149e-05, "Pretrain/Loss": 2.025378942489624, "Pretrain/Loss (Raw)": 2.110875129699707, "Pretrain/Step": 3632, "Pretrain/Step Time": 8.432764222845435} +{"Pretrain/Learning Rate": 3.551648675402554e-05, "Pretrain/Loss": 2.028205394744873, "Pretrain/Loss (Raw)": 2.0754575729370117, "Pretrain/Step": 3633, "Pretrain/Step Time": 8.42885546386242} +{"Pretrain/Learning Rate": 3.550878397684878e-05, "Pretrain/Loss": 2.029707908630371, "Pretrain/Loss (Raw)": 2.0377659797668457, "Pretrain/Step": 3634, "Pretrain/Step Time": 8.431887589395046} +{"Pretrain/Learning Rate": 3.5501079987749535e-05, "Pretrain/Loss": 2.032353401184082, "Pretrain/Loss (Raw)": 2.157600164413452, "Pretrain/Step": 3635, "Pretrain/Step Time": 8.432237517088652} +{"Pretrain/Learning Rate": 3.549337478761626e-05, "Pretrain/Loss": 2.0322747230529785, "Pretrain/Loss (Raw)": 2.066643476486206, "Pretrain/Step": 3636, "Pretrain/Step Time": 8.435910172760487} +{"Pretrain/Learning Rate": 3.548566837733756e-05, "Pretrain/Loss": 2.0309829711914062, "Pretrain/Loss (Raw)": 1.9169856309890747, "Pretrain/Step": 3637, "Pretrain/Step Time": 8.436597641557455} +{"Pretrain/Learning Rate": 3.547796075780218e-05, "Pretrain/Loss": 2.0308899879455566, "Pretrain/Loss (Raw)": 1.9008625745773315, "Pretrain/Step": 3638, "Pretrain/Step Time": 8.435866853222251} +{"Pretrain/Learning Rate": 3.547025192989898e-05, "Pretrain/Loss": 2.0315794944763184, "Pretrain/Loss (Raw)": 2.1521613597869873, "Pretrain/Step": 3639, "Pretrain/Step Time": 8.430483493953943} +{"Pretrain/Learning Rate": 3.546254189451699e-05, "Pretrain/Loss": 2.0327043533325195, "Pretrain/Loss (Raw)": 1.9019643068313599, "Pretrain/Step": 3640, "Pretrain/Step Time": 8.430545652285218} +{"Pretrain/Learning Rate": 3.5454830652545374e-05, "Pretrain/Loss": 2.032520294189453, "Pretrain/Loss (Raw)": 1.927437424659729, "Pretrain/Step": 3641, "Pretrain/Step Time": 8.434615064412355} +{"Pretrain/Learning Rate": 3.544711820487343e-05, "Pretrain/Loss": 2.0328712463378906, "Pretrain/Loss (Raw)": 2.0556838512420654, "Pretrain/Step": 3642, "Pretrain/Step Time": 8.437381267547607} +{"Pretrain/Learning Rate": 3.543940455239057e-05, "Pretrain/Loss": 2.034435272216797, "Pretrain/Loss (Raw)": 2.127687454223633, "Pretrain/Step": 3643, "Pretrain/Step Time": 8.433410320430994} +{"Pretrain/Learning Rate": 3.543168969598639e-05, "Pretrain/Loss": 2.0367929935455322, "Pretrain/Loss (Raw)": 2.0991060733795166, "Pretrain/Step": 3644, "Pretrain/Step Time": 8.430326888337731} +{"Pretrain/Learning Rate": 3.54239736365506e-05, "Pretrain/Loss": 2.0330018997192383, "Pretrain/Loss (Raw)": 1.6071323156356812, "Pretrain/Step": 3645, "Pretrain/Step Time": 8.425555134192109} +{"Pretrain/Learning Rate": 3.541625637497306e-05, "Pretrain/Loss": 2.033310651779175, "Pretrain/Loss (Raw)": 2.0053322315216064, "Pretrain/Step": 3646, "Pretrain/Step Time": 8.424442624673247} +{"Pretrain/Learning Rate": 3.540853791214373e-05, "Pretrain/Loss": 2.0351033210754395, "Pretrain/Loss (Raw)": 2.247767686843872, "Pretrain/Step": 3647, "Pretrain/Step Time": 8.431745644658804} +{"Pretrain/Learning Rate": 3.5400818248952786e-05, "Pretrain/Loss": 2.0340757369995117, "Pretrain/Loss (Raw)": 1.8388046026229858, "Pretrain/Step": 3648, "Pretrain/Step Time": 8.436278246343136} +{"Pretrain/Learning Rate": 3.539309738629045e-05, "Pretrain/Loss": 2.034636974334717, "Pretrain/Loss (Raw)": 1.9491662979125977, "Pretrain/Step": 3649, "Pretrain/Step Time": 8.438705883920193} +{"Pretrain/Learning Rate": 3.5385375325047166e-05, "Pretrain/Loss": 2.033780574798584, "Pretrain/Loss (Raw)": 1.9357593059539795, "Pretrain/Step": 3650, "Pretrain/Step Time": 8.428607411682606} +{"Pretrain/Learning Rate": 3.537765206611345e-05, "Pretrain/Loss": 2.0347344875335693, "Pretrain/Loss (Raw)": 2.028648853302002, "Pretrain/Step": 3651, "Pretrain/Step Time": 8.428841030225158} +{"Pretrain/Learning Rate": 3.536992761038001e-05, "Pretrain/Loss": 2.0344810485839844, "Pretrain/Loss (Raw)": 1.9828704595565796, "Pretrain/Step": 3652, "Pretrain/Step Time": 8.435629216954112} +{"Pretrain/Learning Rate": 3.536220195873764e-05, "Pretrain/Loss": 2.0314064025878906, "Pretrain/Loss (Raw)": 2.154735565185547, "Pretrain/Step": 3653, "Pretrain/Step Time": 8.436518432572484} +{"Pretrain/Learning Rate": 3.535447511207731e-05, "Pretrain/Loss": 2.0315334796905518, "Pretrain/Loss (Raw)": 2.1432738304138184, "Pretrain/Step": 3654, "Pretrain/Step Time": 8.434293989092112} +{"Pretrain/Learning Rate": 3.534674707129013e-05, "Pretrain/Loss": 2.0357789993286133, "Pretrain/Loss (Raw)": 2.463136911392212, "Pretrain/Step": 3655, "Pretrain/Step Time": 8.43567717820406} +{"Pretrain/Learning Rate": 3.5339017837267316e-05, "Pretrain/Loss": 2.0369114875793457, "Pretrain/Loss (Raw)": 2.1956348419189453, "Pretrain/Step": 3656, "Pretrain/Step Time": 8.431351706385612} +{"Pretrain/Learning Rate": 3.5331287410900246e-05, "Pretrain/Loss": 2.0379011631011963, "Pretrain/Loss (Raw)": 2.1875312328338623, "Pretrain/Step": 3657, "Pretrain/Step Time": 8.429257011041045} +{"Pretrain/Learning Rate": 3.532355579308043e-05, "Pretrain/Loss": 2.0381994247436523, "Pretrain/Loss (Raw)": 2.095616579055786, "Pretrain/Step": 3658, "Pretrain/Step Time": 8.435685439035296} +{"Pretrain/Learning Rate": 3.531582298469952e-05, "Pretrain/Loss": 2.0361461639404297, "Pretrain/Loss (Raw)": 1.7892004251480103, "Pretrain/Step": 3659, "Pretrain/Step Time": 8.436178226023912} +{"Pretrain/Learning Rate": 3.530808898664928e-05, "Pretrain/Loss": 2.0347213745117188, "Pretrain/Loss (Raw)": 1.770119309425354, "Pretrain/Step": 3660, "Pretrain/Step Time": 8.435297483578324} +{"Pretrain/Learning Rate": 3.530035379982166e-05, "Pretrain/Loss": 2.035526752471924, "Pretrain/Loss (Raw)": 2.031076669692993, "Pretrain/Step": 3661, "Pretrain/Step Time": 8.4285775013268} +{"Pretrain/Learning Rate": 3.5292617425108694e-05, "Pretrain/Loss": 2.035162925720215, "Pretrain/Loss (Raw)": 2.176145553588867, "Pretrain/Step": 3662, "Pretrain/Step Time": 8.427137283608317} +{"Pretrain/Learning Rate": 3.5284879863402585e-05, "Pretrain/Loss": 2.036259889602661, "Pretrain/Loss (Raw)": 2.080449104309082, "Pretrain/Step": 3663, "Pretrain/Step Time": 8.426191627979279} +{"Pretrain/Learning Rate": 3.527714111559567e-05, "Pretrain/Loss": 2.035548210144043, "Pretrain/Loss (Raw)": 1.916465401649475, "Pretrain/Step": 3664, "Pretrain/Step Time": 8.425482373684645} +{"Pretrain/Learning Rate": 3.526940118258041e-05, "Pretrain/Loss": 2.033892869949341, "Pretrain/Loss (Raw)": 1.7523138523101807, "Pretrain/Step": 3665, "Pretrain/Step Time": 8.43199516646564} +{"Pretrain/Learning Rate": 3.526166006524942e-05, "Pretrain/Loss": 2.034752368927002, "Pretrain/Loss (Raw)": 2.030576229095459, "Pretrain/Step": 3666, "Pretrain/Step Time": 8.4279566090554} +{"Pretrain/Learning Rate": 3.525391776449544e-05, "Pretrain/Loss": 2.0352556705474854, "Pretrain/Loss (Raw)": 2.124734401702881, "Pretrain/Step": 3667, "Pretrain/Step Time": 8.421192960813642} +{"Pretrain/Learning Rate": 3.5246174281211344e-05, "Pretrain/Loss": 2.0367064476013184, "Pretrain/Loss (Raw)": 2.1674606800079346, "Pretrain/Step": 3668, "Pretrain/Step Time": 8.42531575076282} +{"Pretrain/Learning Rate": 3.523842961629014e-05, "Pretrain/Loss": 2.035719871520996, "Pretrain/Loss (Raw)": 2.126589059829712, "Pretrain/Step": 3669, "Pretrain/Step Time": 8.434153316542506} +{"Pretrain/Learning Rate": 3.5230683770624987e-05, "Pretrain/Loss": 2.036022901535034, "Pretrain/Loss (Raw)": 1.901435375213623, "Pretrain/Step": 3670, "Pretrain/Step Time": 8.434001289308071} +{"Pretrain/Learning Rate": 3.522293674510918e-05, "Pretrain/Loss": 2.0364699363708496, "Pretrain/Loss (Raw)": 2.2000467777252197, "Pretrain/Step": 3671, "Pretrain/Step Time": 8.43634026311338} +{"Pretrain/Learning Rate": 3.5215188540636134e-05, "Pretrain/Loss": 2.037151336669922, "Pretrain/Loss (Raw)": 2.131011724472046, "Pretrain/Step": 3672, "Pretrain/Step Time": 8.432596184313297} +{"Pretrain/Learning Rate": 3.520743915809941e-05, "Pretrain/Loss": 2.036472797393799, "Pretrain/Loss (Raw)": 1.9027469158172607, "Pretrain/Step": 3673, "Pretrain/Step Time": 8.42879094183445} +{"Pretrain/Learning Rate": 3.51996885983927e-05, "Pretrain/Loss": 2.036597490310669, "Pretrain/Loss (Raw)": 2.045177936553955, "Pretrain/Step": 3674, "Pretrain/Step Time": 8.430081997066736} +{"Pretrain/Learning Rate": 3.519193686240984e-05, "Pretrain/Loss": 2.037349224090576, "Pretrain/Loss (Raw)": 2.1233553886413574, "Pretrain/Step": 3675, "Pretrain/Step Time": 8.435116231441498} +{"Pretrain/Learning Rate": 3.51841839510448e-05, "Pretrain/Loss": 2.038748264312744, "Pretrain/Loss (Raw)": 2.1879663467407227, "Pretrain/Step": 3676, "Pretrain/Step Time": 8.434349283576012} +{"Pretrain/Learning Rate": 3.517642986519167e-05, "Pretrain/Loss": 2.038808584213257, "Pretrain/Loss (Raw)": 1.9984729290008545, "Pretrain/Step": 3677, "Pretrain/Step Time": 8.438599072396755} +{"Pretrain/Learning Rate": 3.51686746057447e-05, "Pretrain/Loss": 2.0371296405792236, "Pretrain/Loss (Raw)": 1.8796439170837402, "Pretrain/Step": 3678, "Pretrain/Step Time": 8.430691046640277} +{"Pretrain/Learning Rate": 3.516091817359825e-05, "Pretrain/Loss": 2.036006212234497, "Pretrain/Loss (Raw)": 2.0086424350738525, "Pretrain/Step": 3679, "Pretrain/Step Time": 8.433035651221871} +{"Pretrain/Learning Rate": 3.515316056964684e-05, "Pretrain/Loss": 2.034810781478882, "Pretrain/Loss (Raw)": 1.856468915939331, "Pretrain/Step": 3680, "Pretrain/Step Time": 8.432169422507286} +{"Pretrain/Learning Rate": 3.5145401794785116e-05, "Pretrain/Loss": 2.038647174835205, "Pretrain/Loss (Raw)": 2.242122173309326, "Pretrain/Step": 3681, "Pretrain/Step Time": 8.440012289211154} +{"Pretrain/Learning Rate": 3.5137641849907844e-05, "Pretrain/Loss": 2.03889536857605, "Pretrain/Loss (Raw)": 2.0663845539093018, "Pretrain/Step": 3682, "Pretrain/Step Time": 8.436783803626895} +{"Pretrain/Learning Rate": 3.5129880735909945e-05, "Pretrain/Loss": 2.0391650199890137, "Pretrain/Loss (Raw)": 2.0767886638641357, "Pretrain/Step": 3683, "Pretrain/Step Time": 8.440621621906757} +{"Pretrain/Learning Rate": 3.512211845368647e-05, "Pretrain/Loss": 2.0378403663635254, "Pretrain/Loss (Raw)": 1.8867470026016235, "Pretrain/Step": 3684, "Pretrain/Step Time": 8.433524288237095} +{"Pretrain/Learning Rate": 3.511435500413259e-05, "Pretrain/Loss": 2.038151741027832, "Pretrain/Loss (Raw)": 2.085484504699707, "Pretrain/Step": 3685, "Pretrain/Step Time": 8.437548737972975} +{"Pretrain/Learning Rate": 3.510659038814364e-05, "Pretrain/Loss": 2.0363757610321045, "Pretrain/Loss (Raw)": 1.8399388790130615, "Pretrain/Step": 3686, "Pretrain/Step Time": 8.442608948796988} +{"Pretrain/Learning Rate": 3.509882460661506e-05, "Pretrain/Loss": 2.0405261516571045, "Pretrain/Loss (Raw)": 2.334980010986328, "Pretrain/Step": 3687, "Pretrain/Step Time": 8.441554568707943} +{"Pretrain/Learning Rate": 3.5091057660442434e-05, "Pretrain/Loss": 2.038907051086426, "Pretrain/Loss (Raw)": 1.8129218816757202, "Pretrain/Step": 3688, "Pretrain/Step Time": 8.445845987647772} +{"Pretrain/Learning Rate": 3.5083289550521495e-05, "Pretrain/Loss": 2.0389323234558105, "Pretrain/Loss (Raw)": 2.0964343547821045, "Pretrain/Step": 3689, "Pretrain/Step Time": 8.442284688353539} +{"Pretrain/Learning Rate": 3.507552027774809e-05, "Pretrain/Loss": 2.04063081741333, "Pretrain/Loss (Raw)": 2.3058369159698486, "Pretrain/Step": 3690, "Pretrain/Step Time": 8.436420198529959} +{"Pretrain/Learning Rate": 3.5067749843018205e-05, "Pretrain/Loss": 2.0391688346862793, "Pretrain/Loss (Raw)": 1.9717936515808105, "Pretrain/Step": 3691, "Pretrain/Step Time": 8.44448797032237} +{"Pretrain/Learning Rate": 3.5059978247227965e-05, "Pretrain/Loss": 2.039017677307129, "Pretrain/Loss (Raw)": 1.9776989221572876, "Pretrain/Step": 3692, "Pretrain/Step Time": 8.448098849505186} +{"Pretrain/Learning Rate": 3.505220549127364e-05, "Pretrain/Loss": 2.0388987064361572, "Pretrain/Loss (Raw)": 2.0411696434020996, "Pretrain/Step": 3693, "Pretrain/Step Time": 8.445538913831115} +{"Pretrain/Learning Rate": 3.50444315760516e-05, "Pretrain/Loss": 2.0403947830200195, "Pretrain/Loss (Raw)": 2.108167886734009, "Pretrain/Step": 3694, "Pretrain/Step Time": 8.447570836171508} +{"Pretrain/Learning Rate": 3.503665650245838e-05, "Pretrain/Loss": 2.040623903274536, "Pretrain/Loss (Raw)": 2.072040319442749, "Pretrain/Step": 3695, "Pretrain/Step Time": 8.44650630094111} +{"Pretrain/Learning Rate": 3.502888027139065e-05, "Pretrain/Loss": 2.0406746864318848, "Pretrain/Loss (Raw)": 2.0117099285125732, "Pretrain/Step": 3696, "Pretrain/Step Time": 8.442486137151718} +{"Pretrain/Learning Rate": 3.502110288374517e-05, "Pretrain/Loss": 2.0403923988342285, "Pretrain/Loss (Raw)": 2.0586657524108887, "Pretrain/Step": 3697, "Pretrain/Step Time": 8.433560306206346} +{"Pretrain/Learning Rate": 3.50133243404189e-05, "Pretrain/Loss": 2.0403077602386475, "Pretrain/Loss (Raw)": 2.091732978820801, "Pretrain/Step": 3698, "Pretrain/Step Time": 8.441741501912475} +{"Pretrain/Learning Rate": 3.5005544642308874e-05, "Pretrain/Loss": 2.0414013862609863, "Pretrain/Loss (Raw)": 2.0149030685424805, "Pretrain/Step": 3699, "Pretrain/Step Time": 8.438964696601033} +{"Pretrain/Learning Rate": 3.49977637903123e-05, "Pretrain/Loss": 2.0411527156829834, "Pretrain/Loss (Raw)": 1.978203535079956, "Pretrain/Step": 3700, "Pretrain/Step Time": 8.438258921727538} +{"Pretrain/Learning Rate": 3.4989981785326485e-05, "Pretrain/Loss": 2.039360284805298, "Pretrain/Loss (Raw)": 2.01961612701416, "Pretrain/Step": 3701, "Pretrain/Step Time": 8.433817114681005} +{"Pretrain/Learning Rate": 3.498219862824891e-05, "Pretrain/Loss": 2.040281295776367, "Pretrain/Loss (Raw)": 2.156151056289673, "Pretrain/Step": 3702, "Pretrain/Step Time": 8.434869732707739} +{"Pretrain/Learning Rate": 3.497441431997714e-05, "Pretrain/Loss": 2.039869785308838, "Pretrain/Loss (Raw)": 1.9596495628356934, "Pretrain/Step": 3703, "Pretrain/Step Time": 8.438628900796175} +{"Pretrain/Learning Rate": 3.4966628861408914e-05, "Pretrain/Loss": 2.038743734359741, "Pretrain/Loss (Raw)": 2.0162854194641113, "Pretrain/Step": 3704, "Pretrain/Step Time": 8.440166929736733} +{"Pretrain/Learning Rate": 3.495884225344208e-05, "Pretrain/Loss": 2.038513660430908, "Pretrain/Loss (Raw)": 2.106771469116211, "Pretrain/Step": 3705, "Pretrain/Step Time": 8.445287434384227} +{"Pretrain/Learning Rate": 3.495105449697463e-05, "Pretrain/Loss": 2.039051055908203, "Pretrain/Loss (Raw)": 2.002805709838867, "Pretrain/Step": 3706, "Pretrain/Step Time": 8.436608927324414} +{"Pretrain/Learning Rate": 3.494326559290469e-05, "Pretrain/Loss": 2.041043281555176, "Pretrain/Loss (Raw)": 2.2752010822296143, "Pretrain/Step": 3707, "Pretrain/Step Time": 8.435581678524613} +{"Pretrain/Learning Rate": 3.4935475542130505e-05, "Pretrain/Loss": 2.0403590202331543, "Pretrain/Loss (Raw)": 1.8957161903381348, "Pretrain/Step": 3708, "Pretrain/Step Time": 8.435838509351015} +{"Pretrain/Learning Rate": 3.492768434555046e-05, "Pretrain/Loss": 2.0425641536712646, "Pretrain/Loss (Raw)": 2.0917298793792725, "Pretrain/Step": 3709, "Pretrain/Step Time": 8.442468727007508} +{"Pretrain/Learning Rate": 3.4919892004063084e-05, "Pretrain/Loss": 2.042773723602295, "Pretrain/Loss (Raw)": 2.119563102722168, "Pretrain/Step": 3710, "Pretrain/Step Time": 8.440335065126419} +{"Pretrain/Learning Rate": 3.491209851856701e-05, "Pretrain/Loss": 2.041818618774414, "Pretrain/Loss (Raw)": 2.0273869037628174, "Pretrain/Step": 3711, "Pretrain/Step Time": 8.435862818732858} +{"Pretrain/Learning Rate": 3.490430388996103e-05, "Pretrain/Loss": 2.042311191558838, "Pretrain/Loss (Raw)": 2.070997714996338, "Pretrain/Step": 3712, "Pretrain/Step Time": 8.431760400533676} +{"Pretrain/Learning Rate": 3.4896508119144056e-05, "Pretrain/Loss": 2.043776035308838, "Pretrain/Loss (Raw)": 2.063660144805908, "Pretrain/Step": 3713, "Pretrain/Step Time": 8.432337956503034} +{"Pretrain/Learning Rate": 3.4888711207015124e-05, "Pretrain/Loss": 2.046006679534912, "Pretrain/Loss (Raw)": 2.102421760559082, "Pretrain/Step": 3714, "Pretrain/Step Time": 8.436920084059238} +{"Pretrain/Learning Rate": 3.488091315447343e-05, "Pretrain/Loss": 2.0487282276153564, "Pretrain/Loss (Raw)": 2.428762435913086, "Pretrain/Step": 3715, "Pretrain/Step Time": 8.438047973439097} +{"Pretrain/Learning Rate": 3.487311396241826e-05, "Pretrain/Loss": 2.049806594848633, "Pretrain/Loss (Raw)": 2.1425588130950928, "Pretrain/Step": 3716, "Pretrain/Step Time": 8.435443349182606} +{"Pretrain/Learning Rate": 3.486531363174908e-05, "Pretrain/Loss": 2.047065258026123, "Pretrain/Loss (Raw)": 1.6864856481552124, "Pretrain/Step": 3717, "Pretrain/Step Time": 8.435025595128536} +{"Pretrain/Learning Rate": 3.4857512163365424e-05, "Pretrain/Loss": 2.0474815368652344, "Pretrain/Loss (Raw)": 2.0891616344451904, "Pretrain/Step": 3718, "Pretrain/Step Time": 8.4338174238801} +{"Pretrain/Learning Rate": 3.484970955816703e-05, "Pretrain/Loss": 2.046459674835205, "Pretrain/Loss (Raw)": 1.9201570749282837, "Pretrain/Step": 3719, "Pretrain/Step Time": 8.432310840114951} +{"Pretrain/Learning Rate": 3.484190581705371e-05, "Pretrain/Loss": 2.0457112789154053, "Pretrain/Loss (Raw)": 2.2291107177734375, "Pretrain/Step": 3720, "Pretrain/Step Time": 8.438142400234938} +{"Pretrain/Learning Rate": 3.483410094092543e-05, "Pretrain/Loss": 2.045036554336548, "Pretrain/Loss (Raw)": 1.9744863510131836, "Pretrain/Step": 3721, "Pretrain/Step Time": 8.432978879660368} +{"Pretrain/Learning Rate": 3.48262949306823e-05, "Pretrain/Loss": 2.0462565422058105, "Pretrain/Loss (Raw)": 2.048701763153076, "Pretrain/Step": 3722, "Pretrain/Step Time": 8.43586433492601} +{"Pretrain/Learning Rate": 3.481848778722453e-05, "Pretrain/Loss": 2.0484561920166016, "Pretrain/Loss (Raw)": 2.0655603408813477, "Pretrain/Step": 3723, "Pretrain/Step Time": 8.435785042122006} +{"Pretrain/Learning Rate": 3.4810679511452484e-05, "Pretrain/Loss": 2.046549081802368, "Pretrain/Loss (Raw)": 1.7819536924362183, "Pretrain/Step": 3724, "Pretrain/Step Time": 8.426639949902892} +{"Pretrain/Learning Rate": 3.480287010426664e-05, "Pretrain/Loss": 2.0474777221679688, "Pretrain/Loss (Raw)": 2.152311325073242, "Pretrain/Step": 3725, "Pretrain/Step Time": 8.431650644168258} +{"Pretrain/Learning Rate": 3.479505956656764e-05, "Pretrain/Loss": 2.050403594970703, "Pretrain/Loss (Raw)": 2.370763063430786, "Pretrain/Step": 3726, "Pretrain/Step Time": 8.433901017531753} +{"Pretrain/Learning Rate": 3.47872478992562e-05, "Pretrain/Loss": 2.050271511077881, "Pretrain/Loss (Raw)": 2.0216782093048096, "Pretrain/Step": 3727, "Pretrain/Step Time": 8.434551170095801} +{"Pretrain/Learning Rate": 3.477943510323322e-05, "Pretrain/Loss": 2.050232410430908, "Pretrain/Loss (Raw)": 2.175340414047241, "Pretrain/Step": 3728, "Pretrain/Step Time": 8.433683162555099} +{"Pretrain/Learning Rate": 3.4771621179399696e-05, "Pretrain/Loss": 2.053349733352661, "Pretrain/Loss (Raw)": 2.216837167739868, "Pretrain/Step": 3729, "Pretrain/Step Time": 8.42259756848216} +{"Pretrain/Learning Rate": 3.476380612865679e-05, "Pretrain/Loss": 2.0538110733032227, "Pretrain/Loss (Raw)": 2.0807554721832275, "Pretrain/Step": 3730, "Pretrain/Step Time": 8.42595505528152} +{"Pretrain/Learning Rate": 3.475598995190572e-05, "Pretrain/Loss": 2.052919387817383, "Pretrain/Loss (Raw)": 1.9562692642211914, "Pretrain/Step": 3731, "Pretrain/Step Time": 8.431248949840665} +{"Pretrain/Learning Rate": 3.4748172650047945e-05, "Pretrain/Loss": 2.054752826690674, "Pretrain/Loss (Raw)": 2.0631346702575684, "Pretrain/Step": 3732, "Pretrain/Step Time": 8.437134772539139} +{"Pretrain/Learning Rate": 3.474035422398496e-05, "Pretrain/Loss": 2.0542826652526855, "Pretrain/Loss (Raw)": 2.116988182067871, "Pretrain/Step": 3733, "Pretrain/Step Time": 8.437033578753471} +{"Pretrain/Learning Rate": 3.473253467461842e-05, "Pretrain/Loss": 2.055617332458496, "Pretrain/Loss (Raw)": 1.9653613567352295, "Pretrain/Step": 3734, "Pretrain/Step Time": 8.430439099669456} +{"Pretrain/Learning Rate": 3.4724714002850125e-05, "Pretrain/Loss": 2.055548667907715, "Pretrain/Loss (Raw)": 2.185222625732422, "Pretrain/Step": 3735, "Pretrain/Step Time": 8.428915102034807} +{"Pretrain/Learning Rate": 3.471689220958198e-05, "Pretrain/Loss": 2.0547282695770264, "Pretrain/Loss (Raw)": 2.0429441928863525, "Pretrain/Step": 3736, "Pretrain/Step Time": 8.429635027423501} +{"Pretrain/Learning Rate": 3.470906929571605e-05, "Pretrain/Loss": 2.053236961364746, "Pretrain/Loss (Raw)": 1.9200834035873413, "Pretrain/Step": 3737, "Pretrain/Step Time": 8.43181124702096} +{"Pretrain/Learning Rate": 3.470124526215449e-05, "Pretrain/Loss": 2.052581310272217, "Pretrain/Loss (Raw)": 1.8436875343322754, "Pretrain/Step": 3738, "Pretrain/Step Time": 8.436271980404854} +{"Pretrain/Learning Rate": 3.469342010979962e-05, "Pretrain/Loss": 2.0517072677612305, "Pretrain/Loss (Raw)": 2.0063729286193848, "Pretrain/Step": 3739, "Pretrain/Step Time": 8.437002565711737} +{"Pretrain/Learning Rate": 3.4685593839553856e-05, "Pretrain/Loss": 2.051520824432373, "Pretrain/Loss (Raw)": 2.0432045459747314, "Pretrain/Step": 3740, "Pretrain/Step Time": 8.429109750315547} +{"Pretrain/Learning Rate": 3.467776645231978e-05, "Pretrain/Loss": 2.0503978729248047, "Pretrain/Loss (Raw)": 1.8205053806304932, "Pretrain/Step": 3741, "Pretrain/Step Time": 8.431813945993781} +{"Pretrain/Learning Rate": 3.466993794900007e-05, "Pretrain/Loss": 2.0511317253112793, "Pretrain/Loss (Raw)": 2.061575174331665, "Pretrain/Step": 3742, "Pretrain/Step Time": 8.434000704437494} +{"Pretrain/Learning Rate": 3.466210833049755e-05, "Pretrain/Loss": 2.052371025085449, "Pretrain/Loss (Raw)": 2.132932424545288, "Pretrain/Step": 3743, "Pretrain/Step Time": 8.438744710758328} +{"Pretrain/Learning Rate": 3.465427759771516e-05, "Pretrain/Loss": 2.0530803203582764, "Pretrain/Loss (Raw)": 2.1445133686065674, "Pretrain/Step": 3744, "Pretrain/Step Time": 8.432359971106052} +{"Pretrain/Learning Rate": 3.464644575155599e-05, "Pretrain/Loss": 2.049266815185547, "Pretrain/Loss (Raw)": 1.6947170495986938, "Pretrain/Step": 3745, "Pretrain/Step Time": 8.4345215074718} +{"Pretrain/Learning Rate": 3.463861279292324e-05, "Pretrain/Loss": 2.048297882080078, "Pretrain/Loss (Raw)": 2.1285927295684814, "Pretrain/Step": 3746, "Pretrain/Step Time": 8.428062753751874} +{"Pretrain/Learning Rate": 3.4630778722720244e-05, "Pretrain/Loss": 2.0440492630004883, "Pretrain/Loss (Raw)": 2.0236001014709473, "Pretrain/Step": 3747, "Pretrain/Step Time": 8.426592882722616} +{"Pretrain/Learning Rate": 3.462294354185046e-05, "Pretrain/Loss": 2.0443058013916016, "Pretrain/Loss (Raw)": 1.9886834621429443, "Pretrain/Step": 3748, "Pretrain/Step Time": 8.428620334714651} +{"Pretrain/Learning Rate": 3.4615107251217496e-05, "Pretrain/Loss": 2.0450448989868164, "Pretrain/Loss (Raw)": 1.9459645748138428, "Pretrain/Step": 3749, "Pretrain/Step Time": 8.429715668782592} +{"Pretrain/Learning Rate": 3.460726985172504e-05, "Pretrain/Loss": 2.045776605606079, "Pretrain/Loss (Raw)": 2.214597463607788, "Pretrain/Step": 3750, "Pretrain/Step Time": 8.42965167015791} +{"Pretrain/Learning Rate": 3.4599431344276966e-05, "Pretrain/Loss": 2.0440735816955566, "Pretrain/Loss (Raw)": 1.9259252548217773, "Pretrain/Step": 3751, "Pretrain/Step Time": 8.433389699086547} +{"Pretrain/Learning Rate": 3.459159172977723e-05, "Pretrain/Loss": 2.0446090698242188, "Pretrain/Loss (Raw)": 2.0751867294311523, "Pretrain/Step": 3752, "Pretrain/Step Time": 8.429513989016414} +{"Pretrain/Learning Rate": 3.4583751009129936e-05, "Pretrain/Loss": 2.0457117557525635, "Pretrain/Loss (Raw)": 2.1466987133026123, "Pretrain/Step": 3753, "Pretrain/Step Time": 8.424773333594203} +{"Pretrain/Learning Rate": 3.457590918323932e-05, "Pretrain/Loss": 2.0434224605560303, "Pretrain/Loss (Raw)": 1.9614061117172241, "Pretrain/Step": 3754, "Pretrain/Step Time": 8.431933170184493} +{"Pretrain/Learning Rate": 3.4568066253009736e-05, "Pretrain/Loss": 2.0427803993225098, "Pretrain/Loss (Raw)": 2.1503748893737793, "Pretrain/Step": 3755, "Pretrain/Step Time": 8.429501790553331} +{"Pretrain/Learning Rate": 3.456022221934566e-05, "Pretrain/Loss": 2.046194314956665, "Pretrain/Loss (Raw)": 2.3759605884552, "Pretrain/Step": 3756, "Pretrain/Step Time": 8.424149483442307} +{"Pretrain/Learning Rate": 3.455237708315171e-05, "Pretrain/Loss": 2.0474908351898193, "Pretrain/Loss (Raw)": 1.9893114566802979, "Pretrain/Step": 3757, "Pretrain/Step Time": 8.417603265494108} +{"Pretrain/Learning Rate": 3.454453084533262e-05, "Pretrain/Loss": 2.0490260124206543, "Pretrain/Loss (Raw)": 2.1999709606170654, "Pretrain/Step": 3758, "Pretrain/Step Time": 8.419045727699995} +{"Pretrain/Learning Rate": 3.453668350679327e-05, "Pretrain/Loss": 2.046957015991211, "Pretrain/Loss (Raw)": 1.9546399116516113, "Pretrain/Step": 3759, "Pretrain/Step Time": 8.421347178518772} +{"Pretrain/Learning Rate": 3.4528835068438625e-05, "Pretrain/Loss": 2.04718017578125, "Pretrain/Loss (Raw)": 2.1394691467285156, "Pretrain/Step": 3760, "Pretrain/Step Time": 8.428547067567706} +{"Pretrain/Learning Rate": 3.452098553117382e-05, "Pretrain/Loss": 2.0475869178771973, "Pretrain/Loss (Raw)": 2.1274967193603516, "Pretrain/Step": 3761, "Pretrain/Step Time": 8.429529547691345} +{"Pretrain/Learning Rate": 3.4513134895904105e-05, "Pretrain/Loss": 2.0465173721313477, "Pretrain/Loss (Raw)": 1.9009045362472534, "Pretrain/Step": 3762, "Pretrain/Step Time": 8.424865202978253} +{"Pretrain/Learning Rate": 3.450528316353484e-05, "Pretrain/Loss": 2.0460782051086426, "Pretrain/Loss (Raw)": 2.101372718811035, "Pretrain/Step": 3763, "Pretrain/Step Time": 8.427411245182157} +{"Pretrain/Learning Rate": 3.4497430334971534e-05, "Pretrain/Loss": 2.0444529056549072, "Pretrain/Loss (Raw)": 1.8585907220840454, "Pretrain/Step": 3764, "Pretrain/Step Time": 8.424929287284613} +{"Pretrain/Learning Rate": 3.448957641111981e-05, "Pretrain/Loss": 2.044178009033203, "Pretrain/Loss (Raw)": 1.8818031549453735, "Pretrain/Step": 3765, "Pretrain/Step Time": 8.424199188128114} +{"Pretrain/Learning Rate": 3.4481721392885414e-05, "Pretrain/Loss": 2.0438804626464844, "Pretrain/Loss (Raw)": 1.8627874851226807, "Pretrain/Step": 3766, "Pretrain/Step Time": 8.430243659764528} +{"Pretrain/Learning Rate": 3.447386528117423e-05, "Pretrain/Loss": 2.0434632301330566, "Pretrain/Loss (Raw)": 2.098767042160034, "Pretrain/Step": 3767, "Pretrain/Step Time": 8.433582048863173} +{"Pretrain/Learning Rate": 3.446600807689226e-05, "Pretrain/Loss": 2.0473828315734863, "Pretrain/Loss (Raw)": 2.403674602508545, "Pretrain/Step": 3768, "Pretrain/Step Time": 8.431980887427926} +{"Pretrain/Learning Rate": 3.4458149780945636e-05, "Pretrain/Loss": 2.0477747917175293, "Pretrain/Loss (Raw)": 1.9775807857513428, "Pretrain/Step": 3769, "Pretrain/Step Time": 8.430189860984683} +{"Pretrain/Learning Rate": 3.4450290394240606e-05, "Pretrain/Loss": 2.0484437942504883, "Pretrain/Loss (Raw)": 2.1413393020629883, "Pretrain/Step": 3770, "Pretrain/Step Time": 8.427041618153453} +{"Pretrain/Learning Rate": 3.444242991768356e-05, "Pretrain/Loss": 2.0473289489746094, "Pretrain/Loss (Raw)": 1.9849932193756104, "Pretrain/Step": 3771, "Pretrain/Step Time": 8.4323350507766} +{"Pretrain/Learning Rate": 3.4434568352181e-05, "Pretrain/Loss": 2.047602891921997, "Pretrain/Loss (Raw)": 2.1341488361358643, "Pretrain/Step": 3772, "Pretrain/Step Time": 8.43721223808825} +{"Pretrain/Learning Rate": 3.442670569863956e-05, "Pretrain/Loss": 2.05141544342041, "Pretrain/Loss (Raw)": 2.0951220989227295, "Pretrain/Step": 3773, "Pretrain/Step Time": 8.441028898581862} +{"Pretrain/Learning Rate": 3.4418841957965995e-05, "Pretrain/Loss": 2.0498292446136475, "Pretrain/Loss (Raw)": 1.8023253679275513, "Pretrain/Step": 3774, "Pretrain/Step Time": 8.4399534445256} +{"Pretrain/Learning Rate": 3.44109771310672e-05, "Pretrain/Loss": 2.0495619773864746, "Pretrain/Loss (Raw)": 2.2135262489318848, "Pretrain/Step": 3775, "Pretrain/Step Time": 8.438724948093295} +{"Pretrain/Learning Rate": 3.440311121885018e-05, "Pretrain/Loss": 2.0516555309295654, "Pretrain/Loss (Raw)": 2.106801748275757, "Pretrain/Step": 3776, "Pretrain/Step Time": 8.43473850376904} +{"Pretrain/Learning Rate": 3.4395244222222054e-05, "Pretrain/Loss": 2.0516343116760254, "Pretrain/Loss (Raw)": 1.946446418762207, "Pretrain/Step": 3777, "Pretrain/Step Time": 8.436382252722979} +{"Pretrain/Learning Rate": 3.43873761420901e-05, "Pretrain/Loss": 2.052480936050415, "Pretrain/Loss (Raw)": 2.044142961502075, "Pretrain/Step": 3778, "Pretrain/Step Time": 8.43463203124702} +{"Pretrain/Learning Rate": 3.4379506979361694e-05, "Pretrain/Loss": 2.0524086952209473, "Pretrain/Loss (Raw)": 2.0193893909454346, "Pretrain/Step": 3779, "Pretrain/Step Time": 8.436540201306343} +{"Pretrain/Learning Rate": 3.437163673494434e-05, "Pretrain/Loss": 2.0525500774383545, "Pretrain/Loss (Raw)": 2.000981330871582, "Pretrain/Step": 3780, "Pretrain/Step Time": 8.436739780008793} +{"Pretrain/Learning Rate": 3.436376540974568e-05, "Pretrain/Loss": 2.054811716079712, "Pretrain/Loss (Raw)": 2.4442148208618164, "Pretrain/Step": 3781, "Pretrain/Step Time": 8.439776750281453} +{"Pretrain/Learning Rate": 3.4355893004673476e-05, "Pretrain/Loss": 2.053224563598633, "Pretrain/Loss (Raw)": 1.9401094913482666, "Pretrain/Step": 3782, "Pretrain/Step Time": 8.446355814114213} +{"Pretrain/Learning Rate": 3.4348019520635587e-05, "Pretrain/Loss": 2.0495691299438477, "Pretrain/Loss (Raw)": 1.9952728748321533, "Pretrain/Step": 3783, "Pretrain/Step Time": 8.45076934993267} +{"Pretrain/Learning Rate": 3.434014495854006e-05, "Pretrain/Loss": 2.0469489097595215, "Pretrain/Loss (Raw)": 1.8602370023727417, "Pretrain/Step": 3784, "Pretrain/Step Time": 8.449796440079808} +{"Pretrain/Learning Rate": 3.4332269319294984e-05, "Pretrain/Loss": 2.0445289611816406, "Pretrain/Loss (Raw)": 1.8777568340301514, "Pretrain/Step": 3785, "Pretrain/Step Time": 8.45132696814835} +{"Pretrain/Learning Rate": 3.432439260380865e-05, "Pretrain/Loss": 2.0446889400482178, "Pretrain/Loss (Raw)": 2.116123914718628, "Pretrain/Step": 3786, "Pretrain/Step Time": 8.44907626695931} +{"Pretrain/Learning Rate": 3.4316514812989406e-05, "Pretrain/Loss": 2.0479226112365723, "Pretrain/Loss (Raw)": 2.203070878982544, "Pretrain/Step": 3787, "Pretrain/Step Time": 8.44855116866529} +{"Pretrain/Learning Rate": 3.4308635947745796e-05, "Pretrain/Loss": 2.0502617359161377, "Pretrain/Loss (Raw)": 2.0695579051971436, "Pretrain/Step": 3788, "Pretrain/Step Time": 8.452379567548633} +{"Pretrain/Learning Rate": 3.43007560089864e-05, "Pretrain/Loss": 2.050682544708252, "Pretrain/Loss (Raw)": 2.0849127769470215, "Pretrain/Step": 3789, "Pretrain/Step Time": 8.451346164569259} +{"Pretrain/Learning Rate": 3.429287499762001e-05, "Pretrain/Loss": 2.0562784671783447, "Pretrain/Loss (Raw)": 2.892442226409912, "Pretrain/Step": 3790, "Pretrain/Step Time": 8.454987550154328} +{"Pretrain/Learning Rate": 3.428499291455548e-05, "Pretrain/Loss": 2.0563480854034424, "Pretrain/Loss (Raw)": 2.0893585681915283, "Pretrain/Step": 3791, "Pretrain/Step Time": 8.451350783929229} +{"Pretrain/Learning Rate": 3.427710976070182e-05, "Pretrain/Loss": 2.0567734241485596, "Pretrain/Loss (Raw)": 1.9709113836288452, "Pretrain/Step": 3792, "Pretrain/Step Time": 8.45188045874238} +{"Pretrain/Learning Rate": 3.426922553696814e-05, "Pretrain/Loss": 2.0594825744628906, "Pretrain/Loss (Raw)": 2.099074363708496, "Pretrain/Step": 3793, "Pretrain/Step Time": 8.44876436702907} +{"Pretrain/Learning Rate": 3.426134024426371e-05, "Pretrain/Loss": 2.059999942779541, "Pretrain/Loss (Raw)": 2.0968143939971924, "Pretrain/Step": 3794, "Pretrain/Step Time": 8.453600129112601} +{"Pretrain/Learning Rate": 3.425345388349786e-05, "Pretrain/Loss": 2.0597596168518066, "Pretrain/Loss (Raw)": 2.093963384628296, "Pretrain/Step": 3795, "Pretrain/Step Time": 8.45355098694563} +{"Pretrain/Learning Rate": 3.4245566455580116e-05, "Pretrain/Loss": 2.0588464736938477, "Pretrain/Loss (Raw)": 2.0505881309509277, "Pretrain/Step": 3796, "Pretrain/Step Time": 8.450769590213895} +{"Pretrain/Learning Rate": 3.423767796142008e-05, "Pretrain/Loss": 2.0589165687561035, "Pretrain/Loss (Raw)": 2.135554313659668, "Pretrain/Step": 3797, "Pretrain/Step Time": 8.443422392010689} +{"Pretrain/Learning Rate": 3.422978840192749e-05, "Pretrain/Loss": 2.061659812927246, "Pretrain/Loss (Raw)": 2.2525742053985596, "Pretrain/Step": 3798, "Pretrain/Step Time": 8.44449670985341} +{"Pretrain/Learning Rate": 3.4221897778012214e-05, "Pretrain/Loss": 2.059692621231079, "Pretrain/Loss (Raw)": 1.9482489824295044, "Pretrain/Step": 3799, "Pretrain/Step Time": 8.45089091360569} +{"Pretrain/Learning Rate": 3.421400609058423e-05, "Pretrain/Loss": 2.058115243911743, "Pretrain/Loss (Raw)": 1.9291090965270996, "Pretrain/Step": 3800, "Pretrain/Step Time": 8.449555426836014} +{"Pretrain/Learning Rate": 3.420611334055365e-05, "Pretrain/Loss": 2.0586793422698975, "Pretrain/Loss (Raw)": 1.9749464988708496, "Pretrain/Step": 3801, "Pretrain/Step Time": 8.446375856176019} +{"Pretrain/Learning Rate": 3.4198219528830675e-05, "Pretrain/Loss": 2.058055877685547, "Pretrain/Loss (Raw)": 1.9653650522232056, "Pretrain/Step": 3802, "Pretrain/Step Time": 8.44767514616251} +{"Pretrain/Learning Rate": 3.4190324656325704e-05, "Pretrain/Loss": 2.057668685913086, "Pretrain/Loss (Raw)": 2.073791265487671, "Pretrain/Step": 3803, "Pretrain/Step Time": 8.443238703534007} +{"Pretrain/Learning Rate": 3.418242872394919e-05, "Pretrain/Loss": 2.055689573287964, "Pretrain/Loss (Raw)": 1.934665322303772, "Pretrain/Step": 3804, "Pretrain/Step Time": 8.443652560934424} +{"Pretrain/Learning Rate": 3.417453173261171e-05, "Pretrain/Loss": 2.056936740875244, "Pretrain/Loss (Raw)": 2.1581203937530518, "Pretrain/Step": 3805, "Pretrain/Step Time": 8.44769498333335} +{"Pretrain/Learning Rate": 3.4166633683224015e-05, "Pretrain/Loss": 2.0574421882629395, "Pretrain/Loss (Raw)": 1.9443303346633911, "Pretrain/Step": 3806, "Pretrain/Step Time": 8.446212599053979} +{"Pretrain/Learning Rate": 3.4158734576696915e-05, "Pretrain/Loss": 2.0581884384155273, "Pretrain/Loss (Raw)": 2.104163885116577, "Pretrain/Step": 3807, "Pretrain/Step Time": 8.445655539631844} +{"Pretrain/Learning Rate": 3.4150834413941394e-05, "Pretrain/Loss": 2.0572524070739746, "Pretrain/Loss (Raw)": 1.736651062965393, "Pretrain/Step": 3808, "Pretrain/Step Time": 8.44298036955297} +{"Pretrain/Learning Rate": 3.414293319586853e-05, "Pretrain/Loss": 2.056898593902588, "Pretrain/Loss (Raw)": 2.196823835372925, "Pretrain/Step": 3809, "Pretrain/Step Time": 8.438470544293523} +{"Pretrain/Learning Rate": 3.4135030923389525e-05, "Pretrain/Loss": 2.056063652038574, "Pretrain/Loss (Raw)": 1.9595260620117188, "Pretrain/Step": 3810, "Pretrain/Step Time": 8.439816262573004} +{"Pretrain/Learning Rate": 3.412712759741571e-05, "Pretrain/Loss": 2.0561158657073975, "Pretrain/Loss (Raw)": 2.0834543704986572, "Pretrain/Step": 3811, "Pretrain/Step Time": 8.442863950505853} +{"Pretrain/Learning Rate": 3.411922321885853e-05, "Pretrain/Loss": 2.0564801692962646, "Pretrain/Loss (Raw)": 1.9333781003952026, "Pretrain/Step": 3812, "Pretrain/Step Time": 8.444464115425944} +{"Pretrain/Learning Rate": 3.411131778862955e-05, "Pretrain/Loss": 2.0562000274658203, "Pretrain/Loss (Raw)": 2.0496113300323486, "Pretrain/Step": 3813, "Pretrain/Step Time": 8.437920697033405} +{"Pretrain/Learning Rate": 3.4103411307640475e-05, "Pretrain/Loss": 2.0574440956115723, "Pretrain/Loss (Raw)": 1.9992029666900635, "Pretrain/Step": 3814, "Pretrain/Step Time": 8.432672245427966} +{"Pretrain/Learning Rate": 3.409550377680311e-05, "Pretrain/Loss": 2.0552427768707275, "Pretrain/Loss (Raw)": 2.053194999694824, "Pretrain/Step": 3815, "Pretrain/Step Time": 8.432431245222688} +{"Pretrain/Learning Rate": 3.408759519702939e-05, "Pretrain/Loss": 2.0565266609191895, "Pretrain/Loss (Raw)": 1.977292776107788, "Pretrain/Step": 3816, "Pretrain/Step Time": 8.431129146367311} +{"Pretrain/Learning Rate": 3.407968556923137e-05, "Pretrain/Loss": 2.054979085922241, "Pretrain/Loss (Raw)": 1.8983187675476074, "Pretrain/Step": 3817, "Pretrain/Step Time": 8.437440119683743} +{"Pretrain/Learning Rate": 3.407177489432123e-05, "Pretrain/Loss": 2.0537023544311523, "Pretrain/Loss (Raw)": 2.142443895339966, "Pretrain/Step": 3818, "Pretrain/Step Time": 8.44313027523458} +{"Pretrain/Learning Rate": 3.406386317321126e-05, "Pretrain/Loss": 2.054327964782715, "Pretrain/Loss (Raw)": 2.0518479347229004, "Pretrain/Step": 3819, "Pretrain/Step Time": 8.436544623225927} +{"Pretrain/Learning Rate": 3.4055950406813875e-05, "Pretrain/Loss": 2.0550789833068848, "Pretrain/Loss (Raw)": 2.07384991645813, "Pretrain/Step": 3820, "Pretrain/Step Time": 8.42843809351325} +{"Pretrain/Learning Rate": 3.404803659604162e-05, "Pretrain/Loss": 2.054903268814087, "Pretrain/Loss (Raw)": 2.0186567306518555, "Pretrain/Step": 3821, "Pretrain/Step Time": 8.435589054599404} +{"Pretrain/Learning Rate": 3.4040121741807146e-05, "Pretrain/Loss": 2.0547428131103516, "Pretrain/Loss (Raw)": 2.0876147747039795, "Pretrain/Step": 3822, "Pretrain/Step Time": 8.435675416141748} +{"Pretrain/Learning Rate": 3.403220584502323e-05, "Pretrain/Loss": 2.0542349815368652, "Pretrain/Loss (Raw)": 2.007058620452881, "Pretrain/Step": 3823, "Pretrain/Step Time": 8.436751049011946} +{"Pretrain/Learning Rate": 3.402428890660279e-05, "Pretrain/Loss": 2.055105686187744, "Pretrain/Loss (Raw)": 2.123147487640381, "Pretrain/Step": 3824, "Pretrain/Step Time": 8.434874275699258} +{"Pretrain/Learning Rate": 3.401637092745882e-05, "Pretrain/Loss": 2.0539205074310303, "Pretrain/Loss (Raw)": 1.906965970993042, "Pretrain/Step": 3825, "Pretrain/Step Time": 8.437145916745067} +{"Pretrain/Learning Rate": 3.4008451908504457e-05, "Pretrain/Loss": 2.0522677898406982, "Pretrain/Loss (Raw)": 1.880191445350647, "Pretrain/Step": 3826, "Pretrain/Step Time": 8.431789690628648} +{"Pretrain/Learning Rate": 3.400053185065298e-05, "Pretrain/Loss": 2.0524742603302, "Pretrain/Loss (Raw)": 2.0413167476654053, "Pretrain/Step": 3827, "Pretrain/Step Time": 8.431265896186233} +{"Pretrain/Learning Rate": 3.399261075481776e-05, "Pretrain/Loss": 2.0531651973724365, "Pretrain/Loss (Raw)": 2.066645860671997, "Pretrain/Step": 3828, "Pretrain/Step Time": 8.435012036934495} +{"Pretrain/Learning Rate": 3.39846886219123e-05, "Pretrain/Loss": 2.05523419380188, "Pretrain/Loss (Raw)": 2.2844436168670654, "Pretrain/Step": 3829, "Pretrain/Step Time": 8.433045679703355} +{"Pretrain/Learning Rate": 3.3976765452850194e-05, "Pretrain/Loss": 2.0562214851379395, "Pretrain/Loss (Raw)": 2.282526969909668, "Pretrain/Step": 3830, "Pretrain/Step Time": 8.435127720236778} +{"Pretrain/Learning Rate": 3.3968841248545214e-05, "Pretrain/Loss": 2.0573389530181885, "Pretrain/Loss (Raw)": 2.1026880741119385, "Pretrain/Step": 3831, "Pretrain/Step Time": 8.430857306346297} +{"Pretrain/Learning Rate": 3.396091600991118e-05, "Pretrain/Loss": 2.0592880249023438, "Pretrain/Loss (Raw)": 2.265763998031616, "Pretrain/Step": 3832, "Pretrain/Step Time": 8.430722126737237} +{"Pretrain/Learning Rate": 3.39529897378621e-05, "Pretrain/Loss": 2.0589730739593506, "Pretrain/Loss (Raw)": 2.0664656162261963, "Pretrain/Step": 3833, "Pretrain/Step Time": 8.429015511646867} +{"Pretrain/Learning Rate": 3.3945062433312055e-05, "Pretrain/Loss": 2.059278964996338, "Pretrain/Loss (Raw)": 2.041954755783081, "Pretrain/Step": 3834, "Pretrain/Step Time": 8.425630440935493} +{"Pretrain/Learning Rate": 3.3937134097175256e-05, "Pretrain/Loss": 2.056821823120117, "Pretrain/Loss (Raw)": 1.9606727361679077, "Pretrain/Step": 3835, "Pretrain/Step Time": 8.432438220828772} +{"Pretrain/Learning Rate": 3.392920473036604e-05, "Pretrain/Loss": 2.0569376945495605, "Pretrain/Loss (Raw)": 1.9105730056762695, "Pretrain/Step": 3836, "Pretrain/Step Time": 8.434779116883874} +{"Pretrain/Learning Rate": 3.392127433379886e-05, "Pretrain/Loss": 2.0555481910705566, "Pretrain/Loss (Raw)": 1.9138662815093994, "Pretrain/Step": 3837, "Pretrain/Step Time": 8.430022547021508} +{"Pretrain/Learning Rate": 3.391334290838829e-05, "Pretrain/Loss": 2.054091215133667, "Pretrain/Loss (Raw)": 1.9330837726593018, "Pretrain/Step": 3838, "Pretrain/Step Time": 8.435685401782393} +{"Pretrain/Learning Rate": 3.3905410455049e-05, "Pretrain/Loss": 2.052701473236084, "Pretrain/Loss (Raw)": 1.8494813442230225, "Pretrain/Step": 3839, "Pretrain/Step Time": 8.440093256533146} +{"Pretrain/Learning Rate": 3.389747697469583e-05, "Pretrain/Loss": 2.053069591522217, "Pretrain/Loss (Raw)": 2.1181447505950928, "Pretrain/Step": 3840, "Pretrain/Step Time": 8.438375802710652} +{"Pretrain/Learning Rate": 3.388954246824367e-05, "Pretrain/Loss": 2.0529651641845703, "Pretrain/Loss (Raw)": 2.050294876098633, "Pretrain/Step": 3841, "Pretrain/Step Time": 8.438291100785136} +{"Pretrain/Learning Rate": 3.3881606936607604e-05, "Pretrain/Loss": 2.05234432220459, "Pretrain/Loss (Raw)": 2.0229249000549316, "Pretrain/Step": 3842, "Pretrain/Step Time": 8.436741789802909} +{"Pretrain/Learning Rate": 3.387367038070275e-05, "Pretrain/Loss": 2.050100326538086, "Pretrain/Loss (Raw)": 2.1415090560913086, "Pretrain/Step": 3843, "Pretrain/Step Time": 8.429706767201424} +{"Pretrain/Learning Rate": 3.386573280144444e-05, "Pretrain/Loss": 2.0485599040985107, "Pretrain/Loss (Raw)": 1.9454145431518555, "Pretrain/Step": 3844, "Pretrain/Step Time": 8.431971011683345} +{"Pretrain/Learning Rate": 3.385779419974803e-05, "Pretrain/Loss": 2.054326057434082, "Pretrain/Loss (Raw)": 2.4245336055755615, "Pretrain/Step": 3845, "Pretrain/Step Time": 8.438823781907558} +{"Pretrain/Learning Rate": 3.384985457652906e-05, "Pretrain/Loss": 2.0558555126190186, "Pretrain/Loss (Raw)": 2.2849361896514893, "Pretrain/Step": 3846, "Pretrain/Step Time": 8.433006834238768} +{"Pretrain/Learning Rate": 3.384191393270316e-05, "Pretrain/Loss": 2.055640459060669, "Pretrain/Loss (Raw)": 1.8926454782485962, "Pretrain/Step": 3847, "Pretrain/Step Time": 8.4349623657763} +{"Pretrain/Learning Rate": 3.383397226918607e-05, "Pretrain/Loss": 2.0537726879119873, "Pretrain/Loss (Raw)": 1.9900329113006592, "Pretrain/Step": 3848, "Pretrain/Step Time": 8.429151855409145} +{"Pretrain/Learning Rate": 3.382602958689369e-05, "Pretrain/Loss": 2.0552315711975098, "Pretrain/Loss (Raw)": 2.1612374782562256, "Pretrain/Step": 3849, "Pretrain/Step Time": 8.432997616007924} +{"Pretrain/Learning Rate": 3.381808588674197e-05, "Pretrain/Loss": 2.0555386543273926, "Pretrain/Loss (Raw)": 2.0879762172698975, "Pretrain/Step": 3850, "Pretrain/Step Time": 8.43052469752729} +{"Pretrain/Learning Rate": 3.381014116964705e-05, "Pretrain/Loss": 2.0555734634399414, "Pretrain/Loss (Raw)": 2.070035934448242, "Pretrain/Step": 3851, "Pretrain/Step Time": 8.431771986186504} +{"Pretrain/Learning Rate": 3.380219543652512e-05, "Pretrain/Loss": 2.055901050567627, "Pretrain/Loss (Raw)": 1.8238844871520996, "Pretrain/Step": 3852, "Pretrain/Step Time": 8.428139042109251} +{"Pretrain/Learning Rate": 3.379424868829254e-05, "Pretrain/Loss": 2.05749773979187, "Pretrain/Loss (Raw)": 2.3566863536834717, "Pretrain/Step": 3853, "Pretrain/Step Time": 8.42907946370542} +{"Pretrain/Learning Rate": 3.378630092586576e-05, "Pretrain/Loss": 2.0539634227752686, "Pretrain/Loss (Raw)": 1.9183769226074219, "Pretrain/Step": 3854, "Pretrain/Step Time": 8.42757861316204} +{"Pretrain/Learning Rate": 3.377835215016136e-05, "Pretrain/Loss": 2.0532524585723877, "Pretrain/Loss (Raw)": 1.930646538734436, "Pretrain/Step": 3855, "Pretrain/Step Time": 8.425948955118656} +{"Pretrain/Learning Rate": 3.3770402362096024e-05, "Pretrain/Loss": 2.052990198135376, "Pretrain/Loss (Raw)": 2.1417996883392334, "Pretrain/Step": 3856, "Pretrain/Step Time": 8.426916234195232} +{"Pretrain/Learning Rate": 3.3762451562586565e-05, "Pretrain/Loss": 2.051131010055542, "Pretrain/Loss (Raw)": 1.9788577556610107, "Pretrain/Step": 3857, "Pretrain/Step Time": 8.434534950181842} +{"Pretrain/Learning Rate": 3.3754499752549885e-05, "Pretrain/Loss": 2.05058217048645, "Pretrain/Loss (Raw)": 2.0104787349700928, "Pretrain/Step": 3858, "Pretrain/Step Time": 8.43063560500741} +{"Pretrain/Learning Rate": 3.374654693290306e-05, "Pretrain/Loss": 2.0516881942749023, "Pretrain/Loss (Raw)": 2.097872018814087, "Pretrain/Step": 3859, "Pretrain/Step Time": 8.429116286337376} +{"Pretrain/Learning Rate": 3.373859310456321e-05, "Pretrain/Loss": 2.051800489425659, "Pretrain/Loss (Raw)": 2.077496290206909, "Pretrain/Step": 3860, "Pretrain/Step Time": 8.428078783676028} +{"Pretrain/Learning Rate": 3.373063826844764e-05, "Pretrain/Loss": 2.052347183227539, "Pretrain/Loss (Raw)": 2.186948299407959, "Pretrain/Step": 3861, "Pretrain/Step Time": 8.427522921934724} +{"Pretrain/Learning Rate": 3.3722682425473715e-05, "Pretrain/Loss": 2.052286386489868, "Pretrain/Loss (Raw)": 1.9575947523117065, "Pretrain/Step": 3862, "Pretrain/Step Time": 8.431910451501608} +{"Pretrain/Learning Rate": 3.371472557655896e-05, "Pretrain/Loss": 2.0516185760498047, "Pretrain/Loss (Raw)": 2.0997276306152344, "Pretrain/Step": 3863, "Pretrain/Step Time": 8.434792472049594} +{"Pretrain/Learning Rate": 3.370676772262098e-05, "Pretrain/Loss": 2.050445556640625, "Pretrain/Loss (Raw)": 1.8927998542785645, "Pretrain/Step": 3864, "Pretrain/Step Time": 8.433792049065232} +{"Pretrain/Learning Rate": 3.369880886457751e-05, "Pretrain/Loss": 2.0512232780456543, "Pretrain/Loss (Raw)": 2.0196533203125, "Pretrain/Step": 3865, "Pretrain/Step Time": 8.431977979838848} +{"Pretrain/Learning Rate": 3.369084900334643e-05, "Pretrain/Loss": 2.0517075061798096, "Pretrain/Loss (Raw)": 1.9056625366210938, "Pretrain/Step": 3866, "Pretrain/Step Time": 8.427032556384802} +{"Pretrain/Learning Rate": 3.368288813984568e-05, "Pretrain/Loss": 2.053015947341919, "Pretrain/Loss (Raw)": 2.173854112625122, "Pretrain/Step": 3867, "Pretrain/Step Time": 8.426729559898376} +{"Pretrain/Learning Rate": 3.3674926274993356e-05, "Pretrain/Loss": 2.053985118865967, "Pretrain/Loss (Raw)": 2.167262077331543, "Pretrain/Step": 3868, "Pretrain/Step Time": 8.437896812334657} +{"Pretrain/Learning Rate": 3.3666963409707655e-05, "Pretrain/Loss": 2.059262275695801, "Pretrain/Loss (Raw)": 2.4959537982940674, "Pretrain/Step": 3869, "Pretrain/Step Time": 8.437651036307216} +{"Pretrain/Learning Rate": 3.36589995449069e-05, "Pretrain/Loss": 2.0597593784332275, "Pretrain/Loss (Raw)": 2.125223159790039, "Pretrain/Step": 3870, "Pretrain/Step Time": 8.435938354581594} +{"Pretrain/Learning Rate": 3.36510346815095e-05, "Pretrain/Loss": 2.0586342811584473, "Pretrain/Loss (Raw)": 1.988904356956482, "Pretrain/Step": 3871, "Pretrain/Step Time": 8.430778127163649} +{"Pretrain/Learning Rate": 3.3643068820434035e-05, "Pretrain/Loss": 2.058285713195801, "Pretrain/Loss (Raw)": 2.0999343395233154, "Pretrain/Step": 3872, "Pretrain/Step Time": 8.434038329869509} +{"Pretrain/Learning Rate": 3.363510196259913e-05, "Pretrain/Loss": 2.061506748199463, "Pretrain/Loss (Raw)": 2.1069889068603516, "Pretrain/Step": 3873, "Pretrain/Step Time": 8.432175541296601} +{"Pretrain/Learning Rate": 3.362713410892359e-05, "Pretrain/Loss": 2.0607266426086426, "Pretrain/Loss (Raw)": 2.028736114501953, "Pretrain/Step": 3874, "Pretrain/Step Time": 8.44842896796763} +{"Pretrain/Learning Rate": 3.361916526032628e-05, "Pretrain/Loss": 2.0609986782073975, "Pretrain/Loss (Raw)": 2.0584239959716797, "Pretrain/Step": 3875, "Pretrain/Step Time": 8.446571446955204} +{"Pretrain/Learning Rate": 3.361119541772622e-05, "Pretrain/Loss": 2.0628983974456787, "Pretrain/Loss (Raw)": 2.2318427562713623, "Pretrain/Step": 3876, "Pretrain/Step Time": 8.447300300002098} +{"Pretrain/Learning Rate": 3.360322458204253e-05, "Pretrain/Loss": 2.0635926723480225, "Pretrain/Loss (Raw)": 2.0348410606384277, "Pretrain/Step": 3877, "Pretrain/Step Time": 8.444103997200727} +{"Pretrain/Learning Rate": 3.3595252754194445e-05, "Pretrain/Loss": 2.062009572982788, "Pretrain/Loss (Raw)": 2.0119571685791016, "Pretrain/Step": 3878, "Pretrain/Step Time": 8.443028699606657} +{"Pretrain/Learning Rate": 3.3587279935101306e-05, "Pretrain/Loss": 2.0620789527893066, "Pretrain/Loss (Raw)": 1.9347755908966064, "Pretrain/Step": 3879, "Pretrain/Step Time": 8.45107614248991} +{"Pretrain/Learning Rate": 3.357930612568258e-05, "Pretrain/Loss": 2.064162015914917, "Pretrain/Loss (Raw)": 2.341830253601074, "Pretrain/Step": 3880, "Pretrain/Step Time": 8.45041841827333} +{"Pretrain/Learning Rate": 3.3571331326857844e-05, "Pretrain/Loss": 2.063331127166748, "Pretrain/Loss (Raw)": 2.0403711795806885, "Pretrain/Step": 3881, "Pretrain/Step Time": 8.452492835000157} +{"Pretrain/Learning Rate": 3.3563355539546795e-05, "Pretrain/Loss": 2.064546823501587, "Pretrain/Loss (Raw)": 2.117006301879883, "Pretrain/Step": 3882, "Pretrain/Step Time": 8.44093893840909} +{"Pretrain/Learning Rate": 3.355537876466923e-05, "Pretrain/Loss": 2.061948299407959, "Pretrain/Loss (Raw)": 1.8177815675735474, "Pretrain/Step": 3883, "Pretrain/Step Time": 8.444170856848359} +{"Pretrain/Learning Rate": 3.354740100314506e-05, "Pretrain/Loss": 2.059898853302002, "Pretrain/Loss (Raw)": 2.1136064529418945, "Pretrain/Step": 3884, "Pretrain/Step Time": 8.447710372507572} +{"Pretrain/Learning Rate": 3.3539422255894345e-05, "Pretrain/Loss": 2.059331178665161, "Pretrain/Loss (Raw)": 1.9166576862335205, "Pretrain/Step": 3885, "Pretrain/Step Time": 8.45016274228692} +{"Pretrain/Learning Rate": 3.353144252383721e-05, "Pretrain/Loss": 2.056382417678833, "Pretrain/Loss (Raw)": 1.8225336074829102, "Pretrain/Step": 3886, "Pretrain/Step Time": 8.448965463787317} +{"Pretrain/Learning Rate": 3.3523461807893925e-05, "Pretrain/Loss": 2.0568113327026367, "Pretrain/Loss (Raw)": 2.009537935256958, "Pretrain/Step": 3887, "Pretrain/Step Time": 8.448330149054527} +{"Pretrain/Learning Rate": 3.351548010898486e-05, "Pretrain/Loss": 2.0565075874328613, "Pretrain/Loss (Raw)": 2.1005728244781494, "Pretrain/Step": 3888, "Pretrain/Step Time": 8.438467372208834} +{"Pretrain/Learning Rate": 3.35074974280305e-05, "Pretrain/Loss": 2.055600881576538, "Pretrain/Loss (Raw)": 2.011446475982666, "Pretrain/Step": 3889, "Pretrain/Step Time": 8.438919056206942} +{"Pretrain/Learning Rate": 3.349951376595145e-05, "Pretrain/Loss": 2.0573806762695312, "Pretrain/Loss (Raw)": 2.1287245750427246, "Pretrain/Step": 3890, "Pretrain/Step Time": 8.44243354164064} +{"Pretrain/Learning Rate": 3.3491529123668425e-05, "Pretrain/Loss": 2.056178569793701, "Pretrain/Loss (Raw)": 1.9475198984146118, "Pretrain/Step": 3891, "Pretrain/Step Time": 8.446254869922996} +{"Pretrain/Learning Rate": 3.348354350210224e-05, "Pretrain/Loss": 2.0582680702209473, "Pretrain/Loss (Raw)": 2.126030445098877, "Pretrain/Step": 3892, "Pretrain/Step Time": 8.443630427122116} +{"Pretrain/Learning Rate": 3.347555690217385e-05, "Pretrain/Loss": 2.060619354248047, "Pretrain/Loss (Raw)": 2.1827831268310547, "Pretrain/Step": 3893, "Pretrain/Step Time": 8.44654480740428} +{"Pretrain/Learning Rate": 3.34675693248043e-05, "Pretrain/Loss": 2.0632083415985107, "Pretrain/Loss (Raw)": 2.194153308868408, "Pretrain/Step": 3894, "Pretrain/Step Time": 8.437646999955177} +{"Pretrain/Learning Rate": 3.3459580770914744e-05, "Pretrain/Loss": 2.0633819103240967, "Pretrain/Loss (Raw)": 2.121002674102783, "Pretrain/Step": 3895, "Pretrain/Step Time": 8.433488653972745} +{"Pretrain/Learning Rate": 3.3451591241426486e-05, "Pretrain/Loss": 2.0619568824768066, "Pretrain/Loss (Raw)": 2.221264362335205, "Pretrain/Step": 3896, "Pretrain/Step Time": 8.44099479354918} +{"Pretrain/Learning Rate": 3.3443600737260885e-05, "Pretrain/Loss": 2.063171148300171, "Pretrain/Loss (Raw)": 2.1330204010009766, "Pretrain/Step": 3897, "Pretrain/Step Time": 8.44041908159852} +{"Pretrain/Learning Rate": 3.343560925933947e-05, "Pretrain/Loss": 2.063356637954712, "Pretrain/Loss (Raw)": 2.1650454998016357, "Pretrain/Step": 3898, "Pretrain/Step Time": 8.437507964670658} +{"Pretrain/Learning Rate": 3.342761680858385e-05, "Pretrain/Loss": 2.063436985015869, "Pretrain/Loss (Raw)": 1.9953261613845825, "Pretrain/Step": 3899, "Pretrain/Step Time": 8.43013059347868} +{"Pretrain/Learning Rate": 3.3419623385915736e-05, "Pretrain/Loss": 2.06180739402771, "Pretrain/Loss (Raw)": 1.9255386590957642, "Pretrain/Step": 3900, "Pretrain/Step Time": 8.428279059007764} +{"Pretrain/Learning Rate": 3.3411628992256984e-05, "Pretrain/Loss": 2.0622854232788086, "Pretrain/Loss (Raw)": 2.1563103199005127, "Pretrain/Step": 3901, "Pretrain/Step Time": 8.42802264355123} +{"Pretrain/Learning Rate": 3.340363362852954e-05, "Pretrain/Loss": 2.0638322830200195, "Pretrain/Loss (Raw)": 2.000312566757202, "Pretrain/Step": 3902, "Pretrain/Step Time": 8.430874694138765} +{"Pretrain/Learning Rate": 3.339563729565547e-05, "Pretrain/Loss": 2.0617377758026123, "Pretrain/Loss (Raw)": 1.9454594850540161, "Pretrain/Step": 3903, "Pretrain/Step Time": 8.427920000627637} +{"Pretrain/Learning Rate": 3.3387639994556934e-05, "Pretrain/Loss": 2.061272382736206, "Pretrain/Loss (Raw)": 2.0472192764282227, "Pretrain/Step": 3904, "Pretrain/Step Time": 8.426890840753913} +{"Pretrain/Learning Rate": 3.337964172615624e-05, "Pretrain/Loss": 2.0622289180755615, "Pretrain/Loss (Raw)": 2.0688552856445312, "Pretrain/Step": 3905, "Pretrain/Step Time": 8.424902234226465} +{"Pretrain/Learning Rate": 3.337164249137577e-05, "Pretrain/Loss": 2.0620522499084473, "Pretrain/Loss (Raw)": 2.0215327739715576, "Pretrain/Step": 3906, "Pretrain/Step Time": 8.424709809944034} +{"Pretrain/Learning Rate": 3.3363642291138046e-05, "Pretrain/Loss": 2.0621213912963867, "Pretrain/Loss (Raw)": 2.0282814502716064, "Pretrain/Step": 3907, "Pretrain/Step Time": 8.429439581930637} +{"Pretrain/Learning Rate": 3.3355641126365676e-05, "Pretrain/Loss": 2.0638251304626465, "Pretrain/Loss (Raw)": 2.2190165519714355, "Pretrain/Step": 3908, "Pretrain/Step Time": 8.423879522830248} +{"Pretrain/Learning Rate": 3.33476389979814e-05, "Pretrain/Loss": 2.0607643127441406, "Pretrain/Loss (Raw)": 2.0524346828460693, "Pretrain/Step": 3909, "Pretrain/Step Time": 8.420804852619767} +{"Pretrain/Learning Rate": 3.3339635906908064e-05, "Pretrain/Loss": 2.062626361846924, "Pretrain/Loss (Raw)": 2.1784586906433105, "Pretrain/Step": 3910, "Pretrain/Step Time": 8.415543721988797} +{"Pretrain/Learning Rate": 3.3331631854068616e-05, "Pretrain/Loss": 2.0608677864074707, "Pretrain/Loss (Raw)": 1.770213007926941, "Pretrain/Step": 3911, "Pretrain/Step Time": 8.413792932406068} +{"Pretrain/Learning Rate": 3.3323626840386115e-05, "Pretrain/Loss": 2.061286687850952, "Pretrain/Loss (Raw)": 1.9138470888137817, "Pretrain/Step": 3912, "Pretrain/Step Time": 8.412881705909967} +{"Pretrain/Learning Rate": 3.3315620866783755e-05, "Pretrain/Loss": 2.061866521835327, "Pretrain/Loss (Raw)": 1.9519542455673218, "Pretrain/Step": 3913, "Pretrain/Step Time": 8.421851145103574} +{"Pretrain/Learning Rate": 3.33076139341848e-05, "Pretrain/Loss": 2.061920166015625, "Pretrain/Loss (Raw)": 2.122992753982544, "Pretrain/Step": 3914, "Pretrain/Step Time": 8.418651638552547} +{"Pretrain/Learning Rate": 3.329960604351267e-05, "Pretrain/Loss": 2.0608160495758057, "Pretrain/Loss (Raw)": 2.0617568492889404, "Pretrain/Step": 3915, "Pretrain/Step Time": 8.417651046067476} +{"Pretrain/Learning Rate": 3.329159719569085e-05, "Pretrain/Loss": 2.0605874061584473, "Pretrain/Loss (Raw)": 2.040266275405884, "Pretrain/Step": 3916, "Pretrain/Step Time": 8.413458466529846} +{"Pretrain/Learning Rate": 3.328358739164299e-05, "Pretrain/Loss": 2.063058853149414, "Pretrain/Loss (Raw)": 2.4012839794158936, "Pretrain/Step": 3917, "Pretrain/Step Time": 8.416619833558798} +{"Pretrain/Learning Rate": 3.327557663229278e-05, "Pretrain/Loss": 2.0563225746154785, "Pretrain/Loss (Raw)": 2.0301895141601562, "Pretrain/Step": 3918, "Pretrain/Step Time": 8.418086742982268} +{"Pretrain/Learning Rate": 3.326756491856409e-05, "Pretrain/Loss": 2.0546488761901855, "Pretrain/Loss (Raw)": 1.8751434087753296, "Pretrain/Step": 3919, "Pretrain/Step Time": 8.423290889710188} +{"Pretrain/Learning Rate": 3.325955225138085e-05, "Pretrain/Loss": 2.0554912090301514, "Pretrain/Loss (Raw)": 2.0787031650543213, "Pretrain/Step": 3920, "Pretrain/Step Time": 8.427530949935317} +{"Pretrain/Learning Rate": 3.3251538631667125e-05, "Pretrain/Loss": 2.0538556575775146, "Pretrain/Loss (Raw)": 1.8897206783294678, "Pretrain/Step": 3921, "Pretrain/Step Time": 8.424358870834112} +{"Pretrain/Learning Rate": 3.324352406034707e-05, "Pretrain/Loss": 2.0519890785217285, "Pretrain/Loss (Raw)": 1.8578875064849854, "Pretrain/Step": 3922, "Pretrain/Step Time": 8.419515481218696} +{"Pretrain/Learning Rate": 3.3235508538344996e-05, "Pretrain/Loss": 2.0501270294189453, "Pretrain/Loss (Raw)": 1.8556240797042847, "Pretrain/Step": 3923, "Pretrain/Step Time": 8.42342833057046} +{"Pretrain/Learning Rate": 3.322749206658526e-05, "Pretrain/Loss": 2.0485310554504395, "Pretrain/Loss (Raw)": 1.8463335037231445, "Pretrain/Step": 3924, "Pretrain/Step Time": 8.430300895124674} +{"Pretrain/Learning Rate": 3.3219474645992366e-05, "Pretrain/Loss": 2.0477094650268555, "Pretrain/Loss (Raw)": 2.0303637981414795, "Pretrain/Step": 3925, "Pretrain/Step Time": 8.425898477435112} +{"Pretrain/Learning Rate": 3.3211456277490926e-05, "Pretrain/Loss": 2.0452356338500977, "Pretrain/Loss (Raw)": 1.9359490871429443, "Pretrain/Step": 3926, "Pretrain/Step Time": 8.42743275128305} +{"Pretrain/Learning Rate": 3.3203436962005655e-05, "Pretrain/Loss": 2.047969102859497, "Pretrain/Loss (Raw)": 2.298124313354492, "Pretrain/Step": 3927, "Pretrain/Step Time": 8.418202221393585} +{"Pretrain/Learning Rate": 3.3195416700461385e-05, "Pretrain/Loss": 2.0514004230499268, "Pretrain/Loss (Raw)": 2.3683104515075684, "Pretrain/Step": 3928, "Pretrain/Step Time": 8.420733546838164} +{"Pretrain/Learning Rate": 3.318739549378304e-05, "Pretrain/Loss": 2.0542469024658203, "Pretrain/Loss (Raw)": 2.3392856121063232, "Pretrain/Step": 3929, "Pretrain/Step Time": 8.42290242947638} +{"Pretrain/Learning Rate": 3.317937334289566e-05, "Pretrain/Loss": 2.0558366775512695, "Pretrain/Loss (Raw)": 2.1688365936279297, "Pretrain/Step": 3930, "Pretrain/Step Time": 8.432100888341665} +{"Pretrain/Learning Rate": 3.317135024872442e-05, "Pretrain/Loss": 2.057243824005127, "Pretrain/Loss (Raw)": 2.2539327144622803, "Pretrain/Step": 3931, "Pretrain/Step Time": 8.429816421121359} +{"Pretrain/Learning Rate": 3.3163326212194546e-05, "Pretrain/Loss": 2.058603286743164, "Pretrain/Loss (Raw)": 2.1086580753326416, "Pretrain/Step": 3932, "Pretrain/Step Time": 8.43091032654047} +{"Pretrain/Learning Rate": 3.315530123423143e-05, "Pretrain/Loss": 2.0587079524993896, "Pretrain/Loss (Raw)": 2.1715242862701416, "Pretrain/Step": 3933, "Pretrain/Step Time": 8.421813894063234} +{"Pretrain/Learning Rate": 3.314727531576055e-05, "Pretrain/Loss": 2.0605974197387695, "Pretrain/Loss (Raw)": 2.186211585998535, "Pretrain/Step": 3934, "Pretrain/Step Time": 8.422143906354904} +{"Pretrain/Learning Rate": 3.3139248457707495e-05, "Pretrain/Loss": 2.060434341430664, "Pretrain/Loss (Raw)": 2.0832746028900146, "Pretrain/Step": 3935, "Pretrain/Step Time": 8.428844947367907} +{"Pretrain/Learning Rate": 3.313122066099794e-05, "Pretrain/Loss": 2.0622708797454834, "Pretrain/Loss (Raw)": 1.9717013835906982, "Pretrain/Step": 3936, "Pretrain/Step Time": 8.436008227989078} +{"Pretrain/Learning Rate": 3.312319192655772e-05, "Pretrain/Loss": 2.0620155334472656, "Pretrain/Loss (Raw)": 2.1641743183135986, "Pretrain/Step": 3937, "Pretrain/Step Time": 8.432118745520711} +{"Pretrain/Learning Rate": 3.311516225531271e-05, "Pretrain/Loss": 2.062506675720215, "Pretrain/Loss (Raw)": 2.022376775741577, "Pretrain/Step": 3938, "Pretrain/Step Time": 8.432097086682916} +{"Pretrain/Learning Rate": 3.3107131648188966e-05, "Pretrain/Loss": 2.062143325805664, "Pretrain/Loss (Raw)": 2.0369319915771484, "Pretrain/Step": 3939, "Pretrain/Step Time": 8.42711972631514} +{"Pretrain/Learning Rate": 3.309910010611259e-05, "Pretrain/Loss": 2.0641050338745117, "Pretrain/Loss (Raw)": 2.1844873428344727, "Pretrain/Step": 3940, "Pretrain/Step Time": 8.427125331014395} +{"Pretrain/Learning Rate": 3.3091067630009834e-05, "Pretrain/Loss": 2.061758041381836, "Pretrain/Loss (Raw)": 1.7492104768753052, "Pretrain/Step": 3941, "Pretrain/Step Time": 8.435977159067988} +{"Pretrain/Learning Rate": 3.3083034220807016e-05, "Pretrain/Loss": 2.061807870864868, "Pretrain/Loss (Raw)": 2.005573272705078, "Pretrain/Step": 3942, "Pretrain/Step Time": 8.435145867988467} +{"Pretrain/Learning Rate": 3.307499987943062e-05, "Pretrain/Loss": 2.061647653579712, "Pretrain/Loss (Raw)": 2.032679319381714, "Pretrain/Step": 3943, "Pretrain/Step Time": 8.43817994557321} +{"Pretrain/Learning Rate": 3.3066964606807175e-05, "Pretrain/Loss": 2.059843063354492, "Pretrain/Loss (Raw)": 1.7463128566741943, "Pretrain/Step": 3944, "Pretrain/Step Time": 8.437963953241706} +{"Pretrain/Learning Rate": 3.3058928403863364e-05, "Pretrain/Loss": 2.0601673126220703, "Pretrain/Loss (Raw)": 1.9398351907730103, "Pretrain/Step": 3945, "Pretrain/Step Time": 8.431966302916408} +{"Pretrain/Learning Rate": 3.305089127152596e-05, "Pretrain/Loss": 2.0592267513275146, "Pretrain/Loss (Raw)": 2.022028684616089, "Pretrain/Step": 3946, "Pretrain/Step Time": 8.425805868580937} +{"Pretrain/Learning Rate": 3.304285321072183e-05, "Pretrain/Loss": 2.060391426086426, "Pretrain/Loss (Raw)": 2.2009434700012207, "Pretrain/Step": 3947, "Pretrain/Step Time": 8.428923517465591} +{"Pretrain/Learning Rate": 3.303481422237797e-05, "Pretrain/Loss": 2.0593676567077637, "Pretrain/Loss (Raw)": 1.9427977800369263, "Pretrain/Step": 3948, "Pretrain/Step Time": 8.433919770643115} +{"Pretrain/Learning Rate": 3.3026774307421476e-05, "Pretrain/Loss": 2.059396266937256, "Pretrain/Loss (Raw)": 2.022321939468384, "Pretrain/Step": 3949, "Pretrain/Step Time": 8.435128090903163} +{"Pretrain/Learning Rate": 3.301873346677954e-05, "Pretrain/Loss": 2.058145046234131, "Pretrain/Loss (Raw)": 1.9274680614471436, "Pretrain/Step": 3950, "Pretrain/Step Time": 8.433159099891782} +{"Pretrain/Learning Rate": 3.301069170137948e-05, "Pretrain/Loss": 2.058079481124878, "Pretrain/Loss (Raw)": 1.9986506700515747, "Pretrain/Step": 3951, "Pretrain/Step Time": 8.430185096338391} +{"Pretrain/Learning Rate": 3.3002649012148704e-05, "Pretrain/Loss": 2.0574264526367188, "Pretrain/Loss (Raw)": 2.039551258087158, "Pretrain/Step": 3952, "Pretrain/Step Time": 8.432046381756663} +{"Pretrain/Learning Rate": 3.2994605400014736e-05, "Pretrain/Loss": 2.0571038722991943, "Pretrain/Loss (Raw)": 1.8657015562057495, "Pretrain/Step": 3953, "Pretrain/Step Time": 8.43879851512611} +{"Pretrain/Learning Rate": 3.29865608659052e-05, "Pretrain/Loss": 2.0578999519348145, "Pretrain/Loss (Raw)": 1.982086181640625, "Pretrain/Step": 3954, "Pretrain/Step Time": 8.442512350156903} +{"Pretrain/Learning Rate": 3.297851541074782e-05, "Pretrain/Loss": 2.05765438079834, "Pretrain/Loss (Raw)": 2.0098836421966553, "Pretrain/Step": 3955, "Pretrain/Step Time": 8.442573610693216} +{"Pretrain/Learning Rate": 3.297046903547046e-05, "Pretrain/Loss": 2.0570733547210693, "Pretrain/Loss (Raw)": 1.9922621250152588, "Pretrain/Step": 3956, "Pretrain/Step Time": 8.437392445281148} +{"Pretrain/Learning Rate": 3.296242174100105e-05, "Pretrain/Loss": 2.055959463119507, "Pretrain/Loss (Raw)": 2.141855239868164, "Pretrain/Step": 3957, "Pretrain/Step Time": 8.436291268095374} +{"Pretrain/Learning Rate": 3.2954373528267646e-05, "Pretrain/Loss": 2.0544047355651855, "Pretrain/Loss (Raw)": 2.0835044384002686, "Pretrain/Step": 3958, "Pretrain/Step Time": 8.441552460193634} +{"Pretrain/Learning Rate": 3.29463243981984e-05, "Pretrain/Loss": 2.0548362731933594, "Pretrain/Loss (Raw)": 2.157959461212158, "Pretrain/Step": 3959, "Pretrain/Step Time": 8.44567290134728} +{"Pretrain/Learning Rate": 3.2938274351721587e-05, "Pretrain/Loss": 2.0518410205841064, "Pretrain/Loss (Raw)": 1.8823633193969727, "Pretrain/Step": 3960, "Pretrain/Step Time": 8.445625133812428} +{"Pretrain/Learning Rate": 3.2930223389765566e-05, "Pretrain/Loss": 2.054152011871338, "Pretrain/Loss (Raw)": 2.362300395965576, "Pretrain/Step": 3961, "Pretrain/Step Time": 8.440664902329445} +{"Pretrain/Learning Rate": 3.292217151325882e-05, "Pretrain/Loss": 2.054168939590454, "Pretrain/Loss (Raw)": 2.0440900325775146, "Pretrain/Step": 3962, "Pretrain/Step Time": 8.447137312963605} +{"Pretrain/Learning Rate": 3.2914118723129916e-05, "Pretrain/Loss": 2.0549633502960205, "Pretrain/Loss (Raw)": 2.062377691268921, "Pretrain/Step": 3963, "Pretrain/Step Time": 8.439933445304632} +{"Pretrain/Learning Rate": 3.2906065020307545e-05, "Pretrain/Loss": 2.0564520359039307, "Pretrain/Loss (Raw)": 2.1011157035827637, "Pretrain/Step": 3964, "Pretrain/Step Time": 8.438524898141623} +{"Pretrain/Learning Rate": 3.289801040572051e-05, "Pretrain/Loss": 2.0555872917175293, "Pretrain/Loss (Raw)": 1.8031702041625977, "Pretrain/Step": 3965, "Pretrain/Step Time": 8.446119334548712} +{"Pretrain/Learning Rate": 3.288995488029769e-05, "Pretrain/Loss": 2.0603761672973633, "Pretrain/Loss (Raw)": 2.5460550785064697, "Pretrain/Step": 3966, "Pretrain/Step Time": 8.44062122516334} +{"Pretrain/Learning Rate": 3.288189844496811e-05, "Pretrain/Loss": 2.0621633529663086, "Pretrain/Loss (Raw)": 2.078275442123413, "Pretrain/Step": 3967, "Pretrain/Step Time": 8.435567339882255} +{"Pretrain/Learning Rate": 3.287384110066084e-05, "Pretrain/Loss": 2.0612680912017822, "Pretrain/Loss (Raw)": 2.003523111343384, "Pretrain/Step": 3968, "Pretrain/Step Time": 8.440499586984515} +{"Pretrain/Learning Rate": 3.286578284830513e-05, "Pretrain/Loss": 2.060060739517212, "Pretrain/Loss (Raw)": 1.8957775831222534, "Pretrain/Step": 3969, "Pretrain/Step Time": 8.449021875858307} +{"Pretrain/Learning Rate": 3.2857723688830264e-05, "Pretrain/Loss": 2.0588743686676025, "Pretrain/Loss (Raw)": 1.8710362911224365, "Pretrain/Step": 3970, "Pretrain/Step Time": 8.445548336952925} +{"Pretrain/Learning Rate": 3.284966362316568e-05, "Pretrain/Loss": 2.057631254196167, "Pretrain/Loss (Raw)": 1.9824106693267822, "Pretrain/Step": 3971, "Pretrain/Step Time": 8.447278873994946} +{"Pretrain/Learning Rate": 3.28416026522409e-05, "Pretrain/Loss": 2.057265520095825, "Pretrain/Loss (Raw)": 1.8985973596572876, "Pretrain/Step": 3972, "Pretrain/Step Time": 8.443044809624553} +{"Pretrain/Learning Rate": 3.283354077698555e-05, "Pretrain/Loss": 2.0516443252563477, "Pretrain/Loss (Raw)": 1.7050201892852783, "Pretrain/Step": 3973, "Pretrain/Step Time": 8.435571849346161} +{"Pretrain/Learning Rate": 3.2825477998329366e-05, "Pretrain/Loss": 2.051105260848999, "Pretrain/Loss (Raw)": 2.215927839279175, "Pretrain/Step": 3974, "Pretrain/Step Time": 8.438874311745167} +{"Pretrain/Learning Rate": 3.281741431720219e-05, "Pretrain/Loss": 2.0527238845825195, "Pretrain/Loss (Raw)": 2.0998542308807373, "Pretrain/Step": 3975, "Pretrain/Step Time": 8.43887796625495} +{"Pretrain/Learning Rate": 3.280934973453395e-05, "Pretrain/Loss": 2.0565881729125977, "Pretrain/Loss (Raw)": 2.4846532344818115, "Pretrain/Step": 3976, "Pretrain/Step Time": 8.439667889848351} +{"Pretrain/Learning Rate": 3.28012842512547e-05, "Pretrain/Loss": 2.0560479164123535, "Pretrain/Loss (Raw)": 2.0921030044555664, "Pretrain/Step": 3977, "Pretrain/Step Time": 8.437124408781528} +{"Pretrain/Learning Rate": 3.279321786829459e-05, "Pretrain/Loss": 2.0561861991882324, "Pretrain/Loss (Raw)": 2.1056439876556396, "Pretrain/Step": 3978, "Pretrain/Step Time": 8.441532192751765} +{"Pretrain/Learning Rate": 3.278515058658387e-05, "Pretrain/Loss": 2.0543766021728516, "Pretrain/Loss (Raw)": 1.8384041786193848, "Pretrain/Step": 3979, "Pretrain/Step Time": 8.43937866576016} +{"Pretrain/Learning Rate": 3.27770824070529e-05, "Pretrain/Loss": 2.0559890270233154, "Pretrain/Loss (Raw)": 2.0302929878234863, "Pretrain/Step": 3980, "Pretrain/Step Time": 8.442291185259819} +{"Pretrain/Learning Rate": 3.276901333063215e-05, "Pretrain/Loss": 2.0533952713012695, "Pretrain/Loss (Raw)": 2.0246713161468506, "Pretrain/Step": 3981, "Pretrain/Step Time": 8.444714061915874} +{"Pretrain/Learning Rate": 3.276094335825217e-05, "Pretrain/Loss": 2.0540947914123535, "Pretrain/Loss (Raw)": 2.0079345703125, "Pretrain/Step": 3982, "Pretrain/Step Time": 8.44576064683497} +{"Pretrain/Learning Rate": 3.2752872490843626e-05, "Pretrain/Loss": 2.0540082454681396, "Pretrain/Loss (Raw)": 1.919559121131897, "Pretrain/Step": 3983, "Pretrain/Step Time": 8.44463950023055} +{"Pretrain/Learning Rate": 3.274480072933729e-05, "Pretrain/Loss": 2.0523266792297363, "Pretrain/Loss (Raw)": 1.9265576601028442, "Pretrain/Step": 3984, "Pretrain/Step Time": 8.445773150771856} +{"Pretrain/Learning Rate": 3.273672807466405e-05, "Pretrain/Loss": 2.0519790649414062, "Pretrain/Loss (Raw)": 1.9343510866165161, "Pretrain/Step": 3985, "Pretrain/Step Time": 8.442312460392714} +{"Pretrain/Learning Rate": 3.272865452775487e-05, "Pretrain/Loss": 2.051856517791748, "Pretrain/Loss (Raw)": 1.994784951210022, "Pretrain/Step": 3986, "Pretrain/Step Time": 8.44976063258946} +{"Pretrain/Learning Rate": 3.272058008954083e-05, "Pretrain/Loss": 2.050507068634033, "Pretrain/Loss (Raw)": 1.9251347780227661, "Pretrain/Step": 3987, "Pretrain/Step Time": 8.445297313854098} +{"Pretrain/Learning Rate": 3.271250476095311e-05, "Pretrain/Loss": 2.051241397857666, "Pretrain/Loss (Raw)": 2.1715242862701416, "Pretrain/Step": 3988, "Pretrain/Step Time": 8.444597447291017} +{"Pretrain/Learning Rate": 3.2704428542923e-05, "Pretrain/Loss": 2.0487313270568848, "Pretrain/Loss (Raw)": 1.865637183189392, "Pretrain/Step": 3989, "Pretrain/Step Time": 8.447016818448901} +{"Pretrain/Learning Rate": 3.269635143638188e-05, "Pretrain/Loss": 2.0506114959716797, "Pretrain/Loss (Raw)": 2.1982815265655518, "Pretrain/Step": 3990, "Pretrain/Step Time": 8.442546473816037} +{"Pretrain/Learning Rate": 3.2688273442261255e-05, "Pretrain/Loss": 2.0508499145507812, "Pretrain/Loss (Raw)": 2.1302497386932373, "Pretrain/Step": 3991, "Pretrain/Step Time": 8.433557840064168} +{"Pretrain/Learning Rate": 3.26801945614927e-05, "Pretrain/Loss": 2.0528342723846436, "Pretrain/Loss (Raw)": 2.14677095413208, "Pretrain/Step": 3992, "Pretrain/Step Time": 8.437192972749472} +{"Pretrain/Learning Rate": 3.2672114795007926e-05, "Pretrain/Loss": 2.0523900985717773, "Pretrain/Loss (Raw)": 1.962811827659607, "Pretrain/Step": 3993, "Pretrain/Step Time": 8.437097938731313} +{"Pretrain/Learning Rate": 3.266403414373872e-05, "Pretrain/Loss": 2.05240535736084, "Pretrain/Loss (Raw)": 1.9076181650161743, "Pretrain/Step": 3994, "Pretrain/Step Time": 8.43681206740439} +{"Pretrain/Learning Rate": 3.265595260861698e-05, "Pretrain/Loss": 2.051753044128418, "Pretrain/Loss (Raw)": 2.090334892272949, "Pretrain/Step": 3995, "Pretrain/Step Time": 8.440568465739489} +{"Pretrain/Learning Rate": 3.264787019057471e-05, "Pretrain/Loss": 2.050906181335449, "Pretrain/Loss (Raw)": 2.058870792388916, "Pretrain/Step": 3996, "Pretrain/Step Time": 8.428999200463295} +{"Pretrain/Learning Rate": 3.2639786890544014e-05, "Pretrain/Loss": 2.046952724456787, "Pretrain/Loss (Raw)": 1.989888310432434, "Pretrain/Step": 3997, "Pretrain/Step Time": 8.427256857976317} +{"Pretrain/Learning Rate": 3.263170270945709e-05, "Pretrain/Loss": 2.047537326812744, "Pretrain/Loss (Raw)": 2.2000954151153564, "Pretrain/Step": 3998, "Pretrain/Step Time": 8.434610445052385} +{"Pretrain/Learning Rate": 3.262361764824625e-05, "Pretrain/Loss": 2.0483222007751465, "Pretrain/Loss (Raw)": 2.0893588066101074, "Pretrain/Step": 3999, "Pretrain/Step Time": 8.433229565620422} +{"Pretrain/Learning Rate": 3.26155317078439e-05, "Pretrain/Loss": 2.049023151397705, "Pretrain/Loss (Raw)": 2.189650535583496, "Pretrain/Step": 4000, "Pretrain/Step Time": 8.431111607700586} +{"Pretrain/Learning Rate": 3.260744488918254e-05, "Pretrain/Loss": 2.0488367080688477, "Pretrain/Loss (Raw)": 2.083090305328369, "Pretrain/Step": 4001, "Pretrain/Step Time": 8.4362530130893} +{"Pretrain/Learning Rate": 3.25993571931948e-05, "Pretrain/Loss": 2.0456557273864746, "Pretrain/Loss (Raw)": 1.6216129064559937, "Pretrain/Step": 4002, "Pretrain/Step Time": 8.42330813035369} +{"Pretrain/Learning Rate": 3.259126862081337e-05, "Pretrain/Loss": 2.0466318130493164, "Pretrain/Loss (Raw)": 2.1833317279815674, "Pretrain/Step": 4003, "Pretrain/Step Time": 8.426144180819392} +{"Pretrain/Learning Rate": 3.258317917297108e-05, "Pretrain/Loss": 2.0456924438476562, "Pretrain/Loss (Raw)": 2.111621379852295, "Pretrain/Step": 4004, "Pretrain/Step Time": 8.434334721416235} +{"Pretrain/Learning Rate": 3.2575088850600826e-05, "Pretrain/Loss": 2.0458502769470215, "Pretrain/Loss (Raw)": 2.055067300796509, "Pretrain/Step": 4005, "Pretrain/Step Time": 8.433712868019938} +{"Pretrain/Learning Rate": 3.2566997654635634e-05, "Pretrain/Loss": 2.0447635650634766, "Pretrain/Loss (Raw)": 1.8728619813919067, "Pretrain/Step": 4006, "Pretrain/Step Time": 8.433064185082912} +{"Pretrain/Learning Rate": 3.2558905586008616e-05, "Pretrain/Loss": 2.0458147525787354, "Pretrain/Loss (Raw)": 2.069312334060669, "Pretrain/Step": 4007, "Pretrain/Step Time": 8.425600772723556} +{"Pretrain/Learning Rate": 3.2550812645652985e-05, "Pretrain/Loss": 2.0456671714782715, "Pretrain/Loss (Raw)": 2.322953701019287, "Pretrain/Step": 4008, "Pretrain/Step Time": 8.42436675913632} +{"Pretrain/Learning Rate": 3.2542718834502056e-05, "Pretrain/Loss": 2.0460667610168457, "Pretrain/Loss (Raw)": 2.091492176055908, "Pretrain/Step": 4009, "Pretrain/Step Time": 8.427886450663209} +{"Pretrain/Learning Rate": 3.253462415348926e-05, "Pretrain/Loss": 2.048450469970703, "Pretrain/Loss (Raw)": 2.4221134185791016, "Pretrain/Step": 4010, "Pretrain/Step Time": 8.43266898021102} +{"Pretrain/Learning Rate": 3.252652860354809e-05, "Pretrain/Loss": 2.048583745956421, "Pretrain/Loss (Raw)": 1.8348501920700073, "Pretrain/Step": 4011, "Pretrain/Step Time": 8.432458773255348} +{"Pretrain/Learning Rate": 3.2518432185612184e-05, "Pretrain/Loss": 2.0482840538024902, "Pretrain/Loss (Raw)": 2.075244665145874, "Pretrain/Step": 4012, "Pretrain/Step Time": 8.430847655981779} +{"Pretrain/Learning Rate": 3.2510334900615254e-05, "Pretrain/Loss": 2.0489232540130615, "Pretrain/Loss (Raw)": 1.998458981513977, "Pretrain/Step": 4013, "Pretrain/Step Time": 8.428383283317089} +{"Pretrain/Learning Rate": 3.25022367494911e-05, "Pretrain/Loss": 2.0499563217163086, "Pretrain/Loss (Raw)": 1.9547861814498901, "Pretrain/Step": 4014, "Pretrain/Step Time": 8.428138019517064} +{"Pretrain/Learning Rate": 3.2494137733173666e-05, "Pretrain/Loss": 2.0493874549865723, "Pretrain/Loss (Raw)": 1.9366950988769531, "Pretrain/Step": 4015, "Pretrain/Step Time": 8.431828076019883} +{"Pretrain/Learning Rate": 3.2486037852596946e-05, "Pretrain/Loss": 2.0493693351745605, "Pretrain/Loss (Raw)": 2.098285436630249, "Pretrain/Step": 4016, "Pretrain/Step Time": 8.437980519607663} +{"Pretrain/Learning Rate": 3.247793710869507e-05, "Pretrain/Loss": 2.048821449279785, "Pretrain/Loss (Raw)": 1.9413074254989624, "Pretrain/Step": 4017, "Pretrain/Step Time": 8.436253251507878} +{"Pretrain/Learning Rate": 3.2469835502402246e-05, "Pretrain/Loss": 2.0496721267700195, "Pretrain/Loss (Raw)": 2.2376186847686768, "Pretrain/Step": 4018, "Pretrain/Step Time": 8.43283429555595} +{"Pretrain/Learning Rate": 3.2461733034652794e-05, "Pretrain/Loss": 2.050659656524658, "Pretrain/Loss (Raw)": 2.0739235877990723, "Pretrain/Step": 4019, "Pretrain/Step Time": 8.431303802877665} +{"Pretrain/Learning Rate": 3.245362970638113e-05, "Pretrain/Loss": 2.052744150161743, "Pretrain/Loss (Raw)": 2.3928630352020264, "Pretrain/Step": 4020, "Pretrain/Step Time": 8.431447055190802} +{"Pretrain/Learning Rate": 3.244552551852176e-05, "Pretrain/Loss": 2.050973892211914, "Pretrain/Loss (Raw)": 1.9561833143234253, "Pretrain/Step": 4021, "Pretrain/Step Time": 8.435502212494612} +{"Pretrain/Learning Rate": 3.24374204720093e-05, "Pretrain/Loss": 2.050004005432129, "Pretrain/Loss (Raw)": 2.069988250732422, "Pretrain/Step": 4022, "Pretrain/Step Time": 8.436035245656967} +{"Pretrain/Learning Rate": 3.242931456777848e-05, "Pretrain/Loss": 2.0497922897338867, "Pretrain/Loss (Raw)": 2.0939106941223145, "Pretrain/Step": 4023, "Pretrain/Step Time": 8.435778917744756} +{"Pretrain/Learning Rate": 3.242120780676408e-05, "Pretrain/Loss": 2.0473289489746094, "Pretrain/Loss (Raw)": 1.9059555530548096, "Pretrain/Step": 4024, "Pretrain/Step Time": 8.4302744474262} +{"Pretrain/Learning Rate": 3.2413100189901036e-05, "Pretrain/Loss": 2.046818971633911, "Pretrain/Loss (Raw)": 2.0677330493927, "Pretrain/Step": 4025, "Pretrain/Step Time": 8.43060364574194} +{"Pretrain/Learning Rate": 3.2404991718124346e-05, "Pretrain/Loss": 2.0482938289642334, "Pretrain/Loss (Raw)": 2.353847026824951, "Pretrain/Step": 4026, "Pretrain/Step Time": 8.434228176251054} +{"Pretrain/Learning Rate": 3.239688239236911e-05, "Pretrain/Loss": 2.048283100128174, "Pretrain/Loss (Raw)": 1.9939568042755127, "Pretrain/Step": 4027, "Pretrain/Step Time": 8.44436178356409} +{"Pretrain/Learning Rate": 3.238877221357054e-05, "Pretrain/Loss": 2.0504231452941895, "Pretrain/Loss (Raw)": 2.1994762420654297, "Pretrain/Step": 4028, "Pretrain/Step Time": 8.441107511520386} +{"Pretrain/Learning Rate": 3.2380661182663956e-05, "Pretrain/Loss": 2.0503783226013184, "Pretrain/Loss (Raw)": 2.150545358657837, "Pretrain/Step": 4029, "Pretrain/Step Time": 8.437316123396158} +{"Pretrain/Learning Rate": 3.237254930058474e-05, "Pretrain/Loss": 2.0492541790008545, "Pretrain/Loss (Raw)": 1.856411337852478, "Pretrain/Step": 4030, "Pretrain/Step Time": 8.43560765683651} +{"Pretrain/Learning Rate": 3.236443656826839e-05, "Pretrain/Loss": 2.049665927886963, "Pretrain/Loss (Raw)": 1.9981659650802612, "Pretrain/Step": 4031, "Pretrain/Step Time": 8.43381511233747} +{"Pretrain/Learning Rate": 3.235632298665052e-05, "Pretrain/Loss": 2.048631191253662, "Pretrain/Loss (Raw)": 1.9147849082946777, "Pretrain/Step": 4032, "Pretrain/Step Time": 8.440286040306091} +{"Pretrain/Learning Rate": 3.234820855666681e-05, "Pretrain/Loss": 2.048731803894043, "Pretrain/Loss (Raw)": 2.081727981567383, "Pretrain/Step": 4033, "Pretrain/Step Time": 8.444038353860378} +{"Pretrain/Learning Rate": 3.234009327925308e-05, "Pretrain/Loss": 2.049455165863037, "Pretrain/Loss (Raw)": 2.1141250133514404, "Pretrain/Step": 4034, "Pretrain/Step Time": 8.443536402657628} +{"Pretrain/Learning Rate": 3.23319771553452e-05, "Pretrain/Loss": 2.050804615020752, "Pretrain/Loss (Raw)": 2.2010433673858643, "Pretrain/Step": 4035, "Pretrain/Step Time": 8.434532461687922} +{"Pretrain/Learning Rate": 3.232386018587916e-05, "Pretrain/Loss": 2.0495073795318604, "Pretrain/Loss (Raw)": 2.052948474884033, "Pretrain/Step": 4036, "Pretrain/Step Time": 8.438898729160428} +{"Pretrain/Learning Rate": 3.2315742371791046e-05, "Pretrain/Loss": 2.0504603385925293, "Pretrain/Loss (Raw)": 2.1743860244750977, "Pretrain/Step": 4037, "Pretrain/Step Time": 8.439947756007314} +{"Pretrain/Learning Rate": 3.230762371401705e-05, "Pretrain/Loss": 2.04872727394104, "Pretrain/Loss (Raw)": 1.9566541910171509, "Pretrain/Step": 4038, "Pretrain/Step Time": 8.445737220346928} +{"Pretrain/Learning Rate": 3.2299504213493464e-05, "Pretrain/Loss": 2.050218105316162, "Pretrain/Loss (Raw)": 1.9610435962677002, "Pretrain/Step": 4039, "Pretrain/Step Time": 8.448538340628147} +{"Pretrain/Learning Rate": 3.229138387115665e-05, "Pretrain/Loss": 2.0501058101654053, "Pretrain/Loss (Raw)": 1.8994581699371338, "Pretrain/Step": 4040, "Pretrain/Step Time": 8.449247039854527} +{"Pretrain/Learning Rate": 3.228326268794309e-05, "Pretrain/Loss": 2.052827835083008, "Pretrain/Loss (Raw)": 2.300377607345581, "Pretrain/Step": 4041, "Pretrain/Step Time": 8.438320828601718} +{"Pretrain/Learning Rate": 3.227514066478936e-05, "Pretrain/Loss": 2.051485061645508, "Pretrain/Loss (Raw)": 1.951116681098938, "Pretrain/Step": 4042, "Pretrain/Step Time": 8.440937591716647} +{"Pretrain/Learning Rate": 3.226701780263212e-05, "Pretrain/Loss": 2.051267147064209, "Pretrain/Loss (Raw)": 2.0338988304138184, "Pretrain/Step": 4043, "Pretrain/Step Time": 8.442665785551071} +{"Pretrain/Learning Rate": 3.225889410240815e-05, "Pretrain/Loss": 2.0518717765808105, "Pretrain/Loss (Raw)": 2.117640972137451, "Pretrain/Step": 4044, "Pretrain/Step Time": 8.446464410051703} +{"Pretrain/Learning Rate": 3.2250769565054305e-05, "Pretrain/Loss": 2.049699306488037, "Pretrain/Loss (Raw)": 2.1231846809387207, "Pretrain/Step": 4045, "Pretrain/Step Time": 8.440590402111411} +{"Pretrain/Learning Rate": 3.2242644191507545e-05, "Pretrain/Loss": 2.0491623878479004, "Pretrain/Loss (Raw)": 1.96145761013031, "Pretrain/Step": 4046, "Pretrain/Step Time": 8.43763374723494} +{"Pretrain/Learning Rate": 3.223451798270493e-05, "Pretrain/Loss": 2.050013303756714, "Pretrain/Loss (Raw)": 1.9840714931488037, "Pretrain/Step": 4047, "Pretrain/Step Time": 8.435031794011593} +{"Pretrain/Learning Rate": 3.222639093958361e-05, "Pretrain/Loss": 2.0492124557495117, "Pretrain/Loss (Raw)": 1.9761747121810913, "Pretrain/Step": 4048, "Pretrain/Step Time": 8.428107952699065} +{"Pretrain/Learning Rate": 3.2218263063080836e-05, "Pretrain/Loss": 2.0506153106689453, "Pretrain/Loss (Raw)": 2.069319248199463, "Pretrain/Step": 4049, "Pretrain/Step Time": 8.431298281997442} +{"Pretrain/Learning Rate": 3.221013435413395e-05, "Pretrain/Loss": 2.0522472858428955, "Pretrain/Loss (Raw)": 2.0667715072631836, "Pretrain/Step": 4050, "Pretrain/Step Time": 8.434662876650691} +{"Pretrain/Learning Rate": 3.220200481368039e-05, "Pretrain/Loss": 2.0536913871765137, "Pretrain/Loss (Raw)": 2.040482759475708, "Pretrain/Step": 4051, "Pretrain/Step Time": 8.43700591661036} +{"Pretrain/Learning Rate": 3.219387444265771e-05, "Pretrain/Loss": 2.054654598236084, "Pretrain/Loss (Raw)": 1.969616413116455, "Pretrain/Step": 4052, "Pretrain/Step Time": 8.434111468493938} +{"Pretrain/Learning Rate": 3.2185743242003524e-05, "Pretrain/Loss": 2.056318521499634, "Pretrain/Loss (Raw)": 2.2433290481567383, "Pretrain/Step": 4053, "Pretrain/Step Time": 8.436299379914999} +{"Pretrain/Learning Rate": 3.217761121265557e-05, "Pretrain/Loss": 2.0569236278533936, "Pretrain/Loss (Raw)": 2.0134003162384033, "Pretrain/Step": 4054, "Pretrain/Step Time": 8.438028868287802} +{"Pretrain/Learning Rate": 3.2169478355551665e-05, "Pretrain/Loss": 2.0564541816711426, "Pretrain/Loss (Raw)": 2.2380380630493164, "Pretrain/Step": 4055, "Pretrain/Step Time": 8.44284439086914} +{"Pretrain/Learning Rate": 3.216134467162973e-05, "Pretrain/Loss": 2.0545544624328613, "Pretrain/Loss (Raw)": 2.125154495239258, "Pretrain/Step": 4056, "Pretrain/Step Time": 8.444148709997535} +{"Pretrain/Learning Rate": 3.215321016182779e-05, "Pretrain/Loss": 2.053229808807373, "Pretrain/Loss (Raw)": 2.1697211265563965, "Pretrain/Step": 4057, "Pretrain/Step Time": 8.443115210160613} +{"Pretrain/Learning Rate": 3.2145074827083946e-05, "Pretrain/Loss": 2.053356409072876, "Pretrain/Loss (Raw)": 2.1850647926330566, "Pretrain/Step": 4058, "Pretrain/Step Time": 8.434070564806461} +{"Pretrain/Learning Rate": 3.21369386683364e-05, "Pretrain/Loss": 2.0529706478118896, "Pretrain/Loss (Raw)": 2.204556941986084, "Pretrain/Step": 4059, "Pretrain/Step Time": 8.434965929016471} +{"Pretrain/Learning Rate": 3.212880168652346e-05, "Pretrain/Loss": 2.053524971008301, "Pretrain/Loss (Raw)": 2.1795785427093506, "Pretrain/Step": 4060, "Pretrain/Step Time": 8.436268482357264} +{"Pretrain/Learning Rate": 3.2120663882583514e-05, "Pretrain/Loss": 2.052446126937866, "Pretrain/Loss (Raw)": 2.033446788787842, "Pretrain/Step": 4061, "Pretrain/Step Time": 8.44485049135983} +{"Pretrain/Learning Rate": 3.2112525257455064e-05, "Pretrain/Loss": 2.0514397621154785, "Pretrain/Loss (Raw)": 2.0573999881744385, "Pretrain/Step": 4062, "Pretrain/Step Time": 8.444831056520343} +{"Pretrain/Learning Rate": 3.210438581207667e-05, "Pretrain/Loss": 2.0524635314941406, "Pretrain/Loss (Raw)": 2.214301109313965, "Pretrain/Step": 4063, "Pretrain/Step Time": 8.436181461438537} +{"Pretrain/Learning Rate": 3.209624554738704e-05, "Pretrain/Loss": 2.0531985759735107, "Pretrain/Loss (Raw)": 2.065802574157715, "Pretrain/Step": 4064, "Pretrain/Step Time": 8.427238455042243} +{"Pretrain/Learning Rate": 3.208810446432493e-05, "Pretrain/Loss": 2.051931858062744, "Pretrain/Loss (Raw)": 2.002040386199951, "Pretrain/Step": 4065, "Pretrain/Step Time": 8.428792219609022} +{"Pretrain/Learning Rate": 3.207996256382922e-05, "Pretrain/Loss": 2.051701784133911, "Pretrain/Loss (Raw)": 1.9929141998291016, "Pretrain/Step": 4066, "Pretrain/Step Time": 8.438570076599717} +{"Pretrain/Learning Rate": 3.207181984683886e-05, "Pretrain/Loss": 2.0500826835632324, "Pretrain/Loss (Raw)": 1.8296855688095093, "Pretrain/Step": 4067, "Pretrain/Step Time": 8.438727898523211} +{"Pretrain/Learning Rate": 3.2063676314292914e-05, "Pretrain/Loss": 2.0505218505859375, "Pretrain/Loss (Raw)": 2.240724563598633, "Pretrain/Step": 4068, "Pretrain/Step Time": 8.438013950362802} +{"Pretrain/Learning Rate": 3.205553196713052e-05, "Pretrain/Loss": 2.053804397583008, "Pretrain/Loss (Raw)": 2.1693532466888428, "Pretrain/Step": 4069, "Pretrain/Step Time": 8.430443927645683} +{"Pretrain/Learning Rate": 3.204738680629094e-05, "Pretrain/Loss": 2.055109739303589, "Pretrain/Loss (Raw)": 2.1726491451263428, "Pretrain/Step": 4070, "Pretrain/Step Time": 8.431272806599736} +{"Pretrain/Learning Rate": 3.2039240832713516e-05, "Pretrain/Loss": 2.054203987121582, "Pretrain/Loss (Raw)": 1.916731357574463, "Pretrain/Step": 4071, "Pretrain/Step Time": 8.42955362983048} +{"Pretrain/Learning Rate": 3.203109404733765e-05, "Pretrain/Loss": 2.0570037364959717, "Pretrain/Loss (Raw)": 2.104702949523926, "Pretrain/Step": 4072, "Pretrain/Step Time": 8.435101717710495} +{"Pretrain/Learning Rate": 3.20229464511029e-05, "Pretrain/Loss": 2.055157423019409, "Pretrain/Loss (Raw)": 1.7035080194473267, "Pretrain/Step": 4073, "Pretrain/Step Time": 8.437157269567251} +{"Pretrain/Learning Rate": 3.2014798044948866e-05, "Pretrain/Loss": 2.055957794189453, "Pretrain/Loss (Raw)": 2.1244866847991943, "Pretrain/Step": 4074, "Pretrain/Step Time": 8.435787195339799} +{"Pretrain/Learning Rate": 3.2006648829815265e-05, "Pretrain/Loss": 2.055203437805176, "Pretrain/Loss (Raw)": 2.104395627975464, "Pretrain/Step": 4075, "Pretrain/Step Time": 8.434854662045836} +{"Pretrain/Learning Rate": 3.1998498806641907e-05, "Pretrain/Loss": 2.0558831691741943, "Pretrain/Loss (Raw)": 2.029788017272949, "Pretrain/Step": 4076, "Pretrain/Step Time": 8.43328120186925} +{"Pretrain/Learning Rate": 3.19903479763687e-05, "Pretrain/Loss": 2.054715156555176, "Pretrain/Loss (Raw)": 1.872840166091919, "Pretrain/Step": 4077, "Pretrain/Step Time": 8.435256868600845} +{"Pretrain/Learning Rate": 3.19821963399356e-05, "Pretrain/Loss": 2.0562286376953125, "Pretrain/Loss (Raw)": 2.1211721897125244, "Pretrain/Step": 4078, "Pretrain/Step Time": 8.43433347903192} +{"Pretrain/Learning Rate": 3.1974043898282744e-05, "Pretrain/Loss": 2.0519192218780518, "Pretrain/Loss (Raw)": 1.4470434188842773, "Pretrain/Step": 4079, "Pretrain/Step Time": 8.440730102360249} +{"Pretrain/Learning Rate": 3.196589065235026e-05, "Pretrain/Loss": 2.0515198707580566, "Pretrain/Loss (Raw)": 1.9884313344955444, "Pretrain/Step": 4080, "Pretrain/Step Time": 8.442150518298149} +{"Pretrain/Learning Rate": 3.195773660307846e-05, "Pretrain/Loss": 2.0526671409606934, "Pretrain/Loss (Raw)": 2.0125679969787598, "Pretrain/Step": 4081, "Pretrain/Step Time": 8.43233772367239} +{"Pretrain/Learning Rate": 3.1949581751407676e-05, "Pretrain/Loss": 2.052408218383789, "Pretrain/Loss (Raw)": 1.948903203010559, "Pretrain/Step": 4082, "Pretrain/Step Time": 8.431302571669221} +{"Pretrain/Learning Rate": 3.1941426098278383e-05, "Pretrain/Loss": 2.050638198852539, "Pretrain/Loss (Raw)": 1.7833483219146729, "Pretrain/Step": 4083, "Pretrain/Step Time": 8.43521922826767} +{"Pretrain/Learning Rate": 3.193326964463112e-05, "Pretrain/Loss": 2.0515248775482178, "Pretrain/Loss (Raw)": 2.1057653427124023, "Pretrain/Step": 4084, "Pretrain/Step Time": 8.439689718186855} +{"Pretrain/Learning Rate": 3.192511239140653e-05, "Pretrain/Loss": 2.0509467124938965, "Pretrain/Loss (Raw)": 2.067854881286621, "Pretrain/Step": 4085, "Pretrain/Step Time": 8.439107211306691} +{"Pretrain/Learning Rate": 3.1916954339545355e-05, "Pretrain/Loss": 2.050936460494995, "Pretrain/Loss (Raw)": 2.0821692943573, "Pretrain/Step": 4086, "Pretrain/Step Time": 8.432555973529816} +{"Pretrain/Learning Rate": 3.19087954899884e-05, "Pretrain/Loss": 2.0504302978515625, "Pretrain/Loss (Raw)": 2.0931951999664307, "Pretrain/Step": 4087, "Pretrain/Step Time": 8.429002916440368} +{"Pretrain/Learning Rate": 3.190063584367661e-05, "Pretrain/Loss": 2.051419258117676, "Pretrain/Loss (Raw)": 2.0089101791381836, "Pretrain/Step": 4088, "Pretrain/Step Time": 8.427585864439607} +{"Pretrain/Learning Rate": 3.1892475401550956e-05, "Pretrain/Loss": 2.04927921295166, "Pretrain/Loss (Raw)": 2.0883841514587402, "Pretrain/Step": 4089, "Pretrain/Step Time": 8.435325486585498} +{"Pretrain/Learning Rate": 3.1884314164552576e-05, "Pretrain/Loss": 2.0493667125701904, "Pretrain/Loss (Raw)": 2.0553059577941895, "Pretrain/Step": 4090, "Pretrain/Step Time": 8.430315246805549} +{"Pretrain/Learning Rate": 3.187615213362264e-05, "Pretrain/Loss": 2.049193859100342, "Pretrain/Loss (Raw)": 2.0402402877807617, "Pretrain/Step": 4091, "Pretrain/Step Time": 8.43003905005753} +{"Pretrain/Learning Rate": 3.186798930970244e-05, "Pretrain/Loss": 2.0496044158935547, "Pretrain/Loss (Raw)": 2.153684139251709, "Pretrain/Step": 4092, "Pretrain/Step Time": 8.431835988536477} +{"Pretrain/Learning Rate": 3.185982569373335e-05, "Pretrain/Loss": 2.0508108139038086, "Pretrain/Loss (Raw)": 1.9575759172439575, "Pretrain/Step": 4093, "Pretrain/Step Time": 8.42498154938221} +{"Pretrain/Learning Rate": 3.185166128665684e-05, "Pretrain/Loss": 2.0472593307495117, "Pretrain/Loss (Raw)": 2.0914628505706787, "Pretrain/Step": 4094, "Pretrain/Step Time": 8.426550446078181} +{"Pretrain/Learning Rate": 3.184349608941446e-05, "Pretrain/Loss": 2.0467662811279297, "Pretrain/Loss (Raw)": 2.015174388885498, "Pretrain/Step": 4095, "Pretrain/Step Time": 8.431847287341952} +{"Pretrain/Learning Rate": 3.183533010294787e-05, "Pretrain/Loss": 2.0510342121124268, "Pretrain/Loss (Raw)": 2.549818515777588, "Pretrain/Step": 4096, "Pretrain/Step Time": 8.427475735545158} +{"Pretrain/Learning Rate": 3.18271633281988e-05, "Pretrain/Loss": 2.0516791343688965, "Pretrain/Loss (Raw)": 1.9783114194869995, "Pretrain/Step": 4097, "Pretrain/Step Time": 8.42181403748691} +{"Pretrain/Learning Rate": 3.181899576610908e-05, "Pretrain/Loss": 2.0524682998657227, "Pretrain/Loss (Raw)": 1.9720796346664429, "Pretrain/Step": 4098, "Pretrain/Step Time": 8.425571247935295} +{"Pretrain/Learning Rate": 3.1810827417620634e-05, "Pretrain/Loss": 2.0537948608398438, "Pretrain/Loss (Raw)": 2.1522085666656494, "Pretrain/Step": 4099, "Pretrain/Step Time": 8.424437390640378} +{"Pretrain/Learning Rate": 3.1802658283675486e-05, "Pretrain/Loss": 2.0562071800231934, "Pretrain/Loss (Raw)": 2.207383632659912, "Pretrain/Step": 4100, "Pretrain/Step Time": 8.431083565577865} +{"Pretrain/Learning Rate": 3.179448836521573e-05, "Pretrain/Loss": 2.0604476928710938, "Pretrain/Loss (Raw)": 2.247783899307251, "Pretrain/Step": 4101, "Pretrain/Step Time": 8.432012058794498} +{"Pretrain/Learning Rate": 3.178631766318355e-05, "Pretrain/Loss": 2.0583648681640625, "Pretrain/Loss (Raw)": 1.9493440389633179, "Pretrain/Step": 4102, "Pretrain/Step Time": 8.429756589233875} +{"Pretrain/Learning Rate": 3.177814617852124e-05, "Pretrain/Loss": 2.05781888961792, "Pretrain/Loss (Raw)": 2.0299501419067383, "Pretrain/Step": 4103, "Pretrain/Step Time": 8.423952791839838} +{"Pretrain/Learning Rate": 3.176997391217117e-05, "Pretrain/Loss": 2.055854082107544, "Pretrain/Loss (Raw)": 2.2331454753875732, "Pretrain/Step": 4104, "Pretrain/Step Time": 8.424679206684232} +{"Pretrain/Learning Rate": 3.176180086507582e-05, "Pretrain/Loss": 2.0550284385681152, "Pretrain/Loss (Raw)": 1.9864107370376587, "Pretrain/Step": 4105, "Pretrain/Step Time": 8.42506429925561} +{"Pretrain/Learning Rate": 3.175362703817773e-05, "Pretrain/Loss": 2.054119110107422, "Pretrain/Loss (Raw)": 1.9892771244049072, "Pretrain/Step": 4106, "Pretrain/Step Time": 8.422847619280219} +{"Pretrain/Learning Rate": 3.1745452432419534e-05, "Pretrain/Loss": 2.0551867485046387, "Pretrain/Loss (Raw)": 1.975046157836914, "Pretrain/Step": 4107, "Pretrain/Step Time": 8.422398641705513} +{"Pretrain/Learning Rate": 3.1737277048743984e-05, "Pretrain/Loss": 2.05610990524292, "Pretrain/Loss (Raw)": 2.148498773574829, "Pretrain/Step": 4108, "Pretrain/Step Time": 8.42163754068315} +{"Pretrain/Learning Rate": 3.17291008880939e-05, "Pretrain/Loss": 2.0562973022460938, "Pretrain/Loss (Raw)": 2.0486128330230713, "Pretrain/Step": 4109, "Pretrain/Step Time": 8.415088586509228} +{"Pretrain/Learning Rate": 3.172092395141219e-05, "Pretrain/Loss": 2.057283878326416, "Pretrain/Loss (Raw)": 2.134256601333618, "Pretrain/Step": 4110, "Pretrain/Step Time": 8.416776433587074} +{"Pretrain/Learning Rate": 3.171274623964186e-05, "Pretrain/Loss": 2.0565853118896484, "Pretrain/Loss (Raw)": 1.8301156759262085, "Pretrain/Step": 4111, "Pretrain/Step Time": 8.421955598518252} +{"Pretrain/Learning Rate": 3.170456775372601e-05, "Pretrain/Loss": 2.0567331314086914, "Pretrain/Loss (Raw)": 1.9455004930496216, "Pretrain/Step": 4112, "Pretrain/Step Time": 8.42764556594193} +{"Pretrain/Learning Rate": 3.1696388494607804e-05, "Pretrain/Loss": 2.057105541229248, "Pretrain/Loss (Raw)": 1.9819990396499634, "Pretrain/Step": 4113, "Pretrain/Step Time": 8.422278182581067} +{"Pretrain/Learning Rate": 3.168820846323053e-05, "Pretrain/Loss": 2.0558111667633057, "Pretrain/Loss (Raw)": 1.8291088342666626, "Pretrain/Step": 4114, "Pretrain/Step Time": 8.418428864330053} +{"Pretrain/Learning Rate": 3.1680027660537524e-05, "Pretrain/Loss": 2.0572476387023926, "Pretrain/Loss (Raw)": 2.1090023517608643, "Pretrain/Step": 4115, "Pretrain/Step Time": 8.4203439373523} +{"Pretrain/Learning Rate": 3.167184608747227e-05, "Pretrain/Loss": 2.05564546585083, "Pretrain/Loss (Raw)": 1.9664288759231567, "Pretrain/Step": 4116, "Pretrain/Step Time": 8.421390453353524} +{"Pretrain/Learning Rate": 3.1663663744978276e-05, "Pretrain/Loss": 2.057394504547119, "Pretrain/Loss (Raw)": 2.089529037475586, "Pretrain/Step": 4117, "Pretrain/Step Time": 8.428121311590075} +{"Pretrain/Learning Rate": 3.165548063399919e-05, "Pretrain/Loss": 2.057340383529663, "Pretrain/Loss (Raw)": 2.191357135772705, "Pretrain/Step": 4118, "Pretrain/Step Time": 8.4278615526855} +{"Pretrain/Learning Rate": 3.1647296755478694e-05, "Pretrain/Loss": 2.056786298751831, "Pretrain/Loss (Raw)": 2.0593314170837402, "Pretrain/Step": 4119, "Pretrain/Step Time": 8.427785452455282} +{"Pretrain/Learning Rate": 3.163911211036063e-05, "Pretrain/Loss": 2.0576980113983154, "Pretrain/Loss (Raw)": 2.2634623050689697, "Pretrain/Step": 4120, "Pretrain/Step Time": 8.42580846324563} +{"Pretrain/Learning Rate": 3.163092669958887e-05, "Pretrain/Loss": 2.057494640350342, "Pretrain/Loss (Raw)": 1.9367586374282837, "Pretrain/Step": 4121, "Pretrain/Step Time": 8.423287626355886} +{"Pretrain/Learning Rate": 3.16227405241074e-05, "Pretrain/Loss": 2.0580098628997803, "Pretrain/Loss (Raw)": 1.9735894203186035, "Pretrain/Step": 4122, "Pretrain/Step Time": 8.426260601729155} +{"Pretrain/Learning Rate": 3.161455358486028e-05, "Pretrain/Loss": 2.058779001235962, "Pretrain/Loss (Raw)": 2.188784122467041, "Pretrain/Step": 4123, "Pretrain/Step Time": 8.428936325013638} +{"Pretrain/Learning Rate": 3.160636588279167e-05, "Pretrain/Loss": 2.062774181365967, "Pretrain/Loss (Raw)": 2.570242404937744, "Pretrain/Step": 4124, "Pretrain/Step Time": 8.428718119859695} +{"Pretrain/Learning Rate": 3.159817741884582e-05, "Pretrain/Loss": 2.0626864433288574, "Pretrain/Loss (Raw)": 1.9786802530288696, "Pretrain/Step": 4125, "Pretrain/Step Time": 8.426481293514371} +{"Pretrain/Learning Rate": 3.1589988193967056e-05, "Pretrain/Loss": 2.06010103225708, "Pretrain/Loss (Raw)": 1.8691589832305908, "Pretrain/Step": 4126, "Pretrain/Step Time": 8.420677024871111} +{"Pretrain/Learning Rate": 3.15817982090998e-05, "Pretrain/Loss": 2.057892322540283, "Pretrain/Loss (Raw)": 1.806644082069397, "Pretrain/Step": 4127, "Pretrain/Step Time": 8.420354871079326} +{"Pretrain/Learning Rate": 3.157360746518857e-05, "Pretrain/Loss": 2.055464744567871, "Pretrain/Loss (Raw)": 1.878922700881958, "Pretrain/Step": 4128, "Pretrain/Step Time": 8.424896260723472} +{"Pretrain/Learning Rate": 3.1565415963177944e-05, "Pretrain/Loss": 2.052978754043579, "Pretrain/Loss (Raw)": 1.764878749847412, "Pretrain/Step": 4129, "Pretrain/Step Time": 8.433359479531646} +{"Pretrain/Learning Rate": 3.1557223704012606e-05, "Pretrain/Loss": 2.05769419670105, "Pretrain/Loss (Raw)": 2.2251803874969482, "Pretrain/Step": 4130, "Pretrain/Step Time": 8.430563190951943} +{"Pretrain/Learning Rate": 3.154903068863734e-05, "Pretrain/Loss": 2.056434392929077, "Pretrain/Loss (Raw)": 2.022094488143921, "Pretrain/Step": 4131, "Pretrain/Step Time": 8.429441198706627} +{"Pretrain/Learning Rate": 3.154083691799699e-05, "Pretrain/Loss": 2.0576207637786865, "Pretrain/Loss (Raw)": 2.2634706497192383, "Pretrain/Step": 4132, "Pretrain/Step Time": 8.422785207629204} +{"Pretrain/Learning Rate": 3.1532642393036506e-05, "Pretrain/Loss": 2.05692720413208, "Pretrain/Loss (Raw)": 1.9663063287734985, "Pretrain/Step": 4133, "Pretrain/Step Time": 8.423110758885741} +{"Pretrain/Learning Rate": 3.1524447114700914e-05, "Pretrain/Loss": 2.0586023330688477, "Pretrain/Loss (Raw)": 2.087252140045166, "Pretrain/Step": 4134, "Pretrain/Step Time": 8.433334019035101} +{"Pretrain/Learning Rate": 3.151625108393534e-05, "Pretrain/Loss": 2.0582921504974365, "Pretrain/Loss (Raw)": 2.0296125411987305, "Pretrain/Step": 4135, "Pretrain/Step Time": 8.433568138629198} +{"Pretrain/Learning Rate": 3.150805430168499e-05, "Pretrain/Loss": 2.059387445449829, "Pretrain/Loss (Raw)": 2.4631638526916504, "Pretrain/Step": 4136, "Pretrain/Step Time": 8.436574475839734} +{"Pretrain/Learning Rate": 3.149985676889515e-05, "Pretrain/Loss": 2.059058666229248, "Pretrain/Loss (Raw)": 2.0494017601013184, "Pretrain/Step": 4137, "Pretrain/Step Time": 8.429223967716098} +{"Pretrain/Learning Rate": 3.14916584865112e-05, "Pretrain/Loss": 2.055997371673584, "Pretrain/Loss (Raw)": 2.0302720069885254, "Pretrain/Step": 4138, "Pretrain/Step Time": 8.42762741073966} +{"Pretrain/Learning Rate": 3.1483459455478603e-05, "Pretrain/Loss": 2.0576252937316895, "Pretrain/Loss (Raw)": 2.0432064533233643, "Pretrain/Step": 4139, "Pretrain/Step Time": 8.42531893402338} +{"Pretrain/Learning Rate": 3.147525967674291e-05, "Pretrain/Loss": 2.055671215057373, "Pretrain/Loss (Raw)": 1.8251367807388306, "Pretrain/Step": 4140, "Pretrain/Step Time": 8.42875823751092} +{"Pretrain/Learning Rate": 3.146705915124976e-05, "Pretrain/Loss": 2.056711435317993, "Pretrain/Loss (Raw)": 2.1316075325012207, "Pretrain/Step": 4141, "Pretrain/Step Time": 8.426463657990098} +{"Pretrain/Learning Rate": 3.145885787994487e-05, "Pretrain/Loss": 2.0571227073669434, "Pretrain/Loss (Raw)": 2.007429361343384, "Pretrain/Step": 4142, "Pretrain/Step Time": 8.425934612751007} +{"Pretrain/Learning Rate": 3.1450655863774056e-05, "Pretrain/Loss": 2.058060646057129, "Pretrain/Loss (Raw)": 2.0567469596862793, "Pretrain/Step": 4143, "Pretrain/Step Time": 8.423812074586749} +{"Pretrain/Learning Rate": 3.144245310368321e-05, "Pretrain/Loss": 2.058405876159668, "Pretrain/Loss (Raw)": 2.142484426498413, "Pretrain/Step": 4144, "Pretrain/Step Time": 8.418824180960655} +{"Pretrain/Learning Rate": 3.1434249600618315e-05, "Pretrain/Loss": 2.0598185062408447, "Pretrain/Loss (Raw)": 2.1221132278442383, "Pretrain/Step": 4145, "Pretrain/Step Time": 8.422944396734238} +{"Pretrain/Learning Rate": 3.142604535552544e-05, "Pretrain/Loss": 2.0587754249572754, "Pretrain/Loss (Raw)": 2.1041040420532227, "Pretrain/Step": 4146, "Pretrain/Step Time": 8.435914235189557} +{"Pretrain/Learning Rate": 3.1417840369350735e-05, "Pretrain/Loss": 2.0581107139587402, "Pretrain/Loss (Raw)": 1.9888280630111694, "Pretrain/Step": 4147, "Pretrain/Step Time": 8.430256804451346} +{"Pretrain/Learning Rate": 3.140963464304043e-05, "Pretrain/Loss": 2.0546741485595703, "Pretrain/Loss (Raw)": 1.9530141353607178, "Pretrain/Step": 4148, "Pretrain/Step Time": 8.437273224815726} +{"Pretrain/Learning Rate": 3.140142817754086e-05, "Pretrain/Loss": 2.0571537017822266, "Pretrain/Loss (Raw)": 2.273529529571533, "Pretrain/Step": 4149, "Pretrain/Step Time": 8.430616896599531} +{"Pretrain/Learning Rate": 3.1393220973798425e-05, "Pretrain/Loss": 2.0568742752075195, "Pretrain/Loss (Raw)": 2.0342657566070557, "Pretrain/Step": 4150, "Pretrain/Step Time": 8.432898472994566} +{"Pretrain/Learning Rate": 3.1385013032759623e-05, "Pretrain/Loss": 2.056086540222168, "Pretrain/Loss (Raw)": 1.9930408000946045, "Pretrain/Step": 4151, "Pretrain/Step Time": 8.43365666270256} +{"Pretrain/Learning Rate": 3.137680435537104e-05, "Pretrain/Loss": 2.057651996612549, "Pretrain/Loss (Raw)": 2.106372117996216, "Pretrain/Step": 4152, "Pretrain/Step Time": 8.443741880357265} +{"Pretrain/Learning Rate": 3.136859494257931e-05, "Pretrain/Loss": 2.0564918518066406, "Pretrain/Loss (Raw)": 1.919204831123352, "Pretrain/Step": 4153, "Pretrain/Step Time": 8.441000858321786} +{"Pretrain/Learning Rate": 3.136038479533122e-05, "Pretrain/Loss": 2.053901195526123, "Pretrain/Loss (Raw)": 2.0222461223602295, "Pretrain/Step": 4154, "Pretrain/Step Time": 8.438700878992677} +{"Pretrain/Learning Rate": 3.135217391457358e-05, "Pretrain/Loss": 2.053187370300293, "Pretrain/Loss (Raw)": 1.9026002883911133, "Pretrain/Step": 4155, "Pretrain/Step Time": 8.433629769831896} +{"Pretrain/Learning Rate": 3.1343962301253305e-05, "Pretrain/Loss": 2.0544989109039307, "Pretrain/Loss (Raw)": 2.367357015609741, "Pretrain/Step": 4156, "Pretrain/Step Time": 8.436193635687232} +{"Pretrain/Learning Rate": 3.133574995631741e-05, "Pretrain/Loss": 2.054183006286621, "Pretrain/Loss (Raw)": 2.1100895404815674, "Pretrain/Step": 4157, "Pretrain/Step Time": 8.441201031208038} +{"Pretrain/Learning Rate": 3.132753688071297e-05, "Pretrain/Loss": 2.055675506591797, "Pretrain/Loss (Raw)": 2.0474607944488525, "Pretrain/Step": 4158, "Pretrain/Step Time": 8.443761324509978} +{"Pretrain/Learning Rate": 3.1319323075387165e-05, "Pretrain/Loss": 2.0569300651550293, "Pretrain/Loss (Raw)": 2.1587653160095215, "Pretrain/Step": 4159, "Pretrain/Step Time": 8.443471217527986} +{"Pretrain/Learning Rate": 3.131110854128724e-05, "Pretrain/Loss": 2.0586562156677246, "Pretrain/Loss (Raw)": 2.135707139968872, "Pretrain/Step": 4160, "Pretrain/Step Time": 8.437967037782073} +{"Pretrain/Learning Rate": 3.130289327936055e-05, "Pretrain/Loss": 2.0582756996154785, "Pretrain/Loss (Raw)": 2.0330512523651123, "Pretrain/Step": 4161, "Pretrain/Step Time": 8.43041580170393} +{"Pretrain/Learning Rate": 3.1294677290554494e-05, "Pretrain/Loss": 2.0581579208374023, "Pretrain/Loss (Raw)": 2.0990400314331055, "Pretrain/Step": 4162, "Pretrain/Step Time": 8.435601880773902} +{"Pretrain/Learning Rate": 3.128646057581659e-05, "Pretrain/Loss": 2.0598502159118652, "Pretrain/Loss (Raw)": 2.417651414871216, "Pretrain/Step": 4163, "Pretrain/Step Time": 8.443852324038744} +{"Pretrain/Learning Rate": 3.1278243136094436e-05, "Pretrain/Loss": 2.0625102519989014, "Pretrain/Loss (Raw)": 2.393440008163452, "Pretrain/Step": 4164, "Pretrain/Step Time": 8.437607849016786} +{"Pretrain/Learning Rate": 3.1270024972335706e-05, "Pretrain/Loss": 2.0620248317718506, "Pretrain/Loss (Raw)": 2.1122303009033203, "Pretrain/Step": 4165, "Pretrain/Step Time": 8.438038004562259} +{"Pretrain/Learning Rate": 3.1261806085488144e-05, "Pretrain/Loss": 2.063253402709961, "Pretrain/Loss (Raw)": 2.113938570022583, "Pretrain/Step": 4166, "Pretrain/Step Time": 8.435084391385317} +{"Pretrain/Learning Rate": 3.1253586476499594e-05, "Pretrain/Loss": 2.0634512901306152, "Pretrain/Loss (Raw)": 1.9863617420196533, "Pretrain/Step": 4167, "Pretrain/Step Time": 8.428746512159705} +{"Pretrain/Learning Rate": 3.124536614631799e-05, "Pretrain/Loss": 2.06402587890625, "Pretrain/Loss (Raw)": 1.9730148315429688, "Pretrain/Step": 4168, "Pretrain/Step Time": 8.435844806954265} +{"Pretrain/Learning Rate": 3.123714509589133e-05, "Pretrain/Loss": 2.0625505447387695, "Pretrain/Loss (Raw)": 2.111518383026123, "Pretrain/Step": 4169, "Pretrain/Step Time": 8.435672299936414} +{"Pretrain/Learning Rate": 3.122892332616771e-05, "Pretrain/Loss": 2.0621085166931152, "Pretrain/Loss (Raw)": 1.894511103630066, "Pretrain/Step": 4170, "Pretrain/Step Time": 8.43124526180327} +{"Pretrain/Learning Rate": 3.12207008380953e-05, "Pretrain/Loss": 2.0614352226257324, "Pretrain/Loss (Raw)": 1.9477319717407227, "Pretrain/Step": 4171, "Pretrain/Step Time": 8.432135047391057} +{"Pretrain/Learning Rate": 3.121247763262235e-05, "Pretrain/Loss": 2.0618255138397217, "Pretrain/Loss (Raw)": 2.167628288269043, "Pretrain/Step": 4172, "Pretrain/Step Time": 8.426864117383957} +{"Pretrain/Learning Rate": 3.120425371069721e-05, "Pretrain/Loss": 2.060814380645752, "Pretrain/Loss (Raw)": 1.9937424659729004, "Pretrain/Step": 4173, "Pretrain/Step Time": 8.436870232224464} +{"Pretrain/Learning Rate": 3.119602907326829e-05, "Pretrain/Loss": 2.060384750366211, "Pretrain/Loss (Raw)": 1.9064536094665527, "Pretrain/Step": 4174, "Pretrain/Step Time": 8.437968127429485} +{"Pretrain/Learning Rate": 3.118780372128411e-05, "Pretrain/Loss": 2.0613632202148438, "Pretrain/Loss (Raw)": 2.1093227863311768, "Pretrain/Step": 4175, "Pretrain/Step Time": 8.436689719557762} +{"Pretrain/Learning Rate": 3.1179577655693245e-05, "Pretrain/Loss": 2.0606799125671387, "Pretrain/Loss (Raw)": 1.8887262344360352, "Pretrain/Step": 4176, "Pretrain/Step Time": 8.436334097757936} +{"Pretrain/Learning Rate": 3.1171350877444365e-05, "Pretrain/Loss": 2.060903787612915, "Pretrain/Loss (Raw)": 2.0979807376861572, "Pretrain/Step": 4177, "Pretrain/Step Time": 8.430116266012192} +{"Pretrain/Learning Rate": 3.116312338748623e-05, "Pretrain/Loss": 2.061077356338501, "Pretrain/Loss (Raw)": 2.0889639854431152, "Pretrain/Step": 4178, "Pretrain/Step Time": 8.428815942257643} +{"Pretrain/Learning Rate": 3.115489518676765e-05, "Pretrain/Loss": 2.061835527420044, "Pretrain/Loss (Raw)": 2.1375274658203125, "Pretrain/Step": 4179, "Pretrain/Step Time": 8.426489047706127} +{"Pretrain/Learning Rate": 3.1146666276237554e-05, "Pretrain/Loss": 2.0622458457946777, "Pretrain/Loss (Raw)": 2.0221776962280273, "Pretrain/Step": 4180, "Pretrain/Step Time": 8.424219068139791} +{"Pretrain/Learning Rate": 3.113843665684495e-05, "Pretrain/Loss": 2.060476541519165, "Pretrain/Loss (Raw)": 2.01682710647583, "Pretrain/Step": 4181, "Pretrain/Step Time": 8.42257221788168} +{"Pretrain/Learning Rate": 3.1130206329538905e-05, "Pretrain/Loss": 2.0588889122009277, "Pretrain/Loss (Raw)": 1.8101646900177002, "Pretrain/Step": 4182, "Pretrain/Step Time": 8.419807625934482} +{"Pretrain/Learning Rate": 3.112197529526857e-05, "Pretrain/Loss": 2.0570478439331055, "Pretrain/Loss (Raw)": 2.002384901046753, "Pretrain/Step": 4183, "Pretrain/Step Time": 8.416869398206472} +{"Pretrain/Learning Rate": 3.11137435549832e-05, "Pretrain/Loss": 2.056175947189331, "Pretrain/Loss (Raw)": 2.013561964035034, "Pretrain/Step": 4184, "Pretrain/Step Time": 8.418733596801758} +{"Pretrain/Learning Rate": 3.110551110963212e-05, "Pretrain/Loss": 2.0559070110321045, "Pretrain/Loss (Raw)": 2.135298252105713, "Pretrain/Step": 4185, "Pretrain/Step Time": 8.429689129814506} +{"Pretrain/Learning Rate": 3.109727796016472e-05, "Pretrain/Loss": 2.054187536239624, "Pretrain/Loss (Raw)": 1.9649734497070312, "Pretrain/Step": 4186, "Pretrain/Step Time": 8.427208015695214} +{"Pretrain/Learning Rate": 3.10890441075305e-05, "Pretrain/Loss": 2.0535218715667725, "Pretrain/Loss (Raw)": 2.1193559169769287, "Pretrain/Step": 4187, "Pretrain/Step Time": 8.426495473831892} +{"Pretrain/Learning Rate": 3.108080955267902e-05, "Pretrain/Loss": 2.051359176635742, "Pretrain/Loss (Raw)": 1.9027429819107056, "Pretrain/Step": 4188, "Pretrain/Step Time": 8.42604741640389} +{"Pretrain/Learning Rate": 3.107257429655993e-05, "Pretrain/Loss": 2.055886745452881, "Pretrain/Loss (Raw)": 2.6129918098449707, "Pretrain/Step": 4189, "Pretrain/Step Time": 8.424515906721354} +{"Pretrain/Learning Rate": 3.1064338340122953e-05, "Pretrain/Loss": 2.0541648864746094, "Pretrain/Loss (Raw)": 1.8369758129119873, "Pretrain/Step": 4190, "Pretrain/Step Time": 8.42541766539216} +{"Pretrain/Learning Rate": 3.105610168431791e-05, "Pretrain/Loss": 2.053431749343872, "Pretrain/Loss (Raw)": 2.1204802989959717, "Pretrain/Step": 4191, "Pretrain/Step Time": 8.433916686102748} +{"Pretrain/Learning Rate": 3.1047864330094675e-05, "Pretrain/Loss": 2.0539793968200684, "Pretrain/Loss (Raw)": 2.1358985900878906, "Pretrain/Step": 4192, "Pretrain/Step Time": 8.433856518939137} +{"Pretrain/Learning Rate": 3.1039626278403234e-05, "Pretrain/Loss": 2.0537827014923096, "Pretrain/Loss (Raw)": 1.9768739938735962, "Pretrain/Step": 4193, "Pretrain/Step Time": 8.434464480727911} +{"Pretrain/Learning Rate": 3.1031387530193626e-05, "Pretrain/Loss": 2.056119918823242, "Pretrain/Loss (Raw)": 2.2920730113983154, "Pretrain/Step": 4194, "Pretrain/Step Time": 8.423498267307878} +{"Pretrain/Learning Rate": 3.1023148086415984e-05, "Pretrain/Loss": 2.0587754249572754, "Pretrain/Loss (Raw)": 2.169609546661377, "Pretrain/Step": 4195, "Pretrain/Step Time": 8.426828207448125} +{"Pretrain/Learning Rate": 3.101490794802053e-05, "Pretrain/Loss": 2.0584335327148438, "Pretrain/Loss (Raw)": 2.196927309036255, "Pretrain/Step": 4196, "Pretrain/Step Time": 8.433612251654267} +{"Pretrain/Learning Rate": 3.100666711595754e-05, "Pretrain/Loss": 2.0570526123046875, "Pretrain/Loss (Raw)": 1.992585301399231, "Pretrain/Step": 4197, "Pretrain/Step Time": 8.432339115068316} +{"Pretrain/Learning Rate": 3.09984255911774e-05, "Pretrain/Loss": 2.05527925491333, "Pretrain/Loss (Raw)": 1.9456987380981445, "Pretrain/Step": 4198, "Pretrain/Step Time": 8.429586168378592} +{"Pretrain/Learning Rate": 3.099018337463056e-05, "Pretrain/Loss": 2.0562264919281006, "Pretrain/Loss (Raw)": 2.037968397140503, "Pretrain/Step": 4199, "Pretrain/Step Time": 8.426754320040345} +{"Pretrain/Learning Rate": 3.0981940467267547e-05, "Pretrain/Loss": 2.0551955699920654, "Pretrain/Loss (Raw)": 1.9727333784103394, "Pretrain/Step": 4200, "Pretrain/Step Time": 8.420697305351496} +{"Pretrain/Learning Rate": 3.097369687003896e-05, "Pretrain/Loss": 2.0576109886169434, "Pretrain/Loss (Raw)": 2.012688159942627, "Pretrain/Step": 4201, "Pretrain/Step Time": 8.422638634219766} +{"Pretrain/Learning Rate": 3.096545258389551e-05, "Pretrain/Loss": 2.0565783977508545, "Pretrain/Loss (Raw)": 1.992322564125061, "Pretrain/Step": 4202, "Pretrain/Step Time": 8.43530304543674} +{"Pretrain/Learning Rate": 3.0957207609787945e-05, "Pretrain/Loss": 2.0566930770874023, "Pretrain/Loss (Raw)": 2.1190567016601562, "Pretrain/Step": 4203, "Pretrain/Step Time": 8.432641061022878} +{"Pretrain/Learning Rate": 3.094896194866714e-05, "Pretrain/Loss": 2.054652452468872, "Pretrain/Loss (Raw)": 1.768593430519104, "Pretrain/Step": 4204, "Pretrain/Step Time": 8.432383000850677} +{"Pretrain/Learning Rate": 3.094071560148401e-05, "Pretrain/Loss": 2.055159091949463, "Pretrain/Loss (Raw)": 1.9377089738845825, "Pretrain/Step": 4205, "Pretrain/Step Time": 8.42512576840818} +{"Pretrain/Learning Rate": 3.093246856918956e-05, "Pretrain/Loss": 2.0564675331115723, "Pretrain/Loss (Raw)": 2.2886178493499756, "Pretrain/Step": 4206, "Pretrain/Step Time": 8.427284130826592} +{"Pretrain/Learning Rate": 3.092422085273488e-05, "Pretrain/Loss": 2.061924695968628, "Pretrain/Loss (Raw)": 2.145596742630005, "Pretrain/Step": 4207, "Pretrain/Step Time": 8.42139364592731} +{"Pretrain/Learning Rate": 3.091597245307114e-05, "Pretrain/Loss": 2.0630691051483154, "Pretrain/Loss (Raw)": 2.134894609451294, "Pretrain/Step": 4208, "Pretrain/Step Time": 8.42887200973928} +{"Pretrain/Learning Rate": 3.0907723371149575e-05, "Pretrain/Loss": 2.0651965141296387, "Pretrain/Loss (Raw)": 2.284898281097412, "Pretrain/Step": 4209, "Pretrain/Step Time": 8.429741216823459} +{"Pretrain/Learning Rate": 3.0899473607921513e-05, "Pretrain/Loss": 2.06606388092041, "Pretrain/Loss (Raw)": 2.0599005222320557, "Pretrain/Step": 4210, "Pretrain/Step Time": 8.427026038989425} +{"Pretrain/Learning Rate": 3.0891223164338354e-05, "Pretrain/Loss": 2.0696818828582764, "Pretrain/Loss (Raw)": 2.2464852333068848, "Pretrain/Step": 4211, "Pretrain/Step Time": 8.421024780720472} +{"Pretrain/Learning Rate": 3.0882972041351585e-05, "Pretrain/Loss": 2.0680291652679443, "Pretrain/Loss (Raw)": 1.8941786289215088, "Pretrain/Step": 4212, "Pretrain/Step Time": 8.42012090422213} +{"Pretrain/Learning Rate": 3.0874720239912744e-05, "Pretrain/Loss": 2.068455696105957, "Pretrain/Loss (Raw)": 2.1224732398986816, "Pretrain/Step": 4213, "Pretrain/Step Time": 8.427044974640012} +{"Pretrain/Learning Rate": 3.0866467760973495e-05, "Pretrain/Loss": 2.0681190490722656, "Pretrain/Loss (Raw)": 2.039080858230591, "Pretrain/Step": 4214, "Pretrain/Step Time": 8.425002789124846} +{"Pretrain/Learning Rate": 3.0858214605485545e-05, "Pretrain/Loss": 2.068308115005493, "Pretrain/Loss (Raw)": 2.1173958778381348, "Pretrain/Step": 4215, "Pretrain/Step Time": 8.426883865147829} +{"Pretrain/Learning Rate": 3.0849960774400667e-05, "Pretrain/Loss": 2.0709946155548096, "Pretrain/Loss (Raw)": 2.3527607917785645, "Pretrain/Step": 4216, "Pretrain/Step Time": 8.424175648018718} +{"Pretrain/Learning Rate": 3.0841706268670756e-05, "Pretrain/Loss": 2.0701677799224854, "Pretrain/Loss (Raw)": 1.9825506210327148, "Pretrain/Step": 4217, "Pretrain/Step Time": 8.419365825131536} +{"Pretrain/Learning Rate": 3.083345108924775e-05, "Pretrain/Loss": 2.070125102996826, "Pretrain/Loss (Raw)": 2.0498464107513428, "Pretrain/Step": 4218, "Pretrain/Step Time": 8.4237240254879} +{"Pretrain/Learning Rate": 3.082519523708368e-05, "Pretrain/Loss": 2.0703868865966797, "Pretrain/Loss (Raw)": 2.0737767219543457, "Pretrain/Step": 4219, "Pretrain/Step Time": 8.428341798484325} +{"Pretrain/Learning Rate": 3.081693871313064e-05, "Pretrain/Loss": 2.0672965049743652, "Pretrain/Loss (Raw)": 1.7580686807632446, "Pretrain/Step": 4220, "Pretrain/Step Time": 8.427236279472709} +{"Pretrain/Learning Rate": 3.080868151834082e-05, "Pretrain/Loss": 2.0688886642456055, "Pretrain/Loss (Raw)": 2.1614019870758057, "Pretrain/Step": 4221, "Pretrain/Step Time": 8.423104781657457} +{"Pretrain/Learning Rate": 3.080042365366648e-05, "Pretrain/Loss": 2.063354730606079, "Pretrain/Loss (Raw)": 1.383109450340271, "Pretrain/Step": 4222, "Pretrain/Step Time": 8.427046306431293} +{"Pretrain/Learning Rate": 3.079216512005994e-05, "Pretrain/Loss": 2.061464309692383, "Pretrain/Loss (Raw)": 1.7732337713241577, "Pretrain/Step": 4223, "Pretrain/Step Time": 8.422265255823731} +{"Pretrain/Learning Rate": 3.078390591847363e-05, "Pretrain/Loss": 2.058069944381714, "Pretrain/Loss (Raw)": 2.1153008937835693, "Pretrain/Step": 4224, "Pretrain/Step Time": 8.426426470279694} +{"Pretrain/Learning Rate": 3.077564604986004e-05, "Pretrain/Loss": 2.0585925579071045, "Pretrain/Loss (Raw)": 2.0452187061309814, "Pretrain/Step": 4225, "Pretrain/Step Time": 8.430161960422993} +{"Pretrain/Learning Rate": 3.076738551517173e-05, "Pretrain/Loss": 2.0596628189086914, "Pretrain/Loss (Raw)": 2.1090891361236572, "Pretrain/Step": 4226, "Pretrain/Step Time": 8.42367935180664} +{"Pretrain/Learning Rate": 3.0759124315361344e-05, "Pretrain/Loss": 2.060192823410034, "Pretrain/Loss (Raw)": 2.220053195953369, "Pretrain/Step": 4227, "Pretrain/Step Time": 8.433066492900252} +{"Pretrain/Learning Rate": 3.07508624513816e-05, "Pretrain/Loss": 2.0583114624023438, "Pretrain/Loss (Raw)": 1.9665136337280273, "Pretrain/Step": 4228, "Pretrain/Step Time": 8.430631371214986} +{"Pretrain/Learning Rate": 3.0742599924185306e-05, "Pretrain/Loss": 2.0562491416931152, "Pretrain/Loss (Raw)": 1.9838563203811646, "Pretrain/Step": 4229, "Pretrain/Step Time": 8.427669053897262} +{"Pretrain/Learning Rate": 3.073433673472533e-05, "Pretrain/Loss": 2.0570883750915527, "Pretrain/Loss (Raw)": 2.056732416152954, "Pretrain/Step": 4230, "Pretrain/Step Time": 8.431920381262898} +{"Pretrain/Learning Rate": 3.072607288395461e-05, "Pretrain/Loss": 2.056504964828491, "Pretrain/Loss (Raw)": 1.9552861452102661, "Pretrain/Step": 4231, "Pretrain/Step Time": 8.440221648663282} +{"Pretrain/Learning Rate": 3.071780837282619e-05, "Pretrain/Loss": 2.05517578125, "Pretrain/Loss (Raw)": 2.063001871109009, "Pretrain/Step": 4232, "Pretrain/Step Time": 8.439308224245906} +{"Pretrain/Learning Rate": 3.0709543202293164e-05, "Pretrain/Loss": 2.0554065704345703, "Pretrain/Loss (Raw)": 2.015960454940796, "Pretrain/Step": 4233, "Pretrain/Step Time": 8.43959578871727} +{"Pretrain/Learning Rate": 3.070127737330871e-05, "Pretrain/Loss": 2.0546891689300537, "Pretrain/Loss (Raw)": 1.89743173122406, "Pretrain/Step": 4234, "Pretrain/Step Time": 8.435144674032927} +{"Pretrain/Learning Rate": 3.069301088682609e-05, "Pretrain/Loss": 2.055360794067383, "Pretrain/Loss (Raw)": 2.0610249042510986, "Pretrain/Step": 4235, "Pretrain/Step Time": 8.43712479621172} +{"Pretrain/Learning Rate": 3.068474374379863e-05, "Pretrain/Loss": 2.05454683303833, "Pretrain/Loss (Raw)": 2.0442869663238525, "Pretrain/Step": 4236, "Pretrain/Step Time": 8.441058855503798} +{"Pretrain/Learning Rate": 3.067647594517972e-05, "Pretrain/Loss": 2.0557355880737305, "Pretrain/Loss (Raw)": 2.2007803916931152, "Pretrain/Step": 4237, "Pretrain/Step Time": 8.443643271923065} +{"Pretrain/Learning Rate": 3.0668207491922866e-05, "Pretrain/Loss": 2.055148124694824, "Pretrain/Loss (Raw)": 2.059093952178955, "Pretrain/Step": 4238, "Pretrain/Step Time": 8.444688107818365} +{"Pretrain/Learning Rate": 3.0659938384981616e-05, "Pretrain/Loss": 2.056097984313965, "Pretrain/Loss (Raw)": 1.9516934156417847, "Pretrain/Step": 4239, "Pretrain/Step Time": 8.44332061521709} +{"Pretrain/Learning Rate": 3.0651668625309594e-05, "Pretrain/Loss": 2.058037519454956, "Pretrain/Loss (Raw)": 2.193740129470825, "Pretrain/Step": 4240, "Pretrain/Step Time": 8.434415915980935} +{"Pretrain/Learning Rate": 3.0643398213860525e-05, "Pretrain/Loss": 2.0582528114318848, "Pretrain/Loss (Raw)": 2.0095577239990234, "Pretrain/Step": 4241, "Pretrain/Step Time": 8.437452433630824} +{"Pretrain/Learning Rate": 3.0635127151588175e-05, "Pretrain/Loss": 2.060378313064575, "Pretrain/Loss (Raw)": 2.1012074947357178, "Pretrain/Step": 4242, "Pretrain/Step Time": 8.447148213163018} +{"Pretrain/Learning Rate": 3.0626855439446405e-05, "Pretrain/Loss": 2.059412956237793, "Pretrain/Loss (Raw)": 1.9854387044906616, "Pretrain/Step": 4243, "Pretrain/Step Time": 8.446001531556249} +{"Pretrain/Learning Rate": 3.061858307838915e-05, "Pretrain/Loss": 2.060608386993408, "Pretrain/Loss (Raw)": 2.119429349899292, "Pretrain/Step": 4244, "Pretrain/Step Time": 8.440688915550709} +{"Pretrain/Learning Rate": 3.061031006937043e-05, "Pretrain/Loss": 2.0599522590637207, "Pretrain/Loss (Raw)": 2.005533456802368, "Pretrain/Step": 4245, "Pretrain/Step Time": 8.43152965977788} +{"Pretrain/Learning Rate": 3.060203641334431e-05, "Pretrain/Loss": 2.0592520236968994, "Pretrain/Loss (Raw)": 2.101732015609741, "Pretrain/Step": 4246, "Pretrain/Step Time": 8.43345382064581} +{"Pretrain/Learning Rate": 3.059376211126495e-05, "Pretrain/Loss": 2.0585408210754395, "Pretrain/Loss (Raw)": 1.9682902097702026, "Pretrain/Step": 4247, "Pretrain/Step Time": 8.444292183965445} +{"Pretrain/Learning Rate": 3.058548716408658e-05, "Pretrain/Loss": 2.057058095932007, "Pretrain/Loss (Raw)": 2.0736894607543945, "Pretrain/Step": 4248, "Pretrain/Step Time": 8.445796120911837} +{"Pretrain/Learning Rate": 3.057721157276352e-05, "Pretrain/Loss": 2.0556840896606445, "Pretrain/Loss (Raw)": 1.7608741521835327, "Pretrain/Step": 4249, "Pretrain/Step Time": 8.449378449469805} +{"Pretrain/Learning Rate": 3.056893533825014e-05, "Pretrain/Loss": 2.056035041809082, "Pretrain/Loss (Raw)": 2.0184884071350098, "Pretrain/Step": 4250, "Pretrain/Step Time": 8.446582401171327} +{"Pretrain/Learning Rate": 3.056065846150089e-05, "Pretrain/Loss": 2.0556488037109375, "Pretrain/Loss (Raw)": 2.1393492221832275, "Pretrain/Step": 4251, "Pretrain/Step Time": 8.441135993227363} +{"Pretrain/Learning Rate": 3.0552380943470306e-05, "Pretrain/Loss": 2.050830841064453, "Pretrain/Loss (Raw)": 1.9535640478134155, "Pretrain/Step": 4252, "Pretrain/Step Time": 8.442577885463834} +{"Pretrain/Learning Rate": 3.054410278511299e-05, "Pretrain/Loss": 2.0515213012695312, "Pretrain/Loss (Raw)": 2.0670270919799805, "Pretrain/Step": 4253, "Pretrain/Step Time": 8.448279365897179} +{"Pretrain/Learning Rate": 3.053582398738362e-05, "Pretrain/Loss": 2.0531890392303467, "Pretrain/Loss (Raw)": 2.0826544761657715, "Pretrain/Step": 4254, "Pretrain/Step Time": 8.450830720365047} +{"Pretrain/Learning Rate": 3.052754455123693e-05, "Pretrain/Loss": 2.0542967319488525, "Pretrain/Loss (Raw)": 1.9484423398971558, "Pretrain/Step": 4255, "Pretrain/Step Time": 8.45155979692936} +{"Pretrain/Learning Rate": 3.051926447762776e-05, "Pretrain/Loss": 2.0549440383911133, "Pretrain/Loss (Raw)": 1.96177339553833, "Pretrain/Step": 4256, "Pretrain/Step Time": 8.447556458413601} +{"Pretrain/Learning Rate": 3.0510983767511007e-05, "Pretrain/Loss": 2.057926654815674, "Pretrain/Loss (Raw)": 2.14664888381958, "Pretrain/Step": 4257, "Pretrain/Step Time": 8.436446614563465} +{"Pretrain/Learning Rate": 3.050270242184164e-05, "Pretrain/Loss": 2.057206630706787, "Pretrain/Loss (Raw)": 2.1330227851867676, "Pretrain/Step": 4258, "Pretrain/Step Time": 8.444944843649864} +{"Pretrain/Learning Rate": 3.049442044157469e-05, "Pretrain/Loss": 2.0578904151916504, "Pretrain/Loss (Raw)": 2.109644889831543, "Pretrain/Step": 4259, "Pretrain/Step Time": 8.44876467809081} +{"Pretrain/Learning Rate": 3.0486137827665296e-05, "Pretrain/Loss": 2.0568370819091797, "Pretrain/Loss (Raw)": 2.128607988357544, "Pretrain/Step": 4260, "Pretrain/Step Time": 8.450556237250566} +{"Pretrain/Learning Rate": 3.0477854581068626e-05, "Pretrain/Loss": 2.05806040763855, "Pretrain/Loss (Raw)": 2.1228885650634766, "Pretrain/Step": 4261, "Pretrain/Step Time": 8.448998203501105} +{"Pretrain/Learning Rate": 3.0469570702739958e-05, "Pretrain/Loss": 2.0590028762817383, "Pretrain/Loss (Raw)": 2.2079079151153564, "Pretrain/Step": 4262, "Pretrain/Step Time": 8.443007685244083} +{"Pretrain/Learning Rate": 3.0461286193634626e-05, "Pretrain/Loss": 2.058558464050293, "Pretrain/Loss (Raw)": 1.9727356433868408, "Pretrain/Step": 4263, "Pretrain/Step Time": 8.441022286191583} +{"Pretrain/Learning Rate": 3.045300105470803e-05, "Pretrain/Loss": 2.0568525791168213, "Pretrain/Loss (Raw)": 2.2448081970214844, "Pretrain/Step": 4264, "Pretrain/Step Time": 8.444528970867395} +{"Pretrain/Learning Rate": 3.0444715286915658e-05, "Pretrain/Loss": 2.0559158325195312, "Pretrain/Loss (Raw)": 1.929495096206665, "Pretrain/Step": 4265, "Pretrain/Step Time": 8.446853537112474} +{"Pretrain/Learning Rate": 3.0436428891213063e-05, "Pretrain/Loss": 2.057403087615967, "Pretrain/Loss (Raw)": 2.2206010818481445, "Pretrain/Step": 4266, "Pretrain/Step Time": 8.445323955267668} +{"Pretrain/Learning Rate": 3.0428141868555875e-05, "Pretrain/Loss": 2.0564727783203125, "Pretrain/Loss (Raw)": 1.9241411685943604, "Pretrain/Step": 4267, "Pretrain/Step Time": 8.445276664569974} +{"Pretrain/Learning Rate": 3.0419854219899786e-05, "Pretrain/Loss": 2.0587096214294434, "Pretrain/Loss (Raw)": 2.1114649772644043, "Pretrain/Step": 4268, "Pretrain/Step Time": 8.441881451755762} +{"Pretrain/Learning Rate": 3.041156594620057e-05, "Pretrain/Loss": 2.0583953857421875, "Pretrain/Loss (Raw)": 2.0913732051849365, "Pretrain/Step": 4269, "Pretrain/Step Time": 8.445677338168025} +{"Pretrain/Learning Rate": 3.0403277048414063e-05, "Pretrain/Loss": 2.0588181018829346, "Pretrain/Loss (Raw)": 2.0615432262420654, "Pretrain/Step": 4270, "Pretrain/Step Time": 8.446410574018955} +{"Pretrain/Learning Rate": 3.0394987527496192e-05, "Pretrain/Loss": 2.058256149291992, "Pretrain/Loss (Raw)": 1.9848484992980957, "Pretrain/Step": 4271, "Pretrain/Step Time": 8.442595517262816} +{"Pretrain/Learning Rate": 3.0386697384402935e-05, "Pretrain/Loss": 2.0582351684570312, "Pretrain/Loss (Raw)": 2.1397500038146973, "Pretrain/Step": 4272, "Pretrain/Step Time": 8.441821252927184} +{"Pretrain/Learning Rate": 3.0378406620090354e-05, "Pretrain/Loss": 2.0582284927368164, "Pretrain/Loss (Raw)": 2.1212680339813232, "Pretrain/Step": 4273, "Pretrain/Step Time": 8.438687345013022} +{"Pretrain/Learning Rate": 3.0370115235514574e-05, "Pretrain/Loss": 2.0561137199401855, "Pretrain/Loss (Raw)": 1.8334217071533203, "Pretrain/Step": 4274, "Pretrain/Step Time": 8.430590452626348} +{"Pretrain/Learning Rate": 3.036182323163181e-05, "Pretrain/Loss": 2.055673122406006, "Pretrain/Loss (Raw)": 1.9324549436569214, "Pretrain/Step": 4275, "Pretrain/Step Time": 8.429910570383072} +{"Pretrain/Learning Rate": 3.0353530609398313e-05, "Pretrain/Loss": 2.057492256164551, "Pretrain/Loss (Raw)": 2.1858482360839844, "Pretrain/Step": 4276, "Pretrain/Step Time": 8.430992843583226} +{"Pretrain/Learning Rate": 3.0345237369770448e-05, "Pretrain/Loss": 2.0550217628479004, "Pretrain/Loss (Raw)": 1.957315444946289, "Pretrain/Step": 4277, "Pretrain/Step Time": 8.431122373789549} +{"Pretrain/Learning Rate": 3.0336943513704613e-05, "Pretrain/Loss": 2.0563762187957764, "Pretrain/Loss (Raw)": 2.207617998123169, "Pretrain/Step": 4278, "Pretrain/Step Time": 8.430655116215348} +{"Pretrain/Learning Rate": 3.0328649042157315e-05, "Pretrain/Loss": 2.0563464164733887, "Pretrain/Loss (Raw)": 1.9892600774765015, "Pretrain/Step": 4279, "Pretrain/Step Time": 8.431900257244706} +{"Pretrain/Learning Rate": 3.0320353956085095e-05, "Pretrain/Loss": 2.0550127029418945, "Pretrain/Loss (Raw)": 1.9356470108032227, "Pretrain/Step": 4280, "Pretrain/Step Time": 8.421485686674714} +{"Pretrain/Learning Rate": 3.0312058256444587e-05, "Pretrain/Loss": 2.0558080673217773, "Pretrain/Loss (Raw)": 2.021019458770752, "Pretrain/Step": 4281, "Pretrain/Step Time": 8.422987485304475} +{"Pretrain/Learning Rate": 3.0303761944192488e-05, "Pretrain/Loss": 2.0551235675811768, "Pretrain/Loss (Raw)": 1.934597373008728, "Pretrain/Step": 4282, "Pretrain/Step Time": 8.430822158232331} +{"Pretrain/Learning Rate": 3.0295465020285567e-05, "Pretrain/Loss": 2.0588603019714355, "Pretrain/Loss (Raw)": 2.380934476852417, "Pretrain/Step": 4283, "Pretrain/Step Time": 8.429223157465458} +{"Pretrain/Learning Rate": 3.0287167485680672e-05, "Pretrain/Loss": 2.0565149784088135, "Pretrain/Loss (Raw)": 2.067131996154785, "Pretrain/Step": 4284, "Pretrain/Step Time": 8.43108100257814} +{"Pretrain/Learning Rate": 3.0278869341334702e-05, "Pretrain/Loss": 2.0550904273986816, "Pretrain/Loss (Raw)": 1.9277489185333252, "Pretrain/Step": 4285, "Pretrain/Step Time": 8.428100746124983} +{"Pretrain/Learning Rate": 3.0270570588204655e-05, "Pretrain/Loss": 2.055654525756836, "Pretrain/Loss (Raw)": 2.1196436882019043, "Pretrain/Step": 4286, "Pretrain/Step Time": 8.424222899600863} +{"Pretrain/Learning Rate": 3.0262271227247563e-05, "Pretrain/Loss": 2.0529565811157227, "Pretrain/Loss (Raw)": 1.8134359121322632, "Pretrain/Step": 4287, "Pretrain/Step Time": 8.429515643045306} +{"Pretrain/Learning Rate": 3.025397125942056e-05, "Pretrain/Loss": 2.0495924949645996, "Pretrain/Loss (Raw)": 1.7050985097885132, "Pretrain/Step": 4288, "Pretrain/Step Time": 8.431839838624} +{"Pretrain/Learning Rate": 3.0245670685680833e-05, "Pretrain/Loss": 2.05020809173584, "Pretrain/Loss (Raw)": 2.1118927001953125, "Pretrain/Step": 4289, "Pretrain/Step Time": 8.429376691579819} +{"Pretrain/Learning Rate": 3.0237369506985646e-05, "Pretrain/Loss": 2.04830265045166, "Pretrain/Loss (Raw)": 1.8550937175750732, "Pretrain/Step": 4290, "Pretrain/Step Time": 8.425486620515585} +{"Pretrain/Learning Rate": 3.022906772429232e-05, "Pretrain/Loss": 2.045191764831543, "Pretrain/Loss (Raw)": 2.0194573402404785, "Pretrain/Step": 4291, "Pretrain/Step Time": 8.420238554477692} +{"Pretrain/Learning Rate": 3.0220765338558278e-05, "Pretrain/Loss": 2.0423007011413574, "Pretrain/Loss (Raw)": 2.023423910140991, "Pretrain/Step": 4292, "Pretrain/Step Time": 8.426352933049202} +{"Pretrain/Learning Rate": 3.021246235074096e-05, "Pretrain/Loss": 2.0411009788513184, "Pretrain/Loss (Raw)": 1.9586679935455322, "Pretrain/Step": 4293, "Pretrain/Step Time": 8.43186648376286} +{"Pretrain/Learning Rate": 3.0204158761797936e-05, "Pretrain/Loss": 2.0399463176727295, "Pretrain/Loss (Raw)": 1.9661190509796143, "Pretrain/Step": 4294, "Pretrain/Step Time": 8.42699364386499} +{"Pretrain/Learning Rate": 3.0195854572686793e-05, "Pretrain/Loss": 2.0402560234069824, "Pretrain/Loss (Raw)": 2.026008367538452, "Pretrain/Step": 4295, "Pretrain/Step Time": 8.428477296605706} +{"Pretrain/Learning Rate": 3.0187549784365214e-05, "Pretrain/Loss": 2.0371007919311523, "Pretrain/Loss (Raw)": 1.5691683292388916, "Pretrain/Step": 4296, "Pretrain/Step Time": 8.421849142760038} +{"Pretrain/Learning Rate": 3.0179244397790956e-05, "Pretrain/Loss": 2.0367980003356934, "Pretrain/Loss (Raw)": 2.072747230529785, "Pretrain/Step": 4297, "Pretrain/Step Time": 8.424266645684838} +{"Pretrain/Learning Rate": 3.017093841392183e-05, "Pretrain/Loss": 2.036398410797119, "Pretrain/Loss (Raw)": 1.8433454036712646, "Pretrain/Step": 4298, "Pretrain/Step Time": 8.428725549951196} +{"Pretrain/Learning Rate": 3.0162631833715715e-05, "Pretrain/Loss": 2.038379669189453, "Pretrain/Loss (Raw)": 2.2013275623321533, "Pretrain/Step": 4299, "Pretrain/Step Time": 8.427653620019555} +{"Pretrain/Learning Rate": 3.0154324658130572e-05, "Pretrain/Loss": 2.0380139350891113, "Pretrain/Loss (Raw)": 2.1208086013793945, "Pretrain/Step": 4300, "Pretrain/Step Time": 8.429049843922257} +{"Pretrain/Learning Rate": 3.0146016888124423e-05, "Pretrain/Loss": 2.0382323265075684, "Pretrain/Loss (Raw)": 2.0217337608337402, "Pretrain/Step": 4301, "Pretrain/Step Time": 8.4203280787915} +{"Pretrain/Learning Rate": 3.013770852465535e-05, "Pretrain/Loss": 2.041250228881836, "Pretrain/Loss (Raw)": 2.2927358150482178, "Pretrain/Step": 4302, "Pretrain/Step Time": 8.425015058368444} +{"Pretrain/Learning Rate": 3.0129399568681533e-05, "Pretrain/Loss": 2.0403552055358887, "Pretrain/Loss (Raw)": 1.9947441816329956, "Pretrain/Step": 4303, "Pretrain/Step Time": 8.427955653518438} +{"Pretrain/Learning Rate": 3.0121090021161175e-05, "Pretrain/Loss": 2.0425567626953125, "Pretrain/Loss (Raw)": 2.170530319213867, "Pretrain/Step": 4304, "Pretrain/Step Time": 8.436326932162046} +{"Pretrain/Learning Rate": 3.0112779883052593e-05, "Pretrain/Loss": 2.041922092437744, "Pretrain/Loss (Raw)": 2.0167579650878906, "Pretrain/Step": 4305, "Pretrain/Step Time": 8.439493468031287} +{"Pretrain/Learning Rate": 3.010446915531414e-05, "Pretrain/Loss": 2.044254779815674, "Pretrain/Loss (Raw)": 2.387539863586426, "Pretrain/Step": 4306, "Pretrain/Step Time": 8.435373570770025} +{"Pretrain/Learning Rate": 3.0096157838904247e-05, "Pretrain/Loss": 2.0421743392944336, "Pretrain/Loss (Raw)": 1.8712513446807861, "Pretrain/Step": 4307, "Pretrain/Step Time": 8.435855764895678} +{"Pretrain/Learning Rate": 3.0087845934781424e-05, "Pretrain/Loss": 2.044283866882324, "Pretrain/Loss (Raw)": 2.292192220687866, "Pretrain/Step": 4308, "Pretrain/Step Time": 8.435935229063034} +{"Pretrain/Learning Rate": 3.0079533443904227e-05, "Pretrain/Loss": 2.0457868576049805, "Pretrain/Loss (Raw)": 2.2092127799987793, "Pretrain/Step": 4309, "Pretrain/Step Time": 8.436722345650196} +{"Pretrain/Learning Rate": 3.0071220367231306e-05, "Pretrain/Loss": 2.0478341579437256, "Pretrain/Loss (Raw)": 2.0721967220306396, "Pretrain/Step": 4310, "Pretrain/Step Time": 8.442215036600828} +{"Pretrain/Learning Rate": 3.006290670572135e-05, "Pretrain/Loss": 2.0488827228546143, "Pretrain/Loss (Raw)": 2.1365859508514404, "Pretrain/Step": 4311, "Pretrain/Step Time": 8.44076907262206} +{"Pretrain/Learning Rate": 3.0054592460333137e-05, "Pretrain/Loss": 2.049924373626709, "Pretrain/Loss (Raw)": 2.1469147205352783, "Pretrain/Step": 4312, "Pretrain/Step Time": 8.434984311461449} +{"Pretrain/Learning Rate": 3.00462776320255e-05, "Pretrain/Loss": 2.050306797027588, "Pretrain/Loss (Raw)": 2.1842615604400635, "Pretrain/Step": 4313, "Pretrain/Step Time": 8.420542292296886} +{"Pretrain/Learning Rate": 3.0037962221757354e-05, "Pretrain/Loss": 2.0527281761169434, "Pretrain/Loss (Raw)": 2.2748734951019287, "Pretrain/Step": 4314, "Pretrain/Step Time": 8.423330944031477} +{"Pretrain/Learning Rate": 3.0029646230487657e-05, "Pretrain/Loss": 2.053542137145996, "Pretrain/Loss (Raw)": 2.223562240600586, "Pretrain/Step": 4315, "Pretrain/Step Time": 8.4316351916641} +{"Pretrain/Learning Rate": 3.002132965917547e-05, "Pretrain/Loss": 2.0538153648376465, "Pretrain/Loss (Raw)": 1.9377083778381348, "Pretrain/Step": 4316, "Pretrain/Step Time": 8.433417597785592} +{"Pretrain/Learning Rate": 3.001301250877987e-05, "Pretrain/Loss": 2.050272226333618, "Pretrain/Loss (Raw)": 2.159484624862671, "Pretrain/Step": 4317, "Pretrain/Step Time": 8.428523050621152} +{"Pretrain/Learning Rate": 3.000469478026005e-05, "Pretrain/Loss": 2.0511345863342285, "Pretrain/Loss (Raw)": 1.9473484754562378, "Pretrain/Step": 4318, "Pretrain/Step Time": 8.428213778883219} +{"Pretrain/Learning Rate": 2.9996376474575244e-05, "Pretrain/Loss": 2.0503151416778564, "Pretrain/Loss (Raw)": 2.015577793121338, "Pretrain/Step": 4319, "Pretrain/Step Time": 8.423695147037506} +{"Pretrain/Learning Rate": 2.9988057592684766e-05, "Pretrain/Loss": 2.051093101501465, "Pretrain/Loss (Raw)": 2.2354917526245117, "Pretrain/Step": 4320, "Pretrain/Step Time": 8.425061510875821} +{"Pretrain/Learning Rate": 2.9979738135547973e-05, "Pretrain/Loss": 2.0515871047973633, "Pretrain/Loss (Raw)": 2.040090799331665, "Pretrain/Step": 4321, "Pretrain/Step Time": 8.427757577970624} +{"Pretrain/Learning Rate": 2.9971418104124322e-05, "Pretrain/Loss": 2.050593137741089, "Pretrain/Loss (Raw)": 2.1648480892181396, "Pretrain/Step": 4322, "Pretrain/Step Time": 8.44297501258552} +{"Pretrain/Learning Rate": 2.9963097499373312e-05, "Pretrain/Loss": 2.0481491088867188, "Pretrain/Loss (Raw)": 1.8568174839019775, "Pretrain/Step": 4323, "Pretrain/Step Time": 8.44049715809524} +{"Pretrain/Learning Rate": 2.9954776322254495e-05, "Pretrain/Loss": 2.0478758811950684, "Pretrain/Loss (Raw)": 2.1619479656219482, "Pretrain/Step": 4324, "Pretrain/Step Time": 8.43462035804987} +{"Pretrain/Learning Rate": 2.994645457372754e-05, "Pretrain/Loss": 2.0447423458099365, "Pretrain/Loss (Raw)": 1.591483473777771, "Pretrain/Step": 4325, "Pretrain/Step Time": 8.435829827561975} +{"Pretrain/Learning Rate": 2.9938132254752126e-05, "Pretrain/Loss": 2.0445809364318848, "Pretrain/Loss (Raw)": 1.925039291381836, "Pretrain/Step": 4326, "Pretrain/Step Time": 8.436893379315734} +{"Pretrain/Learning Rate": 2.9929809366288035e-05, "Pretrain/Loss": 2.049034833908081, "Pretrain/Loss (Raw)": 2.608035087585449, "Pretrain/Step": 4327, "Pretrain/Step Time": 8.447975693270564} +{"Pretrain/Learning Rate": 2.99214859092951e-05, "Pretrain/Loss": 2.0532805919647217, "Pretrain/Loss (Raw)": 2.516211986541748, "Pretrain/Step": 4328, "Pretrain/Step Time": 8.448205173015594} +{"Pretrain/Learning Rate": 2.9913161884733215e-05, "Pretrain/Loss": 2.0514657497406006, "Pretrain/Loss (Raw)": 1.7803916931152344, "Pretrain/Step": 4329, "Pretrain/Step Time": 8.441734144464135} +{"Pretrain/Learning Rate": 2.9904837293562348e-05, "Pretrain/Loss": 2.0516204833984375, "Pretrain/Loss (Raw)": 2.012120008468628, "Pretrain/Step": 4330, "Pretrain/Step Time": 8.43099637515843} +{"Pretrain/Learning Rate": 2.989651213674254e-05, "Pretrain/Loss": 2.049891471862793, "Pretrain/Loss (Raw)": 1.8977704048156738, "Pretrain/Step": 4331, "Pretrain/Step Time": 8.43473868444562} +{"Pretrain/Learning Rate": 2.988818641523387e-05, "Pretrain/Loss": 2.0535712242126465, "Pretrain/Loss (Raw)": 2.2395875453948975, "Pretrain/Step": 4332, "Pretrain/Step Time": 8.429505664855242} +{"Pretrain/Learning Rate": 2.9879860129996517e-05, "Pretrain/Loss": 2.0541439056396484, "Pretrain/Loss (Raw)": 2.0110111236572266, "Pretrain/Step": 4333, "Pretrain/Step Time": 8.440771758556366} +{"Pretrain/Learning Rate": 2.9871533281990692e-05, "Pretrain/Loss": 2.051112413406372, "Pretrain/Loss (Raw)": 1.9005886316299438, "Pretrain/Step": 4334, "Pretrain/Step Time": 8.438560757786036} +{"Pretrain/Learning Rate": 2.9863205872176703e-05, "Pretrain/Loss": 2.050966501235962, "Pretrain/Loss (Raw)": 2.1269164085388184, "Pretrain/Step": 4335, "Pretrain/Step Time": 8.437128843739629} +{"Pretrain/Learning Rate": 2.9854877901514884e-05, "Pretrain/Loss": 2.050070285797119, "Pretrain/Loss (Raw)": 2.0201449394226074, "Pretrain/Step": 4336, "Pretrain/Step Time": 8.42738776654005} +{"Pretrain/Learning Rate": 2.9846549370965672e-05, "Pretrain/Loss": 2.047464609146118, "Pretrain/Loss (Raw)": 1.951405644416809, "Pretrain/Step": 4337, "Pretrain/Step Time": 8.429533377289772} +{"Pretrain/Learning Rate": 2.9838220281489553e-05, "Pretrain/Loss": 2.047168254852295, "Pretrain/Loss (Raw)": 2.021977663040161, "Pretrain/Step": 4338, "Pretrain/Step Time": 8.437229659408331} +{"Pretrain/Learning Rate": 2.9829890634047068e-05, "Pretrain/Loss": 2.0448880195617676, "Pretrain/Loss (Raw)": 1.9545739889144897, "Pretrain/Step": 4339, "Pretrain/Step Time": 8.445007715374231} +{"Pretrain/Learning Rate": 2.9821560429598844e-05, "Pretrain/Loss": 2.046952724456787, "Pretrain/Loss (Raw)": 2.1584885120391846, "Pretrain/Step": 4340, "Pretrain/Step Time": 8.44942469894886} +{"Pretrain/Learning Rate": 2.9813229669105546e-05, "Pretrain/Loss": 2.0463507175445557, "Pretrain/Loss (Raw)": 2.0454282760620117, "Pretrain/Step": 4341, "Pretrain/Step Time": 8.442276613786817} +{"Pretrain/Learning Rate": 2.9804898353527928e-05, "Pretrain/Loss": 2.0463743209838867, "Pretrain/Loss (Raw)": 2.042076826095581, "Pretrain/Step": 4342, "Pretrain/Step Time": 8.444212587550282} +{"Pretrain/Learning Rate": 2.9796566483826777e-05, "Pretrain/Loss": 2.045071601867676, "Pretrain/Loss (Raw)": 1.9506371021270752, "Pretrain/Step": 4343, "Pretrain/Step Time": 8.444762650877237} +{"Pretrain/Learning Rate": 2.9788234060962988e-05, "Pretrain/Loss": 2.0416154861450195, "Pretrain/Loss (Raw)": 1.9104235172271729, "Pretrain/Step": 4344, "Pretrain/Step Time": 8.447216786444187} +{"Pretrain/Learning Rate": 2.9779901085897478e-05, "Pretrain/Loss": 2.0405163764953613, "Pretrain/Loss (Raw)": 1.8418521881103516, "Pretrain/Step": 4345, "Pretrain/Step Time": 8.448358960449696} +{"Pretrain/Learning Rate": 2.9771567559591257e-05, "Pretrain/Loss": 2.0387728214263916, "Pretrain/Loss (Raw)": 1.8266675472259521, "Pretrain/Step": 4346, "Pretrain/Step Time": 8.445747992023826} +{"Pretrain/Learning Rate": 2.9763233483005383e-05, "Pretrain/Loss": 2.038468599319458, "Pretrain/Loss (Raw)": 2.0348284244537354, "Pretrain/Step": 4347, "Pretrain/Step Time": 8.445585729554296} +{"Pretrain/Learning Rate": 2.975489885710097e-05, "Pretrain/Loss": 2.0401530265808105, "Pretrain/Loss (Raw)": 1.9736831188201904, "Pretrain/Step": 4348, "Pretrain/Step Time": 8.443955766037107} +{"Pretrain/Learning Rate": 2.9746563682839225e-05, "Pretrain/Loss": 2.039290428161621, "Pretrain/Loss (Raw)": 2.0510058403015137, "Pretrain/Step": 4349, "Pretrain/Step Time": 8.448644161224365} +{"Pretrain/Learning Rate": 2.9738227961181374e-05, "Pretrain/Loss": 2.0463016033172607, "Pretrain/Loss (Raw)": 2.2805073261260986, "Pretrain/Step": 4350, "Pretrain/Step Time": 8.444338098168373} +{"Pretrain/Learning Rate": 2.972989169308876e-05, "Pretrain/Loss": 2.0497069358825684, "Pretrain/Loss (Raw)": 2.2091164588928223, "Pretrain/Step": 4351, "Pretrain/Step Time": 8.444063737988472} +{"Pretrain/Learning Rate": 2.9721554879522743e-05, "Pretrain/Loss": 2.048980236053467, "Pretrain/Loss (Raw)": 2.022268533706665, "Pretrain/Step": 4352, "Pretrain/Step Time": 8.4455607496202} +{"Pretrain/Learning Rate": 2.9713217521444774e-05, "Pretrain/Loss": 2.050042152404785, "Pretrain/Loss (Raw)": 2.1811776161193848, "Pretrain/Step": 4353, "Pretrain/Step Time": 8.439297029748559} +{"Pretrain/Learning Rate": 2.9704879619816346e-05, "Pretrain/Loss": 2.0484652519226074, "Pretrain/Loss (Raw)": 1.9072375297546387, "Pretrain/Step": 4354, "Pretrain/Step Time": 8.444446537643671} +{"Pretrain/Learning Rate": 2.969654117559903e-05, "Pretrain/Loss": 2.048966646194458, "Pretrain/Loss (Raw)": 2.284207582473755, "Pretrain/Step": 4355, "Pretrain/Step Time": 8.437546759843826} +{"Pretrain/Learning Rate": 2.9688202189754456e-05, "Pretrain/Loss": 2.0496857166290283, "Pretrain/Loss (Raw)": 2.05856990814209, "Pretrain/Step": 4356, "Pretrain/Step Time": 8.437223894521594} +{"Pretrain/Learning Rate": 2.9679862663244317e-05, "Pretrain/Loss": 2.048238754272461, "Pretrain/Loss (Raw)": 1.798643946647644, "Pretrain/Step": 4357, "Pretrain/Step Time": 8.43929767422378} +{"Pretrain/Learning Rate": 2.9671522597030355e-05, "Pretrain/Loss": 2.0494070053100586, "Pretrain/Loss (Raw)": 2.206300735473633, "Pretrain/Step": 4358, "Pretrain/Step Time": 8.433782380074263} +{"Pretrain/Learning Rate": 2.9663181992074402e-05, "Pretrain/Loss": 2.0482287406921387, "Pretrain/Loss (Raw)": 1.8044177293777466, "Pretrain/Step": 4359, "Pretrain/Step Time": 8.42761011235416} +{"Pretrain/Learning Rate": 2.9654840849338322e-05, "Pretrain/Loss": 2.047360897064209, "Pretrain/Loss (Raw)": 1.9519236087799072, "Pretrain/Step": 4360, "Pretrain/Step Time": 8.433221289888024} +{"Pretrain/Learning Rate": 2.964649916978407e-05, "Pretrain/Loss": 2.0474183559417725, "Pretrain/Loss (Raw)": 2.023322820663452, "Pretrain/Step": 4361, "Pretrain/Step Time": 8.438421059399843} +{"Pretrain/Learning Rate": 2.963815695437363e-05, "Pretrain/Loss": 2.0489447116851807, "Pretrain/Loss (Raw)": 2.092820167541504, "Pretrain/Step": 4362, "Pretrain/Step Time": 8.438775608316064} +{"Pretrain/Learning Rate": 2.962981420406908e-05, "Pretrain/Loss": 2.049899101257324, "Pretrain/Loss (Raw)": 2.183182716369629, "Pretrain/Step": 4363, "Pretrain/Step Time": 8.435001226142049} +{"Pretrain/Learning Rate": 2.9621470919832538e-05, "Pretrain/Loss": 2.0504486560821533, "Pretrain/Loss (Raw)": 2.1146295070648193, "Pretrain/Step": 4364, "Pretrain/Step Time": 8.429474018514156} +{"Pretrain/Learning Rate": 2.9613127102626187e-05, "Pretrain/Loss": 2.048231601715088, "Pretrain/Loss (Raw)": 1.9170050621032715, "Pretrain/Step": 4365, "Pretrain/Step Time": 8.425268543884158} +{"Pretrain/Learning Rate": 2.9604782753412292e-05, "Pretrain/Loss": 2.0481204986572266, "Pretrain/Loss (Raw)": 2.0448389053344727, "Pretrain/Step": 4366, "Pretrain/Step Time": 8.426514076068997} +{"Pretrain/Learning Rate": 2.9596437873153137e-05, "Pretrain/Loss": 2.0484166145324707, "Pretrain/Loss (Raw)": 1.9895989894866943, "Pretrain/Step": 4367, "Pretrain/Step Time": 8.431119689717889} +{"Pretrain/Learning Rate": 2.9588092462811122e-05, "Pretrain/Loss": 2.0472488403320312, "Pretrain/Loss (Raw)": 2.0442819595336914, "Pretrain/Step": 4368, "Pretrain/Step Time": 8.435874773189425} +{"Pretrain/Learning Rate": 2.957974652334865e-05, "Pretrain/Loss": 2.0484344959259033, "Pretrain/Loss (Raw)": 2.161310911178589, "Pretrain/Step": 4369, "Pretrain/Step Time": 8.432844895869493} +{"Pretrain/Learning Rate": 2.9571400055728242e-05, "Pretrain/Loss": 2.046844005584717, "Pretrain/Loss (Raw)": 1.8976575136184692, "Pretrain/Step": 4370, "Pretrain/Step Time": 8.422992542386055} +{"Pretrain/Learning Rate": 2.9563053060912426e-05, "Pretrain/Loss": 2.045588731765747, "Pretrain/Loss (Raw)": 1.8247274160385132, "Pretrain/Step": 4371, "Pretrain/Step Time": 8.429682698100805} +{"Pretrain/Learning Rate": 2.9554705539863842e-05, "Pretrain/Loss": 2.0449461936950684, "Pretrain/Loss (Raw)": 2.0372068881988525, "Pretrain/Step": 4372, "Pretrain/Step Time": 8.432842168956995} +{"Pretrain/Learning Rate": 2.954635749354514e-05, "Pretrain/Loss": 2.0495376586914062, "Pretrain/Loss (Raw)": 2.5932657718658447, "Pretrain/Step": 4373, "Pretrain/Step Time": 8.433960804715753} +{"Pretrain/Learning Rate": 2.953800892291908e-05, "Pretrain/Loss": 2.047914505004883, "Pretrain/Loss (Raw)": 1.893945574760437, "Pretrain/Step": 4374, "Pretrain/Step Time": 8.433797569945455} +{"Pretrain/Learning Rate": 2.9529659828948442e-05, "Pretrain/Loss": 2.0492331981658936, "Pretrain/Loss (Raw)": 2.1370725631713867, "Pretrain/Step": 4375, "Pretrain/Step Time": 8.427381670102477} +{"Pretrain/Learning Rate": 2.9521310212596087e-05, "Pretrain/Loss": 2.048212766647339, "Pretrain/Loss (Raw)": 1.9430750608444214, "Pretrain/Step": 4376, "Pretrain/Step Time": 8.428394163027406} +{"Pretrain/Learning Rate": 2.951296007482493e-05, "Pretrain/Loss": 2.049640655517578, "Pretrain/Loss (Raw)": 1.9436498880386353, "Pretrain/Step": 4377, "Pretrain/Step Time": 8.426996029913425} +{"Pretrain/Learning Rate": 2.9504609416597956e-05, "Pretrain/Loss": 2.0502986907958984, "Pretrain/Loss (Raw)": 2.1026899814605713, "Pretrain/Step": 4378, "Pretrain/Step Time": 8.430093467235565} +{"Pretrain/Learning Rate": 2.9496258238878198e-05, "Pretrain/Loss": 2.051888942718506, "Pretrain/Loss (Raw)": 2.3429183959960938, "Pretrain/Step": 4379, "Pretrain/Step Time": 8.431490197777748} +{"Pretrain/Learning Rate": 2.9487906542628753e-05, "Pretrain/Loss": 2.052128791809082, "Pretrain/Loss (Raw)": 1.9842406511306763, "Pretrain/Step": 4380, "Pretrain/Step Time": 8.430713754147291} +{"Pretrain/Learning Rate": 2.9479554328812775e-05, "Pretrain/Loss": 2.0508854389190674, "Pretrain/Loss (Raw)": 1.9079126119613647, "Pretrain/Step": 4381, "Pretrain/Step Time": 8.427306443452835} +{"Pretrain/Learning Rate": 2.9471201598393482e-05, "Pretrain/Loss": 2.0487828254699707, "Pretrain/Loss (Raw)": 1.813501238822937, "Pretrain/Step": 4382, "Pretrain/Step Time": 8.420691542327404} +{"Pretrain/Learning Rate": 2.946284835233416e-05, "Pretrain/Loss": 2.048722267150879, "Pretrain/Loss (Raw)": 1.9406946897506714, "Pretrain/Step": 4383, "Pretrain/Step Time": 8.425370952114463} +{"Pretrain/Learning Rate": 2.945449459159813e-05, "Pretrain/Loss": 2.0497825145721436, "Pretrain/Loss (Raw)": 2.097505807876587, "Pretrain/Step": 4384, "Pretrain/Step Time": 8.42658120021224} +{"Pretrain/Learning Rate": 2.9446140317148795e-05, "Pretrain/Loss": 2.0486414432525635, "Pretrain/Loss (Raw)": 2.0005886554718018, "Pretrain/Step": 4385, "Pretrain/Step Time": 8.424768969416618} +{"Pretrain/Learning Rate": 2.9437785529949606e-05, "Pretrain/Loss": 2.0501339435577393, "Pretrain/Loss (Raw)": 2.3240585327148438, "Pretrain/Step": 4386, "Pretrain/Step Time": 8.416775712743402} +{"Pretrain/Learning Rate": 2.9429430230964084e-05, "Pretrain/Loss": 2.0488357543945312, "Pretrain/Loss (Raw)": 1.9434832334518433, "Pretrain/Step": 4387, "Pretrain/Step Time": 8.413551105186343} +{"Pretrain/Learning Rate": 2.9421074421155787e-05, "Pretrain/Loss": 2.047226905822754, "Pretrain/Loss (Raw)": 1.9226725101470947, "Pretrain/Step": 4388, "Pretrain/Step Time": 8.412677900865674} +{"Pretrain/Learning Rate": 2.9412718101488364e-05, "Pretrain/Loss": 2.0452475547790527, "Pretrain/Loss (Raw)": 1.8695305585861206, "Pretrain/Step": 4389, "Pretrain/Step Time": 8.42745141685009} +{"Pretrain/Learning Rate": 2.9404361272925497e-05, "Pretrain/Loss": 2.0457606315612793, "Pretrain/Loss (Raw)": 2.273562431335449, "Pretrain/Step": 4390, "Pretrain/Step Time": 8.421641614288092} +{"Pretrain/Learning Rate": 2.939600393643092e-05, "Pretrain/Loss": 2.044772148132324, "Pretrain/Loss (Raw)": 1.8462237119674683, "Pretrain/Step": 4391, "Pretrain/Step Time": 8.423121489584446} +{"Pretrain/Learning Rate": 2.9387646092968468e-05, "Pretrain/Loss": 2.0438060760498047, "Pretrain/Loss (Raw)": 2.1211607456207275, "Pretrain/Step": 4392, "Pretrain/Step Time": 8.416057532653213} +{"Pretrain/Learning Rate": 2.9379287743501983e-05, "Pretrain/Loss": 2.0453598499298096, "Pretrain/Loss (Raw)": 2.128392457962036, "Pretrain/Step": 4393, "Pretrain/Step Time": 8.419282058253884} +{"Pretrain/Learning Rate": 2.9370928888995407e-05, "Pretrain/Loss": 2.043858289718628, "Pretrain/Loss (Raw)": 2.0283725261688232, "Pretrain/Step": 4394, "Pretrain/Step Time": 8.419105043634772} +{"Pretrain/Learning Rate": 2.936256953041271e-05, "Pretrain/Loss": 2.0446314811706543, "Pretrain/Loss (Raw)": 2.023118019104004, "Pretrain/Step": 4395, "Pretrain/Step Time": 8.426452899351716} +{"Pretrain/Learning Rate": 2.935420966871795e-05, "Pretrain/Loss": 2.045699119567871, "Pretrain/Loss (Raw)": 2.248124837875366, "Pretrain/Step": 4396, "Pretrain/Step Time": 8.424857959151268} +{"Pretrain/Learning Rate": 2.9345849304875195e-05, "Pretrain/Loss": 2.045642375946045, "Pretrain/Loss (Raw)": 2.0840940475463867, "Pretrain/Step": 4397, "Pretrain/Step Time": 8.422189839184284} +{"Pretrain/Learning Rate": 2.9337488439848633e-05, "Pretrain/Loss": 2.0452003479003906, "Pretrain/Loss (Raw)": 2.0049948692321777, "Pretrain/Step": 4398, "Pretrain/Step Time": 8.426153808832169} +{"Pretrain/Learning Rate": 2.9329127074602458e-05, "Pretrain/Loss": 2.0475656986236572, "Pretrain/Loss (Raw)": 2.2876009941101074, "Pretrain/Step": 4399, "Pretrain/Step Time": 8.428767392411828} +{"Pretrain/Learning Rate": 2.9320765210100952e-05, "Pretrain/Loss": 2.0480480194091797, "Pretrain/Loss (Raw)": 2.2014904022216797, "Pretrain/Step": 4400, "Pretrain/Step Time": 8.433830292895436} +{"Pretrain/Learning Rate": 2.931240284730844e-05, "Pretrain/Loss": 2.0479419231414795, "Pretrain/Loss (Raw)": 2.1076958179473877, "Pretrain/Step": 4401, "Pretrain/Step Time": 8.435791561380029} +{"Pretrain/Learning Rate": 2.9304039987189313e-05, "Pretrain/Loss": 2.0503740310668945, "Pretrain/Loss (Raw)": 2.144714832305908, "Pretrain/Step": 4402, "Pretrain/Step Time": 8.430389849469066} +{"Pretrain/Learning Rate": 2.9295676630708013e-05, "Pretrain/Loss": 2.0515971183776855, "Pretrain/Loss (Raw)": 2.0890064239501953, "Pretrain/Step": 4403, "Pretrain/Step Time": 8.432031655684114} +{"Pretrain/Learning Rate": 2.9287312778829047e-05, "Pretrain/Loss": 2.0493783950805664, "Pretrain/Loss (Raw)": 1.9018350839614868, "Pretrain/Step": 4404, "Pretrain/Step Time": 8.425574094057083} +{"Pretrain/Learning Rate": 2.9278948432516968e-05, "Pretrain/Loss": 2.0499253273010254, "Pretrain/Loss (Raw)": 2.027339220046997, "Pretrain/Step": 4405, "Pretrain/Step Time": 8.426500706002116} +{"Pretrain/Learning Rate": 2.9270583592736385e-05, "Pretrain/Loss": 2.047427177429199, "Pretrain/Loss (Raw)": 1.887851595878601, "Pretrain/Step": 4406, "Pretrain/Step Time": 8.43221803382039} +{"Pretrain/Learning Rate": 2.9262218260451984e-05, "Pretrain/Loss": 2.047271966934204, "Pretrain/Loss (Raw)": 1.9694006443023682, "Pretrain/Step": 4407, "Pretrain/Step Time": 8.43562226369977} +{"Pretrain/Learning Rate": 2.9253852436628483e-05, "Pretrain/Loss": 2.0470833778381348, "Pretrain/Loss (Raw)": 1.9115126132965088, "Pretrain/Step": 4408, "Pretrain/Step Time": 8.435715874657035} +{"Pretrain/Learning Rate": 2.924548612223068e-05, "Pretrain/Loss": 2.0461883544921875, "Pretrain/Loss (Raw)": 1.9064429998397827, "Pretrain/Step": 4409, "Pretrain/Step Time": 8.434183256700635} +{"Pretrain/Learning Rate": 2.923711931822341e-05, "Pretrain/Loss": 2.0470774173736572, "Pretrain/Loss (Raw)": 2.0484039783477783, "Pretrain/Step": 4410, "Pretrain/Step Time": 8.42668954655528} +{"Pretrain/Learning Rate": 2.9228752025571575e-05, "Pretrain/Loss": 2.0450844764709473, "Pretrain/Loss (Raw)": 2.1258554458618164, "Pretrain/Step": 4411, "Pretrain/Step Time": 8.424357639625669} +{"Pretrain/Learning Rate": 2.922038424524013e-05, "Pretrain/Loss": 2.0456743240356445, "Pretrain/Loss (Raw)": 2.1426029205322266, "Pretrain/Step": 4412, "Pretrain/Step Time": 8.4252457190305} +{"Pretrain/Learning Rate": 2.9212015978194083e-05, "Pretrain/Loss": 2.0478811264038086, "Pretrain/Loss (Raw)": 2.2102622985839844, "Pretrain/Step": 4413, "Pretrain/Step Time": 8.429793817922473} +{"Pretrain/Learning Rate": 2.920364722539851e-05, "Pretrain/Loss": 2.046731948852539, "Pretrain/Loss (Raw)": 1.9725250005722046, "Pretrain/Step": 4414, "Pretrain/Step Time": 8.431666089221835} +{"Pretrain/Learning Rate": 2.9195277987818533e-05, "Pretrain/Loss": 2.048377752304077, "Pretrain/Loss (Raw)": 2.024095296859741, "Pretrain/Step": 4415, "Pretrain/Step Time": 8.424979142844677} +{"Pretrain/Learning Rate": 2.918690826641932e-05, "Pretrain/Loss": 2.049978256225586, "Pretrain/Loss (Raw)": 1.9099664688110352, "Pretrain/Step": 4416, "Pretrain/Step Time": 8.428956450894475} +{"Pretrain/Learning Rate": 2.917853806216613e-05, "Pretrain/Loss": 2.0505852699279785, "Pretrain/Loss (Raw)": 2.1895885467529297, "Pretrain/Step": 4417, "Pretrain/Step Time": 8.43651750124991} +{"Pretrain/Learning Rate": 2.9170167376024228e-05, "Pretrain/Loss": 2.0495920181274414, "Pretrain/Loss (Raw)": 1.7279767990112305, "Pretrain/Step": 4418, "Pretrain/Step Time": 8.443896556273103} +{"Pretrain/Learning Rate": 2.9161796208958974e-05, "Pretrain/Loss": 2.0483388900756836, "Pretrain/Loss (Raw)": 1.8590370416641235, "Pretrain/Step": 4419, "Pretrain/Step Time": 8.440920514985919} +{"Pretrain/Learning Rate": 2.9153424561935782e-05, "Pretrain/Loss": 2.047694444656372, "Pretrain/Loss (Raw)": 1.940941333770752, "Pretrain/Step": 4420, "Pretrain/Step Time": 8.438639478757977} +{"Pretrain/Learning Rate": 2.914505243592009e-05, "Pretrain/Loss": 2.0480003356933594, "Pretrain/Loss (Raw)": 1.9978073835372925, "Pretrain/Step": 4421, "Pretrain/Step Time": 8.43080896884203} +{"Pretrain/Learning Rate": 2.913667983187742e-05, "Pretrain/Loss": 2.0500986576080322, "Pretrain/Loss (Raw)": 2.234712600708008, "Pretrain/Step": 4422, "Pretrain/Step Time": 8.432290568947792} +{"Pretrain/Learning Rate": 2.9128306750773338e-05, "Pretrain/Loss": 2.0506677627563477, "Pretrain/Loss (Raw)": 2.098857879638672, "Pretrain/Step": 4423, "Pretrain/Step Time": 8.434137700125575} +{"Pretrain/Learning Rate": 2.911993319357347e-05, "Pretrain/Loss": 2.053809642791748, "Pretrain/Loss (Raw)": 1.971309781074524, "Pretrain/Step": 4424, "Pretrain/Step Time": 8.437652442604303} +{"Pretrain/Learning Rate": 2.911155916124349e-05, "Pretrain/Loss": 2.0543465614318848, "Pretrain/Loss (Raw)": 2.1414802074432373, "Pretrain/Step": 4425, "Pretrain/Step Time": 8.440571393817663} +{"Pretrain/Learning Rate": 2.910318465474914e-05, "Pretrain/Loss": 2.0548996925354004, "Pretrain/Loss (Raw)": 1.914153814315796, "Pretrain/Step": 4426, "Pretrain/Step Time": 8.435616543516517} +{"Pretrain/Learning Rate": 2.9094809675056188e-05, "Pretrain/Loss": 2.0532262325286865, "Pretrain/Loss (Raw)": 1.9871290922164917, "Pretrain/Step": 4427, "Pretrain/Step Time": 8.435013456270099} +{"Pretrain/Learning Rate": 2.9086434223130504e-05, "Pretrain/Loss": 2.0528171062469482, "Pretrain/Loss (Raw)": 2.068430185317993, "Pretrain/Step": 4428, "Pretrain/Step Time": 8.434586364775896} +{"Pretrain/Learning Rate": 2.9078058299937962e-05, "Pretrain/Loss": 2.054537534713745, "Pretrain/Loss (Raw)": 2.24196457862854, "Pretrain/Step": 4429, "Pretrain/Step Time": 8.443448467180133} +{"Pretrain/Learning Rate": 2.9069681906444518e-05, "Pretrain/Loss": 2.051340341567993, "Pretrain/Loss (Raw)": 1.8834799528121948, "Pretrain/Step": 4430, "Pretrain/Step Time": 8.435497300699353} +{"Pretrain/Learning Rate": 2.906130504361619e-05, "Pretrain/Loss": 2.0524582862854004, "Pretrain/Loss (Raw)": 2.1378395557403564, "Pretrain/Step": 4431, "Pretrain/Step Time": 8.437313182279468} +{"Pretrain/Learning Rate": 2.9052927712419013e-05, "Pretrain/Loss": 2.0509791374206543, "Pretrain/Loss (Raw)": 1.9812166690826416, "Pretrain/Step": 4432, "Pretrain/Step Time": 8.43117856234312} +{"Pretrain/Learning Rate": 2.9044549913819124e-05, "Pretrain/Loss": 2.0507988929748535, "Pretrain/Loss (Raw)": 1.9936782121658325, "Pretrain/Step": 4433, "Pretrain/Step Time": 8.430531941354275} +{"Pretrain/Learning Rate": 2.9036171648782672e-05, "Pretrain/Loss": 2.048492908477783, "Pretrain/Loss (Raw)": 2.092360496520996, "Pretrain/Step": 4434, "Pretrain/Step Time": 8.432934269309044} +{"Pretrain/Learning Rate": 2.9027792918275894e-05, "Pretrain/Loss": 2.050370216369629, "Pretrain/Loss (Raw)": 2.111567735671997, "Pretrain/Step": 4435, "Pretrain/Step Time": 8.43421765230596} +{"Pretrain/Learning Rate": 2.9019413723265053e-05, "Pretrain/Loss": 2.0457425117492676, "Pretrain/Loss (Raw)": 1.6998491287231445, "Pretrain/Step": 4436, "Pretrain/Step Time": 8.434961685910821} +{"Pretrain/Learning Rate": 2.9011034064716485e-05, "Pretrain/Loss": 2.0450210571289062, "Pretrain/Loss (Raw)": 2.116872787475586, "Pretrain/Step": 4437, "Pretrain/Step Time": 8.437699364498258} +{"Pretrain/Learning Rate": 2.9002653943596564e-05, "Pretrain/Loss": 2.0436344146728516, "Pretrain/Loss (Raw)": 1.894680380821228, "Pretrain/Step": 4438, "Pretrain/Step Time": 8.432273048907518} +{"Pretrain/Learning Rate": 2.8994273360871734e-05, "Pretrain/Loss": 2.043057441711426, "Pretrain/Loss (Raw)": 2.0627529621124268, "Pretrain/Step": 4439, "Pretrain/Step Time": 8.43321986310184} +{"Pretrain/Learning Rate": 2.898589231750847e-05, "Pretrain/Loss": 2.040062427520752, "Pretrain/Loss (Raw)": 1.763527274131775, "Pretrain/Step": 4440, "Pretrain/Step Time": 8.450175192207098} +{"Pretrain/Learning Rate": 2.897751081447333e-05, "Pretrain/Loss": 2.037139654159546, "Pretrain/Loss (Raw)": 1.810156226158142, "Pretrain/Step": 4441, "Pretrain/Step Time": 8.45123889297247} +{"Pretrain/Learning Rate": 2.8969128852732896e-05, "Pretrain/Loss": 2.033111333847046, "Pretrain/Loss (Raw)": 1.7592636346817017, "Pretrain/Step": 4442, "Pretrain/Step Time": 8.449000673368573} +{"Pretrain/Learning Rate": 2.896074643325382e-05, "Pretrain/Loss": 2.031813383102417, "Pretrain/Loss (Raw)": 2.057413101196289, "Pretrain/Step": 4443, "Pretrain/Step Time": 8.441202281042933} +{"Pretrain/Learning Rate": 2.8952363557002798e-05, "Pretrain/Loss": 2.032780647277832, "Pretrain/Loss (Raw)": 2.061525344848633, "Pretrain/Step": 4444, "Pretrain/Step Time": 8.437210831791162} +{"Pretrain/Learning Rate": 2.89439802249466e-05, "Pretrain/Loss": 2.033224105834961, "Pretrain/Loss (Raw)": 2.2162320613861084, "Pretrain/Step": 4445, "Pretrain/Step Time": 8.447029076516628} +{"Pretrain/Learning Rate": 2.8935596438052003e-05, "Pretrain/Loss": 2.0339879989624023, "Pretrain/Loss (Raw)": 2.0451509952545166, "Pretrain/Step": 4446, "Pretrain/Step Time": 8.45569409430027} +{"Pretrain/Learning Rate": 2.8927212197285885e-05, "Pretrain/Loss": 2.0344321727752686, "Pretrain/Loss (Raw)": 2.072427749633789, "Pretrain/Step": 4447, "Pretrain/Step Time": 8.45344203338027} +{"Pretrain/Learning Rate": 2.8918827503615154e-05, "Pretrain/Loss": 2.032806396484375, "Pretrain/Loss (Raw)": 2.02736759185791, "Pretrain/Step": 4448, "Pretrain/Step Time": 8.455034540966153} +{"Pretrain/Learning Rate": 2.891044235800676e-05, "Pretrain/Loss": 2.032073736190796, "Pretrain/Loss (Raw)": 1.9463337659835815, "Pretrain/Step": 4449, "Pretrain/Step Time": 8.452135093510151} +{"Pretrain/Learning Rate": 2.8902056761427744e-05, "Pretrain/Loss": 2.03183650970459, "Pretrain/Loss (Raw)": 2.134493589401245, "Pretrain/Step": 4450, "Pretrain/Step Time": 8.43740431778133} +{"Pretrain/Learning Rate": 2.889367071484514e-05, "Pretrain/Loss": 2.033024787902832, "Pretrain/Loss (Raw)": 2.008882761001587, "Pretrain/Step": 4451, "Pretrain/Step Time": 8.443054934963584} +{"Pretrain/Learning Rate": 2.888528421922608e-05, "Pretrain/Loss": 2.0312721729278564, "Pretrain/Loss (Raw)": 1.9376317262649536, "Pretrain/Step": 4452, "Pretrain/Step Time": 8.445472737774253} +{"Pretrain/Learning Rate": 2.8876897275537744e-05, "Pretrain/Loss": 2.034745931625366, "Pretrain/Loss (Raw)": 2.0361292362213135, "Pretrain/Step": 4453, "Pretrain/Step Time": 8.444659715518355} +{"Pretrain/Learning Rate": 2.8868509884747348e-05, "Pretrain/Loss": 2.035489082336426, "Pretrain/Loss (Raw)": 2.020148992538452, "Pretrain/Step": 4454, "Pretrain/Step Time": 8.443801257759333} +{"Pretrain/Learning Rate": 2.8860122047822154e-05, "Pretrain/Loss": 2.0323963165283203, "Pretrain/Loss (Raw)": 2.212167739868164, "Pretrain/Step": 4455, "Pretrain/Step Time": 8.433629581704736} +{"Pretrain/Learning Rate": 2.88517337657295e-05, "Pretrain/Loss": 2.027158498764038, "Pretrain/Loss (Raw)": 1.845750093460083, "Pretrain/Step": 4456, "Pretrain/Step Time": 8.43637471459806} +{"Pretrain/Learning Rate": 2.8843345039436758e-05, "Pretrain/Loss": 2.0290122032165527, "Pretrain/Loss (Raw)": 2.0176520347595215, "Pretrain/Step": 4457, "Pretrain/Step Time": 8.443543063476682} +{"Pretrain/Learning Rate": 2.8834955869911356e-05, "Pretrain/Loss": 2.029078483581543, "Pretrain/Loss (Raw)": 2.0206406116485596, "Pretrain/Step": 4458, "Pretrain/Step Time": 8.442148650065064} +{"Pretrain/Learning Rate": 2.8826566258120768e-05, "Pretrain/Loss": 2.030838966369629, "Pretrain/Loss (Raw)": 2.123117446899414, "Pretrain/Step": 4459, "Pretrain/Step Time": 8.442074226215482} +{"Pretrain/Learning Rate": 2.8818176205032533e-05, "Pretrain/Loss": 2.028517484664917, "Pretrain/Loss (Raw)": 1.9424306154251099, "Pretrain/Step": 4460, "Pretrain/Step Time": 8.442697253078222} +{"Pretrain/Learning Rate": 2.8809785711614228e-05, "Pretrain/Loss": 2.0270400047302246, "Pretrain/Loss (Raw)": 1.821899175643921, "Pretrain/Step": 4461, "Pretrain/Step Time": 8.4301597494632} +{"Pretrain/Learning Rate": 2.8801394778833475e-05, "Pretrain/Loss": 2.02437162399292, "Pretrain/Loss (Raw)": 1.5590314865112305, "Pretrain/Step": 4462, "Pretrain/Step Time": 8.434654854238033} +{"Pretrain/Learning Rate": 2.879300340765797e-05, "Pretrain/Loss": 2.022902250289917, "Pretrain/Loss (Raw)": 1.9388293027877808, "Pretrain/Step": 4463, "Pretrain/Step Time": 8.439484015107155} +{"Pretrain/Learning Rate": 2.8784611599055435e-05, "Pretrain/Loss": 2.0238194465637207, "Pretrain/Loss (Raw)": 2.1375210285186768, "Pretrain/Step": 4464, "Pretrain/Step Time": 8.444874484091997} +{"Pretrain/Learning Rate": 2.8776219353993662e-05, "Pretrain/Loss": 2.023981809616089, "Pretrain/Loss (Raw)": 1.9722158908843994, "Pretrain/Step": 4465, "Pretrain/Step Time": 8.443689500913024} +{"Pretrain/Learning Rate": 2.8767826673440467e-05, "Pretrain/Loss": 2.025609016418457, "Pretrain/Loss (Raw)": 2.23026180267334, "Pretrain/Step": 4466, "Pretrain/Step Time": 8.433486765250564} +{"Pretrain/Learning Rate": 2.8759433558363758e-05, "Pretrain/Loss": 2.026583433151245, "Pretrain/Loss (Raw)": 2.0792880058288574, "Pretrain/Step": 4467, "Pretrain/Step Time": 8.426724672317505} +{"Pretrain/Learning Rate": 2.875104000973145e-05, "Pretrain/Loss": 2.02604341506958, "Pretrain/Loss (Raw)": 2.089360475540161, "Pretrain/Step": 4468, "Pretrain/Step Time": 8.426582962274551} +{"Pretrain/Learning Rate": 2.874264602851154e-05, "Pretrain/Loss": 2.025777578353882, "Pretrain/Loss (Raw)": 2.0114240646362305, "Pretrain/Step": 4469, "Pretrain/Step Time": 8.432671321555972} +{"Pretrain/Learning Rate": 2.8734251615672043e-05, "Pretrain/Loss": 2.0260000228881836, "Pretrain/Loss (Raw)": 2.070526599884033, "Pretrain/Step": 4470, "Pretrain/Step Time": 8.431992249563336} +{"Pretrain/Learning Rate": 2.8725856772181058e-05, "Pretrain/Loss": 2.0256662368774414, "Pretrain/Loss (Raw)": 1.9079099893569946, "Pretrain/Step": 4471, "Pretrain/Step Time": 8.430838311091065} +{"Pretrain/Learning Rate": 2.8717461499006714e-05, "Pretrain/Loss": 2.026498317718506, "Pretrain/Loss (Raw)": 2.0169122219085693, "Pretrain/Step": 4472, "Pretrain/Step Time": 8.42981568351388} +{"Pretrain/Learning Rate": 2.8709065797117198e-05, "Pretrain/Loss": 2.027592897415161, "Pretrain/Loss (Raw)": 1.9819785356521606, "Pretrain/Step": 4473, "Pretrain/Step Time": 8.432462763041258} +{"Pretrain/Learning Rate": 2.8700669667480732e-05, "Pretrain/Loss": 2.029287338256836, "Pretrain/Loss (Raw)": 2.0435853004455566, "Pretrain/Step": 4474, "Pretrain/Step Time": 8.434806056320667} +{"Pretrain/Learning Rate": 2.86922731110656e-05, "Pretrain/Loss": 2.028022289276123, "Pretrain/Loss (Raw)": 1.8728731870651245, "Pretrain/Step": 4475, "Pretrain/Step Time": 8.431762566789985} +{"Pretrain/Learning Rate": 2.8683876128840138e-05, "Pretrain/Loss": 2.0283706188201904, "Pretrain/Loss (Raw)": 2.0182886123657227, "Pretrain/Step": 4476, "Pretrain/Step Time": 8.43169298581779} +{"Pretrain/Learning Rate": 2.8675478721772715e-05, "Pretrain/Loss": 2.028812885284424, "Pretrain/Loss (Raw)": 2.107590913772583, "Pretrain/Step": 4477, "Pretrain/Step Time": 8.432481253519654} +{"Pretrain/Learning Rate": 2.866708089083177e-05, "Pretrain/Loss": 2.026548385620117, "Pretrain/Loss (Raw)": 1.9906946420669556, "Pretrain/Step": 4478, "Pretrain/Step Time": 8.429905768483877} +{"Pretrain/Learning Rate": 2.865868263698578e-05, "Pretrain/Loss": 2.022667646408081, "Pretrain/Loss (Raw)": 1.7123552560806274, "Pretrain/Step": 4479, "Pretrain/Step Time": 8.430666010826826} +{"Pretrain/Learning Rate": 2.8650283961203267e-05, "Pretrain/Loss": 2.023606777191162, "Pretrain/Loss (Raw)": 2.1424474716186523, "Pretrain/Step": 4480, "Pretrain/Step Time": 8.43086258508265} +{"Pretrain/Learning Rate": 2.86418848644528e-05, "Pretrain/Loss": 2.021789073944092, "Pretrain/Loss (Raw)": 1.9485249519348145, "Pretrain/Step": 4481, "Pretrain/Step Time": 8.433795846998692} +{"Pretrain/Learning Rate": 2.8633485347703015e-05, "Pretrain/Loss": 2.0221123695373535, "Pretrain/Loss (Raw)": 1.9486374855041504, "Pretrain/Step": 4482, "Pretrain/Step Time": 8.43579119630158} +{"Pretrain/Learning Rate": 2.8625085411922575e-05, "Pretrain/Loss": 2.019934892654419, "Pretrain/Loss (Raw)": 2.005491018295288, "Pretrain/Step": 4483, "Pretrain/Step Time": 8.435038764029741} +{"Pretrain/Learning Rate": 2.861668505808021e-05, "Pretrain/Loss": 2.0188941955566406, "Pretrain/Loss (Raw)": 1.925364375114441, "Pretrain/Step": 4484, "Pretrain/Step Time": 8.435527013614774} +{"Pretrain/Learning Rate": 2.8608284287144675e-05, "Pretrain/Loss": 2.022777557373047, "Pretrain/Loss (Raw)": 2.2957088947296143, "Pretrain/Step": 4485, "Pretrain/Step Time": 8.440764656290412} +{"Pretrain/Learning Rate": 2.85998831000848e-05, "Pretrain/Loss": 2.021256446838379, "Pretrain/Loss (Raw)": 2.0115909576416016, "Pretrain/Step": 4486, "Pretrain/Step Time": 8.443930825218558} +{"Pretrain/Learning Rate": 2.8591481497869433e-05, "Pretrain/Loss": 2.024193286895752, "Pretrain/Loss (Raw)": 2.180324077606201, "Pretrain/Step": 4487, "Pretrain/Step Time": 8.441040299832821} +{"Pretrain/Learning Rate": 2.8583079481467507e-05, "Pretrain/Loss": 2.0264744758605957, "Pretrain/Loss (Raw)": 2.2439348697662354, "Pretrain/Step": 4488, "Pretrain/Step Time": 8.438017796725035} +{"Pretrain/Learning Rate": 2.857467705184797e-05, "Pretrain/Loss": 2.0242176055908203, "Pretrain/Loss (Raw)": 1.734446406364441, "Pretrain/Step": 4489, "Pretrain/Step Time": 8.433673080056906} +{"Pretrain/Learning Rate": 2.856627420997982e-05, "Pretrain/Loss": 2.025057792663574, "Pretrain/Loss (Raw)": 2.200329065322876, "Pretrain/Step": 4490, "Pretrain/Step Time": 8.435329865664244} +{"Pretrain/Learning Rate": 2.8557870956832132e-05, "Pretrain/Loss": 2.0229058265686035, "Pretrain/Loss (Raw)": 1.9077554941177368, "Pretrain/Step": 4491, "Pretrain/Step Time": 8.446227075532079} +{"Pretrain/Learning Rate": 2.8549467293374e-05, "Pretrain/Loss": 2.0220534801483154, "Pretrain/Loss (Raw)": 2.0055441856384277, "Pretrain/Step": 4492, "Pretrain/Step Time": 8.44694747030735} +{"Pretrain/Learning Rate": 2.854106322057457e-05, "Pretrain/Loss": 2.0231761932373047, "Pretrain/Loss (Raw)": 2.060682535171509, "Pretrain/Step": 4493, "Pretrain/Step Time": 8.448107708245516} +{"Pretrain/Learning Rate": 2.8532658739403046e-05, "Pretrain/Loss": 2.023132562637329, "Pretrain/Loss (Raw)": 2.039268732070923, "Pretrain/Step": 4494, "Pretrain/Step Time": 8.442575814202428} +{"Pretrain/Learning Rate": 2.852425385082867e-05, "Pretrain/Loss": 2.023343324661255, "Pretrain/Loss (Raw)": 2.0165750980377197, "Pretrain/Step": 4495, "Pretrain/Step Time": 8.438672119751573} +{"Pretrain/Learning Rate": 2.851584855582073e-05, "Pretrain/Loss": 2.0224061012268066, "Pretrain/Loss (Raw)": 1.9243117570877075, "Pretrain/Step": 4496, "Pretrain/Step Time": 8.438884707167745} +{"Pretrain/Learning Rate": 2.8507442855348577e-05, "Pretrain/Loss": 2.022676944732666, "Pretrain/Loss (Raw)": 2.1959750652313232, "Pretrain/Step": 4497, "Pretrain/Step Time": 8.443894241005182} +{"Pretrain/Learning Rate": 2.8499036750381576e-05, "Pretrain/Loss": 2.0230422019958496, "Pretrain/Loss (Raw)": 1.9444197416305542, "Pretrain/Step": 4498, "Pretrain/Step Time": 8.44499509781599} +{"Pretrain/Learning Rate": 2.849063024188917e-05, "Pretrain/Loss": 2.0261998176574707, "Pretrain/Loss (Raw)": 2.2289109230041504, "Pretrain/Step": 4499, "Pretrain/Step Time": 8.438810583204031} +{"Pretrain/Learning Rate": 2.8482223330840836e-05, "Pretrain/Loss": 2.025726795196533, "Pretrain/Loss (Raw)": 1.9766803979873657, "Pretrain/Step": 4500, "Pretrain/Step Time": 8.437724540010095} +{"Pretrain/Learning Rate": 2.84738160182061e-05, "Pretrain/Loss": 2.022289276123047, "Pretrain/Loss (Raw)": 2.1532444953918457, "Pretrain/Step": 4501, "Pretrain/Step Time": 8.440628930926323} +{"Pretrain/Learning Rate": 2.8465408304954533e-05, "Pretrain/Loss": 2.025169610977173, "Pretrain/Loss (Raw)": 2.262615442276001, "Pretrain/Step": 4502, "Pretrain/Step Time": 8.440979721024632} +{"Pretrain/Learning Rate": 2.8457000192055748e-05, "Pretrain/Loss": 2.0261282920837402, "Pretrain/Loss (Raw)": 2.2597813606262207, "Pretrain/Step": 4503, "Pretrain/Step Time": 8.44318239018321} +{"Pretrain/Learning Rate": 2.8448591680479415e-05, "Pretrain/Loss": 2.0284626483917236, "Pretrain/Loss (Raw)": 2.241874933242798, "Pretrain/Step": 4504, "Pretrain/Step Time": 8.443297289311886} +{"Pretrain/Learning Rate": 2.8440182771195235e-05, "Pretrain/Loss": 2.0317797660827637, "Pretrain/Loss (Raw)": 2.368242025375366, "Pretrain/Step": 4505, "Pretrain/Step Time": 8.4428724758327} +{"Pretrain/Learning Rate": 2.8431773465172972e-05, "Pretrain/Loss": 2.0326132774353027, "Pretrain/Loss (Raw)": 2.2093870639801025, "Pretrain/Step": 4506, "Pretrain/Step Time": 8.43801163136959} +{"Pretrain/Learning Rate": 2.8423363763382415e-05, "Pretrain/Loss": 2.02781343460083, "Pretrain/Loss (Raw)": 1.7285569906234741, "Pretrain/Step": 4507, "Pretrain/Step Time": 8.436305617913604} +{"Pretrain/Learning Rate": 2.8414953666793426e-05, "Pretrain/Loss": 2.028278112411499, "Pretrain/Loss (Raw)": 2.0437090396881104, "Pretrain/Step": 4508, "Pretrain/Step Time": 8.441130744293332} +{"Pretrain/Learning Rate": 2.8406543176375882e-05, "Pretrain/Loss": 2.030092716217041, "Pretrain/Loss (Raw)": 2.1402037143707275, "Pretrain/Step": 4509, "Pretrain/Step Time": 8.440991332754493} +{"Pretrain/Learning Rate": 2.839813229309973e-05, "Pretrain/Loss": 2.0346059799194336, "Pretrain/Loss (Raw)": 2.3911545276641846, "Pretrain/Step": 4510, "Pretrain/Step Time": 8.442134758457541} +{"Pretrain/Learning Rate": 2.8389721017934945e-05, "Pretrain/Loss": 2.0352165699005127, "Pretrain/Loss (Raw)": 2.0188491344451904, "Pretrain/Step": 4511, "Pretrain/Step Time": 8.438756760209799} +{"Pretrain/Learning Rate": 2.8381309351851564e-05, "Pretrain/Loss": 2.0370097160339355, "Pretrain/Loss (Raw)": 2.3270227909088135, "Pretrain/Step": 4512, "Pretrain/Step Time": 8.440337780863047} +{"Pretrain/Learning Rate": 2.837289729581965e-05, "Pretrain/Loss": 2.036033868789673, "Pretrain/Loss (Raw)": 1.87570059299469, "Pretrain/Step": 4513, "Pretrain/Step Time": 8.44126147404313} +{"Pretrain/Learning Rate": 2.8364484850809337e-05, "Pretrain/Loss": 2.033888578414917, "Pretrain/Loss (Raw)": 2.0494582653045654, "Pretrain/Step": 4514, "Pretrain/Step Time": 8.457512931898236} +{"Pretrain/Learning Rate": 2.835607201779077e-05, "Pretrain/Loss": 2.0329504013061523, "Pretrain/Loss (Raw)": 1.8233834505081177, "Pretrain/Step": 4515, "Pretrain/Step Time": 8.454768646508455} +{"Pretrain/Learning Rate": 2.834765879773416e-05, "Pretrain/Loss": 2.0338938236236572, "Pretrain/Loss (Raw)": 2.043452501296997, "Pretrain/Step": 4516, "Pretrain/Step Time": 8.447174286469817} +{"Pretrain/Learning Rate": 2.833924519160977e-05, "Pretrain/Loss": 2.0372328758239746, "Pretrain/Loss (Raw)": 2.296937942504883, "Pretrain/Step": 4517, "Pretrain/Step Time": 8.43543865159154} +{"Pretrain/Learning Rate": 2.8330831200387885e-05, "Pretrain/Loss": 2.0366950035095215, "Pretrain/Loss (Raw)": 2.2046897411346436, "Pretrain/Step": 4518, "Pretrain/Step Time": 8.440021425485611} +{"Pretrain/Learning Rate": 2.8322416825038855e-05, "Pretrain/Loss": 2.04044246673584, "Pretrain/Loss (Raw)": 2.32590913772583, "Pretrain/Step": 4519, "Pretrain/Step Time": 8.438129588961601} +{"Pretrain/Learning Rate": 2.831400206653305e-05, "Pretrain/Loss": 2.039832353591919, "Pretrain/Loss (Raw)": 2.0430614948272705, "Pretrain/Step": 4520, "Pretrain/Step Time": 8.445651777088642} +{"Pretrain/Learning Rate": 2.830558692584092e-05, "Pretrain/Loss": 2.0406832695007324, "Pretrain/Loss (Raw)": 2.2373061180114746, "Pretrain/Step": 4521, "Pretrain/Step Time": 8.446806276217103} +{"Pretrain/Learning Rate": 2.8297171403932928e-05, "Pretrain/Loss": 2.0410289764404297, "Pretrain/Loss (Raw)": 2.072648048400879, "Pretrain/Step": 4522, "Pretrain/Step Time": 8.448536584153771} +{"Pretrain/Learning Rate": 2.8288755501779597e-05, "Pretrain/Loss": 2.041524887084961, "Pretrain/Loss (Raw)": 2.0866141319274902, "Pretrain/Step": 4523, "Pretrain/Step Time": 8.441856851801276} +{"Pretrain/Learning Rate": 2.8280339220351475e-05, "Pretrain/Loss": 2.0393142700195312, "Pretrain/Loss (Raw)": 1.9651224613189697, "Pretrain/Step": 4524, "Pretrain/Step Time": 8.443529959768057} +{"Pretrain/Learning Rate": 2.8271922560619184e-05, "Pretrain/Loss": 2.0388567447662354, "Pretrain/Loss (Raw)": 2.0255656242370605, "Pretrain/Step": 4525, "Pretrain/Step Time": 8.444943003356457} +{"Pretrain/Learning Rate": 2.8263505523553357e-05, "Pretrain/Loss": 2.0391581058502197, "Pretrain/Loss (Raw)": 2.043534517288208, "Pretrain/Step": 4526, "Pretrain/Step Time": 8.450718006119132} +{"Pretrain/Learning Rate": 2.8255088110124705e-05, "Pretrain/Loss": 2.0370125770568848, "Pretrain/Loss (Raw)": 2.0129756927490234, "Pretrain/Step": 4527, "Pretrain/Step Time": 8.449289835989475} +{"Pretrain/Learning Rate": 2.8246670321303947e-05, "Pretrain/Loss": 2.035647392272949, "Pretrain/Loss (Raw)": 2.0267410278320312, "Pretrain/Step": 4528, "Pretrain/Step Time": 8.443878885358572} +{"Pretrain/Learning Rate": 2.8238252158061873e-05, "Pretrain/Loss": 2.035503387451172, "Pretrain/Loss (Raw)": 2.089279890060425, "Pretrain/Step": 4529, "Pretrain/Step Time": 8.442647146061063} +{"Pretrain/Learning Rate": 2.8229833621369295e-05, "Pretrain/Loss": 2.0338382720947266, "Pretrain/Loss (Raw)": 1.9315704107284546, "Pretrain/Step": 4530, "Pretrain/Step Time": 8.44458700157702} +{"Pretrain/Learning Rate": 2.822141471219709e-05, "Pretrain/Loss": 2.0328476428985596, "Pretrain/Loss (Raw)": 1.9622174501419067, "Pretrain/Step": 4531, "Pretrain/Step Time": 8.447135772556067} +{"Pretrain/Learning Rate": 2.8212995431516163e-05, "Pretrain/Loss": 2.0338034629821777, "Pretrain/Loss (Raw)": 2.024172782897949, "Pretrain/Step": 4532, "Pretrain/Step Time": 8.448268352076411} +{"Pretrain/Learning Rate": 2.820457578029746e-05, "Pretrain/Loss": 2.0309524536132812, "Pretrain/Loss (Raw)": 1.6624202728271484, "Pretrain/Step": 4533, "Pretrain/Step Time": 8.453761037439108} +{"Pretrain/Learning Rate": 2.8196155759511977e-05, "Pretrain/Loss": 2.032008647918701, "Pretrain/Loss (Raw)": 2.02302622795105, "Pretrain/Step": 4534, "Pretrain/Step Time": 8.447633974254131} +{"Pretrain/Learning Rate": 2.8187735370130745e-05, "Pretrain/Loss": 2.0326008796691895, "Pretrain/Loss (Raw)": 2.0452070236206055, "Pretrain/Step": 4535, "Pretrain/Step Time": 8.44371091015637} +{"Pretrain/Learning Rate": 2.8179314613124858e-05, "Pretrain/Loss": 2.032667398452759, "Pretrain/Loss (Raw)": 1.9200328588485718, "Pretrain/Step": 4536, "Pretrain/Step Time": 8.441973825916648} +{"Pretrain/Learning Rate": 2.817089348946542e-05, "Pretrain/Loss": 2.0358784198760986, "Pretrain/Loss (Raw)": 2.3174707889556885, "Pretrain/Step": 4537, "Pretrain/Step Time": 8.449961576610804} +{"Pretrain/Learning Rate": 2.8162472000123613e-05, "Pretrain/Loss": 2.034949779510498, "Pretrain/Loss (Raw)": 1.929505705833435, "Pretrain/Step": 4538, "Pretrain/Step Time": 8.449506588280201} +{"Pretrain/Learning Rate": 2.8154050146070627e-05, "Pretrain/Loss": 2.033332347869873, "Pretrain/Loss (Raw)": 1.9188395738601685, "Pretrain/Step": 4539, "Pretrain/Step Time": 8.449568804353476} +{"Pretrain/Learning Rate": 2.814562792827772e-05, "Pretrain/Loss": 2.03269100189209, "Pretrain/Loss (Raw)": 2.0605032444000244, "Pretrain/Step": 4540, "Pretrain/Step Time": 8.446008026599884} +{"Pretrain/Learning Rate": 2.8137205347716165e-05, "Pretrain/Loss": 2.030571460723877, "Pretrain/Loss (Raw)": 1.9389747381210327, "Pretrain/Step": 4541, "Pretrain/Step Time": 8.438842315226793} +{"Pretrain/Learning Rate": 2.8128782405357312e-05, "Pretrain/Loss": 2.0314717292785645, "Pretrain/Loss (Raw)": 2.08774995803833, "Pretrain/Step": 4542, "Pretrain/Step Time": 8.436384884640574} +{"Pretrain/Learning Rate": 2.812035910217254e-05, "Pretrain/Loss": 2.0308287143707275, "Pretrain/Loss (Raw)": 1.9417791366577148, "Pretrain/Step": 4543, "Pretrain/Step Time": 8.444874243810773} +{"Pretrain/Learning Rate": 2.811193543913324e-05, "Pretrain/Loss": 2.03218412399292, "Pretrain/Loss (Raw)": 2.08345890045166, "Pretrain/Step": 4544, "Pretrain/Step Time": 8.438591009005904} +{"Pretrain/Learning Rate": 2.8103511417210886e-05, "Pretrain/Loss": 2.0317258834838867, "Pretrain/Loss (Raw)": 2.1309409141540527, "Pretrain/Step": 4545, "Pretrain/Step Time": 8.433260696008801} +{"Pretrain/Learning Rate": 2.809508703737697e-05, "Pretrain/Loss": 2.0346407890319824, "Pretrain/Loss (Raw)": 2.1011083126068115, "Pretrain/Step": 4546, "Pretrain/Step Time": 8.426821812987328} +{"Pretrain/Learning Rate": 2.808666230060304e-05, "Pretrain/Loss": 2.0375685691833496, "Pretrain/Loss (Raw)": 2.2337963581085205, "Pretrain/Step": 4547, "Pretrain/Step Time": 8.427932146936655} +{"Pretrain/Learning Rate": 2.8078237207860658e-05, "Pretrain/Loss": 2.037045955657959, "Pretrain/Loss (Raw)": 1.874010682106018, "Pretrain/Step": 4548, "Pretrain/Step Time": 8.435666220262647} +{"Pretrain/Learning Rate": 2.806981176012146e-05, "Pretrain/Loss": 2.0351195335388184, "Pretrain/Loss (Raw)": 1.7512627840042114, "Pretrain/Step": 4549, "Pretrain/Step Time": 8.43642514012754} +{"Pretrain/Learning Rate": 2.80613859583571e-05, "Pretrain/Loss": 2.034785509109497, "Pretrain/Loss (Raw)": 2.191929817199707, "Pretrain/Step": 4550, "Pretrain/Step Time": 8.440396508201957} +{"Pretrain/Learning Rate": 2.8052959803539298e-05, "Pretrain/Loss": 2.034040927886963, "Pretrain/Loss (Raw)": 2.003554344177246, "Pretrain/Step": 4551, "Pretrain/Step Time": 8.438048562034965} +{"Pretrain/Learning Rate": 2.8044533296639774e-05, "Pretrain/Loss": 2.034823417663574, "Pretrain/Loss (Raw)": 2.071485996246338, "Pretrain/Step": 4552, "Pretrain/Step Time": 8.437813581898808} +{"Pretrain/Learning Rate": 2.8036106438630327e-05, "Pretrain/Loss": 2.035623073577881, "Pretrain/Loss (Raw)": 2.2438313961029053, "Pretrain/Step": 4553, "Pretrain/Step Time": 8.432655369862914} +{"Pretrain/Learning Rate": 2.802767923048278e-05, "Pretrain/Loss": 2.0390610694885254, "Pretrain/Loss (Raw)": 2.3542234897613525, "Pretrain/Step": 4554, "Pretrain/Step Time": 8.43592674471438} +{"Pretrain/Learning Rate": 2.8019251673168993e-05, "Pretrain/Loss": 2.039513111114502, "Pretrain/Loss (Raw)": 2.0449910163879395, "Pretrain/Step": 4555, "Pretrain/Step Time": 8.43549183383584} +{"Pretrain/Learning Rate": 2.8010823767660887e-05, "Pretrain/Loss": 2.041322708129883, "Pretrain/Loss (Raw)": 2.3000354766845703, "Pretrain/Step": 4556, "Pretrain/Step Time": 8.437992628663778} +{"Pretrain/Learning Rate": 2.8002395514930385e-05, "Pretrain/Loss": 2.0378901958465576, "Pretrain/Loss (Raw)": 1.8026177883148193, "Pretrain/Step": 4557, "Pretrain/Step Time": 8.43040930852294} +{"Pretrain/Learning Rate": 2.7993966915949493e-05, "Pretrain/Loss": 2.0374693870544434, "Pretrain/Loss (Raw)": 1.829591989517212, "Pretrain/Step": 4558, "Pretrain/Step Time": 8.434152377769351} +{"Pretrain/Learning Rate": 2.7985537971690216e-05, "Pretrain/Loss": 2.0364556312561035, "Pretrain/Loss (Raw)": 2.0080785751342773, "Pretrain/Step": 4559, "Pretrain/Step Time": 8.434328505769372} +{"Pretrain/Learning Rate": 2.7977108683124647e-05, "Pretrain/Loss": 2.036712408065796, "Pretrain/Loss (Raw)": 2.0140864849090576, "Pretrain/Step": 4560, "Pretrain/Step Time": 8.438687229529023} +{"Pretrain/Learning Rate": 2.7968679051224868e-05, "Pretrain/Loss": 2.036418914794922, "Pretrain/Loss (Raw)": 1.9561270475387573, "Pretrain/Step": 4561, "Pretrain/Step Time": 8.447419254109263} +{"Pretrain/Learning Rate": 2.796024907696303e-05, "Pretrain/Loss": 2.036388397216797, "Pretrain/Loss (Raw)": 2.088465452194214, "Pretrain/Step": 4562, "Pretrain/Step Time": 8.448170728981495} +{"Pretrain/Learning Rate": 2.795181876131132e-05, "Pretrain/Loss": 2.0364248752593994, "Pretrain/Loss (Raw)": 2.116215944290161, "Pretrain/Step": 4563, "Pretrain/Step Time": 8.443085664883256} +{"Pretrain/Learning Rate": 2.7943388105241968e-05, "Pretrain/Loss": 2.038841724395752, "Pretrain/Loss (Raw)": 2.0092341899871826, "Pretrain/Step": 4564, "Pretrain/Step Time": 8.44388380087912} +{"Pretrain/Learning Rate": 2.793495710972722e-05, "Pretrain/Loss": 2.0385172367095947, "Pretrain/Loss (Raw)": 2.07532000541687, "Pretrain/Step": 4565, "Pretrain/Step Time": 8.450590200722218} +{"Pretrain/Learning Rate": 2.79265257757394e-05, "Pretrain/Loss": 2.0401830673217773, "Pretrain/Loss (Raw)": 2.107905864715576, "Pretrain/Step": 4566, "Pretrain/Step Time": 8.448489990085363} +{"Pretrain/Learning Rate": 2.7918094104250826e-05, "Pretrain/Loss": 2.042234420776367, "Pretrain/Loss (Raw)": 2.3253350257873535, "Pretrain/Step": 4567, "Pretrain/Step Time": 8.447144851088524} +{"Pretrain/Learning Rate": 2.7909662096233897e-05, "Pretrain/Loss": 2.0444016456604004, "Pretrain/Loss (Raw)": 2.0409016609191895, "Pretrain/Step": 4568, "Pretrain/Step Time": 8.431546960026026} +{"Pretrain/Learning Rate": 2.7901229752661018e-05, "Pretrain/Loss": 2.047488212585449, "Pretrain/Loss (Raw)": 2.205272674560547, "Pretrain/Step": 4569, "Pretrain/Step Time": 8.43428572639823} +{"Pretrain/Learning Rate": 2.7892797074504656e-05, "Pretrain/Loss": 2.050121307373047, "Pretrain/Loss (Raw)": 2.0962955951690674, "Pretrain/Step": 4570, "Pretrain/Step Time": 8.433957001194358} +{"Pretrain/Learning Rate": 2.78843640627373e-05, "Pretrain/Loss": 2.0501790046691895, "Pretrain/Loss (Raw)": 2.064790964126587, "Pretrain/Step": 4571, "Pretrain/Step Time": 8.438737688586116} +{"Pretrain/Learning Rate": 2.7875930718331496e-05, "Pretrain/Loss": 2.0490012168884277, "Pretrain/Loss (Raw)": 1.9107661247253418, "Pretrain/Step": 4572, "Pretrain/Step Time": 8.437949173152447} +{"Pretrain/Learning Rate": 2.786749704225981e-05, "Pretrain/Loss": 2.048327922821045, "Pretrain/Loss (Raw)": 2.130028247833252, "Pretrain/Step": 4573, "Pretrain/Step Time": 8.430654788389802} +{"Pretrain/Learning Rate": 2.785906303549485e-05, "Pretrain/Loss": 2.046543598175049, "Pretrain/Loss (Raw)": 1.816778540611267, "Pretrain/Step": 4574, "Pretrain/Step Time": 8.419882867485285} +{"Pretrain/Learning Rate": 2.7850628699009268e-05, "Pretrain/Loss": 2.0448648929595947, "Pretrain/Loss (Raw)": 1.8575561046600342, "Pretrain/Step": 4575, "Pretrain/Step Time": 8.421919979155064} +{"Pretrain/Learning Rate": 2.7842194033775747e-05, "Pretrain/Loss": 2.0434112548828125, "Pretrain/Loss (Raw)": 1.8412971496582031, "Pretrain/Step": 4576, "Pretrain/Step Time": 8.423068348318338} +{"Pretrain/Learning Rate": 2.7833759040767027e-05, "Pretrain/Loss": 2.044055938720703, "Pretrain/Loss (Raw)": 2.0288472175598145, "Pretrain/Step": 4577, "Pretrain/Step Time": 8.433262763544917} +{"Pretrain/Learning Rate": 2.7825323720955853e-05, "Pretrain/Loss": 2.0449957847595215, "Pretrain/Loss (Raw)": 2.2548065185546875, "Pretrain/Step": 4578, "Pretrain/Step Time": 8.430603999644518} +{"Pretrain/Learning Rate": 2.781688807531504e-05, "Pretrain/Loss": 2.0455026626586914, "Pretrain/Loss (Raw)": 2.073753833770752, "Pretrain/Step": 4579, "Pretrain/Step Time": 8.427068972960114} +{"Pretrain/Learning Rate": 2.7808452104817412e-05, "Pretrain/Loss": 2.04638934135437, "Pretrain/Loss (Raw)": 2.0511562824249268, "Pretrain/Step": 4580, "Pretrain/Step Time": 8.42299885675311} +{"Pretrain/Learning Rate": 2.7800015810435865e-05, "Pretrain/Loss": 2.0483031272888184, "Pretrain/Loss (Raw)": 2.2810800075531006, "Pretrain/Step": 4581, "Pretrain/Step Time": 8.424383336678147} +{"Pretrain/Learning Rate": 2.779157919314329e-05, "Pretrain/Loss": 2.0497446060180664, "Pretrain/Loss (Raw)": 2.2046399116516113, "Pretrain/Step": 4582, "Pretrain/Step Time": 8.430335234850645} +{"Pretrain/Learning Rate": 2.7783142253912647e-05, "Pretrain/Loss": 2.0491182804107666, "Pretrain/Loss (Raw)": 2.1320064067840576, "Pretrain/Step": 4583, "Pretrain/Step Time": 8.430979797616601} +{"Pretrain/Learning Rate": 2.7774704993716937e-05, "Pretrain/Loss": 2.051283121109009, "Pretrain/Loss (Raw)": 2.122861862182617, "Pretrain/Step": 4584, "Pretrain/Step Time": 8.42537409439683} +{"Pretrain/Learning Rate": 2.776626741352916e-05, "Pretrain/Loss": 2.0507454872131348, "Pretrain/Loss (Raw)": 1.9488192796707153, "Pretrain/Step": 4585, "Pretrain/Step Time": 8.423018207773566} +{"Pretrain/Learning Rate": 2.7757829514322397e-05, "Pretrain/Loss": 2.0515871047973633, "Pretrain/Loss (Raw)": 2.128359079360962, "Pretrain/Step": 4586, "Pretrain/Step Time": 8.425424847751856} +{"Pretrain/Learning Rate": 2.774939129706974e-05, "Pretrain/Loss": 2.0513782501220703, "Pretrain/Loss (Raw)": 2.09641170501709, "Pretrain/Step": 4587, "Pretrain/Step Time": 8.421896394342184} +{"Pretrain/Learning Rate": 2.7740952762744322e-05, "Pretrain/Loss": 2.0535502433776855, "Pretrain/Loss (Raw)": 2.2204532623291016, "Pretrain/Step": 4588, "Pretrain/Step Time": 8.432884346693754} +{"Pretrain/Learning Rate": 2.7732513912319314e-05, "Pretrain/Loss": 2.055793523788452, "Pretrain/Loss (Raw)": 2.109008312225342, "Pretrain/Step": 4589, "Pretrain/Step Time": 8.432745289057493} +{"Pretrain/Learning Rate": 2.7724074746767926e-05, "Pretrain/Loss": 2.059098720550537, "Pretrain/Loss (Raw)": 1.9821101427078247, "Pretrain/Step": 4590, "Pretrain/Step Time": 8.428099827840924} +{"Pretrain/Learning Rate": 2.77156352670634e-05, "Pretrain/Loss": 2.059999704360962, "Pretrain/Loss (Raw)": 2.054164171218872, "Pretrain/Step": 4591, "Pretrain/Step Time": 8.42716046795249} +{"Pretrain/Learning Rate": 2.770719547417902e-05, "Pretrain/Loss": 2.0568766593933105, "Pretrain/Loss (Raw)": 1.7377593517303467, "Pretrain/Step": 4592, "Pretrain/Step Time": 8.42157632485032} +{"Pretrain/Learning Rate": 2.76987553690881e-05, "Pretrain/Loss": 2.057827949523926, "Pretrain/Loss (Raw)": 2.093966007232666, "Pretrain/Step": 4593, "Pretrain/Step Time": 8.4249925352633} +{"Pretrain/Learning Rate": 2.7690314952764e-05, "Pretrain/Loss": 2.057133674621582, "Pretrain/Loss (Raw)": 2.1413791179656982, "Pretrain/Step": 4594, "Pretrain/Step Time": 8.43540090881288} +{"Pretrain/Learning Rate": 2.7681874226180093e-05, "Pretrain/Loss": 2.0542619228363037, "Pretrain/Loss (Raw)": 1.711734652519226, "Pretrain/Step": 4595, "Pretrain/Step Time": 8.435343628749251} +{"Pretrain/Learning Rate": 2.7673433190309823e-05, "Pretrain/Loss": 2.053743362426758, "Pretrain/Loss (Raw)": 2.022984743118286, "Pretrain/Step": 4596, "Pretrain/Step Time": 8.431146420538425} +{"Pretrain/Learning Rate": 2.766499184612663e-05, "Pretrain/Loss": 2.051920175552368, "Pretrain/Loss (Raw)": 1.7780545949935913, "Pretrain/Step": 4597, "Pretrain/Step Time": 8.424709688872099} +{"Pretrain/Learning Rate": 2.7656550194604026e-05, "Pretrain/Loss": 2.0511858463287354, "Pretrain/Loss (Raw)": 1.9765375852584839, "Pretrain/Step": 4598, "Pretrain/Step Time": 8.425900492817163} +{"Pretrain/Learning Rate": 2.7648108236715536e-05, "Pretrain/Loss": 2.0522043704986572, "Pretrain/Loss (Raw)": 2.0382697582244873, "Pretrain/Step": 4599, "Pretrain/Step Time": 8.428853124380112} +{"Pretrain/Learning Rate": 2.7639665973434725e-05, "Pretrain/Loss": 2.0526883602142334, "Pretrain/Loss (Raw)": 2.0788869857788086, "Pretrain/Step": 4600, "Pretrain/Step Time": 8.432853415608406} +{"Pretrain/Learning Rate": 2.7631223405735196e-05, "Pretrain/Loss": 2.0520870685577393, "Pretrain/Loss (Raw)": 1.904990553855896, "Pretrain/Step": 4601, "Pretrain/Step Time": 8.433324990794063} +{"Pretrain/Learning Rate": 2.7622780534590582e-05, "Pretrain/Loss": 2.048572301864624, "Pretrain/Loss (Raw)": 1.5936903953552246, "Pretrain/Step": 4602, "Pretrain/Step Time": 8.433421736583114} +{"Pretrain/Learning Rate": 2.7614337360974558e-05, "Pretrain/Loss": 2.049879550933838, "Pretrain/Loss (Raw)": 2.0401861667633057, "Pretrain/Step": 4603, "Pretrain/Step Time": 8.432659525424242} +{"Pretrain/Learning Rate": 2.760589388586083e-05, "Pretrain/Loss": 2.0506250858306885, "Pretrain/Loss (Raw)": 2.1137592792510986, "Pretrain/Step": 4604, "Pretrain/Step Time": 8.43047944828868} +{"Pretrain/Learning Rate": 2.7597450110223145e-05, "Pretrain/Loss": 2.0499322414398193, "Pretrain/Loss (Raw)": 2.018890380859375, "Pretrain/Step": 4605, "Pretrain/Step Time": 8.433554576709867} +{"Pretrain/Learning Rate": 2.7589006035035264e-05, "Pretrain/Loss": 2.049170970916748, "Pretrain/Loss (Raw)": 1.893235683441162, "Pretrain/Step": 4606, "Pretrain/Step Time": 8.435204599052668} +{"Pretrain/Learning Rate": 2.7580561661271014e-05, "Pretrain/Loss": 2.053107261657715, "Pretrain/Loss (Raw)": 2.2162153720855713, "Pretrain/Step": 4607, "Pretrain/Step Time": 8.433140443637967} +{"Pretrain/Learning Rate": 2.7572116989904228e-05, "Pretrain/Loss": 2.052415370941162, "Pretrain/Loss (Raw)": 2.0538885593414307, "Pretrain/Step": 4608, "Pretrain/Step Time": 8.429920891299844} +{"Pretrain/Learning Rate": 2.7563672021908797e-05, "Pretrain/Loss": 2.052100658416748, "Pretrain/Loss (Raw)": 1.9082175493240356, "Pretrain/Step": 4609, "Pretrain/Step Time": 8.425846373662353} +{"Pretrain/Learning Rate": 2.7555226758258624e-05, "Pretrain/Loss": 2.052076816558838, "Pretrain/Loss (Raw)": 1.9456006288528442, "Pretrain/Step": 4610, "Pretrain/Step Time": 8.426185075193644} +{"Pretrain/Learning Rate": 2.7546781199927667e-05, "Pretrain/Loss": 2.0538058280944824, "Pretrain/Loss (Raw)": 2.22680926322937, "Pretrain/Step": 4611, "Pretrain/Step Time": 8.430821171030402} +{"Pretrain/Learning Rate": 2.7538335347889892e-05, "Pretrain/Loss": 2.0552377700805664, "Pretrain/Loss (Raw)": 2.108665704727173, "Pretrain/Step": 4612, "Pretrain/Step Time": 8.430356975644827} +{"Pretrain/Learning Rate": 2.752988920311933e-05, "Pretrain/Loss": 2.053086280822754, "Pretrain/Loss (Raw)": 2.020322561264038, "Pretrain/Step": 4613, "Pretrain/Step Time": 8.427818965166807} +{"Pretrain/Learning Rate": 2.7521442766590027e-05, "Pretrain/Loss": 2.053967237472534, "Pretrain/Loss (Raw)": 2.124346971511841, "Pretrain/Step": 4614, "Pretrain/Step Time": 8.427412467077374} +{"Pretrain/Learning Rate": 2.7512996039276055e-05, "Pretrain/Loss": 2.0528645515441895, "Pretrain/Loss (Raw)": 2.0391829013824463, "Pretrain/Step": 4615, "Pretrain/Step Time": 8.428624151274562} +{"Pretrain/Learning Rate": 2.7504549022151543e-05, "Pretrain/Loss": 2.0517115592956543, "Pretrain/Loss (Raw)": 2.096362590789795, "Pretrain/Step": 4616, "Pretrain/Step Time": 8.435222178697586} +{"Pretrain/Learning Rate": 2.749610171619063e-05, "Pretrain/Loss": 2.053579568862915, "Pretrain/Loss (Raw)": 1.973528265953064, "Pretrain/Step": 4617, "Pretrain/Step Time": 8.4361636582762} +{"Pretrain/Learning Rate": 2.748765412236751e-05, "Pretrain/Loss": 2.0537519454956055, "Pretrain/Loss (Raw)": 2.2224044799804688, "Pretrain/Step": 4618, "Pretrain/Step Time": 8.432066276669502} +{"Pretrain/Learning Rate": 2.747920624165639e-05, "Pretrain/Loss": 2.0541727542877197, "Pretrain/Loss (Raw)": 1.9616186618804932, "Pretrain/Step": 4619, "Pretrain/Step Time": 8.423330353572965} +{"Pretrain/Learning Rate": 2.7470758075031533e-05, "Pretrain/Loss": 2.0539958477020264, "Pretrain/Loss (Raw)": 1.9829108715057373, "Pretrain/Step": 4620, "Pretrain/Step Time": 8.426710464060307} +{"Pretrain/Learning Rate": 2.7462309623467204e-05, "Pretrain/Loss": 2.0533878803253174, "Pretrain/Loss (Raw)": 1.9828506708145142, "Pretrain/Step": 4621, "Pretrain/Step Time": 8.432585503906012} +{"Pretrain/Learning Rate": 2.7453860887937732e-05, "Pretrain/Loss": 2.0525197982788086, "Pretrain/Loss (Raw)": 1.9281294345855713, "Pretrain/Step": 4622, "Pretrain/Step Time": 8.437547113746405} +{"Pretrain/Learning Rate": 2.7445411869417453e-05, "Pretrain/Loss": 2.0521650314331055, "Pretrain/Loss (Raw)": 1.9711856842041016, "Pretrain/Step": 4623, "Pretrain/Step Time": 8.43191034719348} +{"Pretrain/Learning Rate": 2.7436962568880752e-05, "Pretrain/Loss": 2.0542514324188232, "Pretrain/Loss (Raw)": 2.1913654804229736, "Pretrain/Step": 4624, "Pretrain/Step Time": 8.434369908645749} +{"Pretrain/Learning Rate": 2.7428512987302053e-05, "Pretrain/Loss": 2.052950382232666, "Pretrain/Loss (Raw)": 2.0294435024261475, "Pretrain/Step": 4625, "Pretrain/Step Time": 8.428927130997181} +{"Pretrain/Learning Rate": 2.7420063125655787e-05, "Pretrain/Loss": 2.055392265319824, "Pretrain/Loss (Raw)": 2.257014274597168, "Pretrain/Step": 4626, "Pretrain/Step Time": 8.4253103248775} +{"Pretrain/Learning Rate": 2.741161298491644e-05, "Pretrain/Loss": 2.051307201385498, "Pretrain/Loss (Raw)": 1.7059967517852783, "Pretrain/Step": 4627, "Pretrain/Step Time": 8.429939594119787} +{"Pretrain/Learning Rate": 2.7403162566058517e-05, "Pretrain/Loss": 2.0503907203674316, "Pretrain/Loss (Raw)": 1.8593631982803345, "Pretrain/Step": 4628, "Pretrain/Step Time": 8.435161309316754} +{"Pretrain/Learning Rate": 2.7394711870056567e-05, "Pretrain/Loss": 2.050508499145508, "Pretrain/Loss (Raw)": 2.1683225631713867, "Pretrain/Step": 4629, "Pretrain/Step Time": 8.429423451423645} +{"Pretrain/Learning Rate": 2.7386260897885156e-05, "Pretrain/Loss": 2.049084424972534, "Pretrain/Loss (Raw)": 2.080341100692749, "Pretrain/Step": 4630, "Pretrain/Step Time": 8.429915208369493} +{"Pretrain/Learning Rate": 2.73778096505189e-05, "Pretrain/Loss": 2.047445297241211, "Pretrain/Loss (Raw)": 2.049969434738159, "Pretrain/Step": 4631, "Pretrain/Step Time": 8.428063750267029} +{"Pretrain/Learning Rate": 2.7369358128932422e-05, "Pretrain/Loss": 2.046656608581543, "Pretrain/Loss (Raw)": 2.140935182571411, "Pretrain/Step": 4632, "Pretrain/Step Time": 8.427864076569676} +{"Pretrain/Learning Rate": 2.7360906334100407e-05, "Pretrain/Loss": 2.0419702529907227, "Pretrain/Loss (Raw)": 1.7683875560760498, "Pretrain/Step": 4633, "Pretrain/Step Time": 8.425700694322586} +{"Pretrain/Learning Rate": 2.7352454266997545e-05, "Pretrain/Loss": 2.03981876373291, "Pretrain/Loss (Raw)": 1.933982253074646, "Pretrain/Step": 4634, "Pretrain/Step Time": 8.435389939695597} +{"Pretrain/Learning Rate": 2.734400192859857e-05, "Pretrain/Loss": 2.0430774688720703, "Pretrain/Loss (Raw)": 2.1456961631774902, "Pretrain/Step": 4635, "Pretrain/Step Time": 8.432527847588062} +{"Pretrain/Learning Rate": 2.7335549319878252e-05, "Pretrain/Loss": 2.0409786701202393, "Pretrain/Loss (Raw)": 1.7750463485717773, "Pretrain/Step": 4636, "Pretrain/Step Time": 8.431060502305627} +{"Pretrain/Learning Rate": 2.7327096441811383e-05, "Pretrain/Loss": 2.0415263175964355, "Pretrain/Loss (Raw)": 2.210318088531494, "Pretrain/Step": 4637, "Pretrain/Step Time": 8.431016704067588} +{"Pretrain/Learning Rate": 2.7318643295372776e-05, "Pretrain/Loss": 2.0374488830566406, "Pretrain/Loss (Raw)": 1.8692190647125244, "Pretrain/Step": 4638, "Pretrain/Step Time": 8.429928051307797} +{"Pretrain/Learning Rate": 2.7310189881537307e-05, "Pretrain/Loss": 2.0365681648254395, "Pretrain/Loss (Raw)": 1.9061301946640015, "Pretrain/Step": 4639, "Pretrain/Step Time": 8.43813069164753} +{"Pretrain/Learning Rate": 2.7301736201279858e-05, "Pretrain/Loss": 2.0347352027893066, "Pretrain/Loss (Raw)": 2.0923595428466797, "Pretrain/Step": 4640, "Pretrain/Step Time": 8.44111954793334} +{"Pretrain/Learning Rate": 2.7293282255575335e-05, "Pretrain/Loss": 2.035823345184326, "Pretrain/Loss (Raw)": 2.015033721923828, "Pretrain/Step": 4641, "Pretrain/Step Time": 8.440764607861638} +{"Pretrain/Learning Rate": 2.7284828045398703e-05, "Pretrain/Loss": 2.0349650382995605, "Pretrain/Loss (Raw)": 1.9395906925201416, "Pretrain/Step": 4642, "Pretrain/Step Time": 8.428468767553568} +{"Pretrain/Learning Rate": 2.7276373571724927e-05, "Pretrain/Loss": 2.0358104705810547, "Pretrain/Loss (Raw)": 1.9315719604492188, "Pretrain/Step": 4643, "Pretrain/Step Time": 8.431913236156106} +{"Pretrain/Learning Rate": 2.7267918835529033e-05, "Pretrain/Loss": 2.035266876220703, "Pretrain/Loss (Raw)": 1.9738801717758179, "Pretrain/Step": 4644, "Pretrain/Step Time": 8.432946125045419} +{"Pretrain/Learning Rate": 2.725946383778605e-05, "Pretrain/Loss": 2.034694194793701, "Pretrain/Loss (Raw)": 2.2236666679382324, "Pretrain/Step": 4645, "Pretrain/Step Time": 8.43531595915556} +{"Pretrain/Learning Rate": 2.7251008579471044e-05, "Pretrain/Loss": 2.033456802368164, "Pretrain/Loss (Raw)": 2.0462746620178223, "Pretrain/Step": 4646, "Pretrain/Step Time": 8.437310181558132} +{"Pretrain/Learning Rate": 2.7242553061559123e-05, "Pretrain/Loss": 2.02995228767395, "Pretrain/Loss (Raw)": 1.8773248195648193, "Pretrain/Step": 4647, "Pretrain/Step Time": 8.43748070858419} +{"Pretrain/Learning Rate": 2.7234097285025424e-05, "Pretrain/Loss": 2.0300841331481934, "Pretrain/Loss (Raw)": 2.0599372386932373, "Pretrain/Step": 4648, "Pretrain/Step Time": 8.431356329470873} +{"Pretrain/Learning Rate": 2.7225641250845085e-05, "Pretrain/Loss": 2.0267903804779053, "Pretrain/Loss (Raw)": 1.815723180770874, "Pretrain/Step": 4649, "Pretrain/Step Time": 8.424381859600544} +{"Pretrain/Learning Rate": 2.7217184959993326e-05, "Pretrain/Loss": 2.0258567333221436, "Pretrain/Loss (Raw)": 1.9531104564666748, "Pretrain/Step": 4650, "Pretrain/Step Time": 8.426268104463816} +{"Pretrain/Learning Rate": 2.7208728413445332e-05, "Pretrain/Loss": 2.0248842239379883, "Pretrain/Loss (Raw)": 1.9621639251708984, "Pretrain/Step": 4651, "Pretrain/Step Time": 8.43141377530992} +{"Pretrain/Learning Rate": 2.720027161217638e-05, "Pretrain/Loss": 2.0248208045959473, "Pretrain/Loss (Raw)": 1.956984519958496, "Pretrain/Step": 4652, "Pretrain/Step Time": 8.431390963494778} +{"Pretrain/Learning Rate": 2.7191814557161736e-05, "Pretrain/Loss": 2.026963949203491, "Pretrain/Loss (Raw)": 2.299905300140381, "Pretrain/Step": 4653, "Pretrain/Step Time": 8.431370344012976} +{"Pretrain/Learning Rate": 2.7183357249376712e-05, "Pretrain/Loss": 2.0294547080993652, "Pretrain/Loss (Raw)": 2.362321376800537, "Pretrain/Step": 4654, "Pretrain/Step Time": 8.42327370122075} +{"Pretrain/Learning Rate": 2.7174899689796636e-05, "Pretrain/Loss": 2.029989242553711, "Pretrain/Loss (Raw)": 2.081416606903076, "Pretrain/Step": 4655, "Pretrain/Step Time": 8.424754779785872} +{"Pretrain/Learning Rate": 2.7166441879396887e-05, "Pretrain/Loss": 2.0281457901000977, "Pretrain/Loss (Raw)": 1.7907565832138062, "Pretrain/Step": 4656, "Pretrain/Step Time": 8.430711751803756} +{"Pretrain/Learning Rate": 2.7157983819152848e-05, "Pretrain/Loss": 2.027726173400879, "Pretrain/Loss (Raw)": 2.0355799198150635, "Pretrain/Step": 4657, "Pretrain/Step Time": 8.428790800273418} +{"Pretrain/Learning Rate": 2.714952551003994e-05, "Pretrain/Loss": 2.0291647911071777, "Pretrain/Loss (Raw)": 2.115734100341797, "Pretrain/Step": 4658, "Pretrain/Step Time": 8.429723469540477} +{"Pretrain/Learning Rate": 2.714106695303363e-05, "Pretrain/Loss": 2.0292410850524902, "Pretrain/Loss (Raw)": 1.9719523191452026, "Pretrain/Step": 4659, "Pretrain/Step Time": 8.425467371940613} +{"Pretrain/Learning Rate": 2.7132608149109383e-05, "Pretrain/Loss": 2.027905225753784, "Pretrain/Loss (Raw)": 1.8532025814056396, "Pretrain/Step": 4660, "Pretrain/Step Time": 8.423320591449738} +{"Pretrain/Learning Rate": 2.7124149099242724e-05, "Pretrain/Loss": 2.030456066131592, "Pretrain/Loss (Raw)": 1.98894464969635, "Pretrain/Step": 4661, "Pretrain/Step Time": 8.43049804866314} +{"Pretrain/Learning Rate": 2.7115689804409174e-05, "Pretrain/Loss": 2.03143310546875, "Pretrain/Loss (Raw)": 2.1480627059936523, "Pretrain/Step": 4662, "Pretrain/Step Time": 8.432697994634509} +{"Pretrain/Learning Rate": 2.710723026558431e-05, "Pretrain/Loss": 2.032144069671631, "Pretrain/Loss (Raw)": 2.1362342834472656, "Pretrain/Step": 4663, "Pretrain/Step Time": 8.42990561015904} +{"Pretrain/Learning Rate": 2.709877048374371e-05, "Pretrain/Loss": 2.033501148223877, "Pretrain/Loss (Raw)": 2.0937113761901855, "Pretrain/Step": 4664, "Pretrain/Step Time": 8.431904861703515} +{"Pretrain/Learning Rate": 2.709031045986302e-05, "Pretrain/Loss": 2.031529188156128, "Pretrain/Loss (Raw)": 2.0650854110717773, "Pretrain/Step": 4665, "Pretrain/Step Time": 8.423887718468904} +{"Pretrain/Learning Rate": 2.708185019491788e-05, "Pretrain/Loss": 2.031586170196533, "Pretrain/Loss (Raw)": 1.9367644786834717, "Pretrain/Step": 4666, "Pretrain/Step Time": 8.422954512760043} +{"Pretrain/Learning Rate": 2.707338968988396e-05, "Pretrain/Loss": 2.0323333740234375, "Pretrain/Loss (Raw)": 2.0144989490509033, "Pretrain/Step": 4667, "Pretrain/Step Time": 8.4265773948282} +{"Pretrain/Learning Rate": 2.7064928945736974e-05, "Pretrain/Loss": 2.0345637798309326, "Pretrain/Loss (Raw)": 2.3460021018981934, "Pretrain/Step": 4668, "Pretrain/Step Time": 8.429736780002713} +{"Pretrain/Learning Rate": 2.7056467963452646e-05, "Pretrain/Loss": 2.034968614578247, "Pretrain/Loss (Raw)": 1.99079167842865, "Pretrain/Step": 4669, "Pretrain/Step Time": 8.429897703230381} +{"Pretrain/Learning Rate": 2.704800674400675e-05, "Pretrain/Loss": 2.034970760345459, "Pretrain/Loss (Raw)": 2.088024854660034, "Pretrain/Step": 4670, "Pretrain/Step Time": 8.434947684407234} +{"Pretrain/Learning Rate": 2.703954528837506e-05, "Pretrain/Loss": 2.034834623336792, "Pretrain/Loss (Raw)": 1.924344539642334, "Pretrain/Step": 4671, "Pretrain/Step Time": 8.428339255973697} +{"Pretrain/Learning Rate": 2.7031083597533402e-05, "Pretrain/Loss": 2.034945487976074, "Pretrain/Loss (Raw)": 2.097646951675415, "Pretrain/Step": 4672, "Pretrain/Step Time": 8.430223777890205} +{"Pretrain/Learning Rate": 2.702262167245761e-05, "Pretrain/Loss": 2.036437511444092, "Pretrain/Loss (Raw)": 2.3219103813171387, "Pretrain/Step": 4673, "Pretrain/Step Time": 8.43499581515789} +{"Pretrain/Learning Rate": 2.7014159514123555e-05, "Pretrain/Loss": 2.0352442264556885, "Pretrain/Loss (Raw)": 1.948402762413025, "Pretrain/Step": 4674, "Pretrain/Step Time": 8.436018573120236} +{"Pretrain/Learning Rate": 2.7005697123507134e-05, "Pretrain/Loss": 2.0333657264709473, "Pretrain/Loss (Raw)": 1.993337869644165, "Pretrain/Step": 4675, "Pretrain/Step Time": 8.439601972699165} +{"Pretrain/Learning Rate": 2.6997234501584267e-05, "Pretrain/Loss": 2.0358798503875732, "Pretrain/Loss (Raw)": 2.1958093643188477, "Pretrain/Step": 4676, "Pretrain/Step Time": 8.427660673856735} +{"Pretrain/Learning Rate": 2.6988771649330906e-05, "Pretrain/Loss": 2.038756847381592, "Pretrain/Loss (Raw)": 2.119528293609619, "Pretrain/Step": 4677, "Pretrain/Step Time": 8.426856517791748} +{"Pretrain/Learning Rate": 2.6980308567723035e-05, "Pretrain/Loss": 2.0383963584899902, "Pretrain/Loss (Raw)": 2.145782470703125, "Pretrain/Step": 4678, "Pretrain/Step Time": 8.428527617827058} +{"Pretrain/Learning Rate": 2.697184525773664e-05, "Pretrain/Loss": 2.0403780937194824, "Pretrain/Loss (Raw)": 2.257225751876831, "Pretrain/Step": 4679, "Pretrain/Step Time": 8.432696498930454} +{"Pretrain/Learning Rate": 2.6963381720347764e-05, "Pretrain/Loss": 2.0407466888427734, "Pretrain/Loss (Raw)": 2.118635892868042, "Pretrain/Step": 4680, "Pretrain/Step Time": 8.437143443152308} +{"Pretrain/Learning Rate": 2.6954917956532455e-05, "Pretrain/Loss": 2.0395150184631348, "Pretrain/Loss (Raw)": 2.0861880779266357, "Pretrain/Step": 4681, "Pretrain/Step Time": 8.438232949003577} +{"Pretrain/Learning Rate": 2.6946453967266792e-05, "Pretrain/Loss": 2.0371196269989014, "Pretrain/Loss (Raw)": 2.0476181507110596, "Pretrain/Step": 4682, "Pretrain/Step Time": 8.43439763225615} +{"Pretrain/Learning Rate": 2.693798975352689e-05, "Pretrain/Loss": 2.0350561141967773, "Pretrain/Loss (Raw)": 1.7808679342269897, "Pretrain/Step": 4683, "Pretrain/Step Time": 8.437141597270966} +{"Pretrain/Learning Rate": 2.6929525316288874e-05, "Pretrain/Loss": 2.030388355255127, "Pretrain/Loss (Raw)": 1.7025492191314697, "Pretrain/Step": 4684, "Pretrain/Step Time": 8.43888396024704} +{"Pretrain/Learning Rate": 2.692106065652891e-05, "Pretrain/Loss": 2.0324368476867676, "Pretrain/Loss (Raw)": 2.0648510456085205, "Pretrain/Step": 4685, "Pretrain/Step Time": 8.436732770875096} +{"Pretrain/Learning Rate": 2.6912595775223175e-05, "Pretrain/Loss": 2.0331544876098633, "Pretrain/Loss (Raw)": 1.9214329719543457, "Pretrain/Step": 4686, "Pretrain/Step Time": 8.434691859409213} +{"Pretrain/Learning Rate": 2.6904130673347887e-05, "Pretrain/Loss": 2.034451961517334, "Pretrain/Loss (Raw)": 2.1741607189178467, "Pretrain/Step": 4687, "Pretrain/Step Time": 8.430844815447927} +{"Pretrain/Learning Rate": 2.6895665351879274e-05, "Pretrain/Loss": 2.034592390060425, "Pretrain/Loss (Raw)": 2.0320522785186768, "Pretrain/Step": 4688, "Pretrain/Step Time": 8.42941515147686} +{"Pretrain/Learning Rate": 2.68871998117936e-05, "Pretrain/Loss": 2.0421111583709717, "Pretrain/Loss (Raw)": 2.918529987335205, "Pretrain/Step": 4689, "Pretrain/Step Time": 8.418250933289528} +{"Pretrain/Learning Rate": 2.687873405406715e-05, "Pretrain/Loss": 2.0423107147216797, "Pretrain/Loss (Raw)": 2.1140313148498535, "Pretrain/Step": 4690, "Pretrain/Step Time": 8.423718547448516} +{"Pretrain/Learning Rate": 2.6870268079676237e-05, "Pretrain/Loss": 2.040907382965088, "Pretrain/Loss (Raw)": 1.9365875720977783, "Pretrain/Step": 4691, "Pretrain/Step Time": 8.423744907602668} +{"Pretrain/Learning Rate": 2.6861801889597193e-05, "Pretrain/Loss": 2.0402722358703613, "Pretrain/Loss (Raw)": 1.927903413772583, "Pretrain/Step": 4692, "Pretrain/Step Time": 8.423464260995388} +{"Pretrain/Learning Rate": 2.685333548480639e-05, "Pretrain/Loss": 2.0412380695343018, "Pretrain/Loss (Raw)": 2.1989731788635254, "Pretrain/Step": 4693, "Pretrain/Step Time": 8.416850727051497} +{"Pretrain/Learning Rate": 2.68448688662802e-05, "Pretrain/Loss": 2.04229736328125, "Pretrain/Loss (Raw)": 2.2434885501861572, "Pretrain/Step": 4694, "Pretrain/Step Time": 8.41709553822875} +{"Pretrain/Learning Rate": 2.683640203499504e-05, "Pretrain/Loss": 2.039720296859741, "Pretrain/Loss (Raw)": 1.995459794998169, "Pretrain/Step": 4695, "Pretrain/Step Time": 8.422091074287891} +{"Pretrain/Learning Rate": 2.682793499192734e-05, "Pretrain/Loss": 2.039954900741577, "Pretrain/Loss (Raw)": 2.0709335803985596, "Pretrain/Step": 4696, "Pretrain/Step Time": 8.428396183997393} +{"Pretrain/Learning Rate": 2.6819467738053572e-05, "Pretrain/Loss": 2.0383028984069824, "Pretrain/Loss (Raw)": 1.9938337802886963, "Pretrain/Step": 4697, "Pretrain/Step Time": 8.425790911540389} +{"Pretrain/Learning Rate": 2.6811000274350205e-05, "Pretrain/Loss": 2.0388376712799072, "Pretrain/Loss (Raw)": 2.164746046066284, "Pretrain/Step": 4698, "Pretrain/Step Time": 8.42745235003531} +{"Pretrain/Learning Rate": 2.680253260179375e-05, "Pretrain/Loss": 2.038837432861328, "Pretrain/Loss (Raw)": 2.06477427482605, "Pretrain/Step": 4699, "Pretrain/Step Time": 8.428983116522431} +{"Pretrain/Learning Rate": 2.6794064721360752e-05, "Pretrain/Loss": 2.042128562927246, "Pretrain/Loss (Raw)": 2.3320207595825195, "Pretrain/Step": 4700, "Pretrain/Step Time": 8.427502324804664} +{"Pretrain/Learning Rate": 2.6785596634027745e-05, "Pretrain/Loss": 2.042126178741455, "Pretrain/Loss (Raw)": 2.1297197341918945, "Pretrain/Step": 4701, "Pretrain/Step Time": 8.432975236326456} +{"Pretrain/Learning Rate": 2.677712834077133e-05, "Pretrain/Loss": 2.0431652069091797, "Pretrain/Loss (Raw)": 1.9497830867767334, "Pretrain/Step": 4702, "Pretrain/Step Time": 8.43425559066236} +{"Pretrain/Learning Rate": 2.676865984256809e-05, "Pretrain/Loss": 2.0466768741607666, "Pretrain/Loss (Raw)": 2.307049512863159, "Pretrain/Step": 4703, "Pretrain/Step Time": 8.432232543826103} +{"Pretrain/Learning Rate": 2.6760191140394668e-05, "Pretrain/Loss": 2.049323797225952, "Pretrain/Loss (Raw)": 2.180088520050049, "Pretrain/Step": 4704, "Pretrain/Step Time": 8.428242152556777} +{"Pretrain/Learning Rate": 2.675172223522771e-05, "Pretrain/Loss": 2.052088737487793, "Pretrain/Loss (Raw)": 2.38273024559021, "Pretrain/Step": 4705, "Pretrain/Step Time": 8.417028300464153} +{"Pretrain/Learning Rate": 2.6743253128043887e-05, "Pretrain/Loss": 2.0502312183380127, "Pretrain/Loss (Raw)": 2.017073631286621, "Pretrain/Step": 4706, "Pretrain/Step Time": 8.42708571255207} +{"Pretrain/Learning Rate": 2.6734783819819903e-05, "Pretrain/Loss": 2.0494704246520996, "Pretrain/Loss (Raw)": 1.976386308670044, "Pretrain/Step": 4707, "Pretrain/Step Time": 8.43245736323297} +{"Pretrain/Learning Rate": 2.6726314311532467e-05, "Pretrain/Loss": 2.048388719558716, "Pretrain/Loss (Raw)": 1.9126756191253662, "Pretrain/Step": 4708, "Pretrain/Step Time": 8.432494062930346} +{"Pretrain/Learning Rate": 2.671784460415834e-05, "Pretrain/Loss": 2.0469393730163574, "Pretrain/Loss (Raw)": 2.095585584640503, "Pretrain/Step": 4709, "Pretrain/Step Time": 8.433932906016707} +{"Pretrain/Learning Rate": 2.6709374698674267e-05, "Pretrain/Loss": 2.0462379455566406, "Pretrain/Loss (Raw)": 2.1148462295532227, "Pretrain/Step": 4710, "Pretrain/Step Time": 8.427584474906325} +{"Pretrain/Learning Rate": 2.670090459605706e-05, "Pretrain/Loss": 2.0459327697753906, "Pretrain/Loss (Raw)": 2.0929534435272217, "Pretrain/Step": 4711, "Pretrain/Step Time": 8.425456896424294} +{"Pretrain/Learning Rate": 2.6692434297283514e-05, "Pretrain/Loss": 2.043747901916504, "Pretrain/Loss (Raw)": 1.8431802988052368, "Pretrain/Step": 4712, "Pretrain/Step Time": 8.428470365703106} +{"Pretrain/Learning Rate": 2.6683963803330468e-05, "Pretrain/Loss": 2.043774366378784, "Pretrain/Loss (Raw)": 1.9521894454956055, "Pretrain/Step": 4713, "Pretrain/Step Time": 8.431242307648063} +{"Pretrain/Learning Rate": 2.6675493115174786e-05, "Pretrain/Loss": 2.0440773963928223, "Pretrain/Loss (Raw)": 2.167171001434326, "Pretrain/Step": 4714, "Pretrain/Step Time": 8.43061346001923} +{"Pretrain/Learning Rate": 2.6667022233793342e-05, "Pretrain/Loss": 2.043017864227295, "Pretrain/Loss (Raw)": 1.9607787132263184, "Pretrain/Step": 4715, "Pretrain/Step Time": 8.428840924054384} +{"Pretrain/Learning Rate": 2.6658551160163036e-05, "Pretrain/Loss": 2.0419225692749023, "Pretrain/Loss (Raw)": 2.0802786350250244, "Pretrain/Step": 4716, "Pretrain/Step Time": 8.419302679598331} +{"Pretrain/Learning Rate": 2.6650079895260798e-05, "Pretrain/Loss": 2.041287899017334, "Pretrain/Loss (Raw)": 2.0277631282806396, "Pretrain/Step": 4717, "Pretrain/Step Time": 8.42500925064087} +{"Pretrain/Learning Rate": 2.664160844006357e-05, "Pretrain/Loss": 2.041869640350342, "Pretrain/Loss (Raw)": 2.0565578937530518, "Pretrain/Step": 4718, "Pretrain/Step Time": 8.429036147892475} +{"Pretrain/Learning Rate": 2.6633136795548326e-05, "Pretrain/Loss": 2.0413479804992676, "Pretrain/Loss (Raw)": 1.9874156713485718, "Pretrain/Step": 4719, "Pretrain/Step Time": 8.433630887418985} +{"Pretrain/Learning Rate": 2.662466496269204e-05, "Pretrain/Loss": 2.0468592643737793, "Pretrain/Loss (Raw)": 2.4432027339935303, "Pretrain/Step": 4720, "Pretrain/Step Time": 8.43603634275496} +{"Pretrain/Learning Rate": 2.661619294247174e-05, "Pretrain/Loss": 2.0465762615203857, "Pretrain/Loss (Raw)": 2.0577147006988525, "Pretrain/Step": 4721, "Pretrain/Step Time": 8.432045951485634} +{"Pretrain/Learning Rate": 2.6607720735864454e-05, "Pretrain/Loss": 2.044053077697754, "Pretrain/Loss (Raw)": 1.8184317350387573, "Pretrain/Step": 4722, "Pretrain/Step Time": 8.425200130790472} +{"Pretrain/Learning Rate": 2.6599248343847244e-05, "Pretrain/Loss": 2.046375036239624, "Pretrain/Loss (Raw)": 2.00895094871521, "Pretrain/Step": 4723, "Pretrain/Step Time": 8.424166882410645} +{"Pretrain/Learning Rate": 2.6590775767397174e-05, "Pretrain/Loss": 2.0436625480651855, "Pretrain/Loss (Raw)": 1.6757922172546387, "Pretrain/Step": 4724, "Pretrain/Step Time": 8.42941932938993} +{"Pretrain/Learning Rate": 2.6582303007491345e-05, "Pretrain/Loss": 2.045092821121216, "Pretrain/Loss (Raw)": 1.9611059427261353, "Pretrain/Step": 4725, "Pretrain/Step Time": 8.427661184221506} +{"Pretrain/Learning Rate": 2.6573830065106874e-05, "Pretrain/Loss": 2.0440311431884766, "Pretrain/Loss (Raw)": 1.8406206369400024, "Pretrain/Step": 4726, "Pretrain/Step Time": 8.428830472752452} +{"Pretrain/Learning Rate": 2.6565356941220908e-05, "Pretrain/Loss": 2.0438857078552246, "Pretrain/Loss (Raw)": 2.019674062728882, "Pretrain/Step": 4727, "Pretrain/Step Time": 8.427006075158715} +{"Pretrain/Learning Rate": 2.6556883636810605e-05, "Pretrain/Loss": 2.0426993370056152, "Pretrain/Loss (Raw)": 1.9270375967025757, "Pretrain/Step": 4728, "Pretrain/Step Time": 8.420996995642781} +{"Pretrain/Learning Rate": 2.6548410152853142e-05, "Pretrain/Loss": 2.042933940887451, "Pretrain/Loss (Raw)": 1.9350043535232544, "Pretrain/Step": 4729, "Pretrain/Step Time": 8.421627456322312} +{"Pretrain/Learning Rate": 2.6539936490325725e-05, "Pretrain/Loss": 2.0472970008850098, "Pretrain/Loss (Raw)": 2.15215802192688, "Pretrain/Step": 4730, "Pretrain/Step Time": 8.424236811697483} +{"Pretrain/Learning Rate": 2.6531462650205575e-05, "Pretrain/Loss": 2.0474934577941895, "Pretrain/Loss (Raw)": 2.0653531551361084, "Pretrain/Step": 4731, "Pretrain/Step Time": 8.426846131682396} +{"Pretrain/Learning Rate": 2.6522988633469938e-05, "Pretrain/Loss": 2.0461902618408203, "Pretrain/Loss (Raw)": 1.946934461593628, "Pretrain/Step": 4732, "Pretrain/Step Time": 8.431830631569028} +{"Pretrain/Learning Rate": 2.6514514441096066e-05, "Pretrain/Loss": 2.045544385910034, "Pretrain/Loss (Raw)": 1.9362270832061768, "Pretrain/Step": 4733, "Pretrain/Step Time": 8.427304681390524} +{"Pretrain/Learning Rate": 2.650604007406126e-05, "Pretrain/Loss": 2.0458004474639893, "Pretrain/Loss (Raw)": 1.9259997606277466, "Pretrain/Step": 4734, "Pretrain/Step Time": 8.426841149106622} +{"Pretrain/Learning Rate": 2.6497565533342816e-05, "Pretrain/Loss": 2.0439040660858154, "Pretrain/Loss (Raw)": 1.9734994173049927, "Pretrain/Step": 4735, "Pretrain/Step Time": 8.436508562415838} +{"Pretrain/Learning Rate": 2.6489090819918057e-05, "Pretrain/Loss": 2.042337656021118, "Pretrain/Loss (Raw)": 1.8533999919891357, "Pretrain/Step": 4736, "Pretrain/Step Time": 8.441191334277391} +{"Pretrain/Learning Rate": 2.6480615934764323e-05, "Pretrain/Loss": 2.0438807010650635, "Pretrain/Loss (Raw)": 2.105703115463257, "Pretrain/Step": 4737, "Pretrain/Step Time": 8.441025588661432} +{"Pretrain/Learning Rate": 2.6472140878858994e-05, "Pretrain/Loss": 2.0441102981567383, "Pretrain/Loss (Raw)": 1.9750103950500488, "Pretrain/Step": 4738, "Pretrain/Step Time": 8.436791468411684} +{"Pretrain/Learning Rate": 2.646366565317943e-05, "Pretrain/Loss": 2.042202949523926, "Pretrain/Loss (Raw)": 1.9826328754425049, "Pretrain/Step": 4739, "Pretrain/Step Time": 8.43261262215674} +{"Pretrain/Learning Rate": 2.6455190258703056e-05, "Pretrain/Loss": 2.0419278144836426, "Pretrain/Loss (Raw)": 2.0734801292419434, "Pretrain/Step": 4740, "Pretrain/Step Time": 8.431789392605424} +{"Pretrain/Learning Rate": 2.644671469640728e-05, "Pretrain/Loss": 2.0408453941345215, "Pretrain/Loss (Raw)": 1.8817741870880127, "Pretrain/Step": 4741, "Pretrain/Step Time": 8.434832697734237} +{"Pretrain/Learning Rate": 2.6438238967269546e-05, "Pretrain/Loss": 2.040003538131714, "Pretrain/Loss (Raw)": 2.0165538787841797, "Pretrain/Step": 4742, "Pretrain/Step Time": 8.431311724707484} +{"Pretrain/Learning Rate": 2.6429763072267317e-05, "Pretrain/Loss": 2.0398921966552734, "Pretrain/Loss (Raw)": 2.024925708770752, "Pretrain/Step": 4743, "Pretrain/Step Time": 8.432854741811752} +{"Pretrain/Learning Rate": 2.642128701237807e-05, "Pretrain/Loss": 2.0399231910705566, "Pretrain/Loss (Raw)": 2.1003308296203613, "Pretrain/Step": 4744, "Pretrain/Step Time": 8.427113484591246} +{"Pretrain/Learning Rate": 2.641281078857932e-05, "Pretrain/Loss": 2.039393901824951, "Pretrain/Loss (Raw)": 1.9058233499526978, "Pretrain/Step": 4745, "Pretrain/Step Time": 8.426789905875921} +{"Pretrain/Learning Rate": 2.6404334401848558e-05, "Pretrain/Loss": 2.0376574993133545, "Pretrain/Loss (Raw)": 2.0001041889190674, "Pretrain/Step": 4746, "Pretrain/Step Time": 8.432638661935925} +{"Pretrain/Learning Rate": 2.6395857853163346e-05, "Pretrain/Loss": 2.0363640785217285, "Pretrain/Loss (Raw)": 1.7960641384124756, "Pretrain/Step": 4747, "Pretrain/Step Time": 8.436726704239845} +{"Pretrain/Learning Rate": 2.6387381143501217e-05, "Pretrain/Loss": 2.0367183685302734, "Pretrain/Loss (Raw)": 2.028280735015869, "Pretrain/Step": 4748, "Pretrain/Step Time": 8.4383694678545} +{"Pretrain/Learning Rate": 2.6378904273839765e-05, "Pretrain/Loss": 2.0376670360565186, "Pretrain/Loss (Raw)": 2.104292869567871, "Pretrain/Step": 4749, "Pretrain/Step Time": 8.430499844253063} +{"Pretrain/Learning Rate": 2.6370427245156574e-05, "Pretrain/Loss": 2.0384812355041504, "Pretrain/Loss (Raw)": 2.032299041748047, "Pretrain/Step": 4750, "Pretrain/Step Time": 8.42728771083057} +{"Pretrain/Learning Rate": 2.6361950058429257e-05, "Pretrain/Loss": 2.0396783351898193, "Pretrain/Loss (Raw)": 2.1244547367095947, "Pretrain/Step": 4751, "Pretrain/Step Time": 8.43176880478859} +{"Pretrain/Learning Rate": 2.635347271463544e-05, "Pretrain/Loss": 2.0384178161621094, "Pretrain/Loss (Raw)": 2.0300064086914062, "Pretrain/Step": 4752, "Pretrain/Step Time": 8.43196315318346} +{"Pretrain/Learning Rate": 2.6344995214752772e-05, "Pretrain/Loss": 2.038968563079834, "Pretrain/Loss (Raw)": 2.0999248027801514, "Pretrain/Step": 4753, "Pretrain/Step Time": 8.43786952458322} +{"Pretrain/Learning Rate": 2.6336517559758915e-05, "Pretrain/Loss": 2.0378637313842773, "Pretrain/Loss (Raw)": 2.1156210899353027, "Pretrain/Step": 4754, "Pretrain/Step Time": 8.440166059881449} +{"Pretrain/Learning Rate": 2.632803975063156e-05, "Pretrain/Loss": 2.0405006408691406, "Pretrain/Loss (Raw)": 2.0435328483581543, "Pretrain/Step": 4755, "Pretrain/Step Time": 8.439000139012933} +{"Pretrain/Learning Rate": 2.6319561788348402e-05, "Pretrain/Loss": 2.0416181087493896, "Pretrain/Loss (Raw)": 2.0023815631866455, "Pretrain/Step": 4756, "Pretrain/Step Time": 8.431727893650532} +{"Pretrain/Learning Rate": 2.6311083673887154e-05, "Pretrain/Loss": 2.0395467281341553, "Pretrain/Loss (Raw)": 1.903196930885315, "Pretrain/Step": 4757, "Pretrain/Step Time": 8.436330035328865} +{"Pretrain/Learning Rate": 2.6302605408225572e-05, "Pretrain/Loss": 2.0426833629608154, "Pretrain/Loss (Raw)": 2.481801986694336, "Pretrain/Step": 4758, "Pretrain/Step Time": 8.43827304057777} +{"Pretrain/Learning Rate": 2.6294126992341382e-05, "Pretrain/Loss": 2.042295455932617, "Pretrain/Loss (Raw)": 2.000324010848999, "Pretrain/Step": 4759, "Pretrain/Step Time": 8.442377807572484} +{"Pretrain/Learning Rate": 2.628564842721238e-05, "Pretrain/Loss": 2.0439398288726807, "Pretrain/Loss (Raw)": 2.3514156341552734, "Pretrain/Step": 4760, "Pretrain/Step Time": 8.439598642289639} +{"Pretrain/Learning Rate": 2.6277169713816337e-05, "Pretrain/Loss": 2.046909809112549, "Pretrain/Loss (Raw)": 2.148548126220703, "Pretrain/Step": 4761, "Pretrain/Step Time": 8.440483966842294} +{"Pretrain/Learning Rate": 2.6268690853131067e-05, "Pretrain/Loss": 2.048292875289917, "Pretrain/Loss (Raw)": 2.111008644104004, "Pretrain/Step": 4762, "Pretrain/Step Time": 8.430995849892497} +{"Pretrain/Learning Rate": 2.6260211846134387e-05, "Pretrain/Loss": 2.047091007232666, "Pretrain/Loss (Raw)": 1.9918477535247803, "Pretrain/Step": 4763, "Pretrain/Step Time": 8.437338871881366} +{"Pretrain/Learning Rate": 2.6251732693804144e-05, "Pretrain/Loss": 2.0499649047851562, "Pretrain/Loss (Raw)": 2.142940044403076, "Pretrain/Step": 4764, "Pretrain/Step Time": 8.434311877936125} +{"Pretrain/Learning Rate": 2.6243253397118178e-05, "Pretrain/Loss": 2.050112724304199, "Pretrain/Loss (Raw)": 2.2292561531066895, "Pretrain/Step": 4765, "Pretrain/Step Time": 8.434070244431496} +{"Pretrain/Learning Rate": 2.6234773957054383e-05, "Pretrain/Loss": 2.049022674560547, "Pretrain/Loss (Raw)": 1.7296417951583862, "Pretrain/Step": 4766, "Pretrain/Step Time": 8.438446450978518} +{"Pretrain/Learning Rate": 2.6226294374590638e-05, "Pretrain/Loss": 2.0497193336486816, "Pretrain/Loss (Raw)": 1.995336651802063, "Pretrain/Step": 4767, "Pretrain/Step Time": 8.427756668999791} +{"Pretrain/Learning Rate": 2.6217814650704835e-05, "Pretrain/Loss": 2.049720287322998, "Pretrain/Loss (Raw)": 2.09248685836792, "Pretrain/Step": 4768, "Pretrain/Step Time": 8.424664814025164} +{"Pretrain/Learning Rate": 2.620933478637492e-05, "Pretrain/Loss": 2.0505340099334717, "Pretrain/Loss (Raw)": 2.1191816329956055, "Pretrain/Step": 4769, "Pretrain/Step Time": 8.429626137018204} +{"Pretrain/Learning Rate": 2.620085478257881e-05, "Pretrain/Loss": 2.051866054534912, "Pretrain/Loss (Raw)": 2.11008620262146, "Pretrain/Step": 4770, "Pretrain/Step Time": 8.426706083118916} +{"Pretrain/Learning Rate": 2.6192374640294477e-05, "Pretrain/Loss": 2.0521187782287598, "Pretrain/Loss (Raw)": 1.9639259576797485, "Pretrain/Step": 4771, "Pretrain/Step Time": 8.424795733764768} +{"Pretrain/Learning Rate": 2.618389436049987e-05, "Pretrain/Loss": 2.0537452697753906, "Pretrain/Loss (Raw)": 2.182072162628174, "Pretrain/Step": 4772, "Pretrain/Step Time": 8.423686567693949} +{"Pretrain/Learning Rate": 2.6175413944172995e-05, "Pretrain/Loss": 2.0482397079467773, "Pretrain/Loss (Raw)": 1.5189664363861084, "Pretrain/Step": 4773, "Pretrain/Step Time": 8.422307088971138} +{"Pretrain/Learning Rate": 2.6166933392291843e-05, "Pretrain/Loss": 2.0475411415100098, "Pretrain/Loss (Raw)": 1.9568226337432861, "Pretrain/Step": 4774, "Pretrain/Step Time": 8.425894785672426} +{"Pretrain/Learning Rate": 2.6158452705834434e-05, "Pretrain/Loss": 2.0488972663879395, "Pretrain/Loss (Raw)": 2.0509374141693115, "Pretrain/Step": 4775, "Pretrain/Step Time": 8.428224515169859} +{"Pretrain/Learning Rate": 2.6149971885778795e-05, "Pretrain/Loss": 2.047929525375366, "Pretrain/Loss (Raw)": 1.9360544681549072, "Pretrain/Step": 4776, "Pretrain/Step Time": 8.430678045377135} +{"Pretrain/Learning Rate": 2.6141490933102987e-05, "Pretrain/Loss": 2.0492196083068848, "Pretrain/Loss (Raw)": 1.9808639287948608, "Pretrain/Step": 4777, "Pretrain/Step Time": 8.43115508183837} +{"Pretrain/Learning Rate": 2.6133009848785062e-05, "Pretrain/Loss": 2.0505404472351074, "Pretrain/Loss (Raw)": 2.1221776008605957, "Pretrain/Step": 4778, "Pretrain/Step Time": 8.428879391402006} +{"Pretrain/Learning Rate": 2.6124528633803103e-05, "Pretrain/Loss": 2.0496461391448975, "Pretrain/Loss (Raw)": 1.8476901054382324, "Pretrain/Step": 4779, "Pretrain/Step Time": 8.421558750793338} +{"Pretrain/Learning Rate": 2.61160472891352e-05, "Pretrain/Loss": 2.0498104095458984, "Pretrain/Loss (Raw)": 1.9780325889587402, "Pretrain/Step": 4780, "Pretrain/Step Time": 8.422032482922077} +{"Pretrain/Learning Rate": 2.6107565815759473e-05, "Pretrain/Loss": 2.0484609603881836, "Pretrain/Loss (Raw)": 2.1271774768829346, "Pretrain/Step": 4781, "Pretrain/Step Time": 8.423620769754052} +{"Pretrain/Learning Rate": 2.6099084214654034e-05, "Pretrain/Loss": 2.0461535453796387, "Pretrain/Loss (Raw)": 2.066915512084961, "Pretrain/Step": 4782, "Pretrain/Step Time": 8.432119132950902} +{"Pretrain/Learning Rate": 2.6090602486797017e-05, "Pretrain/Loss": 2.045506000518799, "Pretrain/Loss (Raw)": 1.9985644817352295, "Pretrain/Step": 4783, "Pretrain/Step Time": 8.428984249010682} +{"Pretrain/Learning Rate": 2.608212063316659e-05, "Pretrain/Loss": 2.0471110343933105, "Pretrain/Loss (Raw)": 1.996193766593933, "Pretrain/Step": 4784, "Pretrain/Step Time": 8.429027171805501} +{"Pretrain/Learning Rate": 2.6073638654740908e-05, "Pretrain/Loss": 2.049041271209717, "Pretrain/Loss (Raw)": 2.2826826572418213, "Pretrain/Step": 4785, "Pretrain/Step Time": 8.431682009249926} +{"Pretrain/Learning Rate": 2.606515655249816e-05, "Pretrain/Loss": 2.046638250350952, "Pretrain/Loss (Raw)": 1.8081215620040894, "Pretrain/Step": 4786, "Pretrain/Step Time": 8.442443875595927} +{"Pretrain/Learning Rate": 2.6056674327416537e-05, "Pretrain/Loss": 2.046823501586914, "Pretrain/Loss (Raw)": 1.9956414699554443, "Pretrain/Step": 4787, "Pretrain/Step Time": 8.442042049020529} +{"Pretrain/Learning Rate": 2.604819198047425e-05, "Pretrain/Loss": 2.047426700592041, "Pretrain/Loss (Raw)": 1.9304447174072266, "Pretrain/Step": 4788, "Pretrain/Step Time": 8.442693358287215} +{"Pretrain/Learning Rate": 2.6039709512649522e-05, "Pretrain/Loss": 2.0482287406921387, "Pretrain/Loss (Raw)": 2.091614007949829, "Pretrain/Step": 4789, "Pretrain/Step Time": 8.43126573972404} +{"Pretrain/Learning Rate": 2.60312269249206e-05, "Pretrain/Loss": 2.047074317932129, "Pretrain/Loss (Raw)": 2.0002646446228027, "Pretrain/Step": 4790, "Pretrain/Step Time": 8.430137518793344} +{"Pretrain/Learning Rate": 2.602274421826573e-05, "Pretrain/Loss": 2.0465240478515625, "Pretrain/Loss (Raw)": 2.065819025039673, "Pretrain/Step": 4791, "Pretrain/Step Time": 8.433773266151547} +{"Pretrain/Learning Rate": 2.6014261393663176e-05, "Pretrain/Loss": 2.0466175079345703, "Pretrain/Loss (Raw)": 2.105659008026123, "Pretrain/Step": 4792, "Pretrain/Step Time": 8.438333416357636} +{"Pretrain/Learning Rate": 2.600577845209122e-05, "Pretrain/Loss": 2.046586275100708, "Pretrain/Loss (Raw)": 2.061105728149414, "Pretrain/Step": 4793, "Pretrain/Step Time": 8.44155127927661} +{"Pretrain/Learning Rate": 2.599729539452815e-05, "Pretrain/Loss": 2.047140121459961, "Pretrain/Loss (Raw)": 2.0076370239257812, "Pretrain/Step": 4794, "Pretrain/Step Time": 8.443160530179739} +{"Pretrain/Learning Rate": 2.598881222195228e-05, "Pretrain/Loss": 2.046861171722412, "Pretrain/Loss (Raw)": 1.9788156747817993, "Pretrain/Step": 4795, "Pretrain/Step Time": 8.438342401757836} +{"Pretrain/Learning Rate": 2.5980328935341918e-05, "Pretrain/Loss": 2.0453553199768066, "Pretrain/Loss (Raw)": 2.1532700061798096, "Pretrain/Step": 4796, "Pretrain/Step Time": 8.438184883445501} +{"Pretrain/Learning Rate": 2.597184553567541e-05, "Pretrain/Loss": 2.046420097351074, "Pretrain/Loss (Raw)": 2.127049684524536, "Pretrain/Step": 4797, "Pretrain/Step Time": 8.44670532271266} +{"Pretrain/Learning Rate": 2.5963362023931092e-05, "Pretrain/Loss": 2.043109655380249, "Pretrain/Loss (Raw)": 1.66428804397583, "Pretrain/Step": 4798, "Pretrain/Step Time": 8.44037189334631} +{"Pretrain/Learning Rate": 2.595487840108733e-05, "Pretrain/Loss": 2.0427515506744385, "Pretrain/Loss (Raw)": 1.8785138130187988, "Pretrain/Step": 4799, "Pretrain/Step Time": 8.44076256453991} +{"Pretrain/Learning Rate": 2.5946394668122485e-05, "Pretrain/Loss": 2.043529748916626, "Pretrain/Loss (Raw)": 2.1972362995147705, "Pretrain/Step": 4800, "Pretrain/Step Time": 8.437850758433342} +{"Pretrain/Learning Rate": 2.5937910826014955e-05, "Pretrain/Loss": 2.0444016456604004, "Pretrain/Loss (Raw)": 2.433544635772705, "Pretrain/Step": 4801, "Pretrain/Step Time": 8.43775419332087} +{"Pretrain/Learning Rate": 2.5929426875743123e-05, "Pretrain/Loss": 2.046182155609131, "Pretrain/Loss (Raw)": 2.1762945652008057, "Pretrain/Step": 4802, "Pretrain/Step Time": 8.434353828430176} +{"Pretrain/Learning Rate": 2.592094281828541e-05, "Pretrain/Loss": 2.046760082244873, "Pretrain/Loss (Raw)": 2.067298412322998, "Pretrain/Step": 4803, "Pretrain/Step Time": 8.437642706558108} +{"Pretrain/Learning Rate": 2.5912458654620226e-05, "Pretrain/Loss": 2.0433602333068848, "Pretrain/Loss (Raw)": 1.7606514692306519, "Pretrain/Step": 4804, "Pretrain/Step Time": 8.441859602928162} +{"Pretrain/Learning Rate": 2.5903974385726014e-05, "Pretrain/Loss": 2.044236660003662, "Pretrain/Loss (Raw)": 2.2317233085632324, "Pretrain/Step": 4805, "Pretrain/Step Time": 8.442729661241174} +{"Pretrain/Learning Rate": 2.589549001258121e-05, "Pretrain/Loss": 2.0452566146850586, "Pretrain/Loss (Raw)": 2.2763123512268066, "Pretrain/Step": 4806, "Pretrain/Step Time": 8.437356704846025} +{"Pretrain/Learning Rate": 2.5887005536164288e-05, "Pretrain/Loss": 2.0430045127868652, "Pretrain/Loss (Raw)": 1.9689399003982544, "Pretrain/Step": 4807, "Pretrain/Step Time": 8.434406902641058} +{"Pretrain/Learning Rate": 2.58785209574537e-05, "Pretrain/Loss": 2.0402255058288574, "Pretrain/Loss (Raw)": 1.7629390954971313, "Pretrain/Step": 4808, "Pretrain/Step Time": 8.428990541025996} +{"Pretrain/Learning Rate": 2.587003627742794e-05, "Pretrain/Loss": 2.0390424728393555, "Pretrain/Loss (Raw)": 1.934773564338684, "Pretrain/Step": 4809, "Pretrain/Step Time": 8.435515746474266} +{"Pretrain/Learning Rate": 2.5861551497065496e-05, "Pretrain/Loss": 2.039194107055664, "Pretrain/Loss (Raw)": 2.0670106410980225, "Pretrain/Step": 4810, "Pretrain/Step Time": 8.436559857800603} +{"Pretrain/Learning Rate": 2.5853066617344868e-05, "Pretrain/Loss": 2.0400893688201904, "Pretrain/Loss (Raw)": 1.8954670429229736, "Pretrain/Step": 4811, "Pretrain/Step Time": 8.433847095817327} +{"Pretrain/Learning Rate": 2.5844581639244586e-05, "Pretrain/Loss": 2.0424017906188965, "Pretrain/Loss (Raw)": 1.9985541105270386, "Pretrain/Step": 4812, "Pretrain/Step Time": 8.431043699383736} +{"Pretrain/Learning Rate": 2.583609656374316e-05, "Pretrain/Loss": 2.041748523712158, "Pretrain/Loss (Raw)": 1.9812145233154297, "Pretrain/Step": 4813, "Pretrain/Step Time": 8.433545282110572} +{"Pretrain/Learning Rate": 2.5827611391819152e-05, "Pretrain/Loss": 2.041755199432373, "Pretrain/Loss (Raw)": 1.9222850799560547, "Pretrain/Step": 4814, "Pretrain/Step Time": 8.440032618120313} +{"Pretrain/Learning Rate": 2.581912612445108e-05, "Pretrain/Loss": 2.041816234588623, "Pretrain/Loss (Raw)": 2.1819825172424316, "Pretrain/Step": 4815, "Pretrain/Step Time": 8.440851848572493} +{"Pretrain/Learning Rate": 2.5810640762617538e-05, "Pretrain/Loss": 2.042332172393799, "Pretrain/Loss (Raw)": 2.098086357116699, "Pretrain/Step": 4816, "Pretrain/Step Time": 8.436805410310626} +{"Pretrain/Learning Rate": 2.5802155307297077e-05, "Pretrain/Loss": 2.0360960960388184, "Pretrain/Loss (Raw)": 2.120337724685669, "Pretrain/Step": 4817, "Pretrain/Step Time": 8.434672387316823} +{"Pretrain/Learning Rate": 2.5793669759468292e-05, "Pretrain/Loss": 2.0361602306365967, "Pretrain/Loss (Raw)": 2.122227430343628, "Pretrain/Step": 4818, "Pretrain/Step Time": 8.429198795929551} +{"Pretrain/Learning Rate": 2.578518412010976e-05, "Pretrain/Loss": 2.0366313457489014, "Pretrain/Loss (Raw)": 1.996891736984253, "Pretrain/Step": 4819, "Pretrain/Step Time": 8.432187287136912} +{"Pretrain/Learning Rate": 2.577669839020011e-05, "Pretrain/Loss": 2.036926507949829, "Pretrain/Loss (Raw)": 1.9656646251678467, "Pretrain/Step": 4820, "Pretrain/Step Time": 8.43638290464878} +{"Pretrain/Learning Rate": 2.576821257071793e-05, "Pretrain/Loss": 2.03585147857666, "Pretrain/Loss (Raw)": 2.0613791942596436, "Pretrain/Step": 4821, "Pretrain/Step Time": 8.432484297081828} +{"Pretrain/Learning Rate": 2.5759726662641865e-05, "Pretrain/Loss": 2.035233974456787, "Pretrain/Loss (Raw)": 2.1644299030303955, "Pretrain/Step": 4822, "Pretrain/Step Time": 8.438594475388527} +{"Pretrain/Learning Rate": 2.5751240666950532e-05, "Pretrain/Loss": 2.0353078842163086, "Pretrain/Loss (Raw)": 2.004927396774292, "Pretrain/Step": 4823, "Pretrain/Step Time": 8.434939119964838} +{"Pretrain/Learning Rate": 2.5742754584622592e-05, "Pretrain/Loss": 2.035878896713257, "Pretrain/Loss (Raw)": 2.144033908843994, "Pretrain/Step": 4824, "Pretrain/Step Time": 8.431737337261438} +{"Pretrain/Learning Rate": 2.5734268416636697e-05, "Pretrain/Loss": 2.035846710205078, "Pretrain/Loss (Raw)": 1.9897284507751465, "Pretrain/Step": 4825, "Pretrain/Step Time": 8.430928204208612} +{"Pretrain/Learning Rate": 2.5725782163971495e-05, "Pretrain/Loss": 2.0341620445251465, "Pretrain/Loss (Raw)": 1.949101448059082, "Pretrain/Step": 4826, "Pretrain/Step Time": 8.436991831287742} +{"Pretrain/Learning Rate": 2.5717295827605686e-05, "Pretrain/Loss": 2.0318498611450195, "Pretrain/Loss (Raw)": 1.7688117027282715, "Pretrain/Step": 4827, "Pretrain/Step Time": 8.427672056481242} +{"Pretrain/Learning Rate": 2.5708809408517937e-05, "Pretrain/Loss": 2.028872013092041, "Pretrain/Loss (Raw)": 1.9508235454559326, "Pretrain/Step": 4828, "Pretrain/Step Time": 8.42899619974196} +{"Pretrain/Learning Rate": 2.5700322907686946e-05, "Pretrain/Loss": 2.0275158882141113, "Pretrain/Loss (Raw)": 1.9561492204666138, "Pretrain/Step": 4829, "Pretrain/Step Time": 8.425024876371026} +{"Pretrain/Learning Rate": 2.5691836326091414e-05, "Pretrain/Loss": 2.0267763137817383, "Pretrain/Loss (Raw)": 1.8551080226898193, "Pretrain/Step": 4830, "Pretrain/Step Time": 8.42601066455245} +{"Pretrain/Learning Rate": 2.5683349664710067e-05, "Pretrain/Loss": 2.0253171920776367, "Pretrain/Loss (Raw)": 2.1202902793884277, "Pretrain/Step": 4831, "Pretrain/Step Time": 8.426417978480458} +{"Pretrain/Learning Rate": 2.5674862924521605e-05, "Pretrain/Loss": 2.0230872631073, "Pretrain/Loss (Raw)": 1.8946750164031982, "Pretrain/Step": 4832, "Pretrain/Step Time": 8.43269962631166} +{"Pretrain/Learning Rate": 2.566637610650478e-05, "Pretrain/Loss": 2.0179171562194824, "Pretrain/Loss (Raw)": 1.7209433317184448, "Pretrain/Step": 4833, "Pretrain/Step Time": 8.438642024993896} +{"Pretrain/Learning Rate": 2.565788921163832e-05, "Pretrain/Loss": 2.01766300201416, "Pretrain/Loss (Raw)": 1.9845492839813232, "Pretrain/Step": 4834, "Pretrain/Step Time": 8.431496316567063} +{"Pretrain/Learning Rate": 2.5649402240900972e-05, "Pretrain/Loss": 2.0186853408813477, "Pretrain/Loss (Raw)": 2.107238292694092, "Pretrain/Step": 4835, "Pretrain/Step Time": 8.423704523593187} +{"Pretrain/Learning Rate": 2.5640915195271504e-05, "Pretrain/Loss": 2.018104076385498, "Pretrain/Loss (Raw)": 1.838289499282837, "Pretrain/Step": 4836, "Pretrain/Step Time": 8.422356644645333} +{"Pretrain/Learning Rate": 2.563242807572867e-05, "Pretrain/Loss": 2.0173861980438232, "Pretrain/Loss (Raw)": 2.003679037094116, "Pretrain/Step": 4837, "Pretrain/Step Time": 8.429780004546046} +{"Pretrain/Learning Rate": 2.5623940883251256e-05, "Pretrain/Loss": 2.017066478729248, "Pretrain/Loss (Raw)": 2.073955535888672, "Pretrain/Step": 4838, "Pretrain/Step Time": 8.43289273045957} +{"Pretrain/Learning Rate": 2.561545361881803e-05, "Pretrain/Loss": 2.0164952278137207, "Pretrain/Loss (Raw)": 2.0198028087615967, "Pretrain/Step": 4839, "Pretrain/Step Time": 8.435863869264722} +{"Pretrain/Learning Rate": 2.5606966283407803e-05, "Pretrain/Loss": 2.018608570098877, "Pretrain/Loss (Raw)": 2.113701105117798, "Pretrain/Step": 4840, "Pretrain/Step Time": 8.434616414830089} +{"Pretrain/Learning Rate": 2.5598478877999356e-05, "Pretrain/Loss": 2.0196337699890137, "Pretrain/Loss (Raw)": 2.0834081172943115, "Pretrain/Step": 4841, "Pretrain/Step Time": 8.428821232169867} +{"Pretrain/Learning Rate": 2.558999140357151e-05, "Pretrain/Loss": 2.018362522125244, "Pretrain/Loss (Raw)": 2.0044751167297363, "Pretrain/Step": 4842, "Pretrain/Step Time": 8.429436903446913} +{"Pretrain/Learning Rate": 2.5581503861103073e-05, "Pretrain/Loss": 2.019439697265625, "Pretrain/Loss (Raw)": 2.098646640777588, "Pretrain/Step": 4843, "Pretrain/Step Time": 8.441531984135509} +{"Pretrain/Learning Rate": 2.5573016251572872e-05, "Pretrain/Loss": 2.0211124420166016, "Pretrain/Loss (Raw)": 2.294381618499756, "Pretrain/Step": 4844, "Pretrain/Step Time": 8.443979414179921} +{"Pretrain/Learning Rate": 2.5564528575959733e-05, "Pretrain/Loss": 2.0206236839294434, "Pretrain/Loss (Raw)": 1.965216040611267, "Pretrain/Step": 4845, "Pretrain/Step Time": 8.438322661444545} +{"Pretrain/Learning Rate": 2.55560408352425e-05, "Pretrain/Loss": 2.0208983421325684, "Pretrain/Loss (Raw)": 2.0916855335235596, "Pretrain/Step": 4846, "Pretrain/Step Time": 8.436118546873331} +{"Pretrain/Learning Rate": 2.5547553030400016e-05, "Pretrain/Loss": 2.0247929096221924, "Pretrain/Loss (Raw)": 2.48590350151062, "Pretrain/Step": 4847, "Pretrain/Step Time": 8.427866706624627} +{"Pretrain/Learning Rate": 2.5539065162411143e-05, "Pretrain/Loss": 2.0215983390808105, "Pretrain/Loss (Raw)": 2.0343265533447266, "Pretrain/Step": 4848, "Pretrain/Step Time": 8.431068778038025} +{"Pretrain/Learning Rate": 2.5530577232254733e-05, "Pretrain/Loss": 2.021411418914795, "Pretrain/Loss (Raw)": 2.0337796211242676, "Pretrain/Step": 4849, "Pretrain/Step Time": 8.43141001649201} +{"Pretrain/Learning Rate": 2.5522089240909652e-05, "Pretrain/Loss": 2.019918918609619, "Pretrain/Loss (Raw)": 1.627415418624878, "Pretrain/Step": 4850, "Pretrain/Step Time": 8.4321412704885} +{"Pretrain/Learning Rate": 2.5513601189354786e-05, "Pretrain/Loss": 2.019746780395508, "Pretrain/Loss (Raw)": 1.9868963956832886, "Pretrain/Step": 4851, "Pretrain/Step Time": 8.434771263971925} +{"Pretrain/Learning Rate": 2.5505113078569004e-05, "Pretrain/Loss": 2.0218052864074707, "Pretrain/Loss (Raw)": 1.9392865896224976, "Pretrain/Step": 4852, "Pretrain/Step Time": 8.430196607485414} +{"Pretrain/Learning Rate": 2.5496624909531207e-05, "Pretrain/Loss": 2.0246570110321045, "Pretrain/Loss (Raw)": 2.326125383377075, "Pretrain/Step": 4853, "Pretrain/Step Time": 8.429921377450228} +{"Pretrain/Learning Rate": 2.548813668322028e-05, "Pretrain/Loss": 2.02510929107666, "Pretrain/Loss (Raw)": 1.8984944820404053, "Pretrain/Step": 4854, "Pretrain/Step Time": 8.434792345389724} +{"Pretrain/Learning Rate": 2.5479648400615136e-05, "Pretrain/Loss": 2.0254602432250977, "Pretrain/Loss (Raw)": 2.0645945072174072, "Pretrain/Step": 4855, "Pretrain/Step Time": 8.429279709234834} +{"Pretrain/Learning Rate": 2.547116006269467e-05, "Pretrain/Loss": 2.027589797973633, "Pretrain/Loss (Raw)": 2.199648141860962, "Pretrain/Step": 4856, "Pretrain/Step Time": 8.433303812518716} +{"Pretrain/Learning Rate": 2.5462671670437816e-05, "Pretrain/Loss": 2.027634859085083, "Pretrain/Loss (Raw)": 1.940748691558838, "Pretrain/Step": 4857, "Pretrain/Step Time": 8.427580380812287} +{"Pretrain/Learning Rate": 2.545418322482348e-05, "Pretrain/Loss": 2.026986837387085, "Pretrain/Loss (Raw)": 2.0692338943481445, "Pretrain/Step": 4858, "Pretrain/Step Time": 8.420744627714157} +{"Pretrain/Learning Rate": 2.5445694726830593e-05, "Pretrain/Loss": 2.026292562484741, "Pretrain/Loss (Raw)": 1.976473331451416, "Pretrain/Step": 4859, "Pretrain/Step Time": 8.42029906064272} +{"Pretrain/Learning Rate": 2.543720617743809e-05, "Pretrain/Loss": 2.0274500846862793, "Pretrain/Loss (Raw)": 2.095093250274658, "Pretrain/Step": 4860, "Pretrain/Step Time": 8.42615893855691} +{"Pretrain/Learning Rate": 2.5428717577624915e-05, "Pretrain/Loss": 2.0286030769348145, "Pretrain/Loss (Raw)": 2.083832263946533, "Pretrain/Step": 4861, "Pretrain/Step Time": 8.423954403027892} +{"Pretrain/Learning Rate": 2.5420228928370005e-05, "Pretrain/Loss": 2.029254913330078, "Pretrain/Loss (Raw)": 2.009432792663574, "Pretrain/Step": 4862, "Pretrain/Step Time": 8.424194039776921} +{"Pretrain/Learning Rate": 2.5411740230652315e-05, "Pretrain/Loss": 2.0297060012817383, "Pretrain/Loss (Raw)": 2.0312154293060303, "Pretrain/Step": 4863, "Pretrain/Step Time": 8.417948516085744} +{"Pretrain/Learning Rate": 2.5403251485450795e-05, "Pretrain/Loss": 2.0313894748687744, "Pretrain/Loss (Raw)": 2.068916082382202, "Pretrain/Step": 4864, "Pretrain/Step Time": 8.413758650422096} +{"Pretrain/Learning Rate": 2.5394762693744428e-05, "Pretrain/Loss": 2.032019853591919, "Pretrain/Loss (Raw)": 2.1863510608673096, "Pretrain/Step": 4865, "Pretrain/Step Time": 8.415632463991642} +{"Pretrain/Learning Rate": 2.538627385651216e-05, "Pretrain/Loss": 2.0331287384033203, "Pretrain/Loss (Raw)": 2.1169753074645996, "Pretrain/Step": 4866, "Pretrain/Step Time": 8.426110301166773} +{"Pretrain/Learning Rate": 2.5377784974732965e-05, "Pretrain/Loss": 2.0341596603393555, "Pretrain/Loss (Raw)": 2.114595651626587, "Pretrain/Step": 4867, "Pretrain/Step Time": 8.422298500314355} +{"Pretrain/Learning Rate": 2.536929604938584e-05, "Pretrain/Loss": 2.035943031311035, "Pretrain/Loss (Raw)": 2.301755905151367, "Pretrain/Step": 4868, "Pretrain/Step Time": 8.424862947314978} +{"Pretrain/Learning Rate": 2.5360807081449738e-05, "Pretrain/Loss": 2.0371429920196533, "Pretrain/Loss (Raw)": 2.03536319732666, "Pretrain/Step": 4869, "Pretrain/Step Time": 8.41821532137692} +{"Pretrain/Learning Rate": 2.5352318071903675e-05, "Pretrain/Loss": 2.038163661956787, "Pretrain/Loss (Raw)": 2.147197723388672, "Pretrain/Step": 4870, "Pretrain/Step Time": 8.423891412094235} +{"Pretrain/Learning Rate": 2.5343829021726618e-05, "Pretrain/Loss": 2.041081190109253, "Pretrain/Loss (Raw)": 2.3983466625213623, "Pretrain/Step": 4871, "Pretrain/Step Time": 8.433392057195306} +{"Pretrain/Learning Rate": 2.533533993189759e-05, "Pretrain/Loss": 2.038780689239502, "Pretrain/Loss (Raw)": 1.805892825126648, "Pretrain/Step": 4872, "Pretrain/Step Time": 8.43256682343781} +{"Pretrain/Learning Rate": 2.5326850803395575e-05, "Pretrain/Loss": 2.0382814407348633, "Pretrain/Loss (Raw)": 1.8419054746627808, "Pretrain/Step": 4873, "Pretrain/Step Time": 8.435679417103529} +{"Pretrain/Learning Rate": 2.5318361637199594e-05, "Pretrain/Loss": 2.038836717605591, "Pretrain/Loss (Raw)": 2.0711851119995117, "Pretrain/Step": 4874, "Pretrain/Step Time": 8.42977887392044} +{"Pretrain/Learning Rate": 2.5309872434288645e-05, "Pretrain/Loss": 2.0418972969055176, "Pretrain/Loss (Raw)": 2.187814474105835, "Pretrain/Step": 4875, "Pretrain/Step Time": 8.42737728357315} +{"Pretrain/Learning Rate": 2.5301383195641742e-05, "Pretrain/Loss": 2.0413804054260254, "Pretrain/Loss (Raw)": 1.9621249437332153, "Pretrain/Step": 4876, "Pretrain/Step Time": 8.422562019899487} +{"Pretrain/Learning Rate": 2.5292893922237913e-05, "Pretrain/Loss": 2.0411059856414795, "Pretrain/Loss (Raw)": 2.069148063659668, "Pretrain/Step": 4877, "Pretrain/Step Time": 8.430426379665732} +{"Pretrain/Learning Rate": 2.5284404615056172e-05, "Pretrain/Loss": 2.0395030975341797, "Pretrain/Loss (Raw)": 1.8271327018737793, "Pretrain/Step": 4878, "Pretrain/Step Time": 8.43296778947115} +{"Pretrain/Learning Rate": 2.5275915275075556e-05, "Pretrain/Loss": 2.0379726886749268, "Pretrain/Loss (Raw)": 1.9285728931427002, "Pretrain/Step": 4879, "Pretrain/Step Time": 8.431126216426492} +{"Pretrain/Learning Rate": 2.5267425903275088e-05, "Pretrain/Loss": 2.0359385013580322, "Pretrain/Loss (Raw)": 1.7696276903152466, "Pretrain/Step": 4880, "Pretrain/Step Time": 8.428056752309203} +{"Pretrain/Learning Rate": 2.5258936500633807e-05, "Pretrain/Loss": 2.036379814147949, "Pretrain/Loss (Raw)": 2.1564154624938965, "Pretrain/Step": 4881, "Pretrain/Step Time": 8.42251730710268} +{"Pretrain/Learning Rate": 2.5250447068130746e-05, "Pretrain/Loss": 2.0360865592956543, "Pretrain/Loss (Raw)": 2.078097105026245, "Pretrain/Step": 4882, "Pretrain/Step Time": 8.426850447431207} +{"Pretrain/Learning Rate": 2.5241957606744952e-05, "Pretrain/Loss": 2.0361411571502686, "Pretrain/Loss (Raw)": 2.0505127906799316, "Pretrain/Step": 4883, "Pretrain/Step Time": 8.430143995210528} +{"Pretrain/Learning Rate": 2.523346811745546e-05, "Pretrain/Loss": 2.037801742553711, "Pretrain/Loss (Raw)": 2.2149248123168945, "Pretrain/Step": 4884, "Pretrain/Step Time": 8.431490322574973} +{"Pretrain/Learning Rate": 2.5224978601241333e-05, "Pretrain/Loss": 2.03904390335083, "Pretrain/Loss (Raw)": 2.0622153282165527, "Pretrain/Step": 4885, "Pretrain/Step Time": 8.427017346024513} +{"Pretrain/Learning Rate": 2.5216489059081607e-05, "Pretrain/Loss": 2.0339765548706055, "Pretrain/Loss (Raw)": 1.8331745862960815, "Pretrain/Step": 4886, "Pretrain/Step Time": 8.42527942173183} +{"Pretrain/Learning Rate": 2.5207999491955347e-05, "Pretrain/Loss": 2.0347840785980225, "Pretrain/Loss (Raw)": 2.103677749633789, "Pretrain/Step": 4887, "Pretrain/Step Time": 8.417101707309484} +{"Pretrain/Learning Rate": 2.51995099008416e-05, "Pretrain/Loss": 2.033163070678711, "Pretrain/Loss (Raw)": 2.1438963413238525, "Pretrain/Step": 4888, "Pretrain/Step Time": 8.429173551499844} +{"Pretrain/Learning Rate": 2.519102028671944e-05, "Pretrain/Loss": 2.0309512615203857, "Pretrain/Loss (Raw)": 1.8654698133468628, "Pretrain/Step": 4889, "Pretrain/Step Time": 8.427100397646427} +{"Pretrain/Learning Rate": 2.518253065056791e-05, "Pretrain/Loss": 2.029878854751587, "Pretrain/Loss (Raw)": 1.973730206489563, "Pretrain/Step": 4890, "Pretrain/Step Time": 8.428110208362341} +{"Pretrain/Learning Rate": 2.5174040993366094e-05, "Pretrain/Loss": 2.0301060676574707, "Pretrain/Loss (Raw)": 2.0209312438964844, "Pretrain/Step": 4891, "Pretrain/Step Time": 8.424432748928666} +{"Pretrain/Learning Rate": 2.516555131609305e-05, "Pretrain/Loss": 2.0289039611816406, "Pretrain/Loss (Raw)": 1.9890788793563843, "Pretrain/Step": 4892, "Pretrain/Step Time": 8.424686575308442} +{"Pretrain/Learning Rate": 2.5157061619727844e-05, "Pretrain/Loss": 2.025198459625244, "Pretrain/Loss (Raw)": 1.7549264430999756, "Pretrain/Step": 4893, "Pretrain/Step Time": 8.427364191040397} +{"Pretrain/Learning Rate": 2.514857190524955e-05, "Pretrain/Loss": 2.0247344970703125, "Pretrain/Loss (Raw)": 1.670271873474121, "Pretrain/Step": 4894, "Pretrain/Step Time": 8.428969303146005} +{"Pretrain/Learning Rate": 2.514008217363725e-05, "Pretrain/Loss": 2.0249056816101074, "Pretrain/Loss (Raw)": 2.017251968383789, "Pretrain/Step": 4895, "Pretrain/Step Time": 8.42913880199194} +{"Pretrain/Learning Rate": 2.513159242587001e-05, "Pretrain/Loss": 2.022345542907715, "Pretrain/Loss (Raw)": 1.7647621631622314, "Pretrain/Step": 4896, "Pretrain/Step Time": 8.432657267898321} +{"Pretrain/Learning Rate": 2.5123102662926913e-05, "Pretrain/Loss": 2.02292537689209, "Pretrain/Loss (Raw)": 2.1934332847595215, "Pretrain/Step": 4897, "Pretrain/Step Time": 8.425689926370978} +{"Pretrain/Learning Rate": 2.5114612885787037e-05, "Pretrain/Loss": 2.021833896636963, "Pretrain/Loss (Raw)": 1.9703649282455444, "Pretrain/Step": 4898, "Pretrain/Step Time": 8.426562564447522} +{"Pretrain/Learning Rate": 2.5106123095429456e-05, "Pretrain/Loss": 2.023833990097046, "Pretrain/Loss (Raw)": 2.219949245452881, "Pretrain/Step": 4899, "Pretrain/Step Time": 8.430565435439348} +{"Pretrain/Learning Rate": 2.5097633292833268e-05, "Pretrain/Loss": 2.0236339569091797, "Pretrain/Loss (Raw)": 2.156458854675293, "Pretrain/Step": 4900, "Pretrain/Step Time": 8.432613572105765} +{"Pretrain/Learning Rate": 2.5089143478977546e-05, "Pretrain/Loss": 2.026529312133789, "Pretrain/Loss (Raw)": 1.8895630836486816, "Pretrain/Step": 4901, "Pretrain/Step Time": 8.430657429620624} +{"Pretrain/Learning Rate": 2.5080653654841378e-05, "Pretrain/Loss": 2.026020050048828, "Pretrain/Loss (Raw)": 1.8916672468185425, "Pretrain/Step": 4902, "Pretrain/Step Time": 8.423769515007734} +{"Pretrain/Learning Rate": 2.507216382140385e-05, "Pretrain/Loss": 2.0257701873779297, "Pretrain/Loss (Raw)": 2.018934965133667, "Pretrain/Step": 4903, "Pretrain/Step Time": 8.418917573988438} +{"Pretrain/Learning Rate": 2.5063673979644054e-05, "Pretrain/Loss": 2.0263330936431885, "Pretrain/Loss (Raw)": 2.008089542388916, "Pretrain/Step": 4904, "Pretrain/Step Time": 8.421482644975185} +{"Pretrain/Learning Rate": 2.5055184130541065e-05, "Pretrain/Loss": 2.0243377685546875, "Pretrain/Loss (Raw)": 1.7255064249038696, "Pretrain/Step": 4905, "Pretrain/Step Time": 8.434249555692077} +{"Pretrain/Learning Rate": 2.504669427507399e-05, "Pretrain/Loss": 2.0262527465820312, "Pretrain/Loss (Raw)": 2.367274284362793, "Pretrain/Step": 4906, "Pretrain/Step Time": 8.430729307234287} +{"Pretrain/Learning Rate": 2.503820441422191e-05, "Pretrain/Loss": 2.029174327850342, "Pretrain/Loss (Raw)": 2.2216408252716064, "Pretrain/Step": 4907, "Pretrain/Step Time": 8.44027964770794} +{"Pretrain/Learning Rate": 2.5029714548963917e-05, "Pretrain/Loss": 2.028238296508789, "Pretrain/Loss (Raw)": 1.8582353591918945, "Pretrain/Step": 4908, "Pretrain/Step Time": 8.435921331867576} +{"Pretrain/Learning Rate": 2.5021224680279105e-05, "Pretrain/Loss": 2.0265560150146484, "Pretrain/Loss (Raw)": 1.9118608236312866, "Pretrain/Step": 4909, "Pretrain/Step Time": 8.434275962412357} +{"Pretrain/Learning Rate": 2.5012734809146554e-05, "Pretrain/Loss": 2.0257301330566406, "Pretrain/Loss (Raw)": 1.9611760377883911, "Pretrain/Step": 4910, "Pretrain/Step Time": 8.431928781792521} +{"Pretrain/Learning Rate": 2.5004244936545374e-05, "Pretrain/Loss": 2.0259695053100586, "Pretrain/Loss (Raw)": 2.0292065143585205, "Pretrain/Step": 4911, "Pretrain/Step Time": 8.436090743169188} +{"Pretrain/Learning Rate": 2.499575506345464e-05, "Pretrain/Loss": 2.0258731842041016, "Pretrain/Loss (Raw)": 1.9838528633117676, "Pretrain/Step": 4912, "Pretrain/Step Time": 8.430723866447806} +{"Pretrain/Learning Rate": 2.498726519085345e-05, "Pretrain/Loss": 2.023375988006592, "Pretrain/Loss (Raw)": 1.9630683660507202, "Pretrain/Step": 4913, "Pretrain/Step Time": 8.43227120488882} +{"Pretrain/Learning Rate": 2.497877531972091e-05, "Pretrain/Loss": 2.02445650100708, "Pretrain/Loss (Raw)": 1.946408748626709, "Pretrain/Step": 4914, "Pretrain/Step Time": 8.422010397538543} +{"Pretrain/Learning Rate": 2.497028545103609e-05, "Pretrain/Loss": 2.0243046283721924, "Pretrain/Loss (Raw)": 1.9762204885482788, "Pretrain/Step": 4915, "Pretrain/Step Time": 8.42606377787888} +{"Pretrain/Learning Rate": 2.49617955857781e-05, "Pretrain/Loss": 2.0247082710266113, "Pretrain/Loss (Raw)": 1.9821102619171143, "Pretrain/Step": 4916, "Pretrain/Step Time": 8.42692719772458} +{"Pretrain/Learning Rate": 2.4953305724926017e-05, "Pretrain/Loss": 2.024181842803955, "Pretrain/Loss (Raw)": 2.024228572845459, "Pretrain/Step": 4917, "Pretrain/Step Time": 8.42824425548315} +{"Pretrain/Learning Rate": 2.494481586945894e-05, "Pretrain/Loss": 2.0245609283447266, "Pretrain/Loss (Raw)": 2.048807144165039, "Pretrain/Step": 4918, "Pretrain/Step Time": 8.438222039490938} +{"Pretrain/Learning Rate": 2.4936326020355955e-05, "Pretrain/Loss": 2.022522449493408, "Pretrain/Loss (Raw)": 1.8048501014709473, "Pretrain/Step": 4919, "Pretrain/Step Time": 8.435937188565731} +{"Pretrain/Learning Rate": 2.4927836178596156e-05, "Pretrain/Loss": 2.0211470127105713, "Pretrain/Loss (Raw)": 1.9296032190322876, "Pretrain/Step": 4920, "Pretrain/Step Time": 8.43112968467176} +{"Pretrain/Learning Rate": 2.4919346345158624e-05, "Pretrain/Loss": 2.02030348777771, "Pretrain/Loss (Raw)": 1.9531588554382324, "Pretrain/Step": 4921, "Pretrain/Step Time": 8.435193633660674} +{"Pretrain/Learning Rate": 2.491085652102246e-05, "Pretrain/Loss": 2.019667148590088, "Pretrain/Loss (Raw)": 1.9261749982833862, "Pretrain/Step": 4922, "Pretrain/Step Time": 8.441555241122842} +{"Pretrain/Learning Rate": 2.4902366707166734e-05, "Pretrain/Loss": 2.01650333404541, "Pretrain/Loss (Raw)": 1.573839545249939, "Pretrain/Step": 4923, "Pretrain/Step Time": 8.442046709358692} +{"Pretrain/Learning Rate": 2.4893876904570554e-05, "Pretrain/Loss": 2.016233444213867, "Pretrain/Loss (Raw)": 2.118744134902954, "Pretrain/Step": 4924, "Pretrain/Step Time": 8.439183842390776} +{"Pretrain/Learning Rate": 2.488538711421297e-05, "Pretrain/Loss": 2.0149893760681152, "Pretrain/Loss (Raw)": 1.967788815498352, "Pretrain/Step": 4925, "Pretrain/Step Time": 8.433752590790391} +{"Pretrain/Learning Rate": 2.4876897337073103e-05, "Pretrain/Loss": 2.0159454345703125, "Pretrain/Loss (Raw)": 1.7866967916488647, "Pretrain/Step": 4926, "Pretrain/Step Time": 8.433552399277687} +{"Pretrain/Learning Rate": 2.4868407574129994e-05, "Pretrain/Loss": 2.0178043842315674, "Pretrain/Loss (Raw)": 2.116438865661621, "Pretrain/Step": 4927, "Pretrain/Step Time": 8.44239342585206} +{"Pretrain/Learning Rate": 2.4859917826362764e-05, "Pretrain/Loss": 2.0169687271118164, "Pretrain/Loss (Raw)": 2.0902740955352783, "Pretrain/Step": 4928, "Pretrain/Step Time": 8.441949475556612} +{"Pretrain/Learning Rate": 2.485142809475045e-05, "Pretrain/Loss": 2.0121443271636963, "Pretrain/Loss (Raw)": 1.81602144241333, "Pretrain/Step": 4929, "Pretrain/Step Time": 8.440024195238948} +{"Pretrain/Learning Rate": 2.4842938380272168e-05, "Pretrain/Loss": 2.011972665786743, "Pretrain/Loss (Raw)": 2.1543266773223877, "Pretrain/Step": 4930, "Pretrain/Step Time": 8.442974023520947} +{"Pretrain/Learning Rate": 2.4834448683906957e-05, "Pretrain/Loss": 2.013009786605835, "Pretrain/Loss (Raw)": 2.2000467777252197, "Pretrain/Step": 4931, "Pretrain/Step Time": 8.440500931814313} +{"Pretrain/Learning Rate": 2.482595900663392e-05, "Pretrain/Loss": 2.01521635055542, "Pretrain/Loss (Raw)": 2.04310941696167, "Pretrain/Step": 4932, "Pretrain/Step Time": 8.44536098279059} +{"Pretrain/Learning Rate": 2.481746934943209e-05, "Pretrain/Loss": 2.0123817920684814, "Pretrain/Loss (Raw)": 1.8688832521438599, "Pretrain/Step": 4933, "Pretrain/Step Time": 8.457160456106067} +{"Pretrain/Learning Rate": 2.480897971328056e-05, "Pretrain/Loss": 2.010763168334961, "Pretrain/Loss (Raw)": 2.069126605987549, "Pretrain/Step": 4934, "Pretrain/Step Time": 8.458023315295577} +{"Pretrain/Learning Rate": 2.4800490099158403e-05, "Pretrain/Loss": 2.0111663341522217, "Pretrain/Loss (Raw)": 2.020538568496704, "Pretrain/Step": 4935, "Pretrain/Step Time": 8.456992130726576} +{"Pretrain/Learning Rate": 2.4792000508044652e-05, "Pretrain/Loss": 2.0121428966522217, "Pretrain/Loss (Raw)": 1.8879375457763672, "Pretrain/Step": 4936, "Pretrain/Step Time": 8.45350164361298} +{"Pretrain/Learning Rate": 2.4783510940918396e-05, "Pretrain/Loss": 2.0127289295196533, "Pretrain/Loss (Raw)": 2.0097901821136475, "Pretrain/Step": 4937, "Pretrain/Step Time": 8.451618487015367} +{"Pretrain/Learning Rate": 2.4775021398758666e-05, "Pretrain/Loss": 2.012040615081787, "Pretrain/Loss (Raw)": 1.9788870811462402, "Pretrain/Step": 4938, "Pretrain/Step Time": 8.461750101298094} +{"Pretrain/Learning Rate": 2.4766531882544545e-05, "Pretrain/Loss": 2.0116984844207764, "Pretrain/Loss (Raw)": 1.8516870737075806, "Pretrain/Step": 4939, "Pretrain/Step Time": 8.465807471424341} +{"Pretrain/Learning Rate": 2.475804239325505e-05, "Pretrain/Loss": 2.0110692977905273, "Pretrain/Loss (Raw)": 1.9180220365524292, "Pretrain/Step": 4940, "Pretrain/Step Time": 8.464466767385602} +{"Pretrain/Learning Rate": 2.474955293186926e-05, "Pretrain/Loss": 2.01057505607605, "Pretrain/Loss (Raw)": 1.9179511070251465, "Pretrain/Step": 4941, "Pretrain/Step Time": 8.462608180940151} +{"Pretrain/Learning Rate": 2.4741063499366195e-05, "Pretrain/Loss": 2.0114998817443848, "Pretrain/Loss (Raw)": 2.0406570434570312, "Pretrain/Step": 4942, "Pretrain/Step Time": 8.456173518672585} +{"Pretrain/Learning Rate": 2.4732574096724918e-05, "Pretrain/Loss": 2.009269952774048, "Pretrain/Loss (Raw)": 1.8965470790863037, "Pretrain/Step": 4943, "Pretrain/Step Time": 8.459438810124993} +{"Pretrain/Learning Rate": 2.4724084724924446e-05, "Pretrain/Loss": 2.0100760459899902, "Pretrain/Loss (Raw)": 2.2012784481048584, "Pretrain/Step": 4944, "Pretrain/Step Time": 8.473610425367951} +{"Pretrain/Learning Rate": 2.471559538494383e-05, "Pretrain/Loss": 2.0085644721984863, "Pretrain/Loss (Raw)": 1.9268373250961304, "Pretrain/Step": 4945, "Pretrain/Step Time": 8.479395743459463} +{"Pretrain/Learning Rate": 2.470710607776209e-05, "Pretrain/Loss": 2.0082411766052246, "Pretrain/Loss (Raw)": 2.080871343612671, "Pretrain/Step": 4946, "Pretrain/Step Time": 8.479287112131715} +{"Pretrain/Learning Rate": 2.4698616804358263e-05, "Pretrain/Loss": 2.0123608112335205, "Pretrain/Loss (Raw)": 2.5241971015930176, "Pretrain/Step": 4947, "Pretrain/Step Time": 8.476703466847539} +{"Pretrain/Learning Rate": 2.469012756571136e-05, "Pretrain/Loss": 2.0135250091552734, "Pretrain/Loss (Raw)": 2.114698886871338, "Pretrain/Step": 4948, "Pretrain/Step Time": 8.475187918171287} +{"Pretrain/Learning Rate": 2.4681638362800415e-05, "Pretrain/Loss": 2.0143282413482666, "Pretrain/Loss (Raw)": 2.1641685962677, "Pretrain/Step": 4949, "Pretrain/Step Time": 8.484556259587407} +{"Pretrain/Learning Rate": 2.4673149196604424e-05, "Pretrain/Loss": 2.0143566131591797, "Pretrain/Loss (Raw)": 2.168056011199951, "Pretrain/Step": 4950, "Pretrain/Step Time": 8.47991962917149} +{"Pretrain/Learning Rate": 2.4664660068102416e-05, "Pretrain/Loss": 2.013747453689575, "Pretrain/Loss (Raw)": 1.9269767999649048, "Pretrain/Step": 4951, "Pretrain/Step Time": 8.481875708326697} +{"Pretrain/Learning Rate": 2.465617097827338e-05, "Pretrain/Loss": 2.013336181640625, "Pretrain/Loss (Raw)": 2.091395139694214, "Pretrain/Step": 4952, "Pretrain/Step Time": 8.48055542819202} +{"Pretrain/Learning Rate": 2.4647681928096337e-05, "Pretrain/Loss": 2.013540267944336, "Pretrain/Loss (Raw)": 2.0158333778381348, "Pretrain/Step": 4953, "Pretrain/Step Time": 8.481485608965158} +{"Pretrain/Learning Rate": 2.4639192918550268e-05, "Pretrain/Loss": 2.0150883197784424, "Pretrain/Loss (Raw)": 2.14725661277771, "Pretrain/Step": 4954, "Pretrain/Step Time": 8.475965114310384} +{"Pretrain/Learning Rate": 2.4630703950614176e-05, "Pretrain/Loss": 2.0185351371765137, "Pretrain/Loss (Raw)": 2.2099862098693848, "Pretrain/Step": 4955, "Pretrain/Step Time": 8.484690198674798} +{"Pretrain/Learning Rate": 2.462221502526704e-05, "Pretrain/Loss": 2.0190389156341553, "Pretrain/Loss (Raw)": 2.0153417587280273, "Pretrain/Step": 4956, "Pretrain/Step Time": 8.484791051596403} +{"Pretrain/Learning Rate": 2.461372614348785e-05, "Pretrain/Loss": 2.0217795372009277, "Pretrain/Loss (Raw)": 2.3069398403167725, "Pretrain/Step": 4957, "Pretrain/Step Time": 8.48289218917489} +{"Pretrain/Learning Rate": 2.460523730625558e-05, "Pretrain/Loss": 2.023195266723633, "Pretrain/Loss (Raw)": 2.036320447921753, "Pretrain/Step": 4958, "Pretrain/Step Time": 8.480099631473422} +{"Pretrain/Learning Rate": 2.4596748514549208e-05, "Pretrain/Loss": 2.022144317626953, "Pretrain/Loss (Raw)": 1.9857516288757324, "Pretrain/Step": 4959, "Pretrain/Step Time": 8.479345068335533} +{"Pretrain/Learning Rate": 2.458825976934769e-05, "Pretrain/Loss": 2.023233413696289, "Pretrain/Loss (Raw)": 2.0341169834136963, "Pretrain/Step": 4960, "Pretrain/Step Time": 8.480395469814539} +{"Pretrain/Learning Rate": 2.4579771071630004e-05, "Pretrain/Loss": 2.023207664489746, "Pretrain/Loss (Raw)": 1.7176169157028198, "Pretrain/Step": 4961, "Pretrain/Step Time": 8.486343156546354} +{"Pretrain/Learning Rate": 2.457128242237509e-05, "Pretrain/Loss": 2.022803783416748, "Pretrain/Loss (Raw)": 1.9328515529632568, "Pretrain/Step": 4962, "Pretrain/Step Time": 8.489761743694544} +{"Pretrain/Learning Rate": 2.4562793822561914e-05, "Pretrain/Loss": 2.0203447341918945, "Pretrain/Loss (Raw)": 1.7924773693084717, "Pretrain/Step": 4963, "Pretrain/Step Time": 8.487946769222617} +{"Pretrain/Learning Rate": 2.455430527316941e-05, "Pretrain/Loss": 2.0218400955200195, "Pretrain/Loss (Raw)": 2.029719114303589, "Pretrain/Step": 4964, "Pretrain/Step Time": 8.489022409543395} +{"Pretrain/Learning Rate": 2.4545816775176532e-05, "Pretrain/Loss": 2.021770477294922, "Pretrain/Loss (Raw)": 1.9947338104248047, "Pretrain/Step": 4965, "Pretrain/Step Time": 8.481723261997104} +{"Pretrain/Learning Rate": 2.4537328329562186e-05, "Pretrain/Loss": 2.0219719409942627, "Pretrain/Loss (Raw)": 2.099752902984619, "Pretrain/Step": 4966, "Pretrain/Step Time": 8.487684965133667} +{"Pretrain/Learning Rate": 2.4528839937305336e-05, "Pretrain/Loss": 2.0235300064086914, "Pretrain/Loss (Raw)": 2.2192559242248535, "Pretrain/Step": 4967, "Pretrain/Step Time": 8.48678958043456} +{"Pretrain/Learning Rate": 2.452035159938487e-05, "Pretrain/Loss": 2.0231547355651855, "Pretrain/Loss (Raw)": 2.065650463104248, "Pretrain/Step": 4968, "Pretrain/Step Time": 8.487626548856497} +{"Pretrain/Learning Rate": 2.4511863316779728e-05, "Pretrain/Loss": 2.0226378440856934, "Pretrain/Loss (Raw)": 2.0172629356384277, "Pretrain/Step": 4969, "Pretrain/Step Time": 8.488329650834203} +{"Pretrain/Learning Rate": 2.4503375090468795e-05, "Pretrain/Loss": 2.0223217010498047, "Pretrain/Loss (Raw)": 1.9639995098114014, "Pretrain/Step": 4970, "Pretrain/Step Time": 8.487348092719913} +{"Pretrain/Learning Rate": 2.4494886921431005e-05, "Pretrain/Loss": 2.022024631500244, "Pretrain/Loss (Raw)": 2.0606393814086914, "Pretrain/Step": 4971, "Pretrain/Step Time": 8.488619565963745} +{"Pretrain/Learning Rate": 2.448639881064522e-05, "Pretrain/Loss": 2.0200304985046387, "Pretrain/Loss (Raw)": 2.039123296737671, "Pretrain/Step": 4972, "Pretrain/Step Time": 8.487500892952085} +{"Pretrain/Learning Rate": 2.4477910759090357e-05, "Pretrain/Loss": 2.024113178253174, "Pretrain/Loss (Raw)": 2.4877898693084717, "Pretrain/Step": 4973, "Pretrain/Step Time": 8.49553787149489} +{"Pretrain/Learning Rate": 2.446942276774527e-05, "Pretrain/Loss": 2.0220775604248047, "Pretrain/Loss (Raw)": 1.8311140537261963, "Pretrain/Step": 4974, "Pretrain/Step Time": 8.495728394016623} +{"Pretrain/Learning Rate": 2.4460934837588856e-05, "Pretrain/Loss": 2.017836809158325, "Pretrain/Loss (Raw)": 1.9430981874465942, "Pretrain/Step": 4975, "Pretrain/Step Time": 8.495845671743155} +{"Pretrain/Learning Rate": 2.4452446969599986e-05, "Pretrain/Loss": 2.018740653991699, "Pretrain/Loss (Raw)": 2.1500322818756104, "Pretrain/Step": 4976, "Pretrain/Step Time": 8.489638479426503} +{"Pretrain/Learning Rate": 2.44439591647575e-05, "Pretrain/Loss": 2.019110679626465, "Pretrain/Loss (Raw)": 2.0811421871185303, "Pretrain/Step": 4977, "Pretrain/Step Time": 8.491511920467019} +{"Pretrain/Learning Rate": 2.4435471424040273e-05, "Pretrain/Loss": 2.0223841667175293, "Pretrain/Loss (Raw)": 2.0464060306549072, "Pretrain/Step": 4978, "Pretrain/Step Time": 8.498368540778756} +{"Pretrain/Learning Rate": 2.442698374842713e-05, "Pretrain/Loss": 2.0217809677124023, "Pretrain/Loss (Raw)": 1.9096778631210327, "Pretrain/Step": 4979, "Pretrain/Step Time": 8.49725567549467} +{"Pretrain/Learning Rate": 2.4418496138896936e-05, "Pretrain/Loss": 2.021634101867676, "Pretrain/Loss (Raw)": 1.9204976558685303, "Pretrain/Step": 4980, "Pretrain/Step Time": 8.494979375973344} +{"Pretrain/Learning Rate": 2.4410008596428492e-05, "Pretrain/Loss": 2.0182712078094482, "Pretrain/Loss (Raw)": 1.8956646919250488, "Pretrain/Step": 4981, "Pretrain/Step Time": 8.501129038631916} +{"Pretrain/Learning Rate": 2.440152112200065e-05, "Pretrain/Loss": 2.019946336746216, "Pretrain/Loss (Raw)": 2.112905740737915, "Pretrain/Step": 4982, "Pretrain/Step Time": 8.496244549751282} +{"Pretrain/Learning Rate": 2.4393033716592196e-05, "Pretrain/Loss": 2.0197932720184326, "Pretrain/Loss (Raw)": 2.045034408569336, "Pretrain/Step": 4983, "Pretrain/Step Time": 8.505533777177334} +{"Pretrain/Learning Rate": 2.4384546381181976e-05, "Pretrain/Loss": 2.016955852508545, "Pretrain/Loss (Raw)": 1.8364498615264893, "Pretrain/Step": 4984, "Pretrain/Step Time": 8.506935054436326} +{"Pretrain/Learning Rate": 2.437605911674875e-05, "Pretrain/Loss": 2.0163846015930176, "Pretrain/Loss (Raw)": 1.8676146268844604, "Pretrain/Step": 4985, "Pretrain/Step Time": 8.509897973388433} +{"Pretrain/Learning Rate": 2.4367571924271335e-05, "Pretrain/Loss": 2.0156755447387695, "Pretrain/Loss (Raw)": 1.9784905910491943, "Pretrain/Step": 4986, "Pretrain/Step Time": 8.51440011151135} +{"Pretrain/Learning Rate": 2.43590848047285e-05, "Pretrain/Loss": 2.015021800994873, "Pretrain/Loss (Raw)": 1.8927953243255615, "Pretrain/Step": 4987, "Pretrain/Step Time": 8.515150111168623} +{"Pretrain/Learning Rate": 2.4350597759099034e-05, "Pretrain/Loss": 2.012141466140747, "Pretrain/Loss (Raw)": 1.7264089584350586, "Pretrain/Step": 4988, "Pretrain/Step Time": 8.504068661481142} +{"Pretrain/Learning Rate": 2.4342110788361685e-05, "Pretrain/Loss": 2.0087711811065674, "Pretrain/Loss (Raw)": 1.6524442434310913, "Pretrain/Step": 4989, "Pretrain/Step Time": 8.510311989113688} +{"Pretrain/Learning Rate": 2.433362389349523e-05, "Pretrain/Loss": 2.006955623626709, "Pretrain/Loss (Raw)": 1.7770274877548218, "Pretrain/Step": 4990, "Pretrain/Step Time": 8.52064255811274} +{"Pretrain/Learning Rate": 2.4325137075478398e-05, "Pretrain/Loss": 2.006317138671875, "Pretrain/Loss (Raw)": 1.9494765996932983, "Pretrain/Step": 4991, "Pretrain/Step Time": 8.517952332273126} +{"Pretrain/Learning Rate": 2.4316650335289942e-05, "Pretrain/Loss": 2.0079991817474365, "Pretrain/Loss (Raw)": 2.284238815307617, "Pretrain/Step": 4992, "Pretrain/Step Time": 8.519101550802588} +{"Pretrain/Learning Rate": 2.430816367390859e-05, "Pretrain/Loss": 2.0058162212371826, "Pretrain/Loss (Raw)": 1.9069228172302246, "Pretrain/Step": 4993, "Pretrain/Step Time": 8.518583916127682} +{"Pretrain/Learning Rate": 2.429967709231306e-05, "Pretrain/Loss": 2.0055489540100098, "Pretrain/Loss (Raw)": 2.082752227783203, "Pretrain/Step": 4994, "Pretrain/Step Time": 8.508129181340337} +{"Pretrain/Learning Rate": 2.429119059148207e-05, "Pretrain/Loss": 2.0044126510620117, "Pretrain/Loss (Raw)": 1.9691693782806396, "Pretrain/Step": 4995, "Pretrain/Step Time": 8.516319777816534} +{"Pretrain/Learning Rate": 2.4282704172394323e-05, "Pretrain/Loss": 2.0000882148742676, "Pretrain/Loss (Raw)": 1.748208999633789, "Pretrain/Step": 4996, "Pretrain/Step Time": 8.52308114990592} +{"Pretrain/Learning Rate": 2.4274217836028507e-05, "Pretrain/Loss": 1.998401165008545, "Pretrain/Loss (Raw)": 1.8194307088851929, "Pretrain/Step": 4997, "Pretrain/Step Time": 8.521668629720807} +{"Pretrain/Learning Rate": 2.4265731583363316e-05, "Pretrain/Loss": 1.997752070426941, "Pretrain/Loss (Raw)": 2.06410813331604, "Pretrain/Step": 4998, "Pretrain/Step Time": 8.519379692152143} +{"Pretrain/Learning Rate": 2.425724541537741e-05, "Pretrain/Loss": 1.9939721822738647, "Pretrain/Loss (Raw)": 1.914539098739624, "Pretrain/Step": 4999, "Pretrain/Step Time": 8.509437143802643} +{"Pretrain/Learning Rate": 2.4248759333049474e-05, "Pretrain/Loss": 1.9948811531066895, "Pretrain/Loss (Raw)": 1.9222368001937866, "Pretrain/Step": 5000, "Pretrain/Step Time": 8.5085404869169} +{"Pretrain/Learning Rate": 2.424027333735814e-05, "Pretrain/Loss": 1.9961093664169312, "Pretrain/Loss (Raw)": 1.9991095066070557, "Pretrain/Step": 5001, "Pretrain/Step Time": 9.020089587196708} +{"Pretrain/Learning Rate": 2.4231787429282073e-05, "Pretrain/Loss": 1.9935555458068848, "Pretrain/Loss (Raw)": 1.7442870140075684, "Pretrain/Step": 5002, "Pretrain/Step Time": 9.020700816065073} +{"Pretrain/Learning Rate": 2.4223301609799895e-05, "Pretrain/Loss": 1.9935781955718994, "Pretrain/Loss (Raw)": 2.190721035003662, "Pretrain/Step": 5003, "Pretrain/Step Time": 9.02256901934743} +{"Pretrain/Learning Rate": 2.421481587989024e-05, "Pretrain/Loss": 1.9921610355377197, "Pretrain/Loss (Raw)": 1.78074049949646, "Pretrain/Step": 5004, "Pretrain/Step Time": 9.021146606653929} +{"Pretrain/Learning Rate": 2.4206330240531713e-05, "Pretrain/Loss": 1.9932624101638794, "Pretrain/Loss (Raw)": 2.2101149559020996, "Pretrain/Step": 5005, "Pretrain/Step Time": 9.021634433418512} +{"Pretrain/Learning Rate": 2.4197844692702925e-05, "Pretrain/Loss": 1.9942903518676758, "Pretrain/Loss (Raw)": 1.9587109088897705, "Pretrain/Step": 5006, "Pretrain/Step Time": 9.016082780435681} +{"Pretrain/Learning Rate": 2.4189359237382464e-05, "Pretrain/Loss": 1.9955825805664062, "Pretrain/Loss (Raw)": 2.093993902206421, "Pretrain/Step": 5007, "Pretrain/Step Time": 9.032029012218118} +{"Pretrain/Learning Rate": 2.4180873875548925e-05, "Pretrain/Loss": 1.998544454574585, "Pretrain/Loss (Raw)": 2.1487128734588623, "Pretrain/Step": 5008, "Pretrain/Step Time": 9.033540764823556} +{"Pretrain/Learning Rate": 2.4172388608180857e-05, "Pretrain/Loss": 1.9976587295532227, "Pretrain/Loss (Raw)": 2.043065309524536, "Pretrain/Step": 5009, "Pretrain/Step Time": 9.036233112215996} +{"Pretrain/Learning Rate": 2.4163903436256848e-05, "Pretrain/Loss": 1.9975485801696777, "Pretrain/Loss (Raw)": 2.0639889240264893, "Pretrain/Step": 5010, "Pretrain/Step Time": 9.029938450083137} +{"Pretrain/Learning Rate": 2.4155418360755423e-05, "Pretrain/Loss": 1.9982936382293701, "Pretrain/Loss (Raw)": 2.145885944366455, "Pretrain/Step": 5011, "Pretrain/Step Time": 9.022630989551544} +{"Pretrain/Learning Rate": 2.4146933382655145e-05, "Pretrain/Loss": 1.9962488412857056, "Pretrain/Loss (Raw)": 1.9531885385513306, "Pretrain/Step": 5012, "Pretrain/Step Time": 9.027078310027719} +{"Pretrain/Learning Rate": 2.413844850293451e-05, "Pretrain/Loss": 1.9964361190795898, "Pretrain/Loss (Raw)": 2.0861804485321045, "Pretrain/Step": 5013, "Pretrain/Step Time": 9.030683500692248} +{"Pretrain/Learning Rate": 2.4129963722572074e-05, "Pretrain/Loss": 1.9974033832550049, "Pretrain/Loss (Raw)": 1.956984519958496, "Pretrain/Step": 5014, "Pretrain/Step Time": 9.040995240211487} +{"Pretrain/Learning Rate": 2.41214790425463e-05, "Pretrain/Loss": 1.996317744255066, "Pretrain/Loss (Raw)": 1.9647389650344849, "Pretrain/Step": 5015, "Pretrain/Step Time": 9.04240001551807} +{"Pretrain/Learning Rate": 2.4112994463835714e-05, "Pretrain/Loss": 1.9967565536499023, "Pretrain/Loss (Raw)": 2.2000482082366943, "Pretrain/Step": 5016, "Pretrain/Step Time": 9.028889888897538} +{"Pretrain/Learning Rate": 2.4104509987418793e-05, "Pretrain/Loss": 1.9969866275787354, "Pretrain/Loss (Raw)": 1.8949244022369385, "Pretrain/Step": 5017, "Pretrain/Step Time": 9.035294882953167} +{"Pretrain/Learning Rate": 2.4096025614273988e-05, "Pretrain/Loss": 1.996884822845459, "Pretrain/Loss (Raw)": 1.9607045650482178, "Pretrain/Step": 5018, "Pretrain/Step Time": 9.044316099956632} +{"Pretrain/Learning Rate": 2.408754134537978e-05, "Pretrain/Loss": 1.9978597164154053, "Pretrain/Loss (Raw)": 2.1457173824310303, "Pretrain/Step": 5019, "Pretrain/Step Time": 9.050325790420175} +{"Pretrain/Learning Rate": 2.407905718171459e-05, "Pretrain/Loss": 1.9975486993789673, "Pretrain/Loss (Raw)": 1.9492604732513428, "Pretrain/Step": 5020, "Pretrain/Step Time": 9.052083067595959} +{"Pretrain/Learning Rate": 2.4070573124256883e-05, "Pretrain/Loss": 1.9984114170074463, "Pretrain/Loss (Raw)": 1.8653676509857178, "Pretrain/Step": 5021, "Pretrain/Step Time": 9.04767451621592} +{"Pretrain/Learning Rate": 2.4062089173985044e-05, "Pretrain/Loss": 2.001182794570923, "Pretrain/Loss (Raw)": 2.0249674320220947, "Pretrain/Step": 5022, "Pretrain/Step Time": 9.044203544035554} +{"Pretrain/Learning Rate": 2.4053605331877517e-05, "Pretrain/Loss": 2.003135919570923, "Pretrain/Loss (Raw)": 2.2672743797302246, "Pretrain/Step": 5023, "Pretrain/Step Time": 9.048975257202983} +{"Pretrain/Learning Rate": 2.404512159891267e-05, "Pretrain/Loss": 2.0051357746124268, "Pretrain/Loss (Raw)": 2.0207464694976807, "Pretrain/Step": 5024, "Pretrain/Step Time": 9.049745896831155} +{"Pretrain/Learning Rate": 2.4036637976068914e-05, "Pretrain/Loss": 2.002636194229126, "Pretrain/Loss (Raw)": 1.8734861612319946, "Pretrain/Step": 5025, "Pretrain/Step Time": 9.05487465672195} +{"Pretrain/Learning Rate": 2.4028154464324592e-05, "Pretrain/Loss": 2.0013599395751953, "Pretrain/Loss (Raw)": 1.8069862127304077, "Pretrain/Step": 5026, "Pretrain/Step Time": 9.059887208044529} +{"Pretrain/Learning Rate": 2.4019671064658088e-05, "Pretrain/Loss": 1.9992238283157349, "Pretrain/Loss (Raw)": 1.9465452432632446, "Pretrain/Step": 5027, "Pretrain/Step Time": 9.05555816553533} +{"Pretrain/Learning Rate": 2.4011187778047727e-05, "Pretrain/Loss": 1.996234655380249, "Pretrain/Loss (Raw)": 1.7738425731658936, "Pretrain/Step": 5028, "Pretrain/Step Time": 9.05550709553063} +{"Pretrain/Learning Rate": 2.4002704605471857e-05, "Pretrain/Loss": 1.998929500579834, "Pretrain/Loss (Raw)": 2.2344930171966553, "Pretrain/Step": 5029, "Pretrain/Step Time": 9.059125265106559} +{"Pretrain/Learning Rate": 2.3994221547908783e-05, "Pretrain/Loss": 1.9984855651855469, "Pretrain/Loss (Raw)": 1.8348467350006104, "Pretrain/Step": 5030, "Pretrain/Step Time": 9.061379699036479} +{"Pretrain/Learning Rate": 2.398573860633683e-05, "Pretrain/Loss": 1.9982848167419434, "Pretrain/Loss (Raw)": 1.9932547807693481, "Pretrain/Step": 5031, "Pretrain/Step Time": 9.069444805383682} +{"Pretrain/Learning Rate": 2.3977255781734275e-05, "Pretrain/Loss": 1.9990086555480957, "Pretrain/Loss (Raw)": 2.1007275581359863, "Pretrain/Step": 5032, "Pretrain/Step Time": 9.064834289252758} +{"Pretrain/Learning Rate": 2.3968773075079404e-05, "Pretrain/Loss": 2.0021767616271973, "Pretrain/Loss (Raw)": 2.1310386657714844, "Pretrain/Step": 5033, "Pretrain/Step Time": 9.053295060992241} +{"Pretrain/Learning Rate": 2.396029048735048e-05, "Pretrain/Loss": 1.999833106994629, "Pretrain/Loss (Raw)": 2.0672781467437744, "Pretrain/Step": 5034, "Pretrain/Step Time": 9.053950192406774} +{"Pretrain/Learning Rate": 2.3951808019525758e-05, "Pretrain/Loss": 1.993905782699585, "Pretrain/Loss (Raw)": 1.4629563093185425, "Pretrain/Step": 5035, "Pretrain/Step Time": 9.049773404374719} +{"Pretrain/Learning Rate": 2.394332567258347e-05, "Pretrain/Loss": 1.995326280593872, "Pretrain/Loss (Raw)": 2.040048599243164, "Pretrain/Step": 5036, "Pretrain/Step Time": 9.060730623081326} +{"Pretrain/Learning Rate": 2.3934843447501852e-05, "Pretrain/Loss": 1.9970805644989014, "Pretrain/Loss (Raw)": 2.136415958404541, "Pretrain/Step": 5037, "Pretrain/Step Time": 9.069934463128448} +{"Pretrain/Learning Rate": 2.3926361345259098e-05, "Pretrain/Loss": 1.9964940547943115, "Pretrain/Loss (Raw)": 1.886063814163208, "Pretrain/Step": 5038, "Pretrain/Step Time": 9.066331619396806} +{"Pretrain/Learning Rate": 2.391787936683342e-05, "Pretrain/Loss": 1.9958940744400024, "Pretrain/Loss (Raw)": 1.9524399042129517, "Pretrain/Step": 5039, "Pretrain/Step Time": 9.069993918761611} +{"Pretrain/Learning Rate": 2.390939751320299e-05, "Pretrain/Loss": 1.9972443580627441, "Pretrain/Loss (Raw)": 2.1566920280456543, "Pretrain/Step": 5040, "Pretrain/Step Time": 9.0710284486413} +{"Pretrain/Learning Rate": 2.390091578534598e-05, "Pretrain/Loss": 1.9994187355041504, "Pretrain/Loss (Raw)": 2.2413828372955322, "Pretrain/Step": 5041, "Pretrain/Step Time": 9.069499773904681} +{"Pretrain/Learning Rate": 2.3892434184240533e-05, "Pretrain/Loss": 2.0006115436553955, "Pretrain/Loss (Raw)": 2.0990869998931885, "Pretrain/Step": 5042, "Pretrain/Step Time": 9.075943768024445} +{"Pretrain/Learning Rate": 2.3883952710864804e-05, "Pretrain/Loss": 2.0000250339508057, "Pretrain/Loss (Raw)": 1.9011471271514893, "Pretrain/Step": 5043, "Pretrain/Step Time": 9.074566533789039} +{"Pretrain/Learning Rate": 2.3875471366196903e-05, "Pretrain/Loss": 1.999618649482727, "Pretrain/Loss (Raw)": 1.9300857782363892, "Pretrain/Step": 5044, "Pretrain/Step Time": 9.074799040332437} +{"Pretrain/Learning Rate": 2.3866990151214947e-05, "Pretrain/Loss": 2.0009891986846924, "Pretrain/Loss (Raw)": 2.199681520462036, "Pretrain/Step": 5045, "Pretrain/Step Time": 9.072911011055112} +{"Pretrain/Learning Rate": 2.3858509066897016e-05, "Pretrain/Loss": 2.0003843307495117, "Pretrain/Loss (Raw)": 1.971384048461914, "Pretrain/Step": 5046, "Pretrain/Step Time": 9.062873501330614} +{"Pretrain/Learning Rate": 2.385002811422121e-05, "Pretrain/Loss": 2.002516746520996, "Pretrain/Loss (Raw)": 2.0777857303619385, "Pretrain/Step": 5047, "Pretrain/Step Time": 9.06264223717153} +{"Pretrain/Learning Rate": 2.384154729416557e-05, "Pretrain/Loss": 2.0042877197265625, "Pretrain/Loss (Raw)": 2.15627384185791, "Pretrain/Step": 5048, "Pretrain/Step Time": 9.0741077773273} +{"Pretrain/Learning Rate": 2.383306660770817e-05, "Pretrain/Loss": 2.0036776065826416, "Pretrain/Loss (Raw)": 1.875082015991211, "Pretrain/Step": 5049, "Pretrain/Step Time": 9.06669787503779} +{"Pretrain/Learning Rate": 2.382458605582701e-05, "Pretrain/Loss": 2.003080129623413, "Pretrain/Loss (Raw)": 1.8496893644332886, "Pretrain/Step": 5050, "Pretrain/Step Time": 9.063282741233706} +{"Pretrain/Learning Rate": 2.3816105639500142e-05, "Pretrain/Loss": 2.006535530090332, "Pretrain/Loss (Raw)": 2.016140937805176, "Pretrain/Step": 5051, "Pretrain/Step Time": 9.065452862530947} +{"Pretrain/Learning Rate": 2.3807625359705532e-05, "Pretrain/Loss": 2.005484104156494, "Pretrain/Loss (Raw)": 1.9841493368148804, "Pretrain/Step": 5052, "Pretrain/Step Time": 9.06433156132698} +{"Pretrain/Learning Rate": 2.37991452174212e-05, "Pretrain/Loss": 2.005023717880249, "Pretrain/Loss (Raw)": 1.9088695049285889, "Pretrain/Step": 5053, "Pretrain/Step Time": 9.066137893125415} +{"Pretrain/Learning Rate": 2.3790665213625087e-05, "Pretrain/Loss": 2.0058577060699463, "Pretrain/Loss (Raw)": 1.8934379816055298, "Pretrain/Step": 5054, "Pretrain/Step Time": 9.07674433477223} +{"Pretrain/Learning Rate": 2.3782185349295174e-05, "Pretrain/Loss": 2.005467414855957, "Pretrain/Loss (Raw)": 2.066467761993408, "Pretrain/Step": 5055, "Pretrain/Step Time": 9.072284365072846} +{"Pretrain/Learning Rate": 2.377370562540937e-05, "Pretrain/Loss": 2.005136013031006, "Pretrain/Loss (Raw)": 2.0478529930114746, "Pretrain/Step": 5056, "Pretrain/Step Time": 9.076682476326823} +{"Pretrain/Learning Rate": 2.3765226042945616e-05, "Pretrain/Loss": 2.004275321960449, "Pretrain/Loss (Raw)": 1.7058833837509155, "Pretrain/Step": 5057, "Pretrain/Step Time": 9.077551817521453} +{"Pretrain/Learning Rate": 2.3756746602881824e-05, "Pretrain/Loss": 2.000866413116455, "Pretrain/Loss (Raw)": 1.7179979085922241, "Pretrain/Step": 5058, "Pretrain/Step Time": 9.07743152603507} +{"Pretrain/Learning Rate": 2.3748267306195855e-05, "Pretrain/Loss": 2.0003867149353027, "Pretrain/Loss (Raw)": 2.1386094093322754, "Pretrain/Step": 5059, "Pretrain/Step Time": 9.073162799701095} +{"Pretrain/Learning Rate": 2.373978815386562e-05, "Pretrain/Loss": 1.9995226860046387, "Pretrain/Loss (Raw)": 1.9325248003005981, "Pretrain/Step": 5060, "Pretrain/Step Time": 9.07730340026319} +{"Pretrain/Learning Rate": 2.3731309146868932e-05, "Pretrain/Loss": 2.000559091567993, "Pretrain/Loss (Raw)": 2.001558780670166, "Pretrain/Step": 5061, "Pretrain/Step Time": 9.065704640001059} +{"Pretrain/Learning Rate": 2.372283028618367e-05, "Pretrain/Loss": 2.0016465187072754, "Pretrain/Loss (Raw)": 2.2083003520965576, "Pretrain/Step": 5062, "Pretrain/Step Time": 9.065922306850553} +{"Pretrain/Learning Rate": 2.371435157278762e-05, "Pretrain/Loss": 2.00215744972229, "Pretrain/Loss (Raw)": 2.0859434604644775, "Pretrain/Step": 5063, "Pretrain/Step Time": 9.064513942226768} +{"Pretrain/Learning Rate": 2.370587300765862e-05, "Pretrain/Loss": 2.0036702156066895, "Pretrain/Loss (Raw)": 2.081585645675659, "Pretrain/Step": 5064, "Pretrain/Step Time": 9.066645700484514} +{"Pretrain/Learning Rate": 2.369739459177443e-05, "Pretrain/Loss": 2.0106160640716553, "Pretrain/Loss (Raw)": 2.898855447769165, "Pretrain/Step": 5065, "Pretrain/Step Time": 9.061991846188903} +{"Pretrain/Learning Rate": 2.3688916326112848e-05, "Pretrain/Loss": 2.0113632678985596, "Pretrain/Loss (Raw)": 2.0745248794555664, "Pretrain/Step": 5066, "Pretrain/Step Time": 9.052956001833081} +{"Pretrain/Learning Rate": 2.3680438211651597e-05, "Pretrain/Loss": 2.0131523609161377, "Pretrain/Loss (Raw)": 2.0806891918182373, "Pretrain/Step": 5067, "Pretrain/Step Time": 9.050195962190628} +{"Pretrain/Learning Rate": 2.3671960249368448e-05, "Pretrain/Loss": 2.0125350952148438, "Pretrain/Loss (Raw)": 1.8390275239944458, "Pretrain/Step": 5068, "Pretrain/Step Time": 9.047739690169692} +{"Pretrain/Learning Rate": 2.3663482440241087e-05, "Pretrain/Loss": 2.013765335083008, "Pretrain/Loss (Raw)": 2.075401782989502, "Pretrain/Step": 5069, "Pretrain/Step Time": 9.048843758180737} +{"Pretrain/Learning Rate": 2.3655004785247234e-05, "Pretrain/Loss": 2.0136613845825195, "Pretrain/Loss (Raw)": 2.027345895767212, "Pretrain/Step": 5070, "Pretrain/Step Time": 9.050589006394148} +{"Pretrain/Learning Rate": 2.3646527285364565e-05, "Pretrain/Loss": 2.0154619216918945, "Pretrain/Loss (Raw)": 2.1270318031311035, "Pretrain/Step": 5071, "Pretrain/Step Time": 9.046232981607318} +{"Pretrain/Learning Rate": 2.363804994157075e-05, "Pretrain/Loss": 2.0141701698303223, "Pretrain/Loss (Raw)": 2.0359203815460205, "Pretrain/Step": 5072, "Pretrain/Step Time": 9.035784509032965} +{"Pretrain/Learning Rate": 2.3629572754843428e-05, "Pretrain/Loss": 2.015268564224243, "Pretrain/Loss (Raw)": 2.067444324493408, "Pretrain/Step": 5073, "Pretrain/Step Time": 9.034066714346409} +{"Pretrain/Learning Rate": 2.3621095726160237e-05, "Pretrain/Loss": 2.015956163406372, "Pretrain/Loss (Raw)": 2.1688735485076904, "Pretrain/Step": 5074, "Pretrain/Step Time": 9.032681973651052} +{"Pretrain/Learning Rate": 2.3612618856498785e-05, "Pretrain/Loss": 2.0097923278808594, "Pretrain/Loss (Raw)": 1.7352153062820435, "Pretrain/Step": 5075, "Pretrain/Step Time": 9.036055048927665} +{"Pretrain/Learning Rate": 2.3604142146836666e-05, "Pretrain/Loss": 2.009157657623291, "Pretrain/Loss (Raw)": 2.0334861278533936, "Pretrain/Step": 5076, "Pretrain/Step Time": 9.036086263135076} +{"Pretrain/Learning Rate": 2.3595665598151444e-05, "Pretrain/Loss": 2.009934186935425, "Pretrain/Loss (Raw)": 2.2635629177093506, "Pretrain/Step": 5077, "Pretrain/Step Time": 9.03079623915255} +{"Pretrain/Learning Rate": 2.3587189211420694e-05, "Pretrain/Loss": 2.00939679145813, "Pretrain/Loss (Raw)": 2.099255323410034, "Pretrain/Step": 5078, "Pretrain/Step Time": 9.029534375295043} +{"Pretrain/Learning Rate": 2.3578712987621932e-05, "Pretrain/Loss": 2.010204315185547, "Pretrain/Loss (Raw)": 2.0303337574005127, "Pretrain/Step": 5079, "Pretrain/Step Time": 9.033490650355816} +{"Pretrain/Learning Rate": 2.3570236927732692e-05, "Pretrain/Loss": 2.009471893310547, "Pretrain/Loss (Raw)": 1.9976637363433838, "Pretrain/Step": 5080, "Pretrain/Step Time": 9.031317396089435} +{"Pretrain/Learning Rate": 2.3561761032730463e-05, "Pretrain/Loss": 2.010955810546875, "Pretrain/Loss (Raw)": 2.205777168273926, "Pretrain/Step": 5081, "Pretrain/Step Time": 9.031369214877486} +{"Pretrain/Learning Rate": 2.355328530359273e-05, "Pretrain/Loss": 2.009373903274536, "Pretrain/Loss (Raw)": 1.9447720050811768, "Pretrain/Step": 5082, "Pretrain/Step Time": 9.03981382586062} +{"Pretrain/Learning Rate": 2.3544809741296954e-05, "Pretrain/Loss": 2.0075767040252686, "Pretrain/Loss (Raw)": 1.979945182800293, "Pretrain/Step": 5083, "Pretrain/Step Time": 9.037044642493129} +{"Pretrain/Learning Rate": 2.3536334346820578e-05, "Pretrain/Loss": 2.009204864501953, "Pretrain/Loss (Raw)": 2.223726272583008, "Pretrain/Step": 5084, "Pretrain/Step Time": 9.03376105427742} +{"Pretrain/Learning Rate": 2.3527859121141012e-05, "Pretrain/Loss": 2.006392478942871, "Pretrain/Loss (Raw)": 1.9469486474990845, "Pretrain/Step": 5085, "Pretrain/Step Time": 9.03319277614355} +{"Pretrain/Learning Rate": 2.351938406523568e-05, "Pretrain/Loss": 2.008314609527588, "Pretrain/Loss (Raw)": 2.282360315322876, "Pretrain/Step": 5086, "Pretrain/Step Time": 9.036768291145563} +{"Pretrain/Learning Rate": 2.3510909180081946e-05, "Pretrain/Loss": 2.0052971839904785, "Pretrain/Loss (Raw)": 1.5995005369186401, "Pretrain/Step": 5087, "Pretrain/Step Time": 9.03720591403544} +{"Pretrain/Learning Rate": 2.350243446665719e-05, "Pretrain/Loss": 2.004286289215088, "Pretrain/Loss (Raw)": 1.9047354459762573, "Pretrain/Step": 5088, "Pretrain/Step Time": 9.035640770569444} +{"Pretrain/Learning Rate": 2.3493959925938746e-05, "Pretrain/Loss": 2.0066277980804443, "Pretrain/Loss (Raw)": 2.017366886138916, "Pretrain/Step": 5089, "Pretrain/Step Time": 9.033215463161469} +{"Pretrain/Learning Rate": 2.348548555890394e-05, "Pretrain/Loss": 2.0078177452087402, "Pretrain/Loss (Raw)": 2.085142135620117, "Pretrain/Step": 5090, "Pretrain/Step Time": 9.032694559544325} +{"Pretrain/Learning Rate": 2.3477011366530068e-05, "Pretrain/Loss": 2.010646343231201, "Pretrain/Loss (Raw)": 2.154542922973633, "Pretrain/Step": 5091, "Pretrain/Step Time": 9.038017135113478} +{"Pretrain/Learning Rate": 2.3468537349794438e-05, "Pretrain/Loss": 2.012026309967041, "Pretrain/Loss (Raw)": 2.206331491470337, "Pretrain/Step": 5092, "Pretrain/Step Time": 9.038075555115938} +{"Pretrain/Learning Rate": 2.3460063509674278e-05, "Pretrain/Loss": 2.012287139892578, "Pretrain/Loss (Raw)": 2.028125762939453, "Pretrain/Step": 5093, "Pretrain/Step Time": 9.037959268316627} +{"Pretrain/Learning Rate": 2.345158984714687e-05, "Pretrain/Loss": 2.0127248764038086, "Pretrain/Loss (Raw)": 2.1558189392089844, "Pretrain/Step": 5094, "Pretrain/Step Time": 9.029562518000603} +{"Pretrain/Learning Rate": 2.3443116363189398e-05, "Pretrain/Loss": 2.012087106704712, "Pretrain/Loss (Raw)": 2.1375856399536133, "Pretrain/Step": 5095, "Pretrain/Step Time": 9.039399726316333} +{"Pretrain/Learning Rate": 2.3434643058779104e-05, "Pretrain/Loss": 2.012580394744873, "Pretrain/Loss (Raw)": 2.128786325454712, "Pretrain/Step": 5096, "Pretrain/Step Time": 9.041548047214746} +{"Pretrain/Learning Rate": 2.342616993489313e-05, "Pretrain/Loss": 2.0135507583618164, "Pretrain/Loss (Raw)": 2.141495704650879, "Pretrain/Step": 5097, "Pretrain/Step Time": 9.042740110307932} +{"Pretrain/Learning Rate": 2.3417696992508657e-05, "Pretrain/Loss": 2.0088865756988525, "Pretrain/Loss (Raw)": 1.366983413696289, "Pretrain/Step": 5098, "Pretrain/Step Time": 9.042283937335014} +{"Pretrain/Learning Rate": 2.3409224232602832e-05, "Pretrain/Loss": 2.008063793182373, "Pretrain/Loss (Raw)": 1.9553027153015137, "Pretrain/Step": 5099, "Pretrain/Step Time": 9.031415972858667} +{"Pretrain/Learning Rate": 2.340075165615276e-05, "Pretrain/Loss": 2.0090765953063965, "Pretrain/Loss (Raw)": 2.1687979698181152, "Pretrain/Step": 5100, "Pretrain/Step Time": 9.033032670617104} +{"Pretrain/Learning Rate": 2.339227926413555e-05, "Pretrain/Loss": 2.0067625045776367, "Pretrain/Loss (Raw)": 2.1915721893310547, "Pretrain/Step": 5101, "Pretrain/Step Time": 9.035271409898996} +{"Pretrain/Learning Rate": 2.3383807057528256e-05, "Pretrain/Loss": 2.0098772048950195, "Pretrain/Loss (Raw)": 2.229778289794922, "Pretrain/Step": 5102, "Pretrain/Step Time": 9.034088961780071} +{"Pretrain/Learning Rate": 2.3375335037307965e-05, "Pretrain/Loss": 2.0093278884887695, "Pretrain/Loss (Raw)": 1.872763991355896, "Pretrain/Step": 5103, "Pretrain/Step Time": 9.03405088186264} +{"Pretrain/Learning Rate": 2.3366863204451677e-05, "Pretrain/Loss": 2.007917881011963, "Pretrain/Loss (Raw)": 1.9695749282836914, "Pretrain/Step": 5104, "Pretrain/Step Time": 9.038840852677822} +{"Pretrain/Learning Rate": 2.3358391559936438e-05, "Pretrain/Loss": 2.0062875747680664, "Pretrain/Loss (Raw)": 1.872483491897583, "Pretrain/Step": 5105, "Pretrain/Step Time": 9.036331560462713} +{"Pretrain/Learning Rate": 2.33499201047392e-05, "Pretrain/Loss": 2.004481554031372, "Pretrain/Loss (Raw)": 1.8152339458465576, "Pretrain/Step": 5106, "Pretrain/Step Time": 9.029497975483537} +{"Pretrain/Learning Rate": 2.334144883983697e-05, "Pretrain/Loss": 2.003565788269043, "Pretrain/Loss (Raw)": 1.7924609184265137, "Pretrain/Step": 5107, "Pretrain/Step Time": 9.037623884156346} +{"Pretrain/Learning Rate": 2.3332977766206657e-05, "Pretrain/Loss": 2.004347562789917, "Pretrain/Loss (Raw)": 2.0205612182617188, "Pretrain/Step": 5108, "Pretrain/Step Time": 9.038753375411034} +{"Pretrain/Learning Rate": 2.332450688482522e-05, "Pretrain/Loss": 2.0051169395446777, "Pretrain/Loss (Raw)": 1.9941508769989014, "Pretrain/Step": 5109, "Pretrain/Step Time": 9.038001459091902} +{"Pretrain/Learning Rate": 2.3316036196669534e-05, "Pretrain/Loss": 2.0040206909179688, "Pretrain/Loss (Raw)": 1.9725613594055176, "Pretrain/Step": 5110, "Pretrain/Step Time": 9.035729287192225} +{"Pretrain/Learning Rate": 2.3307565702716495e-05, "Pretrain/Loss": 2.004236936569214, "Pretrain/Loss (Raw)": 2.0727193355560303, "Pretrain/Step": 5111, "Pretrain/Step Time": 9.031539959833026} +{"Pretrain/Learning Rate": 2.3299095403942943e-05, "Pretrain/Loss": 2.0075032711029053, "Pretrain/Loss (Raw)": 2.2545392513275146, "Pretrain/Step": 5112, "Pretrain/Step Time": 9.028826333582401} +{"Pretrain/Learning Rate": 2.3290625301325735e-05, "Pretrain/Loss": 2.0072383880615234, "Pretrain/Loss (Raw)": 1.8336937427520752, "Pretrain/Step": 5113, "Pretrain/Step Time": 9.026636444032192} +{"Pretrain/Learning Rate": 2.3282155395841667e-05, "Pretrain/Loss": 2.008784532546997, "Pretrain/Loss (Raw)": 2.1764252185821533, "Pretrain/Step": 5114, "Pretrain/Step Time": 9.030850322917104} +{"Pretrain/Learning Rate": 2.327368568846754e-05, "Pretrain/Loss": 2.011448383331299, "Pretrain/Loss (Raw)": 2.233773708343506, "Pretrain/Step": 5115, "Pretrain/Step Time": 9.037036787718534} +{"Pretrain/Learning Rate": 2.3265216180180106e-05, "Pretrain/Loss": 2.013068675994873, "Pretrain/Loss (Raw)": 1.9337871074676514, "Pretrain/Step": 5116, "Pretrain/Step Time": 9.039148472249508} +{"Pretrain/Learning Rate": 2.325674687195612e-05, "Pretrain/Loss": 2.016845703125, "Pretrain/Loss (Raw)": 2.1359119415283203, "Pretrain/Step": 5117, "Pretrain/Step Time": 9.032283186912537} +{"Pretrain/Learning Rate": 2.32482777647723e-05, "Pretrain/Loss": 2.0185694694519043, "Pretrain/Loss (Raw)": 1.9976619482040405, "Pretrain/Step": 5118, "Pretrain/Step Time": 9.023697264492512} +{"Pretrain/Learning Rate": 2.323980885960534e-05, "Pretrain/Loss": 2.019190788269043, "Pretrain/Loss (Raw)": 2.0289907455444336, "Pretrain/Step": 5119, "Pretrain/Step Time": 9.033778119832277} +{"Pretrain/Learning Rate": 2.3231340157431917e-05, "Pretrain/Loss": 2.0175137519836426, "Pretrain/Loss (Raw)": 2.069608211517334, "Pretrain/Step": 5120, "Pretrain/Step Time": 9.03291098959744} +{"Pretrain/Learning Rate": 2.3222871659228685e-05, "Pretrain/Loss": 2.0191640853881836, "Pretrain/Loss (Raw)": 2.1181552410125732, "Pretrain/Step": 5121, "Pretrain/Step Time": 9.043261252343655} +{"Pretrain/Learning Rate": 2.3214403365972258e-05, "Pretrain/Loss": 2.0194811820983887, "Pretrain/Loss (Raw)": 2.1233291625976562, "Pretrain/Step": 5122, "Pretrain/Step Time": 9.042956344783306} +{"Pretrain/Learning Rate": 2.320593527863926e-05, "Pretrain/Loss": 2.0194220542907715, "Pretrain/Loss (Raw)": 1.961586833000183, "Pretrain/Step": 5123, "Pretrain/Step Time": 9.039365977048874} +{"Pretrain/Learning Rate": 2.319746739820625e-05, "Pretrain/Loss": 2.0216429233551025, "Pretrain/Loss (Raw)": 2.032517910003662, "Pretrain/Step": 5124, "Pretrain/Step Time": 9.032335987314582} +{"Pretrain/Learning Rate": 2.3188999725649804e-05, "Pretrain/Loss": 2.0224690437316895, "Pretrain/Loss (Raw)": 1.9251515865325928, "Pretrain/Step": 5125, "Pretrain/Step Time": 9.039653427898884} +{"Pretrain/Learning Rate": 2.3180532261946437e-05, "Pretrain/Loss": 2.022895336151123, "Pretrain/Loss (Raw)": 2.118683338165283, "Pretrain/Step": 5126, "Pretrain/Step Time": 9.040012557059526} +{"Pretrain/Learning Rate": 2.3172065008072663e-05, "Pretrain/Loss": 2.0252482891082764, "Pretrain/Loss (Raw)": 2.215731382369995, "Pretrain/Step": 5127, "Pretrain/Step Time": 9.046867541968822} +{"Pretrain/Learning Rate": 2.3163597965004967e-05, "Pretrain/Loss": 2.025960922241211, "Pretrain/Loss (Raw)": 2.013423442840576, "Pretrain/Step": 5128, "Pretrain/Step Time": 9.050846045836806} +{"Pretrain/Learning Rate": 2.315513113371981e-05, "Pretrain/Loss": 2.0254244804382324, "Pretrain/Loss (Raw)": 1.9304739236831665, "Pretrain/Step": 5129, "Pretrain/Step Time": 8.534480530768633} +{"Pretrain/Learning Rate": 2.3146664515193616e-05, "Pretrain/Loss": 2.0258100032806396, "Pretrain/Loss (Raw)": 1.79362952709198, "Pretrain/Step": 5130, "Pretrain/Step Time": 8.538870489224792} +{"Pretrain/Learning Rate": 2.3138198110402812e-05, "Pretrain/Loss": 2.0263662338256836, "Pretrain/Loss (Raw)": 2.2619094848632812, "Pretrain/Step": 5131, "Pretrain/Step Time": 8.539191216230392} +{"Pretrain/Learning Rate": 2.3129731920323765e-05, "Pretrain/Loss": 2.028197765350342, "Pretrain/Loss (Raw)": 2.015197515487671, "Pretrain/Step": 5132, "Pretrain/Step Time": 8.546698719263077} +{"Pretrain/Learning Rate": 2.3121265945932862e-05, "Pretrain/Loss": 2.029149055480957, "Pretrain/Loss (Raw)": 2.331852436065674, "Pretrain/Step": 5133, "Pretrain/Step Time": 8.543999023735523} +{"Pretrain/Learning Rate": 2.3112800188206404e-05, "Pretrain/Loss": 2.028247356414795, "Pretrain/Loss (Raw)": 1.8433197736740112, "Pretrain/Step": 5134, "Pretrain/Step Time": 8.548738352954388} +{"Pretrain/Learning Rate": 2.310433464812074e-05, "Pretrain/Loss": 2.028319835662842, "Pretrain/Loss (Raw)": 2.1032426357269287, "Pretrain/Step": 5135, "Pretrain/Step Time": 8.534602938219905} +{"Pretrain/Learning Rate": 2.309586932665212e-05, "Pretrain/Loss": 2.029489040374756, "Pretrain/Loss (Raw)": 2.298403024673462, "Pretrain/Step": 5136, "Pretrain/Step Time": 8.527200065553188} +{"Pretrain/Learning Rate": 2.3087404224776835e-05, "Pretrain/Loss": 2.0293095111846924, "Pretrain/Loss (Raw)": 2.020052433013916, "Pretrain/Step": 5137, "Pretrain/Step Time": 8.536010172218084} +{"Pretrain/Learning Rate": 2.307893934347109e-05, "Pretrain/Loss": 2.028635263442993, "Pretrain/Loss (Raw)": 1.9777013063430786, "Pretrain/Step": 5138, "Pretrain/Step Time": 8.537849761545658} +{"Pretrain/Learning Rate": 2.3070474683711125e-05, "Pretrain/Loss": 2.029367446899414, "Pretrain/Loss (Raw)": 2.239603042602539, "Pretrain/Step": 5139, "Pretrain/Step Time": 8.541707642376423} +{"Pretrain/Learning Rate": 2.306201024647311e-05, "Pretrain/Loss": 2.0296380519866943, "Pretrain/Loss (Raw)": 1.987829566001892, "Pretrain/Step": 5140, "Pretrain/Step Time": 8.53758661262691} +{"Pretrain/Learning Rate": 2.3053546032733207e-05, "Pretrain/Loss": 2.0280911922454834, "Pretrain/Loss (Raw)": 1.888179063796997, "Pretrain/Step": 5141, "Pretrain/Step Time": 8.533527864143252} +{"Pretrain/Learning Rate": 2.3045082043467554e-05, "Pretrain/Loss": 2.029503345489502, "Pretrain/Loss (Raw)": 2.137739419937134, "Pretrain/Step": 5142, "Pretrain/Step Time": 8.523257875815034} +{"Pretrain/Learning Rate": 2.3036618279652232e-05, "Pretrain/Loss": 2.0316269397735596, "Pretrain/Loss (Raw)": 2.236567258834839, "Pretrain/Step": 5143, "Pretrain/Step Time": 8.53080977872014} +{"Pretrain/Learning Rate": 2.3028154742263362e-05, "Pretrain/Loss": 2.0304784774780273, "Pretrain/Loss (Raw)": 2.0530483722686768, "Pretrain/Step": 5144, "Pretrain/Step Time": 8.538796041160822} +{"Pretrain/Learning Rate": 2.3019691432276964e-05, "Pretrain/Loss": 2.0344858169555664, "Pretrain/Loss (Raw)": 2.407850980758667, "Pretrain/Step": 5145, "Pretrain/Step Time": 8.533667290583253} +{"Pretrain/Learning Rate": 2.3011228350669096e-05, "Pretrain/Loss": 2.0351665019989014, "Pretrain/Loss (Raw)": 2.047842025756836, "Pretrain/Step": 5146, "Pretrain/Step Time": 8.52436200901866} +{"Pretrain/Learning Rate": 2.3002765498415728e-05, "Pretrain/Loss": 2.0353403091430664, "Pretrain/Loss (Raw)": 2.1679577827453613, "Pretrain/Step": 5147, "Pretrain/Step Time": 8.51872999407351} +{"Pretrain/Learning Rate": 2.2994302876492875e-05, "Pretrain/Loss": 2.036479949951172, "Pretrain/Loss (Raw)": 2.0951485633850098, "Pretrain/Step": 5148, "Pretrain/Step Time": 8.522530309855938} +{"Pretrain/Learning Rate": 2.2985840485876444e-05, "Pretrain/Loss": 2.0377633571624756, "Pretrain/Loss (Raw)": 2.0296332836151123, "Pretrain/Step": 5149, "Pretrain/Step Time": 8.525710105895996} +{"Pretrain/Learning Rate": 2.2977378327542397e-05, "Pretrain/Loss": 2.038151741027832, "Pretrain/Loss (Raw)": 2.074688196182251, "Pretrain/Step": 5150, "Pretrain/Step Time": 8.52305536530912} +{"Pretrain/Learning Rate": 2.2968916402466604e-05, "Pretrain/Loss": 2.03488826751709, "Pretrain/Loss (Raw)": 1.8495370149612427, "Pretrain/Step": 5151, "Pretrain/Step Time": 8.51939089037478} +{"Pretrain/Learning Rate": 2.2960454711624945e-05, "Pretrain/Loss": 2.034133195877075, "Pretrain/Loss (Raw)": 1.9240970611572266, "Pretrain/Step": 5152, "Pretrain/Step Time": 8.51346075721085} +{"Pretrain/Learning Rate": 2.2951993255993252e-05, "Pretrain/Loss": 2.0346429347991943, "Pretrain/Loss (Raw)": 1.938712477684021, "Pretrain/Step": 5153, "Pretrain/Step Time": 8.513342428952456} +{"Pretrain/Learning Rate": 2.2943532036547356e-05, "Pretrain/Loss": 2.037219524383545, "Pretrain/Loss (Raw)": 2.1368322372436523, "Pretrain/Step": 5154, "Pretrain/Step Time": 8.515479413792491} +{"Pretrain/Learning Rate": 2.293507105426303e-05, "Pretrain/Loss": 2.0392727851867676, "Pretrain/Loss (Raw)": 2.209336519241333, "Pretrain/Step": 5155, "Pretrain/Step Time": 8.51583326049149} +{"Pretrain/Learning Rate": 2.2926610310116047e-05, "Pretrain/Loss": 2.0428459644317627, "Pretrain/Loss (Raw)": 2.231212615966797, "Pretrain/Step": 5156, "Pretrain/Step Time": 8.515731401741505} +{"Pretrain/Learning Rate": 2.2918149805082127e-05, "Pretrain/Loss": 2.040818691253662, "Pretrain/Loss (Raw)": 1.974987506866455, "Pretrain/Step": 5157, "Pretrain/Step Time": 8.518053468316793} +{"Pretrain/Learning Rate": 2.2909689540136985e-05, "Pretrain/Loss": 2.0421783924102783, "Pretrain/Loss (Raw)": 2.0088906288146973, "Pretrain/Step": 5158, "Pretrain/Step Time": 8.518348161131144} +{"Pretrain/Learning Rate": 2.290122951625629e-05, "Pretrain/Loss": 2.043447256088257, "Pretrain/Loss (Raw)": 2.155689239501953, "Pretrain/Step": 5159, "Pretrain/Step Time": 8.51581048592925} +{"Pretrain/Learning Rate": 2.2892769734415703e-05, "Pretrain/Loss": 2.04262113571167, "Pretrain/Loss (Raw)": 1.9950006008148193, "Pretrain/Step": 5160, "Pretrain/Step Time": 8.520451312884688} +{"Pretrain/Learning Rate": 2.2884310195590835e-05, "Pretrain/Loss": 2.0435328483581543, "Pretrain/Loss (Raw)": 2.2477307319641113, "Pretrain/Step": 5161, "Pretrain/Step Time": 8.51792355813086} +{"Pretrain/Learning Rate": 2.2875850900757288e-05, "Pretrain/Loss": 2.045531988143921, "Pretrain/Loss (Raw)": 2.3231592178344727, "Pretrain/Step": 5162, "Pretrain/Step Time": 8.524360420182347} +{"Pretrain/Learning Rate": 2.2867391850890623e-05, "Pretrain/Loss": 2.0504472255706787, "Pretrain/Loss (Raw)": 2.0921034812927246, "Pretrain/Step": 5163, "Pretrain/Step Time": 8.52342252060771} +{"Pretrain/Learning Rate": 2.285893304696638e-05, "Pretrain/Loss": 2.049656391143799, "Pretrain/Loss (Raw)": 1.9388396739959717, "Pretrain/Step": 5164, "Pretrain/Step Time": 8.514711074531078} +{"Pretrain/Learning Rate": 2.2850474489960065e-05, "Pretrain/Loss": 2.047640800476074, "Pretrain/Loss (Raw)": 1.8783856630325317, "Pretrain/Step": 5165, "Pretrain/Step Time": 8.504584034904838} +{"Pretrain/Learning Rate": 2.2842016180847165e-05, "Pretrain/Loss": 2.047421455383301, "Pretrain/Loss (Raw)": 1.8579703569412231, "Pretrain/Step": 5166, "Pretrain/Step Time": 8.510115696117282} +{"Pretrain/Learning Rate": 2.2833558120603122e-05, "Pretrain/Loss": 2.0485143661499023, "Pretrain/Loss (Raw)": 2.0923821926116943, "Pretrain/Step": 5167, "Pretrain/Step Time": 8.505585934966803} +{"Pretrain/Learning Rate": 2.282510031020337e-05, "Pretrain/Loss": 2.0476605892181396, "Pretrain/Loss (Raw)": 2.0473837852478027, "Pretrain/Step": 5168, "Pretrain/Step Time": 8.503730870783329} +{"Pretrain/Learning Rate": 2.2816642750623294e-05, "Pretrain/Loss": 2.0459628105163574, "Pretrain/Loss (Raw)": 2.024055242538452, "Pretrain/Step": 5169, "Pretrain/Step Time": 8.501923257485032} +{"Pretrain/Learning Rate": 2.280818544283827e-05, "Pretrain/Loss": 2.045198917388916, "Pretrain/Loss (Raw)": 2.001342296600342, "Pretrain/Step": 5170, "Pretrain/Step Time": 8.492051236331463} +{"Pretrain/Learning Rate": 2.279972838782362e-05, "Pretrain/Loss": 2.0462350845336914, "Pretrain/Loss (Raw)": 2.033761978149414, "Pretrain/Step": 5171, "Pretrain/Step Time": 8.494953565299511} +{"Pretrain/Learning Rate": 2.279127158655467e-05, "Pretrain/Loss": 2.0476596355438232, "Pretrain/Loss (Raw)": 2.112431049346924, "Pretrain/Step": 5172, "Pretrain/Step Time": 8.503171775490046} +{"Pretrain/Learning Rate": 2.2782815040006683e-05, "Pretrain/Loss": 2.044909954071045, "Pretrain/Loss (Raw)": 1.8477274179458618, "Pretrain/Step": 5173, "Pretrain/Step Time": 8.502684133127332} +{"Pretrain/Learning Rate": 2.2774358749154917e-05, "Pretrain/Loss": 2.044970989227295, "Pretrain/Loss (Raw)": 1.97917640209198, "Pretrain/Step": 5174, "Pretrain/Step Time": 8.501815009862185} +{"Pretrain/Learning Rate": 2.2765902714974585e-05, "Pretrain/Loss": 2.046051025390625, "Pretrain/Loss (Raw)": 2.216043710708618, "Pretrain/Step": 5175, "Pretrain/Step Time": 8.503502542153} +{"Pretrain/Learning Rate": 2.2757446938440886e-05, "Pretrain/Loss": 2.045231342315674, "Pretrain/Loss (Raw)": 2.0513713359832764, "Pretrain/Step": 5176, "Pretrain/Step Time": 8.492150129750371} +{"Pretrain/Learning Rate": 2.274899142052896e-05, "Pretrain/Loss": 2.0467171669006348, "Pretrain/Loss (Raw)": 2.065264940261841, "Pretrain/Step": 5177, "Pretrain/Step Time": 8.498067090287805} +{"Pretrain/Learning Rate": 2.2740536162213967e-05, "Pretrain/Loss": 2.0475239753723145, "Pretrain/Loss (Raw)": 1.9529356956481934, "Pretrain/Step": 5178, "Pretrain/Step Time": 8.506467813625932} +{"Pretrain/Learning Rate": 2.2732081164470973e-05, "Pretrain/Loss": 2.0450963973999023, "Pretrain/Loss (Raw)": 1.7054187059402466, "Pretrain/Step": 5179, "Pretrain/Step Time": 8.504214968532324} +{"Pretrain/Learning Rate": 2.2723626428275072e-05, "Pretrain/Loss": 2.0461816787719727, "Pretrain/Loss (Raw)": 2.123037099838257, "Pretrain/Step": 5180, "Pretrain/Step Time": 8.504885135218501} +{"Pretrain/Learning Rate": 2.2715171954601303e-05, "Pretrain/Loss": 2.0464911460876465, "Pretrain/Loss (Raw)": 1.9485039710998535, "Pretrain/Step": 5181, "Pretrain/Step Time": 8.500861264765263} +{"Pretrain/Learning Rate": 2.2706717744424664e-05, "Pretrain/Loss": 2.048617362976074, "Pretrain/Loss (Raw)": 2.1656079292297363, "Pretrain/Step": 5182, "Pretrain/Step Time": 8.495271798223257} +{"Pretrain/Learning Rate": 2.2698263798720148e-05, "Pretrain/Loss": 2.0505807399749756, "Pretrain/Loss (Raw)": 2.3177833557128906, "Pretrain/Step": 5183, "Pretrain/Step Time": 8.4990537725389} +{"Pretrain/Learning Rate": 2.268981011846269e-05, "Pretrain/Loss": 2.0504283905029297, "Pretrain/Loss (Raw)": 2.028338670730591, "Pretrain/Step": 5184, "Pretrain/Step Time": 8.497191905975342} +{"Pretrain/Learning Rate": 2.2681356704627226e-05, "Pretrain/Loss": 2.053205728530884, "Pretrain/Loss (Raw)": 2.0613858699798584, "Pretrain/Step": 5185, "Pretrain/Step Time": 8.494761686772108} +{"Pretrain/Learning Rate": 2.267290355818862e-05, "Pretrain/Loss": 2.056157112121582, "Pretrain/Loss (Raw)": 2.0957603454589844, "Pretrain/Step": 5186, "Pretrain/Step Time": 8.494493540376425} +{"Pretrain/Learning Rate": 2.2664450680121754e-05, "Pretrain/Loss": 2.0535969734191895, "Pretrain/Loss (Raw)": 1.8109278678894043, "Pretrain/Step": 5187, "Pretrain/Step Time": 8.494754169136286} +{"Pretrain/Learning Rate": 2.2655998071401424e-05, "Pretrain/Loss": 2.056025266647339, "Pretrain/Loss (Raw)": 2.2433464527130127, "Pretrain/Step": 5188, "Pretrain/Step Time": 8.480336604639888} +{"Pretrain/Learning Rate": 2.264754573300246e-05, "Pretrain/Loss": 2.0567209720611572, "Pretrain/Loss (Raw)": 2.0906004905700684, "Pretrain/Step": 5189, "Pretrain/Step Time": 8.485839158296585} +{"Pretrain/Learning Rate": 2.2639093665899592e-05, "Pretrain/Loss": 2.056375503540039, "Pretrain/Loss (Raw)": 2.1640937328338623, "Pretrain/Step": 5190, "Pretrain/Step Time": 8.491811776533723} +{"Pretrain/Learning Rate": 2.263064187106758e-05, "Pretrain/Loss": 2.0560073852539062, "Pretrain/Loss (Raw)": 2.0388143062591553, "Pretrain/Step": 5191, "Pretrain/Step Time": 8.49268058501184} +{"Pretrain/Learning Rate": 2.2622190349481102e-05, "Pretrain/Loss": 2.055596351623535, "Pretrain/Loss (Raw)": 2.028986692428589, "Pretrain/Step": 5192, "Pretrain/Step Time": 8.493031119927764} +{"Pretrain/Learning Rate": 2.2613739102114846e-05, "Pretrain/Loss": 2.049480438232422, "Pretrain/Loss (Raw)": 2.116002082824707, "Pretrain/Step": 5193, "Pretrain/Step Time": 8.492992186918855} +{"Pretrain/Learning Rate": 2.2605288129943435e-05, "Pretrain/Loss": 2.0491509437561035, "Pretrain/Loss (Raw)": 2.0323548316955566, "Pretrain/Step": 5194, "Pretrain/Step Time": 8.491559954360127} +{"Pretrain/Learning Rate": 2.2596837433941486e-05, "Pretrain/Loss": 2.0494871139526367, "Pretrain/Loss (Raw)": 2.1237246990203857, "Pretrain/Step": 5195, "Pretrain/Step Time": 8.493009705096483} +{"Pretrain/Learning Rate": 2.2588387015083566e-05, "Pretrain/Loss": 2.0492727756500244, "Pretrain/Loss (Raw)": 1.8115743398666382, "Pretrain/Step": 5196, "Pretrain/Step Time": 8.493482641875744} +{"Pretrain/Learning Rate": 2.257993687434422e-05, "Pretrain/Loss": 2.048313856124878, "Pretrain/Loss (Raw)": 1.952676773071289, "Pretrain/Step": 5197, "Pretrain/Step Time": 8.506843717768788} +{"Pretrain/Learning Rate": 2.2571487012697952e-05, "Pretrain/Loss": 2.0488264560699463, "Pretrain/Loss (Raw)": 2.0929481983184814, "Pretrain/Step": 5198, "Pretrain/Step Time": 8.508062964305282} +{"Pretrain/Learning Rate": 2.2563037431119254e-05, "Pretrain/Loss": 2.0522961616516113, "Pretrain/Loss (Raw)": 2.5711569786071777, "Pretrain/Step": 5199, "Pretrain/Step Time": 8.506725640967488} +{"Pretrain/Learning Rate": 2.2554588130582556e-05, "Pretrain/Loss": 2.0538718700408936, "Pretrain/Loss (Raw)": 2.2376132011413574, "Pretrain/Step": 5200, "Pretrain/Step Time": 8.503021342679858} +{"Pretrain/Learning Rate": 2.254613911206228e-05, "Pretrain/Loss": 2.0554027557373047, "Pretrain/Loss (Raw)": 2.26340651512146, "Pretrain/Step": 5201, "Pretrain/Step Time": 8.50295433960855} +{"Pretrain/Learning Rate": 2.25376903765328e-05, "Pretrain/Loss": 2.053748607635498, "Pretrain/Loss (Raw)": 1.9571540355682373, "Pretrain/Step": 5202, "Pretrain/Step Time": 8.505273658782244} +{"Pretrain/Learning Rate": 2.252924192496848e-05, "Pretrain/Loss": 2.055804967880249, "Pretrain/Loss (Raw)": 1.9984214305877686, "Pretrain/Step": 5203, "Pretrain/Step Time": 8.511668609455228} +{"Pretrain/Learning Rate": 2.2520793758343614e-05, "Pretrain/Loss": 2.0537121295928955, "Pretrain/Loss (Raw)": 1.7655946016311646, "Pretrain/Step": 5204, "Pretrain/Step Time": 8.518174985423684} +{"Pretrain/Learning Rate": 2.2512345877632498e-05, "Pretrain/Loss": 2.052138090133667, "Pretrain/Loss (Raw)": 2.062091827392578, "Pretrain/Step": 5205, "Pretrain/Step Time": 8.519295539706945} +{"Pretrain/Learning Rate": 2.2503898283809374e-05, "Pretrain/Loss": 2.0518839359283447, "Pretrain/Loss (Raw)": 2.066704273223877, "Pretrain/Step": 5206, "Pretrain/Step Time": 8.52056384459138} +{"Pretrain/Learning Rate": 2.2495450977848467e-05, "Pretrain/Loss": 2.050717830657959, "Pretrain/Loss (Raw)": 1.881095051765442, "Pretrain/Step": 5207, "Pretrain/Step Time": 8.51313710771501} +{"Pretrain/Learning Rate": 2.248700396072395e-05, "Pretrain/Loss": 2.051302433013916, "Pretrain/Loss (Raw)": 2.0724778175354004, "Pretrain/Step": 5208, "Pretrain/Step Time": 8.518497625365853} +{"Pretrain/Learning Rate": 2.2478557233409986e-05, "Pretrain/Loss": 2.050858497619629, "Pretrain/Loss (Raw)": 2.1489672660827637, "Pretrain/Step": 5209, "Pretrain/Step Time": 8.521961154416203} +{"Pretrain/Learning Rate": 2.2470110796880673e-05, "Pretrain/Loss": 2.0515329837799072, "Pretrain/Loss (Raw)": 2.031095027923584, "Pretrain/Step": 5210, "Pretrain/Step Time": 8.523654403164983} +{"Pretrain/Learning Rate": 2.246166465211011e-05, "Pretrain/Loss": 2.0518155097961426, "Pretrain/Loss (Raw)": 2.0161190032958984, "Pretrain/Step": 5211, "Pretrain/Step Time": 8.521134415641427} +{"Pretrain/Learning Rate": 2.245321880007234e-05, "Pretrain/Loss": 2.0501604080200195, "Pretrain/Loss (Raw)": 2.0118541717529297, "Pretrain/Step": 5212, "Pretrain/Step Time": 8.5234963465482} +{"Pretrain/Learning Rate": 2.244477324174138e-05, "Pretrain/Loss": 2.050326108932495, "Pretrain/Loss (Raw)": 1.9681721925735474, "Pretrain/Step": 5213, "Pretrain/Step Time": 8.521186910569668} +{"Pretrain/Learning Rate": 2.2436327978091205e-05, "Pretrain/Loss": 2.0512285232543945, "Pretrain/Loss (Raw)": 2.3978748321533203, "Pretrain/Step": 5214, "Pretrain/Step Time": 8.523705312982202} +{"Pretrain/Learning Rate": 2.2427883010095775e-05, "Pretrain/Loss": 2.0551838874816895, "Pretrain/Loss (Raw)": 2.1057724952697754, "Pretrain/Step": 5215, "Pretrain/Step Time": 8.525318011641502} +{"Pretrain/Learning Rate": 2.241943833872899e-05, "Pretrain/Loss": 2.055335760116577, "Pretrain/Loss (Raw)": 1.9241786003112793, "Pretrain/Step": 5216, "Pretrain/Step Time": 8.529262285679579} +{"Pretrain/Learning Rate": 2.2410993964964745e-05, "Pretrain/Loss": 2.056060791015625, "Pretrain/Loss (Raw)": 2.110175609588623, "Pretrain/Step": 5217, "Pretrain/Step Time": 8.525802170857787} +{"Pretrain/Learning Rate": 2.2402549889776864e-05, "Pretrain/Loss": 2.0564985275268555, "Pretrain/Loss (Raw)": 2.141187906265259, "Pretrain/Step": 5218, "Pretrain/Step Time": 8.521147007122636} +{"Pretrain/Learning Rate": 2.2394106114139183e-05, "Pretrain/Loss": 2.055779218673706, "Pretrain/Loss (Raw)": 2.062455177307129, "Pretrain/Step": 5219, "Pretrain/Step Time": 8.51937859132886} +{"Pretrain/Learning Rate": 2.2385662639025448e-05, "Pretrain/Loss": 2.050318956375122, "Pretrain/Loss (Raw)": 1.5074174404144287, "Pretrain/Step": 5220, "Pretrain/Step Time": 8.526037774980068} +{"Pretrain/Learning Rate": 2.237721946540942e-05, "Pretrain/Loss": 2.049941301345825, "Pretrain/Loss (Raw)": 1.9797899723052979, "Pretrain/Step": 5221, "Pretrain/Step Time": 8.528034513816237} +{"Pretrain/Learning Rate": 2.2368776594264813e-05, "Pretrain/Loss": 2.0481929779052734, "Pretrain/Loss (Raw)": 1.9320282936096191, "Pretrain/Step": 5222, "Pretrain/Step Time": 8.532013459131122} +{"Pretrain/Learning Rate": 2.2360334026565277e-05, "Pretrain/Loss": 2.0451717376708984, "Pretrain/Loss (Raw)": 1.7508515119552612, "Pretrain/Step": 5223, "Pretrain/Step Time": 8.524354981258512} +{"Pretrain/Learning Rate": 2.2351891763284466e-05, "Pretrain/Loss": 2.045506477355957, "Pretrain/Loss (Raw)": 2.171626567840576, "Pretrain/Step": 5224, "Pretrain/Step Time": 8.522352484986186} +{"Pretrain/Learning Rate": 2.2343449805395973e-05, "Pretrain/Loss": 2.0422165393829346, "Pretrain/Loss (Raw)": 1.7204071283340454, "Pretrain/Step": 5225, "Pretrain/Step Time": 8.52579789236188} +{"Pretrain/Learning Rate": 2.2335008153873375e-05, "Pretrain/Loss": 2.050114393234253, "Pretrain/Loss (Raw)": 2.3779008388519287, "Pretrain/Step": 5226, "Pretrain/Step Time": 8.529951862990856} +{"Pretrain/Learning Rate": 2.2326566809690176e-05, "Pretrain/Loss": 2.050079345703125, "Pretrain/Loss (Raw)": 1.9508144855499268, "Pretrain/Step": 5227, "Pretrain/Step Time": 8.529741706326604} +{"Pretrain/Learning Rate": 2.2318125773819913e-05, "Pretrain/Loss": 2.0495247840881348, "Pretrain/Loss (Raw)": 2.0978431701660156, "Pretrain/Step": 5228, "Pretrain/Step Time": 8.528150973841548} +{"Pretrain/Learning Rate": 2.2309685047236002e-05, "Pretrain/Loss": 2.047740936279297, "Pretrain/Loss (Raw)": 1.9632318019866943, "Pretrain/Step": 5229, "Pretrain/Step Time": 8.518716195598245} +{"Pretrain/Learning Rate": 2.2301244630911904e-05, "Pretrain/Loss": 2.046814441680908, "Pretrain/Loss (Raw)": 2.1111602783203125, "Pretrain/Step": 5230, "Pretrain/Step Time": 8.51839050091803} +{"Pretrain/Learning Rate": 2.229280452582098e-05, "Pretrain/Loss": 2.048569917678833, "Pretrain/Loss (Raw)": 2.0974717140197754, "Pretrain/Step": 5231, "Pretrain/Step Time": 8.521784976124763} +{"Pretrain/Learning Rate": 2.2284364732936608e-05, "Pretrain/Loss": 2.0503926277160645, "Pretrain/Loss (Raw)": 2.202878952026367, "Pretrain/Step": 5232, "Pretrain/Step Time": 8.532235991209745} +{"Pretrain/Learning Rate": 2.2275925253232073e-05, "Pretrain/Loss": 2.0522680282592773, "Pretrain/Loss (Raw)": 2.1125574111938477, "Pretrain/Step": 5233, "Pretrain/Step Time": 8.53086999244988} +{"Pretrain/Learning Rate": 2.2267486087680695e-05, "Pretrain/Loss": 2.055398464202881, "Pretrain/Loss (Raw)": 2.215893268585205, "Pretrain/Step": 5234, "Pretrain/Step Time": 8.53428615257144} +{"Pretrain/Learning Rate": 2.2259047237255684e-05, "Pretrain/Loss": 2.0569872856140137, "Pretrain/Loss (Raw)": 1.9958381652832031, "Pretrain/Step": 5235, "Pretrain/Step Time": 8.52436326816678} +{"Pretrain/Learning Rate": 2.2250608702930266e-05, "Pretrain/Loss": 2.055962085723877, "Pretrain/Loss (Raw)": 1.8893542289733887, "Pretrain/Step": 5236, "Pretrain/Step Time": 8.527685917913914} +{"Pretrain/Learning Rate": 2.2242170485677606e-05, "Pretrain/Loss": 2.0542807579040527, "Pretrain/Loss (Raw)": 1.7789171934127808, "Pretrain/Step": 5237, "Pretrain/Step Time": 8.527172157540917} +{"Pretrain/Learning Rate": 2.223373258647084e-05, "Pretrain/Loss": 2.0575711727142334, "Pretrain/Loss (Raw)": 2.3937668800354004, "Pretrain/Step": 5238, "Pretrain/Step Time": 8.535171682015061} +{"Pretrain/Learning Rate": 2.222529500628307e-05, "Pretrain/Loss": 2.058518171310425, "Pretrain/Loss (Raw)": 2.1939175128936768, "Pretrain/Step": 5239, "Pretrain/Step Time": 8.534639129415154} +{"Pretrain/Learning Rate": 2.2216857746087355e-05, "Pretrain/Loss": 2.057122230529785, "Pretrain/Loss (Raw)": 2.07584810256958, "Pretrain/Step": 5240, "Pretrain/Step Time": 8.534578384831548} +{"Pretrain/Learning Rate": 2.2208420806856718e-05, "Pretrain/Loss": 2.0584936141967773, "Pretrain/Loss (Raw)": 2.009253978729248, "Pretrain/Step": 5241, "Pretrain/Step Time": 8.53633051365614} +{"Pretrain/Learning Rate": 2.2199984189564148e-05, "Pretrain/Loss": 2.0561575889587402, "Pretrain/Loss (Raw)": 1.877418875694275, "Pretrain/Step": 5242, "Pretrain/Step Time": 8.527832860127091} +{"Pretrain/Learning Rate": 2.2191547895182594e-05, "Pretrain/Loss": 2.0558102130889893, "Pretrain/Loss (Raw)": 2.1892881393432617, "Pretrain/Step": 5243, "Pretrain/Step Time": 8.522642605006695} +{"Pretrain/Learning Rate": 2.2183111924684975e-05, "Pretrain/Loss": 2.0566911697387695, "Pretrain/Loss (Raw)": 2.0465798377990723, "Pretrain/Step": 5244, "Pretrain/Step Time": 8.523695236071944} +{"Pretrain/Learning Rate": 2.2174676279044153e-05, "Pretrain/Loss": 2.0569372177124023, "Pretrain/Loss (Raw)": 2.1673765182495117, "Pretrain/Step": 5245, "Pretrain/Step Time": 8.525602193549275} +{"Pretrain/Learning Rate": 2.2166240959232985e-05, "Pretrain/Loss": 2.0579442977905273, "Pretrain/Loss (Raw)": 2.1265921592712402, "Pretrain/Step": 5246, "Pretrain/Step Time": 8.523928888142109} +{"Pretrain/Learning Rate": 2.215780596622426e-05, "Pretrain/Loss": 2.058330535888672, "Pretrain/Loss (Raw)": 2.0784058570861816, "Pretrain/Step": 5247, "Pretrain/Step Time": 8.51663082279265} +{"Pretrain/Learning Rate": 2.2149371300990745e-05, "Pretrain/Loss": 2.0590224266052246, "Pretrain/Loss (Raw)": 2.158195734024048, "Pretrain/Step": 5248, "Pretrain/Step Time": 8.517364375293255} +{"Pretrain/Learning Rate": 2.214093696450516e-05, "Pretrain/Loss": 2.055718421936035, "Pretrain/Loss (Raw)": 1.6952166557312012, "Pretrain/Step": 5249, "Pretrain/Step Time": 8.510213697329164} +{"Pretrain/Learning Rate": 2.21325029577402e-05, "Pretrain/Loss": 2.055325508117676, "Pretrain/Loss (Raw)": 2.073054790496826, "Pretrain/Step": 5250, "Pretrain/Step Time": 8.5160590428859} +{"Pretrain/Learning Rate": 2.2124069281668507e-05, "Pretrain/Loss": 2.0567140579223633, "Pretrain/Loss (Raw)": 2.139289617538452, "Pretrain/Step": 5251, "Pretrain/Step Time": 8.514309875667095} +{"Pretrain/Learning Rate": 2.2115635937262706e-05, "Pretrain/Loss": 2.0564284324645996, "Pretrain/Loss (Raw)": 1.99599027633667, "Pretrain/Step": 5252, "Pretrain/Step Time": 8.514719950035214} +{"Pretrain/Learning Rate": 2.210720292549535e-05, "Pretrain/Loss": 2.0572807788848877, "Pretrain/Loss (Raw)": 2.0342319011688232, "Pretrain/Step": 5253, "Pretrain/Step Time": 8.506423514336348} +{"Pretrain/Learning Rate": 2.209877024733899e-05, "Pretrain/Loss": 2.0568838119506836, "Pretrain/Loss (Raw)": 2.0678670406341553, "Pretrain/Step": 5254, "Pretrain/Step Time": 8.506869265809655} +{"Pretrain/Learning Rate": 2.209033790376611e-05, "Pretrain/Loss": 2.055243968963623, "Pretrain/Loss (Raw)": 2.0058393478393555, "Pretrain/Step": 5255, "Pretrain/Step Time": 8.507683401927352} +{"Pretrain/Learning Rate": 2.2081905895749183e-05, "Pretrain/Loss": 2.0558135509490967, "Pretrain/Loss (Raw)": 2.0863399505615234, "Pretrain/Step": 5256, "Pretrain/Step Time": 8.506946336477995} +{"Pretrain/Learning Rate": 2.207347422426061e-05, "Pretrain/Loss": 2.0571093559265137, "Pretrain/Loss (Raw)": 2.0963215827941895, "Pretrain/Step": 5257, "Pretrain/Step Time": 8.511424221098423} +{"Pretrain/Learning Rate": 2.206504289027279e-05, "Pretrain/Loss": 2.0574026107788086, "Pretrain/Loss (Raw)": 1.8311821222305298, "Pretrain/Step": 5258, "Pretrain/Step Time": 8.510316111147404} +{"Pretrain/Learning Rate": 2.2056611894758038e-05, "Pretrain/Loss": 2.0544140338897705, "Pretrain/Loss (Raw)": 1.8793588876724243, "Pretrain/Step": 5259, "Pretrain/Step Time": 8.512016260996461} +{"Pretrain/Learning Rate": 2.204818123868869e-05, "Pretrain/Loss": 2.0539541244506836, "Pretrain/Loss (Raw)": 1.9563294649124146, "Pretrain/Step": 5260, "Pretrain/Step Time": 8.510368168354034} +{"Pretrain/Learning Rate": 2.203975092303697e-05, "Pretrain/Loss": 2.0514464378356934, "Pretrain/Loss (Raw)": 2.010861873626709, "Pretrain/Step": 5261, "Pretrain/Step Time": 8.51506619155407} +{"Pretrain/Learning Rate": 2.2031320948775135e-05, "Pretrain/Loss": 2.053030014038086, "Pretrain/Loss (Raw)": 2.0460262298583984, "Pretrain/Step": 5262, "Pretrain/Step Time": 8.512451788410544} +{"Pretrain/Learning Rate": 2.2022891316875362e-05, "Pretrain/Loss": 2.0519068241119385, "Pretrain/Loss (Raw)": 1.9594709873199463, "Pretrain/Step": 5263, "Pretrain/Step Time": 8.51226027496159} +{"Pretrain/Learning Rate": 2.201446202830978e-05, "Pretrain/Loss": 2.0492055416107178, "Pretrain/Loss (Raw)": 1.952648639678955, "Pretrain/Step": 5264, "Pretrain/Step Time": 8.516476852819324} +{"Pretrain/Learning Rate": 2.2006033084050516e-05, "Pretrain/Loss": 2.0507850646972656, "Pretrain/Loss (Raw)": 2.2222115993499756, "Pretrain/Step": 5265, "Pretrain/Step Time": 8.504405830055475} +{"Pretrain/Learning Rate": 2.1997604485069614e-05, "Pretrain/Loss": 2.0516414642333984, "Pretrain/Loss (Raw)": 2.087327718734741, "Pretrain/Step": 5266, "Pretrain/Step Time": 8.508857084438205} +{"Pretrain/Learning Rate": 2.1989176232339122e-05, "Pretrain/Loss": 2.0499818325042725, "Pretrain/Loss (Raw)": 2.027160882949829, "Pretrain/Step": 5267, "Pretrain/Step Time": 8.504107559099793} +{"Pretrain/Learning Rate": 2.1980748326831002e-05, "Pretrain/Loss": 2.051260471343994, "Pretrain/Loss (Raw)": 2.151526927947998, "Pretrain/Step": 5268, "Pretrain/Step Time": 8.506111500784755} +{"Pretrain/Learning Rate": 2.1972320769517226e-05, "Pretrain/Loss": 2.0526485443115234, "Pretrain/Loss (Raw)": 2.0658493041992188, "Pretrain/Step": 5269, "Pretrain/Step Time": 8.506573924794793} +{"Pretrain/Learning Rate": 2.1963893561369672e-05, "Pretrain/Loss": 2.050516128540039, "Pretrain/Loss (Raw)": 1.8647570610046387, "Pretrain/Step": 5270, "Pretrain/Step Time": 8.50501806102693} +{"Pretrain/Learning Rate": 2.1955466703360232e-05, "Pretrain/Loss": 2.0498199462890625, "Pretrain/Loss (Raw)": 2.1474738121032715, "Pretrain/Step": 5271, "Pretrain/Step Time": 8.498817011713982} +{"Pretrain/Learning Rate": 2.1947040196460704e-05, "Pretrain/Loss": 2.048902988433838, "Pretrain/Loss (Raw)": 1.9356639385223389, "Pretrain/Step": 5272, "Pretrain/Step Time": 8.497179105877876} +{"Pretrain/Learning Rate": 2.1938614041642903e-05, "Pretrain/Loss": 2.0454413890838623, "Pretrain/Loss (Raw)": 1.9647870063781738, "Pretrain/Step": 5273, "Pretrain/Step Time": 8.497116107493639} +{"Pretrain/Learning Rate": 2.1930188239878537e-05, "Pretrain/Loss": 2.045147657394409, "Pretrain/Loss (Raw)": 2.010241746902466, "Pretrain/Step": 5274, "Pretrain/Step Time": 8.50038549490273} +{"Pretrain/Learning Rate": 2.192176279213935e-05, "Pretrain/Loss": 2.045152425765991, "Pretrain/Loss (Raw)": 2.168562889099121, "Pretrain/Step": 5275, "Pretrain/Step Time": 8.500798778608441} +{"Pretrain/Learning Rate": 2.191333769939696e-05, "Pretrain/Loss": 2.043844699859619, "Pretrain/Loss (Raw)": 1.927782416343689, "Pretrain/Step": 5276, "Pretrain/Step Time": 8.499242665246129} +{"Pretrain/Learning Rate": 2.1904912962623035e-05, "Pretrain/Loss": 2.041923999786377, "Pretrain/Loss (Raw)": 1.783761978149414, "Pretrain/Step": 5277, "Pretrain/Step Time": 8.49878204986453} +{"Pretrain/Learning Rate": 2.1896488582789117e-05, "Pretrain/Loss": 2.041090250015259, "Pretrain/Loss (Raw)": 1.9679621458053589, "Pretrain/Step": 5278, "Pretrain/Step Time": 8.503337502479553} +{"Pretrain/Learning Rate": 2.1888064560866765e-05, "Pretrain/Loss": 2.0429534912109375, "Pretrain/Loss (Raw)": 2.0880234241485596, "Pretrain/Step": 5279, "Pretrain/Step Time": 8.507514078170061} +{"Pretrain/Learning Rate": 2.187964089782747e-05, "Pretrain/Loss": 2.044656753540039, "Pretrain/Loss (Raw)": 2.142125129699707, "Pretrain/Step": 5280, "Pretrain/Step Time": 8.511311696842313} +{"Pretrain/Learning Rate": 2.187121759464269e-05, "Pretrain/Loss": 2.0432848930358887, "Pretrain/Loss (Raw)": 1.7631404399871826, "Pretrain/Step": 5281, "Pretrain/Step Time": 8.5083620082587} +{"Pretrain/Learning Rate": 2.1862794652283837e-05, "Pretrain/Loss": 2.0435357093811035, "Pretrain/Loss (Raw)": 2.168933391571045, "Pretrain/Step": 5282, "Pretrain/Step Time": 8.501127498224378} +{"Pretrain/Learning Rate": 2.1854372071722297e-05, "Pretrain/Loss": 2.04195499420166, "Pretrain/Loss (Raw)": 2.0069565773010254, "Pretrain/Step": 5283, "Pretrain/Step Time": 8.504323568195105} +{"Pretrain/Learning Rate": 2.1845949853929382e-05, "Pretrain/Loss": 2.039527177810669, "Pretrain/Loss (Raw)": 1.920480728149414, "Pretrain/Step": 5284, "Pretrain/Step Time": 8.506946155801415} +{"Pretrain/Learning Rate": 2.1837527999876396e-05, "Pretrain/Loss": 2.039081573486328, "Pretrain/Loss (Raw)": 1.9179418087005615, "Pretrain/Step": 5285, "Pretrain/Step Time": 8.512796338647604} +{"Pretrain/Learning Rate": 2.1829106510534585e-05, "Pretrain/Loss": 2.040468454360962, "Pretrain/Loss (Raw)": 2.186403512954712, "Pretrain/Step": 5286, "Pretrain/Step Time": 8.509521370753646} +{"Pretrain/Learning Rate": 2.1820685386875155e-05, "Pretrain/Loss": 2.0395591259002686, "Pretrain/Loss (Raw)": 2.0393099784851074, "Pretrain/Step": 5287, "Pretrain/Step Time": 8.505291054025292} +{"Pretrain/Learning Rate": 2.1812264629869257e-05, "Pretrain/Loss": 2.0389890670776367, "Pretrain/Loss (Raw)": 1.922048568725586, "Pretrain/Step": 5288, "Pretrain/Step Time": 8.497483603656292} +{"Pretrain/Learning Rate": 2.1803844240488036e-05, "Pretrain/Loss": 2.03574800491333, "Pretrain/Loss (Raw)": 1.8328503370285034, "Pretrain/Step": 5289, "Pretrain/Step Time": 8.506329342722893} +{"Pretrain/Learning Rate": 2.179542421970255e-05, "Pretrain/Loss": 2.033093214035034, "Pretrain/Loss (Raw)": 1.9833742380142212, "Pretrain/Step": 5290, "Pretrain/Step Time": 8.502447528764606} +{"Pretrain/Learning Rate": 2.1787004568483846e-05, "Pretrain/Loss": 2.0327725410461426, "Pretrain/Loss (Raw)": 2.051025867462158, "Pretrain/Step": 5291, "Pretrain/Step Time": 8.505319219082594} +{"Pretrain/Learning Rate": 2.1778585287802914e-05, "Pretrain/Loss": 2.032622814178467, "Pretrain/Loss (Raw)": 1.9197160005569458, "Pretrain/Step": 5292, "Pretrain/Step Time": 8.506226086989045} +{"Pretrain/Learning Rate": 2.1770166378630708e-05, "Pretrain/Loss": 2.037397861480713, "Pretrain/Loss (Raw)": 2.4895989894866943, "Pretrain/Step": 5293, "Pretrain/Step Time": 8.516597544774413} +{"Pretrain/Learning Rate": 2.1761747841938133e-05, "Pretrain/Loss": 2.038936138153076, "Pretrain/Loss (Raw)": 2.054842948913574, "Pretrain/Step": 5294, "Pretrain/Step Time": 8.506742049008608} +{"Pretrain/Learning Rate": 2.175332967869606e-05, "Pretrain/Loss": 2.0395030975341797, "Pretrain/Loss (Raw)": 2.1649558544158936, "Pretrain/Step": 5295, "Pretrain/Step Time": 8.508203661069274} +{"Pretrain/Learning Rate": 2.17449118898753e-05, "Pretrain/Loss": 2.0401558876037598, "Pretrain/Loss (Raw)": 2.130915641784668, "Pretrain/Step": 5296, "Pretrain/Step Time": 8.507414050400257} +{"Pretrain/Learning Rate": 2.1736494476446646e-05, "Pretrain/Loss": 2.0405616760253906, "Pretrain/Loss (Raw)": 2.0760209560394287, "Pretrain/Step": 5297, "Pretrain/Step Time": 8.518644632771611} +{"Pretrain/Learning Rate": 2.172807743938082e-05, "Pretrain/Loss": 2.0403709411621094, "Pretrain/Loss (Raw)": 1.9769169092178345, "Pretrain/Step": 5298, "Pretrain/Step Time": 8.521342284977436} +{"Pretrain/Learning Rate": 2.171966077964853e-05, "Pretrain/Loss": 2.0388998985290527, "Pretrain/Loss (Raw)": 1.8454703092575073, "Pretrain/Step": 5299, "Pretrain/Step Time": 8.522234054282308} +{"Pretrain/Learning Rate": 2.1711244498220412e-05, "Pretrain/Loss": 2.03695011138916, "Pretrain/Loss (Raw)": 1.8628861904144287, "Pretrain/Step": 5300, "Pretrain/Step Time": 8.512498281896114} +{"Pretrain/Learning Rate": 2.170282859606708e-05, "Pretrain/Loss": 2.0388402938842773, "Pretrain/Loss (Raw)": 2.0896499156951904, "Pretrain/Step": 5301, "Pretrain/Step Time": 8.510384963825345} +{"Pretrain/Learning Rate": 2.1694413074159082e-05, "Pretrain/Loss": 2.0394906997680664, "Pretrain/Loss (Raw)": 2.062396287918091, "Pretrain/Step": 5302, "Pretrain/Step Time": 8.510936547070742} +{"Pretrain/Learning Rate": 2.1685997933466948e-05, "Pretrain/Loss": 2.0381393432617188, "Pretrain/Loss (Raw)": 2.0431201457977295, "Pretrain/Step": 5303, "Pretrain/Step Time": 8.516857823356986} +{"Pretrain/Learning Rate": 2.167758317496115e-05, "Pretrain/Loss": 2.0383083820343018, "Pretrain/Loss (Raw)": 2.072990894317627, "Pretrain/Step": 5304, "Pretrain/Step Time": 8.518854226917028} +{"Pretrain/Learning Rate": 2.1669168799612118e-05, "Pretrain/Loss": 2.0387330055236816, "Pretrain/Loss (Raw)": 2.119596242904663, "Pretrain/Step": 5305, "Pretrain/Step Time": 8.52084913291037} +{"Pretrain/Learning Rate": 2.1660754808390235e-05, "Pretrain/Loss": 2.0383877754211426, "Pretrain/Loss (Raw)": 1.9087640047073364, "Pretrain/Step": 5306, "Pretrain/Step Time": 8.506903221830726} +{"Pretrain/Learning Rate": 2.1652341202265838e-05, "Pretrain/Loss": 2.0416765213012695, "Pretrain/Loss (Raw)": 2.126352548599243, "Pretrain/Step": 5307, "Pretrain/Step Time": 8.510469667613506} +{"Pretrain/Learning Rate": 2.1643927982209233e-05, "Pretrain/Loss": 2.039816379547119, "Pretrain/Loss (Raw)": 1.884961485862732, "Pretrain/Step": 5308, "Pretrain/Step Time": 8.511093778535724} +{"Pretrain/Learning Rate": 2.1635515149190665e-05, "Pretrain/Loss": 2.0411932468414307, "Pretrain/Loss (Raw)": 2.1247477531433105, "Pretrain/Step": 5309, "Pretrain/Step Time": 8.51972989924252} +{"Pretrain/Learning Rate": 2.1627102704180353e-05, "Pretrain/Loss": 2.04066801071167, "Pretrain/Loss (Raw)": 2.0983667373657227, "Pretrain/Step": 5310, "Pretrain/Step Time": 8.523466879501939} +{"Pretrain/Learning Rate": 2.1618690648148435e-05, "Pretrain/Loss": 2.037621259689331, "Pretrain/Loss (Raw)": 1.927807092666626, "Pretrain/Step": 5311, "Pretrain/Step Time": 8.517202405259013} +{"Pretrain/Learning Rate": 2.161027898206506e-05, "Pretrain/Loss": 2.037165641784668, "Pretrain/Loss (Raw)": 1.970028281211853, "Pretrain/Step": 5312, "Pretrain/Step Time": 8.521192846819758} +{"Pretrain/Learning Rate": 2.160186770690027e-05, "Pretrain/Loss": 2.035757541656494, "Pretrain/Loss (Raw)": 1.8811262845993042, "Pretrain/Step": 5313, "Pretrain/Step Time": 8.520218780264258} +{"Pretrain/Learning Rate": 2.1593456823624127e-05, "Pretrain/Loss": 2.036020278930664, "Pretrain/Loss (Raw)": 2.1294310092926025, "Pretrain/Step": 5314, "Pretrain/Step Time": 8.524178544059396} +{"Pretrain/Learning Rate": 2.1585046333206573e-05, "Pretrain/Loss": 2.0379695892333984, "Pretrain/Loss (Raw)": 2.0603933334350586, "Pretrain/Step": 5315, "Pretrain/Step Time": 8.53495578840375} +{"Pretrain/Learning Rate": 2.157663623661759e-05, "Pretrain/Loss": 2.0357303619384766, "Pretrain/Loss (Raw)": 1.9567607641220093, "Pretrain/Step": 5316, "Pretrain/Step Time": 8.536830784752965} +{"Pretrain/Learning Rate": 2.156822653482703e-05, "Pretrain/Loss": 2.035733938217163, "Pretrain/Loss (Raw)": 2.0910415649414062, "Pretrain/Step": 5317, "Pretrain/Step Time": 8.530871704220772} +{"Pretrain/Learning Rate": 2.155981722880477e-05, "Pretrain/Loss": 2.035663366317749, "Pretrain/Loss (Raw)": 2.1550562381744385, "Pretrain/Step": 5318, "Pretrain/Step Time": 8.524660885334015} +{"Pretrain/Learning Rate": 2.1551408319520588e-05, "Pretrain/Loss": 2.0351576805114746, "Pretrain/Loss (Raw)": 1.9740877151489258, "Pretrain/Step": 5319, "Pretrain/Step Time": 8.52469609491527} +{"Pretrain/Learning Rate": 2.1542999807944258e-05, "Pretrain/Loss": 2.034679889678955, "Pretrain/Loss (Raw)": 1.9678632020950317, "Pretrain/Step": 5320, "Pretrain/Step Time": 8.534462226554751} +{"Pretrain/Learning Rate": 2.1534591695045473e-05, "Pretrain/Loss": 2.034740447998047, "Pretrain/Loss (Raw)": 2.123721122741699, "Pretrain/Step": 5321, "Pretrain/Step Time": 8.533651262521744} +{"Pretrain/Learning Rate": 2.1526183981793908e-05, "Pretrain/Loss": 2.035536289215088, "Pretrain/Loss (Raw)": 2.134244441986084, "Pretrain/Step": 5322, "Pretrain/Step Time": 8.537992212921381} +{"Pretrain/Learning Rate": 2.1517776669159166e-05, "Pretrain/Loss": 2.036177635192871, "Pretrain/Loss (Raw)": 2.2057952880859375, "Pretrain/Step": 5323, "Pretrain/Step Time": 8.537176290526986} +{"Pretrain/Learning Rate": 2.150936975811084e-05, "Pretrain/Loss": 2.038252115249634, "Pretrain/Loss (Raw)": 2.077124834060669, "Pretrain/Step": 5324, "Pretrain/Step Time": 8.538180449977517} +{"Pretrain/Learning Rate": 2.1500963249618433e-05, "Pretrain/Loss": 2.0351510047912598, "Pretrain/Loss (Raw)": 1.555694818496704, "Pretrain/Step": 5325, "Pretrain/Step Time": 8.532162383198738} +{"Pretrain/Learning Rate": 2.149255714465144e-05, "Pretrain/Loss": 2.0364174842834473, "Pretrain/Loss (Raw)": 2.2550549507141113, "Pretrain/Step": 5326, "Pretrain/Step Time": 8.527667256072164} +{"Pretrain/Learning Rate": 2.1484151444179273e-05, "Pretrain/Loss": 2.031632900238037, "Pretrain/Loss (Raw)": 1.9587541818618774, "Pretrain/Step": 5327, "Pretrain/Step Time": 8.54081286676228} +{"Pretrain/Learning Rate": 2.147574614917134e-05, "Pretrain/Loss": 2.0297951698303223, "Pretrain/Loss (Raw)": 2.002415180206299, "Pretrain/Step": 5328, "Pretrain/Step Time": 8.540027253329754} +{"Pretrain/Learning Rate": 2.146734126059696e-05, "Pretrain/Loss": 2.02901554107666, "Pretrain/Loss (Raw)": 2.163594961166382, "Pretrain/Step": 5329, "Pretrain/Step Time": 8.538502724841237} +{"Pretrain/Learning Rate": 2.1458936779425438e-05, "Pretrain/Loss": 2.029236316680908, "Pretrain/Loss (Raw)": 1.9854029417037964, "Pretrain/Step": 5330, "Pretrain/Step Time": 8.540572434663773} +{"Pretrain/Learning Rate": 2.145053270662601e-05, "Pretrain/Loss": 2.029470920562744, "Pretrain/Loss (Raw)": 2.0284762382507324, "Pretrain/Step": 5331, "Pretrain/Step Time": 8.527503410354257} +{"Pretrain/Learning Rate": 2.1442129043167874e-05, "Pretrain/Loss": 2.0306901931762695, "Pretrain/Loss (Raw)": 1.9216258525848389, "Pretrain/Step": 5332, "Pretrain/Step Time": 8.520425863564014} +{"Pretrain/Learning Rate": 2.1433725790020186e-05, "Pretrain/Loss": 2.031602382659912, "Pretrain/Loss (Raw)": 2.1788814067840576, "Pretrain/Step": 5333, "Pretrain/Step Time": 8.523896561935544} +{"Pretrain/Learning Rate": 2.1425322948152042e-05, "Pretrain/Loss": 2.030195713043213, "Pretrain/Loss (Raw)": 1.8866270780563354, "Pretrain/Step": 5334, "Pretrain/Step Time": 8.523951210081577} +{"Pretrain/Learning Rate": 2.14169205185325e-05, "Pretrain/Loss": 2.0302810668945312, "Pretrain/Loss (Raw)": 1.8920202255249023, "Pretrain/Step": 5335, "Pretrain/Step Time": 8.526439666748047} +{"Pretrain/Learning Rate": 2.140851850213057e-05, "Pretrain/Loss": 2.0310332775115967, "Pretrain/Loss (Raw)": 2.1687772274017334, "Pretrain/Step": 5336, "Pretrain/Step Time": 8.525353897362947} +{"Pretrain/Learning Rate": 2.1400116899915205e-05, "Pretrain/Loss": 2.03212308883667, "Pretrain/Loss (Raw)": 2.2884531021118164, "Pretrain/Step": 5337, "Pretrain/Step Time": 8.51998563297093} +{"Pretrain/Learning Rate": 2.1391715712855327e-05, "Pretrain/Loss": 2.0335288047790527, "Pretrain/Loss (Raw)": 2.2110211849212646, "Pretrain/Step": 5338, "Pretrain/Step Time": 8.52018111385405} +{"Pretrain/Learning Rate": 2.1383314941919795e-05, "Pretrain/Loss": 2.0334601402282715, "Pretrain/Loss (Raw)": 2.0073230266571045, "Pretrain/Step": 5339, "Pretrain/Step Time": 8.526082618162036} +{"Pretrain/Learning Rate": 2.1374914588077427e-05, "Pretrain/Loss": 2.0314362049102783, "Pretrain/Loss (Raw)": 1.752799391746521, "Pretrain/Step": 5340, "Pretrain/Step Time": 8.524903010576963} +{"Pretrain/Learning Rate": 2.1366514652296987e-05, "Pretrain/Loss": 2.0288777351379395, "Pretrain/Loss (Raw)": 1.6406887769699097, "Pretrain/Step": 5341, "Pretrain/Step Time": 8.52562508918345} +{"Pretrain/Learning Rate": 2.135811513554721e-05, "Pretrain/Loss": 2.0264010429382324, "Pretrain/Loss (Raw)": 2.080864667892456, "Pretrain/Step": 5342, "Pretrain/Step Time": 8.522195354104042} +{"Pretrain/Learning Rate": 2.1349716038796742e-05, "Pretrain/Loss": 2.027021884918213, "Pretrain/Loss (Raw)": 2.1852104663848877, "Pretrain/Step": 5343, "Pretrain/Step Time": 8.52439415641129} +{"Pretrain/Learning Rate": 2.1341317363014223e-05, "Pretrain/Loss": 2.028240203857422, "Pretrain/Loss (Raw)": 2.0801403522491455, "Pretrain/Step": 5344, "Pretrain/Step Time": 8.523164054378867} +{"Pretrain/Learning Rate": 2.133291910916823e-05, "Pretrain/Loss": 2.0304646492004395, "Pretrain/Loss (Raw)": 2.3949215412139893, "Pretrain/Step": 5345, "Pretrain/Step Time": 8.516434686258435} +{"Pretrain/Learning Rate": 2.1324521278227287e-05, "Pretrain/Loss": 2.0301730632781982, "Pretrain/Loss (Raw)": 2.1038522720336914, "Pretrain/Step": 5346, "Pretrain/Step Time": 8.520774813368917} +{"Pretrain/Learning Rate": 2.131612387115987e-05, "Pretrain/Loss": 2.031355142593384, "Pretrain/Loss (Raw)": 2.2137744426727295, "Pretrain/Step": 5347, "Pretrain/Step Time": 8.519269971176982} +{"Pretrain/Learning Rate": 2.13077268889344e-05, "Pretrain/Loss": 2.0351059436798096, "Pretrain/Loss (Raw)": 1.9875140190124512, "Pretrain/Step": 5348, "Pretrain/Step Time": 8.513609686866403} +{"Pretrain/Learning Rate": 2.1299330332519273e-05, "Pretrain/Loss": 2.0361194610595703, "Pretrain/Loss (Raw)": 2.109534502029419, "Pretrain/Step": 5349, "Pretrain/Step Time": 8.519856974482536} +{"Pretrain/Learning Rate": 2.1290934202882805e-05, "Pretrain/Loss": 2.0343809127807617, "Pretrain/Loss (Raw)": 1.7094852924346924, "Pretrain/Step": 5350, "Pretrain/Step Time": 8.5161117259413} +{"Pretrain/Learning Rate": 2.128253850099329e-05, "Pretrain/Loss": 2.0362491607666016, "Pretrain/Loss (Raw)": 1.9899698495864868, "Pretrain/Step": 5351, "Pretrain/Step Time": 8.522549765184522} +{"Pretrain/Learning Rate": 2.1274143227818938e-05, "Pretrain/Loss": 2.0331387519836426, "Pretrain/Loss (Raw)": 1.7734854221343994, "Pretrain/Step": 5352, "Pretrain/Step Time": 8.523691814392805} +{"Pretrain/Learning Rate": 2.126574838432796e-05, "Pretrain/Loss": 2.0367887020111084, "Pretrain/Loss (Raw)": 2.1876144409179688, "Pretrain/Step": 5353, "Pretrain/Step Time": 8.518485249951482} +{"Pretrain/Learning Rate": 2.1257353971488463e-05, "Pretrain/Loss": 2.0349597930908203, "Pretrain/Loss (Raw)": 2.143803596496582, "Pretrain/Step": 5354, "Pretrain/Step Time": 8.514758804813027} +{"Pretrain/Learning Rate": 2.1248959990268554e-05, "Pretrain/Loss": 2.0367350578308105, "Pretrain/Loss (Raw)": 2.1780591011047363, "Pretrain/Step": 5355, "Pretrain/Step Time": 8.512346632778645} +{"Pretrain/Learning Rate": 2.1240566441636238e-05, "Pretrain/Loss": 2.0346579551696777, "Pretrain/Loss (Raw)": 1.8319854736328125, "Pretrain/Step": 5356, "Pretrain/Step Time": 8.517413347959518} +{"Pretrain/Learning Rate": 2.1232173326559535e-05, "Pretrain/Loss": 2.034728527069092, "Pretrain/Loss (Raw)": 1.972263216972351, "Pretrain/Step": 5357, "Pretrain/Step Time": 8.524252135306597} +{"Pretrain/Learning Rate": 2.122378064600634e-05, "Pretrain/Loss": 2.0330915451049805, "Pretrain/Loss (Raw)": 1.9015872478485107, "Pretrain/Step": 5358, "Pretrain/Step Time": 8.527526065707207} +{"Pretrain/Learning Rate": 2.121538840094457e-05, "Pretrain/Loss": 2.033261299133301, "Pretrain/Loss (Raw)": 2.119205951690674, "Pretrain/Step": 5359, "Pretrain/Step Time": 8.522923473268747} +{"Pretrain/Learning Rate": 2.120699659234203e-05, "Pretrain/Loss": 2.0320327281951904, "Pretrain/Loss (Raw)": 2.0456435680389404, "Pretrain/Step": 5360, "Pretrain/Step Time": 8.51369541324675} +{"Pretrain/Learning Rate": 2.1198605221166528e-05, "Pretrain/Loss": 2.031130790710449, "Pretrain/Loss (Raw)": 1.997109293937683, "Pretrain/Step": 5361, "Pretrain/Step Time": 8.521628443151712} +{"Pretrain/Learning Rate": 2.1190214288385778e-05, "Pretrain/Loss": 2.031905174255371, "Pretrain/Loss (Raw)": 2.315004348754883, "Pretrain/Step": 5362, "Pretrain/Step Time": 8.520380184054375} +{"Pretrain/Learning Rate": 2.1181823794967472e-05, "Pretrain/Loss": 2.0318217277526855, "Pretrain/Loss (Raw)": 1.985155463218689, "Pretrain/Step": 5363, "Pretrain/Step Time": 8.519759031012654} +{"Pretrain/Learning Rate": 2.1173433741879234e-05, "Pretrain/Loss": 2.0318241119384766, "Pretrain/Loss (Raw)": 1.8896557092666626, "Pretrain/Step": 5364, "Pretrain/Step Time": 8.513640550896525} +{"Pretrain/Learning Rate": 2.116504413008865e-05, "Pretrain/Loss": 2.0344700813293457, "Pretrain/Loss (Raw)": 2.1176271438598633, "Pretrain/Step": 5365, "Pretrain/Step Time": 8.51214338466525} +{"Pretrain/Learning Rate": 2.1156654960563248e-05, "Pretrain/Loss": 2.0325870513916016, "Pretrain/Loss (Raw)": 2.1527259349823, "Pretrain/Step": 5366, "Pretrain/Step Time": 8.506375826895237} +{"Pretrain/Learning Rate": 2.1148266234270508e-05, "Pretrain/Loss": 2.0316925048828125, "Pretrain/Loss (Raw)": 2.0793983936309814, "Pretrain/Step": 5367, "Pretrain/Step Time": 8.509016735479236} +{"Pretrain/Learning Rate": 2.1139877952177852e-05, "Pretrain/Loss": 2.0320370197296143, "Pretrain/Loss (Raw)": 2.11995530128479, "Pretrain/Step": 5368, "Pretrain/Step Time": 8.516890397295356} +{"Pretrain/Learning Rate": 2.1131490115252668e-05, "Pretrain/Loss": 2.032893180847168, "Pretrain/Loss (Raw)": 2.1188483238220215, "Pretrain/Step": 5369, "Pretrain/Step Time": 8.513304334133863} +{"Pretrain/Learning Rate": 2.1123102724462262e-05, "Pretrain/Loss": 2.034653902053833, "Pretrain/Loss (Raw)": 2.1027987003326416, "Pretrain/Step": 5370, "Pretrain/Step Time": 8.514085043221712} +{"Pretrain/Learning Rate": 2.1114715780773924e-05, "Pretrain/Loss": 2.0334601402282715, "Pretrain/Loss (Raw)": 2.0364861488342285, "Pretrain/Step": 5371, "Pretrain/Step Time": 8.512005956843495} +{"Pretrain/Learning Rate": 2.110632928515487e-05, "Pretrain/Loss": 2.032564878463745, "Pretrain/Loss (Raw)": 1.931984543800354, "Pretrain/Step": 5372, "Pretrain/Step Time": 8.511911766603589} +{"Pretrain/Learning Rate": 2.1097943238572272e-05, "Pretrain/Loss": 2.0317745208740234, "Pretrain/Loss (Raw)": 2.0662155151367188, "Pretrain/Step": 5373, "Pretrain/Step Time": 8.51836832612753} +{"Pretrain/Learning Rate": 2.108955764199324e-05, "Pretrain/Loss": 2.0294747352600098, "Pretrain/Loss (Raw)": 1.8321977853775024, "Pretrain/Step": 5374, "Pretrain/Step Time": 8.525916399434209} +{"Pretrain/Learning Rate": 2.1081172496384855e-05, "Pretrain/Loss": 2.028219699859619, "Pretrain/Loss (Raw)": 1.9177510738372803, "Pretrain/Step": 5375, "Pretrain/Step Time": 8.5219199154526} +{"Pretrain/Learning Rate": 2.107278780271412e-05, "Pretrain/Loss": 2.026841163635254, "Pretrain/Loss (Raw)": 1.9817732572555542, "Pretrain/Step": 5376, "Pretrain/Step Time": 8.519576996564865} +{"Pretrain/Learning Rate": 2.1064403561948003e-05, "Pretrain/Loss": 2.0298094749450684, "Pretrain/Loss (Raw)": 2.07517409324646, "Pretrain/Step": 5377, "Pretrain/Step Time": 8.517366060987115} +{"Pretrain/Learning Rate": 2.105601977505341e-05, "Pretrain/Loss": 2.0293354988098145, "Pretrain/Loss (Raw)": 2.012364149093628, "Pretrain/Step": 5378, "Pretrain/Step Time": 8.510888777673244} +{"Pretrain/Learning Rate": 2.1047636442997205e-05, "Pretrain/Loss": 2.028850555419922, "Pretrain/Loss (Raw)": 2.077212333679199, "Pretrain/Step": 5379, "Pretrain/Step Time": 8.512206193059683} +{"Pretrain/Learning Rate": 2.1039253566746182e-05, "Pretrain/Loss": 2.028043031692505, "Pretrain/Loss (Raw)": 1.8926236629486084, "Pretrain/Step": 5380, "Pretrain/Step Time": 8.516959100961685} +{"Pretrain/Learning Rate": 2.1030871147267113e-05, "Pretrain/Loss": 2.027876615524292, "Pretrain/Loss (Raw)": 2.0129523277282715, "Pretrain/Step": 5381, "Pretrain/Step Time": 8.520387846976519} +{"Pretrain/Learning Rate": 2.1022489185526674e-05, "Pretrain/Loss": 2.0270237922668457, "Pretrain/Loss (Raw)": 1.9587150812149048, "Pretrain/Step": 5382, "Pretrain/Step Time": 8.51956974901259} +{"Pretrain/Learning Rate": 2.1014107682491534e-05, "Pretrain/Loss": 2.025735855102539, "Pretrain/Loss (Raw)": 1.840962290763855, "Pretrain/Step": 5383, "Pretrain/Step Time": 8.509895095601678} +{"Pretrain/Learning Rate": 2.1005726639128276e-05, "Pretrain/Loss": 2.025920867919922, "Pretrain/Loss (Raw)": 2.110013008117676, "Pretrain/Step": 5384, "Pretrain/Step Time": 8.504652133211493} +{"Pretrain/Learning Rate": 2.0997346056403438e-05, "Pretrain/Loss": 2.0262584686279297, "Pretrain/Loss (Raw)": 2.139517307281494, "Pretrain/Step": 5385, "Pretrain/Step Time": 8.502244465053082} +{"Pretrain/Learning Rate": 2.0988965935283524e-05, "Pretrain/Loss": 2.028794288635254, "Pretrain/Loss (Raw)": 2.155827522277832, "Pretrain/Step": 5386, "Pretrain/Step Time": 8.504932507872581} +{"Pretrain/Learning Rate": 2.098058627673495e-05, "Pretrain/Loss": 2.0305399894714355, "Pretrain/Loss (Raw)": 2.1027586460113525, "Pretrain/Step": 5387, "Pretrain/Step Time": 8.502228055149317} +{"Pretrain/Learning Rate": 2.097220708172411e-05, "Pretrain/Loss": 2.0308120250701904, "Pretrain/Loss (Raw)": 1.9911649227142334, "Pretrain/Step": 5388, "Pretrain/Step Time": 8.509916629642248} +{"Pretrain/Learning Rate": 2.0963828351217327e-05, "Pretrain/Loss": 2.0323281288146973, "Pretrain/Loss (Raw)": 2.2049245834350586, "Pretrain/Step": 5389, "Pretrain/Step Time": 8.501897828653455} +{"Pretrain/Learning Rate": 2.0955450086180882e-05, "Pretrain/Loss": 2.0331530570983887, "Pretrain/Loss (Raw)": 2.1515989303588867, "Pretrain/Step": 5390, "Pretrain/Step Time": 8.505107589066029} +{"Pretrain/Learning Rate": 2.094707228758099e-05, "Pretrain/Loss": 2.0335693359375, "Pretrain/Loss (Raw)": 2.0127859115600586, "Pretrain/Step": 5391, "Pretrain/Step Time": 8.504314152523875} +{"Pretrain/Learning Rate": 2.093869495638382e-05, "Pretrain/Loss": 2.033857822418213, "Pretrain/Loss (Raw)": 1.989582896232605, "Pretrain/Step": 5392, "Pretrain/Step Time": 8.508053941652179} +{"Pretrain/Learning Rate": 2.093031809355548e-05, "Pretrain/Loss": 2.0331146717071533, "Pretrain/Loss (Raw)": 2.1270601749420166, "Pretrain/Step": 5393, "Pretrain/Step Time": 8.51199628226459} +{"Pretrain/Learning Rate": 2.0921941700062047e-05, "Pretrain/Loss": 2.032163143157959, "Pretrain/Loss (Raw)": 1.9655721187591553, "Pretrain/Step": 5394, "Pretrain/Step Time": 8.514987980946898} +{"Pretrain/Learning Rate": 2.0913565776869498e-05, "Pretrain/Loss": 2.031867742538452, "Pretrain/Loss (Raw)": 1.9893115758895874, "Pretrain/Step": 5395, "Pretrain/Step Time": 8.517719686031342} +{"Pretrain/Learning Rate": 2.0905190324943814e-05, "Pretrain/Loss": 2.0322518348693848, "Pretrain/Loss (Raw)": 2.200679063796997, "Pretrain/Step": 5396, "Pretrain/Step Time": 8.514815470203757} +{"Pretrain/Learning Rate": 2.089681534525086e-05, "Pretrain/Loss": 2.0328428745269775, "Pretrain/Loss (Raw)": 2.1415350437164307, "Pretrain/Step": 5397, "Pretrain/Step Time": 8.516700325533748} +{"Pretrain/Learning Rate": 2.0888440838756515e-05, "Pretrain/Loss": 2.0369033813476562, "Pretrain/Loss (Raw)": 2.384518623352051, "Pretrain/Step": 5398, "Pretrain/Step Time": 8.52047361060977} +{"Pretrain/Learning Rate": 2.088006680642653e-05, "Pretrain/Loss": 2.0355405807495117, "Pretrain/Loss (Raw)": 1.9730290174484253, "Pretrain/Step": 5399, "Pretrain/Step Time": 8.520183954387903} +{"Pretrain/Learning Rate": 2.087169324922667e-05, "Pretrain/Loss": 2.037187099456787, "Pretrain/Loss (Raw)": 2.146409749984741, "Pretrain/Step": 5400, "Pretrain/Step Time": 8.5249481536448} +{"Pretrain/Learning Rate": 2.086332016812258e-05, "Pretrain/Loss": 2.036696672439575, "Pretrain/Loss (Raw)": 1.9019914865493774, "Pretrain/Step": 5401, "Pretrain/Step Time": 8.525155492126942} +{"Pretrain/Learning Rate": 2.085494756407992e-05, "Pretrain/Loss": 2.0365118980407715, "Pretrain/Loss (Raw)": 1.9866174459457397, "Pretrain/Step": 5402, "Pretrain/Step Time": 8.520540401339531} +{"Pretrain/Learning Rate": 2.0846575438064227e-05, "Pretrain/Loss": 2.034384250640869, "Pretrain/Loss (Raw)": 1.8962010145187378, "Pretrain/Step": 5403, "Pretrain/Step Time": 8.520292500033975} +{"Pretrain/Learning Rate": 2.0838203791041028e-05, "Pretrain/Loss": 2.034623622894287, "Pretrain/Loss (Raw)": 1.958420991897583, "Pretrain/Step": 5404, "Pretrain/Step Time": 8.528106803074479} +{"Pretrain/Learning Rate": 2.0829832623975775e-05, "Pretrain/Loss": 2.037714958190918, "Pretrain/Loss (Raw)": 2.1794300079345703, "Pretrain/Step": 5405, "Pretrain/Step Time": 8.530043065547943} +{"Pretrain/Learning Rate": 2.0821461937833884e-05, "Pretrain/Loss": 2.039963722229004, "Pretrain/Loss (Raw)": 2.2558302879333496, "Pretrain/Step": 5406, "Pretrain/Step Time": 8.52822687663138} +{"Pretrain/Learning Rate": 2.0813091733580685e-05, "Pretrain/Loss": 2.0399513244628906, "Pretrain/Loss (Raw)": 2.0864288806915283, "Pretrain/Step": 5407, "Pretrain/Step Time": 8.527929471805692} +{"Pretrain/Learning Rate": 2.080472201218148e-05, "Pretrain/Loss": 2.0391907691955566, "Pretrain/Loss (Raw)": 2.044762134552002, "Pretrain/Step": 5408, "Pretrain/Step Time": 8.524856084957719} +{"Pretrain/Learning Rate": 2.0796352774601495e-05, "Pretrain/Loss": 2.0388050079345703, "Pretrain/Loss (Raw)": 1.7137863636016846, "Pretrain/Step": 5409, "Pretrain/Step Time": 8.52629742398858} +{"Pretrain/Learning Rate": 2.0787984021805922e-05, "Pretrain/Loss": 2.0386929512023926, "Pretrain/Loss (Raw)": 2.1546149253845215, "Pretrain/Step": 5410, "Pretrain/Step Time": 8.525654315948486} +{"Pretrain/Learning Rate": 2.077961575475988e-05, "Pretrain/Loss": 2.039308547973633, "Pretrain/Loss (Raw)": 2.085744619369507, "Pretrain/Step": 5411, "Pretrain/Step Time": 8.529800916090608} +{"Pretrain/Learning Rate": 2.0771247974428434e-05, "Pretrain/Loss": 2.043199062347412, "Pretrain/Loss (Raw)": 2.418424129486084, "Pretrain/Step": 5412, "Pretrain/Step Time": 8.53214393183589} +{"Pretrain/Learning Rate": 2.07628806817766e-05, "Pretrain/Loss": 2.0431582927703857, "Pretrain/Loss (Raw)": 1.9127602577209473, "Pretrain/Step": 5413, "Pretrain/Step Time": 8.521393103525043} +{"Pretrain/Learning Rate": 2.0754513877769328e-05, "Pretrain/Loss": 2.042009115219116, "Pretrain/Loss (Raw)": 2.0392963886260986, "Pretrain/Step": 5414, "Pretrain/Step Time": 8.519489701837301} +{"Pretrain/Learning Rate": 2.074614756337152e-05, "Pretrain/Loss": 2.0403926372528076, "Pretrain/Loss (Raw)": 1.8323992490768433, "Pretrain/Step": 5415, "Pretrain/Step Time": 8.524019654840231} +{"Pretrain/Learning Rate": 2.073778173954803e-05, "Pretrain/Loss": 2.039205551147461, "Pretrain/Loss (Raw)": 1.770085334777832, "Pretrain/Step": 5416, "Pretrain/Step Time": 8.52972169779241} +{"Pretrain/Learning Rate": 2.072941640726362e-05, "Pretrain/Loss": 2.040346622467041, "Pretrain/Loss (Raw)": 1.9789286851882935, "Pretrain/Step": 5417, "Pretrain/Step Time": 8.525629967451096} +{"Pretrain/Learning Rate": 2.0721051567483045e-05, "Pretrain/Loss": 2.0418758392333984, "Pretrain/Loss (Raw)": 2.179088830947876, "Pretrain/Step": 5418, "Pretrain/Step Time": 8.525619361549616} +{"Pretrain/Learning Rate": 2.071268722117096e-05, "Pretrain/Loss": 2.043022632598877, "Pretrain/Loss (Raw)": 2.1978189945220947, "Pretrain/Step": 5419, "Pretrain/Step Time": 8.521144473925233} +{"Pretrain/Learning Rate": 2.0704323369291993e-05, "Pretrain/Loss": 2.045868396759033, "Pretrain/Loss (Raw)": 2.283973455429077, "Pretrain/Step": 5420, "Pretrain/Step Time": 8.519207540899515} +{"Pretrain/Learning Rate": 2.069596001281069e-05, "Pretrain/Loss": 2.0413177013397217, "Pretrain/Loss (Raw)": 1.90712571144104, "Pretrain/Step": 5421, "Pretrain/Step Time": 8.510447150096297} +{"Pretrain/Learning Rate": 2.0687597152691567e-05, "Pretrain/Loss": 2.041729688644409, "Pretrain/Loss (Raw)": 2.107588052749634, "Pretrain/Step": 5422, "Pretrain/Step Time": 8.52063238248229} +{"Pretrain/Learning Rate": 2.0679234789899054e-05, "Pretrain/Loss": 2.0406172275543213, "Pretrain/Loss (Raw)": 2.0225417613983154, "Pretrain/Step": 5423, "Pretrain/Step Time": 8.524608012288809} +{"Pretrain/Learning Rate": 2.067087292539755e-05, "Pretrain/Loss": 2.0404818058013916, "Pretrain/Loss (Raw)": 2.1135857105255127, "Pretrain/Step": 5424, "Pretrain/Step Time": 8.531186506152153} +{"Pretrain/Learning Rate": 2.0662511560151373e-05, "Pretrain/Loss": 2.0402307510375977, "Pretrain/Loss (Raw)": 2.043877601623535, "Pretrain/Step": 5425, "Pretrain/Step Time": 8.520134108141065} +{"Pretrain/Learning Rate": 2.0654150695124804e-05, "Pretrain/Loss": 2.0422492027282715, "Pretrain/Loss (Raw)": 2.2353012561798096, "Pretrain/Step": 5426, "Pretrain/Step Time": 8.521218489855528} +{"Pretrain/Learning Rate": 2.064579033128206e-05, "Pretrain/Loss": 2.0437309741973877, "Pretrain/Loss (Raw)": 2.035132646560669, "Pretrain/Step": 5427, "Pretrain/Step Time": 8.518334763124585} +{"Pretrain/Learning Rate": 2.063743046958729e-05, "Pretrain/Loss": 2.044332981109619, "Pretrain/Loss (Raw)": 1.9399430751800537, "Pretrain/Step": 5428, "Pretrain/Step Time": 8.524548688903451} +{"Pretrain/Learning Rate": 2.0629071111004595e-05, "Pretrain/Loss": 2.0459370613098145, "Pretrain/Loss (Raw)": 2.2949655055999756, "Pretrain/Step": 5429, "Pretrain/Step Time": 8.530620764940977} +{"Pretrain/Learning Rate": 2.0620712256498016e-05, "Pretrain/Loss": 2.0456724166870117, "Pretrain/Loss (Raw)": 2.028501272201538, "Pretrain/Step": 5430, "Pretrain/Step Time": 8.530642779543996} +{"Pretrain/Learning Rate": 2.061235390703154e-05, "Pretrain/Loss": 2.0451607704162598, "Pretrain/Loss (Raw)": 1.9776406288146973, "Pretrain/Step": 5431, "Pretrain/Step Time": 8.523589773103595} +{"Pretrain/Learning Rate": 2.0603996063569078e-05, "Pretrain/Loss": 2.0452120304107666, "Pretrain/Loss (Raw)": 2.079545736312866, "Pretrain/Step": 5432, "Pretrain/Step Time": 8.520422017201781} +{"Pretrain/Learning Rate": 2.0595638727074512e-05, "Pretrain/Loss": 2.044221878051758, "Pretrain/Loss (Raw)": 1.9928549528121948, "Pretrain/Step": 5433, "Pretrain/Step Time": 8.512568809092045} +{"Pretrain/Learning Rate": 2.058728189851164e-05, "Pretrain/Loss": 2.0415096282958984, "Pretrain/Loss (Raw)": 1.5616182088851929, "Pretrain/Step": 5434, "Pretrain/Step Time": 8.522986004129052} +{"Pretrain/Learning Rate": 2.0578925578844216e-05, "Pretrain/Loss": 2.0420284271240234, "Pretrain/Loss (Raw)": 2.1927525997161865, "Pretrain/Step": 5435, "Pretrain/Step Time": 8.526328168809414} +{"Pretrain/Learning Rate": 2.0570569769035915e-05, "Pretrain/Loss": 2.0425262451171875, "Pretrain/Loss (Raw)": 1.948671817779541, "Pretrain/Step": 5436, "Pretrain/Step Time": 8.527699055150151} +{"Pretrain/Learning Rate": 2.0562214470050396e-05, "Pretrain/Loss": 2.041513442993164, "Pretrain/Loss (Raw)": 1.9951053857803345, "Pretrain/Step": 5437, "Pretrain/Step Time": 8.516692604869604} +{"Pretrain/Learning Rate": 2.0553859682851204e-05, "Pretrain/Loss": 2.042651653289795, "Pretrain/Loss (Raw)": 2.244088649749756, "Pretrain/Step": 5438, "Pretrain/Step Time": 8.508696485310793} +{"Pretrain/Learning Rate": 2.0545505408401878e-05, "Pretrain/Loss": 2.0437886714935303, "Pretrain/Loss (Raw)": 2.0733184814453125, "Pretrain/Step": 5439, "Pretrain/Step Time": 8.513239869847894} +{"Pretrain/Learning Rate": 2.053715164766584e-05, "Pretrain/Loss": 2.0434255599975586, "Pretrain/Loss (Raw)": 1.923541784286499, "Pretrain/Step": 5440, "Pretrain/Step Time": 8.513929663226008} +{"Pretrain/Learning Rate": 2.052879840160652e-05, "Pretrain/Loss": 2.044750690460205, "Pretrain/Loss (Raw)": 2.050743818283081, "Pretrain/Step": 5441, "Pretrain/Step Time": 8.516763968393207} +{"Pretrain/Learning Rate": 2.052044567118722e-05, "Pretrain/Loss": 2.0448832511901855, "Pretrain/Loss (Raw)": 2.1464130878448486, "Pretrain/Step": 5442, "Pretrain/Step Time": 8.511629862710834} +{"Pretrain/Learning Rate": 2.0512093457371253e-05, "Pretrain/Loss": 2.044477939605713, "Pretrain/Loss (Raw)": 2.0085129737854004, "Pretrain/Step": 5443, "Pretrain/Step Time": 8.502945410087705} +{"Pretrain/Learning Rate": 2.0503741761121804e-05, "Pretrain/Loss": 2.045734405517578, "Pretrain/Loss (Raw)": 2.1176140308380127, "Pretrain/Step": 5444, "Pretrain/Step Time": 8.507128566503525} +{"Pretrain/Learning Rate": 2.049539058340205e-05, "Pretrain/Loss": 2.0447449684143066, "Pretrain/Loss (Raw)": 1.9643679857254028, "Pretrain/Step": 5445, "Pretrain/Step Time": 8.51070729829371} +{"Pretrain/Learning Rate": 2.0487039925175073e-05, "Pretrain/Loss": 2.046146869659424, "Pretrain/Loss (Raw)": 2.334498167037964, "Pretrain/Step": 5446, "Pretrain/Step Time": 8.52284735813737} +{"Pretrain/Learning Rate": 2.0478689787403923e-05, "Pretrain/Loss": 2.047189474105835, "Pretrain/Loss (Raw)": 2.107542037963867, "Pretrain/Step": 5447, "Pretrain/Step Time": 8.525407066568732} +{"Pretrain/Learning Rate": 2.0470340171051567e-05, "Pretrain/Loss": 2.0479111671447754, "Pretrain/Loss (Raw)": 2.0602357387542725, "Pretrain/Step": 5448, "Pretrain/Step Time": 8.512036310508847} +{"Pretrain/Learning Rate": 2.046199107708093e-05, "Pretrain/Loss": 2.048175811767578, "Pretrain/Loss (Raw)": 2.157578945159912, "Pretrain/Step": 5449, "Pretrain/Step Time": 8.511224752292037} +{"Pretrain/Learning Rate": 2.0453642506454862e-05, "Pretrain/Loss": 2.0481462478637695, "Pretrain/Loss (Raw)": 2.1305091381073, "Pretrain/Step": 5450, "Pretrain/Step Time": 8.509401220828295} +{"Pretrain/Learning Rate": 2.044529446013617e-05, "Pretrain/Loss": 2.0455493927001953, "Pretrain/Loss (Raw)": 1.873347520828247, "Pretrain/Step": 5451, "Pretrain/Step Time": 8.512660022825003} +{"Pretrain/Learning Rate": 2.0436946939087576e-05, "Pretrain/Loss": 2.0454373359680176, "Pretrain/Loss (Raw)": 2.0628044605255127, "Pretrain/Step": 5452, "Pretrain/Step Time": 8.51139897853136} +{"Pretrain/Learning Rate": 2.042859994427177e-05, "Pretrain/Loss": 2.0498902797698975, "Pretrain/Loss (Raw)": 2.1256730556488037, "Pretrain/Step": 5453, "Pretrain/Step Time": 8.505467599257827} +{"Pretrain/Learning Rate": 2.042025347665135e-05, "Pretrain/Loss": 2.048610210418701, "Pretrain/Loss (Raw)": 2.09121036529541, "Pretrain/Step": 5454, "Pretrain/Step Time": 8.50725606456399} +{"Pretrain/Learning Rate": 2.041190753718889e-05, "Pretrain/Loss": 2.049605131149292, "Pretrain/Loss (Raw)": 2.086085319519043, "Pretrain/Step": 5455, "Pretrain/Step Time": 8.49552939645946} +{"Pretrain/Learning Rate": 2.0403562126846865e-05, "Pretrain/Loss": 2.0504798889160156, "Pretrain/Loss (Raw)": 2.114394187927246, "Pretrain/Step": 5456, "Pretrain/Step Time": 8.50262514129281} +{"Pretrain/Learning Rate": 2.039521724658772e-05, "Pretrain/Loss": 2.0487418174743652, "Pretrain/Loss (Raw)": 1.9411059617996216, "Pretrain/Step": 5457, "Pretrain/Step Time": 8.509392030537128} +{"Pretrain/Learning Rate": 2.0386872897373816e-05, "Pretrain/Loss": 2.048757791519165, "Pretrain/Loss (Raw)": 1.9874495267868042, "Pretrain/Step": 5458, "Pretrain/Step Time": 8.505335059016943} +{"Pretrain/Learning Rate": 2.037852908016747e-05, "Pretrain/Loss": 2.0482027530670166, "Pretrain/Loss (Raw)": 1.9574410915374756, "Pretrain/Step": 5459, "Pretrain/Step Time": 8.509981103241444} +{"Pretrain/Learning Rate": 2.0370185795930927e-05, "Pretrain/Loss": 2.049438714981079, "Pretrain/Loss (Raw)": 2.0798299312591553, "Pretrain/Step": 5460, "Pretrain/Step Time": 8.508390795439482} +{"Pretrain/Learning Rate": 2.0361843045626378e-05, "Pretrain/Loss": 2.0443005561828613, "Pretrain/Loss (Raw)": 1.5212185382843018, "Pretrain/Step": 5461, "Pretrain/Step Time": 8.50075102970004} +{"Pretrain/Learning Rate": 2.035350083021594e-05, "Pretrain/Loss": 2.045043468475342, "Pretrain/Loss (Raw)": 1.9817019701004028, "Pretrain/Step": 5462, "Pretrain/Step Time": 8.505251359194517} +{"Pretrain/Learning Rate": 2.0345159150661683e-05, "Pretrain/Loss": 2.0446085929870605, "Pretrain/Loss (Raw)": 1.8363436460494995, "Pretrain/Step": 5463, "Pretrain/Step Time": 8.509997490793467} +{"Pretrain/Learning Rate": 2.0336818007925603e-05, "Pretrain/Loss": 2.042633056640625, "Pretrain/Loss (Raw)": 1.9159281253814697, "Pretrain/Step": 5464, "Pretrain/Step Time": 8.512566084042192} +{"Pretrain/Learning Rate": 2.032847740296965e-05, "Pretrain/Loss": 2.0405030250549316, "Pretrain/Loss (Raw)": 2.0158066749572754, "Pretrain/Step": 5465, "Pretrain/Step Time": 8.518034424632788} +{"Pretrain/Learning Rate": 2.0320137336755692e-05, "Pretrain/Loss": 2.0400514602661133, "Pretrain/Loss (Raw)": 2.153231382369995, "Pretrain/Step": 5466, "Pretrain/Step Time": 8.508097494021058} +{"Pretrain/Learning Rate": 2.0311797810245543e-05, "Pretrain/Loss": 2.03955078125, "Pretrain/Loss (Raw)": 1.9432222843170166, "Pretrain/Step": 5467, "Pretrain/Step Time": 8.500888761132956} +{"Pretrain/Learning Rate": 2.0303458824400974e-05, "Pretrain/Loss": 2.0434188842773438, "Pretrain/Loss (Raw)": 2.2479188442230225, "Pretrain/Step": 5468, "Pretrain/Step Time": 8.502602744847536} +{"Pretrain/Learning Rate": 2.0295120380183657e-05, "Pretrain/Loss": 2.044696092605591, "Pretrain/Loss (Raw)": 1.8041691780090332, "Pretrain/Step": 5469, "Pretrain/Step Time": 8.509622879326344} +{"Pretrain/Learning Rate": 2.0286782478555232e-05, "Pretrain/Loss": 2.0446324348449707, "Pretrain/Loss (Raw)": 2.0727193355560303, "Pretrain/Step": 5470, "Pretrain/Step Time": 8.51224958524108} +{"Pretrain/Learning Rate": 2.027844512047726e-05, "Pretrain/Loss": 2.0450448989868164, "Pretrain/Loss (Raw)": 2.2379918098449707, "Pretrain/Step": 5471, "Pretrain/Step Time": 8.508707033470273} +{"Pretrain/Learning Rate": 2.027010830691124e-05, "Pretrain/Loss": 2.042560577392578, "Pretrain/Loss (Raw)": 1.762159824371338, "Pretrain/Step": 5472, "Pretrain/Step Time": 8.50079126469791} +{"Pretrain/Learning Rate": 2.0261772038818622e-05, "Pretrain/Loss": 2.040578842163086, "Pretrain/Loss (Raw)": 2.1412692070007324, "Pretrain/Step": 5473, "Pretrain/Step Time": 8.507153693586588} +{"Pretrain/Learning Rate": 2.0253436317160784e-05, "Pretrain/Loss": 2.040513038635254, "Pretrain/Loss (Raw)": 2.0954127311706543, "Pretrain/Step": 5474, "Pretrain/Step Time": 8.505717666819692} +{"Pretrain/Learning Rate": 2.0245101142899032e-05, "Pretrain/Loss": 2.0412819385528564, "Pretrain/Loss (Raw)": 2.3122000694274902, "Pretrain/Step": 5475, "Pretrain/Step Time": 8.506977377459407} +{"Pretrain/Learning Rate": 2.0236766516994623e-05, "Pretrain/Loss": 2.0410726070404053, "Pretrain/Loss (Raw)": 1.9607170820236206, "Pretrain/Step": 5476, "Pretrain/Step Time": 8.50790585577488} +{"Pretrain/Learning Rate": 2.022843244040874e-05, "Pretrain/Loss": 2.040447235107422, "Pretrain/Loss (Raw)": 2.029510259628296, "Pretrain/Step": 5477, "Pretrain/Step Time": 8.504746505990624} +{"Pretrain/Learning Rate": 2.0220098914102525e-05, "Pretrain/Loss": 2.04130482673645, "Pretrain/Loss (Raw)": 1.8192508220672607, "Pretrain/Step": 5478, "Pretrain/Step Time": 8.503547491505742} +{"Pretrain/Learning Rate": 2.021176593903701e-05, "Pretrain/Loss": 2.0424656867980957, "Pretrain/Loss (Raw)": 2.1385374069213867, "Pretrain/Step": 5479, "Pretrain/Step Time": 8.49589023180306} +{"Pretrain/Learning Rate": 2.0203433516173225e-05, "Pretrain/Loss": 2.0454041957855225, "Pretrain/Loss (Raw)": 2.1496264934539795, "Pretrain/Step": 5480, "Pretrain/Step Time": 8.495446018874645} +{"Pretrain/Learning Rate": 2.0195101646472075e-05, "Pretrain/Loss": 2.0425400733947754, "Pretrain/Loss (Raw)": 1.820986270904541, "Pretrain/Step": 5481, "Pretrain/Step Time": 8.501220302656293} +{"Pretrain/Learning Rate": 2.018677033089446e-05, "Pretrain/Loss": 2.040959596633911, "Pretrain/Loss (Raw)": 1.941528081893921, "Pretrain/Step": 5482, "Pretrain/Step Time": 8.50069615803659} +{"Pretrain/Learning Rate": 2.017843957040115e-05, "Pretrain/Loss": 2.0386743545532227, "Pretrain/Loss (Raw)": 1.8855557441711426, "Pretrain/Step": 5483, "Pretrain/Step Time": 8.5104223433882} +{"Pretrain/Learning Rate": 2.0170109365952934e-05, "Pretrain/Loss": 2.041670560836792, "Pretrain/Loss (Raw)": 2.215477705001831, "Pretrain/Step": 5484, "Pretrain/Step Time": 8.504774326458573} +{"Pretrain/Learning Rate": 2.0161779718510443e-05, "Pretrain/Loss": 2.044527530670166, "Pretrain/Loss (Raw)": 2.3379554748535156, "Pretrain/Step": 5485, "Pretrain/Step Time": 8.498904230073094} +{"Pretrain/Learning Rate": 2.015345062903433e-05, "Pretrain/Loss": 2.0458621978759766, "Pretrain/Loss (Raw)": 2.0724072456359863, "Pretrain/Step": 5486, "Pretrain/Step Time": 8.499890439212322} +{"Pretrain/Learning Rate": 2.014512209848512e-05, "Pretrain/Loss": 2.04544734954834, "Pretrain/Loss (Raw)": 2.066106081008911, "Pretrain/Step": 5487, "Pretrain/Step Time": 8.504550911486149} +{"Pretrain/Learning Rate": 2.013679412782331e-05, "Pretrain/Loss": 2.043272018432617, "Pretrain/Loss (Raw)": 1.7672075033187866, "Pretrain/Step": 5488, "Pretrain/Step Time": 8.50416019745171} +{"Pretrain/Learning Rate": 2.0128466718009313e-05, "Pretrain/Loss": 2.042736053466797, "Pretrain/Loss (Raw)": 1.9285259246826172, "Pretrain/Step": 5489, "Pretrain/Step Time": 8.500602146610618} +{"Pretrain/Learning Rate": 2.0120139870003492e-05, "Pretrain/Loss": 2.041410446166992, "Pretrain/Loss (Raw)": 2.1453514099121094, "Pretrain/Step": 5490, "Pretrain/Step Time": 8.497834961861372} +{"Pretrain/Learning Rate": 2.0111813584766134e-05, "Pretrain/Loss": 2.04167103767395, "Pretrain/Loss (Raw)": 2.0184731483459473, "Pretrain/Step": 5491, "Pretrain/Step Time": 8.498363023623824} +{"Pretrain/Learning Rate": 2.010348786325747e-05, "Pretrain/Loss": 2.0418858528137207, "Pretrain/Loss (Raw)": 1.9171605110168457, "Pretrain/Step": 5492, "Pretrain/Step Time": 8.5100027769804} +{"Pretrain/Learning Rate": 2.0095162706437655e-05, "Pretrain/Loss": 2.0414974689483643, "Pretrain/Loss (Raw)": 2.0679068565368652, "Pretrain/Step": 5493, "Pretrain/Step Time": 8.514120567589998} +{"Pretrain/Learning Rate": 2.0086838115266794e-05, "Pretrain/Loss": 2.039440631866455, "Pretrain/Loss (Raw)": 1.889477014541626, "Pretrain/Step": 5494, "Pretrain/Step Time": 8.511374359950423} +{"Pretrain/Learning Rate": 2.007851409070491e-05, "Pretrain/Loss": 2.0381250381469727, "Pretrain/Loss (Raw)": 1.9109855890274048, "Pretrain/Step": 5495, "Pretrain/Step Time": 8.506195863708854} +{"Pretrain/Learning Rate": 2.007019063371197e-05, "Pretrain/Loss": 2.036351203918457, "Pretrain/Loss (Raw)": 1.892903447151184, "Pretrain/Step": 5496, "Pretrain/Step Time": 8.497631136327982} +{"Pretrain/Learning Rate": 2.006186774524788e-05, "Pretrain/Loss": 2.033780574798584, "Pretrain/Loss (Raw)": 1.7897822856903076, "Pretrain/Step": 5497, "Pretrain/Step Time": 8.500165024772286} +{"Pretrain/Learning Rate": 2.005354542627247e-05, "Pretrain/Loss": 2.033015489578247, "Pretrain/Loss (Raw)": 2.004899024963379, "Pretrain/Step": 5498, "Pretrain/Step Time": 8.500661613419652} +{"Pretrain/Learning Rate": 2.0045223677745507e-05, "Pretrain/Loss": 2.033599853515625, "Pretrain/Loss (Raw)": 2.111266851425171, "Pretrain/Step": 5499, "Pretrain/Step Time": 8.508210983127356} +{"Pretrain/Learning Rate": 2.0036902500626704e-05, "Pretrain/Loss": 2.0337438583374023, "Pretrain/Loss (Raw)": 1.9504401683807373, "Pretrain/Step": 5500, "Pretrain/Step Time": 8.511060683056712} +{"Pretrain/Learning Rate": 2.002858189587568e-05, "Pretrain/Loss": 2.036076545715332, "Pretrain/Loss (Raw)": 2.3647961616516113, "Pretrain/Step": 5501, "Pretrain/Step Time": 8.508544605225325} +{"Pretrain/Learning Rate": 2.002026186445203e-05, "Pretrain/Loss": 2.0372610092163086, "Pretrain/Loss (Raw)": 1.9837960004806519, "Pretrain/Step": 5502, "Pretrain/Step Time": 8.501862606033683} +{"Pretrain/Learning Rate": 2.0011942407315236e-05, "Pretrain/Loss": 2.0393075942993164, "Pretrain/Loss (Raw)": 2.1796956062316895, "Pretrain/Step": 5503, "Pretrain/Step Time": 8.502256814390421} +{"Pretrain/Learning Rate": 2.0003623525424758e-05, "Pretrain/Loss": 2.038370132446289, "Pretrain/Loss (Raw)": 1.8617998361587524, "Pretrain/Step": 5504, "Pretrain/Step Time": 8.508136639371514} +{"Pretrain/Learning Rate": 1.9995305219739952e-05, "Pretrain/Loss": 2.0366756916046143, "Pretrain/Loss (Raw)": 1.8582707643508911, "Pretrain/Step": 5505, "Pretrain/Step Time": 8.515402046963573} +{"Pretrain/Learning Rate": 1.9986987491220137e-05, "Pretrain/Loss": 2.037722587585449, "Pretrain/Loss (Raw)": 2.1464202404022217, "Pretrain/Step": 5506, "Pretrain/Step Time": 8.514686822891235} +{"Pretrain/Learning Rate": 1.997867034082454e-05, "Pretrain/Loss": 2.0361194610595703, "Pretrain/Loss (Raw)": 1.8719547986984253, "Pretrain/Step": 5507, "Pretrain/Step Time": 8.52044434659183} +{"Pretrain/Learning Rate": 1.997035376951234e-05, "Pretrain/Loss": 2.0383949279785156, "Pretrain/Loss (Raw)": 2.1839253902435303, "Pretrain/Step": 5508, "Pretrain/Step Time": 8.512715956196189} +{"Pretrain/Learning Rate": 1.996203777824265e-05, "Pretrain/Loss": 2.037231683731079, "Pretrain/Loss (Raw)": 1.8640371561050415, "Pretrain/Step": 5509, "Pretrain/Step Time": 8.509643461555243} +{"Pretrain/Learning Rate": 1.99537223679745e-05, "Pretrain/Loss": 2.037105083465576, "Pretrain/Loss (Raw)": 1.9424973726272583, "Pretrain/Step": 5510, "Pretrain/Step Time": 8.513153536245227} +{"Pretrain/Learning Rate": 1.994540753966687e-05, "Pretrain/Loss": 2.0396695137023926, "Pretrain/Loss (Raw)": 2.1692049503326416, "Pretrain/Step": 5511, "Pretrain/Step Time": 8.518046608194709} +{"Pretrain/Learning Rate": 1.9937093294278653e-05, "Pretrain/Loss": 2.038646697998047, "Pretrain/Loss (Raw)": 1.9791189432144165, "Pretrain/Step": 5512, "Pretrain/Step Time": 8.520279893651605} +{"Pretrain/Learning Rate": 1.99287796327687e-05, "Pretrain/Loss": 2.0368599891662598, "Pretrain/Loss (Raw)": 1.910791277885437, "Pretrain/Step": 5513, "Pretrain/Step Time": 8.522987363860011} +{"Pretrain/Learning Rate": 1.9920466556095772e-05, "Pretrain/Loss": 2.035006523132324, "Pretrain/Loss (Raw)": 1.9185985326766968, "Pretrain/Step": 5514, "Pretrain/Step Time": 8.517890634015203} +{"Pretrain/Learning Rate": 1.991215406521858e-05, "Pretrain/Loss": 2.033543109893799, "Pretrain/Loss (Raw)": 1.9154257774353027, "Pretrain/Step": 5515, "Pretrain/Step Time": 8.512863447889686} +{"Pretrain/Learning Rate": 1.9903842161095752e-05, "Pretrain/Loss": 2.033292293548584, "Pretrain/Loss (Raw)": 1.9590833187103271, "Pretrain/Step": 5516, "Pretrain/Step Time": 8.505675928667188} +{"Pretrain/Learning Rate": 1.9895530844685865e-05, "Pretrain/Loss": 2.0316367149353027, "Pretrain/Loss (Raw)": 1.9929922819137573, "Pretrain/Step": 5517, "Pretrain/Step Time": 8.505161508917809} +{"Pretrain/Learning Rate": 1.988722011694741e-05, "Pretrain/Loss": 2.0309524536132812, "Pretrain/Loss (Raw)": 2.0640242099761963, "Pretrain/Step": 5518, "Pretrain/Step Time": 8.512807542458177} +{"Pretrain/Learning Rate": 1.987890997883883e-05, "Pretrain/Loss": 2.034358024597168, "Pretrain/Loss (Raw)": 2.4486851692199707, "Pretrain/Step": 5519, "Pretrain/Step Time": 8.515267414972186} +{"Pretrain/Learning Rate": 1.987060043131847e-05, "Pretrain/Loss": 2.0338728427886963, "Pretrain/Loss (Raw)": 1.9275155067443848, "Pretrain/Step": 5520, "Pretrain/Step Time": 8.512221602723002} +{"Pretrain/Learning Rate": 1.9862291475344654e-05, "Pretrain/Loss": 2.0341224670410156, "Pretrain/Loss (Raw)": 2.1589722633361816, "Pretrain/Step": 5521, "Pretrain/Step Time": 8.512567080557346} +{"Pretrain/Learning Rate": 1.985398311187558e-05, "Pretrain/Loss": 2.0331993103027344, "Pretrain/Loss (Raw)": 1.8474318981170654, "Pretrain/Step": 5522, "Pretrain/Step Time": 8.507096014916897} +{"Pretrain/Learning Rate": 1.9845675341869437e-05, "Pretrain/Loss": 2.0345678329467773, "Pretrain/Loss (Raw)": 2.1644935607910156, "Pretrain/Step": 5523, "Pretrain/Step Time": 8.51820064894855} +{"Pretrain/Learning Rate": 1.9837368166284284e-05, "Pretrain/Loss": 2.0364696979522705, "Pretrain/Loss (Raw)": 2.444108247756958, "Pretrain/Step": 5524, "Pretrain/Step Time": 8.521082596853375} +{"Pretrain/Learning Rate": 1.982906158607818e-05, "Pretrain/Loss": 2.036129951477051, "Pretrain/Loss (Raw)": 2.0980570316314697, "Pretrain/Step": 5525, "Pretrain/Step Time": 8.525001514703035} +{"Pretrain/Learning Rate": 1.982075560220904e-05, "Pretrain/Loss": 2.032808303833008, "Pretrain/Loss (Raw)": 1.9593416452407837, "Pretrain/Step": 5526, "Pretrain/Step Time": 8.517026657238603} +{"Pretrain/Learning Rate": 1.981245021563479e-05, "Pretrain/Loss": 2.0329928398132324, "Pretrain/Loss (Raw)": 1.9966579675674438, "Pretrain/Step": 5527, "Pretrain/Step Time": 8.514857804402709} +{"Pretrain/Learning Rate": 1.9804145427313213e-05, "Pretrain/Loss": 2.0306057929992676, "Pretrain/Loss (Raw)": 1.8408677577972412, "Pretrain/Step": 5528, "Pretrain/Step Time": 8.51139647513628} +{"Pretrain/Learning Rate": 1.9795841238202077e-05, "Pretrain/Loss": 2.031726837158203, "Pretrain/Loss (Raw)": 2.0454654693603516, "Pretrain/Step": 5529, "Pretrain/Step Time": 8.516670774668455} +{"Pretrain/Learning Rate": 1.9787537649259043e-05, "Pretrain/Loss": 2.032392740249634, "Pretrain/Loss (Raw)": 2.0718588829040527, "Pretrain/Step": 5530, "Pretrain/Step Time": 8.51755814999342} +{"Pretrain/Learning Rate": 1.977923466144174e-05, "Pretrain/Loss": 2.0327229499816895, "Pretrain/Loss (Raw)": 1.9384721517562866, "Pretrain/Step": 5531, "Pretrain/Step Time": 8.522574378177524} +{"Pretrain/Learning Rate": 1.977093227570768e-05, "Pretrain/Loss": 2.030174970626831, "Pretrain/Loss (Raw)": 1.6322754621505737, "Pretrain/Step": 5532, "Pretrain/Step Time": 8.509138483554125} +{"Pretrain/Learning Rate": 1.9762630493014366e-05, "Pretrain/Loss": 2.0275352001190186, "Pretrain/Loss (Raw)": 1.841524362564087, "Pretrain/Step": 5533, "Pretrain/Step Time": 8.507745776325464} +{"Pretrain/Learning Rate": 1.9754329314319176e-05, "Pretrain/Loss": 2.025486707687378, "Pretrain/Loss (Raw)": 1.9936349391937256, "Pretrain/Step": 5534, "Pretrain/Step Time": 8.507155997678638} +{"Pretrain/Learning Rate": 1.974602874057945e-05, "Pretrain/Loss": 2.0239360332489014, "Pretrain/Loss (Raw)": 1.8879252672195435, "Pretrain/Step": 5535, "Pretrain/Step Time": 8.50917562097311} +{"Pretrain/Learning Rate": 1.9737728772752446e-05, "Pretrain/Loss": 2.0256447792053223, "Pretrain/Loss (Raw)": 2.263510227203369, "Pretrain/Step": 5536, "Pretrain/Step Time": 8.511118238791823} +{"Pretrain/Learning Rate": 1.9729429411795358e-05, "Pretrain/Loss": 2.0281691551208496, "Pretrain/Loss (Raw)": 2.0368990898132324, "Pretrain/Step": 5537, "Pretrain/Step Time": 8.51083185710013} +{"Pretrain/Learning Rate": 1.97211306586653e-05, "Pretrain/Loss": 2.0265607833862305, "Pretrain/Loss (Raw)": 1.948737382888794, "Pretrain/Step": 5538, "Pretrain/Step Time": 8.50998224876821} +{"Pretrain/Learning Rate": 1.971283251431934e-05, "Pretrain/Loss": 2.0261166095733643, "Pretrain/Loss (Raw)": 2.0288729667663574, "Pretrain/Step": 5539, "Pretrain/Step Time": 8.501157328486443} +{"Pretrain/Learning Rate": 1.970453497971444e-05, "Pretrain/Loss": 2.023134231567383, "Pretrain/Loss (Raw)": 2.036710262298584, "Pretrain/Step": 5540, "Pretrain/Step Time": 8.501892818138003} +{"Pretrain/Learning Rate": 1.969623805580752e-05, "Pretrain/Loss": 2.0240986347198486, "Pretrain/Loss (Raw)": 2.0361812114715576, "Pretrain/Step": 5541, "Pretrain/Step Time": 8.50802438147366} +{"Pretrain/Learning Rate": 1.9687941743555422e-05, "Pretrain/Loss": 2.023826837539673, "Pretrain/Loss (Raw)": 2.004526138305664, "Pretrain/Step": 5542, "Pretrain/Step Time": 8.516813838854432} +{"Pretrain/Learning Rate": 1.9679646043914914e-05, "Pretrain/Loss": 2.0244996547698975, "Pretrain/Loss (Raw)": 1.9185174703598022, "Pretrain/Step": 5543, "Pretrain/Step Time": 8.512012459337711} +{"Pretrain/Learning Rate": 1.967135095784269e-05, "Pretrain/Loss": 2.0266618728637695, "Pretrain/Loss (Raw)": 2.0468294620513916, "Pretrain/Step": 5544, "Pretrain/Step Time": 8.51128089800477} +{"Pretrain/Learning Rate": 1.966305648629539e-05, "Pretrain/Loss": 2.0264859199523926, "Pretrain/Loss (Raw)": 1.9564403295516968, "Pretrain/Step": 5545, "Pretrain/Step Time": 8.509946370497346} +{"Pretrain/Learning Rate": 1.9654762630229558e-05, "Pretrain/Loss": 2.025536060333252, "Pretrain/Loss (Raw)": 2.057469129562378, "Pretrain/Step": 5546, "Pretrain/Step Time": 8.51814179122448} +{"Pretrain/Learning Rate": 1.9646469390601692e-05, "Pretrain/Loss": 2.0236244201660156, "Pretrain/Loss (Raw)": 1.9531513452529907, "Pretrain/Step": 5547, "Pretrain/Step Time": 8.516940284520388} +{"Pretrain/Learning Rate": 1.96381767683682e-05, "Pretrain/Loss": 2.0209555625915527, "Pretrain/Loss (Raw)": 1.9423531293869019, "Pretrain/Step": 5548, "Pretrain/Step Time": 8.51978014037013} +{"Pretrain/Learning Rate": 1.9629884764485422e-05, "Pretrain/Loss": 2.0218286514282227, "Pretrain/Loss (Raw)": 2.0188968181610107, "Pretrain/Step": 5549, "Pretrain/Step Time": 8.5174873881042} +{"Pretrain/Learning Rate": 1.962159337990965e-05, "Pretrain/Loss": 2.0202598571777344, "Pretrain/Loss (Raw)": 1.9067561626434326, "Pretrain/Step": 5550, "Pretrain/Step Time": 8.510218711569905} +{"Pretrain/Learning Rate": 1.9613302615597064e-05, "Pretrain/Loss": 2.0200741291046143, "Pretrain/Loss (Raw)": 1.9987679719924927, "Pretrain/Step": 5551, "Pretrain/Step Time": 8.508328067138791} +{"Pretrain/Learning Rate": 1.960501247250381e-05, "Pretrain/Loss": 2.0180163383483887, "Pretrain/Loss (Raw)": 1.850202202796936, "Pretrain/Step": 5552, "Pretrain/Step Time": 8.513704961165786} +{"Pretrain/Learning Rate": 1.9596722951585936e-05, "Pretrain/Loss": 2.0183186531066895, "Pretrain/Loss (Raw)": 2.082594156265259, "Pretrain/Step": 5553, "Pretrain/Step Time": 8.512296373024583} +{"Pretrain/Learning Rate": 1.9588434053799437e-05, "Pretrain/Loss": 2.016935348510742, "Pretrain/Loss (Raw)": 2.0582375526428223, "Pretrain/Step": 5554, "Pretrain/Step Time": 8.510748364031315} +{"Pretrain/Learning Rate": 1.9580145780100216e-05, "Pretrain/Loss": 2.0182485580444336, "Pretrain/Loss (Raw)": 2.203200101852417, "Pretrain/Step": 5555, "Pretrain/Step Time": 8.51349950954318} +{"Pretrain/Learning Rate": 1.9571858131444128e-05, "Pretrain/Loss": 2.019789695739746, "Pretrain/Loss (Raw)": 2.1372299194335938, "Pretrain/Step": 5556, "Pretrain/Step Time": 8.509326262399554} +{"Pretrain/Learning Rate": 1.9563571108786936e-05, "Pretrain/Loss": 2.0155181884765625, "Pretrain/Loss (Raw)": 1.748203158378601, "Pretrain/Step": 5557, "Pretrain/Step Time": 8.508290871977806} +{"Pretrain/Learning Rate": 1.9555284713084345e-05, "Pretrain/Loss": 2.0154786109924316, "Pretrain/Loss (Raw)": 2.0234320163726807, "Pretrain/Step": 5558, "Pretrain/Step Time": 8.515944980084896} +{"Pretrain/Learning Rate": 1.954699894529197e-05, "Pretrain/Loss": 2.015045166015625, "Pretrain/Loss (Raw)": 1.9221694469451904, "Pretrain/Step": 5559, "Pretrain/Step Time": 8.520388342440128} +{"Pretrain/Learning Rate": 1.953871380636538e-05, "Pretrain/Loss": 2.013770580291748, "Pretrain/Loss (Raw)": 1.916398286819458, "Pretrain/Step": 5560, "Pretrain/Step Time": 8.519859367981553} +{"Pretrain/Learning Rate": 1.953042929726004e-05, "Pretrain/Loss": 2.01397705078125, "Pretrain/Loss (Raw)": 2.019284725189209, "Pretrain/Step": 5561, "Pretrain/Step Time": 8.524596609175205} +{"Pretrain/Learning Rate": 1.952214541893138e-05, "Pretrain/Loss": 2.016481399536133, "Pretrain/Loss (Raw)": 1.8821606636047363, "Pretrain/Step": 5562, "Pretrain/Step Time": 8.517698835581541} +{"Pretrain/Learning Rate": 1.9513862172334707e-05, "Pretrain/Loss": 2.0150654315948486, "Pretrain/Loss (Raw)": 2.011510133743286, "Pretrain/Step": 5563, "Pretrain/Step Time": 8.508652780205011} +{"Pretrain/Learning Rate": 1.9505579558425313e-05, "Pretrain/Loss": 2.015090227127075, "Pretrain/Loss (Raw)": 1.9518423080444336, "Pretrain/Step": 5564, "Pretrain/Step Time": 8.516287200152874} +{"Pretrain/Learning Rate": 1.9497297578158363e-05, "Pretrain/Loss": 2.012742519378662, "Pretrain/Loss (Raw)": 1.6946008205413818, "Pretrain/Step": 5565, "Pretrain/Step Time": 8.51590789295733} +{"Pretrain/Learning Rate": 1.9489016232489e-05, "Pretrain/Loss": 2.011087417602539, "Pretrain/Loss (Raw)": 2.0322530269622803, "Pretrain/Step": 5566, "Pretrain/Step Time": 8.516483088955283} +{"Pretrain/Learning Rate": 1.9480735522372236e-05, "Pretrain/Loss": 2.0129342079162598, "Pretrain/Loss (Raw)": 2.309706449508667, "Pretrain/Step": 5567, "Pretrain/Step Time": 8.506340919062495} +{"Pretrain/Learning Rate": 1.9472455448763077e-05, "Pretrain/Loss": 2.013474464416504, "Pretrain/Loss (Raw)": 1.9926810264587402, "Pretrain/Step": 5568, "Pretrain/Step Time": 8.502280028536916} +{"Pretrain/Learning Rate": 1.9464176012616386e-05, "Pretrain/Loss": 2.0129518508911133, "Pretrain/Loss (Raw)": 1.9838354587554932, "Pretrain/Step": 5569, "Pretrain/Step Time": 8.504595063626766} +{"Pretrain/Learning Rate": 1.945589721488702e-05, "Pretrain/Loss": 2.011892080307007, "Pretrain/Loss (Raw)": 2.010775327682495, "Pretrain/Step": 5570, "Pretrain/Step Time": 8.505777034908533} +{"Pretrain/Learning Rate": 1.9447619056529697e-05, "Pretrain/Loss": 2.011910915374756, "Pretrain/Loss (Raw)": 2.010913133621216, "Pretrain/Step": 5571, "Pretrain/Step Time": 8.5080989561975} +{"Pretrain/Learning Rate": 1.9439341538499117e-05, "Pretrain/Loss": 2.011843681335449, "Pretrain/Loss (Raw)": 2.1089930534362793, "Pretrain/Step": 5572, "Pretrain/Step Time": 8.505483414977789} +{"Pretrain/Learning Rate": 1.9431064661749866e-05, "Pretrain/Loss": 2.011441230773926, "Pretrain/Loss (Raw)": 1.912877082824707, "Pretrain/Step": 5573, "Pretrain/Step Time": 8.50372869707644} +{"Pretrain/Learning Rate": 1.9422788427236487e-05, "Pretrain/Loss": 2.0099387168884277, "Pretrain/Loss (Raw)": 2.1421873569488525, "Pretrain/Step": 5574, "Pretrain/Step Time": 8.489774152636528} +{"Pretrain/Learning Rate": 1.9414512835913422e-05, "Pretrain/Loss": 2.010061025619507, "Pretrain/Loss (Raw)": 2.1232004165649414, "Pretrain/Step": 5575, "Pretrain/Step Time": 8.49612819775939} +{"Pretrain/Learning Rate": 1.940623788873506e-05, "Pretrain/Loss": 2.008249282836914, "Pretrain/Loss (Raw)": 1.8283041715621948, "Pretrain/Step": 5576, "Pretrain/Step Time": 8.502931825816631} +{"Pretrain/Learning Rate": 1.9397963586655702e-05, "Pretrain/Loss": 2.0088014602661133, "Pretrain/Loss (Raw)": 2.228276252746582, "Pretrain/Step": 5577, "Pretrain/Step Time": 8.506049122661352} +{"Pretrain/Learning Rate": 1.9389689930629585e-05, "Pretrain/Loss": 2.0083956718444824, "Pretrain/Loss (Raw)": 2.0785634517669678, "Pretrain/Step": 5578, "Pretrain/Step Time": 8.504713743925095} +{"Pretrain/Learning Rate": 1.9381416921610855e-05, "Pretrain/Loss": 2.009812355041504, "Pretrain/Loss (Raw)": 2.0546655654907227, "Pretrain/Step": 5579, "Pretrain/Step Time": 8.498737743124366} +{"Pretrain/Learning Rate": 1.9373144560553604e-05, "Pretrain/Loss": 2.0097055435180664, "Pretrain/Loss (Raw)": 2.049125909805298, "Pretrain/Step": 5580, "Pretrain/Step Time": 8.504071164876223} +{"Pretrain/Learning Rate": 1.9364872848411837e-05, "Pretrain/Loss": 2.009289264678955, "Pretrain/Loss (Raw)": 2.072421073913574, "Pretrain/Step": 5581, "Pretrain/Step Time": 8.51359597593546} +{"Pretrain/Learning Rate": 1.9356601786139487e-05, "Pretrain/Loss": 2.0082316398620605, "Pretrain/Loss (Raw)": 1.9558303356170654, "Pretrain/Step": 5582, "Pretrain/Step Time": 8.518425427377224} +{"Pretrain/Learning Rate": 1.934833137469041e-05, "Pretrain/Loss": 2.007856845855713, "Pretrain/Loss (Raw)": 2.0381410121917725, "Pretrain/Step": 5583, "Pretrain/Step Time": 8.519943784922361} +{"Pretrain/Learning Rate": 1.9340061615018393e-05, "Pretrain/Loss": 2.0068352222442627, "Pretrain/Loss (Raw)": 1.9835851192474365, "Pretrain/Step": 5584, "Pretrain/Step Time": 8.515063287690282} +{"Pretrain/Learning Rate": 1.9331792508077136e-05, "Pretrain/Loss": 2.0062332153320312, "Pretrain/Loss (Raw)": 1.8640629053115845, "Pretrain/Step": 5585, "Pretrain/Step Time": 8.510346906259656} +{"Pretrain/Learning Rate": 1.9323524054820285e-05, "Pretrain/Loss": 2.0053446292877197, "Pretrain/Loss (Raw)": 1.8737127780914307, "Pretrain/Step": 5586, "Pretrain/Step Time": 8.510005811229348} +{"Pretrain/Learning Rate": 1.9315256256201382e-05, "Pretrain/Loss": 2.0071463584899902, "Pretrain/Loss (Raw)": 2.1880669593811035, "Pretrain/Step": 5587, "Pretrain/Step Time": 8.515356563031673} +{"Pretrain/Learning Rate": 1.930698911317392e-05, "Pretrain/Loss": 2.00272798538208, "Pretrain/Loss (Raw)": 1.5142744779586792, "Pretrain/Step": 5588, "Pretrain/Step Time": 8.514913614839315} +{"Pretrain/Learning Rate": 1.929872262669129e-05, "Pretrain/Loss": 2.004894733428955, "Pretrain/Loss (Raw)": 1.7985590696334839, "Pretrain/Step": 5589, "Pretrain/Step Time": 8.514632817357779} +{"Pretrain/Learning Rate": 1.9290456797706835e-05, "Pretrain/Loss": 2.0049777030944824, "Pretrain/Loss (Raw)": 1.9923499822616577, "Pretrain/Step": 5590, "Pretrain/Step Time": 8.508911047130823} +{"Pretrain/Learning Rate": 1.928219162717381e-05, "Pretrain/Loss": 2.0060200691223145, "Pretrain/Loss (Raw)": 1.9697540998458862, "Pretrain/Step": 5591, "Pretrain/Step Time": 8.501601023599505} +{"Pretrain/Learning Rate": 1.927392711604539e-05, "Pretrain/Loss": 2.005033493041992, "Pretrain/Loss (Raw)": 1.7896244525909424, "Pretrain/Step": 5592, "Pretrain/Step Time": 8.49724206700921} +{"Pretrain/Learning Rate": 1.926566326527468e-05, "Pretrain/Loss": 2.00445556640625, "Pretrain/Loss (Raw)": 1.9418212175369263, "Pretrain/Step": 5593, "Pretrain/Step Time": 8.500640664249659} +{"Pretrain/Learning Rate": 1.9257400075814697e-05, "Pretrain/Loss": 2.0035159587860107, "Pretrain/Loss (Raw)": 2.0329670906066895, "Pretrain/Step": 5594, "Pretrain/Step Time": 8.508821368217468} +{"Pretrain/Learning Rate": 1.92491375486184e-05, "Pretrain/Loss": 2.004579544067383, "Pretrain/Loss (Raw)": 2.079367160797119, "Pretrain/Step": 5595, "Pretrain/Step Time": 8.513225192204118} +{"Pretrain/Learning Rate": 1.9240875684638658e-05, "Pretrain/Loss": 2.0044922828674316, "Pretrain/Loss (Raw)": 2.23673152923584, "Pretrain/Step": 5596, "Pretrain/Step Time": 8.518570339307189} +{"Pretrain/Learning Rate": 1.9232614484828277e-05, "Pretrain/Loss": 2.007293224334717, "Pretrain/Loss (Raw)": 2.162682294845581, "Pretrain/Step": 5597, "Pretrain/Step Time": 8.513426078483462} +{"Pretrain/Learning Rate": 1.922435395013996e-05, "Pretrain/Loss": 2.006824493408203, "Pretrain/Loss (Raw)": 2.012784719467163, "Pretrain/Step": 5598, "Pretrain/Step Time": 8.510834353044629} +{"Pretrain/Learning Rate": 1.921609408152637e-05, "Pretrain/Loss": 2.006474018096924, "Pretrain/Loss (Raw)": 2.193113327026367, "Pretrain/Step": 5599, "Pretrain/Step Time": 8.515570931136608} +{"Pretrain/Learning Rate": 1.9207834879940058e-05, "Pretrain/Loss": 2.00750470161438, "Pretrain/Loss (Raw)": 1.894069790840149, "Pretrain/Step": 5600, "Pretrain/Step Time": 8.527449056506157} +{"Pretrain/Learning Rate": 1.919957634633353e-05, "Pretrain/Loss": 2.005702495574951, "Pretrain/Loss (Raw)": 1.9105855226516724, "Pretrain/Step": 5601, "Pretrain/Step Time": 8.52367421798408} +{"Pretrain/Learning Rate": 1.9191318481659183e-05, "Pretrain/Loss": 2.0070018768310547, "Pretrain/Loss (Raw)": 2.261730194091797, "Pretrain/Step": 5602, "Pretrain/Step Time": 8.523073380813003} +{"Pretrain/Learning Rate": 1.918306128686937e-05, "Pretrain/Loss": 2.0047881603240967, "Pretrain/Loss (Raw)": 2.0288565158843994, "Pretrain/Step": 5603, "Pretrain/Step Time": 8.518610617145896} +{"Pretrain/Learning Rate": 1.9174804762916324e-05, "Pretrain/Loss": 2.0055909156799316, "Pretrain/Loss (Raw)": 2.0634634494781494, "Pretrain/Step": 5604, "Pretrain/Step Time": 8.517730114981532} +{"Pretrain/Learning Rate": 1.916654891075226e-05, "Pretrain/Loss": 2.0043110847473145, "Pretrain/Loss (Raw)": 1.86568284034729, "Pretrain/Step": 5605, "Pretrain/Step Time": 8.515642303973436} +{"Pretrain/Learning Rate": 1.915829373132924e-05, "Pretrain/Loss": 2.0053906440734863, "Pretrain/Loss (Raw)": 1.9574319124221802, "Pretrain/Step": 5606, "Pretrain/Step Time": 8.527291828766465} +{"Pretrain/Learning Rate": 1.9150039225599336e-05, "Pretrain/Loss": 2.0044922828674316, "Pretrain/Loss (Raw)": 2.023552656173706, "Pretrain/Step": 5607, "Pretrain/Step Time": 8.52881714142859} +{"Pretrain/Learning Rate": 1.914178539451446e-05, "Pretrain/Loss": 2.0019211769104004, "Pretrain/Loss (Raw)": 1.8205121755599976, "Pretrain/Step": 5608, "Pretrain/Step Time": 8.525571376085281} +{"Pretrain/Learning Rate": 1.913353223902651e-05, "Pretrain/Loss": 2.004622220993042, "Pretrain/Loss (Raw)": 2.166735887527466, "Pretrain/Step": 5609, "Pretrain/Step Time": 8.518980188295245} +{"Pretrain/Learning Rate": 1.912527976008725e-05, "Pretrain/Loss": 2.004945993423462, "Pretrain/Loss (Raw)": 1.9829766750335693, "Pretrain/Step": 5610, "Pretrain/Step Time": 8.517431756481528} +{"Pretrain/Learning Rate": 1.911702795864843e-05, "Pretrain/Loss": 2.00606632232666, "Pretrain/Loss (Raw)": 2.0289604663848877, "Pretrain/Step": 5611, "Pretrain/Step Time": 8.515597799792886} +{"Pretrain/Learning Rate": 1.9108776835661655e-05, "Pretrain/Loss": 2.0045080184936523, "Pretrain/Loss (Raw)": 2.015988826751709, "Pretrain/Step": 5612, "Pretrain/Step Time": 8.512765543535352} +{"Pretrain/Learning Rate": 1.91005263920785e-05, "Pretrain/Loss": 2.00203537940979, "Pretrain/Loss (Raw)": 2.021474838256836, "Pretrain/Step": 5613, "Pretrain/Step Time": 8.518582319840789} +{"Pretrain/Learning Rate": 1.9092276628850438e-05, "Pretrain/Loss": 2.0021910667419434, "Pretrain/Loss (Raw)": 2.0923497676849365, "Pretrain/Step": 5614, "Pretrain/Step Time": 8.517946194857359} +{"Pretrain/Learning Rate": 1.9084027546928872e-05, "Pretrain/Loss": 2.0018410682678223, "Pretrain/Loss (Raw)": 2.021285057067871, "Pretrain/Step": 5615, "Pretrain/Step Time": 8.513329977169633} +{"Pretrain/Learning Rate": 1.907577914726513e-05, "Pretrain/Loss": 2.0045173168182373, "Pretrain/Loss (Raw)": 2.1097781658172607, "Pretrain/Step": 5616, "Pretrain/Step Time": 8.511880418285728} +{"Pretrain/Learning Rate": 1.906753143081045e-05, "Pretrain/Loss": 2.0050883293151855, "Pretrain/Loss (Raw)": 2.0016353130340576, "Pretrain/Step": 5617, "Pretrain/Step Time": 8.510709526017308} +{"Pretrain/Learning Rate": 1.9059284398515997e-05, "Pretrain/Loss": 2.005598306655884, "Pretrain/Loss (Raw)": 2.2106008529663086, "Pretrain/Step": 5618, "Pretrain/Step Time": 8.520419178530574} +{"Pretrain/Learning Rate": 1.9051038051332868e-05, "Pretrain/Loss": 2.00530743598938, "Pretrain/Loss (Raw)": 1.9812431335449219, "Pretrain/Step": 5619, "Pretrain/Step Time": 8.526356222108006} +{"Pretrain/Learning Rate": 1.9042792390212054e-05, "Pretrain/Loss": 2.005418300628662, "Pretrain/Loss (Raw)": 1.9313552379608154, "Pretrain/Step": 5620, "Pretrain/Step Time": 8.515865102410316} +{"Pretrain/Learning Rate": 1.9034547416104502e-05, "Pretrain/Loss": 2.005871534347534, "Pretrain/Loss (Raw)": 2.1259241104125977, "Pretrain/Step": 5621, "Pretrain/Step Time": 8.509772321209311} +{"Pretrain/Learning Rate": 1.9026303129961047e-05, "Pretrain/Loss": 2.004589080810547, "Pretrain/Loss (Raw)": 1.7253338098526, "Pretrain/Step": 5622, "Pretrain/Step Time": 8.510632136836648} +{"Pretrain/Learning Rate": 1.901805953273247e-05, "Pretrain/Loss": 2.009779930114746, "Pretrain/Loss (Raw)": 2.5753896236419678, "Pretrain/Step": 5623, "Pretrain/Step Time": 8.512970140203834} +{"Pretrain/Learning Rate": 1.900981662536945e-05, "Pretrain/Loss": 2.0101656913757324, "Pretrain/Loss (Raw)": 1.9422739744186401, "Pretrain/Step": 5624, "Pretrain/Step Time": 8.521898800507188} +{"Pretrain/Learning Rate": 1.9001574408822603e-05, "Pretrain/Loss": 2.0120885372161865, "Pretrain/Loss (Raw)": 2.0359177589416504, "Pretrain/Step": 5625, "Pretrain/Step Time": 8.521644044667482} +{"Pretrain/Learning Rate": 1.899333288404246e-05, "Pretrain/Loss": 2.0132341384887695, "Pretrain/Loss (Raw)": 2.151557207107544, "Pretrain/Step": 5626, "Pretrain/Step Time": 8.523098342120647} +{"Pretrain/Learning Rate": 1.8985092051979478e-05, "Pretrain/Loss": 2.0120363235473633, "Pretrain/Loss (Raw)": 1.9579408168792725, "Pretrain/Step": 5627, "Pretrain/Step Time": 8.512194944545627} +{"Pretrain/Learning Rate": 1.897685191358402e-05, "Pretrain/Loss": 2.0126519203186035, "Pretrain/Loss (Raw)": 2.0292391777038574, "Pretrain/Step": 5628, "Pretrain/Step Time": 8.506868448108435} +{"Pretrain/Learning Rate": 1.8968612469806387e-05, "Pretrain/Loss": 2.0106005668640137, "Pretrain/Loss (Raw)": 2.1022145748138428, "Pretrain/Step": 5629, "Pretrain/Step Time": 8.50574185885489} +{"Pretrain/Learning Rate": 1.8960373721596775e-05, "Pretrain/Loss": 2.0108819007873535, "Pretrain/Loss (Raw)": 2.019819498062134, "Pretrain/Step": 5630, "Pretrain/Step Time": 8.50554153881967} +{"Pretrain/Learning Rate": 1.8952135669905334e-05, "Pretrain/Loss": 2.01072359085083, "Pretrain/Loss (Raw)": 2.159423351287842, "Pretrain/Step": 5631, "Pretrain/Step Time": 8.52001777291298} +{"Pretrain/Learning Rate": 1.89438983156821e-05, "Pretrain/Loss": 2.011789321899414, "Pretrain/Loss (Raw)": 1.9982165098190308, "Pretrain/Step": 5632, "Pretrain/Step Time": 8.513896699994802} +{"Pretrain/Learning Rate": 1.8935661659877046e-05, "Pretrain/Loss": 2.0123579502105713, "Pretrain/Loss (Raw)": 1.9310541152954102, "Pretrain/Step": 5633, "Pretrain/Step Time": 8.505769265815616} +{"Pretrain/Learning Rate": 1.8927425703440076e-05, "Pretrain/Loss": 2.011305809020996, "Pretrain/Loss (Raw)": 2.011759042739868, "Pretrain/Step": 5634, "Pretrain/Step Time": 8.50730525329709} +{"Pretrain/Learning Rate": 1.8919190447320982e-05, "Pretrain/Loss": 2.015672206878662, "Pretrain/Loss (Raw)": 2.4308478832244873, "Pretrain/Step": 5635, "Pretrain/Step Time": 8.508174428716302} +{"Pretrain/Learning Rate": 1.8910955892469505e-05, "Pretrain/Loss": 2.015371322631836, "Pretrain/Loss (Raw)": 2.145395278930664, "Pretrain/Step": 5636, "Pretrain/Step Time": 8.517203994095325} +{"Pretrain/Learning Rate": 1.890272203983528e-05, "Pretrain/Loss": 2.016782283782959, "Pretrain/Loss (Raw)": 2.0446391105651855, "Pretrain/Step": 5637, "Pretrain/Step Time": 8.52305748872459} +{"Pretrain/Learning Rate": 1.8894488890367885e-05, "Pretrain/Loss": 2.016782283782959, "Pretrain/Loss (Raw)": 1.9425060749053955, "Pretrain/Step": 5638, "Pretrain/Step Time": 8.520497895777225} +{"Pretrain/Learning Rate": 1.8886256445016798e-05, "Pretrain/Loss": 2.0170106887817383, "Pretrain/Loss (Raw)": 2.198422908782959, "Pretrain/Step": 5639, "Pretrain/Step Time": 8.51553339138627} +{"Pretrain/Learning Rate": 1.8878024704731433e-05, "Pretrain/Loss": 2.019002914428711, "Pretrain/Loss (Raw)": 2.234149217605591, "Pretrain/Step": 5640, "Pretrain/Step Time": 8.51901464536786} +{"Pretrain/Learning Rate": 1.88697936704611e-05, "Pretrain/Loss": 2.019587755203247, "Pretrain/Loss (Raw)": 1.9856301546096802, "Pretrain/Step": 5641, "Pretrain/Step Time": 8.516180414706469} +{"Pretrain/Learning Rate": 1.8861563343155054e-05, "Pretrain/Loss": 2.020310163497925, "Pretrain/Loss (Raw)": 2.0110790729522705, "Pretrain/Step": 5642, "Pretrain/Step Time": 8.520632421597838} +{"Pretrain/Learning Rate": 1.8853333723762438e-05, "Pretrain/Loss": 2.0201706886291504, "Pretrain/Loss (Raw)": 1.897552728652954, "Pretrain/Step": 5643, "Pretrain/Step Time": 8.521746015176177} +{"Pretrain/Learning Rate": 1.884510481323236e-05, "Pretrain/Loss": 2.023858070373535, "Pretrain/Loss (Raw)": 2.431100845336914, "Pretrain/Step": 5644, "Pretrain/Step Time": 8.519730666652322} +{"Pretrain/Learning Rate": 1.8836876612513777e-05, "Pretrain/Loss": 2.0239953994750977, "Pretrain/Loss (Raw)": 2.010558843612671, "Pretrain/Step": 5645, "Pretrain/Step Time": 8.517157321795821} +{"Pretrain/Learning Rate": 1.882864912255564e-05, "Pretrain/Loss": 2.02526593208313, "Pretrain/Loss (Raw)": 2.2266550064086914, "Pretrain/Step": 5646, "Pretrain/Step Time": 8.514610076323152} +{"Pretrain/Learning Rate": 1.882042234430675e-05, "Pretrain/Loss": 2.022470712661743, "Pretrain/Loss (Raw)": 2.090880870819092, "Pretrain/Step": 5647, "Pretrain/Step Time": 8.51555797457695} +{"Pretrain/Learning Rate": 1.8812196278715895e-05, "Pretrain/Loss": 2.0261120796203613, "Pretrain/Loss (Raw)": 2.393634557723999, "Pretrain/Step": 5648, "Pretrain/Step Time": 8.514356330037117} +{"Pretrain/Learning Rate": 1.8803970926731703e-05, "Pretrain/Loss": 2.0258936882019043, "Pretrain/Loss (Raw)": 2.131013870239258, "Pretrain/Step": 5649, "Pretrain/Step Time": 8.513923414051533} +{"Pretrain/Learning Rate": 1.8795746289302798e-05, "Pretrain/Loss": 2.0270495414733887, "Pretrain/Loss (Raw)": 1.9953655004501343, "Pretrain/Step": 5650, "Pretrain/Step Time": 8.51036717183888} +{"Pretrain/Learning Rate": 1.878752236737765e-05, "Pretrain/Loss": 2.025484323501587, "Pretrain/Loss (Raw)": 1.9641613960266113, "Pretrain/Step": 5651, "Pretrain/Step Time": 8.496781580150127} +{"Pretrain/Learning Rate": 1.8779299161904712e-05, "Pretrain/Loss": 2.02266788482666, "Pretrain/Loss (Raw)": 2.0835866928100586, "Pretrain/Step": 5652, "Pretrain/Step Time": 8.498611081391573} +{"Pretrain/Learning Rate": 1.87710766738323e-05, "Pretrain/Loss": 2.0227675437927246, "Pretrain/Loss (Raw)": 2.110811233520508, "Pretrain/Step": 5653, "Pretrain/Step Time": 8.50173300690949} +{"Pretrain/Learning Rate": 1.8762854904108677e-05, "Pretrain/Loss": 2.024294376373291, "Pretrain/Loss (Raw)": 2.15476655960083, "Pretrain/Step": 5654, "Pretrain/Step Time": 8.506045941263437} +{"Pretrain/Learning Rate": 1.8754633853682016e-05, "Pretrain/Loss": 2.025324821472168, "Pretrain/Loss (Raw)": 2.128539562225342, "Pretrain/Step": 5655, "Pretrain/Step Time": 8.512477727606893} +{"Pretrain/Learning Rate": 1.874641352350041e-05, "Pretrain/Loss": 2.028632640838623, "Pretrain/Loss (Raw)": 2.2642979621887207, "Pretrain/Step": 5656, "Pretrain/Step Time": 8.50687711685896} +{"Pretrain/Learning Rate": 1.8738193914511865e-05, "Pretrain/Loss": 2.027438163757324, "Pretrain/Loss (Raw)": 1.89259672164917, "Pretrain/Step": 5657, "Pretrain/Step Time": 8.506529657170177} +{"Pretrain/Learning Rate": 1.8729975027664303e-05, "Pretrain/Loss": 2.023501396179199, "Pretrain/Loss (Raw)": 1.567942500114441, "Pretrain/Step": 5658, "Pretrain/Step Time": 8.509599901735783} +{"Pretrain/Learning Rate": 1.8721756863905566e-05, "Pretrain/Loss": 2.024609327316284, "Pretrain/Loss (Raw)": 2.080267906188965, "Pretrain/Step": 5659, "Pretrain/Step Time": 8.511057991534472} +{"Pretrain/Learning Rate": 1.8713539424183417e-05, "Pretrain/Loss": 2.0286812782287598, "Pretrain/Loss (Raw)": 2.1534922122955322, "Pretrain/Step": 5660, "Pretrain/Step Time": 8.513595048338175} +{"Pretrain/Learning Rate": 1.8705322709445515e-05, "Pretrain/Loss": 2.0305633544921875, "Pretrain/Loss (Raw)": 2.082425832748413, "Pretrain/Step": 5661, "Pretrain/Step Time": 8.513734186068177} +{"Pretrain/Learning Rate": 1.8697106720639467e-05, "Pretrain/Loss": 2.0323238372802734, "Pretrain/Loss (Raw)": 2.218975067138672, "Pretrain/Step": 5662, "Pretrain/Step Time": 8.5111581441015} +{"Pretrain/Learning Rate": 1.8688891458712765e-05, "Pretrain/Loss": 2.0337793827056885, "Pretrain/Loss (Raw)": 2.0742318630218506, "Pretrain/Step": 5663, "Pretrain/Step Time": 8.507946344092488} +{"Pretrain/Learning Rate": 1.8680676924612847e-05, "Pretrain/Loss": 2.0318808555603027, "Pretrain/Loss (Raw)": 2.0205001831054688, "Pretrain/Step": 5664, "Pretrain/Step Time": 8.511634154245257} +{"Pretrain/Learning Rate": 1.8672463119287037e-05, "Pretrain/Loss": 2.0322909355163574, "Pretrain/Loss (Raw)": 2.089409589767456, "Pretrain/Step": 5665, "Pretrain/Step Time": 8.511693404987454} +{"Pretrain/Learning Rate": 1.86642500436826e-05, "Pretrain/Loss": 2.0328452587127686, "Pretrain/Loss (Raw)": 2.0196616649627686, "Pretrain/Step": 5666, "Pretrain/Step Time": 8.512456249445677} +{"Pretrain/Learning Rate": 1.8656037698746704e-05, "Pretrain/Loss": 2.0347607135772705, "Pretrain/Loss (Raw)": 2.2740793228149414, "Pretrain/Step": 5667, "Pretrain/Step Time": 8.517557060346007} +{"Pretrain/Learning Rate": 1.8647826085426433e-05, "Pretrain/Loss": 2.0356264114379883, "Pretrain/Loss (Raw)": 2.1475343704223633, "Pretrain/Step": 5668, "Pretrain/Step Time": 8.512506579980254} +{"Pretrain/Learning Rate": 1.8639615204668786e-05, "Pretrain/Loss": 2.0364089012145996, "Pretrain/Loss (Raw)": 2.1362879276275635, "Pretrain/Step": 5669, "Pretrain/Step Time": 8.503841137513518} +{"Pretrain/Learning Rate": 1.863140505742069e-05, "Pretrain/Loss": 2.0358543395996094, "Pretrain/Loss (Raw)": 1.9335503578186035, "Pretrain/Step": 5670, "Pretrain/Step Time": 8.501497436314821} +{"Pretrain/Learning Rate": 1.862319564462897e-05, "Pretrain/Loss": 2.0373287200927734, "Pretrain/Loss (Raw)": 2.1072757244110107, "Pretrain/Step": 5671, "Pretrain/Step Time": 8.502241726964712} +{"Pretrain/Learning Rate": 1.8614986967240382e-05, "Pretrain/Loss": 2.035482883453369, "Pretrain/Loss (Raw)": 1.810528039932251, "Pretrain/Step": 5672, "Pretrain/Step Time": 8.50911563448608} +{"Pretrain/Learning Rate": 1.8606779026201577e-05, "Pretrain/Loss": 2.0368247032165527, "Pretrain/Loss (Raw)": 2.1282191276550293, "Pretrain/Step": 5673, "Pretrain/Step Time": 8.513543056324124} +{"Pretrain/Learning Rate": 1.859857182245914e-05, "Pretrain/Loss": 2.0349273681640625, "Pretrain/Loss (Raw)": 1.814616322517395, "Pretrain/Step": 5674, "Pretrain/Step Time": 8.504230201244354} +{"Pretrain/Learning Rate": 1.859036535695957e-05, "Pretrain/Loss": 2.035123586654663, "Pretrain/Loss (Raw)": 1.9782488346099854, "Pretrain/Step": 5675, "Pretrain/Step Time": 8.510356616228819} +{"Pretrain/Learning Rate": 1.858215963064927e-05, "Pretrain/Loss": 2.0361948013305664, "Pretrain/Loss (Raw)": 2.0794618129730225, "Pretrain/Step": 5676, "Pretrain/Step Time": 8.510485326871276} +{"Pretrain/Learning Rate": 1.8573954644474562e-05, "Pretrain/Loss": 2.0375921726226807, "Pretrain/Loss (Raw)": 2.1977500915527344, "Pretrain/Step": 5677, "Pretrain/Step Time": 8.519526448100805} +{"Pretrain/Learning Rate": 1.8565750399381684e-05, "Pretrain/Loss": 2.0375800132751465, "Pretrain/Loss (Raw)": 1.9052115678787231, "Pretrain/Step": 5678, "Pretrain/Step Time": 8.52026504650712} +{"Pretrain/Learning Rate": 1.8557546896316793e-05, "Pretrain/Loss": 2.036961317062378, "Pretrain/Loss (Raw)": 1.9195762872695923, "Pretrain/Step": 5679, "Pretrain/Step Time": 8.519571658223867} +{"Pretrain/Learning Rate": 1.8549344136225946e-05, "Pretrain/Loss": 2.0391061305999756, "Pretrain/Loss (Raw)": 2.124748468399048, "Pretrain/Step": 5680, "Pretrain/Step Time": 8.51014505699277} +{"Pretrain/Learning Rate": 1.8541142120055136e-05, "Pretrain/Loss": 2.038480758666992, "Pretrain/Loss (Raw)": 2.0025575160980225, "Pretrain/Step": 5681, "Pretrain/Step Time": 8.50988502241671} +{"Pretrain/Learning Rate": 1.8532940848750245e-05, "Pretrain/Loss": 2.0372934341430664, "Pretrain/Loss (Raw)": 1.9062377214431763, "Pretrain/Step": 5682, "Pretrain/Step Time": 8.516832936555147} +{"Pretrain/Learning Rate": 1.8524740323257095e-05, "Pretrain/Loss": 2.0364062786102295, "Pretrain/Loss (Raw)": 2.089634895324707, "Pretrain/Step": 5683, "Pretrain/Step Time": 8.522773450240493} +{"Pretrain/Learning Rate": 1.85165405445214e-05, "Pretrain/Loss": 2.0356788635253906, "Pretrain/Loss (Raw)": 2.044118642807007, "Pretrain/Step": 5684, "Pretrain/Step Time": 8.519266925752163} +{"Pretrain/Learning Rate": 1.8508341513488804e-05, "Pretrain/Loss": 2.038928270339966, "Pretrain/Loss (Raw)": 2.1641430854797363, "Pretrain/Step": 5685, "Pretrain/Step Time": 8.517845956608653} +{"Pretrain/Learning Rate": 1.8500143231104846e-05, "Pretrain/Loss": 2.0389771461486816, "Pretrain/Loss (Raw)": 2.029694080352783, "Pretrain/Step": 5686, "Pretrain/Step Time": 8.508344555273652} +{"Pretrain/Learning Rate": 1.8491945698315014e-05, "Pretrain/Loss": 2.0378127098083496, "Pretrain/Loss (Raw)": 1.7731224298477173, "Pretrain/Step": 5687, "Pretrain/Step Time": 8.503088062629104} +{"Pretrain/Learning Rate": 1.8483748916064654e-05, "Pretrain/Loss": 2.037393093109131, "Pretrain/Loss (Raw)": 1.862682819366455, "Pretrain/Step": 5688, "Pretrain/Step Time": 8.506705272942781} +{"Pretrain/Learning Rate": 1.8475552885299092e-05, "Pretrain/Loss": 2.0373709201812744, "Pretrain/Loss (Raw)": 2.0164413452148438, "Pretrain/Step": 5689, "Pretrain/Step Time": 8.511567646637559} +{"Pretrain/Learning Rate": 1.8467357606963496e-05, "Pretrain/Loss": 2.038374662399292, "Pretrain/Loss (Raw)": 2.010641098022461, "Pretrain/Step": 5690, "Pretrain/Step Time": 8.511462461203337} +{"Pretrain/Learning Rate": 1.845916308200302e-05, "Pretrain/Loss": 2.0392825603485107, "Pretrain/Loss (Raw)": 2.127716541290283, "Pretrain/Step": 5691, "Pretrain/Step Time": 8.516015227884054} +{"Pretrain/Learning Rate": 1.8450969311362666e-05, "Pretrain/Loss": 2.0398411750793457, "Pretrain/Loss (Raw)": 2.023334264755249, "Pretrain/Step": 5692, "Pretrain/Step Time": 8.508512338623405} +{"Pretrain/Learning Rate": 1.8442776295987403e-05, "Pretrain/Loss": 2.0427632331848145, "Pretrain/Loss (Raw)": 2.0686206817626953, "Pretrain/Step": 5693, "Pretrain/Step Time": 8.514271119609475} +{"Pretrain/Learning Rate": 1.843458403682206e-05, "Pretrain/Loss": 2.0428671836853027, "Pretrain/Loss (Raw)": 2.0455868244171143, "Pretrain/Step": 5694, "Pretrain/Step Time": 8.517594551667571} +{"Pretrain/Learning Rate": 1.8426392534811445e-05, "Pretrain/Loss": 2.0406556129455566, "Pretrain/Loss (Raw)": 2.0266127586364746, "Pretrain/Step": 5695, "Pretrain/Step Time": 8.519707536324859} +{"Pretrain/Learning Rate": 1.84182017909002e-05, "Pretrain/Loss": 2.042038917541504, "Pretrain/Loss (Raw)": 2.169764518737793, "Pretrain/Step": 5696, "Pretrain/Step Time": 8.51967617124319} +{"Pretrain/Learning Rate": 1.841001180603295e-05, "Pretrain/Loss": 2.0421130657196045, "Pretrain/Loss (Raw)": 1.993316411972046, "Pretrain/Step": 5697, "Pretrain/Step Time": 8.514475742354989} +{"Pretrain/Learning Rate": 1.8401822581154188e-05, "Pretrain/Loss": 2.0422959327697754, "Pretrain/Loss (Raw)": 2.0341718196868896, "Pretrain/Step": 5698, "Pretrain/Step Time": 8.514875747263432} +{"Pretrain/Learning Rate": 1.8393634117208343e-05, "Pretrain/Loss": 2.0401291847229004, "Pretrain/Loss (Raw)": 1.7335777282714844, "Pretrain/Step": 5699, "Pretrain/Step Time": 8.51158395037055} +{"Pretrain/Learning Rate": 1.838544641513973e-05, "Pretrain/Loss": 2.0401611328125, "Pretrain/Loss (Raw)": 2.1130692958831787, "Pretrain/Step": 5700, "Pretrain/Step Time": 8.51543884165585} +{"Pretrain/Learning Rate": 1.8377259475892612e-05, "Pretrain/Loss": 2.0409035682678223, "Pretrain/Loss (Raw)": 2.0078961849212646, "Pretrain/Step": 5701, "Pretrain/Step Time": 8.5168098770082} +{"Pretrain/Learning Rate": 1.8369073300411137e-05, "Pretrain/Loss": 2.0386962890625, "Pretrain/Loss (Raw)": 1.8596643209457397, "Pretrain/Step": 5702, "Pretrain/Step Time": 8.516714930534363} +{"Pretrain/Learning Rate": 1.836088788963938e-05, "Pretrain/Loss": 2.0358469486236572, "Pretrain/Loss (Raw)": 1.758489727973938, "Pretrain/Step": 5703, "Pretrain/Step Time": 8.508396476507187} +{"Pretrain/Learning Rate": 1.8352703244521308e-05, "Pretrain/Loss": 2.0377249717712402, "Pretrain/Loss (Raw)": 2.068697452545166, "Pretrain/Step": 5704, "Pretrain/Step Time": 8.506395697593689} +{"Pretrain/Learning Rate": 1.8344519366000828e-05, "Pretrain/Loss": 2.035741090774536, "Pretrain/Loss (Raw)": 1.9743373394012451, "Pretrain/Step": 5705, "Pretrain/Step Time": 8.505029007792473} +{"Pretrain/Learning Rate": 1.833633625502173e-05, "Pretrain/Loss": 2.035168170928955, "Pretrain/Loss (Raw)": 2.0052475929260254, "Pretrain/Step": 5706, "Pretrain/Step Time": 8.503404015675187} +{"Pretrain/Learning Rate": 1.832815391252774e-05, "Pretrain/Loss": 2.0350356101989746, "Pretrain/Loss (Raw)": 2.037693977355957, "Pretrain/Step": 5707, "Pretrain/Step Time": 8.511108363047242} +{"Pretrain/Learning Rate": 1.8319972339462478e-05, "Pretrain/Loss": 2.036602258682251, "Pretrain/Loss (Raw)": 2.249643564224243, "Pretrain/Step": 5708, "Pretrain/Step Time": 8.516883432865143} +{"Pretrain/Learning Rate": 1.8311791536769483e-05, "Pretrain/Loss": 2.0347700119018555, "Pretrain/Loss (Raw)": 1.837913990020752, "Pretrain/Step": 5709, "Pretrain/Step Time": 8.50615925528109} +{"Pretrain/Learning Rate": 1.8303611505392205e-05, "Pretrain/Loss": 2.0371570587158203, "Pretrain/Loss (Raw)": 2.2613580226898193, "Pretrain/Step": 5710, "Pretrain/Step Time": 8.50071938894689} +{"Pretrain/Learning Rate": 1.8295432246274e-05, "Pretrain/Loss": 2.037933349609375, "Pretrain/Loss (Raw)": 2.137489080429077, "Pretrain/Step": 5711, "Pretrain/Step Time": 8.498246598988771} +{"Pretrain/Learning Rate": 1.828725376035814e-05, "Pretrain/Loss": 2.038270950317383, "Pretrain/Loss (Raw)": 2.026808261871338, "Pretrain/Step": 5712, "Pretrain/Step Time": 8.51126372627914} +{"Pretrain/Learning Rate": 1.827907604858782e-05, "Pretrain/Loss": 2.0362985134124756, "Pretrain/Loss (Raw)": 1.6115939617156982, "Pretrain/Step": 5713, "Pretrain/Step Time": 8.514103392139077} +{"Pretrain/Learning Rate": 1.8270899111906102e-05, "Pretrain/Loss": 2.0388922691345215, "Pretrain/Loss (Raw)": 2.2057206630706787, "Pretrain/Step": 5714, "Pretrain/Step Time": 8.518052129074931} +{"Pretrain/Learning Rate": 1.826272295125602e-05, "Pretrain/Loss": 2.036865234375, "Pretrain/Loss (Raw)": 1.9285905361175537, "Pretrain/Step": 5715, "Pretrain/Step Time": 8.515278972685337} +{"Pretrain/Learning Rate": 1.8254547567580472e-05, "Pretrain/Loss": 2.041167736053467, "Pretrain/Loss (Raw)": 2.065009593963623, "Pretrain/Step": 5716, "Pretrain/Step Time": 8.51119695045054} +{"Pretrain/Learning Rate": 1.824637296182228e-05, "Pretrain/Loss": 2.042931079864502, "Pretrain/Loss (Raw)": 2.0242457389831543, "Pretrain/Step": 5717, "Pretrain/Step Time": 8.514644926413894} +{"Pretrain/Learning Rate": 1.8238199134924185e-05, "Pretrain/Loss": 2.0442166328430176, "Pretrain/Loss (Raw)": 2.156928539276123, "Pretrain/Step": 5718, "Pretrain/Step Time": 8.524591818451881} +{"Pretrain/Learning Rate": 1.8230026087828824e-05, "Pretrain/Loss": 2.0431265830993652, "Pretrain/Loss (Raw)": 1.830227255821228, "Pretrain/Step": 5719, "Pretrain/Step Time": 8.526601929217577} +{"Pretrain/Learning Rate": 1.8221853821478763e-05, "Pretrain/Loss": 2.044633626937866, "Pretrain/Loss (Raw)": 1.98250150680542, "Pretrain/Step": 5720, "Pretrain/Step Time": 8.523917559534311} +{"Pretrain/Learning Rate": 1.821368233681645e-05, "Pretrain/Loss": 2.045680284500122, "Pretrain/Loss (Raw)": 2.0757968425750732, "Pretrain/Step": 5721, "Pretrain/Step Time": 8.517823960632086} +{"Pretrain/Learning Rate": 1.820551163478428e-05, "Pretrain/Loss": 2.0455739498138428, "Pretrain/Loss (Raw)": 2.019361734390259, "Pretrain/Step": 5722, "Pretrain/Step Time": 8.509012566879392} +{"Pretrain/Learning Rate": 1.8197341716324516e-05, "Pretrain/Loss": 2.0458459854125977, "Pretrain/Loss (Raw)": 2.114182949066162, "Pretrain/Step": 5723, "Pretrain/Step Time": 8.514691706746817} +{"Pretrain/Learning Rate": 1.8189172582379365e-05, "Pretrain/Loss": 2.044079303741455, "Pretrain/Loss (Raw)": 2.0106091499328613, "Pretrain/Step": 5724, "Pretrain/Step Time": 8.513205962255597} +{"Pretrain/Learning Rate": 1.818100423389092e-05, "Pretrain/Loss": 2.043018341064453, "Pretrain/Loss (Raw)": 2.026880979537964, "Pretrain/Step": 5725, "Pretrain/Step Time": 8.514121996238828} +{"Pretrain/Learning Rate": 1.817283667180121e-05, "Pretrain/Loss": 2.0430421829223633, "Pretrain/Loss (Raw)": 2.0158276557922363, "Pretrain/Step": 5726, "Pretrain/Step Time": 8.512717250734568} +{"Pretrain/Learning Rate": 1.8164669897052134e-05, "Pretrain/Loss": 2.041621208190918, "Pretrain/Loss (Raw)": 2.011225461959839, "Pretrain/Step": 5727, "Pretrain/Step Time": 8.508767345920205} +{"Pretrain/Learning Rate": 1.8156503910585544e-05, "Pretrain/Loss": 2.042785167694092, "Pretrain/Loss (Raw)": 2.0430691242218018, "Pretrain/Step": 5728, "Pretrain/Step Time": 8.495084529742599} +{"Pretrain/Learning Rate": 1.814833871334316e-05, "Pretrain/Loss": 2.0434417724609375, "Pretrain/Loss (Raw)": 1.994597315788269, "Pretrain/Step": 5729, "Pretrain/Step Time": 8.496387409046292} +{"Pretrain/Learning Rate": 1.8140174306266655e-05, "Pretrain/Loss": 2.040510654449463, "Pretrain/Loss (Raw)": 1.886595606803894, "Pretrain/Step": 5730, "Pretrain/Step Time": 8.498639907687902} +{"Pretrain/Learning Rate": 1.8132010690297557e-05, "Pretrain/Loss": 2.0401575565338135, "Pretrain/Loss (Raw)": 1.983649730682373, "Pretrain/Step": 5731, "Pretrain/Step Time": 8.509606517851353} +{"Pretrain/Learning Rate": 1.8123847866377367e-05, "Pretrain/Loss": 2.0392208099365234, "Pretrain/Loss (Raw)": 1.9435558319091797, "Pretrain/Step": 5732, "Pretrain/Step Time": 8.51165803335607} +{"Pretrain/Learning Rate": 1.8115685835447423e-05, "Pretrain/Loss": 2.0413920879364014, "Pretrain/Loss (Raw)": 2.143598794937134, "Pretrain/Step": 5733, "Pretrain/Step Time": 8.50970091111958} +{"Pretrain/Learning Rate": 1.810752459844905e-05, "Pretrain/Loss": 2.042625904083252, "Pretrain/Loss (Raw)": 2.1153669357299805, "Pretrain/Step": 5734, "Pretrain/Step Time": 8.499133488163352} +{"Pretrain/Learning Rate": 1.8099364156323396e-05, "Pretrain/Loss": 2.0429553985595703, "Pretrain/Loss (Raw)": 2.0657236576080322, "Pretrain/Step": 5735, "Pretrain/Step Time": 8.500488048419356} +{"Pretrain/Learning Rate": 1.8091204510011607e-05, "Pretrain/Loss": 2.045135974884033, "Pretrain/Loss (Raw)": 2.0996322631835938, "Pretrain/Step": 5736, "Pretrain/Step Time": 8.513204393908381} +{"Pretrain/Learning Rate": 1.8083045660454655e-05, "Pretrain/Loss": 2.0427968502044678, "Pretrain/Loss (Raw)": 1.8673208951950073, "Pretrain/Step": 5737, "Pretrain/Step Time": 8.517103971913457} +{"Pretrain/Learning Rate": 1.8074887608593477e-05, "Pretrain/Loss": 2.043104648590088, "Pretrain/Loss (Raw)": 2.022379159927368, "Pretrain/Step": 5738, "Pretrain/Step Time": 8.517696617171168} +{"Pretrain/Learning Rate": 1.8066730355368888e-05, "Pretrain/Loss": 2.044419527053833, "Pretrain/Loss (Raw)": 2.1972553730010986, "Pretrain/Step": 5739, "Pretrain/Step Time": 8.513191984966397} +{"Pretrain/Learning Rate": 1.805857390172163e-05, "Pretrain/Loss": 2.0449297428131104, "Pretrain/Loss (Raw)": 2.081301212310791, "Pretrain/Step": 5740, "Pretrain/Step Time": 8.514065271243453} +{"Pretrain/Learning Rate": 1.8050418248592334e-05, "Pretrain/Loss": 2.042642831802368, "Pretrain/Loss (Raw)": 1.7287535667419434, "Pretrain/Step": 5741, "Pretrain/Step Time": 8.51716367341578} +{"Pretrain/Learning Rate": 1.8042263396921554e-05, "Pretrain/Loss": 2.041649341583252, "Pretrain/Loss (Raw)": 1.9651682376861572, "Pretrain/Step": 5742, "Pretrain/Step Time": 8.513597909361124} +{"Pretrain/Learning Rate": 1.803410934764974e-05, "Pretrain/Loss": 2.0430636405944824, "Pretrain/Loss (Raw)": 2.2023394107818604, "Pretrain/Step": 5743, "Pretrain/Step Time": 8.516794312745333} +{"Pretrain/Learning Rate": 1.8025956101717272e-05, "Pretrain/Loss": 2.0436806678771973, "Pretrain/Loss (Raw)": 2.1887452602386475, "Pretrain/Step": 5744, "Pretrain/Step Time": 8.51320094242692} +{"Pretrain/Learning Rate": 1.80178036600644e-05, "Pretrain/Loss": 2.043200969696045, "Pretrain/Loss (Raw)": 1.940207839012146, "Pretrain/Step": 5745, "Pretrain/Step Time": 8.511599013581872} +{"Pretrain/Learning Rate": 1.8009652023631318e-05, "Pretrain/Loss": 2.0420351028442383, "Pretrain/Loss (Raw)": 2.0614120960235596, "Pretrain/Step": 5746, "Pretrain/Step Time": 8.499255722388625} +{"Pretrain/Learning Rate": 1.8001501193358096e-05, "Pretrain/Loss": 2.0429277420043945, "Pretrain/Loss (Raw)": 2.0954782962799072, "Pretrain/Step": 5747, "Pretrain/Step Time": 8.50243590399623} +{"Pretrain/Learning Rate": 1.799335117018474e-05, "Pretrain/Loss": 2.042367458343506, "Pretrain/Loss (Raw)": 1.8596582412719727, "Pretrain/Step": 5748, "Pretrain/Step Time": 8.50946343690157} +{"Pretrain/Learning Rate": 1.798520195505114e-05, "Pretrain/Loss": 2.0410633087158203, "Pretrain/Loss (Raw)": 1.9589885473251343, "Pretrain/Step": 5749, "Pretrain/Step Time": 8.5133002307266} +{"Pretrain/Learning Rate": 1.7977053548897112e-05, "Pretrain/Loss": 2.042013168334961, "Pretrain/Loss (Raw)": 1.8469007015228271, "Pretrain/Step": 5750, "Pretrain/Step Time": 8.519061109051108} +{"Pretrain/Learning Rate": 1.7968905952662354e-05, "Pretrain/Loss": 2.0357956886291504, "Pretrain/Loss (Raw)": 1.779549241065979, "Pretrain/Step": 5751, "Pretrain/Step Time": 8.51608968526125} +{"Pretrain/Learning Rate": 1.79607591672865e-05, "Pretrain/Loss": 2.0400948524475098, "Pretrain/Loss (Raw)": 2.492601156234741, "Pretrain/Step": 5752, "Pretrain/Step Time": 8.508396165445447} +{"Pretrain/Learning Rate": 1.7952613193709063e-05, "Pretrain/Loss": 2.038214683532715, "Pretrain/Loss (Raw)": 1.7952311038970947, "Pretrain/Step": 5753, "Pretrain/Step Time": 8.507117036730051} +{"Pretrain/Learning Rate": 1.7944468032869486e-05, "Pretrain/Loss": 2.0375466346740723, "Pretrain/Loss (Raw)": 2.066061019897461, "Pretrain/Step": 5754, "Pretrain/Step Time": 8.509765537455678} +{"Pretrain/Learning Rate": 1.7936323685707095e-05, "Pretrain/Loss": 2.040268898010254, "Pretrain/Loss (Raw)": 2.3063809871673584, "Pretrain/Step": 5755, "Pretrain/Step Time": 8.522226680070162} +{"Pretrain/Learning Rate": 1.7928180153161146e-05, "Pretrain/Loss": 2.0390939712524414, "Pretrain/Loss (Raw)": 1.8788387775421143, "Pretrain/Step": 5756, "Pretrain/Step Time": 8.528693867847323} +{"Pretrain/Learning Rate": 1.792003743617079e-05, "Pretrain/Loss": 2.0383870601654053, "Pretrain/Loss (Raw)": 2.011734962463379, "Pretrain/Step": 5757, "Pretrain/Step Time": 8.525658637285233} +{"Pretrain/Learning Rate": 1.7911895535675067e-05, "Pretrain/Loss": 2.037768602371216, "Pretrain/Loss (Raw)": 1.940664291381836, "Pretrain/Step": 5758, "Pretrain/Step Time": 8.524172250181437} +{"Pretrain/Learning Rate": 1.7903754452612964e-05, "Pretrain/Loss": 2.0374207496643066, "Pretrain/Loss (Raw)": 2.1148617267608643, "Pretrain/Step": 5759, "Pretrain/Step Time": 8.516180600970984} +{"Pretrain/Learning Rate": 1.7895614187923326e-05, "Pretrain/Loss": 2.037327766418457, "Pretrain/Loss (Raw)": 1.9863547086715698, "Pretrain/Step": 5760, "Pretrain/Step Time": 8.519964361563325} +{"Pretrain/Learning Rate": 1.7887474742544945e-05, "Pretrain/Loss": 2.0378692150115967, "Pretrain/Loss (Raw)": 2.0003504753112793, "Pretrain/Step": 5761, "Pretrain/Step Time": 8.524506315588951} +{"Pretrain/Learning Rate": 1.7879336117416485e-05, "Pretrain/Loss": 2.0372142791748047, "Pretrain/Loss (Raw)": 1.9279348850250244, "Pretrain/Step": 5762, "Pretrain/Step Time": 8.526143938302994} +{"Pretrain/Learning Rate": 1.7871198313476544e-05, "Pretrain/Loss": 2.034395217895508, "Pretrain/Loss (Raw)": 2.069976568222046, "Pretrain/Step": 5763, "Pretrain/Step Time": 8.518585957586765} +{"Pretrain/Learning Rate": 1.78630613316636e-05, "Pretrain/Loss": 2.0331950187683105, "Pretrain/Loss (Raw)": 1.9917833805084229, "Pretrain/Step": 5764, "Pretrain/Step Time": 8.508064633235335} +{"Pretrain/Learning Rate": 1.785492517291606e-05, "Pretrain/Loss": 2.033149242401123, "Pretrain/Loss (Raw)": 2.0387909412384033, "Pretrain/Step": 5765, "Pretrain/Step Time": 8.50305176153779} +{"Pretrain/Learning Rate": 1.784678983817221e-05, "Pretrain/Loss": 2.0340423583984375, "Pretrain/Loss (Raw)": 2.0568430423736572, "Pretrain/Step": 5766, "Pretrain/Step Time": 8.513487378135324} +{"Pretrain/Learning Rate": 1.783865532837027e-05, "Pretrain/Loss": 2.0311946868896484, "Pretrain/Loss (Raw)": 1.8338850736618042, "Pretrain/Step": 5767, "Pretrain/Step Time": 8.515781041234732} +{"Pretrain/Learning Rate": 1.7830521644448334e-05, "Pretrain/Loss": 2.029294013977051, "Pretrain/Loss (Raw)": 1.9908678531646729, "Pretrain/Step": 5768, "Pretrain/Step Time": 8.515561942011118} +{"Pretrain/Learning Rate": 1.7822388787344434e-05, "Pretrain/Loss": 2.0285468101501465, "Pretrain/Loss (Raw)": 1.8900015354156494, "Pretrain/Step": 5769, "Pretrain/Step Time": 8.51430575735867} +{"Pretrain/Learning Rate": 1.781425675799648e-05, "Pretrain/Loss": 2.029323101043701, "Pretrain/Loss (Raw)": 2.110454559326172, "Pretrain/Step": 5770, "Pretrain/Step Time": 8.511582862585783} +{"Pretrain/Learning Rate": 1.7806125557342303e-05, "Pretrain/Loss": 2.0305042266845703, "Pretrain/Loss (Raw)": 2.0487139225006104, "Pretrain/Step": 5771, "Pretrain/Step Time": 8.520922223106027} +{"Pretrain/Learning Rate": 1.7797995186319606e-05, "Pretrain/Loss": 2.026477813720703, "Pretrain/Loss (Raw)": 1.9157543182373047, "Pretrain/Step": 5772, "Pretrain/Step Time": 8.519362196326256} +{"Pretrain/Learning Rate": 1.778986564586606e-05, "Pretrain/Loss": 2.0264623165130615, "Pretrain/Loss (Raw)": 2.008551836013794, "Pretrain/Step": 5773, "Pretrain/Step Time": 8.523754296824336} +{"Pretrain/Learning Rate": 1.778173693691917e-05, "Pretrain/Loss": 2.023988962173462, "Pretrain/Loss (Raw)": 1.9100797176361084, "Pretrain/Step": 5774, "Pretrain/Step Time": 8.516461266204715} +{"Pretrain/Learning Rate": 1.77736090604164e-05, "Pretrain/Loss": 2.0254361629486084, "Pretrain/Loss (Raw)": 2.2760872840881348, "Pretrain/Step": 5775, "Pretrain/Step Time": 8.515878312289715} +{"Pretrain/Learning Rate": 1.7765482017295077e-05, "Pretrain/Loss": 2.022770404815674, "Pretrain/Loss (Raw)": 2.05243182182312, "Pretrain/Step": 5776, "Pretrain/Step Time": 8.518353320658207} +{"Pretrain/Learning Rate": 1.7757355808492468e-05, "Pretrain/Loss": 2.0201029777526855, "Pretrain/Loss (Raw)": 1.7895770072937012, "Pretrain/Step": 5777, "Pretrain/Step Time": 8.522777846083045} +{"Pretrain/Learning Rate": 1.77492304349457e-05, "Pretrain/Loss": 2.0236635208129883, "Pretrain/Loss (Raw)": 2.4511289596557617, "Pretrain/Step": 5778, "Pretrain/Step Time": 8.523805100470781} +{"Pretrain/Learning Rate": 1.7741105897591865e-05, "Pretrain/Loss": 2.024829626083374, "Pretrain/Loss (Raw)": 2.11342453956604, "Pretrain/Step": 5779, "Pretrain/Step Time": 8.524660931900144} +{"Pretrain/Learning Rate": 1.7732982197367888e-05, "Pretrain/Loss": 2.0242037773132324, "Pretrain/Loss (Raw)": 2.0034663677215576, "Pretrain/Step": 5780, "Pretrain/Step Time": 8.522923672571778} +{"Pretrain/Learning Rate": 1.7724859335210654e-05, "Pretrain/Loss": 2.023454189300537, "Pretrain/Loss (Raw)": 2.0148658752441406, "Pretrain/Step": 5781, "Pretrain/Step Time": 8.516375429928303} +{"Pretrain/Learning Rate": 1.771673731205692e-05, "Pretrain/Loss": 2.022581100463867, "Pretrain/Loss (Raw)": 2.0430259704589844, "Pretrain/Step": 5782, "Pretrain/Step Time": 8.52105974033475} +{"Pretrain/Learning Rate": 1.770861612884336e-05, "Pretrain/Loss": 2.022510051727295, "Pretrain/Loss (Raw)": 2.119441032409668, "Pretrain/Step": 5783, "Pretrain/Step Time": 8.518239943310618} +{"Pretrain/Learning Rate": 1.7700495786506545e-05, "Pretrain/Loss": 2.0205063819885254, "Pretrain/Loss (Raw)": 2.007847309112549, "Pretrain/Step": 5784, "Pretrain/Step Time": 8.518898766487837} +{"Pretrain/Learning Rate": 1.7692376285982953e-05, "Pretrain/Loss": 2.019552707672119, "Pretrain/Loss (Raw)": 1.7705143690109253, "Pretrain/Step": 5785, "Pretrain/Step Time": 8.514868484809995} +{"Pretrain/Learning Rate": 1.768425762820896e-05, "Pretrain/Loss": 2.022606134414673, "Pretrain/Loss (Raw)": 1.9587761163711548, "Pretrain/Step": 5786, "Pretrain/Step Time": 8.515199434012175} +{"Pretrain/Learning Rate": 1.7676139814120857e-05, "Pretrain/Loss": 2.0223288536071777, "Pretrain/Loss (Raw)": 2.0447511672973633, "Pretrain/Step": 5787, "Pretrain/Step Time": 8.509742815047503} +{"Pretrain/Learning Rate": 1.7668022844654812e-05, "Pretrain/Loss": 2.019423007965088, "Pretrain/Loss (Raw)": 1.7815779447555542, "Pretrain/Step": 5788, "Pretrain/Step Time": 8.509050043299794} +{"Pretrain/Learning Rate": 1.765990672074693e-05, "Pretrain/Loss": 2.0165464878082275, "Pretrain/Loss (Raw)": 1.7142232656478882, "Pretrain/Step": 5789, "Pretrain/Step Time": 8.507465554401278} +{"Pretrain/Learning Rate": 1.7651791443333187e-05, "Pretrain/Loss": 2.0149364471435547, "Pretrain/Loss (Raw)": 2.0129151344299316, "Pretrain/Step": 5790, "Pretrain/Step Time": 8.518687579780817} +{"Pretrain/Learning Rate": 1.764367701334949e-05, "Pretrain/Loss": 2.015023708343506, "Pretrain/Loss (Raw)": 2.0853450298309326, "Pretrain/Step": 5791, "Pretrain/Step Time": 8.521105719730258} +{"Pretrain/Learning Rate": 1.7635563431731612e-05, "Pretrain/Loss": 2.014829635620117, "Pretrain/Loss (Raw)": 1.9957122802734375, "Pretrain/Step": 5792, "Pretrain/Step Time": 8.515854068100452} +{"Pretrain/Learning Rate": 1.762745069941527e-05, "Pretrain/Loss": 2.014199733734131, "Pretrain/Loss (Raw)": 2.0087549686431885, "Pretrain/Step": 5793, "Pretrain/Step Time": 8.51423604413867} +{"Pretrain/Learning Rate": 1.7619338817336046e-05, "Pretrain/Loss": 2.0129876136779785, "Pretrain/Loss (Raw)": 1.8644952774047852, "Pretrain/Step": 5794, "Pretrain/Step Time": 8.512749895453453} +{"Pretrain/Learning Rate": 1.7611227786429457e-05, "Pretrain/Loss": 2.0103142261505127, "Pretrain/Loss (Raw)": 1.9319080114364624, "Pretrain/Step": 5795, "Pretrain/Step Time": 8.518271388486028} +{"Pretrain/Learning Rate": 1.7603117607630893e-05, "Pretrain/Loss": 2.0088915824890137, "Pretrain/Loss (Raw)": 1.9654481410980225, "Pretrain/Step": 5796, "Pretrain/Step Time": 8.522259583696723} +{"Pretrain/Learning Rate": 1.7595008281875657e-05, "Pretrain/Loss": 2.007398843765259, "Pretrain/Loss (Raw)": 1.945205807685852, "Pretrain/Step": 5797, "Pretrain/Step Time": 8.525112697854638} +{"Pretrain/Learning Rate": 1.7586899810098967e-05, "Pretrain/Loss": 2.0088469982147217, "Pretrain/Loss (Raw)": 2.1189000606536865, "Pretrain/Step": 5798, "Pretrain/Step Time": 8.52214889228344} +{"Pretrain/Learning Rate": 1.757879219323592e-05, "Pretrain/Loss": 2.0095577239990234, "Pretrain/Loss (Raw)": 2.1982576847076416, "Pretrain/Step": 5799, "Pretrain/Step Time": 8.52184802852571} +{"Pretrain/Learning Rate": 1.757068543222153e-05, "Pretrain/Loss": 2.014296531677246, "Pretrain/Loss (Raw)": 2.417090892791748, "Pretrain/Step": 5800, "Pretrain/Step Time": 8.514684654772282} +{"Pretrain/Learning Rate": 1.7562579527990696e-05, "Pretrain/Loss": 2.013199806213379, "Pretrain/Loss (Raw)": 1.9878638982772827, "Pretrain/Step": 5801, "Pretrain/Step Time": 8.515193546190858} +{"Pretrain/Learning Rate": 1.7554474481478245e-05, "Pretrain/Loss": 2.015474319458008, "Pretrain/Loss (Raw)": 2.1057183742523193, "Pretrain/Step": 5802, "Pretrain/Step Time": 8.51435268111527} +{"Pretrain/Learning Rate": 1.7546370293618875e-05, "Pretrain/Loss": 2.0161430835723877, "Pretrain/Loss (Raw)": 2.063875675201416, "Pretrain/Step": 5803, "Pretrain/Step Time": 8.51075224392116} +{"Pretrain/Learning Rate": 1.7538266965347212e-05, "Pretrain/Loss": 2.0152101516723633, "Pretrain/Loss (Raw)": 1.9600512981414795, "Pretrain/Step": 5804, "Pretrain/Step Time": 8.512663250789046} +{"Pretrain/Learning Rate": 1.7530164497597757e-05, "Pretrain/Loss": 2.0128626823425293, "Pretrain/Loss (Raw)": 1.897246241569519, "Pretrain/Step": 5805, "Pretrain/Step Time": 8.503315949812531} +{"Pretrain/Learning Rate": 1.7522062891304936e-05, "Pretrain/Loss": 2.0138065814971924, "Pretrain/Loss (Raw)": 2.026045083999634, "Pretrain/Step": 5806, "Pretrain/Step Time": 8.504570562392473} +{"Pretrain/Learning Rate": 1.7513962147403057e-05, "Pretrain/Loss": 2.0141749382019043, "Pretrain/Loss (Raw)": 1.9667397737503052, "Pretrain/Step": 5807, "Pretrain/Step Time": 8.502649273723364} +{"Pretrain/Learning Rate": 1.750586226682634e-05, "Pretrain/Loss": 2.0135419368743896, "Pretrain/Loss (Raw)": 2.0437209606170654, "Pretrain/Step": 5808, "Pretrain/Step Time": 8.510831767693162} +{"Pretrain/Learning Rate": 1.74977632505089e-05, "Pretrain/Loss": 2.0142974853515625, "Pretrain/Loss (Raw)": 2.0992560386657715, "Pretrain/Step": 5809, "Pretrain/Step Time": 8.517610164359212} +{"Pretrain/Learning Rate": 1.7489665099384755e-05, "Pretrain/Loss": 2.0152740478515625, "Pretrain/Loss (Raw)": 2.031226873397827, "Pretrain/Step": 5810, "Pretrain/Step Time": 8.51411448046565} +{"Pretrain/Learning Rate": 1.7481567814387815e-05, "Pretrain/Loss": 2.0147545337677, "Pretrain/Loss (Raw)": 2.023136615753174, "Pretrain/Step": 5811, "Pretrain/Step Time": 8.501043966040015} +{"Pretrain/Learning Rate": 1.7473471396451913e-05, "Pretrain/Loss": 2.0156798362731934, "Pretrain/Loss (Raw)": 2.162557363510132, "Pretrain/Step": 5812, "Pretrain/Step Time": 8.508444448933005} +{"Pretrain/Learning Rate": 1.746537584651074e-05, "Pretrain/Loss": 2.0141654014587402, "Pretrain/Loss (Raw)": 1.9703103303909302, "Pretrain/Step": 5813, "Pretrain/Step Time": 8.509216574952006} +{"Pretrain/Learning Rate": 1.7457281165497947e-05, "Pretrain/Loss": 2.014420509338379, "Pretrain/Loss (Raw)": 2.062328815460205, "Pretrain/Step": 5814, "Pretrain/Step Time": 8.513844741508365} +{"Pretrain/Learning Rate": 1.7449187354347014e-05, "Pretrain/Loss": 2.016702651977539, "Pretrain/Loss (Raw)": 2.065249443054199, "Pretrain/Step": 5815, "Pretrain/Step Time": 8.513905126601458} +{"Pretrain/Learning Rate": 1.7441094413991393e-05, "Pretrain/Loss": 2.017426013946533, "Pretrain/Loss (Raw)": 1.9552770853042603, "Pretrain/Step": 5816, "Pretrain/Step Time": 8.512017758563161} +{"Pretrain/Learning Rate": 1.7433002345364368e-05, "Pretrain/Loss": 2.0164976119995117, "Pretrain/Loss (Raw)": 1.8976085186004639, "Pretrain/Step": 5817, "Pretrain/Step Time": 8.50207263790071} +{"Pretrain/Learning Rate": 1.7424911149399183e-05, "Pretrain/Loss": 2.018209934234619, "Pretrain/Loss (Raw)": 2.2298333644866943, "Pretrain/Step": 5818, "Pretrain/Step Time": 8.50488911755383} +{"Pretrain/Learning Rate": 1.7416820827028926e-05, "Pretrain/Loss": 2.0183160305023193, "Pretrain/Loss (Raw)": 2.1412928104400635, "Pretrain/Step": 5819, "Pretrain/Step Time": 8.510174080729485} +{"Pretrain/Learning Rate": 1.7408731379186638e-05, "Pretrain/Loss": 2.0171077251434326, "Pretrain/Loss (Raw)": 1.8686466217041016, "Pretrain/Step": 5820, "Pretrain/Step Time": 8.5102856811136} +{"Pretrain/Learning Rate": 1.740064280680521e-05, "Pretrain/Loss": 2.018312931060791, "Pretrain/Loss (Raw)": 2.2229042053222656, "Pretrain/Step": 5821, "Pretrain/Step Time": 8.505569107830524} +{"Pretrain/Learning Rate": 1.7392555110817467e-05, "Pretrain/Loss": 2.017354726791382, "Pretrain/Loss (Raw)": 1.9229286909103394, "Pretrain/Step": 5822, "Pretrain/Step Time": 8.504323333501816} +{"Pretrain/Learning Rate": 1.738446829215611e-05, "Pretrain/Loss": 2.0178043842315674, "Pretrain/Loss (Raw)": 2.0841622352600098, "Pretrain/Step": 5823, "Pretrain/Step Time": 8.507707845419645} +{"Pretrain/Learning Rate": 1.737638235175376e-05, "Pretrain/Loss": 2.0163793563842773, "Pretrain/Loss (Raw)": 1.987345576286316, "Pretrain/Step": 5824, "Pretrain/Step Time": 8.51313135959208} +{"Pretrain/Learning Rate": 1.736829729054292e-05, "Pretrain/Loss": 2.0173840522766113, "Pretrain/Loss (Raw)": 2.121938467025757, "Pretrain/Step": 5825, "Pretrain/Step Time": 8.519813256338239} +{"Pretrain/Learning Rate": 1.7360213109456e-05, "Pretrain/Loss": 2.0147454738616943, "Pretrain/Loss (Raw)": 1.6964280605316162, "Pretrain/Step": 5826, "Pretrain/Step Time": 8.518205486238003} +{"Pretrain/Learning Rate": 1.73521298094253e-05, "Pretrain/Loss": 2.020049571990967, "Pretrain/Loss (Raw)": 2.4125211238861084, "Pretrain/Step": 5827, "Pretrain/Step Time": 8.519138922914863} +{"Pretrain/Learning Rate": 1.734404739138303e-05, "Pretrain/Loss": 2.0176570415496826, "Pretrain/Loss (Raw)": 1.8067994117736816, "Pretrain/Step": 5828, "Pretrain/Step Time": 8.515647277235985} +{"Pretrain/Learning Rate": 1.733596585626129e-05, "Pretrain/Loss": 2.016753673553467, "Pretrain/Loss (Raw)": 1.892268180847168, "Pretrain/Step": 5829, "Pretrain/Step Time": 8.510144846513867} +{"Pretrain/Learning Rate": 1.7327885204992083e-05, "Pretrain/Loss": 2.019228935241699, "Pretrain/Loss (Raw)": 2.176499605178833, "Pretrain/Step": 5830, "Pretrain/Step Time": 8.512264057993889} +{"Pretrain/Learning Rate": 1.7319805438507303e-05, "Pretrain/Loss": 2.0219531059265137, "Pretrain/Loss (Raw)": 2.107177495956421, "Pretrain/Step": 5831, "Pretrain/Step Time": 8.519257167354226} +{"Pretrain/Learning Rate": 1.7311726557738754e-05, "Pretrain/Loss": 2.0221381187438965, "Pretrain/Loss (Raw)": 2.0924017429351807, "Pretrain/Step": 5832, "Pretrain/Step Time": 8.519015830010176} +{"Pretrain/Learning Rate": 1.7303648563618125e-05, "Pretrain/Loss": 2.0262222290039062, "Pretrain/Loss (Raw)": 2.497112989425659, "Pretrain/Step": 5833, "Pretrain/Step Time": 8.523058148100972} +{"Pretrain/Learning Rate": 1.7295571457077015e-05, "Pretrain/Loss": 2.0254764556884766, "Pretrain/Loss (Raw)": 1.909785270690918, "Pretrain/Step": 5834, "Pretrain/Step Time": 8.524708032608032} +{"Pretrain/Learning Rate": 1.72874952390469e-05, "Pretrain/Loss": 2.026095390319824, "Pretrain/Loss (Raw)": 2.1169002056121826, "Pretrain/Step": 5835, "Pretrain/Step Time": 8.517356967553496} +{"Pretrain/Learning Rate": 1.7279419910459182e-05, "Pretrain/Loss": 2.0253500938415527, "Pretrain/Loss (Raw)": 2.154249906539917, "Pretrain/Step": 5836, "Pretrain/Step Time": 8.511940063908696} +{"Pretrain/Learning Rate": 1.727134547224514e-05, "Pretrain/Loss": 2.0262162685394287, "Pretrain/Loss (Raw)": 1.9487730264663696, "Pretrain/Step": 5837, "Pretrain/Step Time": 8.519907927140594} +{"Pretrain/Learning Rate": 1.726327192533595e-05, "Pretrain/Loss": 2.0233209133148193, "Pretrain/Loss (Raw)": 1.8907727003097534, "Pretrain/Step": 5838, "Pretrain/Step Time": 8.518783321604133} +{"Pretrain/Learning Rate": 1.7255199270662708e-05, "Pretrain/Loss": 2.022754430770874, "Pretrain/Loss (Raw)": 2.064969539642334, "Pretrain/Step": 5839, "Pretrain/Step Time": 8.521519284695387} +{"Pretrain/Learning Rate": 1.7247127509156377e-05, "Pretrain/Loss": 2.0245790481567383, "Pretrain/Loss (Raw)": 2.2603535652160645, "Pretrain/Step": 5840, "Pretrain/Step Time": 8.511506652459502} +{"Pretrain/Learning Rate": 1.7239056641747836e-05, "Pretrain/Loss": 2.0269341468811035, "Pretrain/Loss (Raw)": 1.9130407571792603, "Pretrain/Step": 5841, "Pretrain/Step Time": 8.507180778309703} +{"Pretrain/Learning Rate": 1.723098666936785e-05, "Pretrain/Loss": 2.025520086288452, "Pretrain/Loss (Raw)": 2.0247316360473633, "Pretrain/Step": 5842, "Pretrain/Step Time": 8.50544343329966} +{"Pretrain/Learning Rate": 1.7222917592947096e-05, "Pretrain/Loss": 2.0266952514648438, "Pretrain/Loss (Raw)": 2.0790083408355713, "Pretrain/Step": 5843, "Pretrain/Step Time": 8.50845849700272} +{"Pretrain/Learning Rate": 1.7214849413416128e-05, "Pretrain/Loss": 2.0261402130126953, "Pretrain/Loss (Raw)": 1.9939645528793335, "Pretrain/Step": 5844, "Pretrain/Step Time": 8.516473691910505} +{"Pretrain/Learning Rate": 1.7206782131705414e-05, "Pretrain/Loss": 2.0279083251953125, "Pretrain/Loss (Raw)": 2.25054669380188, "Pretrain/Step": 5845, "Pretrain/Step Time": 8.517285527661443} +{"Pretrain/Learning Rate": 1.7198715748745304e-05, "Pretrain/Loss": 2.026839256286621, "Pretrain/Loss (Raw)": 2.020127296447754, "Pretrain/Step": 5846, "Pretrain/Step Time": 8.507262609899044} +{"Pretrain/Learning Rate": 1.7190650265466056e-05, "Pretrain/Loss": 2.0276856422424316, "Pretrain/Loss (Raw)": 1.9385405778884888, "Pretrain/Step": 5847, "Pretrain/Step Time": 8.51045298203826} +{"Pretrain/Learning Rate": 1.7182585682797815e-05, "Pretrain/Loss": 2.028282642364502, "Pretrain/Loss (Raw)": 2.0589122772216797, "Pretrain/Step": 5848, "Pretrain/Step Time": 8.512018779292703} +{"Pretrain/Learning Rate": 1.7174522001670633e-05, "Pretrain/Loss": 2.02830171585083, "Pretrain/Loss (Raw)": 2.078235387802124, "Pretrain/Step": 5849, "Pretrain/Step Time": 8.526565823704004} +{"Pretrain/Learning Rate": 1.7166459223014448e-05, "Pretrain/Loss": 2.0271148681640625, "Pretrain/Loss (Raw)": 1.8674815893173218, "Pretrain/Step": 5850, "Pretrain/Step Time": 8.527275513857603} +{"Pretrain/Learning Rate": 1.71583973477591e-05, "Pretrain/Loss": 2.0258779525756836, "Pretrain/Loss (Raw)": 1.9558168649673462, "Pretrain/Step": 5851, "Pretrain/Step Time": 8.517583083361387} +{"Pretrain/Learning Rate": 1.7150336376834315e-05, "Pretrain/Loss": 2.0268921852111816, "Pretrain/Loss (Raw)": 2.140427589416504, "Pretrain/Step": 5852, "Pretrain/Step Time": 8.515209892764688} +{"Pretrain/Learning Rate": 1.714227631116974e-05, "Pretrain/Loss": 2.026742696762085, "Pretrain/Loss (Raw)": 2.0077600479125977, "Pretrain/Step": 5853, "Pretrain/Step Time": 8.511392137035728} +{"Pretrain/Learning Rate": 1.7134217151694872e-05, "Pretrain/Loss": 2.0267510414123535, "Pretrain/Loss (Raw)": 2.016904354095459, "Pretrain/Step": 5854, "Pretrain/Step Time": 8.518997985869646} +{"Pretrain/Learning Rate": 1.7126158899339164e-05, "Pretrain/Loss": 2.0282280445098877, "Pretrain/Loss (Raw)": 2.200275421142578, "Pretrain/Step": 5855, "Pretrain/Step Time": 8.526558069512248} +{"Pretrain/Learning Rate": 1.7118101555031895e-05, "Pretrain/Loss": 2.0295164585113525, "Pretrain/Loss (Raw)": 2.2080001831054688, "Pretrain/Step": 5856, "Pretrain/Step Time": 8.527843087911606} +{"Pretrain/Learning Rate": 1.7110045119702314e-05, "Pretrain/Loss": 2.0286498069763184, "Pretrain/Loss (Raw)": 1.883654236793518, "Pretrain/Step": 5857, "Pretrain/Step Time": 8.527715353295207} +{"Pretrain/Learning Rate": 1.7101989594279495e-05, "Pretrain/Loss": 2.029426097869873, "Pretrain/Loss (Raw)": 1.985988736152649, "Pretrain/Step": 5858, "Pretrain/Step Time": 8.524855565279722} +{"Pretrain/Learning Rate": 1.7093934979692465e-05, "Pretrain/Loss": 2.0295403003692627, "Pretrain/Loss (Raw)": 1.9982572793960571, "Pretrain/Step": 5859, "Pretrain/Step Time": 8.516617201268673} +{"Pretrain/Learning Rate": 1.7085881276870093e-05, "Pretrain/Loss": 2.030116081237793, "Pretrain/Loss (Raw)": 2.0172371864318848, "Pretrain/Step": 5860, "Pretrain/Step Time": 8.515810502693057} +{"Pretrain/Learning Rate": 1.70778284867412e-05, "Pretrain/Loss": 2.0262653827667236, "Pretrain/Loss (Raw)": 1.6507009267807007, "Pretrain/Step": 5861, "Pretrain/Step Time": 8.514686811715364} +{"Pretrain/Learning Rate": 1.706977661023444e-05, "Pretrain/Loss": 2.025911331176758, "Pretrain/Loss (Raw)": 2.0700607299804688, "Pretrain/Step": 5862, "Pretrain/Step Time": 8.523310583084822} +{"Pretrain/Learning Rate": 1.7061725648278423e-05, "Pretrain/Loss": 2.025723934173584, "Pretrain/Loss (Raw)": 2.0417139530181885, "Pretrain/Step": 5863, "Pretrain/Step Time": 8.521298693493009} +{"Pretrain/Learning Rate": 1.7053675601801606e-05, "Pretrain/Loss": 2.0246171951293945, "Pretrain/Loss (Raw)": 1.9580159187316895, "Pretrain/Step": 5864, "Pretrain/Step Time": 8.507369574159384} +{"Pretrain/Learning Rate": 1.7045626471732363e-05, "Pretrain/Loss": 2.0255587100982666, "Pretrain/Loss (Raw)": 1.987801194190979, "Pretrain/Step": 5865, "Pretrain/Step Time": 8.504906935617328} +{"Pretrain/Learning Rate": 1.7037578258998956e-05, "Pretrain/Loss": 2.024073839187622, "Pretrain/Loss (Raw)": 1.8323352336883545, "Pretrain/Step": 5866, "Pretrain/Step Time": 8.512730216607451} +{"Pretrain/Learning Rate": 1.702953096452955e-05, "Pretrain/Loss": 2.022461175918579, "Pretrain/Loss (Raw)": 1.9908204078674316, "Pretrain/Step": 5867, "Pretrain/Step Time": 8.515169842168689} +{"Pretrain/Learning Rate": 1.702148458925218e-05, "Pretrain/Loss": 2.0232162475585938, "Pretrain/Loss (Raw)": 2.1779677867889404, "Pretrain/Step": 5868, "Pretrain/Step Time": 8.517217734828591} +{"Pretrain/Learning Rate": 1.7013439134094815e-05, "Pretrain/Loss": 2.0231242179870605, "Pretrain/Loss (Raw)": 1.716942548751831, "Pretrain/Step": 5869, "Pretrain/Step Time": 8.512288404628634} +{"Pretrain/Learning Rate": 1.7005394599985273e-05, "Pretrain/Loss": 2.0237975120544434, "Pretrain/Loss (Raw)": 2.0513548851013184, "Pretrain/Step": 5870, "Pretrain/Step Time": 8.510595643892884} +{"Pretrain/Learning Rate": 1.6997350987851308e-05, "Pretrain/Loss": 2.022428274154663, "Pretrain/Loss (Raw)": 2.027076244354248, "Pretrain/Step": 5871, "Pretrain/Step Time": 8.511848965659738} +{"Pretrain/Learning Rate": 1.6989308298620526e-05, "Pretrain/Loss": 2.0215237140655518, "Pretrain/Loss (Raw)": 2.072979211807251, "Pretrain/Step": 5872, "Pretrain/Step Time": 8.516724575310946} +{"Pretrain/Learning Rate": 1.6981266533220467e-05, "Pretrain/Loss": 2.021822214126587, "Pretrain/Loss (Raw)": 1.9784034490585327, "Pretrain/Step": 5873, "Pretrain/Step Time": 8.521395096555352} +{"Pretrain/Learning Rate": 1.6973225692578533e-05, "Pretrain/Loss": 2.0220232009887695, "Pretrain/Loss (Raw)": 2.087153196334839, "Pretrain/Step": 5874, "Pretrain/Step Time": 8.525057861581445} +{"Pretrain/Learning Rate": 1.6965185777622037e-05, "Pretrain/Loss": 2.0212249755859375, "Pretrain/Loss (Raw)": 1.9932899475097656, "Pretrain/Step": 5875, "Pretrain/Step Time": 8.517066104337573} +{"Pretrain/Learning Rate": 1.6957146789278175e-05, "Pretrain/Loss": 2.0226287841796875, "Pretrain/Loss (Raw)": 2.03934383392334, "Pretrain/Step": 5876, "Pretrain/Step Time": 8.511493608355522} +{"Pretrain/Learning Rate": 1.694910872847405e-05, "Pretrain/Loss": 2.022393226623535, "Pretrain/Loss (Raw)": 1.9288413524627686, "Pretrain/Step": 5877, "Pretrain/Step Time": 8.510047337040305} +{"Pretrain/Learning Rate": 1.694107159613664e-05, "Pretrain/Loss": 2.022663116455078, "Pretrain/Loss (Raw)": 1.8814196586608887, "Pretrain/Step": 5878, "Pretrain/Step Time": 8.51210517808795} +{"Pretrain/Learning Rate": 1.6933035393192824e-05, "Pretrain/Loss": 2.024506092071533, "Pretrain/Loss (Raw)": 2.0154974460601807, "Pretrain/Step": 5879, "Pretrain/Step Time": 8.513845641165972} +{"Pretrain/Learning Rate": 1.6925000120569385e-05, "Pretrain/Loss": 2.0214662551879883, "Pretrain/Loss (Raw)": 2.1035141944885254, "Pretrain/Step": 5880, "Pretrain/Step Time": 8.518888829275966} +{"Pretrain/Learning Rate": 1.6916965779192983e-05, "Pretrain/Loss": 2.023414134979248, "Pretrain/Loss (Raw)": 2.044543504714966, "Pretrain/Step": 5881, "Pretrain/Step Time": 8.519818373024464} +{"Pretrain/Learning Rate": 1.6908932369990176e-05, "Pretrain/Loss": 2.0234782695770264, "Pretrain/Loss (Raw)": 2.07425856590271, "Pretrain/Step": 5882, "Pretrain/Step Time": 8.514325166121125} +{"Pretrain/Learning Rate": 1.6900899893887408e-05, "Pretrain/Loss": 2.0210256576538086, "Pretrain/Loss (Raw)": 1.9924356937408447, "Pretrain/Step": 5883, "Pretrain/Step Time": 8.503595005720854} +{"Pretrain/Learning Rate": 1.6892868351811036e-05, "Pretrain/Loss": 2.0236222743988037, "Pretrain/Loss (Raw)": 2.211219072341919, "Pretrain/Step": 5884, "Pretrain/Step Time": 8.503055425360799} +{"Pretrain/Learning Rate": 1.6884837744687284e-05, "Pretrain/Loss": 2.0237061977386475, "Pretrain/Loss (Raw)": 2.022474765777588, "Pretrain/Step": 5885, "Pretrain/Step Time": 8.510809211060405} +{"Pretrain/Learning Rate": 1.687680807344229e-05, "Pretrain/Loss": 2.0241146087646484, "Pretrain/Loss (Raw)": 1.9929450750350952, "Pretrain/Step": 5886, "Pretrain/Step Time": 8.515217276290059} +{"Pretrain/Learning Rate": 1.6868779339002056e-05, "Pretrain/Loss": 2.0238568782806396, "Pretrain/Loss (Raw)": 2.081873655319214, "Pretrain/Step": 5887, "Pretrain/Step Time": 8.512501934543252} +{"Pretrain/Learning Rate": 1.6860751542292515e-05, "Pretrain/Loss": 2.0235774517059326, "Pretrain/Loss (Raw)": 1.9505754709243774, "Pretrain/Step": 5888, "Pretrain/Step Time": 8.510565424337983} +{"Pretrain/Learning Rate": 1.685272468423945e-05, "Pretrain/Loss": 2.0240278244018555, "Pretrain/Loss (Raw)": 2.0580079555511475, "Pretrain/Step": 5889, "Pretrain/Step Time": 8.509358445182443} +{"Pretrain/Learning Rate": 1.6844698765768575e-05, "Pretrain/Loss": 2.02689528465271, "Pretrain/Loss (Raw)": 2.2949516773223877, "Pretrain/Step": 5890, "Pretrain/Step Time": 8.509793436154723} +{"Pretrain/Learning Rate": 1.6836673787805456e-05, "Pretrain/Loss": 2.0255908966064453, "Pretrain/Loss (Raw)": 1.9030512571334839, "Pretrain/Step": 5891, "Pretrain/Step Time": 8.514285076409578} +{"Pretrain/Learning Rate": 1.6828649751275592e-05, "Pretrain/Loss": 2.026120185852051, "Pretrain/Loss (Raw)": 2.0595169067382812, "Pretrain/Step": 5892, "Pretrain/Step Time": 8.51478443108499} +{"Pretrain/Learning Rate": 1.682062665710434e-05, "Pretrain/Loss": 2.0281081199645996, "Pretrain/Loss (Raw)": 2.2932474613189697, "Pretrain/Step": 5893, "Pretrain/Step Time": 8.519619373604655} +{"Pretrain/Learning Rate": 1.6812604506216966e-05, "Pretrain/Loss": 2.027960777282715, "Pretrain/Loss (Raw)": 2.0379815101623535, "Pretrain/Step": 5894, "Pretrain/Step Time": 8.506252938881516} +{"Pretrain/Learning Rate": 1.6804583299538614e-05, "Pretrain/Loss": 2.0286712646484375, "Pretrain/Loss (Raw)": 1.9248454570770264, "Pretrain/Step": 5895, "Pretrain/Step Time": 8.505796037614346} +{"Pretrain/Learning Rate": 1.6796563037994347e-05, "Pretrain/Loss": 2.0278396606445312, "Pretrain/Loss (Raw)": 1.8843934535980225, "Pretrain/Step": 5896, "Pretrain/Step Time": 8.50903394818306} +{"Pretrain/Learning Rate": 1.678854372250907e-05, "Pretrain/Loss": 2.0303516387939453, "Pretrain/Loss (Raw)": 2.2115347385406494, "Pretrain/Step": 5897, "Pretrain/Step Time": 8.514271717518568} +{"Pretrain/Learning Rate": 1.6780525354007644e-05, "Pretrain/Loss": 2.029670476913452, "Pretrain/Loss (Raw)": 2.023280143737793, "Pretrain/Step": 5898, "Pretrain/Step Time": 8.514609204605222} +{"Pretrain/Learning Rate": 1.6772507933414744e-05, "Pretrain/Loss": 2.028806209564209, "Pretrain/Loss (Raw)": 1.9380868673324585, "Pretrain/Step": 5899, "Pretrain/Step Time": 8.509241718798876} +{"Pretrain/Learning Rate": 1.6764491461655017e-05, "Pretrain/Loss": 2.031397819519043, "Pretrain/Loss (Raw)": 2.247487783432007, "Pretrain/Step": 5900, "Pretrain/Step Time": 8.507380655035377} +{"Pretrain/Learning Rate": 1.6756475939652927e-05, "Pretrain/Loss": 2.0321526527404785, "Pretrain/Loss (Raw)": 2.1051435470581055, "Pretrain/Step": 5901, "Pretrain/Step Time": 8.508451106026769} +{"Pretrain/Learning Rate": 1.674846136833289e-05, "Pretrain/Loss": 2.0322959423065186, "Pretrain/Loss (Raw)": 1.9284340143203735, "Pretrain/Step": 5902, "Pretrain/Step Time": 8.513136675581336} +{"Pretrain/Learning Rate": 1.6740447748619156e-05, "Pretrain/Loss": 2.030336856842041, "Pretrain/Loss (Raw)": 2.025341272354126, "Pretrain/Step": 5903, "Pretrain/Step Time": 8.513713015243411} +{"Pretrain/Learning Rate": 1.6732435081435924e-05, "Pretrain/Loss": 2.0293526649475098, "Pretrain/Loss (Raw)": 1.9264434576034546, "Pretrain/Step": 5904, "Pretrain/Step Time": 8.5097662396729} +{"Pretrain/Learning Rate": 1.6724423367707226e-05, "Pretrain/Loss": 2.0298588275909424, "Pretrain/Loss (Raw)": 1.8543570041656494, "Pretrain/Step": 5905, "Pretrain/Step Time": 8.504698971286416} +{"Pretrain/Learning Rate": 1.6716412608357024e-05, "Pretrain/Loss": 2.0255839824676514, "Pretrain/Loss (Raw)": 1.903928279876709, "Pretrain/Step": 5906, "Pretrain/Step Time": 8.504180952906609} +{"Pretrain/Learning Rate": 1.670840280430915e-05, "Pretrain/Loss": 2.0247132778167725, "Pretrain/Loss (Raw)": 2.0020015239715576, "Pretrain/Step": 5907, "Pretrain/Step Time": 8.51182071492076} +{"Pretrain/Learning Rate": 1.6700393956487342e-05, "Pretrain/Loss": 2.0256876945495605, "Pretrain/Loss (Raw)": 2.1281630992889404, "Pretrain/Step": 5908, "Pretrain/Step Time": 8.512469597160816} +{"Pretrain/Learning Rate": 1.6692386065815203e-05, "Pretrain/Loss": 2.027656078338623, "Pretrain/Loss (Raw)": 2.2668464183807373, "Pretrain/Step": 5909, "Pretrain/Step Time": 8.51470391638577} +{"Pretrain/Learning Rate": 1.668437913321626e-05, "Pretrain/Loss": 2.0272669792175293, "Pretrain/Loss (Raw)": 1.9931972026824951, "Pretrain/Step": 5910, "Pretrain/Step Time": 8.50927098467946} +{"Pretrain/Learning Rate": 1.667637315961389e-05, "Pretrain/Loss": 2.025636672973633, "Pretrain/Loss (Raw)": 1.910770058631897, "Pretrain/Step": 5911, "Pretrain/Step Time": 8.504685837775469} +{"Pretrain/Learning Rate": 1.6668368145931397e-05, "Pretrain/Loss": 2.024688482284546, "Pretrain/Loss (Raw)": 1.8864893913269043, "Pretrain/Step": 5912, "Pretrain/Step Time": 8.503097211942077} +{"Pretrain/Learning Rate": 1.6660364093091945e-05, "Pretrain/Loss": 2.0291404724121094, "Pretrain/Loss (Raw)": 2.340369939804077, "Pretrain/Step": 5913, "Pretrain/Step Time": 8.511633621528745} +{"Pretrain/Learning Rate": 1.6652361002018608e-05, "Pretrain/Loss": 2.0282297134399414, "Pretrain/Loss (Raw)": 1.842203140258789, "Pretrain/Step": 5914, "Pretrain/Step Time": 8.51426787301898} +{"Pretrain/Learning Rate": 1.664435887363433e-05, "Pretrain/Loss": 2.0272552967071533, "Pretrain/Loss (Raw)": 1.920017957687378, "Pretrain/Step": 5915, "Pretrain/Step Time": 8.511856375262141} +{"Pretrain/Learning Rate": 1.6636357708861966e-05, "Pretrain/Loss": 2.027906894683838, "Pretrain/Loss (Raw)": 1.8649966716766357, "Pretrain/Step": 5916, "Pretrain/Step Time": 8.511092877015471} +{"Pretrain/Learning Rate": 1.6628357508624234e-05, "Pretrain/Loss": 2.0307188034057617, "Pretrain/Loss (Raw)": 2.0741403102874756, "Pretrain/Step": 5917, "Pretrain/Step Time": 8.516273647546768} +{"Pretrain/Learning Rate": 1.662035827384377e-05, "Pretrain/Loss": 2.0317628383636475, "Pretrain/Loss (Raw)": 2.146543025970459, "Pretrain/Step": 5918, "Pretrain/Step Time": 8.507478838786483} +{"Pretrain/Learning Rate": 1.661236000544307e-05, "Pretrain/Loss": 2.031364917755127, "Pretrain/Loss (Raw)": 2.0343918800354004, "Pretrain/Step": 5919, "Pretrain/Step Time": 8.506808064877987} +{"Pretrain/Learning Rate": 1.660436270434454e-05, "Pretrain/Loss": 2.030585765838623, "Pretrain/Loss (Raw)": 1.8959952592849731, "Pretrain/Step": 5920, "Pretrain/Step Time": 8.508621057495475} +{"Pretrain/Learning Rate": 1.6596366371470466e-05, "Pretrain/Loss": 2.028107166290283, "Pretrain/Loss (Raw)": 1.6914948225021362, "Pretrain/Step": 5921, "Pretrain/Step Time": 8.509639693424106} +{"Pretrain/Learning Rate": 1.658837100774302e-05, "Pretrain/Loss": 2.0291271209716797, "Pretrain/Loss (Raw)": 1.9950586557388306, "Pretrain/Step": 5922, "Pretrain/Step Time": 8.519288936629891} +{"Pretrain/Learning Rate": 1.658037661408427e-05, "Pretrain/Loss": 2.030710220336914, "Pretrain/Loss (Raw)": 2.1345560550689697, "Pretrain/Step": 5923, "Pretrain/Step Time": 8.515598738566041} +{"Pretrain/Learning Rate": 1.657238319141616e-05, "Pretrain/Loss": 2.031214714050293, "Pretrain/Loss (Raw)": 2.0300002098083496, "Pretrain/Step": 5924, "Pretrain/Step Time": 8.511475058272481} +{"Pretrain/Learning Rate": 1.656439074066053e-05, "Pretrain/Loss": 2.031609058380127, "Pretrain/Loss (Raw)": 1.9956614971160889, "Pretrain/Step": 5925, "Pretrain/Step Time": 8.512979499995708} +{"Pretrain/Learning Rate": 1.655639926273911e-05, "Pretrain/Loss": 2.030372381210327, "Pretrain/Loss (Raw)": 1.9606373310089111, "Pretrain/Step": 5926, "Pretrain/Step Time": 8.516629088670015} +{"Pretrain/Learning Rate": 1.654840875857352e-05, "Pretrain/Loss": 2.029421329498291, "Pretrain/Loss (Raw)": 2.076551914215088, "Pretrain/Step": 5927, "Pretrain/Step Time": 8.52145510725677} +{"Pretrain/Learning Rate": 1.654041922908525e-05, "Pretrain/Loss": 2.0273914337158203, "Pretrain/Loss (Raw)": 2.1572647094726562, "Pretrain/Step": 5928, "Pretrain/Step Time": 8.520960779860616} +{"Pretrain/Learning Rate": 1.6532430675195705e-05, "Pretrain/Loss": 2.027587652206421, "Pretrain/Loss (Raw)": 2.0129547119140625, "Pretrain/Step": 5929, "Pretrain/Step Time": 8.515019819140434} +{"Pretrain/Learning Rate": 1.652444309782615e-05, "Pretrain/Loss": 2.024874210357666, "Pretrain/Loss (Raw)": 1.7583762407302856, "Pretrain/Step": 5930, "Pretrain/Step Time": 8.515291510149837} +{"Pretrain/Learning Rate": 1.651645649789776e-05, "Pretrain/Loss": 2.0254244804382324, "Pretrain/Loss (Raw)": 2.134340286254883, "Pretrain/Step": 5931, "Pretrain/Step Time": 8.518578996881843} +{"Pretrain/Learning Rate": 1.6508470876331577e-05, "Pretrain/Loss": 2.0274760723114014, "Pretrain/Loss (Raw)": 2.2226510047912598, "Pretrain/Step": 5932, "Pretrain/Step Time": 8.523337146267295} +{"Pretrain/Learning Rate": 1.650048623404855e-05, "Pretrain/Loss": 2.028744697570801, "Pretrain/Loss (Raw)": 2.059600591659546, "Pretrain/Step": 5933, "Pretrain/Step Time": 8.526010712608695} +{"Pretrain/Learning Rate": 1.6492502571969498e-05, "Pretrain/Loss": 2.0295047760009766, "Pretrain/Loss (Raw)": 2.123352527618408, "Pretrain/Step": 5934, "Pretrain/Step Time": 8.521234693005681} +{"Pretrain/Learning Rate": 1.6484519891015143e-05, "Pretrain/Loss": 2.030179500579834, "Pretrain/Loss (Raw)": 2.0531272888183594, "Pretrain/Step": 5935, "Pretrain/Step Time": 8.523792244493961} +{"Pretrain/Learning Rate": 1.647653819210607e-05, "Pretrain/Loss": 2.02933406829834, "Pretrain/Loss (Raw)": 1.9354820251464844, "Pretrain/Step": 5936, "Pretrain/Step Time": 8.51410186290741} +{"Pretrain/Learning Rate": 1.6468557476162793e-05, "Pretrain/Loss": 2.0278210639953613, "Pretrain/Loss (Raw)": 1.9055737257003784, "Pretrain/Step": 5937, "Pretrain/Step Time": 8.512495392933488} +{"Pretrain/Learning Rate": 1.6460577744105654e-05, "Pretrain/Loss": 2.027524948120117, "Pretrain/Loss (Raw)": 1.993327021598816, "Pretrain/Step": 5938, "Pretrain/Step Time": 8.522572316229343} +{"Pretrain/Learning Rate": 1.6452598996854943e-05, "Pretrain/Loss": 2.0274243354797363, "Pretrain/Loss (Raw)": 2.010277271270752, "Pretrain/Step": 5939, "Pretrain/Step Time": 8.522753238677979} +{"Pretrain/Learning Rate": 1.6444621235330777e-05, "Pretrain/Loss": 2.0268871784210205, "Pretrain/Loss (Raw)": 2.0938045978546143, "Pretrain/Step": 5940, "Pretrain/Step Time": 8.517797987908125} +{"Pretrain/Learning Rate": 1.6436644460453217e-05, "Pretrain/Loss": 2.028759002685547, "Pretrain/Loss (Raw)": 2.2098796367645264, "Pretrain/Step": 5941, "Pretrain/Step Time": 8.515428449958563} +{"Pretrain/Learning Rate": 1.642866867314216e-05, "Pretrain/Loss": 2.028228759765625, "Pretrain/Loss (Raw)": 1.9944994449615479, "Pretrain/Step": 5942, "Pretrain/Step Time": 8.514292158186436} +{"Pretrain/Learning Rate": 1.642069387431743e-05, "Pretrain/Loss": 2.0292298793792725, "Pretrain/Loss (Raw)": 2.193387269973755, "Pretrain/Step": 5943, "Pretrain/Step Time": 8.512857930734754} +{"Pretrain/Learning Rate": 1.64127200648987e-05, "Pretrain/Loss": 2.0292584896087646, "Pretrain/Loss (Raw)": 1.958937644958496, "Pretrain/Step": 5944, "Pretrain/Step Time": 8.51982588134706} +{"Pretrain/Learning Rate": 1.6404747245805567e-05, "Pretrain/Loss": 2.031130313873291, "Pretrain/Loss (Raw)": 2.137199640274048, "Pretrain/Step": 5945, "Pretrain/Step Time": 8.518747970461845} +{"Pretrain/Learning Rate": 1.6396775417957478e-05, "Pretrain/Loss": 2.0289535522460938, "Pretrain/Loss (Raw)": 1.9511736631393433, "Pretrain/Step": 5946, "Pretrain/Step Time": 8.515801060944796} +{"Pretrain/Learning Rate": 1.6388804582273788e-05, "Pretrain/Loss": 2.0292727947235107, "Pretrain/Loss (Raw)": 2.1821892261505127, "Pretrain/Step": 5947, "Pretrain/Step Time": 8.506302958354354} +{"Pretrain/Learning Rate": 1.6380834739673727e-05, "Pretrain/Loss": 2.031536102294922, "Pretrain/Loss (Raw)": 2.158338785171509, "Pretrain/Step": 5948, "Pretrain/Step Time": 8.50585781224072} +{"Pretrain/Learning Rate": 1.6372865891076426e-05, "Pretrain/Loss": 2.028921604156494, "Pretrain/Loss (Raw)": 1.8882445096969604, "Pretrain/Step": 5949, "Pretrain/Step Time": 8.507742514833808} +{"Pretrain/Learning Rate": 1.6364898037400876e-05, "Pretrain/Loss": 2.03102970123291, "Pretrain/Loss (Raw)": 2.192761182785034, "Pretrain/Step": 5950, "Pretrain/Step Time": 8.511870600283146} +{"Pretrain/Learning Rate": 1.6356931179565978e-05, "Pretrain/Loss": 2.0310611724853516, "Pretrain/Loss (Raw)": 2.088226556777954, "Pretrain/Step": 5951, "Pretrain/Step Time": 8.512320565059781} +{"Pretrain/Learning Rate": 1.63489653184905e-05, "Pretrain/Loss": 2.031517744064331, "Pretrain/Loss (Raw)": 2.045769453048706, "Pretrain/Step": 5952, "Pretrain/Step Time": 8.506769521161914} +{"Pretrain/Learning Rate": 1.6341000455093115e-05, "Pretrain/Loss": 2.0326600074768066, "Pretrain/Loss (Raw)": 2.2681453227996826, "Pretrain/Step": 5953, "Pretrain/Step Time": 8.505401952192187} +{"Pretrain/Learning Rate": 1.633303659029235e-05, "Pretrain/Loss": 2.0359725952148438, "Pretrain/Loss (Raw)": 2.1204118728637695, "Pretrain/Step": 5954, "Pretrain/Step Time": 8.503437802195549} +{"Pretrain/Learning Rate": 1.6325073725006654e-05, "Pretrain/Loss": 2.030975341796875, "Pretrain/Loss (Raw)": 1.7729084491729736, "Pretrain/Step": 5955, "Pretrain/Step Time": 8.50332186743617} +{"Pretrain/Learning Rate": 1.6317111860154328e-05, "Pretrain/Loss": 2.0332226753234863, "Pretrain/Loss (Raw)": 2.094447135925293, "Pretrain/Step": 5956, "Pretrain/Step Time": 8.513571612536907} +{"Pretrain/Learning Rate": 1.6309150996653582e-05, "Pretrain/Loss": 2.0341217517852783, "Pretrain/Loss (Raw)": 2.0073487758636475, "Pretrain/Step": 5957, "Pretrain/Step Time": 8.516449831426144} +{"Pretrain/Learning Rate": 1.630119113542249e-05, "Pretrain/Loss": 2.032942771911621, "Pretrain/Loss (Raw)": 2.025592088699341, "Pretrain/Step": 5958, "Pretrain/Step Time": 8.518921641632915} +{"Pretrain/Learning Rate": 1.629323227737903e-05, "Pretrain/Loss": 2.0311408042907715, "Pretrain/Loss (Raw)": 1.8765064477920532, "Pretrain/Step": 5959, "Pretrain/Step Time": 8.511690182611346} +{"Pretrain/Learning Rate": 1.628527442344105e-05, "Pretrain/Loss": 2.02970814704895, "Pretrain/Loss (Raw)": 1.9090299606323242, "Pretrain/Step": 5960, "Pretrain/Step Time": 8.511263052001595} +{"Pretrain/Learning Rate": 1.6277317574526284e-05, "Pretrain/Loss": 2.0253844261169434, "Pretrain/Loss (Raw)": 1.9436986446380615, "Pretrain/Step": 5961, "Pretrain/Step Time": 8.51246264949441} +{"Pretrain/Learning Rate": 1.626936173155237e-05, "Pretrain/Loss": 2.02687406539917, "Pretrain/Loss (Raw)": 2.1004271507263184, "Pretrain/Step": 5962, "Pretrain/Step Time": 8.52153854072094} +{"Pretrain/Learning Rate": 1.626140689543679e-05, "Pretrain/Loss": 2.026444911956787, "Pretrain/Loss (Raw)": 2.0619637966156006, "Pretrain/Step": 5963, "Pretrain/Step Time": 8.521895442157984} +{"Pretrain/Learning Rate": 1.6253453067096954e-05, "Pretrain/Loss": 2.0261166095733643, "Pretrain/Loss (Raw)": 2.1122419834136963, "Pretrain/Step": 5964, "Pretrain/Step Time": 8.519344188272953} +{"Pretrain/Learning Rate": 1.6245500247450114e-05, "Pretrain/Loss": 2.026477813720703, "Pretrain/Loss (Raw)": 1.9950402975082397, "Pretrain/Step": 5965, "Pretrain/Step Time": 8.509530605748296} +{"Pretrain/Learning Rate": 1.6237548437413448e-05, "Pretrain/Loss": 2.026416301727295, "Pretrain/Loss (Raw)": 1.882863998413086, "Pretrain/Step": 5966, "Pretrain/Step Time": 8.512213800102472} +{"Pretrain/Learning Rate": 1.622959763790398e-05, "Pretrain/Loss": 2.025325298309326, "Pretrain/Loss (Raw)": 1.9253190755844116, "Pretrain/Step": 5967, "Pretrain/Step Time": 8.515742076560855} +{"Pretrain/Learning Rate": 1.6221647849838645e-05, "Pretrain/Loss": 2.0246052742004395, "Pretrain/Loss (Raw)": 2.1682069301605225, "Pretrain/Step": 5968, "Pretrain/Step Time": 8.514484647661448} +{"Pretrain/Learning Rate": 1.621369907413424e-05, "Pretrain/Loss": 2.024843692779541, "Pretrain/Loss (Raw)": 1.9435538053512573, "Pretrain/Step": 5969, "Pretrain/Step Time": 8.516734620556235} +{"Pretrain/Learning Rate": 1.6205751311707463e-05, "Pretrain/Loss": 2.0231194496154785, "Pretrain/Loss (Raw)": 1.8040282726287842, "Pretrain/Step": 5970, "Pretrain/Step Time": 8.516443572938442} +{"Pretrain/Learning Rate": 1.6197804563474882e-05, "Pretrain/Loss": 2.0239598751068115, "Pretrain/Loss (Raw)": 2.186577558517456, "Pretrain/Step": 5971, "Pretrain/Step Time": 8.509344931691885} +{"Pretrain/Learning Rate": 1.6189858830352962e-05, "Pretrain/Loss": 2.0238797664642334, "Pretrain/Loss (Raw)": 1.9837077856063843, "Pretrain/Step": 5972, "Pretrain/Step Time": 8.507106648758054} +{"Pretrain/Learning Rate": 1.618191411325803e-05, "Pretrain/Loss": 2.0218944549560547, "Pretrain/Loss (Raw)": 1.9964373111724854, "Pretrain/Step": 5973, "Pretrain/Step Time": 8.507989322766662} +{"Pretrain/Learning Rate": 1.617397041310632e-05, "Pretrain/Loss": 2.0219154357910156, "Pretrain/Loss (Raw)": 2.022782802581787, "Pretrain/Step": 5974, "Pretrain/Step Time": 8.51483186520636} +{"Pretrain/Learning Rate": 1.6166027730813926e-05, "Pretrain/Loss": 2.02180552482605, "Pretrain/Loss (Raw)": 1.9244853258132935, "Pretrain/Step": 5975, "Pretrain/Step Time": 8.513759769499302} +{"Pretrain/Learning Rate": 1.6158086067296844e-05, "Pretrain/Loss": 2.020555019378662, "Pretrain/Loss (Raw)": 1.898847222328186, "Pretrain/Step": 5976, "Pretrain/Step Time": 8.510007182136178} +{"Pretrain/Learning Rate": 1.615014542347094e-05, "Pretrain/Loss": 2.0201210975646973, "Pretrain/Loss (Raw)": 2.0226964950561523, "Pretrain/Step": 5977, "Pretrain/Step Time": 8.49383376725018} +{"Pretrain/Learning Rate": 1.6142205800251968e-05, "Pretrain/Loss": 2.0209708213806152, "Pretrain/Loss (Raw)": 1.9762461185455322, "Pretrain/Step": 5978, "Pretrain/Step Time": 8.49656774289906} +{"Pretrain/Learning Rate": 1.6134267198555563e-05, "Pretrain/Loss": 2.020905017852783, "Pretrain/Loss (Raw)": 1.9474024772644043, "Pretrain/Step": 5979, "Pretrain/Step Time": 8.505645874887705} +{"Pretrain/Learning Rate": 1.612632961929725e-05, "Pretrain/Loss": 2.020045280456543, "Pretrain/Loss (Raw)": 2.030388355255127, "Pretrain/Step": 5980, "Pretrain/Step Time": 8.507031593471766} +{"Pretrain/Learning Rate": 1.6118393063392402e-05, "Pretrain/Loss": 2.0207366943359375, "Pretrain/Loss (Raw)": 2.0962724685668945, "Pretrain/Step": 5981, "Pretrain/Step Time": 8.514255356043577} +{"Pretrain/Learning Rate": 1.6110457531756334e-05, "Pretrain/Loss": 2.022153377532959, "Pretrain/Loss (Raw)": 2.1982102394104004, "Pretrain/Step": 5982, "Pretrain/Step Time": 8.505513986572623} +{"Pretrain/Learning Rate": 1.6102523025304178e-05, "Pretrain/Loss": 2.0217294692993164, "Pretrain/Loss (Raw)": 2.1460318565368652, "Pretrain/Step": 5983, "Pretrain/Step Time": 8.495830416679382} +{"Pretrain/Learning Rate": 1.6094589544951006e-05, "Pretrain/Loss": 2.020310878753662, "Pretrain/Loss (Raw)": 2.0264525413513184, "Pretrain/Step": 5984, "Pretrain/Step Time": 8.502795428037643} +{"Pretrain/Learning Rate": 1.6086657091611718e-05, "Pretrain/Loss": 2.0202441215515137, "Pretrain/Loss (Raw)": 1.8750627040863037, "Pretrain/Step": 5985, "Pretrain/Step Time": 8.506786860525608} +{"Pretrain/Learning Rate": 1.607872566620115e-05, "Pretrain/Loss": 2.0205421447753906, "Pretrain/Loss (Raw)": 2.024165153503418, "Pretrain/Step": 5986, "Pretrain/Step Time": 8.511197056621313} +{"Pretrain/Learning Rate": 1.6070795269633964e-05, "Pretrain/Loss": 2.0198471546173096, "Pretrain/Loss (Raw)": 1.909288763999939, "Pretrain/Step": 5987, "Pretrain/Step Time": 8.512393940240145} +{"Pretrain/Learning Rate": 1.6062865902824754e-05, "Pretrain/Loss": 2.019294500350952, "Pretrain/Loss (Raw)": 1.946486234664917, "Pretrain/Step": 5988, "Pretrain/Step Time": 8.509628923609853} +{"Pretrain/Learning Rate": 1.605493756668795e-05, "Pretrain/Loss": 2.0219364166259766, "Pretrain/Loss (Raw)": 1.9888840913772583, "Pretrain/Step": 5989, "Pretrain/Step Time": 8.510619770735502} +{"Pretrain/Learning Rate": 1.6047010262137908e-05, "Pretrain/Loss": 2.022763252258301, "Pretrain/Loss (Raw)": 2.1758780479431152, "Pretrain/Step": 5990, "Pretrain/Step Time": 8.506774485111237} +{"Pretrain/Learning Rate": 1.603908399008882e-05, "Pretrain/Loss": 2.0255391597747803, "Pretrain/Loss (Raw)": 2.3970251083374023, "Pretrain/Step": 5991, "Pretrain/Step Time": 8.514638453722} +{"Pretrain/Learning Rate": 1.60311587514548e-05, "Pretrain/Loss": 2.0252718925476074, "Pretrain/Loss (Raw)": 1.9238169193267822, "Pretrain/Step": 5992, "Pretrain/Step Time": 8.516860876232386} +{"Pretrain/Learning Rate": 1.6023234547149808e-05, "Pretrain/Loss": 2.025465488433838, "Pretrain/Loss (Raw)": 2.012585163116455, "Pretrain/Step": 5993, "Pretrain/Step Time": 8.51583250053227} +{"Pretrain/Learning Rate": 1.6015311378087714e-05, "Pretrain/Loss": 2.0269289016723633, "Pretrain/Loss (Raw)": 2.019630193710327, "Pretrain/Step": 5994, "Pretrain/Step Time": 8.508690172806382} +{"Pretrain/Learning Rate": 1.600738924518224e-05, "Pretrain/Loss": 2.0261316299438477, "Pretrain/Loss (Raw)": 1.888803482055664, "Pretrain/Step": 5995, "Pretrain/Step Time": 8.504334652796388} +{"Pretrain/Learning Rate": 1.5999468149347024e-05, "Pretrain/Loss": 2.0247905254364014, "Pretrain/Loss (Raw)": 2.006291151046753, "Pretrain/Step": 5996, "Pretrain/Step Time": 8.509800000116229} +{"Pretrain/Learning Rate": 1.5991548091495546e-05, "Pretrain/Loss": 2.027757406234741, "Pretrain/Loss (Raw)": 2.096702814102173, "Pretrain/Step": 5997, "Pretrain/Step Time": 8.505485128611326} +{"Pretrain/Learning Rate": 1.5983629072541196e-05, "Pretrain/Loss": 2.0264205932617188, "Pretrain/Loss (Raw)": 1.8802250623703003, "Pretrain/Step": 5998, "Pretrain/Step Time": 8.513670690357685} +{"Pretrain/Learning Rate": 1.597571109339722e-05, "Pretrain/Loss": 2.027555227279663, "Pretrain/Loss (Raw)": 2.172325611114502, "Pretrain/Step": 5999, "Pretrain/Step Time": 8.519052444025874} +{"Pretrain/Learning Rate": 1.5967794154976773e-05, "Pretrain/Loss": 2.0270628929138184, "Pretrain/Loss (Raw)": 2.0099735260009766, "Pretrain/Step": 6000, "Pretrain/Step Time": 8.51282430998981} +{"Pretrain/Learning Rate": 1.5959878258192863e-05, "Pretrain/Loss": 2.028256893157959, "Pretrain/Loss (Raw)": 2.13122296333313, "Pretrain/Step": 6001, "Pretrain/Step Time": 8.508215768262744} +{"Pretrain/Learning Rate": 1.5951963403958382e-05, "Pretrain/Loss": 2.0275063514709473, "Pretrain/Loss (Raw)": 1.9910798072814941, "Pretrain/Step": 6002, "Pretrain/Step Time": 8.513377379626036} +{"Pretrain/Learning Rate": 1.5944049593186127e-05, "Pretrain/Loss": 2.0295825004577637, "Pretrain/Loss (Raw)": 2.2590529918670654, "Pretrain/Step": 6003, "Pretrain/Step Time": 8.518651336431503} +{"Pretrain/Learning Rate": 1.5936136826788745e-05, "Pretrain/Loss": 2.029299736022949, "Pretrain/Loss (Raw)": 2.003122568130493, "Pretrain/Step": 6004, "Pretrain/Step Time": 8.522478761151433} +{"Pretrain/Learning Rate": 1.5928225105678774e-05, "Pretrain/Loss": 2.0298585891723633, "Pretrain/Loss (Raw)": 2.000394821166992, "Pretrain/Step": 6005, "Pretrain/Step Time": 8.523436140269041} +{"Pretrain/Learning Rate": 1.592031443076863e-05, "Pretrain/Loss": 2.0318093299865723, "Pretrain/Loss (Raw)": 2.1311466693878174, "Pretrain/Step": 6006, "Pretrain/Step Time": 8.517432967200875} +{"Pretrain/Learning Rate": 1.591240480297061e-05, "Pretrain/Loss": 2.0332252979278564, "Pretrain/Loss (Raw)": 2.1967062950134277, "Pretrain/Step": 6007, "Pretrain/Step Time": 8.514160010963678} +{"Pretrain/Learning Rate": 1.590449622319689e-05, "Pretrain/Loss": 2.0346150398254395, "Pretrain/Loss (Raw)": 2.2814059257507324, "Pretrain/Step": 6008, "Pretrain/Step Time": 8.512757524847984} +{"Pretrain/Learning Rate": 1.589658869235953e-05, "Pretrain/Loss": 2.035443067550659, "Pretrain/Loss (Raw)": 2.1505327224731445, "Pretrain/Step": 6009, "Pretrain/Step Time": 8.513470279052854} +{"Pretrain/Learning Rate": 1.588868221137045e-05, "Pretrain/Loss": 2.0347793102264404, "Pretrain/Loss (Raw)": 1.9892821311950684, "Pretrain/Step": 6010, "Pretrain/Step Time": 8.522487506270409} +{"Pretrain/Learning Rate": 1.588077678114148e-05, "Pretrain/Loss": 2.0356087684631348, "Pretrain/Loss (Raw)": 2.0986053943634033, "Pretrain/Step": 6011, "Pretrain/Step Time": 8.52630853280425} +{"Pretrain/Learning Rate": 1.5872872402584296e-05, "Pretrain/Loss": 2.034965991973877, "Pretrain/Loss (Raw)": 2.128955364227295, "Pretrain/Step": 6012, "Pretrain/Step Time": 8.524676885455847} +{"Pretrain/Learning Rate": 1.586496907661048e-05, "Pretrain/Loss": 2.0344667434692383, "Pretrain/Loss (Raw)": 1.9585845470428467, "Pretrain/Step": 6013, "Pretrain/Step Time": 8.514699941501021} +{"Pretrain/Learning Rate": 1.5857066804131472e-05, "Pretrain/Loss": 2.034353256225586, "Pretrain/Loss (Raw)": 1.9783958196640015, "Pretrain/Step": 6014, "Pretrain/Step Time": 8.516705106943846} +{"Pretrain/Learning Rate": 1.5849165586058608e-05, "Pretrain/Loss": 2.033388137817383, "Pretrain/Loss (Raw)": 1.9583461284637451, "Pretrain/Step": 6015, "Pretrain/Step Time": 8.5269196331501} +{"Pretrain/Learning Rate": 1.5841265423303084e-05, "Pretrain/Loss": 2.0331170558929443, "Pretrain/Loss (Raw)": 1.915848970413208, "Pretrain/Step": 6016, "Pretrain/Step Time": 8.52651590667665} +{"Pretrain/Learning Rate": 1.5833366316775994e-05, "Pretrain/Loss": 2.0344247817993164, "Pretrain/Loss (Raw)": 2.225447416305542, "Pretrain/Step": 6017, "Pretrain/Step Time": 8.52369486913085} +{"Pretrain/Learning Rate": 1.582546826738829e-05, "Pretrain/Loss": 2.0315396785736084, "Pretrain/Loss (Raw)": 1.925620675086975, "Pretrain/Step": 6018, "Pretrain/Step Time": 8.522010516375303} +{"Pretrain/Learning Rate": 1.581757127605082e-05, "Pretrain/Loss": 2.0335071086883545, "Pretrain/Loss (Raw)": 2.154900312423706, "Pretrain/Step": 6019, "Pretrain/Step Time": 8.517721749842167} +{"Pretrain/Learning Rate": 1.5809675343674295e-05, "Pretrain/Loss": 2.033867597579956, "Pretrain/Loss (Raw)": 2.105654001235962, "Pretrain/Step": 6020, "Pretrain/Step Time": 8.519454553723335} +{"Pretrain/Learning Rate": 1.5801780471169324e-05, "Pretrain/Loss": 2.0332281589508057, "Pretrain/Loss (Raw)": 2.2114224433898926, "Pretrain/Step": 6021, "Pretrain/Step Time": 8.521445656195283} +{"Pretrain/Learning Rate": 1.579388665944636e-05, "Pretrain/Loss": 2.033088445663452, "Pretrain/Loss (Raw)": 2.0200788974761963, "Pretrain/Step": 6022, "Pretrain/Step Time": 8.5259446837008} +{"Pretrain/Learning Rate": 1.578599390941578e-05, "Pretrain/Loss": 2.0341360569000244, "Pretrain/Loss (Raw)": 2.058945655822754, "Pretrain/Step": 6023, "Pretrain/Step Time": 8.525144742801785} +{"Pretrain/Learning Rate": 1.577810222198779e-05, "Pretrain/Loss": 2.03285813331604, "Pretrain/Loss (Raw)": 1.7207961082458496, "Pretrain/Step": 6024, "Pretrain/Step Time": 8.518565207719803} +{"Pretrain/Learning Rate": 1.577021159807252e-05, "Pretrain/Loss": 2.0331382751464844, "Pretrain/Loss (Raw)": 2.24743914604187, "Pretrain/Step": 6025, "Pretrain/Step Time": 8.51261093467474} +{"Pretrain/Learning Rate": 1.5762322038579925e-05, "Pretrain/Loss": 2.030736207962036, "Pretrain/Loss (Raw)": 1.7157845497131348, "Pretrain/Step": 6026, "Pretrain/Step Time": 8.517278462648392} +{"Pretrain/Learning Rate": 1.5754433544419893e-05, "Pretrain/Loss": 2.0304479598999023, "Pretrain/Loss (Raw)": 1.9011995792388916, "Pretrain/Step": 6027, "Pretrain/Step Time": 8.512043256312609} +{"Pretrain/Learning Rate": 1.574654611650214e-05, "Pretrain/Loss": 2.028294086456299, "Pretrain/Loss (Raw)": 1.9717862606048584, "Pretrain/Step": 6028, "Pretrain/Step Time": 8.520469663664699} +{"Pretrain/Learning Rate": 1.5738659755736308e-05, "Pretrain/Loss": 2.0266804695129395, "Pretrain/Loss (Raw)": 1.8985910415649414, "Pretrain/Step": 6029, "Pretrain/Step Time": 8.522634806111455} +{"Pretrain/Learning Rate": 1.5730774463031862e-05, "Pretrain/Loss": 2.028886318206787, "Pretrain/Loss (Raw)": 2.2108070850372314, "Pretrain/Step": 6030, "Pretrain/Step Time": 8.515900418162346} +{"Pretrain/Learning Rate": 1.572289023929819e-05, "Pretrain/Loss": 2.0280203819274902, "Pretrain/Loss (Raw)": 1.9145137071609497, "Pretrain/Step": 6031, "Pretrain/Step Time": 8.510613363236189} +{"Pretrain/Learning Rate": 1.5715007085444523e-05, "Pretrain/Loss": 2.0271153450012207, "Pretrain/Loss (Raw)": 1.8105469942092896, "Pretrain/Step": 6032, "Pretrain/Step Time": 8.516534239053726} +{"Pretrain/Learning Rate": 1.5707125002379996e-05, "Pretrain/Loss": 2.0272364616394043, "Pretrain/Loss (Raw)": 1.869871735572815, "Pretrain/Step": 6033, "Pretrain/Step Time": 8.521534010767937} +{"Pretrain/Learning Rate": 1.56992439910136e-05, "Pretrain/Loss": 2.0277156829833984, "Pretrain/Loss (Raw)": 1.9652646780014038, "Pretrain/Step": 6034, "Pretrain/Step Time": 8.523003444075584} +{"Pretrain/Learning Rate": 1.569136405225422e-05, "Pretrain/Loss": 2.028613567352295, "Pretrain/Loss (Raw)": 2.1169285774230957, "Pretrain/Step": 6035, "Pretrain/Step Time": 8.520028453320265} +{"Pretrain/Learning Rate": 1.5683485187010593e-05, "Pretrain/Loss": 2.0281431674957275, "Pretrain/Loss (Raw)": 2.067962169647217, "Pretrain/Step": 6036, "Pretrain/Step Time": 8.51653709448874} +{"Pretrain/Learning Rate": 1.5675607396191366e-05, "Pretrain/Loss": 2.0263161659240723, "Pretrain/Loss (Raw)": 2.0330214500427246, "Pretrain/Step": 6037, "Pretrain/Step Time": 8.515603557229042} +{"Pretrain/Learning Rate": 1.5667730680705022e-05, "Pretrain/Loss": 2.027163028717041, "Pretrain/Loss (Raw)": 2.101543664932251, "Pretrain/Step": 6038, "Pretrain/Step Time": 8.516040606424212} +{"Pretrain/Learning Rate": 1.5659855041459955e-05, "Pretrain/Loss": 2.031292200088501, "Pretrain/Loss (Raw)": 2.4393227100372314, "Pretrain/Step": 6039, "Pretrain/Step Time": 8.520383102819324} +{"Pretrain/Learning Rate": 1.5651980479364416e-05, "Pretrain/Loss": 2.032290458679199, "Pretrain/Loss (Raw)": 2.014261484146118, "Pretrain/Step": 6040, "Pretrain/Step Time": 8.519331997260451} +{"Pretrain/Learning Rate": 1.564410699532654e-05, "Pretrain/Loss": 2.0304813385009766, "Pretrain/Loss (Raw)": 2.108839273452759, "Pretrain/Step": 6041, "Pretrain/Step Time": 8.513369834050536} +{"Pretrain/Learning Rate": 1.5636234590254324e-05, "Pretrain/Loss": 2.032609462738037, "Pretrain/Loss (Raw)": 2.1145873069763184, "Pretrain/Step": 6042, "Pretrain/Step Time": 8.504827434197068} +{"Pretrain/Learning Rate": 1.5628363265055664e-05, "Pretrain/Loss": 2.0352659225463867, "Pretrain/Loss (Raw)": 2.260012626647949, "Pretrain/Step": 6043, "Pretrain/Step Time": 8.510679427534342} +{"Pretrain/Learning Rate": 1.5620493020638315e-05, "Pretrain/Loss": 2.0350191593170166, "Pretrain/Loss (Raw)": 1.833423376083374, "Pretrain/Step": 6044, "Pretrain/Step Time": 8.515084266662598} +{"Pretrain/Learning Rate": 1.5612623857909904e-05, "Pretrain/Loss": 2.034365177154541, "Pretrain/Loss (Raw)": 1.990429401397705, "Pretrain/Step": 6045, "Pretrain/Step Time": 8.512647923082113} +{"Pretrain/Learning Rate": 1.5604755777777948e-05, "Pretrain/Loss": 2.0332202911376953, "Pretrain/Loss (Raw)": 1.9999762773513794, "Pretrain/Step": 6046, "Pretrain/Step Time": 8.516972517594695} +{"Pretrain/Learning Rate": 1.5596888781149827e-05, "Pretrain/Loss": 2.0342564582824707, "Pretrain/Loss (Raw)": 2.1670777797698975, "Pretrain/Step": 6047, "Pretrain/Step Time": 8.513543182983994} +{"Pretrain/Learning Rate": 1.55890228689328e-05, "Pretrain/Loss": 2.037745952606201, "Pretrain/Loss (Raw)": 2.3426308631896973, "Pretrain/Step": 6048, "Pretrain/Step Time": 8.51185460947454} +{"Pretrain/Learning Rate": 1.5581158042034e-05, "Pretrain/Loss": 2.040426254272461, "Pretrain/Loss (Raw)": 2.03458571434021, "Pretrain/Step": 6049, "Pretrain/Step Time": 8.50901148468256} +{"Pretrain/Learning Rate": 1.557329430136044e-05, "Pretrain/Loss": 2.040435314178467, "Pretrain/Loss (Raw)": 1.9962044954299927, "Pretrain/Step": 6050, "Pretrain/Step Time": 8.513465462252498} +{"Pretrain/Learning Rate": 1.5565431647819e-05, "Pretrain/Loss": 2.0383918285369873, "Pretrain/Loss (Raw)": 1.8729832172393799, "Pretrain/Step": 6051, "Pretrain/Step Time": 8.508281290531158} +{"Pretrain/Learning Rate": 1.555757008231644e-05, "Pretrain/Loss": 2.0364227294921875, "Pretrain/Loss (Raw)": 1.7779676914215088, "Pretrain/Step": 6052, "Pretrain/Step Time": 8.509460655972362} +{"Pretrain/Learning Rate": 1.5549709605759393e-05, "Pretrain/Loss": 2.040739059448242, "Pretrain/Loss (Raw)": 2.548135757446289, "Pretrain/Step": 6053, "Pretrain/Step Time": 8.506781818345189} +{"Pretrain/Learning Rate": 1.5541850219054366e-05, "Pretrain/Loss": 2.040818214416504, "Pretrain/Loss (Raw)": 1.9707738161087036, "Pretrain/Step": 6054, "Pretrain/Step Time": 8.504031563177705} +{"Pretrain/Learning Rate": 1.5533991923107737e-05, "Pretrain/Loss": 2.0405290126800537, "Pretrain/Loss (Raw)": 2.03951358795166, "Pretrain/Step": 6055, "Pretrain/Step Time": 8.501042246818542} +{"Pretrain/Learning Rate": 1.552613471882577e-05, "Pretrain/Loss": 2.0401601791381836, "Pretrain/Loss (Raw)": 2.1100656986236572, "Pretrain/Step": 6056, "Pretrain/Step Time": 8.510831385850906} +{"Pretrain/Learning Rate": 1.5518278607114585e-05, "Pretrain/Loss": 2.0406649112701416, "Pretrain/Loss (Raw)": 2.0775907039642334, "Pretrain/Step": 6057, "Pretrain/Step Time": 8.510310774669051} +{"Pretrain/Learning Rate": 1.5510423588880194e-05, "Pretrain/Loss": 2.0425729751586914, "Pretrain/Loss (Raw)": 2.002595901489258, "Pretrain/Step": 6058, "Pretrain/Step Time": 8.512902647256851} +{"Pretrain/Learning Rate": 1.5502569665028465e-05, "Pretrain/Loss": 2.041105270385742, "Pretrain/Loss (Raw)": 1.9464465379714966, "Pretrain/Step": 6059, "Pretrain/Step Time": 8.506111966446042} +{"Pretrain/Learning Rate": 1.549471683646516e-05, "Pretrain/Loss": 2.0393545627593994, "Pretrain/Loss (Raw)": 1.9985896348953247, "Pretrain/Step": 6060, "Pretrain/Step Time": 8.500453164801002} +{"Pretrain/Learning Rate": 1.54868651040959e-05, "Pretrain/Loss": 2.040192127227783, "Pretrain/Loss (Raw)": 2.16678786277771, "Pretrain/Step": 6061, "Pretrain/Step Time": 8.499751389026642} +{"Pretrain/Learning Rate": 1.5479014468826184e-05, "Pretrain/Loss": 2.039675235748291, "Pretrain/Loss (Raw)": 2.0571861267089844, "Pretrain/Step": 6062, "Pretrain/Step Time": 8.503642678260803} +{"Pretrain/Learning Rate": 1.547116493156138e-05, "Pretrain/Loss": 2.0409512519836426, "Pretrain/Loss (Raw)": 2.216485023498535, "Pretrain/Step": 6063, "Pretrain/Step Time": 8.50804734788835} +{"Pretrain/Learning Rate": 1.5463316493206748e-05, "Pretrain/Loss": 2.039883613586426, "Pretrain/Loss (Raw)": 1.7988152503967285, "Pretrain/Step": 6064, "Pretrain/Step Time": 8.512093294411898} +{"Pretrain/Learning Rate": 1.545546915466738e-05, "Pretrain/Loss": 2.038970947265625, "Pretrain/Loss (Raw)": 1.7887786626815796, "Pretrain/Step": 6065, "Pretrain/Step Time": 8.507303109392524} +{"Pretrain/Learning Rate": 1.54476229168483e-05, "Pretrain/Loss": 2.0390377044677734, "Pretrain/Loss (Raw)": 2.0018551349639893, "Pretrain/Step": 6066, "Pretrain/Step Time": 8.493350606411695} +{"Pretrain/Learning Rate": 1.543977778065434e-05, "Pretrain/Loss": 2.0387024879455566, "Pretrain/Loss (Raw)": 1.9673726558685303, "Pretrain/Step": 6067, "Pretrain/Step Time": 8.505010109394789} +{"Pretrain/Learning Rate": 1.5431933746990276e-05, "Pretrain/Loss": 2.0366575717926025, "Pretrain/Loss (Raw)": 1.8320422172546387, "Pretrain/Step": 6068, "Pretrain/Step Time": 8.510404882952571} +{"Pretrain/Learning Rate": 1.542409081676068e-05, "Pretrain/Loss": 2.035888433456421, "Pretrain/Loss (Raw)": 2.111450672149658, "Pretrain/Step": 6069, "Pretrain/Step Time": 8.513101283460855} +{"Pretrain/Learning Rate": 1.541624899087007e-05, "Pretrain/Loss": 2.0343375205993652, "Pretrain/Loss (Raw)": 1.7959578037261963, "Pretrain/Step": 6070, "Pretrain/Step Time": 8.507983868941665} +{"Pretrain/Learning Rate": 1.5408408270222773e-05, "Pretrain/Loss": 2.032271146774292, "Pretrain/Loss (Raw)": 1.9288828372955322, "Pretrain/Step": 6071, "Pretrain/Step Time": 8.511692050844431} +{"Pretrain/Learning Rate": 1.5400568655723043e-05, "Pretrain/Loss": 2.035261631011963, "Pretrain/Loss (Raw)": 2.341717481613159, "Pretrain/Step": 6072, "Pretrain/Step Time": 8.503711979836226} +{"Pretrain/Learning Rate": 1.5392730148274965e-05, "Pretrain/Loss": 2.034099578857422, "Pretrain/Loss (Raw)": 1.988486409187317, "Pretrain/Step": 6073, "Pretrain/Step Time": 8.505811125040054} +{"Pretrain/Learning Rate": 1.5384892748782513e-05, "Pretrain/Loss": 2.0342843532562256, "Pretrain/Loss (Raw)": 1.9748034477233887, "Pretrain/Step": 6074, "Pretrain/Step Time": 8.514940751716495} +{"Pretrain/Learning Rate": 1.5377056458149542e-05, "Pretrain/Loss": 2.0329270362854004, "Pretrain/Loss (Raw)": 2.008488655090332, "Pretrain/Step": 6075, "Pretrain/Step Time": 8.521177217364311} +{"Pretrain/Learning Rate": 1.5369221277279765e-05, "Pretrain/Loss": 2.0304501056671143, "Pretrain/Loss (Raw)": 1.8412843942642212, "Pretrain/Step": 6076, "Pretrain/Step Time": 8.52118843048811} +{"Pretrain/Learning Rate": 1.5361387207076766e-05, "Pretrain/Loss": 2.031348466873169, "Pretrain/Loss (Raw)": 2.003213882446289, "Pretrain/Step": 6077, "Pretrain/Step Time": 8.52191287279129} +{"Pretrain/Learning Rate": 1.5353554248444022e-05, "Pretrain/Loss": 2.0308773517608643, "Pretrain/Loss (Raw)": 2.132455825805664, "Pretrain/Step": 6078, "Pretrain/Step Time": 8.515792522579432} +{"Pretrain/Learning Rate": 1.5345722402284852e-05, "Pretrain/Loss": 2.03196382522583, "Pretrain/Loss (Raw)": 2.2272915840148926, "Pretrain/Step": 6079, "Pretrain/Step Time": 8.511268731206656} +{"Pretrain/Learning Rate": 1.5337891669502468e-05, "Pretrain/Loss": 2.032101631164551, "Pretrain/Loss (Raw)": 2.063417434692383, "Pretrain/Step": 6080, "Pretrain/Step Time": 8.521263126283884} +{"Pretrain/Learning Rate": 1.5330062050999945e-05, "Pretrain/Loss": 2.0307416915893555, "Pretrain/Loss (Raw)": 2.094088554382324, "Pretrain/Step": 6081, "Pretrain/Step Time": 8.51730971224606} +{"Pretrain/Learning Rate": 1.5322233547680235e-05, "Pretrain/Loss": 2.0299832820892334, "Pretrain/Loss (Raw)": 2.023327589035034, "Pretrain/Step": 6082, "Pretrain/Step Time": 8.520820558071136} +{"Pretrain/Learning Rate": 1.531440616044615e-05, "Pretrain/Loss": 2.0309319496154785, "Pretrain/Loss (Raw)": 1.8943519592285156, "Pretrain/Step": 6083, "Pretrain/Step Time": 8.519592192023993} +{"Pretrain/Learning Rate": 1.530657989020039e-05, "Pretrain/Loss": 2.030555248260498, "Pretrain/Loss (Raw)": 2.0461909770965576, "Pretrain/Step": 6084, "Pretrain/Step Time": 8.510880686342716} +{"Pretrain/Learning Rate": 1.5298754737845515e-05, "Pretrain/Loss": 2.0306124687194824, "Pretrain/Loss (Raw)": 2.014686346054077, "Pretrain/Step": 6085, "Pretrain/Step Time": 8.510026596486568} +{"Pretrain/Learning Rate": 1.5290930704283953e-05, "Pretrain/Loss": 2.032247304916382, "Pretrain/Loss (Raw)": 2.234842538833618, "Pretrain/Step": 6086, "Pretrain/Step Time": 8.515964906662703} +{"Pretrain/Learning Rate": 1.5283107790418023e-05, "Pretrain/Loss": 2.033912181854248, "Pretrain/Loss (Raw)": 2.0896458625793457, "Pretrain/Step": 6087, "Pretrain/Step Time": 8.515697091817856} +{"Pretrain/Learning Rate": 1.527528599714988e-05, "Pretrain/Loss": 2.03517484664917, "Pretrain/Loss (Raw)": 2.070612668991089, "Pretrain/Step": 6088, "Pretrain/Step Time": 8.52404334768653} +{"Pretrain/Learning Rate": 1.5267465325381584e-05, "Pretrain/Loss": 2.0342273712158203, "Pretrain/Loss (Raw)": 1.8224467039108276, "Pretrain/Step": 6089, "Pretrain/Step Time": 8.52482726611197} +{"Pretrain/Learning Rate": 1.5259645776015047e-05, "Pretrain/Loss": 2.035116195678711, "Pretrain/Loss (Raw)": 2.2142012119293213, "Pretrain/Step": 6090, "Pretrain/Step Time": 8.513489283621311} +{"Pretrain/Learning Rate": 1.5251827349952058e-05, "Pretrain/Loss": 2.0342342853546143, "Pretrain/Loss (Raw)": 1.9490745067596436, "Pretrain/Step": 6091, "Pretrain/Step Time": 8.515846060588956} +{"Pretrain/Learning Rate": 1.524401004809427e-05, "Pretrain/Loss": 2.0337419509887695, "Pretrain/Loss (Raw)": 2.0492193698883057, "Pretrain/Step": 6092, "Pretrain/Step Time": 8.517280684784055} +{"Pretrain/Learning Rate": 1.5236193871343224e-05, "Pretrain/Loss": 2.033815860748291, "Pretrain/Loss (Raw)": 2.004464626312256, "Pretrain/Step": 6093, "Pretrain/Step Time": 8.526400037109852} +{"Pretrain/Learning Rate": 1.5228378820600303e-05, "Pretrain/Loss": 2.0353050231933594, "Pretrain/Loss (Raw)": 2.0734832286834717, "Pretrain/Step": 6094, "Pretrain/Step Time": 8.529357589781284} +{"Pretrain/Learning Rate": 1.5220564896766784e-05, "Pretrain/Loss": 2.0358142852783203, "Pretrain/Loss (Raw)": 1.9905396699905396, "Pretrain/Step": 6095, "Pretrain/Step Time": 8.524574544280767} +{"Pretrain/Learning Rate": 1.52127521007438e-05, "Pretrain/Loss": 2.0357069969177246, "Pretrain/Loss (Raw)": 2.154461145401001, "Pretrain/Step": 6096, "Pretrain/Step Time": 8.523402465507388} +{"Pretrain/Learning Rate": 1.5204940433432368e-05, "Pretrain/Loss": 2.034644365310669, "Pretrain/Loss (Raw)": 1.8075470924377441, "Pretrain/Step": 6097, "Pretrain/Step Time": 8.524354349821806} +{"Pretrain/Learning Rate": 1.5197129895733354e-05, "Pretrain/Loss": 2.0379579067230225, "Pretrain/Loss (Raw)": 2.228147268295288, "Pretrain/Step": 6098, "Pretrain/Step Time": 8.525994442403316} +{"Pretrain/Learning Rate": 1.518932048854752e-05, "Pretrain/Loss": 2.037325859069824, "Pretrain/Loss (Raw)": 2.105696678161621, "Pretrain/Step": 6099, "Pretrain/Step Time": 8.525937832891941} +{"Pretrain/Learning Rate": 1.5181512212775472e-05, "Pretrain/Loss": 2.0376033782958984, "Pretrain/Loss (Raw)": 2.019223690032959, "Pretrain/Step": 6100, "Pretrain/Step Time": 8.526313433423638} +{"Pretrain/Learning Rate": 1.5173705069317706e-05, "Pretrain/Loss": 2.0358829498291016, "Pretrain/Loss (Raw)": 1.776209831237793, "Pretrain/Step": 6101, "Pretrain/Step Time": 8.524511154741049} +{"Pretrain/Learning Rate": 1.5165899059074567e-05, "Pretrain/Loss": 2.0356273651123047, "Pretrain/Loss (Raw)": 1.9900376796722412, "Pretrain/Step": 6102, "Pretrain/Step Time": 8.516077009961009} +{"Pretrain/Learning Rate": 1.5158094182946298e-05, "Pretrain/Loss": 2.0360026359558105, "Pretrain/Loss (Raw)": 1.972586989402771, "Pretrain/Step": 6103, "Pretrain/Step Time": 8.523648412898183} +{"Pretrain/Learning Rate": 1.5150290441832976e-05, "Pretrain/Loss": 2.0369415283203125, "Pretrain/Loss (Raw)": 2.018989324569702, "Pretrain/Step": 6104, "Pretrain/Step Time": 8.536414910107851} +{"Pretrain/Learning Rate": 1.5142487836634587e-05, "Pretrain/Loss": 2.0379538536071777, "Pretrain/Loss (Raw)": 2.152251958847046, "Pretrain/Step": 6105, "Pretrain/Step Time": 8.53860593214631} +{"Pretrain/Learning Rate": 1.5134686368250932e-05, "Pretrain/Loss": 2.0391879081726074, "Pretrain/Loss (Raw)": 2.134209632873535, "Pretrain/Step": 6106, "Pretrain/Step Time": 8.534186469390988} +{"Pretrain/Learning Rate": 1.512688603758175e-05, "Pretrain/Loss": 2.041353940963745, "Pretrain/Loss (Raw)": 2.2246761322021484, "Pretrain/Step": 6107, "Pretrain/Step Time": 8.527020130306482} +{"Pretrain/Learning Rate": 1.5119086845526576e-05, "Pretrain/Loss": 2.041593551635742, "Pretrain/Loss (Raw)": 2.061065912246704, "Pretrain/Step": 6108, "Pretrain/Step Time": 8.529933892190456} +{"Pretrain/Learning Rate": 1.5111288792984884e-05, "Pretrain/Loss": 2.0417160987854004, "Pretrain/Loss (Raw)": 2.1119182109832764, "Pretrain/Step": 6109, "Pretrain/Step Time": 8.52763201110065} +{"Pretrain/Learning Rate": 1.5103491880855953e-05, "Pretrain/Loss": 2.0425009727478027, "Pretrain/Loss (Raw)": 2.2986903190612793, "Pretrain/Step": 6110, "Pretrain/Step Time": 8.535383872687817} +{"Pretrain/Learning Rate": 1.5095696110038981e-05, "Pretrain/Loss": 2.0428194999694824, "Pretrain/Loss (Raw)": 2.1868231296539307, "Pretrain/Step": 6111, "Pretrain/Step Time": 8.536682868376374} +{"Pretrain/Learning Rate": 1.5087901481432993e-05, "Pretrain/Loss": 2.044468879699707, "Pretrain/Loss (Raw)": 2.237574577331543, "Pretrain/Step": 6112, "Pretrain/Step Time": 8.529837526381016} +{"Pretrain/Learning Rate": 1.5080107995936929e-05, "Pretrain/Loss": 2.0448951721191406, "Pretrain/Loss (Raw)": 1.9296307563781738, "Pretrain/Step": 6113, "Pretrain/Step Time": 8.526991648599505} +{"Pretrain/Learning Rate": 1.5072315654449543e-05, "Pretrain/Loss": 2.0430095195770264, "Pretrain/Loss (Raw)": 1.7827962636947632, "Pretrain/Step": 6114, "Pretrain/Step Time": 8.524304997175932} +{"Pretrain/Learning Rate": 1.5064524457869506e-05, "Pretrain/Loss": 2.045029640197754, "Pretrain/Loss (Raw)": 2.1678643226623535, "Pretrain/Step": 6115, "Pretrain/Step Time": 8.52638392150402} +{"Pretrain/Learning Rate": 1.5056734407095316e-05, "Pretrain/Loss": 2.0448532104492188, "Pretrain/Loss (Raw)": 1.9239022731781006, "Pretrain/Step": 6116, "Pretrain/Step Time": 8.52503046952188} +{"Pretrain/Learning Rate": 1.5048945503025375e-05, "Pretrain/Loss": 2.0466408729553223, "Pretrain/Loss (Raw)": 2.2176759243011475, "Pretrain/Step": 6117, "Pretrain/Step Time": 8.52533221617341} +{"Pretrain/Learning Rate": 1.5041157746557924e-05, "Pretrain/Loss": 2.0435807704925537, "Pretrain/Loss (Raw)": 1.7841986417770386, "Pretrain/Step": 6118, "Pretrain/Step Time": 8.522271793335676} +{"Pretrain/Learning Rate": 1.5033371138591095e-05, "Pretrain/Loss": 2.040987253189087, "Pretrain/Loss (Raw)": 2.0650811195373535, "Pretrain/Step": 6119, "Pretrain/Step Time": 8.515777710825205} +{"Pretrain/Learning Rate": 1.5025585680022866e-05, "Pretrain/Loss": 2.0415666103363037, "Pretrain/Loss (Raw)": 1.9979594945907593, "Pretrain/Step": 6120, "Pretrain/Step Time": 8.514697004109621} +{"Pretrain/Learning Rate": 1.50178013717511e-05, "Pretrain/Loss": 2.041564464569092, "Pretrain/Loss (Raw)": 2.012310743331909, "Pretrain/Step": 6121, "Pretrain/Step Time": 8.519137341529131} +{"Pretrain/Learning Rate": 1.5010018214673515e-05, "Pretrain/Loss": 2.0421266555786133, "Pretrain/Loss (Raw)": 2.0915822982788086, "Pretrain/Step": 6122, "Pretrain/Step Time": 8.520465429872274} +{"Pretrain/Learning Rate": 1.5002236209687709e-05, "Pretrain/Loss": 2.0424909591674805, "Pretrain/Loss (Raw)": 1.9354428052902222, "Pretrain/Step": 6123, "Pretrain/Step Time": 8.528427112847567} +{"Pretrain/Learning Rate": 1.4994455357691128e-05, "Pretrain/Loss": 2.0431160926818848, "Pretrain/Loss (Raw)": 2.0863149166107178, "Pretrain/Step": 6124, "Pretrain/Step Time": 8.5225840639323} +{"Pretrain/Learning Rate": 1.4986675659581103e-05, "Pretrain/Loss": 2.0425264835357666, "Pretrain/Loss (Raw)": 2.0212090015411377, "Pretrain/Step": 6125, "Pretrain/Step Time": 8.52183642052114} +{"Pretrain/Learning Rate": 1.4978897116254832e-05, "Pretrain/Loss": 2.0435657501220703, "Pretrain/Loss (Raw)": 2.01324462890625, "Pretrain/Step": 6126, "Pretrain/Step Time": 8.519220454618335} +{"Pretrain/Learning Rate": 1.4971119728609359e-05, "Pretrain/Loss": 2.042452335357666, "Pretrain/Loss (Raw)": 2.0298330783843994, "Pretrain/Step": 6127, "Pretrain/Step Time": 8.511392023414373} +{"Pretrain/Learning Rate": 1.4963343497541621e-05, "Pretrain/Loss": 2.0421342849731445, "Pretrain/Loss (Raw)": 1.9692379236221313, "Pretrain/Step": 6128, "Pretrain/Step Time": 8.518271680921316} +{"Pretrain/Learning Rate": 1.4955568423948402e-05, "Pretrain/Loss": 2.04080867767334, "Pretrain/Loss (Raw)": 1.9615657329559326, "Pretrain/Step": 6129, "Pretrain/Step Time": 8.519969865679741} +{"Pretrain/Learning Rate": 1.494779450872637e-05, "Pretrain/Loss": 2.040133476257324, "Pretrain/Loss (Raw)": 1.9046624898910522, "Pretrain/Step": 6130, "Pretrain/Step Time": 8.514304526150227} +{"Pretrain/Learning Rate": 1.4940021752772034e-05, "Pretrain/Loss": 2.0374414920806885, "Pretrain/Loss (Raw)": 1.9144741296768188, "Pretrain/Step": 6131, "Pretrain/Step Time": 8.510898225009441} +{"Pretrain/Learning Rate": 1.4932250156981803e-05, "Pretrain/Loss": 2.0376200675964355, "Pretrain/Loss (Raw)": 2.0259976387023926, "Pretrain/Step": 6132, "Pretrain/Step Time": 8.509688774123788} +{"Pretrain/Learning Rate": 1.4924479722251916e-05, "Pretrain/Loss": 2.037191390991211, "Pretrain/Loss (Raw)": 1.9455127716064453, "Pretrain/Step": 6133, "Pretrain/Step Time": 8.515566086396575} +{"Pretrain/Learning Rate": 1.4916710449478511e-05, "Pretrain/Loss": 2.035560131072998, "Pretrain/Loss (Raw)": 1.9223459959030151, "Pretrain/Step": 6134, "Pretrain/Step Time": 8.512642912566662} +{"Pretrain/Learning Rate": 1.4908942339557564e-05, "Pretrain/Loss": 2.0322113037109375, "Pretrain/Loss (Raw)": 1.7680761814117432, "Pretrain/Step": 6135, "Pretrain/Step Time": 8.515850879251957} +{"Pretrain/Learning Rate": 1.4901175393384944e-05, "Pretrain/Loss": 2.032015323638916, "Pretrain/Loss (Raw)": 2.256281614303589, "Pretrain/Step": 6136, "Pretrain/Step Time": 8.50927042402327} +{"Pretrain/Learning Rate": 1.4893409611856362e-05, "Pretrain/Loss": 2.0315566062927246, "Pretrain/Loss (Raw)": 2.091822862625122, "Pretrain/Step": 6137, "Pretrain/Step Time": 8.512789025902748} +{"Pretrain/Learning Rate": 1.488564499586741e-05, "Pretrain/Loss": 2.030452251434326, "Pretrain/Loss (Raw)": 1.8479328155517578, "Pretrain/Step": 6138, "Pretrain/Step Time": 8.505392882972956} +{"Pretrain/Learning Rate": 1.4877881546313532e-05, "Pretrain/Loss": 2.0285158157348633, "Pretrain/Loss (Raw)": 1.8507130146026611, "Pretrain/Step": 6139, "Pretrain/Step Time": 8.502689123153687} +{"Pretrain/Learning Rate": 1.4870119264090057e-05, "Pretrain/Loss": 2.027139186859131, "Pretrain/Loss (Raw)": 1.952760100364685, "Pretrain/Step": 6140, "Pretrain/Step Time": 8.505159636959434} +{"Pretrain/Learning Rate": 1.4862358150092157e-05, "Pretrain/Loss": 2.026069402694702, "Pretrain/Loss (Raw)": 1.8216452598571777, "Pretrain/Step": 6141, "Pretrain/Step Time": 8.511425729840994} +{"Pretrain/Learning Rate": 1.485459820521489e-05, "Pretrain/Loss": 2.026484966278076, "Pretrain/Loss (Raw)": 2.0316126346588135, "Pretrain/Step": 6142, "Pretrain/Step Time": 8.508275782689452} +{"Pretrain/Learning Rate": 1.484683943035316e-05, "Pretrain/Loss": 2.0300557613372803, "Pretrain/Loss (Raw)": 2.4154090881347656, "Pretrain/Step": 6143, "Pretrain/Step Time": 8.495917562395334} +{"Pretrain/Learning Rate": 1.4839081826401755e-05, "Pretrain/Loss": 2.030630588531494, "Pretrain/Loss (Raw)": 1.9894214868545532, "Pretrain/Step": 6144, "Pretrain/Step Time": 8.496576651930809} +{"Pretrain/Learning Rate": 1.4831325394255307e-05, "Pretrain/Loss": 2.0277061462402344, "Pretrain/Loss (Raw)": 1.8511070013046265, "Pretrain/Step": 6145, "Pretrain/Step Time": 8.50459730066359} +{"Pretrain/Learning Rate": 1.4823570134808342e-05, "Pretrain/Loss": 2.0276012420654297, "Pretrain/Loss (Raw)": 1.9122282266616821, "Pretrain/Step": 6146, "Pretrain/Step Time": 8.504919480532408} +{"Pretrain/Learning Rate": 1.4815816048955208e-05, "Pretrain/Loss": 2.0261335372924805, "Pretrain/Loss (Raw)": 1.9669932126998901, "Pretrain/Step": 6147, "Pretrain/Step Time": 8.506071975454688} +{"Pretrain/Learning Rate": 1.4808063137590172e-05, "Pretrain/Loss": 2.0246028900146484, "Pretrain/Loss (Raw)": 1.90975821018219, "Pretrain/Step": 6148, "Pretrain/Step Time": 8.502883471548557} +{"Pretrain/Learning Rate": 1.4800311401607304e-05, "Pretrain/Loss": 2.023228168487549, "Pretrain/Loss (Raw)": 2.0354208946228027, "Pretrain/Step": 6149, "Pretrain/Step Time": 8.502899054437876} +{"Pretrain/Learning Rate": 1.4792560841900604e-05, "Pretrain/Loss": 2.021710157394409, "Pretrain/Loss (Raw)": 1.825785756111145, "Pretrain/Step": 6150, "Pretrain/Step Time": 8.498775891959667} +{"Pretrain/Learning Rate": 1.4784811459363873e-05, "Pretrain/Loss": 2.0218677520751953, "Pretrain/Loss (Raw)": 2.0791585445404053, "Pretrain/Step": 6151, "Pretrain/Step Time": 8.509717443957925} +{"Pretrain/Learning Rate": 1.4777063254890833e-05, "Pretrain/Loss": 2.023362159729004, "Pretrain/Loss (Raw)": 1.9120659828186035, "Pretrain/Step": 6152, "Pretrain/Step Time": 8.510837322100997} +{"Pretrain/Learning Rate": 1.4769316229375012e-05, "Pretrain/Loss": 2.020380735397339, "Pretrain/Loss (Raw)": 1.865797758102417, "Pretrain/Step": 6153, "Pretrain/Step Time": 8.51116337440908} +{"Pretrain/Learning Rate": 1.4761570383709871e-05, "Pretrain/Loss": 2.0245587825775146, "Pretrain/Loss (Raw)": 2.2505834102630615, "Pretrain/Step": 6154, "Pretrain/Step Time": 8.504025004804134} +{"Pretrain/Learning Rate": 1.4753825718788667e-05, "Pretrain/Loss": 2.025381565093994, "Pretrain/Loss (Raw)": 2.0064897537231445, "Pretrain/Step": 6155, "Pretrain/Step Time": 8.50599611364305} +{"Pretrain/Learning Rate": 1.4746082235504572e-05, "Pretrain/Loss": 2.023951530456543, "Pretrain/Loss (Raw)": 1.7887647151947021, "Pretrain/Step": 6156, "Pretrain/Step Time": 8.50869987346232} +{"Pretrain/Learning Rate": 1.4738339934750584e-05, "Pretrain/Loss": 2.0252556800842285, "Pretrain/Loss (Raw)": 2.0654900074005127, "Pretrain/Step": 6157, "Pretrain/Step Time": 8.50989119708538} +{"Pretrain/Learning Rate": 1.4730598817419593e-05, "Pretrain/Loss": 2.024911880493164, "Pretrain/Loss (Raw)": 2.166834592819214, "Pretrain/Step": 6158, "Pretrain/Step Time": 8.511208673939109} +{"Pretrain/Learning Rate": 1.4722858884404333e-05, "Pretrain/Loss": 2.028146743774414, "Pretrain/Loss (Raw)": 2.328598976135254, "Pretrain/Step": 6159, "Pretrain/Step Time": 8.510754376649857} +{"Pretrain/Learning Rate": 1.4715120136597421e-05, "Pretrain/Loss": 2.0310556888580322, "Pretrain/Loss (Raw)": 2.1828713417053223, "Pretrain/Step": 6160, "Pretrain/Step Time": 8.50725650973618} +{"Pretrain/Learning Rate": 1.4707382574891312e-05, "Pretrain/Loss": 2.032705783843994, "Pretrain/Loss (Raw)": 2.0810787677764893, "Pretrain/Step": 6161, "Pretrain/Step Time": 8.505073726177216} +{"Pretrain/Learning Rate": 1.4699646200178353e-05, "Pretrain/Loss": 2.0327837467193604, "Pretrain/Loss (Raw)": 1.9752455949783325, "Pretrain/Step": 6162, "Pretrain/Step Time": 8.502331981435418} +{"Pretrain/Learning Rate": 1.469191101335072e-05, "Pretrain/Loss": 2.032649278640747, "Pretrain/Loss (Raw)": 2.0997095108032227, "Pretrain/Step": 6163, "Pretrain/Step Time": 8.504188874736428} +{"Pretrain/Learning Rate": 1.4684177015300491e-05, "Pretrain/Loss": 2.0331900119781494, "Pretrain/Loss (Raw)": 2.1371986865997314, "Pretrain/Step": 6164, "Pretrain/Step Time": 8.511643957346678} +{"Pretrain/Learning Rate": 1.467644420691957e-05, "Pretrain/Loss": 2.0312931537628174, "Pretrain/Loss (Raw)": 1.7901955842971802, "Pretrain/Step": 6165, "Pretrain/Step Time": 8.514831127598882} +{"Pretrain/Learning Rate": 1.4668712589099753e-05, "Pretrain/Loss": 2.030332326889038, "Pretrain/Loss (Raw)": 1.978561520576477, "Pretrain/Step": 6166, "Pretrain/Step Time": 8.516661388799548} +{"Pretrain/Learning Rate": 1.466098216273269e-05, "Pretrain/Loss": 2.0269148349761963, "Pretrain/Loss (Raw)": 2.001901865005493, "Pretrain/Step": 6167, "Pretrain/Step Time": 8.514924943447113} +{"Pretrain/Learning Rate": 1.465325292870987e-05, "Pretrain/Loss": 2.0264434814453125, "Pretrain/Loss (Raw)": 1.9539132118225098, "Pretrain/Step": 6168, "Pretrain/Step Time": 8.516128048300743} +{"Pretrain/Learning Rate": 1.464552488792269e-05, "Pretrain/Loss": 2.026773452758789, "Pretrain/Loss (Raw)": 2.1510884761810303, "Pretrain/Step": 6169, "Pretrain/Step Time": 8.515332650393248} +{"Pretrain/Learning Rate": 1.4637798041262363e-05, "Pretrain/Loss": 2.027651786804199, "Pretrain/Loss (Raw)": 2.227020025253296, "Pretrain/Step": 6170, "Pretrain/Step Time": 8.535974895581603} +{"Pretrain/Learning Rate": 1.4630072389620003e-05, "Pretrain/Loss": 2.0268874168395996, "Pretrain/Loss (Raw)": 2.162165641784668, "Pretrain/Step": 6171, "Pretrain/Step Time": 8.530178545042872} +{"Pretrain/Learning Rate": 1.462234793388655e-05, "Pretrain/Loss": 2.027226448059082, "Pretrain/Loss (Raw)": 1.8768390417099, "Pretrain/Step": 6172, "Pretrain/Step Time": 8.528082523494959} +{"Pretrain/Learning Rate": 1.4614624674952842e-05, "Pretrain/Loss": 2.028193473815918, "Pretrain/Loss (Raw)": 2.1141722202301025, "Pretrain/Step": 6173, "Pretrain/Step Time": 8.525863585993648} +{"Pretrain/Learning Rate": 1.460690261370955e-05, "Pretrain/Loss": 2.0277514457702637, "Pretrain/Loss (Raw)": 1.94339919090271, "Pretrain/Step": 6174, "Pretrain/Step Time": 8.520619744434953} +{"Pretrain/Learning Rate": 1.4599181751047225e-05, "Pretrain/Loss": 2.0276682376861572, "Pretrain/Loss (Raw)": 2.15645170211792, "Pretrain/Step": 6175, "Pretrain/Step Time": 8.526390748098493} +{"Pretrain/Learning Rate": 1.4591462087856262e-05, "Pretrain/Loss": 2.024289131164551, "Pretrain/Loss (Raw)": 1.9100714921951294, "Pretrain/Step": 6176, "Pretrain/Step Time": 8.531311891973019} +{"Pretrain/Learning Rate": 1.4583743625026958e-05, "Pretrain/Loss": 2.0244805812835693, "Pretrain/Loss (Raw)": 2.059101104736328, "Pretrain/Step": 6177, "Pretrain/Step Time": 8.534997144713998} +{"Pretrain/Learning Rate": 1.4576026363449402e-05, "Pretrain/Loss": 2.024031639099121, "Pretrain/Loss (Raw)": 1.9387511014938354, "Pretrain/Step": 6178, "Pretrain/Step Time": 8.522270355373621} +{"Pretrain/Learning Rate": 1.4568310304013613e-05, "Pretrain/Loss": 2.0252256393432617, "Pretrain/Loss (Raw)": 2.02582049369812, "Pretrain/Step": 6179, "Pretrain/Step Time": 8.520050225779414} +{"Pretrain/Learning Rate": 1.4560595447609427e-05, "Pretrain/Loss": 2.0265748500823975, "Pretrain/Loss (Raw)": 1.9506818056106567, "Pretrain/Step": 6180, "Pretrain/Step Time": 8.52151564322412} +{"Pretrain/Learning Rate": 1.4552881795126588e-05, "Pretrain/Loss": 2.0213782787323, "Pretrain/Loss (Raw)": 1.8829543590545654, "Pretrain/Step": 6181, "Pretrain/Step Time": 8.52472005225718} +{"Pretrain/Learning Rate": 1.4545169347454627e-05, "Pretrain/Loss": 2.02063250541687, "Pretrain/Loss (Raw)": 1.875295639038086, "Pretrain/Step": 6182, "Pretrain/Step Time": 8.527231000363827} +{"Pretrain/Learning Rate": 1.453745810548301e-05, "Pretrain/Loss": 2.019791603088379, "Pretrain/Loss (Raw)": 1.9319231510162354, "Pretrain/Step": 6183, "Pretrain/Step Time": 8.531083807349205} +{"Pretrain/Learning Rate": 1.452974807010103e-05, "Pretrain/Loss": 2.0191924571990967, "Pretrain/Loss (Raw)": 2.0333526134490967, "Pretrain/Step": 6184, "Pretrain/Step Time": 8.520322820171714} +{"Pretrain/Learning Rate": 1.4522039242197835e-05, "Pretrain/Loss": 2.0164220333099365, "Pretrain/Loss (Raw)": 1.7229715585708618, "Pretrain/Step": 6185, "Pretrain/Step Time": 8.519365744665265} +{"Pretrain/Learning Rate": 1.4514331622662441e-05, "Pretrain/Loss": 2.016421318054199, "Pretrain/Loss (Raw)": 2.002512216567993, "Pretrain/Step": 6186, "Pretrain/Step Time": 8.518699757754803} +{"Pretrain/Learning Rate": 1.4506625212383743e-05, "Pretrain/Loss": 2.0162253379821777, "Pretrain/Loss (Raw)": 1.921362280845642, "Pretrain/Step": 6187, "Pretrain/Step Time": 8.52706828340888} +{"Pretrain/Learning Rate": 1.4498920012250472e-05, "Pretrain/Loss": 2.015259265899658, "Pretrain/Loss (Raw)": 1.8749226331710815, "Pretrain/Step": 6188, "Pretrain/Step Time": 8.530756978318095} +{"Pretrain/Learning Rate": 1.449121602315123e-05, "Pretrain/Loss": 2.0147640705108643, "Pretrain/Loss (Raw)": 2.103423833847046, "Pretrain/Step": 6189, "Pretrain/Step Time": 8.531247956678271} +{"Pretrain/Learning Rate": 1.4483513245974461e-05, "Pretrain/Loss": 2.013052463531494, "Pretrain/Loss (Raw)": 1.8380488157272339, "Pretrain/Step": 6190, "Pretrain/Step Time": 8.525511799380183} +{"Pretrain/Learning Rate": 1.4475811681608515e-05, "Pretrain/Loss": 2.0110838413238525, "Pretrain/Loss (Raw)": 1.9645508527755737, "Pretrain/Step": 6191, "Pretrain/Step Time": 8.518064558506012} +{"Pretrain/Learning Rate": 1.4468111330941556e-05, "Pretrain/Loss": 2.0125112533569336, "Pretrain/Loss (Raw)": 1.9814802408218384, "Pretrain/Step": 6192, "Pretrain/Step Time": 8.515056615695357} +{"Pretrain/Learning Rate": 1.4460412194861624e-05, "Pretrain/Loss": 2.014907121658325, "Pretrain/Loss (Raw)": 2.0954577922821045, "Pretrain/Step": 6193, "Pretrain/Step Time": 8.522325424477458} +{"Pretrain/Learning Rate": 1.4452714274256612e-05, "Pretrain/Loss": 2.014566421508789, "Pretrain/Loss (Raw)": 1.9582781791687012, "Pretrain/Step": 6194, "Pretrain/Step Time": 8.528201658278704} +{"Pretrain/Learning Rate": 1.4445017570014303e-05, "Pretrain/Loss": 2.0146372318267822, "Pretrain/Loss (Raw)": 1.9764291048049927, "Pretrain/Step": 6195, "Pretrain/Step Time": 8.519614577293396} +{"Pretrain/Learning Rate": 1.4437322083022304e-05, "Pretrain/Loss": 2.0160670280456543, "Pretrain/Loss (Raw)": 2.0150671005249023, "Pretrain/Step": 6196, "Pretrain/Step Time": 8.514925476163626} +{"Pretrain/Learning Rate": 1.4429627814168095e-05, "Pretrain/Loss": 2.015984058380127, "Pretrain/Loss (Raw)": 2.100795269012451, "Pretrain/Step": 6197, "Pretrain/Step Time": 8.510245732963085} +{"Pretrain/Learning Rate": 1.4421934764339004e-05, "Pretrain/Loss": 2.01702880859375, "Pretrain/Loss (Raw)": 1.9296743869781494, "Pretrain/Step": 6198, "Pretrain/Step Time": 8.517207795754075} +{"Pretrain/Learning Rate": 1.4414242934422251e-05, "Pretrain/Loss": 2.0151515007019043, "Pretrain/Loss (Raw)": 1.6886467933654785, "Pretrain/Step": 6199, "Pretrain/Step Time": 8.528680393472314} +{"Pretrain/Learning Rate": 1.440655232530489e-05, "Pretrain/Loss": 2.0136051177978516, "Pretrain/Loss (Raw)": 2.143733024597168, "Pretrain/Step": 6200, "Pretrain/Step Time": 8.529988070949912} +{"Pretrain/Learning Rate": 1.4398862937873825e-05, "Pretrain/Loss": 2.0144965648651123, "Pretrain/Loss (Raw)": 2.102619171142578, "Pretrain/Step": 6201, "Pretrain/Step Time": 8.530028279870749} +{"Pretrain/Learning Rate": 1.4391174773015836e-05, "Pretrain/Loss": 2.014002799987793, "Pretrain/Loss (Raw)": 1.9115879535675049, "Pretrain/Step": 6202, "Pretrain/Step Time": 8.520341435447335} +{"Pretrain/Learning Rate": 1.4383487831617571e-05, "Pretrain/Loss": 2.0130233764648438, "Pretrain/Loss (Raw)": 1.8831266164779663, "Pretrain/Step": 6203, "Pretrain/Step Time": 8.5156239438802} +{"Pretrain/Learning Rate": 1.4375802114565515e-05, "Pretrain/Loss": 2.0146398544311523, "Pretrain/Loss (Raw)": 2.0482070446014404, "Pretrain/Step": 6204, "Pretrain/Step Time": 8.51747364550829} +{"Pretrain/Learning Rate": 1.4368117622746025e-05, "Pretrain/Loss": 2.015552520751953, "Pretrain/Loss (Raw)": 2.1200361251831055, "Pretrain/Step": 6205, "Pretrain/Step Time": 8.52804123237729} +{"Pretrain/Learning Rate": 1.4360434357045294e-05, "Pretrain/Loss": 2.0145788192749023, "Pretrain/Loss (Raw)": 2.0078141689300537, "Pretrain/Step": 6206, "Pretrain/Step Time": 8.532415553927422} +{"Pretrain/Learning Rate": 1.4352752318349421e-05, "Pretrain/Loss": 2.0134074687957764, "Pretrain/Loss (Raw)": 2.077362060546875, "Pretrain/Step": 6207, "Pretrain/Step Time": 8.533069098368287} +{"Pretrain/Learning Rate": 1.4345071507544326e-05, "Pretrain/Loss": 2.0130341053009033, "Pretrain/Loss (Raw)": 2.0156188011169434, "Pretrain/Step": 6208, "Pretrain/Step Time": 8.525319688022137} +{"Pretrain/Learning Rate": 1.4337391925515777e-05, "Pretrain/Loss": 2.0136537551879883, "Pretrain/Loss (Raw)": 2.173394203186035, "Pretrain/Step": 6209, "Pretrain/Step Time": 8.522498402744532} +{"Pretrain/Learning Rate": 1.432971357314945e-05, "Pretrain/Loss": 2.0129895210266113, "Pretrain/Loss (Raw)": 1.9383071660995483, "Pretrain/Step": 6210, "Pretrain/Step Time": 8.523976078256965} +{"Pretrain/Learning Rate": 1.4322036451330828e-05, "Pretrain/Loss": 2.014122486114502, "Pretrain/Loss (Raw)": 2.0393848419189453, "Pretrain/Step": 6211, "Pretrain/Step Time": 8.532129116356373} +{"Pretrain/Learning Rate": 1.4314360560945284e-05, "Pretrain/Loss": 2.014855146408081, "Pretrain/Loss (Raw)": 2.1399693489074707, "Pretrain/Step": 6212, "Pretrain/Step Time": 8.531361620873213} +{"Pretrain/Learning Rate": 1.430668590287802e-05, "Pretrain/Loss": 2.0156006813049316, "Pretrain/Loss (Raw)": 2.1101016998291016, "Pretrain/Step": 6213, "Pretrain/Step Time": 8.534116426482797} +{"Pretrain/Learning Rate": 1.4299012478014146e-05, "Pretrain/Loss": 2.0117287635803223, "Pretrain/Loss (Raw)": 1.7392632961273193, "Pretrain/Step": 6214, "Pretrain/Step Time": 8.529181661084294} +{"Pretrain/Learning Rate": 1.4291340287238558e-05, "Pretrain/Loss": 2.0122249126434326, "Pretrain/Loss (Raw)": 2.1531448364257812, "Pretrain/Step": 6215, "Pretrain/Step Time": 8.528972061350942} +{"Pretrain/Learning Rate": 1.4283669331436078e-05, "Pretrain/Loss": 2.0150399208068848, "Pretrain/Loss (Raw)": 2.4309418201446533, "Pretrain/Step": 6216, "Pretrain/Step Time": 8.526783883571625} +{"Pretrain/Learning Rate": 1.4275999611491342e-05, "Pretrain/Loss": 2.0159945487976074, "Pretrain/Loss (Raw)": 1.9446332454681396, "Pretrain/Step": 6217, "Pretrain/Step Time": 8.518955422565341} +{"Pretrain/Learning Rate": 1.4268331128288881e-05, "Pretrain/Loss": 2.015503406524658, "Pretrain/Loss (Raw)": 2.1513187885284424, "Pretrain/Step": 6218, "Pretrain/Step Time": 8.526310237124562} +{"Pretrain/Learning Rate": 1.4260663882713022e-05, "Pretrain/Loss": 2.0150296688079834, "Pretrain/Loss (Raw)": 1.888441801071167, "Pretrain/Step": 6219, "Pretrain/Step Time": 8.53055958263576} +{"Pretrain/Learning Rate": 1.4252997875648021e-05, "Pretrain/Loss": 2.0164780616760254, "Pretrain/Loss (Raw)": 2.234611988067627, "Pretrain/Step": 6220, "Pretrain/Step Time": 8.524869641289115} +{"Pretrain/Learning Rate": 1.4245333107977937e-05, "Pretrain/Loss": 2.0172340869903564, "Pretrain/Loss (Raw)": 2.1012494564056396, "Pretrain/Step": 6221, "Pretrain/Step Time": 8.518016526475549} +{"Pretrain/Learning Rate": 1.4237669580586736e-05, "Pretrain/Loss": 2.0168583393096924, "Pretrain/Loss (Raw)": 2.0253689289093018, "Pretrain/Step": 6222, "Pretrain/Step Time": 8.517047684639692} +{"Pretrain/Learning Rate": 1.4230007294358173e-05, "Pretrain/Loss": 2.014334201812744, "Pretrain/Loss (Raw)": 1.6674383878707886, "Pretrain/Step": 6223, "Pretrain/Step Time": 8.518203949555755} +{"Pretrain/Learning Rate": 1.4222346250175928e-05, "Pretrain/Loss": 2.0158767700195312, "Pretrain/Loss (Raw)": 2.3519175052642822, "Pretrain/Step": 6224, "Pretrain/Step Time": 8.518013099208474} +{"Pretrain/Learning Rate": 1.4214686448923498e-05, "Pretrain/Loss": 2.0184273719787598, "Pretrain/Loss (Raw)": 2.1340277194976807, "Pretrain/Step": 6225, "Pretrain/Step Time": 8.516711451113224} +{"Pretrain/Learning Rate": 1.420702789148425e-05, "Pretrain/Loss": 2.016714572906494, "Pretrain/Loss (Raw)": 2.008927583694458, "Pretrain/Step": 6226, "Pretrain/Step Time": 8.513241417706013} +{"Pretrain/Learning Rate": 1.4199370578741395e-05, "Pretrain/Loss": 2.013542890548706, "Pretrain/Loss (Raw)": 1.6997078657150269, "Pretrain/Step": 6227, "Pretrain/Step Time": 8.511785753071308} +{"Pretrain/Learning Rate": 1.419171451157803e-05, "Pretrain/Loss": 2.014463424682617, "Pretrain/Loss (Raw)": 2.137045383453369, "Pretrain/Step": 6228, "Pretrain/Step Time": 8.516840625554323} +{"Pretrain/Learning Rate": 1.4184059690877075e-05, "Pretrain/Loss": 2.015153408050537, "Pretrain/Loss (Raw)": 1.8645349740982056, "Pretrain/Step": 6229, "Pretrain/Step Time": 8.51440760307014} +{"Pretrain/Learning Rate": 1.4176406117521324e-05, "Pretrain/Loss": 2.0167078971862793, "Pretrain/Loss (Raw)": 2.1889986991882324, "Pretrain/Step": 6230, "Pretrain/Step Time": 8.520675545558333} +{"Pretrain/Learning Rate": 1.4168753792393414e-05, "Pretrain/Loss": 2.0172882080078125, "Pretrain/Loss (Raw)": 2.046860456466675, "Pretrain/Step": 6231, "Pretrain/Step Time": 8.51179764047265} +{"Pretrain/Learning Rate": 1.4161102716375863e-05, "Pretrain/Loss": 2.017803430557251, "Pretrain/Loss (Raw)": 2.084961414337158, "Pretrain/Step": 6232, "Pretrain/Step Time": 8.502635853365064} +{"Pretrain/Learning Rate": 1.4153452890351022e-05, "Pretrain/Loss": 2.0162887573242188, "Pretrain/Loss (Raw)": 1.9583611488342285, "Pretrain/Step": 6233, "Pretrain/Step Time": 8.50634303316474} +{"Pretrain/Learning Rate": 1.41458043152011e-05, "Pretrain/Loss": 2.0155086517333984, "Pretrain/Loss (Raw)": 2.034334182739258, "Pretrain/Step": 6234, "Pretrain/Step Time": 8.511806409806013} +{"Pretrain/Learning Rate": 1.4138156991808165e-05, "Pretrain/Loss": 2.012207269668579, "Pretrain/Loss (Raw)": 1.8021336793899536, "Pretrain/Step": 6235, "Pretrain/Step Time": 8.511363483965397} +{"Pretrain/Learning Rate": 1.4130510921054157e-05, "Pretrain/Loss": 2.013331890106201, "Pretrain/Loss (Raw)": 2.205010175704956, "Pretrain/Step": 6236, "Pretrain/Step Time": 8.512777915224433} +{"Pretrain/Learning Rate": 1.4122866103820854e-05, "Pretrain/Loss": 2.0132789611816406, "Pretrain/Loss (Raw)": 2.105142593383789, "Pretrain/Step": 6237, "Pretrain/Step Time": 8.508400030434132} +{"Pretrain/Learning Rate": 1.411522254098988e-05, "Pretrain/Loss": 2.0129523277282715, "Pretrain/Loss (Raw)": 2.256855010986328, "Pretrain/Step": 6238, "Pretrain/Step Time": 8.504528041929007} +{"Pretrain/Learning Rate": 1.4107580233442725e-05, "Pretrain/Loss": 2.010071277618408, "Pretrain/Loss (Raw)": 1.818092703819275, "Pretrain/Step": 6239, "Pretrain/Step Time": 8.50421011634171} +{"Pretrain/Learning Rate": 1.4099939182060755e-05, "Pretrain/Loss": 2.007561206817627, "Pretrain/Loss (Raw)": 1.916266679763794, "Pretrain/Step": 6240, "Pretrain/Step Time": 8.505839744582772} +{"Pretrain/Learning Rate": 1.409229938772516e-05, "Pretrain/Loss": 2.009138584136963, "Pretrain/Loss (Raw)": 2.131528377532959, "Pretrain/Step": 6241, "Pretrain/Step Time": 8.505563763901591} +{"Pretrain/Learning Rate": 1.4084660851316999e-05, "Pretrain/Loss": 2.012307643890381, "Pretrain/Loss (Raw)": 2.188448190689087, "Pretrain/Step": 6242, "Pretrain/Step Time": 8.509690245613456} +{"Pretrain/Learning Rate": 1.4077023573717174e-05, "Pretrain/Loss": 2.011895179748535, "Pretrain/Loss (Raw)": 2.1150596141815186, "Pretrain/Step": 6243, "Pretrain/Step Time": 8.506744148209691} +{"Pretrain/Learning Rate": 1.4069387555806473e-05, "Pretrain/Loss": 2.0123186111450195, "Pretrain/Loss (Raw)": 1.97809898853302, "Pretrain/Step": 6244, "Pretrain/Step Time": 8.5135599039495} +{"Pretrain/Learning Rate": 1.4061752798465503e-05, "Pretrain/Loss": 2.011911630630493, "Pretrain/Loss (Raw)": 2.1655900478363037, "Pretrain/Step": 6245, "Pretrain/Step Time": 8.511623498052359} +{"Pretrain/Learning Rate": 1.4054119302574741e-05, "Pretrain/Loss": 2.012491226196289, "Pretrain/Loss (Raw)": 1.8583672046661377, "Pretrain/Step": 6246, "Pretrain/Step Time": 8.512010898441076} +{"Pretrain/Learning Rate": 1.4046487069014513e-05, "Pretrain/Loss": 2.0133113861083984, "Pretrain/Loss (Raw)": 2.1700754165649414, "Pretrain/Step": 6247, "Pretrain/Step Time": 8.51320031285286} +{"Pretrain/Learning Rate": 1.403885609866502e-05, "Pretrain/Loss": 2.014244556427002, "Pretrain/Loss (Raw)": 2.1173996925354004, "Pretrain/Step": 6248, "Pretrain/Step Time": 8.519529148936272} +{"Pretrain/Learning Rate": 1.4031226392406293e-05, "Pretrain/Loss": 2.014270782470703, "Pretrain/Loss (Raw)": 2.0156962871551514, "Pretrain/Step": 6249, "Pretrain/Step Time": 8.51561849936843} +{"Pretrain/Learning Rate": 1.4023597951118217e-05, "Pretrain/Loss": 2.0144472122192383, "Pretrain/Loss (Raw)": 2.1141390800476074, "Pretrain/Step": 6250, "Pretrain/Step Time": 8.516645105555654} +{"Pretrain/Learning Rate": 1.4015970775680554e-05, "Pretrain/Loss": 2.0152111053466797, "Pretrain/Loss (Raw)": 2.0332188606262207, "Pretrain/Step": 6251, "Pretrain/Step Time": 8.511176466941833} +{"Pretrain/Learning Rate": 1.4008344866972902e-05, "Pretrain/Loss": 2.0145230293273926, "Pretrain/Loss (Raw)": 1.998260498046875, "Pretrain/Step": 6252, "Pretrain/Step Time": 8.517822280526161} +{"Pretrain/Learning Rate": 1.4000720225874714e-05, "Pretrain/Loss": 2.0138301849365234, "Pretrain/Loss (Raw)": 1.9325363636016846, "Pretrain/Step": 6253, "Pretrain/Step Time": 8.523666331544518} +{"Pretrain/Learning Rate": 1.399309685326529e-05, "Pretrain/Loss": 2.0124478340148926, "Pretrain/Loss (Raw)": 1.8362879753112793, "Pretrain/Step": 6254, "Pretrain/Step Time": 8.52530581690371} +{"Pretrain/Learning Rate": 1.3985474750023821e-05, "Pretrain/Loss": 2.0127997398376465, "Pretrain/Loss (Raw)": 2.0748677253723145, "Pretrain/Step": 6255, "Pretrain/Step Time": 8.524291416630149} +{"Pretrain/Learning Rate": 1.3977853917029287e-05, "Pretrain/Loss": 2.0129966735839844, "Pretrain/Loss (Raw)": 1.9944368600845337, "Pretrain/Step": 6256, "Pretrain/Step Time": 8.520350236445665} +{"Pretrain/Learning Rate": 1.3970234355160588e-05, "Pretrain/Loss": 2.0131568908691406, "Pretrain/Loss (Raw)": 1.982076644897461, "Pretrain/Step": 6257, "Pretrain/Step Time": 8.52168619632721} +{"Pretrain/Learning Rate": 1.3962616065296428e-05, "Pretrain/Loss": 2.0131068229675293, "Pretrain/Loss (Raw)": 1.898284673690796, "Pretrain/Step": 6258, "Pretrain/Step Time": 8.518542697653174} +{"Pretrain/Learning Rate": 1.395499904831541e-05, "Pretrain/Loss": 2.012167453765869, "Pretrain/Loss (Raw)": 1.7942252159118652, "Pretrain/Step": 6259, "Pretrain/Step Time": 8.523789653554559} +{"Pretrain/Learning Rate": 1.394738330509593e-05, "Pretrain/Loss": 2.0119736194610596, "Pretrain/Loss (Raw)": 2.001173257827759, "Pretrain/Step": 6260, "Pretrain/Step Time": 8.523620394989848} +{"Pretrain/Learning Rate": 1.3939768836516299e-05, "Pretrain/Loss": 2.011826992034912, "Pretrain/Loss (Raw)": 1.9267621040344238, "Pretrain/Step": 6261, "Pretrain/Step Time": 8.515198558568954} +{"Pretrain/Learning Rate": 1.393215564345463e-05, "Pretrain/Loss": 2.013716220855713, "Pretrain/Loss (Raw)": 2.1641647815704346, "Pretrain/Step": 6262, "Pretrain/Step Time": 8.517489269375801} +{"Pretrain/Learning Rate": 1.3924543726788953e-05, "Pretrain/Loss": 2.0156993865966797, "Pretrain/Loss (Raw)": 2.0219204425811768, "Pretrain/Step": 6263, "Pretrain/Step Time": 8.517730696126819} +{"Pretrain/Learning Rate": 1.3916933087397055e-05, "Pretrain/Loss": 2.0133588314056396, "Pretrain/Loss (Raw)": 1.9566733837127686, "Pretrain/Step": 6264, "Pretrain/Step Time": 8.521695142611861} +{"Pretrain/Learning Rate": 1.3909323726156672e-05, "Pretrain/Loss": 2.0157389640808105, "Pretrain/Loss (Raw)": 2.39650821685791, "Pretrain/Step": 6265, "Pretrain/Step Time": 8.51933759264648} +{"Pretrain/Learning Rate": 1.3901715643945337e-05, "Pretrain/Loss": 2.0176730155944824, "Pretrain/Loss (Raw)": 2.095449447631836, "Pretrain/Step": 6266, "Pretrain/Step Time": 8.520767569541931} +{"Pretrain/Learning Rate": 1.3894108841640452e-05, "Pretrain/Loss": 2.0197370052337646, "Pretrain/Loss (Raw)": 2.1149158477783203, "Pretrain/Step": 6267, "Pretrain/Step Time": 8.521675873547792} +{"Pretrain/Learning Rate": 1.3886503320119256e-05, "Pretrain/Loss": 2.0208137035369873, "Pretrain/Loss (Raw)": 2.0905792713165283, "Pretrain/Step": 6268, "Pretrain/Step Time": 8.517486974596977} +{"Pretrain/Learning Rate": 1.3878899080258878e-05, "Pretrain/Loss": 2.0215981006622314, "Pretrain/Loss (Raw)": 1.9220387935638428, "Pretrain/Step": 6269, "Pretrain/Step Time": 8.513393057510257} +{"Pretrain/Learning Rate": 1.3871296122936261e-05, "Pretrain/Loss": 2.0189619064331055, "Pretrain/Loss (Raw)": 1.6941808462142944, "Pretrain/Step": 6270, "Pretrain/Step Time": 8.51719357073307} +{"Pretrain/Learning Rate": 1.3863694449028214e-05, "Pretrain/Loss": 2.0163815021514893, "Pretrain/Loss (Raw)": 2.0851235389709473, "Pretrain/Step": 6271, "Pretrain/Step Time": 8.526626804843545} +{"Pretrain/Learning Rate": 1.3856094059411392e-05, "Pretrain/Loss": 2.0161337852478027, "Pretrain/Loss (Raw)": 1.9577274322509766, "Pretrain/Step": 6272, "Pretrain/Step Time": 8.527329254895449} +{"Pretrain/Learning Rate": 1.3848494954962324e-05, "Pretrain/Loss": 2.01788592338562, "Pretrain/Loss (Raw)": 2.075373649597168, "Pretrain/Step": 6273, "Pretrain/Step Time": 8.523831801488996} +{"Pretrain/Learning Rate": 1.3840897136557366e-05, "Pretrain/Loss": 2.0199317932128906, "Pretrain/Loss (Raw)": 2.174069404602051, "Pretrain/Step": 6274, "Pretrain/Step Time": 8.523206869140267} +{"Pretrain/Learning Rate": 1.383330060507273e-05, "Pretrain/Loss": 2.0203604698181152, "Pretrain/Loss (Raw)": 2.021904945373535, "Pretrain/Step": 6275, "Pretrain/Step Time": 8.519430195912719} +{"Pretrain/Learning Rate": 1.382570536138448e-05, "Pretrain/Loss": 2.021512985229492, "Pretrain/Loss (Raw)": 2.0572733879089355, "Pretrain/Step": 6276, "Pretrain/Step Time": 8.524018267169595} +{"Pretrain/Learning Rate": 1.3818111406368555e-05, "Pretrain/Loss": 2.0210487842559814, "Pretrain/Loss (Raw)": 1.9760113954544067, "Pretrain/Step": 6277, "Pretrain/Step Time": 8.533168688416481} +{"Pretrain/Learning Rate": 1.381051874090071e-05, "Pretrain/Loss": 2.0198073387145996, "Pretrain/Loss (Raw)": 1.6668745279312134, "Pretrain/Step": 6278, "Pretrain/Step Time": 8.533616699278355} +{"Pretrain/Learning Rate": 1.3802927365856571e-05, "Pretrain/Loss": 2.016596794128418, "Pretrain/Loss (Raw)": 1.6682064533233643, "Pretrain/Step": 6279, "Pretrain/Step Time": 8.522182378917933} +{"Pretrain/Learning Rate": 1.3795337282111604e-05, "Pretrain/Loss": 2.0190229415893555, "Pretrain/Loss (Raw)": 2.2225897312164307, "Pretrain/Step": 6280, "Pretrain/Step Time": 8.52076918259263} +{"Pretrain/Learning Rate": 1.3787748490541144e-05, "Pretrain/Loss": 2.020094871520996, "Pretrain/Loss (Raw)": 2.0030455589294434, "Pretrain/Step": 6281, "Pretrain/Step Time": 8.516664629802108} +{"Pretrain/Learning Rate": 1.3780160992020364e-05, "Pretrain/Loss": 2.0184736251831055, "Pretrain/Loss (Raw)": 2.0430362224578857, "Pretrain/Step": 6282, "Pretrain/Step Time": 8.525799795985222} +{"Pretrain/Learning Rate": 1.3772574787424291e-05, "Pretrain/Loss": 2.018017530441284, "Pretrain/Loss (Raw)": 1.9481287002563477, "Pretrain/Step": 6283, "Pretrain/Step Time": 8.532995529472828} +{"Pretrain/Learning Rate": 1.3764989877627785e-05, "Pretrain/Loss": 2.0215368270874023, "Pretrain/Loss (Raw)": 2.239222288131714, "Pretrain/Step": 6284, "Pretrain/Step Time": 8.527819026261568} +{"Pretrain/Learning Rate": 1.3757406263505602e-05, "Pretrain/Loss": 2.024541139602661, "Pretrain/Loss (Raw)": 2.4500324726104736, "Pretrain/Step": 6285, "Pretrain/Step Time": 8.519990086555481} +{"Pretrain/Learning Rate": 1.37498239459323e-05, "Pretrain/Loss": 2.0243356227874756, "Pretrain/Loss (Raw)": 2.140533447265625, "Pretrain/Step": 6286, "Pretrain/Step Time": 8.521173976361752} +{"Pretrain/Learning Rate": 1.3742242925782317e-05, "Pretrain/Loss": 2.0209929943084717, "Pretrain/Loss (Raw)": 1.9007468223571777, "Pretrain/Step": 6287, "Pretrain/Step Time": 8.520973931998014} +{"Pretrain/Learning Rate": 1.3734663203929916e-05, "Pretrain/Loss": 2.0200729370117188, "Pretrain/Loss (Raw)": 2.0651068687438965, "Pretrain/Step": 6288, "Pretrain/Step Time": 8.52403661981225} +{"Pretrain/Learning Rate": 1.372708478124925e-05, "Pretrain/Loss": 2.0192582607269287, "Pretrain/Loss (Raw)": 1.9767975807189941, "Pretrain/Step": 6289, "Pretrain/Step Time": 8.52675729058683} +{"Pretrain/Learning Rate": 1.3719507658614284e-05, "Pretrain/Loss": 2.018129587173462, "Pretrain/Loss (Raw)": 1.8307502269744873, "Pretrain/Step": 6290, "Pretrain/Step Time": 8.531638717278838} +{"Pretrain/Learning Rate": 1.3711931836898842e-05, "Pretrain/Loss": 2.0170130729675293, "Pretrain/Loss (Raw)": 1.9568216800689697, "Pretrain/Step": 6291, "Pretrain/Step Time": 8.526072600856423} +{"Pretrain/Learning Rate": 1.3704357316976623e-05, "Pretrain/Loss": 2.0157172679901123, "Pretrain/Loss (Raw)": 1.971337080001831, "Pretrain/Step": 6292, "Pretrain/Step Time": 8.527035161852837} +{"Pretrain/Learning Rate": 1.3696784099721143e-05, "Pretrain/Loss": 2.0159456729888916, "Pretrain/Loss (Raw)": 1.8194479942321777, "Pretrain/Step": 6293, "Pretrain/Step Time": 8.520228244364262} +{"Pretrain/Learning Rate": 1.3689212186005784e-05, "Pretrain/Loss": 2.0165905952453613, "Pretrain/Loss (Raw)": 2.061084032058716, "Pretrain/Step": 6294, "Pretrain/Step Time": 8.520586976781487} +{"Pretrain/Learning Rate": 1.3681641576703763e-05, "Pretrain/Loss": 2.014366626739502, "Pretrain/Loss (Raw)": 1.7172343730926514, "Pretrain/Step": 6295, "Pretrain/Step Time": 8.522569326683879} +{"Pretrain/Learning Rate": 1.3674072272688182e-05, "Pretrain/Loss": 2.01450777053833, "Pretrain/Loss (Raw)": 1.9719780683517456, "Pretrain/Step": 6296, "Pretrain/Step Time": 8.525517532601953} +{"Pretrain/Learning Rate": 1.3666504274831954e-05, "Pretrain/Loss": 2.0142412185668945, "Pretrain/Loss (Raw)": 2.1169722080230713, "Pretrain/Step": 6297, "Pretrain/Step Time": 8.523067228496075} +{"Pretrain/Learning Rate": 1.3658937584007859e-05, "Pretrain/Loss": 2.0129709243774414, "Pretrain/Loss (Raw)": 2.064434289932251, "Pretrain/Step": 6298, "Pretrain/Step Time": 8.504483425989747} +{"Pretrain/Learning Rate": 1.3651372201088508e-05, "Pretrain/Loss": 2.0119006633758545, "Pretrain/Loss (Raw)": 2.025162696838379, "Pretrain/Step": 6299, "Pretrain/Step Time": 8.509951738640666} +{"Pretrain/Learning Rate": 1.3643808126946417e-05, "Pretrain/Loss": 2.0113582611083984, "Pretrain/Loss (Raw)": 1.807428002357483, "Pretrain/Step": 6300, "Pretrain/Step Time": 8.513012520968914} +{"Pretrain/Learning Rate": 1.3636245362453865e-05, "Pretrain/Loss": 2.0089075565338135, "Pretrain/Loss (Raw)": 1.8004776239395142, "Pretrain/Step": 6301, "Pretrain/Step Time": 8.516271967440844} +{"Pretrain/Learning Rate": 1.3628683908483054e-05, "Pretrain/Loss": 2.0103495121002197, "Pretrain/Loss (Raw)": 2.1279711723327637, "Pretrain/Step": 6302, "Pretrain/Step Time": 8.519307166337967} +{"Pretrain/Learning Rate": 1.3621123765905985e-05, "Pretrain/Loss": 2.009460926055908, "Pretrain/Loss (Raw)": 2.0426928997039795, "Pretrain/Step": 6303, "Pretrain/Step Time": 8.516610341146588} +{"Pretrain/Learning Rate": 1.3613564935594565e-05, "Pretrain/Loss": 2.011070966720581, "Pretrain/Loss (Raw)": 2.1161580085754395, "Pretrain/Step": 6304, "Pretrain/Step Time": 8.513343131169677} +{"Pretrain/Learning Rate": 1.3606007418420472e-05, "Pretrain/Loss": 2.0097124576568604, "Pretrain/Loss (Raw)": 1.8852089643478394, "Pretrain/Step": 6305, "Pretrain/Step Time": 8.518782442435622} +{"Pretrain/Learning Rate": 1.3598451215255303e-05, "Pretrain/Loss": 2.0051674842834473, "Pretrain/Loss (Raw)": 1.3570033311843872, "Pretrain/Step": 6306, "Pretrain/Step Time": 8.5250048879534} +{"Pretrain/Learning Rate": 1.3590896326970465e-05, "Pretrain/Loss": 2.0050854682922363, "Pretrain/Loss (Raw)": 2.0153326988220215, "Pretrain/Step": 6307, "Pretrain/Step Time": 8.527652844786644} +{"Pretrain/Learning Rate": 1.3583342754437226e-05, "Pretrain/Loss": 2.0050923824310303, "Pretrain/Loss (Raw)": 1.9515587091445923, "Pretrain/Step": 6308, "Pretrain/Step Time": 8.525992028415203} +{"Pretrain/Learning Rate": 1.3575790498526687e-05, "Pretrain/Loss": 2.0064876079559326, "Pretrain/Loss (Raw)": 2.0615527629852295, "Pretrain/Step": 6309, "Pretrain/Step Time": 8.52358990162611} +{"Pretrain/Learning Rate": 1.356823956010983e-05, "Pretrain/Loss": 2.0073771476745605, "Pretrain/Loss (Raw)": 1.9891403913497925, "Pretrain/Step": 6310, "Pretrain/Step Time": 8.52107461169362} +{"Pretrain/Learning Rate": 1.3560689940057453e-05, "Pretrain/Loss": 2.0071492195129395, "Pretrain/Loss (Raw)": 1.902748465538025, "Pretrain/Step": 6311, "Pretrain/Step Time": 8.525758191943169} +{"Pretrain/Learning Rate": 1.3553141639240218e-05, "Pretrain/Loss": 2.005194664001465, "Pretrain/Loss (Raw)": 1.7831778526306152, "Pretrain/Step": 6312, "Pretrain/Step Time": 8.529210956767201} +{"Pretrain/Learning Rate": 1.354559465852862e-05, "Pretrain/Loss": 2.0066874027252197, "Pretrain/Loss (Raw)": 1.9140524864196777, "Pretrain/Step": 6313, "Pretrain/Step Time": 8.529900366440415} +{"Pretrain/Learning Rate": 1.353804899879303e-05, "Pretrain/Loss": 2.0068578720092773, "Pretrain/Loss (Raw)": 2.0243418216705322, "Pretrain/Step": 6314, "Pretrain/Step Time": 8.532514799386263} +{"Pretrain/Learning Rate": 1.3530504660903637e-05, "Pretrain/Loss": 2.007394552230835, "Pretrain/Loss (Raw)": 1.9900286197662354, "Pretrain/Step": 6315, "Pretrain/Step Time": 8.52519147284329} +{"Pretrain/Learning Rate": 1.3522961645730498e-05, "Pretrain/Loss": 2.0068116188049316, "Pretrain/Loss (Raw)": 1.8003363609313965, "Pretrain/Step": 6316, "Pretrain/Step Time": 8.518253911286592} +{"Pretrain/Learning Rate": 1.3515419954143489e-05, "Pretrain/Loss": 2.0064406394958496, "Pretrain/Loss (Raw)": 2.05593204498291, "Pretrain/Step": 6317, "Pretrain/Step Time": 8.522174751386046} +{"Pretrain/Learning Rate": 1.3507879587012378e-05, "Pretrain/Loss": 2.005424976348877, "Pretrain/Loss (Raw)": 1.7080273628234863, "Pretrain/Step": 6318, "Pretrain/Step Time": 8.530141353607178} +{"Pretrain/Learning Rate": 1.3500340545206747e-05, "Pretrain/Loss": 2.0059072971343994, "Pretrain/Loss (Raw)": 2.0262808799743652, "Pretrain/Step": 6319, "Pretrain/Step Time": 8.52854554541409} +{"Pretrain/Learning Rate": 1.3492802829596035e-05, "Pretrain/Loss": 2.006070613861084, "Pretrain/Loss (Raw)": 2.002394437789917, "Pretrain/Step": 6320, "Pretrain/Step Time": 8.529859403148293} +{"Pretrain/Learning Rate": 1.348526644104951e-05, "Pretrain/Loss": 2.005495548248291, "Pretrain/Loss (Raw)": 2.021832227706909, "Pretrain/Step": 6321, "Pretrain/Step Time": 8.523383175954223} +{"Pretrain/Learning Rate": 1.3477731380436332e-05, "Pretrain/Loss": 2.006648540496826, "Pretrain/Loss (Raw)": 2.10588002204895, "Pretrain/Step": 6322, "Pretrain/Step Time": 8.520216619595885} +{"Pretrain/Learning Rate": 1.3470197648625463e-05, "Pretrain/Loss": 2.0068156719207764, "Pretrain/Loss (Raw)": 1.9978166818618774, "Pretrain/Step": 6323, "Pretrain/Step Time": 8.520144963636994} +{"Pretrain/Learning Rate": 1.3462665246485734e-05, "Pretrain/Loss": 2.007286310195923, "Pretrain/Loss (Raw)": 2.0753090381622314, "Pretrain/Step": 6324, "Pretrain/Step Time": 8.526119465008378} +{"Pretrain/Learning Rate": 1.3455134174885802e-05, "Pretrain/Loss": 2.006202220916748, "Pretrain/Loss (Raw)": 1.9620327949523926, "Pretrain/Step": 6325, "Pretrain/Step Time": 8.526421500369906} +{"Pretrain/Learning Rate": 1.3447604434694207e-05, "Pretrain/Loss": 2.007307529449463, "Pretrain/Loss (Raw)": 2.0711567401885986, "Pretrain/Step": 6326, "Pretrain/Step Time": 8.525584191083908} +{"Pretrain/Learning Rate": 1.3440076026779309e-05, "Pretrain/Loss": 2.0102694034576416, "Pretrain/Loss (Raw)": 2.0677719116210938, "Pretrain/Step": 6327, "Pretrain/Step Time": 8.514120755717158} +{"Pretrain/Learning Rate": 1.3432548952009313e-05, "Pretrain/Loss": 2.008199453353882, "Pretrain/Loss (Raw)": 1.878785252571106, "Pretrain/Step": 6328, "Pretrain/Step Time": 8.511257221922278} +{"Pretrain/Learning Rate": 1.3425023211252272e-05, "Pretrain/Loss": 2.0073866844177246, "Pretrain/Loss (Raw)": 1.9985637664794922, "Pretrain/Step": 6329, "Pretrain/Step Time": 8.512978535145521} +{"Pretrain/Learning Rate": 1.3417498805376105e-05, "Pretrain/Loss": 2.008759021759033, "Pretrain/Loss (Raw)": 2.087252140045166, "Pretrain/Step": 6330, "Pretrain/Step Time": 8.522186517715454} +{"Pretrain/Learning Rate": 1.3409975735248556e-05, "Pretrain/Loss": 2.009610652923584, "Pretrain/Loss (Raw)": 1.9921441078186035, "Pretrain/Step": 6331, "Pretrain/Step Time": 8.527141936123371} +{"Pretrain/Learning Rate": 1.3402454001737209e-05, "Pretrain/Loss": 2.008749008178711, "Pretrain/Loss (Raw)": 1.937897801399231, "Pretrain/Step": 6332, "Pretrain/Step Time": 8.52200067974627} +{"Pretrain/Learning Rate": 1.3394933605709525e-05, "Pretrain/Loss": 2.00870680809021, "Pretrain/Loss (Raw)": 2.1146457195281982, "Pretrain/Step": 6333, "Pretrain/Step Time": 8.51332082785666} +{"Pretrain/Learning Rate": 1.3387414548032783e-05, "Pretrain/Loss": 2.0089542865753174, "Pretrain/Loss (Raw)": 2.039482593536377, "Pretrain/Step": 6334, "Pretrain/Step Time": 8.507374849170446} +{"Pretrain/Learning Rate": 1.3379896829574115e-05, "Pretrain/Loss": 2.009660005569458, "Pretrain/Loss (Raw)": 2.167710304260254, "Pretrain/Step": 6335, "Pretrain/Step Time": 8.514159571379423} +{"Pretrain/Learning Rate": 1.337238045120049e-05, "Pretrain/Loss": 2.0084309577941895, "Pretrain/Loss (Raw)": 1.858315110206604, "Pretrain/Step": 6336, "Pretrain/Step Time": 8.516121432185173} +{"Pretrain/Learning Rate": 1.3364865413778755e-05, "Pretrain/Loss": 2.006953716278076, "Pretrain/Loss (Raw)": 1.98427414894104, "Pretrain/Step": 6337, "Pretrain/Step Time": 8.519200507551432} +{"Pretrain/Learning Rate": 1.3357351718175564e-05, "Pretrain/Loss": 2.006131649017334, "Pretrain/Loss (Raw)": 1.833089828491211, "Pretrain/Step": 6338, "Pretrain/Step Time": 8.519772654399276} +{"Pretrain/Learning Rate": 1.3349839365257438e-05, "Pretrain/Loss": 2.006045341491699, "Pretrain/Loss (Raw)": 2.028355121612549, "Pretrain/Step": 6339, "Pretrain/Step Time": 8.512512920424342} +{"Pretrain/Learning Rate": 1.3342328355890721e-05, "Pretrain/Loss": 2.0048763751983643, "Pretrain/Loss (Raw)": 1.9903473854064941, "Pretrain/Step": 6340, "Pretrain/Step Time": 8.511003708466887} +{"Pretrain/Learning Rate": 1.3334818690941652e-05, "Pretrain/Loss": 2.005155563354492, "Pretrain/Loss (Raw)": 2.1458396911621094, "Pretrain/Step": 6341, "Pretrain/Step Time": 8.506576159968972} +{"Pretrain/Learning Rate": 1.332731037127624e-05, "Pretrain/Loss": 2.0110116004943848, "Pretrain/Loss (Raw)": 2.4888222217559814, "Pretrain/Step": 6342, "Pretrain/Step Time": 8.513868473470211} +{"Pretrain/Learning Rate": 1.3319803397760408e-05, "Pretrain/Loss": 2.007903575897217, "Pretrain/Loss (Raw)": 1.7553157806396484, "Pretrain/Step": 6343, "Pretrain/Step Time": 8.513836914673448} +{"Pretrain/Learning Rate": 1.331229777125988e-05, "Pretrain/Loss": 2.005387544631958, "Pretrain/Loss (Raw)": 2.1088953018188477, "Pretrain/Step": 6344, "Pretrain/Step Time": 8.506072878837585} +{"Pretrain/Learning Rate": 1.3304793492640263e-05, "Pretrain/Loss": 2.00563645362854, "Pretrain/Loss (Raw)": 1.9764790534973145, "Pretrain/Step": 6345, "Pretrain/Step Time": 8.508527824655175} +{"Pretrain/Learning Rate": 1.329729056276695e-05, "Pretrain/Loss": 2.0052623748779297, "Pretrain/Loss (Raw)": 2.10343599319458, "Pretrain/Step": 6346, "Pretrain/Step Time": 8.50157331675291} +{"Pretrain/Learning Rate": 1.328978898250525e-05, "Pretrain/Loss": 2.004810333251953, "Pretrain/Loss (Raw)": 1.8306043148040771, "Pretrain/Step": 6347, "Pretrain/Step Time": 8.499865610152483} +{"Pretrain/Learning Rate": 1.3282288752720262e-05, "Pretrain/Loss": 2.0013182163238525, "Pretrain/Loss (Raw)": 1.7876118421554565, "Pretrain/Step": 6348, "Pretrain/Step Time": 8.512560710310936} +{"Pretrain/Learning Rate": 1.3274789874276949e-05, "Pretrain/Loss": 2.0036678314208984, "Pretrain/Loss (Raw)": 2.4019904136657715, "Pretrain/Step": 6349, "Pretrain/Step Time": 8.514440821483731} +{"Pretrain/Learning Rate": 1.3267292348040111e-05, "Pretrain/Loss": 2.0046396255493164, "Pretrain/Loss (Raw)": 2.1497414112091064, "Pretrain/Step": 6350, "Pretrain/Step Time": 8.51154308207333} +{"Pretrain/Learning Rate": 1.3259796174874411e-05, "Pretrain/Loss": 2.006680965423584, "Pretrain/Loss (Raw)": 1.9287840127944946, "Pretrain/Step": 6351, "Pretrain/Step Time": 8.509717620909214} +{"Pretrain/Learning Rate": 1.3252301355644341e-05, "Pretrain/Loss": 2.004399538040161, "Pretrain/Loss (Raw)": 2.0598673820495605, "Pretrain/Step": 6352, "Pretrain/Step Time": 8.508301572874188} +{"Pretrain/Learning Rate": 1.324480789121424e-05, "Pretrain/Loss": 2.00335693359375, "Pretrain/Loss (Raw)": 2.00057053565979, "Pretrain/Step": 6353, "Pretrain/Step Time": 8.506190095096827} +{"Pretrain/Learning Rate": 1.323731578244827e-05, "Pretrain/Loss": 2.002565860748291, "Pretrain/Loss (Raw)": 1.9076552391052246, "Pretrain/Step": 6354, "Pretrain/Step Time": 8.512310303747654} +{"Pretrain/Learning Rate": 1.3229825030210482e-05, "Pretrain/Loss": 2.0051584243774414, "Pretrain/Loss (Raw)": 2.031585931777954, "Pretrain/Step": 6355, "Pretrain/Step Time": 8.516891073435545} +{"Pretrain/Learning Rate": 1.3222335635364736e-05, "Pretrain/Loss": 2.0032732486724854, "Pretrain/Loss (Raw)": 1.8957425355911255, "Pretrain/Step": 6356, "Pretrain/Step Time": 8.50889297388494} +{"Pretrain/Learning Rate": 1.3214847598774744e-05, "Pretrain/Loss": 2.005232334136963, "Pretrain/Loss (Raw)": 2.1152846813201904, "Pretrain/Step": 6357, "Pretrain/Step Time": 8.50551476702094} +{"Pretrain/Learning Rate": 1.3207360921304046e-05, "Pretrain/Loss": 2.002507448196411, "Pretrain/Loss (Raw)": 1.8402092456817627, "Pretrain/Step": 6358, "Pretrain/Step Time": 8.504436837509274} +{"Pretrain/Learning Rate": 1.319987560381607e-05, "Pretrain/Loss": 2.0040335655212402, "Pretrain/Loss (Raw)": 2.2422280311584473, "Pretrain/Step": 6359, "Pretrain/Step Time": 8.51166744157672} +{"Pretrain/Learning Rate": 1.319239164717404e-05, "Pretrain/Loss": 2.005654811859131, "Pretrain/Loss (Raw)": 2.292475938796997, "Pretrain/Step": 6360, "Pretrain/Step Time": 8.512030461803079} +{"Pretrain/Learning Rate": 1.3184909052241046e-05, "Pretrain/Loss": 2.005136251449585, "Pretrain/Loss (Raw)": 1.8919752836227417, "Pretrain/Step": 6361, "Pretrain/Step Time": 8.512519853189588} +{"Pretrain/Learning Rate": 1.3177427819880002e-05, "Pretrain/Loss": 2.005512237548828, "Pretrain/Loss (Raw)": 2.0824692249298096, "Pretrain/Step": 6362, "Pretrain/Step Time": 8.509983818978071} +{"Pretrain/Learning Rate": 1.3169947950953704e-05, "Pretrain/Loss": 2.0077123641967773, "Pretrain/Loss (Raw)": 2.0837531089782715, "Pretrain/Step": 6363, "Pretrain/Step Time": 8.509175019338727} +{"Pretrain/Learning Rate": 1.3162469446324755e-05, "Pretrain/Loss": 2.007486343383789, "Pretrain/Loss (Raw)": 2.1760804653167725, "Pretrain/Step": 6364, "Pretrain/Step Time": 8.498285850510001} +{"Pretrain/Learning Rate": 1.3154992306855607e-05, "Pretrain/Loss": 2.006589412689209, "Pretrain/Loss (Raw)": 1.9903182983398438, "Pretrain/Step": 6365, "Pretrain/Step Time": 8.508322812616825} +{"Pretrain/Learning Rate": 1.3147516533408552e-05, "Pretrain/Loss": 2.0035834312438965, "Pretrain/Loss (Raw)": 1.8720966577529907, "Pretrain/Step": 6366, "Pretrain/Step Time": 8.516233375295997} +{"Pretrain/Learning Rate": 1.3140042126845753e-05, "Pretrain/Loss": 2.0048656463623047, "Pretrain/Loss (Raw)": 1.9821964502334595, "Pretrain/Step": 6367, "Pretrain/Step Time": 8.51897763647139} +{"Pretrain/Learning Rate": 1.3132569088029179e-05, "Pretrain/Loss": 2.0053062438964844, "Pretrain/Loss (Raw)": 1.9726979732513428, "Pretrain/Step": 6368, "Pretrain/Step Time": 8.520177515223622} +{"Pretrain/Learning Rate": 1.312509741782066e-05, "Pretrain/Loss": 2.004958391189575, "Pretrain/Loss (Raw)": 2.086980104446411, "Pretrain/Step": 6369, "Pretrain/Step Time": 8.518572567030787} +{"Pretrain/Learning Rate": 1.3117627117081854e-05, "Pretrain/Loss": 2.002338409423828, "Pretrain/Loss (Raw)": 1.8530611991882324, "Pretrain/Step": 6370, "Pretrain/Step Time": 8.511183379217982} +{"Pretrain/Learning Rate": 1.3110158186674293e-05, "Pretrain/Loss": 2.0024983882904053, "Pretrain/Loss (Raw)": 2.135561227798462, "Pretrain/Step": 6371, "Pretrain/Step Time": 8.51427267678082} +{"Pretrain/Learning Rate": 1.3102690627459314e-05, "Pretrain/Loss": 2.0022735595703125, "Pretrain/Loss (Raw)": 1.9493247270584106, "Pretrain/Step": 6372, "Pretrain/Step Time": 8.515177853405476} +{"Pretrain/Learning Rate": 1.30952244402981e-05, "Pretrain/Loss": 2.0014500617980957, "Pretrain/Loss (Raw)": 2.0601842403411865, "Pretrain/Step": 6373, "Pretrain/Step Time": 8.516873694956303} +{"Pretrain/Learning Rate": 1.3087759626051716e-05, "Pretrain/Loss": 2.0014727115631104, "Pretrain/Loss (Raw)": 1.8612691164016724, "Pretrain/Step": 6374, "Pretrain/Step Time": 8.513741631060839} +{"Pretrain/Learning Rate": 1.308029618558102e-05, "Pretrain/Loss": 1.9991503953933716, "Pretrain/Loss (Raw)": 1.8728092908859253, "Pretrain/Step": 6375, "Pretrain/Step Time": 8.511754965409636} +{"Pretrain/Learning Rate": 1.3072834119746741e-05, "Pretrain/Loss": 2.0003464221954346, "Pretrain/Loss (Raw)": 2.270512342453003, "Pretrain/Step": 6376, "Pretrain/Step Time": 8.505143670365214} +{"Pretrain/Learning Rate": 1.3065373429409419e-05, "Pretrain/Loss": 1.9989509582519531, "Pretrain/Loss (Raw)": 1.837071180343628, "Pretrain/Step": 6377, "Pretrain/Step Time": 8.513237675651908} +{"Pretrain/Learning Rate": 1.3057914115429482e-05, "Pretrain/Loss": 1.9960041046142578, "Pretrain/Loss (Raw)": 1.7369261980056763, "Pretrain/Step": 6378, "Pretrain/Step Time": 8.517576318234205} +{"Pretrain/Learning Rate": 1.3050456178667165e-05, "Pretrain/Loss": 1.9962782859802246, "Pretrain/Loss (Raw)": 2.068312406539917, "Pretrain/Step": 6379, "Pretrain/Step Time": 8.518649915233254} +{"Pretrain/Learning Rate": 1.3042999619982546e-05, "Pretrain/Loss": 1.9960980415344238, "Pretrain/Loss (Raw)": 1.9751986265182495, "Pretrain/Step": 6380, "Pretrain/Step Time": 8.514012180268764} +{"Pretrain/Learning Rate": 1.3035544440235548e-05, "Pretrain/Loss": 1.9974048137664795, "Pretrain/Loss (Raw)": 2.099783420562744, "Pretrain/Step": 6381, "Pretrain/Step Time": 8.508610144257545} +{"Pretrain/Learning Rate": 1.3028090640285958e-05, "Pretrain/Loss": 1.998085618019104, "Pretrain/Loss (Raw)": 1.923449158668518, "Pretrain/Step": 6382, "Pretrain/Step Time": 8.506535584107041} +{"Pretrain/Learning Rate": 1.3020638220993353e-05, "Pretrain/Loss": 1.9966115951538086, "Pretrain/Loss (Raw)": 1.8861768245697021, "Pretrain/Step": 6383, "Pretrain/Step Time": 8.510184338316321} +{"Pretrain/Learning Rate": 1.3013187183217206e-05, "Pretrain/Loss": 1.9981365203857422, "Pretrain/Loss (Raw)": 2.189657688140869, "Pretrain/Step": 6384, "Pretrain/Step Time": 8.513348562642932} +{"Pretrain/Learning Rate": 1.3005737527816786e-05, "Pretrain/Loss": 1.9999653100967407, "Pretrain/Loss (Raw)": 2.216139078140259, "Pretrain/Step": 6385, "Pretrain/Step Time": 8.518756868317723} +{"Pretrain/Learning Rate": 1.2998289255651253e-05, "Pretrain/Loss": 1.9994839429855347, "Pretrain/Loss (Raw)": 1.8366833925247192, "Pretrain/Step": 6386, "Pretrain/Step Time": 8.522790618240833} +{"Pretrain/Learning Rate": 1.2990842367579539e-05, "Pretrain/Loss": 2.0017380714416504, "Pretrain/Loss (Raw)": 2.0827560424804688, "Pretrain/Step": 6387, "Pretrain/Step Time": 8.515120578929782} +{"Pretrain/Learning Rate": 1.2983396864460482e-05, "Pretrain/Loss": 2.001929759979248, "Pretrain/Loss (Raw)": 2.0257174968719482, "Pretrain/Step": 6388, "Pretrain/Step Time": 8.515160333365202} +{"Pretrain/Learning Rate": 1.2975952747152709e-05, "Pretrain/Loss": 2.0032238960266113, "Pretrain/Loss (Raw)": 2.092388868331909, "Pretrain/Step": 6389, "Pretrain/Step Time": 8.517214460298419} +{"Pretrain/Learning Rate": 1.2968510016514749e-05, "Pretrain/Loss": 1.9995731115341187, "Pretrain/Loss (Raw)": 1.6968741416931152, "Pretrain/Step": 6390, "Pretrain/Step Time": 8.526887545362115} +{"Pretrain/Learning Rate": 1.2961068673404886e-05, "Pretrain/Loss": 2.000150203704834, "Pretrain/Loss (Raw)": 2.0957741737365723, "Pretrain/Step": 6391, "Pretrain/Step Time": 8.526275740936399} +{"Pretrain/Learning Rate": 1.295362871868132e-05, "Pretrain/Loss": 1.9995698928833008, "Pretrain/Loss (Raw)": 1.882413387298584, "Pretrain/Step": 6392, "Pretrain/Step Time": 8.523770427331328} +{"Pretrain/Learning Rate": 1.2946190153202059e-05, "Pretrain/Loss": 1.9970059394836426, "Pretrain/Loss (Raw)": 2.0683069229125977, "Pretrain/Step": 6393, "Pretrain/Step Time": 8.520745020359755} +{"Pretrain/Learning Rate": 1.2938752977824947e-05, "Pretrain/Loss": 1.9954208135604858, "Pretrain/Loss (Raw)": 1.8925589323043823, "Pretrain/Step": 6394, "Pretrain/Step Time": 8.517793314531446} +{"Pretrain/Learning Rate": 1.2931317193407665e-05, "Pretrain/Loss": 1.9936985969543457, "Pretrain/Loss (Raw)": 1.8944514989852905, "Pretrain/Step": 6395, "Pretrain/Step Time": 8.520838517695665} +{"Pretrain/Learning Rate": 1.2923882800807768e-05, "Pretrain/Loss": 1.9944908618927002, "Pretrain/Loss (Raw)": 2.192018747329712, "Pretrain/Step": 6396, "Pretrain/Step Time": 8.522973209619522} +{"Pretrain/Learning Rate": 1.2916449800882607e-05, "Pretrain/Loss": 1.9940801858901978, "Pretrain/Loss (Raw)": 1.8694578409194946, "Pretrain/Step": 6397, "Pretrain/Step Time": 8.527389356866479} +{"Pretrain/Learning Rate": 1.2909018194489397e-05, "Pretrain/Loss": 1.995612621307373, "Pretrain/Loss (Raw)": 1.8903504610061646, "Pretrain/Step": 6398, "Pretrain/Step Time": 8.523933919146657} +{"Pretrain/Learning Rate": 1.2901587982485172e-05, "Pretrain/Loss": 1.9946210384368896, "Pretrain/Loss (Raw)": 1.9581842422485352, "Pretrain/Step": 6399, "Pretrain/Step Time": 8.510577416047454} +{"Pretrain/Learning Rate": 1.289415916572684e-05, "Pretrain/Loss": 1.994334101676941, "Pretrain/Loss (Raw)": 1.9210113286972046, "Pretrain/Step": 6400, "Pretrain/Step Time": 8.508622355759144} +{"Pretrain/Learning Rate": 1.2886731745071117e-05, "Pretrain/Loss": 1.9928823709487915, "Pretrain/Loss (Raw)": 1.8895368576049805, "Pretrain/Step": 6401, "Pretrain/Step Time": 8.51380280777812} +{"Pretrain/Learning Rate": 1.287930572137457e-05, "Pretrain/Loss": 1.990978717803955, "Pretrain/Loss (Raw)": 1.9304108619689941, "Pretrain/Step": 6402, "Pretrain/Step Time": 8.513659598305821} +{"Pretrain/Learning Rate": 1.2871881095493592e-05, "Pretrain/Loss": 1.9903815984725952, "Pretrain/Loss (Raw)": 1.9454677104949951, "Pretrain/Step": 6403, "Pretrain/Step Time": 8.519976731389761} +{"Pretrain/Learning Rate": 1.2864457868284446e-05, "Pretrain/Loss": 1.9903286695480347, "Pretrain/Loss (Raw)": 2.050508499145508, "Pretrain/Step": 6404, "Pretrain/Step Time": 8.518372662365437} +{"Pretrain/Learning Rate": 1.2857036040603205e-05, "Pretrain/Loss": 1.992540717124939, "Pretrain/Loss (Raw)": 2.2591419219970703, "Pretrain/Step": 6405, "Pretrain/Step Time": 8.501150278374553} +{"Pretrain/Learning Rate": 1.2849615613305782e-05, "Pretrain/Loss": 1.997565507888794, "Pretrain/Loss (Raw)": 2.3100554943084717, "Pretrain/Step": 6406, "Pretrain/Step Time": 8.504626121371984} +{"Pretrain/Learning Rate": 1.2842196587247935e-05, "Pretrain/Loss": 1.9989280700683594, "Pretrain/Loss (Raw)": 1.8426111936569214, "Pretrain/Step": 6407, "Pretrain/Step Time": 8.51616781577468} +{"Pretrain/Learning Rate": 1.2834778963285276e-05, "Pretrain/Loss": 1.999040961265564, "Pretrain/Loss (Raw)": 2.2370517253875732, "Pretrain/Step": 6408, "Pretrain/Step Time": 8.516391891986132} +{"Pretrain/Learning Rate": 1.282736274227323e-05, "Pretrain/Loss": 1.9980922937393188, "Pretrain/Loss (Raw)": 1.8815879821777344, "Pretrain/Step": 6409, "Pretrain/Step Time": 8.524262480437756} +{"Pretrain/Learning Rate": 1.2819947925067071e-05, "Pretrain/Loss": 1.9980725049972534, "Pretrain/Loss (Raw)": 2.0405237674713135, "Pretrain/Step": 6410, "Pretrain/Step Time": 8.517432540655136} +{"Pretrain/Learning Rate": 1.2812534512521906e-05, "Pretrain/Loss": 1.9984797239303589, "Pretrain/Loss (Raw)": 2.0002431869506836, "Pretrain/Step": 6411, "Pretrain/Step Time": 8.509047493338585} +{"Pretrain/Learning Rate": 1.2805122505492697e-05, "Pretrain/Loss": 1.9975098371505737, "Pretrain/Loss (Raw)": 2.1150941848754883, "Pretrain/Step": 6412, "Pretrain/Step Time": 8.504645481705666} +{"Pretrain/Learning Rate": 1.2797711904834226e-05, "Pretrain/Loss": 1.996145486831665, "Pretrain/Loss (Raw)": 2.2753891944885254, "Pretrain/Step": 6413, "Pretrain/Step Time": 8.51530566625297} +{"Pretrain/Learning Rate": 1.279030271140111e-05, "Pretrain/Loss": 1.9955735206604004, "Pretrain/Loss (Raw)": 2.067300319671631, "Pretrain/Step": 6414, "Pretrain/Step Time": 8.517297837883234} +{"Pretrain/Learning Rate": 1.2782894926047822e-05, "Pretrain/Loss": 1.996874213218689, "Pretrain/Loss (Raw)": 2.067260503768921, "Pretrain/Step": 6415, "Pretrain/Step Time": 8.520998988300562} +{"Pretrain/Learning Rate": 1.2775488549628667e-05, "Pretrain/Loss": 1.9962189197540283, "Pretrain/Loss (Raw)": 1.981236219406128, "Pretrain/Step": 6416, "Pretrain/Step Time": 8.513977583497763} +{"Pretrain/Learning Rate": 1.2768083582997772e-05, "Pretrain/Loss": 1.9973706007003784, "Pretrain/Loss (Raw)": 2.1241848468780518, "Pretrain/Step": 6417, "Pretrain/Step Time": 8.510299779474735} +{"Pretrain/Learning Rate": 1.2760680027009109e-05, "Pretrain/Loss": 1.9989945888519287, "Pretrain/Loss (Raw)": 2.0386390686035156, "Pretrain/Step": 6418, "Pretrain/Step Time": 8.510727001354098} +{"Pretrain/Learning Rate": 1.2753277882516507e-05, "Pretrain/Loss": 2.0006942749023438, "Pretrain/Loss (Raw)": 2.1743710041046143, "Pretrain/Step": 6419, "Pretrain/Step Time": 8.52129484899342} +{"Pretrain/Learning Rate": 1.2745877150373612e-05, "Pretrain/Loss": 2.0003859996795654, "Pretrain/Loss (Raw)": 1.9318795204162598, "Pretrain/Step": 6420, "Pretrain/Step Time": 8.511696988716722} +{"Pretrain/Learning Rate": 1.2738477831433904e-05, "Pretrain/Loss": 2.002506971359253, "Pretrain/Loss (Raw)": 2.0909323692321777, "Pretrain/Step": 6421, "Pretrain/Step Time": 8.515881109982729} +{"Pretrain/Learning Rate": 1.2731079926550701e-05, "Pretrain/Loss": 2.001955986022949, "Pretrain/Loss (Raw)": 1.9905498027801514, "Pretrain/Step": 6422, "Pretrain/Step Time": 8.514607310295105} +{"Pretrain/Learning Rate": 1.2723683436577195e-05, "Pretrain/Loss": 2.0041656494140625, "Pretrain/Loss (Raw)": 2.00008487701416, "Pretrain/Step": 6423, "Pretrain/Step Time": 8.509005768224597} +{"Pretrain/Learning Rate": 1.271628836236634e-05, "Pretrain/Loss": 2.004103422164917, "Pretrain/Loss (Raw)": 1.9640196561813354, "Pretrain/Step": 6424, "Pretrain/Step Time": 8.510349310934544} +{"Pretrain/Learning Rate": 1.2708894704771007e-05, "Pretrain/Loss": 2.0043182373046875, "Pretrain/Loss (Raw)": 2.1444225311279297, "Pretrain/Step": 6425, "Pretrain/Step Time": 8.519448064267635} +{"Pretrain/Learning Rate": 1.2701502464643844e-05, "Pretrain/Loss": 2.003490447998047, "Pretrain/Loss (Raw)": 1.9585273265838623, "Pretrain/Step": 6426, "Pretrain/Step Time": 8.525515088811517} +{"Pretrain/Learning Rate": 1.2694111642837386e-05, "Pretrain/Loss": 2.0002808570861816, "Pretrain/Loss (Raw)": 1.6143333911895752, "Pretrain/Step": 6427, "Pretrain/Step Time": 8.520906127989292} +{"Pretrain/Learning Rate": 1.2686722240203946e-05, "Pretrain/Loss": 2.002930164337158, "Pretrain/Loss (Raw)": 2.1465489864349365, "Pretrain/Step": 6428, "Pretrain/Step Time": 8.516197321936488} +{"Pretrain/Learning Rate": 1.2679334257595727e-05, "Pretrain/Loss": 2.0039443969726562, "Pretrain/Loss (Raw)": 1.9302562475204468, "Pretrain/Step": 6429, "Pretrain/Step Time": 8.51472770050168} +{"Pretrain/Learning Rate": 1.2671947695864727e-05, "Pretrain/Loss": 2.0021581649780273, "Pretrain/Loss (Raw)": 1.899349570274353, "Pretrain/Step": 6430, "Pretrain/Step Time": 8.515888810157776} +{"Pretrain/Learning Rate": 1.266456255586283e-05, "Pretrain/Loss": 2.0033063888549805, "Pretrain/Loss (Raw)": 2.189685344696045, "Pretrain/Step": 6431, "Pretrain/Step Time": 8.512597717344761} +{"Pretrain/Learning Rate": 1.2657178838441686e-05, "Pretrain/Loss": 2.003321886062622, "Pretrain/Loss (Raw)": 2.118136405944824, "Pretrain/Step": 6432, "Pretrain/Step Time": 8.512767584994435} +{"Pretrain/Learning Rate": 1.2649796544452852e-05, "Pretrain/Loss": 2.0051040649414062, "Pretrain/Loss (Raw)": 2.1132898330688477, "Pretrain/Step": 6433, "Pretrain/Step Time": 8.507953537628055} +{"Pretrain/Learning Rate": 1.2642415674747673e-05, "Pretrain/Loss": 2.01063871383667, "Pretrain/Loss (Raw)": 2.0654637813568115, "Pretrain/Step": 6434, "Pretrain/Step Time": 8.502105990424752} +{"Pretrain/Learning Rate": 1.263503623017735e-05, "Pretrain/Loss": 2.010699510574341, "Pretrain/Loss (Raw)": 2.02311110496521, "Pretrain/Step": 6435, "Pretrain/Step Time": 8.502232236787677} +{"Pretrain/Learning Rate": 1.2627658211592907e-05, "Pretrain/Loss": 2.011439561843872, "Pretrain/Loss (Raw)": 2.046279191970825, "Pretrain/Step": 6436, "Pretrain/Step Time": 8.507792176678777} +{"Pretrain/Learning Rate": 1.262028161984523e-05, "Pretrain/Loss": 2.0121278762817383, "Pretrain/Loss (Raw)": 2.149675130844116, "Pretrain/Step": 6437, "Pretrain/Step Time": 8.506556630134583} +{"Pretrain/Learning Rate": 1.2612906455785006e-05, "Pretrain/Loss": 2.0116095542907715, "Pretrain/Loss (Raw)": 1.9227951765060425, "Pretrain/Step": 6438, "Pretrain/Step Time": 8.509160367771983} +{"Pretrain/Learning Rate": 1.2605532720262785e-05, "Pretrain/Loss": 2.013089656829834, "Pretrain/Loss (Raw)": 2.092195987701416, "Pretrain/Step": 6439, "Pretrain/Step Time": 8.502363182604313} +{"Pretrain/Learning Rate": 1.2598160414128924e-05, "Pretrain/Loss": 2.0135245323181152, "Pretrain/Loss (Raw)": 1.8388545513153076, "Pretrain/Step": 6440, "Pretrain/Step Time": 8.497151410207152} +{"Pretrain/Learning Rate": 1.2590789538233652e-05, "Pretrain/Loss": 2.0147926807403564, "Pretrain/Loss (Raw)": 2.0763473510742188, "Pretrain/Step": 6441, "Pretrain/Step Time": 8.499663734808564} +{"Pretrain/Learning Rate": 1.2583420093427006e-05, "Pretrain/Loss": 2.0138823986053467, "Pretrain/Loss (Raw)": 1.907840609550476, "Pretrain/Step": 6442, "Pretrain/Step Time": 8.502620283514261} +{"Pretrain/Learning Rate": 1.2576052080558864e-05, "Pretrain/Loss": 2.0132076740264893, "Pretrain/Loss (Raw)": 1.9036606550216675, "Pretrain/Step": 6443, "Pretrain/Step Time": 8.51222530938685} +{"Pretrain/Learning Rate": 1.2568685500478927e-05, "Pretrain/Loss": 2.0171918869018555, "Pretrain/Loss (Raw)": 2.3103015422821045, "Pretrain/Step": 6444, "Pretrain/Step Time": 8.518340921029449} +{"Pretrain/Learning Rate": 1.256132035403677e-05, "Pretrain/Loss": 2.013859987258911, "Pretrain/Loss (Raw)": 1.6294652223587036, "Pretrain/Step": 6445, "Pretrain/Step Time": 8.513008831068873} +{"Pretrain/Learning Rate": 1.255395664208176e-05, "Pretrain/Loss": 2.0150411128997803, "Pretrain/Loss (Raw)": 1.8592089414596558, "Pretrain/Step": 6446, "Pretrain/Step Time": 8.506453910842538} +{"Pretrain/Learning Rate": 1.2546594365463119e-05, "Pretrain/Loss": 2.015058755874634, "Pretrain/Loss (Raw)": 2.0285420417785645, "Pretrain/Step": 6447, "Pretrain/Step Time": 8.507158137857914} +{"Pretrain/Learning Rate": 1.2539233525029886e-05, "Pretrain/Loss": 2.014113426208496, "Pretrain/Loss (Raw)": 1.8813890218734741, "Pretrain/Step": 6448, "Pretrain/Step Time": 8.512153128162026} +{"Pretrain/Learning Rate": 1.2531874121630973e-05, "Pretrain/Loss": 2.016723394393921, "Pretrain/Loss (Raw)": 2.355898380279541, "Pretrain/Step": 6449, "Pretrain/Step Time": 8.513448180630803} +{"Pretrain/Learning Rate": 1.2524516156115088e-05, "Pretrain/Loss": 2.0154576301574707, "Pretrain/Loss (Raw)": 1.9438858032226562, "Pretrain/Step": 6450, "Pretrain/Step Time": 8.519610377028584} +{"Pretrain/Learning Rate": 1.2517159629330783e-05, "Pretrain/Loss": 2.0175862312316895, "Pretrain/Loss (Raw)": 2.2702550888061523, "Pretrain/Step": 6451, "Pretrain/Step Time": 8.517381235957146} +{"Pretrain/Learning Rate": 1.2509804542126444e-05, "Pretrain/Loss": 2.0203356742858887, "Pretrain/Loss (Raw)": 2.4272384643554688, "Pretrain/Step": 6452, "Pretrain/Step Time": 8.51167014427483} +{"Pretrain/Learning Rate": 1.250245089535031e-05, "Pretrain/Loss": 2.0199337005615234, "Pretrain/Loss (Raw)": 1.910610318183899, "Pretrain/Step": 6453, "Pretrain/Step Time": 8.51236566528678} +{"Pretrain/Learning Rate": 1.2495098689850429e-05, "Pretrain/Loss": 2.0181708335876465, "Pretrain/Loss (Raw)": 1.8454976081848145, "Pretrain/Step": 6454, "Pretrain/Step Time": 8.518792854622006} +{"Pretrain/Learning Rate": 1.2487747926474683e-05, "Pretrain/Loss": 2.017993927001953, "Pretrain/Loss (Raw)": 2.045111656188965, "Pretrain/Step": 6455, "Pretrain/Step Time": 8.516325920820236} +{"Pretrain/Learning Rate": 1.2480398606070815e-05, "Pretrain/Loss": 2.0204968452453613, "Pretrain/Loss (Raw)": 2.1991777420043945, "Pretrain/Step": 6456, "Pretrain/Step Time": 8.516599006950855} +{"Pretrain/Learning Rate": 1.2473050729486371e-05, "Pretrain/Loss": 2.021101713180542, "Pretrain/Loss (Raw)": 2.0759756565093994, "Pretrain/Step": 6457, "Pretrain/Step Time": 8.518041366711259} +{"Pretrain/Learning Rate": 1.246570429756875e-05, "Pretrain/Loss": 2.020444393157959, "Pretrain/Loss (Raw)": 2.0031282901763916, "Pretrain/Step": 6458, "Pretrain/Step Time": 8.506012879312038} +{"Pretrain/Learning Rate": 1.245835931116516e-05, "Pretrain/Loss": 2.0207672119140625, "Pretrain/Loss (Raw)": 2.0334763526916504, "Pretrain/Step": 6459, "Pretrain/Step Time": 8.503625199198723} +{"Pretrain/Learning Rate": 1.2451015771122684e-05, "Pretrain/Loss": 2.022449493408203, "Pretrain/Loss (Raw)": 2.1531918048858643, "Pretrain/Step": 6460, "Pretrain/Step Time": 8.511725218966603} +{"Pretrain/Learning Rate": 1.2443673678288204e-05, "Pretrain/Loss": 2.0199029445648193, "Pretrain/Loss (Raw)": 1.7886992692947388, "Pretrain/Step": 6461, "Pretrain/Step Time": 8.514506001025438} +{"Pretrain/Learning Rate": 1.243633303350844e-05, "Pretrain/Loss": 2.018139362335205, "Pretrain/Loss (Raw)": 1.813732624053955, "Pretrain/Step": 6462, "Pretrain/Step Time": 8.524007868021727} +{"Pretrain/Learning Rate": 1.2428993837629943e-05, "Pretrain/Loss": 2.017475128173828, "Pretrain/Loss (Raw)": 2.0826995372772217, "Pretrain/Step": 6463, "Pretrain/Step Time": 8.51673375070095} +{"Pretrain/Learning Rate": 1.2421656091499123e-05, "Pretrain/Loss": 2.018040657043457, "Pretrain/Loss (Raw)": 1.9306801557540894, "Pretrain/Step": 6464, "Pretrain/Step Time": 8.51474454626441} +{"Pretrain/Learning Rate": 1.2414319795962196e-05, "Pretrain/Loss": 2.0166468620300293, "Pretrain/Loss (Raw)": 1.8058961629867554, "Pretrain/Step": 6465, "Pretrain/Step Time": 8.512036312371492} +{"Pretrain/Learning Rate": 1.240698495186521e-05, "Pretrain/Loss": 2.017754077911377, "Pretrain/Loss (Raw)": 1.9747897386550903, "Pretrain/Step": 6466, "Pretrain/Step Time": 8.514332855120301} +{"Pretrain/Learning Rate": 1.2399651560054056e-05, "Pretrain/Loss": 2.0188522338867188, "Pretrain/Loss (Raw)": 2.1689581871032715, "Pretrain/Step": 6467, "Pretrain/Step Time": 8.520372113212943} +{"Pretrain/Learning Rate": 1.2392319621374476e-05, "Pretrain/Loss": 2.019040107727051, "Pretrain/Loss (Raw)": 2.0143842697143555, "Pretrain/Step": 6468, "Pretrain/Step Time": 8.523742772638798} +{"Pretrain/Learning Rate": 1.2384989136671987e-05, "Pretrain/Loss": 2.020407199859619, "Pretrain/Loss (Raw)": 2.3208181858062744, "Pretrain/Step": 6469, "Pretrain/Step Time": 8.523980801925063} +{"Pretrain/Learning Rate": 1.2377660106792005e-05, "Pretrain/Loss": 2.017012357711792, "Pretrain/Loss (Raw)": 2.054271936416626, "Pretrain/Step": 6470, "Pretrain/Step Time": 8.516223618760705} +{"Pretrain/Learning Rate": 1.2370332532579726e-05, "Pretrain/Loss": 2.0193192958831787, "Pretrain/Loss (Raw)": 2.050626039505005, "Pretrain/Step": 6471, "Pretrain/Step Time": 8.514493834227324} +{"Pretrain/Learning Rate": 1.2363006414880236e-05, "Pretrain/Loss": 2.0177767276763916, "Pretrain/Loss (Raw)": 1.9114439487457275, "Pretrain/Step": 6472, "Pretrain/Step Time": 8.514813957735896} +{"Pretrain/Learning Rate": 1.235568175453837e-05, "Pretrain/Loss": 2.018275260925293, "Pretrain/Loss (Raw)": 2.0402753353118896, "Pretrain/Step": 6473, "Pretrain/Step Time": 8.51804144307971} +{"Pretrain/Learning Rate": 1.2348358552398878e-05, "Pretrain/Loss": 2.0176515579223633, "Pretrain/Loss (Raw)": 2.023616313934326, "Pretrain/Step": 6474, "Pretrain/Step Time": 8.520790541544557} +{"Pretrain/Learning Rate": 1.2341036809306292e-05, "Pretrain/Loss": 2.0190131664276123, "Pretrain/Loss (Raw)": 2.004892110824585, "Pretrain/Step": 6475, "Pretrain/Step Time": 8.517815390601754} +{"Pretrain/Learning Rate": 1.2333716526104993e-05, "Pretrain/Loss": 2.0215959548950195, "Pretrain/Loss (Raw)": 2.1182069778442383, "Pretrain/Step": 6476, "Pretrain/Step Time": 8.506232274696231} +{"Pretrain/Learning Rate": 1.2326397703639181e-05, "Pretrain/Loss": 2.020324468612671, "Pretrain/Loss (Raw)": 2.239232063293457, "Pretrain/Step": 6477, "Pretrain/Step Time": 8.504610260948539} +{"Pretrain/Learning Rate": 1.2319080342752918e-05, "Pretrain/Loss": 2.019442319869995, "Pretrain/Loss (Raw)": 2.03682804107666, "Pretrain/Step": 6478, "Pretrain/Step Time": 8.512129284441471} +{"Pretrain/Learning Rate": 1.2311764444290061e-05, "Pretrain/Loss": 2.0209405422210693, "Pretrain/Loss (Raw)": 2.12056303024292, "Pretrain/Step": 6479, "Pretrain/Step Time": 8.513984082266688} +{"Pretrain/Learning Rate": 1.2304450009094317e-05, "Pretrain/Loss": 2.0231051445007324, "Pretrain/Loss (Raw)": 2.3369174003601074, "Pretrain/Step": 6480, "Pretrain/Step Time": 8.51936686784029} +{"Pretrain/Learning Rate": 1.2297137038009213e-05, "Pretrain/Loss": 2.0197882652282715, "Pretrain/Loss (Raw)": 1.576053261756897, "Pretrain/Step": 6481, "Pretrain/Step Time": 8.521810431033373} +{"Pretrain/Learning Rate": 1.2289825531878133e-05, "Pretrain/Loss": 2.0202059745788574, "Pretrain/Loss (Raw)": 1.9610916376113892, "Pretrain/Step": 6482, "Pretrain/Step Time": 8.51913570612669} +{"Pretrain/Learning Rate": 1.2282515491544264e-05, "Pretrain/Loss": 2.0212676525115967, "Pretrain/Loss (Raw)": 2.1674935817718506, "Pretrain/Step": 6483, "Pretrain/Step Time": 8.513461858034134} +{"Pretrain/Learning Rate": 1.2275206917850635e-05, "Pretrain/Loss": 2.021989107131958, "Pretrain/Loss (Raw)": 1.9880720376968384, "Pretrain/Step": 6484, "Pretrain/Step Time": 8.52308515459299} +{"Pretrain/Learning Rate": 1.22678998116401e-05, "Pretrain/Loss": 2.0194287300109863, "Pretrain/Loss (Raw)": 1.7875641584396362, "Pretrain/Step": 6485, "Pretrain/Step Time": 8.524773892015219} +{"Pretrain/Learning Rate": 1.2260594173755358e-05, "Pretrain/Loss": 2.0197153091430664, "Pretrain/Loss (Raw)": 1.876908540725708, "Pretrain/Step": 6486, "Pretrain/Step Time": 8.52499988116324} +{"Pretrain/Learning Rate": 1.2253290005038929e-05, "Pretrain/Loss": 2.01719069480896, "Pretrain/Loss (Raw)": 1.9190646409988403, "Pretrain/Step": 6487, "Pretrain/Step Time": 8.515845037996769} +{"Pretrain/Learning Rate": 1.2245987306333162e-05, "Pretrain/Loss": 2.018799304962158, "Pretrain/Loss (Raw)": 2.498349666595459, "Pretrain/Step": 6488, "Pretrain/Step Time": 8.515573361888528} +{"Pretrain/Learning Rate": 1.2238686078480227e-05, "Pretrain/Loss": 2.020371913909912, "Pretrain/Loss (Raw)": 2.093287706375122, "Pretrain/Step": 6489, "Pretrain/Step Time": 8.511596789583564} +{"Pretrain/Learning Rate": 1.2231386322322155e-05, "Pretrain/Loss": 2.019878625869751, "Pretrain/Loss (Raw)": 2.0193369388580322, "Pretrain/Step": 6490, "Pretrain/Step Time": 8.51334405504167} +{"Pretrain/Learning Rate": 1.2224088038700782e-05, "Pretrain/Loss": 2.0206069946289062, "Pretrain/Loss (Raw)": 2.176954984664917, "Pretrain/Step": 6491, "Pretrain/Step Time": 8.523950295522809} +{"Pretrain/Learning Rate": 1.2216791228457778e-05, "Pretrain/Loss": 2.019498825073242, "Pretrain/Loss (Raw)": 2.0342726707458496, "Pretrain/Step": 6492, "Pretrain/Step Time": 8.531419543549418} +{"Pretrain/Learning Rate": 1.2209495892434635e-05, "Pretrain/Loss": 2.022120475769043, "Pretrain/Loss (Raw)": 2.3258821964263916, "Pretrain/Step": 6493, "Pretrain/Step Time": 8.522267766296864} +{"Pretrain/Learning Rate": 1.2202202031472707e-05, "Pretrain/Loss": 2.023824453353882, "Pretrain/Loss (Raw)": 2.090209722518921, "Pretrain/Step": 6494, "Pretrain/Step Time": 8.51084460131824} +{"Pretrain/Learning Rate": 1.2194909646413147e-05, "Pretrain/Loss": 2.023698091506958, "Pretrain/Loss (Raw)": 1.9660283327102661, "Pretrain/Step": 6495, "Pretrain/Step Time": 8.509733764454722} +{"Pretrain/Learning Rate": 1.2187618738096934e-05, "Pretrain/Loss": 2.024703025817871, "Pretrain/Loss (Raw)": 2.101300001144409, "Pretrain/Step": 6496, "Pretrain/Step Time": 8.512002503499389} +{"Pretrain/Learning Rate": 1.2180329307364916e-05, "Pretrain/Loss": 2.024225950241089, "Pretrain/Loss (Raw)": 2.025930643081665, "Pretrain/Step": 6497, "Pretrain/Step Time": 8.514408491551876} +{"Pretrain/Learning Rate": 1.2173041355057727e-05, "Pretrain/Loss": 2.0262372493743896, "Pretrain/Loss (Raw)": 2.110511302947998, "Pretrain/Step": 6498, "Pretrain/Step Time": 8.521874941885471} +{"Pretrain/Learning Rate": 1.216575488201585e-05, "Pretrain/Loss": 2.025020122528076, "Pretrain/Loss (Raw)": 1.979781150817871, "Pretrain/Step": 6499, "Pretrain/Step Time": 8.518782705068588} +{"Pretrain/Learning Rate": 1.215846988907959e-05, "Pretrain/Loss": 2.0257506370544434, "Pretrain/Loss (Raw)": 2.0428032875061035, "Pretrain/Step": 6500, "Pretrain/Step Time": 8.512886913493276} +{"Pretrain/Learning Rate": 1.2151186377089105e-05, "Pretrain/Loss": 2.0266218185424805, "Pretrain/Loss (Raw)": 2.1717166900634766, "Pretrain/Step": 6501, "Pretrain/Step Time": 8.512451939284801} +{"Pretrain/Learning Rate": 1.214390434688435e-05, "Pretrain/Loss": 2.026794910430908, "Pretrain/Loss (Raw)": 1.8834282159805298, "Pretrain/Step": 6502, "Pretrain/Step Time": 8.519816052168608} +{"Pretrain/Learning Rate": 1.2136623799305127e-05, "Pretrain/Loss": 2.027564287185669, "Pretrain/Loss (Raw)": 1.971273422241211, "Pretrain/Step": 6503, "Pretrain/Step Time": 8.52143308520317} +{"Pretrain/Learning Rate": 1.212934473519105e-05, "Pretrain/Loss": 2.025618076324463, "Pretrain/Loss (Raw)": 2.021393060684204, "Pretrain/Step": 6504, "Pretrain/Step Time": 8.521405892446637} +{"Pretrain/Learning Rate": 1.2122067155381598e-05, "Pretrain/Loss": 2.029266834259033, "Pretrain/Loss (Raw)": 2.3041234016418457, "Pretrain/Step": 6505, "Pretrain/Step Time": 8.517401723191142} +{"Pretrain/Learning Rate": 1.2114791060716043e-05, "Pretrain/Loss": 2.0324206352233887, "Pretrain/Loss (Raw)": 2.1406209468841553, "Pretrain/Step": 6506, "Pretrain/Step Time": 8.510555662214756} +{"Pretrain/Learning Rate": 1.2107516452033502e-05, "Pretrain/Loss": 2.030872344970703, "Pretrain/Loss (Raw)": 1.8700815439224243, "Pretrain/Step": 6507, "Pretrain/Step Time": 8.510892873629928} +{"Pretrain/Learning Rate": 1.2100243330172905e-05, "Pretrain/Loss": 2.032069444656372, "Pretrain/Loss (Raw)": 2.128459930419922, "Pretrain/Step": 6508, "Pretrain/Step Time": 8.514838742092252} +{"Pretrain/Learning Rate": 1.2092971695973052e-05, "Pretrain/Loss": 2.031595468521118, "Pretrain/Loss (Raw)": 2.0391132831573486, "Pretrain/Step": 6509, "Pretrain/Step Time": 8.515187915414572} +{"Pretrain/Learning Rate": 1.2085701550272502e-05, "Pretrain/Loss": 2.0363078117370605, "Pretrain/Loss (Raw)": 2.52663516998291, "Pretrain/Step": 6510, "Pretrain/Step Time": 8.515955954790115} +{"Pretrain/Learning Rate": 1.2078432893909714e-05, "Pretrain/Loss": 2.0388681888580322, "Pretrain/Loss (Raw)": 2.213899850845337, "Pretrain/Step": 6511, "Pretrain/Step Time": 8.513750474900007} +{"Pretrain/Learning Rate": 1.2071165727722925e-05, "Pretrain/Loss": 2.038637638092041, "Pretrain/Loss (Raw)": 2.1601414680480957, "Pretrain/Step": 6512, "Pretrain/Step Time": 8.50883250311017} +{"Pretrain/Learning Rate": 1.2063900052550246e-05, "Pretrain/Loss": 2.0375332832336426, "Pretrain/Loss (Raw)": 2.074810028076172, "Pretrain/Step": 6513, "Pretrain/Step Time": 8.505555646494031} +{"Pretrain/Learning Rate": 1.2056635869229549e-05, "Pretrain/Loss": 2.0358681678771973, "Pretrain/Loss (Raw)": 1.6235381364822388, "Pretrain/Step": 6514, "Pretrain/Step Time": 8.506300443783402} +{"Pretrain/Learning Rate": 1.2049373178598606e-05, "Pretrain/Loss": 2.0348362922668457, "Pretrain/Loss (Raw)": 1.950669288635254, "Pretrain/Step": 6515, "Pretrain/Step Time": 8.51494226232171} +{"Pretrain/Learning Rate": 1.2042111981494968e-05, "Pretrain/Loss": 2.035276412963867, "Pretrain/Loss (Raw)": 2.0820651054382324, "Pretrain/Step": 6516, "Pretrain/Step Time": 8.515624158084393} +{"Pretrain/Learning Rate": 1.2034852278756042e-05, "Pretrain/Loss": 2.0341897010803223, "Pretrain/Loss (Raw)": 1.9532607793807983, "Pretrain/Step": 6517, "Pretrain/Step Time": 8.517391324043274} +{"Pretrain/Learning Rate": 1.2027594071219033e-05, "Pretrain/Loss": 2.0351369380950928, "Pretrain/Loss (Raw)": 1.8181380033493042, "Pretrain/Step": 6518, "Pretrain/Step Time": 8.506920447573066} +{"Pretrain/Learning Rate": 1.2020337359721015e-05, "Pretrain/Loss": 2.0337600708007812, "Pretrain/Loss (Raw)": 1.9195204973220825, "Pretrain/Step": 6519, "Pretrain/Step Time": 8.507481651380658} +{"Pretrain/Learning Rate": 1.2013082145098852e-05, "Pretrain/Loss": 2.0338315963745117, "Pretrain/Loss (Raw)": 1.8915854692459106, "Pretrain/Step": 6520, "Pretrain/Step Time": 8.510180659592152} +{"Pretrain/Learning Rate": 1.2005828428189256e-05, "Pretrain/Loss": 2.0336756706237793, "Pretrain/Loss (Raw)": 2.048349618911743, "Pretrain/Step": 6521, "Pretrain/Step Time": 8.51549038849771} +{"Pretrain/Learning Rate": 1.1998576209828743e-05, "Pretrain/Loss": 2.034170150756836, "Pretrain/Loss (Raw)": 1.9558440446853638, "Pretrain/Step": 6522, "Pretrain/Step Time": 8.519578542560339} +{"Pretrain/Learning Rate": 1.19913254908537e-05, "Pretrain/Loss": 2.0368871688842773, "Pretrain/Loss (Raw)": 2.2422256469726562, "Pretrain/Step": 6523, "Pretrain/Step Time": 8.515945134684443} +{"Pretrain/Learning Rate": 1.1984076272100297e-05, "Pretrain/Loss": 2.0390710830688477, "Pretrain/Loss (Raw)": 2.471569538116455, "Pretrain/Step": 6524, "Pretrain/Step Time": 8.512739669531584} +{"Pretrain/Learning Rate": 1.1976828554404552e-05, "Pretrain/Loss": 2.0397958755493164, "Pretrain/Loss (Raw)": 1.9622371196746826, "Pretrain/Step": 6525, "Pretrain/Step Time": 8.509660543873906} +{"Pretrain/Learning Rate": 1.1969582338602295e-05, "Pretrain/Loss": 2.0414586067199707, "Pretrain/Loss (Raw)": 2.103175640106201, "Pretrain/Step": 6526, "Pretrain/Step Time": 8.52045970223844} +{"Pretrain/Learning Rate": 1.1962337625529215e-05, "Pretrain/Loss": 2.042160987854004, "Pretrain/Loss (Raw)": 2.04807448387146, "Pretrain/Step": 6527, "Pretrain/Step Time": 8.52477897144854} +{"Pretrain/Learning Rate": 1.1955094416020795e-05, "Pretrain/Loss": 2.042456865310669, "Pretrain/Loss (Raw)": 1.9588927030563354, "Pretrain/Step": 6528, "Pretrain/Step Time": 8.52595817297697} +{"Pretrain/Learning Rate": 1.1947852710912355e-05, "Pretrain/Loss": 2.043962001800537, "Pretrain/Loss (Raw)": 2.0822055339813232, "Pretrain/Step": 6529, "Pretrain/Step Time": 8.517918810248375} +{"Pretrain/Learning Rate": 1.1940612511039038e-05, "Pretrain/Loss": 2.044848918914795, "Pretrain/Loss (Raw)": 2.0439250469207764, "Pretrain/Step": 6530, "Pretrain/Step Time": 8.517346862703562} +{"Pretrain/Learning Rate": 1.1933373817235832e-05, "Pretrain/Loss": 2.044867992401123, "Pretrain/Loss (Raw)": 1.947922945022583, "Pretrain/Step": 6531, "Pretrain/Step Time": 8.519562017172575} +{"Pretrain/Learning Rate": 1.1926136630337528e-05, "Pretrain/Loss": 2.0454368591308594, "Pretrain/Loss (Raw)": 2.1233012676239014, "Pretrain/Step": 6532, "Pretrain/Step Time": 8.529618142172694} +{"Pretrain/Learning Rate": 1.1918900951178755e-05, "Pretrain/Loss": 2.043234348297119, "Pretrain/Loss (Raw)": 1.9772199392318726, "Pretrain/Step": 6533, "Pretrain/Step Time": 8.530057517811656} +{"Pretrain/Learning Rate": 1.1911666780593955e-05, "Pretrain/Loss": 2.040800094604492, "Pretrain/Loss (Raw)": 1.9984915256500244, "Pretrain/Step": 6534, "Pretrain/Step Time": 8.528058908879757} +{"Pretrain/Learning Rate": 1.1904434119417426e-05, "Pretrain/Loss": 2.0416722297668457, "Pretrain/Loss (Raw)": 1.9542467594146729, "Pretrain/Step": 6535, "Pretrain/Step Time": 8.51694063283503} +{"Pretrain/Learning Rate": 1.1897202968483263e-05, "Pretrain/Loss": 2.0361227989196777, "Pretrain/Loss (Raw)": 1.5267082452774048, "Pretrain/Step": 6536, "Pretrain/Step Time": 8.517868114635348} +{"Pretrain/Learning Rate": 1.1889973328625384e-05, "Pretrain/Loss": 2.0376334190368652, "Pretrain/Loss (Raw)": 2.0749621391296387, "Pretrain/Step": 6537, "Pretrain/Step Time": 8.512517901137471} +{"Pretrain/Learning Rate": 1.1882745200677569e-05, "Pretrain/Loss": 2.0383026599884033, "Pretrain/Loss (Raw)": 2.126171112060547, "Pretrain/Step": 6538, "Pretrain/Step Time": 8.516491135582328} +{"Pretrain/Learning Rate": 1.1875518585473389e-05, "Pretrain/Loss": 2.039203643798828, "Pretrain/Loss (Raw)": 2.1155917644500732, "Pretrain/Step": 6539, "Pretrain/Step Time": 8.520128477364779} +{"Pretrain/Learning Rate": 1.1868293483846247e-05, "Pretrain/Loss": 2.0379462242126465, "Pretrain/Loss (Raw)": 1.9541374444961548, "Pretrain/Step": 6540, "Pretrain/Step Time": 8.524185637012124} +{"Pretrain/Learning Rate": 1.186106989662937e-05, "Pretrain/Loss": 2.0342540740966797, "Pretrain/Loss (Raw)": 1.8027849197387695, "Pretrain/Step": 6541, "Pretrain/Step Time": 8.516764249652624} +{"Pretrain/Learning Rate": 1.1853847824655836e-05, "Pretrain/Loss": 2.03314208984375, "Pretrain/Loss (Raw)": 1.924965739250183, "Pretrain/Step": 6542, "Pretrain/Step Time": 8.512155098840594} +{"Pretrain/Learning Rate": 1.184662726875852e-05, "Pretrain/Loss": 2.0348618030548096, "Pretrain/Loss (Raw)": 2.287357807159424, "Pretrain/Step": 6543, "Pretrain/Step Time": 8.514076242223382} +{"Pretrain/Learning Rate": 1.1839408229770124e-05, "Pretrain/Loss": 2.034742832183838, "Pretrain/Loss (Raw)": 1.9660260677337646, "Pretrain/Step": 6544, "Pretrain/Step Time": 8.526517055928707} +{"Pretrain/Learning Rate": 1.183219070852318e-05, "Pretrain/Loss": 2.0339765548706055, "Pretrain/Loss (Raw)": 2.0261037349700928, "Pretrain/Step": 6545, "Pretrain/Step Time": 8.523800997063518} +{"Pretrain/Learning Rate": 1.1824974705850058e-05, "Pretrain/Loss": 2.0338120460510254, "Pretrain/Loss (Raw)": 2.0175933837890625, "Pretrain/Step": 6546, "Pretrain/Step Time": 8.519294779747725} +{"Pretrain/Learning Rate": 1.1817760222582938e-05, "Pretrain/Loss": 2.0337085723876953, "Pretrain/Loss (Raw)": 2.1611111164093018, "Pretrain/Step": 6547, "Pretrain/Step Time": 8.512532832100987} +{"Pretrain/Learning Rate": 1.1810547259553826e-05, "Pretrain/Loss": 2.034228801727295, "Pretrain/Loss (Raw)": 1.9984936714172363, "Pretrain/Step": 6548, "Pretrain/Step Time": 8.512582916766405} +{"Pretrain/Learning Rate": 1.1803335817594544e-05, "Pretrain/Loss": 2.032257080078125, "Pretrain/Loss (Raw)": 1.838544487953186, "Pretrain/Step": 6549, "Pretrain/Step Time": 8.514017211273313} +{"Pretrain/Learning Rate": 1.179612589753678e-05, "Pretrain/Loss": 2.0320398807525635, "Pretrain/Loss (Raw)": 1.9627346992492676, "Pretrain/Step": 6550, "Pretrain/Step Time": 8.512310318648815} +{"Pretrain/Learning Rate": 1.1788917500211976e-05, "Pretrain/Loss": 2.032186508178711, "Pretrain/Loss (Raw)": 2.018860340118408, "Pretrain/Step": 6551, "Pretrain/Step Time": 8.514952879399061} +{"Pretrain/Learning Rate": 1.178171062645147e-05, "Pretrain/Loss": 2.0326199531555176, "Pretrain/Loss (Raw)": 2.019517421722412, "Pretrain/Step": 6552, "Pretrain/Step Time": 8.511940203607082} +{"Pretrain/Learning Rate": 1.177450527708637e-05, "Pretrain/Loss": 2.0318174362182617, "Pretrain/Loss (Raw)": 2.041674852371216, "Pretrain/Step": 6553, "Pretrain/Step Time": 8.50250580534339} +{"Pretrain/Learning Rate": 1.1767301452947663e-05, "Pretrain/Loss": 2.028637647628784, "Pretrain/Loss (Raw)": 1.551519751548767, "Pretrain/Step": 6554, "Pretrain/Step Time": 8.498976916074753} +{"Pretrain/Learning Rate": 1.1760099154866086e-05, "Pretrain/Loss": 2.0311808586120605, "Pretrain/Loss (Raw)": 1.9398689270019531, "Pretrain/Step": 6555, "Pretrain/Step Time": 8.503974353894591} +{"Pretrain/Learning Rate": 1.1752898383672273e-05, "Pretrain/Loss": 2.0300240516662598, "Pretrain/Loss (Raw)": 1.9984662532806396, "Pretrain/Step": 6556, "Pretrain/Step Time": 8.510774537920952} +{"Pretrain/Learning Rate": 1.1745699140196632e-05, "Pretrain/Loss": 2.0329244136810303, "Pretrain/Loss (Raw)": 2.3015120029449463, "Pretrain/Step": 6557, "Pretrain/Step Time": 8.512793123722076} +{"Pretrain/Learning Rate": 1.1738501425269441e-05, "Pretrain/Loss": 2.0325112342834473, "Pretrain/Loss (Raw)": 1.846448540687561, "Pretrain/Step": 6558, "Pretrain/Step Time": 8.509254103526473} +{"Pretrain/Learning Rate": 1.1731305239720735e-05, "Pretrain/Loss": 2.032867670059204, "Pretrain/Loss (Raw)": 2.235295057296753, "Pretrain/Step": 6559, "Pretrain/Step Time": 8.507737722247839} +{"Pretrain/Learning Rate": 1.1724110584380444e-05, "Pretrain/Loss": 2.031097650527954, "Pretrain/Loss (Raw)": 1.8915975093841553, "Pretrain/Step": 6560, "Pretrain/Step Time": 8.510165372863412} +{"Pretrain/Learning Rate": 1.1716917460078278e-05, "Pretrain/Loss": 2.031383991241455, "Pretrain/Loss (Raw)": 2.14994740486145, "Pretrain/Step": 6561, "Pretrain/Step Time": 8.513336896896362} +{"Pretrain/Learning Rate": 1.1709725867643784e-05, "Pretrain/Loss": 2.0303072929382324, "Pretrain/Loss (Raw)": 1.9276527166366577, "Pretrain/Step": 6562, "Pretrain/Step Time": 8.515573622658849} +{"Pretrain/Learning Rate": 1.1702535807906318e-05, "Pretrain/Loss": 2.031282424926758, "Pretrain/Loss (Raw)": 2.1479239463806152, "Pretrain/Step": 6563, "Pretrain/Step Time": 8.516111394390464} +{"Pretrain/Learning Rate": 1.1695347281695093e-05, "Pretrain/Loss": 2.0318078994750977, "Pretrain/Loss (Raw)": 2.113551378250122, "Pretrain/Step": 6564, "Pretrain/Step Time": 8.509194346144795} +{"Pretrain/Learning Rate": 1.1688160289839111e-05, "Pretrain/Loss": 2.030992269515991, "Pretrain/Loss (Raw)": 2.045271396636963, "Pretrain/Step": 6565, "Pretrain/Step Time": 8.509221060201526} +{"Pretrain/Learning Rate": 1.1680974833167214e-05, "Pretrain/Loss": 2.031406879425049, "Pretrain/Loss (Raw)": 1.975844383239746, "Pretrain/Step": 6566, "Pretrain/Step Time": 8.5054429192096} +{"Pretrain/Learning Rate": 1.1673790912508051e-05, "Pretrain/Loss": 2.030564308166504, "Pretrain/Loss (Raw)": 1.9843624830245972, "Pretrain/Step": 6567, "Pretrain/Step Time": 8.510376600548625} +{"Pretrain/Learning Rate": 1.1666608528690123e-05, "Pretrain/Loss": 2.03145170211792, "Pretrain/Loss (Raw)": 1.9524164199829102, "Pretrain/Step": 6568, "Pretrain/Step Time": 8.512962345033884} +{"Pretrain/Learning Rate": 1.165942768254173e-05, "Pretrain/Loss": 2.0305275917053223, "Pretrain/Loss (Raw)": 1.9580674171447754, "Pretrain/Step": 6569, "Pretrain/Step Time": 8.513133816421032} +{"Pretrain/Learning Rate": 1.1652248374890999e-05, "Pretrain/Loss": 2.030172348022461, "Pretrain/Loss (Raw)": 1.8623696565628052, "Pretrain/Step": 6570, "Pretrain/Step Time": 8.5079735647887} +{"Pretrain/Learning Rate": 1.164507060656587e-05, "Pretrain/Loss": 2.03056263923645, "Pretrain/Loss (Raw)": 1.9536261558532715, "Pretrain/Step": 6571, "Pretrain/Step Time": 8.501747276633978} +{"Pretrain/Learning Rate": 1.163789437839414e-05, "Pretrain/Loss": 2.02807354927063, "Pretrain/Loss (Raw)": 1.9916990995407104, "Pretrain/Step": 6572, "Pretrain/Step Time": 8.499897751957178} +{"Pretrain/Learning Rate": 1.1630719691203395e-05, "Pretrain/Loss": 2.03017520904541, "Pretrain/Loss (Raw)": 1.8984904289245605, "Pretrain/Step": 6573, "Pretrain/Step Time": 8.507392633706331} +{"Pretrain/Learning Rate": 1.1623546545821054e-05, "Pretrain/Loss": 2.030099868774414, "Pretrain/Loss (Raw)": 1.8495591878890991, "Pretrain/Step": 6574, "Pretrain/Step Time": 8.508618414402008} +{"Pretrain/Learning Rate": 1.1616374943074349e-05, "Pretrain/Loss": 2.0298781394958496, "Pretrain/Loss (Raw)": 2.0001535415649414, "Pretrain/Step": 6575, "Pretrain/Step Time": 8.513085486367345} +{"Pretrain/Learning Rate": 1.1609204883790359e-05, "Pretrain/Loss": 2.029367208480835, "Pretrain/Loss (Raw)": 1.8159996271133423, "Pretrain/Step": 6576, "Pretrain/Step Time": 8.507552850991488} +{"Pretrain/Learning Rate": 1.1602036368795963e-05, "Pretrain/Loss": 2.0262832641601562, "Pretrain/Loss (Raw)": 1.9611409902572632, "Pretrain/Step": 6577, "Pretrain/Step Time": 8.503295166417956} +{"Pretrain/Learning Rate": 1.1594869398917854e-05, "Pretrain/Loss": 2.0269408226013184, "Pretrain/Loss (Raw)": 2.028053045272827, "Pretrain/Step": 6578, "Pretrain/Step Time": 8.497404070571065} +{"Pretrain/Learning Rate": 1.1587703974982584e-05, "Pretrain/Loss": 2.025979518890381, "Pretrain/Loss (Raw)": 2.147212266921997, "Pretrain/Step": 6579, "Pretrain/Step Time": 8.503592455759645} +{"Pretrain/Learning Rate": 1.1580540097816491e-05, "Pretrain/Loss": 2.021613597869873, "Pretrain/Loss (Raw)": 1.8683990240097046, "Pretrain/Step": 6580, "Pretrain/Step Time": 8.504713375121355} +{"Pretrain/Learning Rate": 1.157337776824575e-05, "Pretrain/Loss": 2.024721622467041, "Pretrain/Loss (Raw)": 2.308431386947632, "Pretrain/Step": 6581, "Pretrain/Step Time": 8.506441229954362} +{"Pretrain/Learning Rate": 1.1566216987096343e-05, "Pretrain/Loss": 2.0238513946533203, "Pretrain/Loss (Raw)": 1.7341182231903076, "Pretrain/Step": 6582, "Pretrain/Step Time": 8.49876118823886} +{"Pretrain/Learning Rate": 1.1559057755194105e-05, "Pretrain/Loss": 2.02347993850708, "Pretrain/Loss (Raw)": 1.997557282447815, "Pretrain/Step": 6583, "Pretrain/Step Time": 8.499016549438238} +{"Pretrain/Learning Rate": 1.1551900073364663e-05, "Pretrain/Loss": 2.021169424057007, "Pretrain/Loss (Raw)": 1.9034417867660522, "Pretrain/Step": 6584, "Pretrain/Step Time": 8.506947541609406} +{"Pretrain/Learning Rate": 1.1544743942433473e-05, "Pretrain/Loss": 2.0208380222320557, "Pretrain/Loss (Raw)": 2.0335638523101807, "Pretrain/Step": 6585, "Pretrain/Step Time": 8.509953761473298} +{"Pretrain/Learning Rate": 1.1537589363225806e-05, "Pretrain/Loss": 2.020784378051758, "Pretrain/Loss (Raw)": 1.996254801750183, "Pretrain/Step": 6586, "Pretrain/Step Time": 8.510457530617714} +{"Pretrain/Learning Rate": 1.153043633656678e-05, "Pretrain/Loss": 2.0203466415405273, "Pretrain/Loss (Raw)": 1.9774560928344727, "Pretrain/Step": 6587, "Pretrain/Step Time": 8.51652655750513} +{"Pretrain/Learning Rate": 1.1523284863281306e-05, "Pretrain/Loss": 2.0173661708831787, "Pretrain/Loss (Raw)": 1.7716717720031738, "Pretrain/Step": 6588, "Pretrain/Step Time": 8.51226662658155} +{"Pretrain/Learning Rate": 1.1516134944194126e-05, "Pretrain/Loss": 2.0202205181121826, "Pretrain/Loss (Raw)": 2.154064416885376, "Pretrain/Step": 6589, "Pretrain/Step Time": 8.50661144591868} +{"Pretrain/Learning Rate": 1.1508986580129794e-05, "Pretrain/Loss": 2.0240120887756348, "Pretrain/Loss (Raw)": 2.299067258834839, "Pretrain/Step": 6590, "Pretrain/Step Time": 8.503661686554551} +{"Pretrain/Learning Rate": 1.1501839771912718e-05, "Pretrain/Loss": 2.0236873626708984, "Pretrain/Loss (Raw)": 2.041128158569336, "Pretrain/Step": 6591, "Pretrain/Step Time": 8.51295281946659} +{"Pretrain/Learning Rate": 1.1494694520367068e-05, "Pretrain/Loss": 2.024076461791992, "Pretrain/Loss (Raw)": 1.9804729223251343, "Pretrain/Step": 6592, "Pretrain/Step Time": 8.51044593565166} +{"Pretrain/Learning Rate": 1.1487550826316893e-05, "Pretrain/Loss": 2.0230329036712646, "Pretrain/Loss (Raw)": 1.6723294258117676, "Pretrain/Step": 6593, "Pretrain/Step Time": 8.515839125961065} +{"Pretrain/Learning Rate": 1.1480408690586022e-05, "Pretrain/Loss": 2.0223913192749023, "Pretrain/Loss (Raw)": 1.8926538228988647, "Pretrain/Step": 6594, "Pretrain/Step Time": 8.510502526536584} +{"Pretrain/Learning Rate": 1.1473268113998146e-05, "Pretrain/Loss": 2.020777463912964, "Pretrain/Loss (Raw)": 1.9623943567276, "Pretrain/Step": 6595, "Pretrain/Step Time": 8.501139456406236} +{"Pretrain/Learning Rate": 1.146612909737671e-05, "Pretrain/Loss": 2.020918846130371, "Pretrain/Loss (Raw)": 2.0324978828430176, "Pretrain/Step": 6596, "Pretrain/Step Time": 8.501608612015843} +{"Pretrain/Learning Rate": 1.145899164154505e-05, "Pretrain/Loss": 2.019294500350952, "Pretrain/Loss (Raw)": 2.112886428833008, "Pretrain/Step": 6597, "Pretrain/Step Time": 8.500418683513999} +{"Pretrain/Learning Rate": 1.1451855747326273e-05, "Pretrain/Loss": 2.0183467864990234, "Pretrain/Loss (Raw)": 1.9329625368118286, "Pretrain/Step": 6598, "Pretrain/Step Time": 8.500599473714828} +{"Pretrain/Learning Rate": 1.1444721415543349e-05, "Pretrain/Loss": 2.0182998180389404, "Pretrain/Loss (Raw)": 2.0446181297302246, "Pretrain/Step": 6599, "Pretrain/Step Time": 8.510898303240538} +{"Pretrain/Learning Rate": 1.143758864701901e-05, "Pretrain/Loss": 2.0182697772979736, "Pretrain/Loss (Raw)": 1.9076040983200073, "Pretrain/Step": 6600, "Pretrain/Step Time": 8.515253895893693} +{"Pretrain/Learning Rate": 1.1430457442575863e-05, "Pretrain/Loss": 2.0182154178619385, "Pretrain/Loss (Raw)": 2.0333261489868164, "Pretrain/Step": 6601, "Pretrain/Step Time": 8.513364790007472} +{"Pretrain/Learning Rate": 1.1423327803036308e-05, "Pretrain/Loss": 2.0184478759765625, "Pretrain/Loss (Raw)": 2.0533478260040283, "Pretrain/Step": 6602, "Pretrain/Step Time": 8.509796503931284} +{"Pretrain/Learning Rate": 1.1416199729222565e-05, "Pretrain/Loss": 2.0179312229156494, "Pretrain/Loss (Raw)": 1.9387587308883667, "Pretrain/Step": 6603, "Pretrain/Step Time": 8.516733279451728} +{"Pretrain/Learning Rate": 1.1409073221956668e-05, "Pretrain/Loss": 2.0182595252990723, "Pretrain/Loss (Raw)": 2.160229444503784, "Pretrain/Step": 6604, "Pretrain/Step Time": 8.524644792079926} +{"Pretrain/Learning Rate": 1.14019482820605e-05, "Pretrain/Loss": 2.0157792568206787, "Pretrain/Loss (Raw)": 1.9217731952667236, "Pretrain/Step": 6605, "Pretrain/Step Time": 8.529366029426455} +{"Pretrain/Learning Rate": 1.1394824910355731e-05, "Pretrain/Loss": 2.018111228942871, "Pretrain/Loss (Raw)": 2.3353261947631836, "Pretrain/Step": 6606, "Pretrain/Step Time": 8.523725910112262} +{"Pretrain/Learning Rate": 1.1387703107663864e-05, "Pretrain/Loss": 2.0160534381866455, "Pretrain/Loss (Raw)": 1.8571667671203613, "Pretrain/Step": 6607, "Pretrain/Step Time": 8.524993970990181} +{"Pretrain/Learning Rate": 1.1380582874806209e-05, "Pretrain/Loss": 2.014674663543701, "Pretrain/Loss (Raw)": 2.160383462905884, "Pretrain/Step": 6608, "Pretrain/Step Time": 8.523006780073047} +{"Pretrain/Learning Rate": 1.1373464212603923e-05, "Pretrain/Loss": 2.018360137939453, "Pretrain/Loss (Raw)": 2.047837257385254, "Pretrain/Step": 6609, "Pretrain/Step Time": 8.52982147783041} +{"Pretrain/Learning Rate": 1.1366347121877955e-05, "Pretrain/Loss": 2.0156548023223877, "Pretrain/Loss (Raw)": 1.6148000955581665, "Pretrain/Step": 6610, "Pretrain/Step Time": 8.526937874034047} +{"Pretrain/Learning Rate": 1.1359231603449078e-05, "Pretrain/Loss": 2.013021945953369, "Pretrain/Loss (Raw)": 1.830491304397583, "Pretrain/Step": 6611, "Pretrain/Step Time": 8.528607174754143} +{"Pretrain/Learning Rate": 1.1352117658137884e-05, "Pretrain/Loss": 2.0150554180145264, "Pretrain/Loss (Raw)": 2.2483649253845215, "Pretrain/Step": 6612, "Pretrain/Step Time": 8.519445041194558} +{"Pretrain/Learning Rate": 1.1345005286764798e-05, "Pretrain/Loss": 2.017240524291992, "Pretrain/Loss (Raw)": 2.0672571659088135, "Pretrain/Step": 6613, "Pretrain/Step Time": 8.522799557074904} +{"Pretrain/Learning Rate": 1.133789449015005e-05, "Pretrain/Loss": 2.0206918716430664, "Pretrain/Loss (Raw)": 2.3186402320861816, "Pretrain/Step": 6614, "Pretrain/Step Time": 8.519161192700267} +{"Pretrain/Learning Rate": 1.1330785269113686e-05, "Pretrain/Loss": 2.021101951599121, "Pretrain/Loss (Raw)": 1.9715770483016968, "Pretrain/Step": 6615, "Pretrain/Step Time": 8.524870913475752} +{"Pretrain/Learning Rate": 1.1323677624475567e-05, "Pretrain/Loss": 2.015754461288452, "Pretrain/Loss (Raw)": 1.8138689994812012, "Pretrain/Step": 6616, "Pretrain/Step Time": 8.527638375759125} +{"Pretrain/Learning Rate": 1.13165715570554e-05, "Pretrain/Loss": 2.017498254776001, "Pretrain/Loss (Raw)": 2.316506862640381, "Pretrain/Step": 6617, "Pretrain/Step Time": 8.525907769799232} +{"Pretrain/Learning Rate": 1.1309467067672678e-05, "Pretrain/Loss": 2.0186212062835693, "Pretrain/Loss (Raw)": 2.1630609035491943, "Pretrain/Step": 6618, "Pretrain/Step Time": 8.52400010637939} +{"Pretrain/Learning Rate": 1.1302364157146716e-05, "Pretrain/Loss": 2.0175318717956543, "Pretrain/Loss (Raw)": 2.0375280380249023, "Pretrain/Step": 6619, "Pretrain/Step Time": 8.51742872968316} +{"Pretrain/Learning Rate": 1.1295262826296677e-05, "Pretrain/Loss": 2.0152039527893066, "Pretrain/Loss (Raw)": 1.736301064491272, "Pretrain/Step": 6620, "Pretrain/Step Time": 8.511741913855076} +{"Pretrain/Learning Rate": 1.1288163075941505e-05, "Pretrain/Loss": 2.0115907192230225, "Pretrain/Loss (Raw)": 1.8633978366851807, "Pretrain/Step": 6621, "Pretrain/Step Time": 8.521124789491296} +{"Pretrain/Learning Rate": 1.128106490689998e-05, "Pretrain/Loss": 2.0096964836120605, "Pretrain/Loss (Raw)": 1.847761631011963, "Pretrain/Step": 6622, "Pretrain/Step Time": 8.525515051558614} +{"Pretrain/Learning Rate": 1.1273968319990685e-05, "Pretrain/Loss": 2.010322332382202, "Pretrain/Loss (Raw)": 2.046117067337036, "Pretrain/Step": 6623, "Pretrain/Step Time": 8.523412117734551} +{"Pretrain/Learning Rate": 1.1266873316032053e-05, "Pretrain/Loss": 2.009101390838623, "Pretrain/Loss (Raw)": 1.9450149536132812, "Pretrain/Step": 6624, "Pretrain/Step Time": 8.52021948620677} +{"Pretrain/Learning Rate": 1.1259779895842304e-05, "Pretrain/Loss": 2.0091257095336914, "Pretrain/Loss (Raw)": 2.029052495956421, "Pretrain/Step": 6625, "Pretrain/Step Time": 8.517941858619452} +{"Pretrain/Learning Rate": 1.1252688060239481e-05, "Pretrain/Loss": 2.0086169242858887, "Pretrain/Loss (Raw)": 2.045391082763672, "Pretrain/Step": 6626, "Pretrain/Step Time": 8.51901575922966} +{"Pretrain/Learning Rate": 1.1245597810041441e-05, "Pretrain/Loss": 2.008859157562256, "Pretrain/Loss (Raw)": 2.010789394378662, "Pretrain/Step": 6627, "Pretrain/Step Time": 8.517437312752008} +{"Pretrain/Learning Rate": 1.1238509146065887e-05, "Pretrain/Loss": 2.010117292404175, "Pretrain/Loss (Raw)": 2.203821897506714, "Pretrain/Step": 6628, "Pretrain/Step Time": 8.52361560612917} +{"Pretrain/Learning Rate": 1.1231422069130302e-05, "Pretrain/Loss": 2.0097150802612305, "Pretrain/Loss (Raw)": 2.1202123165130615, "Pretrain/Step": 6629, "Pretrain/Step Time": 8.522253427654505} +{"Pretrain/Learning Rate": 1.1224336580052005e-05, "Pretrain/Loss": 2.00931978225708, "Pretrain/Loss (Raw)": 1.8328555822372437, "Pretrain/Step": 6630, "Pretrain/Step Time": 8.51611402630806} +{"Pretrain/Learning Rate": 1.1217252679648116e-05, "Pretrain/Loss": 2.0095746517181396, "Pretrain/Loss (Raw)": 2.003899335861206, "Pretrain/Step": 6631, "Pretrain/Step Time": 8.514979319646955} +{"Pretrain/Learning Rate": 1.1210170368735615e-05, "Pretrain/Loss": 2.007758140563965, "Pretrain/Loss (Raw)": 1.7888462543487549, "Pretrain/Step": 6632, "Pretrain/Step Time": 8.521751288324594} +{"Pretrain/Learning Rate": 1.1203089648131227e-05, "Pretrain/Loss": 2.007075786590576, "Pretrain/Loss (Raw)": 2.2168116569519043, "Pretrain/Step": 6633, "Pretrain/Step Time": 8.51791981048882} +{"Pretrain/Learning Rate": 1.1196010518651562e-05, "Pretrain/Loss": 2.0063178539276123, "Pretrain/Loss (Raw)": 2.043613910675049, "Pretrain/Step": 6634, "Pretrain/Step Time": 8.522395027801394} +{"Pretrain/Learning Rate": 1.1188932981113004e-05, "Pretrain/Loss": 2.0080127716064453, "Pretrain/Loss (Raw)": 2.0870282649993896, "Pretrain/Step": 6635, "Pretrain/Step Time": 8.520866299048066} +{"Pretrain/Learning Rate": 1.1181857036331792e-05, "Pretrain/Loss": 2.0073418617248535, "Pretrain/Loss (Raw)": 2.042590618133545, "Pretrain/Step": 6636, "Pretrain/Step Time": 8.517788695171475} +{"Pretrain/Learning Rate": 1.1174782685123918e-05, "Pretrain/Loss": 2.0079598426818848, "Pretrain/Loss (Raw)": 2.118217706680298, "Pretrain/Step": 6637, "Pretrain/Step Time": 8.523634627461433} +{"Pretrain/Learning Rate": 1.1167709928305265e-05, "Pretrain/Loss": 2.0053915977478027, "Pretrain/Loss (Raw)": 2.1978843212127686, "Pretrain/Step": 6638, "Pretrain/Step Time": 8.52607093192637} +{"Pretrain/Learning Rate": 1.1160638766691473e-05, "Pretrain/Loss": 2.000182628631592, "Pretrain/Loss (Raw)": 1.5471450090408325, "Pretrain/Step": 6639, "Pretrain/Step Time": 8.526493486016989} +{"Pretrain/Learning Rate": 1.1153569201098046e-05, "Pretrain/Loss": 1.9972467422485352, "Pretrain/Loss (Raw)": 1.7843393087387085, "Pretrain/Step": 6640, "Pretrain/Step Time": 8.527232956141233} +{"Pretrain/Learning Rate": 1.114650123234025e-05, "Pretrain/Loss": 1.9973692893981934, "Pretrain/Loss (Raw)": 2.090510368347168, "Pretrain/Step": 6641, "Pretrain/Step Time": 8.520824927836657} +{"Pretrain/Learning Rate": 1.1139434861233223e-05, "Pretrain/Loss": 2.0011816024780273, "Pretrain/Loss (Raw)": 2.111503839492798, "Pretrain/Step": 6642, "Pretrain/Step Time": 8.516732189804316} +{"Pretrain/Learning Rate": 1.1132370088591879e-05, "Pretrain/Loss": 2.0007524490356445, "Pretrain/Loss (Raw)": 1.895733118057251, "Pretrain/Step": 6643, "Pretrain/Step Time": 8.512262251228094} +{"Pretrain/Learning Rate": 1.1125306915230963e-05, "Pretrain/Loss": 2.0004160404205322, "Pretrain/Loss (Raw)": 2.0390069484710693, "Pretrain/Step": 6644, "Pretrain/Step Time": 8.513683332130313} +{"Pretrain/Learning Rate": 1.1118245341965022e-05, "Pretrain/Loss": 1.99911630153656, "Pretrain/Loss (Raw)": 1.7868971824645996, "Pretrain/Step": 6645, "Pretrain/Step Time": 8.508503772318363} +{"Pretrain/Learning Rate": 1.1111185369608454e-05, "Pretrain/Loss": 2.000347375869751, "Pretrain/Loss (Raw)": 1.9757264852523804, "Pretrain/Step": 6646, "Pretrain/Step Time": 8.510632462799549} +{"Pretrain/Learning Rate": 1.110412699897543e-05, "Pretrain/Loss": 2.0011136531829834, "Pretrain/Loss (Raw)": 2.0175936222076416, "Pretrain/Step": 6647, "Pretrain/Step Time": 8.51134174130857} +{"Pretrain/Learning Rate": 1.1097070230879965e-05, "Pretrain/Loss": 2.0018224716186523, "Pretrain/Loss (Raw)": 1.982321858406067, "Pretrain/Step": 6648, "Pretrain/Step Time": 8.506201334297657} +{"Pretrain/Learning Rate": 1.1090015066135865e-05, "Pretrain/Loss": 2.001713275909424, "Pretrain/Loss (Raw)": 2.034390926361084, "Pretrain/Step": 6649, "Pretrain/Step Time": 8.506695318967104} +{"Pretrain/Learning Rate": 1.108296150555678e-05, "Pretrain/Loss": 2.0030500888824463, "Pretrain/Loss (Raw)": 2.126948118209839, "Pretrain/Step": 6650, "Pretrain/Step Time": 8.510180711746216} +{"Pretrain/Learning Rate": 1.1075909549956154e-05, "Pretrain/Loss": 2.001908540725708, "Pretrain/Loss (Raw)": 2.0961103439331055, "Pretrain/Step": 6651, "Pretrain/Step Time": 8.50865863263607} +{"Pretrain/Learning Rate": 1.106885920014725e-05, "Pretrain/Loss": 1.9981598854064941, "Pretrain/Loss (Raw)": 1.9917165040969849, "Pretrain/Step": 6652, "Pretrain/Step Time": 8.508815705776215} +{"Pretrain/Learning Rate": 1.1061810456943142e-05, "Pretrain/Loss": 1.9996846914291382, "Pretrain/Loss (Raw)": 2.157417058944702, "Pretrain/Step": 6653, "Pretrain/Step Time": 8.5093894302845} +{"Pretrain/Learning Rate": 1.1054763321156738e-05, "Pretrain/Loss": 1.9985958337783813, "Pretrain/Loss (Raw)": 1.9638185501098633, "Pretrain/Step": 6654, "Pretrain/Step Time": 8.494722010567784} +{"Pretrain/Learning Rate": 1.1047717793600743e-05, "Pretrain/Loss": 1.999396562576294, "Pretrain/Loss (Raw)": 2.150550127029419, "Pretrain/Step": 6655, "Pretrain/Step Time": 8.499618107452989} +{"Pretrain/Learning Rate": 1.1040673875087673e-05, "Pretrain/Loss": 1.999330759048462, "Pretrain/Loss (Raw)": 1.950467586517334, "Pretrain/Step": 6656, "Pretrain/Step Time": 8.503006469458342} +{"Pretrain/Learning Rate": 1.1033631566429863e-05, "Pretrain/Loss": 2.0021908283233643, "Pretrain/Loss (Raw)": 2.448295831680298, "Pretrain/Step": 6657, "Pretrain/Step Time": 8.503311153501272} +{"Pretrain/Learning Rate": 1.1026590868439482e-05, "Pretrain/Loss": 2.002605438232422, "Pretrain/Loss (Raw)": 2.097024917602539, "Pretrain/Step": 6658, "Pretrain/Step Time": 8.50507466495037} +{"Pretrain/Learning Rate": 1.1019551781928489e-05, "Pretrain/Loss": 2.0022482872009277, "Pretrain/Loss (Raw)": 1.9022012948989868, "Pretrain/Step": 6659, "Pretrain/Step Time": 8.49766044691205} +{"Pretrain/Learning Rate": 1.1012514307708648e-05, "Pretrain/Loss": 2.001938819885254, "Pretrain/Loss (Raw)": 2.0836751461029053, "Pretrain/Step": 6660, "Pretrain/Step Time": 8.484129581600428} +{"Pretrain/Learning Rate": 1.1005478446591582e-05, "Pretrain/Loss": 2.0021448135375977, "Pretrain/Loss (Raw)": 2.003570556640625, "Pretrain/Step": 6661, "Pretrain/Step Time": 8.489466914907098} +{"Pretrain/Learning Rate": 1.0998444199388686e-05, "Pretrain/Loss": 2.0014584064483643, "Pretrain/Loss (Raw)": 1.9106448888778687, "Pretrain/Step": 6662, "Pretrain/Step Time": 8.497092489153147} +{"Pretrain/Learning Rate": 1.099141156691118e-05, "Pretrain/Loss": 2.001636505126953, "Pretrain/Loss (Raw)": 1.9770439863204956, "Pretrain/Step": 6663, "Pretrain/Step Time": 8.50343426503241} +{"Pretrain/Learning Rate": 1.0984380549970095e-05, "Pretrain/Loss": 2.0049386024475098, "Pretrain/Loss (Raw)": 1.9493986368179321, "Pretrain/Step": 6664, "Pretrain/Step Time": 8.50646011531353} +{"Pretrain/Learning Rate": 1.0977351149376297e-05, "Pretrain/Loss": 2.0031938552856445, "Pretrain/Loss (Raw)": 1.8515915870666504, "Pretrain/Step": 6665, "Pretrain/Step Time": 8.506767772138119} +{"Pretrain/Learning Rate": 1.0970323365940444e-05, "Pretrain/Loss": 2.0024023056030273, "Pretrain/Loss (Raw)": 2.0248944759368896, "Pretrain/Step": 6666, "Pretrain/Step Time": 8.503649819642305} +{"Pretrain/Learning Rate": 1.0963297200473007e-05, "Pretrain/Loss": 2.00254225730896, "Pretrain/Loss (Raw)": 2.133488416671753, "Pretrain/Step": 6667, "Pretrain/Step Time": 8.503234962001443} +{"Pretrain/Learning Rate": 1.0956272653784271e-05, "Pretrain/Loss": 2.002514362335205, "Pretrain/Loss (Raw)": 1.9505442380905151, "Pretrain/Step": 6668, "Pretrain/Step Time": 8.510743660852313} +{"Pretrain/Learning Rate": 1.094924972668436e-05, "Pretrain/Loss": 2.0030932426452637, "Pretrain/Loss (Raw)": 1.8768872022628784, "Pretrain/Step": 6669, "Pretrain/Step Time": 8.507620088756084} +{"Pretrain/Learning Rate": 1.0942228419983177e-05, "Pretrain/Loss": 2.0039072036743164, "Pretrain/Loss (Raw)": 2.0291872024536133, "Pretrain/Step": 6670, "Pretrain/Step Time": 8.507664883509278} +{"Pretrain/Learning Rate": 1.093520873449046e-05, "Pretrain/Loss": 2.0025885105133057, "Pretrain/Loss (Raw)": 2.1185388565063477, "Pretrain/Step": 6671, "Pretrain/Step Time": 8.503909358754754} +{"Pretrain/Learning Rate": 1.0928190671015734e-05, "Pretrain/Loss": 2.001018762588501, "Pretrain/Loss (Raw)": 1.7650946378707886, "Pretrain/Step": 6672, "Pretrain/Step Time": 8.494084177538753} +{"Pretrain/Learning Rate": 1.0921174230368378e-05, "Pretrain/Loss": 2.0010733604431152, "Pretrain/Loss (Raw)": 2.033090591430664, "Pretrain/Step": 6673, "Pretrain/Step Time": 8.49397288262844} +{"Pretrain/Learning Rate": 1.0914159413357553e-05, "Pretrain/Loss": 2.0009758472442627, "Pretrain/Loss (Raw)": 2.005124568939209, "Pretrain/Step": 6674, "Pretrain/Step Time": 8.50270121358335} +{"Pretrain/Learning Rate": 1.0907146220792236e-05, "Pretrain/Loss": 2.0009799003601074, "Pretrain/Loss (Raw)": 2.1616363525390625, "Pretrain/Step": 6675, "Pretrain/Step Time": 8.50464803352952} +{"Pretrain/Learning Rate": 1.0900134653481217e-05, "Pretrain/Loss": 2.0017428398132324, "Pretrain/Loss (Raw)": 2.0961568355560303, "Pretrain/Step": 6676, "Pretrain/Step Time": 8.512041501700878} +{"Pretrain/Learning Rate": 1.089312471223313e-05, "Pretrain/Loss": 2.0039076805114746, "Pretrain/Loss (Raw)": 2.115630626678467, "Pretrain/Step": 6677, "Pretrain/Step Time": 8.50882182456553} +{"Pretrain/Learning Rate": 1.0886116397856355e-05, "Pretrain/Loss": 2.005183696746826, "Pretrain/Loss (Raw)": 2.1260595321655273, "Pretrain/Step": 6678, "Pretrain/Step Time": 8.508799014613032} +{"Pretrain/Learning Rate": 1.0879109711159156e-05, "Pretrain/Loss": 2.0025124549865723, "Pretrain/Loss (Raw)": 1.6769448518753052, "Pretrain/Step": 6679, "Pretrain/Step Time": 8.506354348734021} +{"Pretrain/Learning Rate": 1.0872104652949552e-05, "Pretrain/Loss": 2.002805709838867, "Pretrain/Loss (Raw)": 2.057063579559326, "Pretrain/Step": 6680, "Pretrain/Step Time": 8.512035563588142} +{"Pretrain/Learning Rate": 1.0865101224035432e-05, "Pretrain/Loss": 2.002488851547241, "Pretrain/Loss (Raw)": 2.0011096000671387, "Pretrain/Step": 6681, "Pretrain/Step Time": 8.514831965789199} +{"Pretrain/Learning Rate": 1.0858099425224427e-05, "Pretrain/Loss": 2.00581693649292, "Pretrain/Loss (Raw)": 1.9774861335754395, "Pretrain/Step": 6682, "Pretrain/Step Time": 8.524854898452759} +{"Pretrain/Learning Rate": 1.0851099257324043e-05, "Pretrain/Loss": 2.007362127304077, "Pretrain/Loss (Raw)": 2.1376771926879883, "Pretrain/Step": 6683, "Pretrain/Step Time": 8.522507490590215} +{"Pretrain/Learning Rate": 1.0844100721141564e-05, "Pretrain/Loss": 2.008273124694824, "Pretrain/Loss (Raw)": 2.1150662899017334, "Pretrain/Step": 6684, "Pretrain/Step Time": 8.514650972560048} +{"Pretrain/Learning Rate": 1.0837103817484096e-05, "Pretrain/Loss": 2.006220817565918, "Pretrain/Loss (Raw)": 2.038813591003418, "Pretrain/Step": 6685, "Pretrain/Step Time": 8.511308094486594} +{"Pretrain/Learning Rate": 1.0830108547158544e-05, "Pretrain/Loss": 2.0073180198669434, "Pretrain/Loss (Raw)": 1.9868910312652588, "Pretrain/Step": 6686, "Pretrain/Step Time": 8.512420449405909} +{"Pretrain/Learning Rate": 1.0823114910971654e-05, "Pretrain/Loss": 2.003629446029663, "Pretrain/Loss (Raw)": 1.7631748914718628, "Pretrain/Step": 6687, "Pretrain/Step Time": 8.52232525497675} +{"Pretrain/Learning Rate": 1.0816122909729957e-05, "Pretrain/Loss": 2.0035815238952637, "Pretrain/Loss (Raw)": 1.885453701019287, "Pretrain/Step": 6688, "Pretrain/Step Time": 8.521968787536025} +{"Pretrain/Learning Rate": 1.0809132544239803e-05, "Pretrain/Loss": 2.001697301864624, "Pretrain/Loss (Raw)": 1.9087692499160767, "Pretrain/Step": 6689, "Pretrain/Step Time": 8.519168052822351} +{"Pretrain/Learning Rate": 1.0802143815307342e-05, "Pretrain/Loss": 2.0022995471954346, "Pretrain/Loss (Raw)": 2.004732608795166, "Pretrain/Step": 6690, "Pretrain/Step Time": 8.51464944705367} +{"Pretrain/Learning Rate": 1.079515672373857e-05, "Pretrain/Loss": 2.0021920204162598, "Pretrain/Loss (Raw)": 2.1342031955718994, "Pretrain/Step": 6691, "Pretrain/Step Time": 8.519093211740255} +{"Pretrain/Learning Rate": 1.078817127033926e-05, "Pretrain/Loss": 1.9993923902511597, "Pretrain/Loss (Raw)": 1.7551674842834473, "Pretrain/Step": 6692, "Pretrain/Step Time": 8.520325105637312} +{"Pretrain/Learning Rate": 1.0781187455915007e-05, "Pretrain/Loss": 1.9977322816848755, "Pretrain/Loss (Raw)": 1.832786202430725, "Pretrain/Step": 6693, "Pretrain/Step Time": 8.529841942712665} +{"Pretrain/Learning Rate": 1.0774205281271208e-05, "Pretrain/Loss": 1.9983932971954346, "Pretrain/Loss (Raw)": 2.060448408126831, "Pretrain/Step": 6694, "Pretrain/Step Time": 8.529018852859735} +{"Pretrain/Learning Rate": 1.0767224747213101e-05, "Pretrain/Loss": 1.9974064826965332, "Pretrain/Loss (Raw)": 1.8580378293991089, "Pretrain/Step": 6695, "Pretrain/Step Time": 8.52379359304905} +{"Pretrain/Learning Rate": 1.07602458545457e-05, "Pretrain/Loss": 1.9964442253112793, "Pretrain/Loss (Raw)": 1.8292615413665771, "Pretrain/Step": 6696, "Pretrain/Step Time": 8.520848346874118} +{"Pretrain/Learning Rate": 1.0753268604073849e-05, "Pretrain/Loss": 1.9952173233032227, "Pretrain/Loss (Raw)": 1.8010250329971313, "Pretrain/Step": 6697, "Pretrain/Step Time": 8.520630400627851} +{"Pretrain/Learning Rate": 1.0746292996602187e-05, "Pretrain/Loss": 1.9976723194122314, "Pretrain/Loss (Raw)": 2.176597833633423, "Pretrain/Step": 6698, "Pretrain/Step Time": 8.520886993035674} +{"Pretrain/Learning Rate": 1.0739319032935192e-05, "Pretrain/Loss": 1.9971754550933838, "Pretrain/Loss (Raw)": 1.89002525806427, "Pretrain/Step": 6699, "Pretrain/Step Time": 8.519969945773482} +{"Pretrain/Learning Rate": 1.0732346713877123e-05, "Pretrain/Loss": 1.9977807998657227, "Pretrain/Loss (Raw)": 2.0691940784454346, "Pretrain/Step": 6700, "Pretrain/Step Time": 8.522886173799634} +{"Pretrain/Learning Rate": 1.0725376040232052e-05, "Pretrain/Loss": 1.999640703201294, "Pretrain/Loss (Raw)": 2.1365621089935303, "Pretrain/Step": 6701, "Pretrain/Step Time": 8.519422324374318} +{"Pretrain/Learning Rate": 1.071840701280389e-05, "Pretrain/Loss": 2.000976324081421, "Pretrain/Loss (Raw)": 2.0205085277557373, "Pretrain/Step": 6702, "Pretrain/Step Time": 8.517430482432246} +{"Pretrain/Learning Rate": 1.071143963239633e-05, "Pretrain/Loss": 2.0001447200775146, "Pretrain/Loss (Raw)": 1.8937134742736816, "Pretrain/Step": 6703, "Pretrain/Step Time": 8.519107708707452} +{"Pretrain/Learning Rate": 1.0704473899812881e-05, "Pretrain/Loss": 1.9989995956420898, "Pretrain/Loss (Raw)": 1.669430136680603, "Pretrain/Step": 6704, "Pretrain/Step Time": 8.525155114009976} +{"Pretrain/Learning Rate": 1.0697509815856858e-05, "Pretrain/Loss": 1.9971864223480225, "Pretrain/Loss (Raw)": 1.7290441989898682, "Pretrain/Step": 6705, "Pretrain/Step Time": 8.529630271717906} +{"Pretrain/Learning Rate": 1.0690547381331403e-05, "Pretrain/Loss": 1.9969213008880615, "Pretrain/Loss (Raw)": 1.9941262006759644, "Pretrain/Step": 6706, "Pretrain/Step Time": 8.524658471345901} +{"Pretrain/Learning Rate": 1.0683586597039456e-05, "Pretrain/Loss": 1.9954334497451782, "Pretrain/Loss (Raw)": 1.9567636251449585, "Pretrain/Step": 6707, "Pretrain/Step Time": 8.51863569021225} +{"Pretrain/Learning Rate": 1.0676627463783762e-05, "Pretrain/Loss": 1.9960273504257202, "Pretrain/Loss (Raw)": 1.944414734840393, "Pretrain/Step": 6708, "Pretrain/Step Time": 8.516099343076348} +{"Pretrain/Learning Rate": 1.0669669982366873e-05, "Pretrain/Loss": 1.994652271270752, "Pretrain/Loss (Raw)": 2.1324355602264404, "Pretrain/Step": 6709, "Pretrain/Step Time": 8.515580771490932} +{"Pretrain/Learning Rate": 1.0662714153591177e-05, "Pretrain/Loss": 1.9980169534683228, "Pretrain/Loss (Raw)": 2.164788007736206, "Pretrain/Step": 6710, "Pretrain/Step Time": 8.520292127504945} +{"Pretrain/Learning Rate": 1.0655759978258847e-05, "Pretrain/Loss": 1.9973556995391846, "Pretrain/Loss (Raw)": 1.9129091501235962, "Pretrain/Step": 6711, "Pretrain/Step Time": 8.529976477846503} +{"Pretrain/Learning Rate": 1.0648807457171867e-05, "Pretrain/Loss": 1.9988691806793213, "Pretrain/Loss (Raw)": 2.0971813201904297, "Pretrain/Step": 6712, "Pretrain/Step Time": 8.524413708597422} +{"Pretrain/Learning Rate": 1.0641856591132027e-05, "Pretrain/Loss": 1.9985512495040894, "Pretrain/Loss (Raw)": 1.992851734161377, "Pretrain/Step": 6713, "Pretrain/Step Time": 8.515957091003656} +{"Pretrain/Learning Rate": 1.063490738094095e-05, "Pretrain/Loss": 2.0002126693725586, "Pretrain/Loss (Raw)": 2.2089221477508545, "Pretrain/Step": 6714, "Pretrain/Step Time": 8.520132692530751} +{"Pretrain/Learning Rate": 1.0627959827400047e-05, "Pretrain/Loss": 1.999474287033081, "Pretrain/Loss (Raw)": 1.8829350471496582, "Pretrain/Step": 6715, "Pretrain/Step Time": 8.51649365760386} +{"Pretrain/Learning Rate": 1.0621013931310541e-05, "Pretrain/Loss": 2.0011913776397705, "Pretrain/Loss (Raw)": 1.9914600849151611, "Pretrain/Step": 6716, "Pretrain/Step Time": 8.519390534609556} +{"Pretrain/Learning Rate": 1.0614069693473452e-05, "Pretrain/Loss": 2.0002615451812744, "Pretrain/Loss (Raw)": 2.0350520610809326, "Pretrain/Step": 6717, "Pretrain/Step Time": 8.523890333250165} +{"Pretrain/Learning Rate": 1.0607127114689655e-05, "Pretrain/Loss": 1.9981694221496582, "Pretrain/Loss (Raw)": 2.031276226043701, "Pretrain/Step": 6718, "Pretrain/Step Time": 8.519462553784251} +{"Pretrain/Learning Rate": 1.0600186195759762e-05, "Pretrain/Loss": 1.9970182180404663, "Pretrain/Loss (Raw)": 1.8937722444534302, "Pretrain/Step": 6719, "Pretrain/Step Time": 8.512917034327984} +{"Pretrain/Learning Rate": 1.0593246937484261e-05, "Pretrain/Loss": 1.9964079856872559, "Pretrain/Loss (Raw)": 1.902359962463379, "Pretrain/Step": 6720, "Pretrain/Step Time": 8.514832243323326} +{"Pretrain/Learning Rate": 1.05863093406634e-05, "Pretrain/Loss": 1.997227668762207, "Pretrain/Loss (Raw)": 1.777255892753601, "Pretrain/Step": 6721, "Pretrain/Step Time": 8.516934024170041} +{"Pretrain/Learning Rate": 1.0579373406097284e-05, "Pretrain/Loss": 1.9967749118804932, "Pretrain/Loss (Raw)": 1.8346928358078003, "Pretrain/Step": 6722, "Pretrain/Step Time": 8.513665130361915} +{"Pretrain/Learning Rate": 1.057243913458576e-05, "Pretrain/Loss": 1.9959783554077148, "Pretrain/Loss (Raw)": 1.860430121421814, "Pretrain/Step": 6723, "Pretrain/Step Time": 8.524025566875935} +{"Pretrain/Learning Rate": 1.0565506526928548e-05, "Pretrain/Loss": 1.9935582876205444, "Pretrain/Loss (Raw)": 1.7227412462234497, "Pretrain/Step": 6724, "Pretrain/Step Time": 8.520155588164926} +{"Pretrain/Learning Rate": 1.0558575583925143e-05, "Pretrain/Loss": 1.9918338060379028, "Pretrain/Loss (Raw)": 1.8921610116958618, "Pretrain/Step": 6725, "Pretrain/Step Time": 8.524467231705785} +{"Pretrain/Learning Rate": 1.0551646306374851e-05, "Pretrain/Loss": 1.9925901889801025, "Pretrain/Loss (Raw)": 2.0297603607177734, "Pretrain/Step": 6726, "Pretrain/Step Time": 8.527443217113614} +{"Pretrain/Learning Rate": 1.0544718695076783e-05, "Pretrain/Loss": 1.9925451278686523, "Pretrain/Loss (Raw)": 2.038858652114868, "Pretrain/Step": 6727, "Pretrain/Step Time": 8.523748315870762} +{"Pretrain/Learning Rate": 1.0537792750829875e-05, "Pretrain/Loss": 1.9933768510818481, "Pretrain/Loss (Raw)": 2.0140671730041504, "Pretrain/Step": 6728, "Pretrain/Step Time": 8.519364470615983} +{"Pretrain/Learning Rate": 1.053086847443286e-05, "Pretrain/Loss": 1.9939489364624023, "Pretrain/Loss (Raw)": 2.1065428256988525, "Pretrain/Step": 6729, "Pretrain/Step Time": 8.516719231382012} +{"Pretrain/Learning Rate": 1.052394586668427e-05, "Pretrain/Loss": 1.9933629035949707, "Pretrain/Loss (Raw)": 1.9783475399017334, "Pretrain/Step": 6730, "Pretrain/Step Time": 8.521013736724854} +{"Pretrain/Learning Rate": 1.0517024928382449e-05, "Pretrain/Loss": 1.9938106536865234, "Pretrain/Loss (Raw)": 1.9960637092590332, "Pretrain/Step": 6731, "Pretrain/Step Time": 8.516693480312824} +{"Pretrain/Learning Rate": 1.0510105660325567e-05, "Pretrain/Loss": 1.9940627813339233, "Pretrain/Loss (Raw)": 2.19250750541687, "Pretrain/Step": 6732, "Pretrain/Step Time": 8.51289676129818} +{"Pretrain/Learning Rate": 1.0503188063311578e-05, "Pretrain/Loss": 1.9969712495803833, "Pretrain/Loss (Raw)": 2.294067621231079, "Pretrain/Step": 6733, "Pretrain/Step Time": 8.51336445659399} +{"Pretrain/Learning Rate": 1.0496272138138255e-05, "Pretrain/Loss": 1.9933334589004517, "Pretrain/Loss (Raw)": 1.869672417640686, "Pretrain/Step": 6734, "Pretrain/Step Time": 8.514150554314256} +{"Pretrain/Learning Rate": 1.0489357885603162e-05, "Pretrain/Loss": 1.9951379299163818, "Pretrain/Loss (Raw)": 2.0881552696228027, "Pretrain/Step": 6735, "Pretrain/Step Time": 8.508283292874694} +{"Pretrain/Learning Rate": 1.0482445306503705e-05, "Pretrain/Loss": 1.9936282634735107, "Pretrain/Loss (Raw)": 1.9671443700790405, "Pretrain/Step": 6736, "Pretrain/Step Time": 8.507793562486768} +{"Pretrain/Learning Rate": 1.0475534401637063e-05, "Pretrain/Loss": 1.9925442934036255, "Pretrain/Loss (Raw)": 1.9090763330459595, "Pretrain/Step": 6737, "Pretrain/Step Time": 8.499237395823002} +{"Pretrain/Learning Rate": 1.0468625171800233e-05, "Pretrain/Loss": 1.995921015739441, "Pretrain/Loss (Raw)": 2.0470237731933594, "Pretrain/Step": 6738, "Pretrain/Step Time": 8.499806007370353} +{"Pretrain/Learning Rate": 1.0461717617790017e-05, "Pretrain/Loss": 1.9964288473129272, "Pretrain/Loss (Raw)": 1.8954946994781494, "Pretrain/Step": 6739, "Pretrain/Step Time": 8.509512227028608} +{"Pretrain/Learning Rate": 1.045481174040304e-05, "Pretrain/Loss": 1.9939509630203247, "Pretrain/Loss (Raw)": 1.9311988353729248, "Pretrain/Step": 6740, "Pretrain/Step Time": 8.509987169876695} +{"Pretrain/Learning Rate": 1.044790754043571e-05, "Pretrain/Loss": 1.9926843643188477, "Pretrain/Loss (Raw)": 1.9051319360733032, "Pretrain/Step": 6741, "Pretrain/Step Time": 8.509308066219091} +{"Pretrain/Learning Rate": 1.044100501868425e-05, "Pretrain/Loss": 1.9895250797271729, "Pretrain/Loss (Raw)": 1.914239525794983, "Pretrain/Step": 6742, "Pretrain/Step Time": 8.512563347816467} +{"Pretrain/Learning Rate": 1.0434104175944701e-05, "Pretrain/Loss": 1.9889239072799683, "Pretrain/Loss (Raw)": 1.894644021987915, "Pretrain/Step": 6743, "Pretrain/Step Time": 8.50635838881135} +{"Pretrain/Learning Rate": 1.0427205013012894e-05, "Pretrain/Loss": 1.990798830986023, "Pretrain/Loss (Raw)": 2.053858995437622, "Pretrain/Step": 6744, "Pretrain/Step Time": 8.506195656955242} +{"Pretrain/Learning Rate": 1.0420307530684478e-05, "Pretrain/Loss": 1.9895199537277222, "Pretrain/Loss (Raw)": 2.152797222137451, "Pretrain/Step": 6745, "Pretrain/Step Time": 8.515400284901261} +{"Pretrain/Learning Rate": 1.0413411729754887e-05, "Pretrain/Loss": 1.990055799484253, "Pretrain/Loss (Raw)": 2.2316536903381348, "Pretrain/Step": 6746, "Pretrain/Step Time": 8.51530140824616} +{"Pretrain/Learning Rate": 1.0406517611019401e-05, "Pretrain/Loss": 1.987810730934143, "Pretrain/Loss (Raw)": 1.7501651048660278, "Pretrain/Step": 6747, "Pretrain/Step Time": 8.50978852249682} +{"Pretrain/Learning Rate": 1.039962517527307e-05, "Pretrain/Loss": 1.9901485443115234, "Pretrain/Loss (Raw)": 2.035551071166992, "Pretrain/Step": 6748, "Pretrain/Step Time": 8.50968972593546} +{"Pretrain/Learning Rate": 1.0392734423310762e-05, "Pretrain/Loss": 1.9920133352279663, "Pretrain/Loss (Raw)": 2.1020753383636475, "Pretrain/Step": 6749, "Pretrain/Step Time": 8.505063438788056} +{"Pretrain/Learning Rate": 1.0385845355927144e-05, "Pretrain/Loss": 1.9942805767059326, "Pretrain/Loss (Raw)": 2.1379752159118652, "Pretrain/Step": 6750, "Pretrain/Step Time": 8.503255000337958} +{"Pretrain/Learning Rate": 1.0378957973916712e-05, "Pretrain/Loss": 1.9947805404663086, "Pretrain/Loss (Raw)": 2.110107660293579, "Pretrain/Step": 6751, "Pretrain/Step Time": 8.508608719334006} +{"Pretrain/Learning Rate": 1.0372072278073744e-05, "Pretrain/Loss": 1.994946002960205, "Pretrain/Loss (Raw)": 1.9661848545074463, "Pretrain/Step": 6752, "Pretrain/Step Time": 8.512615378946066} +{"Pretrain/Learning Rate": 1.036518826919233e-05, "Pretrain/Loss": 1.994831919670105, "Pretrain/Loss (Raw)": 2.0144665241241455, "Pretrain/Step": 6753, "Pretrain/Step Time": 8.510698346421123} +{"Pretrain/Learning Rate": 1.0358305948066355e-05, "Pretrain/Loss": 1.9944809675216675, "Pretrain/Loss (Raw)": 2.0004611015319824, "Pretrain/Step": 6754, "Pretrain/Step Time": 8.508368005976081} +{"Pretrain/Learning Rate": 1.0351425315489543e-05, "Pretrain/Loss": 1.994063377380371, "Pretrain/Loss (Raw)": 1.9573396444320679, "Pretrain/Step": 6755, "Pretrain/Step Time": 8.508823562413454} +{"Pretrain/Learning Rate": 1.034454637225539e-05, "Pretrain/Loss": 1.992630124092102, "Pretrain/Loss (Raw)": 2.0203585624694824, "Pretrain/Step": 6756, "Pretrain/Step Time": 8.501258227974176} +{"Pretrain/Learning Rate": 1.0337669119157208e-05, "Pretrain/Loss": 1.9909855127334595, "Pretrain/Loss (Raw)": 1.9097018241882324, "Pretrain/Step": 6757, "Pretrain/Step Time": 8.508755205199122} +{"Pretrain/Learning Rate": 1.0330793556988106e-05, "Pretrain/Loss": 1.9918944835662842, "Pretrain/Loss (Raw)": 1.949205994606018, "Pretrain/Step": 6758, "Pretrain/Step Time": 8.512729683890939} +{"Pretrain/Learning Rate": 1.032391968654103e-05, "Pretrain/Loss": 1.9909335374832153, "Pretrain/Loss (Raw)": 1.8809128999710083, "Pretrain/Step": 6759, "Pretrain/Step Time": 8.512452168390155} +{"Pretrain/Learning Rate": 1.0317047508608677e-05, "Pretrain/Loss": 1.9929617643356323, "Pretrain/Loss (Raw)": 2.0484578609466553, "Pretrain/Step": 6760, "Pretrain/Step Time": 8.508939625695348} +{"Pretrain/Learning Rate": 1.03101770239836e-05, "Pretrain/Loss": 1.9903613328933716, "Pretrain/Loss (Raw)": 1.8839466571807861, "Pretrain/Step": 6761, "Pretrain/Step Time": 8.505973158404231} +{"Pretrain/Learning Rate": 1.0303308233458123e-05, "Pretrain/Loss": 1.9897074699401855, "Pretrain/Loss (Raw)": 1.959925889968872, "Pretrain/Step": 6762, "Pretrain/Step Time": 8.504385670647025} +{"Pretrain/Learning Rate": 1.029644113782441e-05, "Pretrain/Loss": 1.9888197183609009, "Pretrain/Loss (Raw)": 1.9733856916427612, "Pretrain/Step": 6763, "Pretrain/Step Time": 8.504080437123775} +{"Pretrain/Learning Rate": 1.0289575737874372e-05, "Pretrain/Loss": 1.9886658191680908, "Pretrain/Loss (Raw)": 2.022907257080078, "Pretrain/Step": 6764, "Pretrain/Step Time": 8.504378277808428} +{"Pretrain/Learning Rate": 1.0282712034399785e-05, "Pretrain/Loss": 1.9880081415176392, "Pretrain/Loss (Raw)": 2.0340182781219482, "Pretrain/Step": 6765, "Pretrain/Step Time": 8.508411016315222} +{"Pretrain/Learning Rate": 1.0275850028192192e-05, "Pretrain/Loss": 1.9855811595916748, "Pretrain/Loss (Raw)": 1.8872413635253906, "Pretrain/Step": 6766, "Pretrain/Step Time": 8.502581978216767} +{"Pretrain/Learning Rate": 1.026898972004297e-05, "Pretrain/Loss": 1.9890152215957642, "Pretrain/Loss (Raw)": 1.9867099523544312, "Pretrain/Step": 6767, "Pretrain/Step Time": 8.501127718016505} +{"Pretrain/Learning Rate": 1.0262131110743254e-05, "Pretrain/Loss": 1.9921715259552002, "Pretrain/Loss (Raw)": 2.188338279724121, "Pretrain/Step": 6768, "Pretrain/Step Time": 8.504932183772326} +{"Pretrain/Learning Rate": 1.0255274201084031e-05, "Pretrain/Loss": 1.99168860912323, "Pretrain/Loss (Raw)": 2.028695821762085, "Pretrain/Step": 6769, "Pretrain/Step Time": 8.514404339715838} +{"Pretrain/Learning Rate": 1.0248418991856068e-05, "Pretrain/Loss": 1.9902441501617432, "Pretrain/Loss (Raw)": 1.926618218421936, "Pretrain/Step": 6770, "Pretrain/Step Time": 8.515805065631866} +{"Pretrain/Learning Rate": 1.0241565483849939e-05, "Pretrain/Loss": 1.991909146308899, "Pretrain/Loss (Raw)": 2.1088409423828125, "Pretrain/Step": 6771, "Pretrain/Step Time": 8.514450553804636} +{"Pretrain/Learning Rate": 1.0234713677856011e-05, "Pretrain/Loss": 1.991384744644165, "Pretrain/Loss (Raw)": 1.9718924760818481, "Pretrain/Step": 6772, "Pretrain/Step Time": 8.506832107901573} +{"Pretrain/Learning Rate": 1.022786357466449e-05, "Pretrain/Loss": 1.9947795867919922, "Pretrain/Loss (Raw)": 2.2214314937591553, "Pretrain/Step": 6773, "Pretrain/Step Time": 8.506145367398858} +{"Pretrain/Learning Rate": 1.022101517506535e-05, "Pretrain/Loss": 1.9954866170883179, "Pretrain/Loss (Raw)": 2.06622314453125, "Pretrain/Step": 6774, "Pretrain/Step Time": 8.505006697028875} +{"Pretrain/Learning Rate": 1.021416847984838e-05, "Pretrain/Loss": 1.994199275970459, "Pretrain/Loss (Raw)": 1.852823257446289, "Pretrain/Step": 6775, "Pretrain/Step Time": 8.509411623701453} +{"Pretrain/Learning Rate": 1.0207323489803164e-05, "Pretrain/Loss": 1.9946131706237793, "Pretrain/Loss (Raw)": 2.0352978706359863, "Pretrain/Step": 6776, "Pretrain/Step Time": 8.523073133081198} +{"Pretrain/Learning Rate": 1.0200480205719118e-05, "Pretrain/Loss": 1.993504285812378, "Pretrain/Loss (Raw)": 1.892451524734497, "Pretrain/Step": 6777, "Pretrain/Step Time": 8.523119129240513} +{"Pretrain/Learning Rate": 1.0193638628385433e-05, "Pretrain/Loss": 1.993574619293213, "Pretrain/Loss (Raw)": 2.135952949523926, "Pretrain/Step": 6778, "Pretrain/Step Time": 8.520877800881863} +{"Pretrain/Learning Rate": 1.0186798758591112e-05, "Pretrain/Loss": 1.9921109676361084, "Pretrain/Loss (Raw)": 1.908756136894226, "Pretrain/Step": 6779, "Pretrain/Step Time": 8.51961386948824} +{"Pretrain/Learning Rate": 1.017996059712495e-05, "Pretrain/Loss": 1.99204421043396, "Pretrain/Loss (Raw)": 1.9831836223602295, "Pretrain/Step": 6780, "Pretrain/Step Time": 8.525298487395048} +{"Pretrain/Learning Rate": 1.0173124144775576e-05, "Pretrain/Loss": 1.9911537170410156, "Pretrain/Loss (Raw)": 2.043430805206299, "Pretrain/Step": 6781, "Pretrain/Step Time": 8.532397128641605} +{"Pretrain/Learning Rate": 1.0166289402331391e-05, "Pretrain/Loss": 1.9943344593048096, "Pretrain/Loss (Raw)": 2.370936393737793, "Pretrain/Step": 6782, "Pretrain/Step Time": 8.532964739948511} +{"Pretrain/Learning Rate": 1.0159456370580604e-05, "Pretrain/Loss": 1.9937657117843628, "Pretrain/Loss (Raw)": 2.0777621269226074, "Pretrain/Step": 6783, "Pretrain/Step Time": 8.527509277686477} +{"Pretrain/Learning Rate": 1.0152625050311247e-05, "Pretrain/Loss": 1.9934000968933105, "Pretrain/Loss (Raw)": 1.9036749601364136, "Pretrain/Step": 6784, "Pretrain/Step Time": 8.52418053150177} +{"Pretrain/Learning Rate": 1.0145795442311132e-05, "Pretrain/Loss": 1.9891211986541748, "Pretrain/Loss (Raw)": 1.9005917310714722, "Pretrain/Step": 6785, "Pretrain/Step Time": 8.52114531956613} +{"Pretrain/Learning Rate": 1.0138967547367882e-05, "Pretrain/Loss": 1.9895927906036377, "Pretrain/Loss (Raw)": 2.157388925552368, "Pretrain/Step": 6786, "Pretrain/Step Time": 8.525362180545926} +{"Pretrain/Learning Rate": 1.0132141366268913e-05, "Pretrain/Loss": 1.9906964302062988, "Pretrain/Loss (Raw)": 2.0434720516204834, "Pretrain/Step": 6787, "Pretrain/Step Time": 8.529198538511992} +{"Pretrain/Learning Rate": 1.012531689980147e-05, "Pretrain/Loss": 1.9916291236877441, "Pretrain/Loss (Raw)": 2.2030675411224365, "Pretrain/Step": 6788, "Pretrain/Step Time": 8.535458007827401} +{"Pretrain/Learning Rate": 1.0118494148752575e-05, "Pretrain/Loss": 1.9929943084716797, "Pretrain/Loss (Raw)": 2.178305149078369, "Pretrain/Step": 6789, "Pretrain/Step Time": 8.536424554884434} +{"Pretrain/Learning Rate": 1.0111673113909056e-05, "Pretrain/Loss": 1.9943277835845947, "Pretrain/Loss (Raw)": 2.081326484680176, "Pretrain/Step": 6790, "Pretrain/Step Time": 8.5279371291399} +{"Pretrain/Learning Rate": 1.0104853796057546e-05, "Pretrain/Loss": 1.9944015741348267, "Pretrain/Loss (Raw)": 1.986495018005371, "Pretrain/Step": 6791, "Pretrain/Step Time": 8.521111864596605} +{"Pretrain/Learning Rate": 1.009803619598449e-05, "Pretrain/Loss": 1.9935921430587769, "Pretrain/Loss (Raw)": 1.8457896709442139, "Pretrain/Step": 6792, "Pretrain/Step Time": 8.51801947876811} +{"Pretrain/Learning Rate": 1.0091220314476119e-05, "Pretrain/Loss": 1.9952211380004883, "Pretrain/Loss (Raw)": 2.060105800628662, "Pretrain/Step": 6793, "Pretrain/Step Time": 8.524411495774984} +{"Pretrain/Learning Rate": 1.0084406152318473e-05, "Pretrain/Loss": 1.9951989650726318, "Pretrain/Loss (Raw)": 2.022047519683838, "Pretrain/Step": 6794, "Pretrain/Step Time": 8.521046381443739} +{"Pretrain/Learning Rate": 1.007759371029739e-05, "Pretrain/Loss": 1.9937734603881836, "Pretrain/Loss (Raw)": 1.9510340690612793, "Pretrain/Step": 6795, "Pretrain/Step Time": 8.524543860927224} +{"Pretrain/Learning Rate": 1.0070782989198521e-05, "Pretrain/Loss": 1.9948996305465698, "Pretrain/Loss (Raw)": 2.094697952270508, "Pretrain/Step": 6796, "Pretrain/Step Time": 8.513854183256626} +{"Pretrain/Learning Rate": 1.006397398980731e-05, "Pretrain/Loss": 1.9947947263717651, "Pretrain/Loss (Raw)": 1.8634570837020874, "Pretrain/Step": 6797, "Pretrain/Step Time": 8.514968622475863} +{"Pretrain/Learning Rate": 1.0057166712908996e-05, "Pretrain/Loss": 1.9944214820861816, "Pretrain/Loss (Raw)": 1.9813909530639648, "Pretrain/Step": 6798, "Pretrain/Step Time": 8.517672533169389} +{"Pretrain/Learning Rate": 1.0050361159288625e-05, "Pretrain/Loss": 1.993443489074707, "Pretrain/Loss (Raw)": 1.9933648109436035, "Pretrain/Step": 6799, "Pretrain/Step Time": 8.522395957261324} +{"Pretrain/Learning Rate": 1.0043557329731065e-05, "Pretrain/Loss": 1.9950840473175049, "Pretrain/Loss (Raw)": 1.975082278251648, "Pretrain/Step": 6800, "Pretrain/Step Time": 8.528093367815018} +{"Pretrain/Learning Rate": 1.0036755225020933e-05, "Pretrain/Loss": 1.9947917461395264, "Pretrain/Loss (Raw)": 1.995690107345581, "Pretrain/Step": 6801, "Pretrain/Step Time": 8.529075717553496} +{"Pretrain/Learning Rate": 1.0029954845942707e-05, "Pretrain/Loss": 1.9961819648742676, "Pretrain/Loss (Raw)": 2.1830625534057617, "Pretrain/Step": 6802, "Pretrain/Step Time": 8.518443364650011} +{"Pretrain/Learning Rate": 1.0023156193280622e-05, "Pretrain/Loss": 1.9942398071289062, "Pretrain/Loss (Raw)": 1.9130579233169556, "Pretrain/Step": 6803, "Pretrain/Step Time": 8.513262007385492} +{"Pretrain/Learning Rate": 1.0016359267818754e-05, "Pretrain/Loss": 1.9932565689086914, "Pretrain/Loss (Raw)": 1.9702975749969482, "Pretrain/Step": 6804, "Pretrain/Step Time": 8.50625322572887} +{"Pretrain/Learning Rate": 1.0009564070340924e-05, "Pretrain/Loss": 1.9920992851257324, "Pretrain/Loss (Raw)": 1.9674819707870483, "Pretrain/Step": 6805, "Pretrain/Step Time": 8.505580281838775} +{"Pretrain/Learning Rate": 1.0002770601630809e-05, "Pretrain/Loss": 1.9902136325836182, "Pretrain/Loss (Raw)": 1.8847156763076782, "Pretrain/Step": 6806, "Pretrain/Step Time": 8.517313884571195} +{"Pretrain/Learning Rate": 9.99597886247185e-06, "Pretrain/Loss": 1.9940929412841797, "Pretrain/Loss (Raw)": 2.1734817028045654, "Pretrain/Step": 6807, "Pretrain/Step Time": 8.52197353541851} +{"Pretrain/Learning Rate": 9.98918885364733e-06, "Pretrain/Loss": 1.992293357849121, "Pretrain/Loss (Raw)": 1.8267241716384888, "Pretrain/Step": 6808, "Pretrain/Step Time": 8.51761731505394} +{"Pretrain/Learning Rate": 9.982400575940262e-06, "Pretrain/Loss": 1.9912750720977783, "Pretrain/Loss (Raw)": 1.8707644939422607, "Pretrain/Step": 6809, "Pretrain/Step Time": 8.514161644503474} +{"Pretrain/Learning Rate": 9.975614030133537e-06, "Pretrain/Loss": 1.991422176361084, "Pretrain/Loss (Raw)": 1.9963147640228271, "Pretrain/Step": 6810, "Pretrain/Step Time": 8.503205811604857} +{"Pretrain/Learning Rate": 9.968829217009802e-06, "Pretrain/Loss": 1.9904022216796875, "Pretrain/Loss (Raw)": 2.0071356296539307, "Pretrain/Step": 6811, "Pretrain/Step Time": 8.507702955976129} +{"Pretrain/Learning Rate": 9.962046137351505e-06, "Pretrain/Loss": 1.9892373085021973, "Pretrain/Loss (Raw)": 1.9659544229507446, "Pretrain/Step": 6812, "Pretrain/Step Time": 8.513841424137354} +{"Pretrain/Learning Rate": 9.955264791940902e-06, "Pretrain/Loss": 1.989316463470459, "Pretrain/Loss (Raw)": 2.0489394664764404, "Pretrain/Step": 6813, "Pretrain/Step Time": 8.515839958563447} +{"Pretrain/Learning Rate": 9.948485181560066e-06, "Pretrain/Loss": 1.9896619319915771, "Pretrain/Loss (Raw)": 2.0311169624328613, "Pretrain/Step": 6814, "Pretrain/Step Time": 8.516977675259113} +{"Pretrain/Learning Rate": 9.941707306990843e-06, "Pretrain/Loss": 1.9905636310577393, "Pretrain/Loss (Raw)": 1.8785855770111084, "Pretrain/Step": 6815, "Pretrain/Step Time": 8.50678476318717} +{"Pretrain/Learning Rate": 9.934931169014891e-06, "Pretrain/Loss": 1.9928436279296875, "Pretrain/Loss (Raw)": 2.177279472351074, "Pretrain/Step": 6816, "Pretrain/Step Time": 8.508692713454366} +{"Pretrain/Learning Rate": 9.928156768413657e-06, "Pretrain/Loss": 1.9939929246902466, "Pretrain/Loss (Raw)": 2.055881977081299, "Pretrain/Step": 6817, "Pretrain/Step Time": 8.512998370453715} +{"Pretrain/Learning Rate": 9.921384105968415e-06, "Pretrain/Loss": 1.9939684867858887, "Pretrain/Loss (Raw)": 2.0016186237335205, "Pretrain/Step": 6818, "Pretrain/Step Time": 8.51769370958209} +{"Pretrain/Learning Rate": 9.914613182460208e-06, "Pretrain/Loss": 1.9938173294067383, "Pretrain/Loss (Raw)": 2.114856719970703, "Pretrain/Step": 6819, "Pretrain/Step Time": 8.511684276163578} +{"Pretrain/Learning Rate": 9.907843998669895e-06, "Pretrain/Loss": 1.995253562927246, "Pretrain/Loss (Raw)": 1.9390192031860352, "Pretrain/Step": 6820, "Pretrain/Step Time": 8.50902390666306} +{"Pretrain/Learning Rate": 9.90107655537812e-06, "Pretrain/Loss": 1.995936393737793, "Pretrain/Loss (Raw)": 1.920163631439209, "Pretrain/Step": 6821, "Pretrain/Step Time": 8.50054401345551} +{"Pretrain/Learning Rate": 9.894310853365354e-06, "Pretrain/Loss": 1.9959691762924194, "Pretrain/Loss (Raw)": 2.0646536350250244, "Pretrain/Step": 6822, "Pretrain/Step Time": 8.507284523919225} +{"Pretrain/Learning Rate": 9.887546893411839e-06, "Pretrain/Loss": 1.9992426633834839, "Pretrain/Loss (Raw)": 2.277022123336792, "Pretrain/Step": 6823, "Pretrain/Step Time": 8.50783108919859} +{"Pretrain/Learning Rate": 9.880784676297622e-06, "Pretrain/Loss": 2.005232334136963, "Pretrain/Loss (Raw)": 2.595933437347412, "Pretrain/Step": 6824, "Pretrain/Step Time": 8.511692594736814} +{"Pretrain/Learning Rate": 9.874024202802567e-06, "Pretrain/Loss": 2.0063014030456543, "Pretrain/Loss (Raw)": 1.9378774166107178, "Pretrain/Step": 6825, "Pretrain/Step Time": 8.512831376865506} +{"Pretrain/Learning Rate": 9.867265473706319e-06, "Pretrain/Loss": 2.003103494644165, "Pretrain/Loss (Raw)": 1.7672851085662842, "Pretrain/Step": 6826, "Pretrain/Step Time": 8.508620174601674} +{"Pretrain/Learning Rate": 9.860508489788323e-06, "Pretrain/Loss": 2.0050220489501953, "Pretrain/Loss (Raw)": 2.1355834007263184, "Pretrain/Step": 6827, "Pretrain/Step Time": 8.511692373082042} +{"Pretrain/Learning Rate": 9.853753251827818e-06, "Pretrain/Loss": 2.004326343536377, "Pretrain/Loss (Raw)": 1.9801380634307861, "Pretrain/Step": 6828, "Pretrain/Step Time": 8.509255435317755} +{"Pretrain/Learning Rate": 9.84699976060387e-06, "Pretrain/Loss": 2.0012755393981934, "Pretrain/Loss (Raw)": 1.7460473775863647, "Pretrain/Step": 6829, "Pretrain/Step Time": 8.50334076397121} +{"Pretrain/Learning Rate": 9.840248016895311e-06, "Pretrain/Loss": 1.9992331266403198, "Pretrain/Loss (Raw)": 1.7591092586517334, "Pretrain/Step": 6830, "Pretrain/Step Time": 8.511204754933715} +{"Pretrain/Learning Rate": 9.833498021480789e-06, "Pretrain/Loss": 1.999157190322876, "Pretrain/Loss (Raw)": 1.883989691734314, "Pretrain/Step": 6831, "Pretrain/Step Time": 8.502705048769712} +{"Pretrain/Learning Rate": 9.82674977513873e-06, "Pretrain/Loss": 2.001147747039795, "Pretrain/Loss (Raw)": 1.9242205619812012, "Pretrain/Step": 6832, "Pretrain/Step Time": 8.497236033901572} +{"Pretrain/Learning Rate": 9.820003278647396e-06, "Pretrain/Loss": 2.0033681392669678, "Pretrain/Loss (Raw)": 2.0132522583007812, "Pretrain/Step": 6833, "Pretrain/Step Time": 8.49984361231327} +{"Pretrain/Learning Rate": 9.813258532784813e-06, "Pretrain/Loss": 2.002967596054077, "Pretrain/Loss (Raw)": 1.942867636680603, "Pretrain/Step": 6834, "Pretrain/Step Time": 8.507687907665968} +{"Pretrain/Learning Rate": 9.80651553832882e-06, "Pretrain/Loss": 2.0030295848846436, "Pretrain/Loss (Raw)": 1.964686632156372, "Pretrain/Step": 6835, "Pretrain/Step Time": 8.51212385110557} +{"Pretrain/Learning Rate": 9.79977429605704e-06, "Pretrain/Loss": 2.002695083618164, "Pretrain/Loss (Raw)": 1.9016119241714478, "Pretrain/Step": 6836, "Pretrain/Step Time": 8.514403246343136} +{"Pretrain/Learning Rate": 9.793034806746922e-06, "Pretrain/Loss": 2.002150297164917, "Pretrain/Loss (Raw)": 2.062699556350708, "Pretrain/Step": 6837, "Pretrain/Step Time": 8.513567009940743} +{"Pretrain/Learning Rate": 9.786297071175687e-06, "Pretrain/Loss": 1.9984400272369385, "Pretrain/Loss (Raw)": 1.6898597478866577, "Pretrain/Step": 6838, "Pretrain/Step Time": 8.508950946852565} +{"Pretrain/Learning Rate": 9.779561090120366e-06, "Pretrain/Loss": 1.9978044033050537, "Pretrain/Loss (Raw)": 1.831541657447815, "Pretrain/Step": 6839, "Pretrain/Step Time": 8.506809959188104} +{"Pretrain/Learning Rate": 9.77282686435777e-06, "Pretrain/Loss": 1.99726140499115, "Pretrain/Loss (Raw)": 2.027683973312378, "Pretrain/Step": 6840, "Pretrain/Step Time": 8.505922315642238} +{"Pretrain/Learning Rate": 9.766094394664551e-06, "Pretrain/Loss": 1.9973030090332031, "Pretrain/Loss (Raw)": 1.9981932640075684, "Pretrain/Step": 6841, "Pretrain/Step Time": 8.512356616556644} +{"Pretrain/Learning Rate": 9.759363681817093e-06, "Pretrain/Loss": 1.9949274063110352, "Pretrain/Loss (Raw)": 1.9048357009887695, "Pretrain/Step": 6842, "Pretrain/Step Time": 8.511816153302789} +{"Pretrain/Learning Rate": 9.752634726591642e-06, "Pretrain/Loss": 1.994654655456543, "Pretrain/Loss (Raw)": 1.8480175733566284, "Pretrain/Step": 6843, "Pretrain/Step Time": 8.508508363738656} +{"Pretrain/Learning Rate": 9.745907529764189e-06, "Pretrain/Loss": 1.9945510625839233, "Pretrain/Loss (Raw)": 1.9782071113586426, "Pretrain/Step": 6844, "Pretrain/Step Time": 8.503682438284159} +{"Pretrain/Learning Rate": 9.739182092110583e-06, "Pretrain/Loss": 1.9928112030029297, "Pretrain/Loss (Raw)": 1.8123422861099243, "Pretrain/Step": 6845, "Pretrain/Step Time": 8.503354644402862} +{"Pretrain/Learning Rate": 9.732458414406387e-06, "Pretrain/Loss": 1.99430513381958, "Pretrain/Loss (Raw)": 2.222503185272217, "Pretrain/Step": 6846, "Pretrain/Step Time": 8.510584231466055} +{"Pretrain/Learning Rate": 9.72573649742704e-06, "Pretrain/Loss": 1.9973413944244385, "Pretrain/Loss (Raw)": 2.2824203968048096, "Pretrain/Step": 6847, "Pretrain/Step Time": 8.508688017725945} +{"Pretrain/Learning Rate": 9.719016341947726e-06, "Pretrain/Loss": 1.9985203742980957, "Pretrain/Loss (Raw)": 2.0532655715942383, "Pretrain/Step": 6848, "Pretrain/Step Time": 8.506811687722802} +{"Pretrain/Learning Rate": 9.712297948743473e-06, "Pretrain/Loss": 2.001793622970581, "Pretrain/Loss (Raw)": 2.196232557296753, "Pretrain/Step": 6849, "Pretrain/Step Time": 8.503266390413046} +{"Pretrain/Learning Rate": 9.705581318589038e-06, "Pretrain/Loss": 2.002718448638916, "Pretrain/Loss (Raw)": 1.953069806098938, "Pretrain/Step": 6850, "Pretrain/Step Time": 8.506557801738381} +{"Pretrain/Learning Rate": 9.698866452259048e-06, "Pretrain/Loss": 2.0031819343566895, "Pretrain/Loss (Raw)": 1.919732689857483, "Pretrain/Step": 6851, "Pretrain/Step Time": 8.498066833242774} +{"Pretrain/Learning Rate": 9.692153350527877e-06, "Pretrain/Loss": 2.0069761276245117, "Pretrain/Loss (Raw)": 2.2084290981292725, "Pretrain/Step": 6852, "Pretrain/Step Time": 8.504992814734578} +{"Pretrain/Learning Rate": 9.685442014169715e-06, "Pretrain/Loss": 2.008145570755005, "Pretrain/Loss (Raw)": 2.0418429374694824, "Pretrain/Step": 6853, "Pretrain/Step Time": 8.50608054921031} +{"Pretrain/Learning Rate": 9.678732443958535e-06, "Pretrain/Loss": 2.007789134979248, "Pretrain/Loss (Raw)": 1.9841288328170776, "Pretrain/Step": 6854, "Pretrain/Step Time": 8.507840706035495} +{"Pretrain/Learning Rate": 9.672024640668134e-06, "Pretrain/Loss": 2.004422187805176, "Pretrain/Loss (Raw)": 1.6078733205795288, "Pretrain/Step": 6855, "Pretrain/Step Time": 8.507294990122318} +{"Pretrain/Learning Rate": 9.665318605072082e-06, "Pretrain/Loss": 2.0052294731140137, "Pretrain/Loss (Raw)": 2.1174092292785645, "Pretrain/Step": 6856, "Pretrain/Step Time": 8.507577693089843} +{"Pretrain/Learning Rate": 9.658614337943748e-06, "Pretrain/Loss": 2.0052649974823, "Pretrain/Loss (Raw)": 2.111100435256958, "Pretrain/Step": 6857, "Pretrain/Step Time": 8.506146464496851} +{"Pretrain/Learning Rate": 9.651911840056287e-06, "Pretrain/Loss": 2.0057876110076904, "Pretrain/Loss (Raw)": 2.0452585220336914, "Pretrain/Step": 6858, "Pretrain/Step Time": 8.509939281269908} +{"Pretrain/Learning Rate": 9.645211112182687e-06, "Pretrain/Loss": 2.00618052482605, "Pretrain/Loss (Raw)": 2.0463485717773438, "Pretrain/Step": 6859, "Pretrain/Step Time": 8.509226137772202} +{"Pretrain/Learning Rate": 9.638512155095694e-06, "Pretrain/Loss": 2.005302906036377, "Pretrain/Loss (Raw)": 2.0801756381988525, "Pretrain/Step": 6860, "Pretrain/Step Time": 8.509427500888705} +{"Pretrain/Learning Rate": 9.631814969567866e-06, "Pretrain/Loss": 2.0013203620910645, "Pretrain/Loss (Raw)": 1.7843034267425537, "Pretrain/Step": 6861, "Pretrain/Step Time": 8.503180023282766} +{"Pretrain/Learning Rate": 9.625119556371542e-06, "Pretrain/Loss": 2.0055794715881348, "Pretrain/Loss (Raw)": 2.4148151874542236, "Pretrain/Step": 6862, "Pretrain/Step Time": 8.499054415151477} +{"Pretrain/Learning Rate": 9.618425916278891e-06, "Pretrain/Loss": 2.0052719116210938, "Pretrain/Loss (Raw)": 2.0487897396087646, "Pretrain/Step": 6863, "Pretrain/Step Time": 8.506401604041457} +{"Pretrain/Learning Rate": 9.611734050061844e-06, "Pretrain/Loss": 2.005138397216797, "Pretrain/Loss (Raw)": 1.9500521421432495, "Pretrain/Step": 6864, "Pretrain/Step Time": 8.513762183487415} +{"Pretrain/Learning Rate": 9.605043958492127e-06, "Pretrain/Loss": 2.0063254833221436, "Pretrain/Loss (Raw)": 2.0610365867614746, "Pretrain/Step": 6865, "Pretrain/Step Time": 8.512946177273989} +{"Pretrain/Learning Rate": 9.598355642341294e-06, "Pretrain/Loss": 2.0027453899383545, "Pretrain/Loss (Raw)": 1.588767170906067, "Pretrain/Step": 6866, "Pretrain/Step Time": 8.511816633865237} +{"Pretrain/Learning Rate": 9.591669102380666e-06, "Pretrain/Loss": 2.001832962036133, "Pretrain/Loss (Raw)": 1.7787014245986938, "Pretrain/Step": 6867, "Pretrain/Step Time": 8.50235391035676} +{"Pretrain/Learning Rate": 9.584984339381362e-06, "Pretrain/Loss": 2.001913070678711, "Pretrain/Loss (Raw)": 1.9414892196655273, "Pretrain/Step": 6868, "Pretrain/Step Time": 8.50187454558909} +{"Pretrain/Learning Rate": 9.578301354114291e-06, "Pretrain/Loss": 2.0006468296051025, "Pretrain/Loss (Raw)": 1.743022084236145, "Pretrain/Step": 6869, "Pretrain/Step Time": 8.505202593281865} +{"Pretrain/Learning Rate": 9.571620147350188e-06, "Pretrain/Loss": 1.9995795488357544, "Pretrain/Loss (Raw)": 1.7776180505752563, "Pretrain/Step": 6870, "Pretrain/Step Time": 8.511672731488943} +{"Pretrain/Learning Rate": 9.56494071985955e-06, "Pretrain/Loss": 1.9998008012771606, "Pretrain/Loss (Raw)": 1.9229785203933716, "Pretrain/Step": 6871, "Pretrain/Step Time": 8.510834315791726} +{"Pretrain/Learning Rate": 9.558263072412679e-06, "Pretrain/Loss": 1.9986255168914795, "Pretrain/Loss (Raw)": 1.9034231901168823, "Pretrain/Step": 6872, "Pretrain/Step Time": 8.507957769557834} +{"Pretrain/Learning Rate": 9.551587205779666e-06, "Pretrain/Loss": 1.997843623161316, "Pretrain/Loss (Raw)": 2.05271577835083, "Pretrain/Step": 6873, "Pretrain/Step Time": 8.503650838509202} +{"Pretrain/Learning Rate": 9.544913120730423e-06, "Pretrain/Loss": 1.9970800876617432, "Pretrain/Loss (Raw)": 2.1339285373687744, "Pretrain/Step": 6874, "Pretrain/Step Time": 8.502257823944092} +{"Pretrain/Learning Rate": 9.538240818034624e-06, "Pretrain/Loss": 1.9997535943984985, "Pretrain/Loss (Raw)": 2.092362642288208, "Pretrain/Step": 6875, "Pretrain/Step Time": 8.510996358469129} +{"Pretrain/Learning Rate": 9.531570298461754e-06, "Pretrain/Loss": 1.9975221157073975, "Pretrain/Loss (Raw)": 1.7499200105667114, "Pretrain/Step": 6876, "Pretrain/Step Time": 8.515707079321146} +{"Pretrain/Learning Rate": 9.524901562781074e-06, "Pretrain/Loss": 1.9957029819488525, "Pretrain/Loss (Raw)": 1.8692330121994019, "Pretrain/Step": 6877, "Pretrain/Step Time": 8.509954983368516} +{"Pretrain/Learning Rate": 9.518234611761678e-06, "Pretrain/Loss": 1.9937081336975098, "Pretrain/Loss (Raw)": 1.882630467414856, "Pretrain/Step": 6878, "Pretrain/Step Time": 8.512728171423078} +{"Pretrain/Learning Rate": 9.511569446172419e-06, "Pretrain/Loss": 1.9924304485321045, "Pretrain/Loss (Raw)": 1.9465478658676147, "Pretrain/Step": 6879, "Pretrain/Step Time": 8.507104882970452} +{"Pretrain/Learning Rate": 9.504906066781954e-06, "Pretrain/Loss": 1.9916527271270752, "Pretrain/Loss (Raw)": 1.8666578531265259, "Pretrain/Step": 6880, "Pretrain/Step Time": 8.502847470343113} +{"Pretrain/Learning Rate": 9.49824447435873e-06, "Pretrain/Loss": 1.9909813404083252, "Pretrain/Loss (Raw)": 1.9285290241241455, "Pretrain/Step": 6881, "Pretrain/Step Time": 8.513331212103367} +{"Pretrain/Learning Rate": 9.491584669671008e-06, "Pretrain/Loss": 1.9907504320144653, "Pretrain/Loss (Raw)": 1.9709044694900513, "Pretrain/Step": 6882, "Pretrain/Step Time": 8.510053215548396} +{"Pretrain/Learning Rate": 9.484926653486819e-06, "Pretrain/Loss": 1.990208387374878, "Pretrain/Loss (Raw)": 1.8879626989364624, "Pretrain/Step": 6883, "Pretrain/Step Time": 8.514827068895102} +{"Pretrain/Learning Rate": 9.478270426574002e-06, "Pretrain/Loss": 1.991095781326294, "Pretrain/Loss (Raw)": 2.1339528560638428, "Pretrain/Step": 6884, "Pretrain/Step Time": 8.517658801749349} +{"Pretrain/Learning Rate": 9.471615989700167e-06, "Pretrain/Loss": 1.9909679889678955, "Pretrain/Loss (Raw)": 1.8933278322219849, "Pretrain/Step": 6885, "Pretrain/Step Time": 8.510775381699204} +{"Pretrain/Learning Rate": 9.464963343632766e-06, "Pretrain/Loss": 1.9906810522079468, "Pretrain/Loss (Raw)": 1.912489652633667, "Pretrain/Step": 6886, "Pretrain/Step Time": 8.506973683834076} +{"Pretrain/Learning Rate": 9.458312489138979e-06, "Pretrain/Loss": 1.9914478063583374, "Pretrain/Loss (Raw)": 1.97904634475708, "Pretrain/Step": 6887, "Pretrain/Step Time": 8.513407429680228} +{"Pretrain/Learning Rate": 9.451663426985838e-06, "Pretrain/Loss": 1.9907379150390625, "Pretrain/Loss (Raw)": 1.9575872421264648, "Pretrain/Step": 6888, "Pretrain/Step Time": 8.518813410773873} +{"Pretrain/Learning Rate": 9.44501615794013e-06, "Pretrain/Loss": 1.9875844717025757, "Pretrain/Loss (Raw)": 1.48030686378479, "Pretrain/Step": 6889, "Pretrain/Step Time": 8.521187711507082} +{"Pretrain/Learning Rate": 9.438370682768473e-06, "Pretrain/Loss": 1.9886398315429688, "Pretrain/Loss (Raw)": 2.0950324535369873, "Pretrain/Step": 6890, "Pretrain/Step Time": 8.521645275875926} +{"Pretrain/Learning Rate": 9.43172700223722e-06, "Pretrain/Loss": 1.9885221719741821, "Pretrain/Loss (Raw)": 1.958312749862671, "Pretrain/Step": 6891, "Pretrain/Step Time": 8.521590346470475} +{"Pretrain/Learning Rate": 9.425085117112577e-06, "Pretrain/Loss": 1.9878346920013428, "Pretrain/Loss (Raw)": 1.9349156618118286, "Pretrain/Step": 6892, "Pretrain/Step Time": 8.515282908454537} +{"Pretrain/Learning Rate": 9.41844502816051e-06, "Pretrain/Loss": 1.987982988357544, "Pretrain/Loss (Raw)": 2.0530028343200684, "Pretrain/Step": 6893, "Pretrain/Step Time": 8.511963224038482} +{"Pretrain/Learning Rate": 9.411806736146788e-06, "Pretrain/Loss": 1.98862886428833, "Pretrain/Loss (Raw)": 1.969895601272583, "Pretrain/Step": 6894, "Pretrain/Step Time": 8.516484988853335} +{"Pretrain/Learning Rate": 9.405170241836955e-06, "Pretrain/Loss": 1.9903504848480225, "Pretrain/Loss (Raw)": 2.2070741653442383, "Pretrain/Step": 6895, "Pretrain/Step Time": 8.520306436344981} +{"Pretrain/Learning Rate": 9.398535545996386e-06, "Pretrain/Loss": 1.9895496368408203, "Pretrain/Loss (Raw)": 2.0858356952667236, "Pretrain/Step": 6896, "Pretrain/Step Time": 8.516559649258852} +{"Pretrain/Learning Rate": 9.391902649390214e-06, "Pretrain/Loss": 1.9903573989868164, "Pretrain/Loss (Raw)": 2.132089376449585, "Pretrain/Step": 6897, "Pretrain/Step Time": 8.509520335122943} +{"Pretrain/Learning Rate": 9.385271552783375e-06, "Pretrain/Loss": 1.991089105606079, "Pretrain/Loss (Raw)": 2.020285129547119, "Pretrain/Step": 6898, "Pretrain/Step Time": 8.508721347898245} +{"Pretrain/Learning Rate": 9.378642256940589e-06, "Pretrain/Loss": 1.9925713539123535, "Pretrain/Loss (Raw)": 2.298567295074463, "Pretrain/Step": 6899, "Pretrain/Step Time": 8.511871894821525} +{"Pretrain/Learning Rate": 9.372014762626401e-06, "Pretrain/Loss": 1.991112232208252, "Pretrain/Loss (Raw)": 1.785128116607666, "Pretrain/Step": 6900, "Pretrain/Step Time": 8.516709258779883} +{"Pretrain/Learning Rate": 9.36538907060511e-06, "Pretrain/Loss": 1.9885910749435425, "Pretrain/Loss (Raw)": 1.8987120389938354, "Pretrain/Step": 6901, "Pretrain/Step Time": 8.518473157659173} +{"Pretrain/Learning Rate": 9.358765181640825e-06, "Pretrain/Loss": 1.9880223274230957, "Pretrain/Loss (Raw)": 1.9934293031692505, "Pretrain/Step": 6902, "Pretrain/Step Time": 8.521730029955506} +{"Pretrain/Learning Rate": 9.352143096497435e-06, "Pretrain/Loss": 1.988701343536377, "Pretrain/Loss (Raw)": 1.9397372007369995, "Pretrain/Step": 6903, "Pretrain/Step Time": 8.514157995581627} +{"Pretrain/Learning Rate": 9.345522815938645e-06, "Pretrain/Loss": 1.9880023002624512, "Pretrain/Loss (Raw)": 1.9458081722259521, "Pretrain/Step": 6904, "Pretrain/Step Time": 8.506433937698603} +{"Pretrain/Learning Rate": 9.33890434072793e-06, "Pretrain/Loss": 1.9877647161483765, "Pretrain/Loss (Raw)": 1.862040400505066, "Pretrain/Step": 6905, "Pretrain/Step Time": 8.504615493118763} +{"Pretrain/Learning Rate": 9.332287671628556e-06, "Pretrain/Loss": 1.9871516227722168, "Pretrain/Loss (Raw)": 2.057506561279297, "Pretrain/Step": 6906, "Pretrain/Step Time": 8.499069578945637} +{"Pretrain/Learning Rate": 9.325672809403606e-06, "Pretrain/Loss": 1.9882906675338745, "Pretrain/Loss (Raw)": 2.054537534713745, "Pretrain/Step": 6907, "Pretrain/Step Time": 8.503643481060863} +{"Pretrain/Learning Rate": 9.319059754815926e-06, "Pretrain/Loss": 1.9857299327850342, "Pretrain/Loss (Raw)": 1.6554056406021118, "Pretrain/Step": 6908, "Pretrain/Step Time": 8.498583499342203} +{"Pretrain/Learning Rate": 9.312448508628169e-06, "Pretrain/Loss": 1.986863374710083, "Pretrain/Loss (Raw)": 2.188511848449707, "Pretrain/Step": 6909, "Pretrain/Step Time": 8.490979252383113} +{"Pretrain/Learning Rate": 9.30583907160276e-06, "Pretrain/Loss": 1.9847495555877686, "Pretrain/Loss (Raw)": 2.1003739833831787, "Pretrain/Step": 6910, "Pretrain/Step Time": 8.492861038073897} +{"Pretrain/Learning Rate": 9.299231444501953e-06, "Pretrain/Loss": 1.9834051132202148, "Pretrain/Loss (Raw)": 1.905656337738037, "Pretrain/Step": 6911, "Pretrain/Step Time": 8.505237374454737} +{"Pretrain/Learning Rate": 9.29262562808776e-06, "Pretrain/Loss": 1.984602689743042, "Pretrain/Loss (Raw)": 2.0569839477539062, "Pretrain/Step": 6912, "Pretrain/Step Time": 8.504944011569023} +{"Pretrain/Learning Rate": 9.286021623121993e-06, "Pretrain/Loss": 1.9860421419143677, "Pretrain/Loss (Raw)": 2.084832191467285, "Pretrain/Step": 6913, "Pretrain/Step Time": 8.505601294338703} +{"Pretrain/Learning Rate": 9.279419430366255e-06, "Pretrain/Loss": 1.984055757522583, "Pretrain/Loss (Raw)": 1.9031412601470947, "Pretrain/Step": 6914, "Pretrain/Step Time": 8.500673023983836} +{"Pretrain/Learning Rate": 9.272819050581952e-06, "Pretrain/Loss": 1.9822931289672852, "Pretrain/Loss (Raw)": 1.8178505897521973, "Pretrain/Step": 6915, "Pretrain/Step Time": 8.499922784045339} +{"Pretrain/Learning Rate": 9.266220484530263e-06, "Pretrain/Loss": 1.9810776710510254, "Pretrain/Loss (Raw)": 2.0474774837493896, "Pretrain/Step": 6916, "Pretrain/Step Time": 8.497413726523519} +{"Pretrain/Learning Rate": 9.259623732972173e-06, "Pretrain/Loss": 1.9799342155456543, "Pretrain/Loss (Raw)": 2.031951904296875, "Pretrain/Step": 6917, "Pretrain/Step Time": 8.504004737362266} +{"Pretrain/Learning Rate": 9.25302879666843e-06, "Pretrain/Loss": 1.979945182800293, "Pretrain/Loss (Raw)": 2.0827388763427734, "Pretrain/Step": 6918, "Pretrain/Step Time": 8.503843516111374} +{"Pretrain/Learning Rate": 9.246435676379623e-06, "Pretrain/Loss": 1.9808228015899658, "Pretrain/Loss (Raw)": 2.0988247394561768, "Pretrain/Step": 6919, "Pretrain/Step Time": 8.50649219378829} +{"Pretrain/Learning Rate": 9.239844372866083e-06, "Pretrain/Loss": 1.9807014465332031, "Pretrain/Loss (Raw)": 1.8302496671676636, "Pretrain/Step": 6920, "Pretrain/Step Time": 8.503085292875767} +{"Pretrain/Learning Rate": 9.233254886887958e-06, "Pretrain/Loss": 1.9802820682525635, "Pretrain/Loss (Raw)": 2.0064268112182617, "Pretrain/Step": 6921, "Pretrain/Step Time": 8.49731970205903} +{"Pretrain/Learning Rate": 9.226667219205163e-06, "Pretrain/Loss": 1.981741189956665, "Pretrain/Loss (Raw)": 2.2088091373443604, "Pretrain/Step": 6922, "Pretrain/Step Time": 8.502672851085663} +{"Pretrain/Learning Rate": 9.220081370577441e-06, "Pretrain/Loss": 1.9832106828689575, "Pretrain/Loss (Raw)": 2.1391382217407227, "Pretrain/Step": 6923, "Pretrain/Step Time": 8.506198504939675} +{"Pretrain/Learning Rate": 9.21349734176429e-06, "Pretrain/Loss": 1.982304573059082, "Pretrain/Loss (Raw)": 1.978715181350708, "Pretrain/Step": 6924, "Pretrain/Step Time": 8.503956509754062} +{"Pretrain/Learning Rate": 9.206915133525016e-06, "Pretrain/Loss": 1.9850000143051147, "Pretrain/Loss (Raw)": 2.2084786891937256, "Pretrain/Step": 6925, "Pretrain/Step Time": 8.504577040672302} +{"Pretrain/Learning Rate": 9.2003347466187e-06, "Pretrain/Loss": 1.9839730262756348, "Pretrain/Loss (Raw)": 1.849921464920044, "Pretrain/Step": 6926, "Pretrain/Step Time": 8.504085309803486} +{"Pretrain/Learning Rate": 9.193756181804248e-06, "Pretrain/Loss": 1.9839701652526855, "Pretrain/Loss (Raw)": 1.9930109977722168, "Pretrain/Step": 6927, "Pretrain/Step Time": 8.500385709106922} +{"Pretrain/Learning Rate": 9.1871794398403e-06, "Pretrain/Loss": 1.9839415550231934, "Pretrain/Loss (Raw)": 1.971418857574463, "Pretrain/Step": 6928, "Pretrain/Step Time": 8.499870702624321} +{"Pretrain/Learning Rate": 9.180604521485337e-06, "Pretrain/Loss": 1.9844074249267578, "Pretrain/Loss (Raw)": 2.055321455001831, "Pretrain/Step": 6929, "Pretrain/Step Time": 8.502109630033374} +{"Pretrain/Learning Rate": 9.174031427497595e-06, "Pretrain/Loss": 1.9817230701446533, "Pretrain/Loss (Raw)": 1.8394625186920166, "Pretrain/Step": 6930, "Pretrain/Step Time": 8.511468147858977} +{"Pretrain/Learning Rate": 9.167460158635141e-06, "Pretrain/Loss": 1.9823806285858154, "Pretrain/Loss (Raw)": 1.997239351272583, "Pretrain/Step": 6931, "Pretrain/Step Time": 8.510359922423959} +{"Pretrain/Learning Rate": 9.16089071565577e-06, "Pretrain/Loss": 1.9820137023925781, "Pretrain/Loss (Raw)": 1.9233182668685913, "Pretrain/Step": 6932, "Pretrain/Step Time": 8.512647692114115} +{"Pretrain/Learning Rate": 9.154323099317128e-06, "Pretrain/Loss": 1.982759952545166, "Pretrain/Loss (Raw)": 2.063009738922119, "Pretrain/Step": 6933, "Pretrain/Step Time": 8.512732433155179} +{"Pretrain/Learning Rate": 9.147757310376612e-06, "Pretrain/Loss": 1.9843227863311768, "Pretrain/Loss (Raw)": 2.0847432613372803, "Pretrain/Step": 6934, "Pretrain/Step Time": 8.503419196233153} +{"Pretrain/Learning Rate": 9.14119334959142e-06, "Pretrain/Loss": 1.9840556383132935, "Pretrain/Loss (Raw)": 2.139291524887085, "Pretrain/Step": 6935, "Pretrain/Step Time": 8.513370519503951} +{"Pretrain/Learning Rate": 9.134631217718534e-06, "Pretrain/Loss": 1.985765814781189, "Pretrain/Loss (Raw)": 2.045632839202881, "Pretrain/Step": 6936, "Pretrain/Step Time": 8.510572684928775} +{"Pretrain/Learning Rate": 9.128070915514744e-06, "Pretrain/Loss": 1.9861667156219482, "Pretrain/Loss (Raw)": 1.9220788478851318, "Pretrain/Step": 6937, "Pretrain/Step Time": 8.514379424974322} +{"Pretrain/Learning Rate": 9.121512443736607e-06, "Pretrain/Loss": 1.986187219619751, "Pretrain/Loss (Raw)": 1.998929500579834, "Pretrain/Step": 6938, "Pretrain/Step Time": 8.51510221324861} +{"Pretrain/Learning Rate": 9.114955803140476e-06, "Pretrain/Loss": 1.9861657619476318, "Pretrain/Loss (Raw)": 2.0043883323669434, "Pretrain/Step": 6939, "Pretrain/Step Time": 8.508741253986955} +{"Pretrain/Learning Rate": 9.108400994482485e-06, "Pretrain/Loss": 1.9859840869903564, "Pretrain/Loss (Raw)": 1.9427236318588257, "Pretrain/Step": 6940, "Pretrain/Step Time": 8.50917519070208} +{"Pretrain/Learning Rate": 9.101848018518586e-06, "Pretrain/Loss": 1.986329197883606, "Pretrain/Loss (Raw)": 2.093104600906372, "Pretrain/Step": 6941, "Pretrain/Step Time": 8.508817993104458} +{"Pretrain/Learning Rate": 9.09529687600449e-06, "Pretrain/Loss": 1.9852910041809082, "Pretrain/Loss (Raw)": 1.89821457862854, "Pretrain/Step": 6942, "Pretrain/Step Time": 8.510448386892676} +{"Pretrain/Learning Rate": 9.0887475676957e-06, "Pretrain/Loss": 1.9852463006973267, "Pretrain/Loss (Raw)": 1.8728793859481812, "Pretrain/Step": 6943, "Pretrain/Step Time": 8.511854378506541} +{"Pretrain/Learning Rate": 9.082200094347506e-06, "Pretrain/Loss": 1.9850263595581055, "Pretrain/Loss (Raw)": 2.149118185043335, "Pretrain/Step": 6944, "Pretrain/Step Time": 8.504797492176294} +{"Pretrain/Learning Rate": 9.075654456715016e-06, "Pretrain/Loss": 1.9830750226974487, "Pretrain/Loss (Raw)": 1.806110143661499, "Pretrain/Step": 6945, "Pretrain/Step Time": 8.49612282589078} +{"Pretrain/Learning Rate": 9.069110655553093e-06, "Pretrain/Loss": 1.9823508262634277, "Pretrain/Loss (Raw)": 1.9089176654815674, "Pretrain/Step": 6946, "Pretrain/Step Time": 8.49866753257811} +{"Pretrain/Learning Rate": 9.062568691616389e-06, "Pretrain/Loss": 1.9825471639633179, "Pretrain/Loss (Raw)": 2.1399967670440674, "Pretrain/Step": 6947, "Pretrain/Step Time": 8.505831252783537} +{"Pretrain/Learning Rate": 9.056028565659369e-06, "Pretrain/Loss": 1.9843566417694092, "Pretrain/Loss (Raw)": 2.170628547668457, "Pretrain/Step": 6948, "Pretrain/Step Time": 8.511983009055257} +{"Pretrain/Learning Rate": 9.049490278436269e-06, "Pretrain/Loss": 1.984572410583496, "Pretrain/Loss (Raw)": 1.9477771520614624, "Pretrain/Step": 6949, "Pretrain/Step Time": 8.51116512529552} +{"Pretrain/Learning Rate": 9.04295383070111e-06, "Pretrain/Loss": 1.9835708141326904, "Pretrain/Loss (Raw)": 1.9364510774612427, "Pretrain/Step": 6950, "Pretrain/Step Time": 8.503548469394445} +{"Pretrain/Learning Rate": 9.036419223207699e-06, "Pretrain/Loss": 1.9821839332580566, "Pretrain/Loss (Raw)": 2.099503517150879, "Pretrain/Step": 6951, "Pretrain/Step Time": 8.501563377678394} +{"Pretrain/Learning Rate": 9.029886456709652e-06, "Pretrain/Loss": 1.9765015840530396, "Pretrain/Loss (Raw)": 1.868589162826538, "Pretrain/Step": 6952, "Pretrain/Step Time": 8.499636877328157} +{"Pretrain/Learning Rate": 9.023355531960353e-06, "Pretrain/Loss": 1.9747610092163086, "Pretrain/Loss (Raw)": 1.7150931358337402, "Pretrain/Step": 6953, "Pretrain/Step Time": 8.50336679071188} +{"Pretrain/Learning Rate": 9.016826449712981e-06, "Pretrain/Loss": 1.9784859418869019, "Pretrain/Loss (Raw)": 2.244074583053589, "Pretrain/Step": 6954, "Pretrain/Step Time": 8.512045186012983} +{"Pretrain/Learning Rate": 9.010299210720487e-06, "Pretrain/Loss": 1.9764180183410645, "Pretrain/Loss (Raw)": 1.8708831071853638, "Pretrain/Step": 6955, "Pretrain/Step Time": 8.509440325200558} +{"Pretrain/Learning Rate": 9.003773815735644e-06, "Pretrain/Loss": 1.9752941131591797, "Pretrain/Loss (Raw)": 1.8362925052642822, "Pretrain/Step": 6956, "Pretrain/Step Time": 8.50513412244618} +{"Pretrain/Learning Rate": 8.997250265510984e-06, "Pretrain/Loss": 1.9768633842468262, "Pretrain/Loss (Raw)": 1.9469034671783447, "Pretrain/Step": 6957, "Pretrain/Step Time": 8.508676502853632} +{"Pretrain/Learning Rate": 8.990728560798827e-06, "Pretrain/Loss": 1.979341745376587, "Pretrain/Loss (Raw)": 2.0763280391693115, "Pretrain/Step": 6958, "Pretrain/Step Time": 8.504157776013017} +{"Pretrain/Learning Rate": 8.984208702351281e-06, "Pretrain/Loss": 1.9809198379516602, "Pretrain/Loss (Raw)": 2.0859975814819336, "Pretrain/Step": 6959, "Pretrain/Step Time": 8.506151232868433} +{"Pretrain/Learning Rate": 8.977690690920269e-06, "Pretrain/Loss": 1.9811432361602783, "Pretrain/Loss (Raw)": 1.9528216123580933, "Pretrain/Step": 6960, "Pretrain/Step Time": 8.518551839515567} +{"Pretrain/Learning Rate": 8.971174527257464e-06, "Pretrain/Loss": 1.9819236993789673, "Pretrain/Loss (Raw)": 2.113147020339966, "Pretrain/Step": 6961, "Pretrain/Step Time": 8.516259616240859} +{"Pretrain/Learning Rate": 8.964660212114343e-06, "Pretrain/Loss": 1.9827687740325928, "Pretrain/Loss (Raw)": 2.0510334968566895, "Pretrain/Step": 6962, "Pretrain/Step Time": 8.511380568146706} +{"Pretrain/Learning Rate": 8.958147746242157e-06, "Pretrain/Loss": 1.982176661491394, "Pretrain/Loss (Raw)": 1.8888874053955078, "Pretrain/Step": 6963, "Pretrain/Step Time": 8.510678252205253} +{"Pretrain/Learning Rate": 8.951637130391976e-06, "Pretrain/Loss": 1.9838258028030396, "Pretrain/Loss (Raw)": 2.112705945968628, "Pretrain/Step": 6964, "Pretrain/Step Time": 8.512173026800156} +{"Pretrain/Learning Rate": 8.945128365314622e-06, "Pretrain/Loss": 1.982011318206787, "Pretrain/Loss (Raw)": 1.8304431438446045, "Pretrain/Step": 6965, "Pretrain/Step Time": 8.52266382612288} +{"Pretrain/Learning Rate": 8.938621451760718e-06, "Pretrain/Loss": 1.985275149345398, "Pretrain/Loss (Raw)": 2.1076366901397705, "Pretrain/Step": 6966, "Pretrain/Step Time": 8.52183017320931} +{"Pretrain/Learning Rate": 8.932116390480663e-06, "Pretrain/Loss": 1.9867446422576904, "Pretrain/Loss (Raw)": 2.0196330547332764, "Pretrain/Step": 6967, "Pretrain/Step Time": 8.516242628917098} +{"Pretrain/Learning Rate": 8.925613182224678e-06, "Pretrain/Loss": 1.9870837926864624, "Pretrain/Loss (Raw)": 2.071094512939453, "Pretrain/Step": 6968, "Pretrain/Step Time": 8.515048883855343} +{"Pretrain/Learning Rate": 8.919111827742708e-06, "Pretrain/Loss": 1.9875688552856445, "Pretrain/Loss (Raw)": 2.060299873352051, "Pretrain/Step": 6969, "Pretrain/Step Time": 8.511022297665477} +{"Pretrain/Learning Rate": 8.912612327784547e-06, "Pretrain/Loss": 1.988062858581543, "Pretrain/Loss (Raw)": 1.9680579900741577, "Pretrain/Step": 6970, "Pretrain/Step Time": 8.514833111315966} +{"Pretrain/Learning Rate": 8.906114683099732e-06, "Pretrain/Loss": 1.98961341381073, "Pretrain/Loss (Raw)": 2.0464818477630615, "Pretrain/Step": 6971, "Pretrain/Step Time": 8.522580860182643} +{"Pretrain/Learning Rate": 8.899618894437622e-06, "Pretrain/Loss": 1.991586685180664, "Pretrain/Loss (Raw)": 2.230790615081787, "Pretrain/Step": 6972, "Pretrain/Step Time": 8.5272500179708} +{"Pretrain/Learning Rate": 8.893124962547311e-06, "Pretrain/Loss": 1.9912505149841309, "Pretrain/Loss (Raw)": 1.7693120241165161, "Pretrain/Step": 6973, "Pretrain/Step Time": 8.522140733897686} +{"Pretrain/Learning Rate": 8.88663288817774e-06, "Pretrain/Loss": 1.9913344383239746, "Pretrain/Loss (Raw)": 2.2332346439361572, "Pretrain/Step": 6974, "Pretrain/Step Time": 8.514607284218073} +{"Pretrain/Learning Rate": 8.880142672077582e-06, "Pretrain/Loss": 1.9898028373718262, "Pretrain/Loss (Raw)": 2.0863754749298096, "Pretrain/Step": 6975, "Pretrain/Step Time": 8.516749134287238} +{"Pretrain/Learning Rate": 8.873654314995348e-06, "Pretrain/Loss": 1.990220308303833, "Pretrain/Loss (Raw)": 2.106701135635376, "Pretrain/Step": 6976, "Pretrain/Step Time": 8.522996554151177} +{"Pretrain/Learning Rate": 8.86716781767927e-06, "Pretrain/Loss": 1.9903006553649902, "Pretrain/Loss (Raw)": 2.2065367698669434, "Pretrain/Step": 6977, "Pretrain/Step Time": 8.519544310867786} +{"Pretrain/Learning Rate": 8.86068318087743e-06, "Pretrain/Loss": 1.9907231330871582, "Pretrain/Loss (Raw)": 2.0071358680725098, "Pretrain/Step": 6978, "Pretrain/Step Time": 8.51933521591127} +{"Pretrain/Learning Rate": 8.854200405337657e-06, "Pretrain/Loss": 1.9914742708206177, "Pretrain/Loss (Raw)": 2.015872001647949, "Pretrain/Step": 6979, "Pretrain/Step Time": 8.522385321557522} +{"Pretrain/Learning Rate": 8.847719491807572e-06, "Pretrain/Loss": 1.9907641410827637, "Pretrain/Loss (Raw)": 2.1175317764282227, "Pretrain/Step": 6980, "Pretrain/Step Time": 8.513284115120769} +{"Pretrain/Learning Rate": 8.841240441034579e-06, "Pretrain/Loss": 1.9913612604141235, "Pretrain/Loss (Raw)": 2.118281602859497, "Pretrain/Step": 6981, "Pretrain/Step Time": 8.513694619759917} +{"Pretrain/Learning Rate": 8.83476325376589e-06, "Pretrain/Loss": 1.9909167289733887, "Pretrain/Loss (Raw)": 1.9272218942642212, "Pretrain/Step": 6982, "Pretrain/Step Time": 8.511791111901402} +{"Pretrain/Learning Rate": 8.828287930748477e-06, "Pretrain/Loss": 1.9945824146270752, "Pretrain/Loss (Raw)": 2.077077627182007, "Pretrain/Step": 6983, "Pretrain/Step Time": 8.508792970329523} +{"Pretrain/Learning Rate": 8.821814472729104e-06, "Pretrain/Loss": 1.9932522773742676, "Pretrain/Loss (Raw)": 1.9471542835235596, "Pretrain/Step": 6984, "Pretrain/Step Time": 8.50841904617846} +{"Pretrain/Learning Rate": 8.815342880454311e-06, "Pretrain/Loss": 1.9914801120758057, "Pretrain/Loss (Raw)": 1.8842779397964478, "Pretrain/Step": 6985, "Pretrain/Step Time": 8.513118650764227} +{"Pretrain/Learning Rate": 8.80887315467045e-06, "Pretrain/Loss": 1.9908664226531982, "Pretrain/Loss (Raw)": 1.9667035341262817, "Pretrain/Step": 6986, "Pretrain/Step Time": 8.503834545612335} +{"Pretrain/Learning Rate": 8.80240529612363e-06, "Pretrain/Loss": 1.990999460220337, "Pretrain/Loss (Raw)": 2.0633556842803955, "Pretrain/Step": 6987, "Pretrain/Step Time": 8.506423894315958} +{"Pretrain/Learning Rate": 8.79593930555975e-06, "Pretrain/Loss": 1.9912294149398804, "Pretrain/Loss (Raw)": 2.1096298694610596, "Pretrain/Step": 6988, "Pretrain/Step Time": 8.5085443649441} +{"Pretrain/Learning Rate": 8.789475183724514e-06, "Pretrain/Loss": 1.9921529293060303, "Pretrain/Loss (Raw)": 1.9024986028671265, "Pretrain/Step": 6989, "Pretrain/Step Time": 8.511213138699532} +{"Pretrain/Learning Rate": 8.783012931363385e-06, "Pretrain/Loss": 1.9896084070205688, "Pretrain/Loss (Raw)": 2.089125156402588, "Pretrain/Step": 6990, "Pretrain/Step Time": 8.512975538149476} +{"Pretrain/Learning Rate": 8.776552549221623e-06, "Pretrain/Loss": 1.9904286861419678, "Pretrain/Loss (Raw)": 2.1537814140319824, "Pretrain/Step": 6991, "Pretrain/Step Time": 8.509802347049117} +{"Pretrain/Learning Rate": 8.770094038044257e-06, "Pretrain/Loss": 1.991760015487671, "Pretrain/Loss (Raw)": 2.120487928390503, "Pretrain/Step": 6992, "Pretrain/Step Time": 8.498006209731102} +{"Pretrain/Learning Rate": 8.763637398576135e-06, "Pretrain/Loss": 1.9922266006469727, "Pretrain/Loss (Raw)": 2.1207430362701416, "Pretrain/Step": 6993, "Pretrain/Step Time": 8.500896044075489} +{"Pretrain/Learning Rate": 8.757182631561859e-06, "Pretrain/Loss": 1.997576117515564, "Pretrain/Loss (Raw)": 2.273500919342041, "Pretrain/Step": 6994, "Pretrain/Step Time": 8.5105537828058} +{"Pretrain/Learning Rate": 8.750729737745819e-06, "Pretrain/Loss": 1.9997087717056274, "Pretrain/Loss (Raw)": 2.0516788959503174, "Pretrain/Step": 6995, "Pretrain/Step Time": 8.515998631715775} +{"Pretrain/Learning Rate": 8.744278717872185e-06, "Pretrain/Loss": 2.0011091232299805, "Pretrain/Loss (Raw)": 2.120753288269043, "Pretrain/Step": 6996, "Pretrain/Step Time": 8.515637440606952} +{"Pretrain/Learning Rate": 8.73782957268494e-06, "Pretrain/Loss": 2.0023725032806396, "Pretrain/Loss (Raw)": 1.9047141075134277, "Pretrain/Step": 6997, "Pretrain/Step Time": 8.509020291268826} +{"Pretrain/Learning Rate": 8.731382302927813e-06, "Pretrain/Loss": 2.004098415374756, "Pretrain/Loss (Raw)": 1.9985301494598389, "Pretrain/Step": 6998, "Pretrain/Step Time": 8.502057991921902} +{"Pretrain/Learning Rate": 8.724936909344342e-06, "Pretrain/Loss": 2.006671667098999, "Pretrain/Loss (Raw)": 2.252349853515625, "Pretrain/Step": 6999, "Pretrain/Step Time": 8.508961219340563} +{"Pretrain/Learning Rate": 8.718493392677829e-06, "Pretrain/Loss": 2.0079843997955322, "Pretrain/Loss (Raw)": 2.071481704711914, "Pretrain/Step": 7000, "Pretrain/Step Time": 8.513642659410834} +{"Pretrain/Learning Rate": 8.712051753671389e-06, "Pretrain/Loss": 2.0071539878845215, "Pretrain/Loss (Raw)": 1.9464068412780762, "Pretrain/Step": 7001, "Pretrain/Step Time": 8.514207374304533} +{"Pretrain/Learning Rate": 8.705611993067892e-06, "Pretrain/Loss": 2.0068140029907227, "Pretrain/Loss (Raw)": 2.09040904045105, "Pretrain/Step": 7002, "Pretrain/Step Time": 8.514198092743754} +{"Pretrain/Learning Rate": 8.699174111609998e-06, "Pretrain/Loss": 2.007368803024292, "Pretrain/Loss (Raw)": 2.163395881652832, "Pretrain/Step": 7003, "Pretrain/Step Time": 8.508680580183864} +{"Pretrain/Learning Rate": 8.692738110040152e-06, "Pretrain/Loss": 2.0078859329223633, "Pretrain/Loss (Raw)": 1.816084861755371, "Pretrain/Step": 7004, "Pretrain/Step Time": 8.504474144428968} +{"Pretrain/Learning Rate": 8.686303989100596e-06, "Pretrain/Loss": 2.0096490383148193, "Pretrain/Loss (Raw)": 2.094930410385132, "Pretrain/Step": 7005, "Pretrain/Step Time": 8.510577216744423} +{"Pretrain/Learning Rate": 8.679871749533338e-06, "Pretrain/Loss": 2.0095791816711426, "Pretrain/Loss (Raw)": 1.8736823797225952, "Pretrain/Step": 7006, "Pretrain/Step Time": 8.511780608445406} +{"Pretrain/Learning Rate": 8.673441392080173e-06, "Pretrain/Loss": 2.008923053741455, "Pretrain/Loss (Raw)": 1.8625774383544922, "Pretrain/Step": 7007, "Pretrain/Step Time": 8.513487422838807} +{"Pretrain/Learning Rate": 8.667012917482673e-06, "Pretrain/Loss": 2.0114879608154297, "Pretrain/Loss (Raw)": 2.1949708461761475, "Pretrain/Step": 7008, "Pretrain/Step Time": 8.514339933171868} +{"Pretrain/Learning Rate": 8.66058632648222e-06, "Pretrain/Loss": 2.0118114948272705, "Pretrain/Loss (Raw)": 1.9699416160583496, "Pretrain/Step": 7009, "Pretrain/Step Time": 8.50421399436891} +{"Pretrain/Learning Rate": 8.654161619819931e-06, "Pretrain/Loss": 2.0144670009613037, "Pretrain/Loss (Raw)": 2.3107852935791016, "Pretrain/Step": 7010, "Pretrain/Step Time": 8.501733992248774} +{"Pretrain/Learning Rate": 8.647738798236757e-06, "Pretrain/Loss": 2.01544189453125, "Pretrain/Loss (Raw)": 2.0127675533294678, "Pretrain/Step": 7011, "Pretrain/Step Time": 8.50897259451449} +{"Pretrain/Learning Rate": 8.641317862473392e-06, "Pretrain/Loss": 2.0150904655456543, "Pretrain/Loss (Raw)": 2.0889534950256348, "Pretrain/Step": 7012, "Pretrain/Step Time": 8.509438203647733} +{"Pretrain/Learning Rate": 8.634898813270348e-06, "Pretrain/Loss": 2.0170443058013916, "Pretrain/Loss (Raw)": 2.1434166431427, "Pretrain/Step": 7013, "Pretrain/Step Time": 8.51397217810154} +{"Pretrain/Learning Rate": 8.628481651367876e-06, "Pretrain/Loss": 2.0185136795043945, "Pretrain/Loss (Raw)": 2.1005799770355225, "Pretrain/Step": 7014, "Pretrain/Step Time": 8.516040276736021} +{"Pretrain/Learning Rate": 8.622066377506049e-06, "Pretrain/Loss": 2.017183303833008, "Pretrain/Loss (Raw)": 1.808760643005371, "Pretrain/Step": 7015, "Pretrain/Step Time": 8.510021286085248} +{"Pretrain/Learning Rate": 8.615652992424697e-06, "Pretrain/Loss": 2.018500328063965, "Pretrain/Loss (Raw)": 2.126171112060547, "Pretrain/Step": 7016, "Pretrain/Step Time": 8.503366170451045} +{"Pretrain/Learning Rate": 8.609241496863463e-06, "Pretrain/Loss": 2.023256778717041, "Pretrain/Loss (Raw)": 2.0891003608703613, "Pretrain/Step": 7017, "Pretrain/Step Time": 8.51009570248425} +{"Pretrain/Learning Rate": 8.602831891561718e-06, "Pretrain/Loss": 2.0224196910858154, "Pretrain/Loss (Raw)": 1.9879059791564941, "Pretrain/Step": 7018, "Pretrain/Step Time": 8.5055844001472} +{"Pretrain/Learning Rate": 8.596424177258677e-06, "Pretrain/Loss": 2.0229597091674805, "Pretrain/Loss (Raw)": 2.0274434089660645, "Pretrain/Step": 7019, "Pretrain/Step Time": 8.506265504285693} +{"Pretrain/Learning Rate": 8.590018354693293e-06, "Pretrain/Loss": 2.023324966430664, "Pretrain/Loss (Raw)": 1.981649398803711, "Pretrain/Step": 7020, "Pretrain/Step Time": 8.510140098631382} +{"Pretrain/Learning Rate": 8.583614424604322e-06, "Pretrain/Loss": 2.022592067718506, "Pretrain/Loss (Raw)": 1.959222674369812, "Pretrain/Step": 7021, "Pretrain/Step Time": 8.506763184443116} +{"Pretrain/Learning Rate": 8.57721238773028e-06, "Pretrain/Loss": 2.0241379737854004, "Pretrain/Loss (Raw)": 2.1677587032318115, "Pretrain/Step": 7022, "Pretrain/Step Time": 8.501898674294353} +{"Pretrain/Learning Rate": 8.570812244809504e-06, "Pretrain/Loss": 2.0217390060424805, "Pretrain/Loss (Raw)": 1.9000227451324463, "Pretrain/Step": 7023, "Pretrain/Step Time": 8.50495021045208} +{"Pretrain/Learning Rate": 8.564413996580073e-06, "Pretrain/Loss": 2.0198187828063965, "Pretrain/Loss (Raw)": 1.8400087356567383, "Pretrain/Step": 7024, "Pretrain/Step Time": 8.509410118684173} +{"Pretrain/Learning Rate": 8.55801764377987e-06, "Pretrain/Loss": 2.0185303688049316, "Pretrain/Loss (Raw)": 1.9672096967697144, "Pretrain/Step": 7025, "Pretrain/Step Time": 8.505451198667288} +{"Pretrain/Learning Rate": 8.551623187146537e-06, "Pretrain/Loss": 2.017061948776245, "Pretrain/Loss (Raw)": 1.8323092460632324, "Pretrain/Step": 7026, "Pretrain/Step Time": 8.507303573191166} +{"Pretrain/Learning Rate": 8.545230627417539e-06, "Pretrain/Loss": 2.0157198905944824, "Pretrain/Loss (Raw)": 2.126781940460205, "Pretrain/Step": 7027, "Pretrain/Step Time": 8.502149656414986} +{"Pretrain/Learning Rate": 8.538839965330079e-06, "Pretrain/Loss": 2.0179390907287598, "Pretrain/Loss (Raw)": 2.069201946258545, "Pretrain/Step": 7028, "Pretrain/Step Time": 8.498624762520194} +{"Pretrain/Learning Rate": 8.532451201621156e-06, "Pretrain/Loss": 2.021008014678955, "Pretrain/Loss (Raw)": 2.291503667831421, "Pretrain/Step": 7029, "Pretrain/Step Time": 8.510399432852864} +{"Pretrain/Learning Rate": 8.526064337027565e-06, "Pretrain/Loss": 2.022814989089966, "Pretrain/Loss (Raw)": 2.2247366905212402, "Pretrain/Step": 7030, "Pretrain/Step Time": 8.508477048948407} +{"Pretrain/Learning Rate": 8.519679372285861e-06, "Pretrain/Loss": 2.023469924926758, "Pretrain/Loss (Raw)": 2.0236034393310547, "Pretrain/Step": 7031, "Pretrain/Step Time": 8.511418968439102} +{"Pretrain/Learning Rate": 8.51329630813239e-06, "Pretrain/Loss": 2.0242655277252197, "Pretrain/Loss (Raw)": 2.0476155281066895, "Pretrain/Step": 7032, "Pretrain/Step Time": 8.508480357006192} +{"Pretrain/Learning Rate": 8.506915145303268e-06, "Pretrain/Loss": 2.02587890625, "Pretrain/Loss (Raw)": 2.0685431957244873, "Pretrain/Step": 7033, "Pretrain/Step Time": 8.507563853636384} +{"Pretrain/Learning Rate": 8.50053588453442e-06, "Pretrain/Loss": 2.023237705230713, "Pretrain/Loss (Raw)": 1.719446063041687, "Pretrain/Step": 7034, "Pretrain/Step Time": 8.508036123588681} +{"Pretrain/Learning Rate": 8.49415852656152e-06, "Pretrain/Loss": 2.0224151611328125, "Pretrain/Loss (Raw)": 1.9492348432540894, "Pretrain/Step": 7035, "Pretrain/Step Time": 8.510347109287977} +{"Pretrain/Learning Rate": 8.487783072120036e-06, "Pretrain/Loss": 2.024977684020996, "Pretrain/Loss (Raw)": 1.9834166765213013, "Pretrain/Step": 7036, "Pretrain/Step Time": 8.51716460287571} +{"Pretrain/Learning Rate": 8.48140952194521e-06, "Pretrain/Loss": 2.0243630409240723, "Pretrain/Loss (Raw)": 2.1098382472991943, "Pretrain/Step": 7037, "Pretrain/Step Time": 8.517864849418402} +{"Pretrain/Learning Rate": 8.475037876772085e-06, "Pretrain/Loss": 2.023200511932373, "Pretrain/Loss (Raw)": 1.9515893459320068, "Pretrain/Step": 7038, "Pretrain/Step Time": 8.520462749525905} +{"Pretrain/Learning Rate": 8.468668137335459e-06, "Pretrain/Loss": 2.023651123046875, "Pretrain/Loss (Raw)": 1.9633277654647827, "Pretrain/Step": 7039, "Pretrain/Step Time": 8.50937982276082} +{"Pretrain/Learning Rate": 8.462300304369921e-06, "Pretrain/Loss": 2.0223774909973145, "Pretrain/Loss (Raw)": 1.893965721130371, "Pretrain/Step": 7040, "Pretrain/Step Time": 8.509601227939129} +{"Pretrain/Learning Rate": 8.455934378609834e-06, "Pretrain/Loss": 2.0201563835144043, "Pretrain/Loss (Raw)": 1.8004865646362305, "Pretrain/Step": 7041, "Pretrain/Step Time": 8.513765569776297} +{"Pretrain/Learning Rate": 8.449570360789358e-06, "Pretrain/Loss": 2.0228772163391113, "Pretrain/Loss (Raw)": 2.251426935195923, "Pretrain/Step": 7042, "Pretrain/Step Time": 8.517341567203403} +{"Pretrain/Learning Rate": 8.443208251642417e-06, "Pretrain/Loss": 2.0239620208740234, "Pretrain/Loss (Raw)": 1.9567039012908936, "Pretrain/Step": 7043, "Pretrain/Step Time": 8.51894997432828} +{"Pretrain/Learning Rate": 8.436848051902721e-06, "Pretrain/Loss": 2.0241200923919678, "Pretrain/Loss (Raw)": 2.067716121673584, "Pretrain/Step": 7044, "Pretrain/Step Time": 8.526548968628049} +{"Pretrain/Learning Rate": 8.430489762303745e-06, "Pretrain/Loss": 2.023858070373535, "Pretrain/Loss (Raw)": 1.9984196424484253, "Pretrain/Step": 7045, "Pretrain/Step Time": 8.513614835217595} +{"Pretrain/Learning Rate": 8.424133383578778e-06, "Pretrain/Loss": 2.02323317527771, "Pretrain/Loss (Raw)": 2.0027191638946533, "Pretrain/Step": 7046, "Pretrain/Step Time": 8.511551460251212} +{"Pretrain/Learning Rate": 8.417778916460856e-06, "Pretrain/Loss": 2.021942615509033, "Pretrain/Loss (Raw)": 1.9336878061294556, "Pretrain/Step": 7047, "Pretrain/Step Time": 8.51364224217832} +{"Pretrain/Learning Rate": 8.411426361682806e-06, "Pretrain/Loss": 2.024066925048828, "Pretrain/Loss (Raw)": 2.102128028869629, "Pretrain/Step": 7048, "Pretrain/Step Time": 8.520771365612745} +{"Pretrain/Learning Rate": 8.40507571997723e-06, "Pretrain/Loss": 2.0222995281219482, "Pretrain/Loss (Raw)": 1.7801991701126099, "Pretrain/Step": 7049, "Pretrain/Step Time": 8.52436108700931} +{"Pretrain/Learning Rate": 8.398726992076534e-06, "Pretrain/Loss": 2.0203685760498047, "Pretrain/Loss (Raw)": 1.9616248607635498, "Pretrain/Step": 7050, "Pretrain/Step Time": 8.5202202424407} +{"Pretrain/Learning Rate": 8.392380178712852e-06, "Pretrain/Loss": 2.018766403198242, "Pretrain/Loss (Raw)": 1.9340695142745972, "Pretrain/Step": 7051, "Pretrain/Step Time": 8.512830130755901} +{"Pretrain/Learning Rate": 8.386035280618156e-06, "Pretrain/Loss": 2.0195093154907227, "Pretrain/Loss (Raw)": 2.073819398880005, "Pretrain/Step": 7052, "Pretrain/Step Time": 8.515175618231297} +{"Pretrain/Learning Rate": 8.37969229852415e-06, "Pretrain/Loss": 2.0183022022247314, "Pretrain/Loss (Raw)": 2.053968906402588, "Pretrain/Step": 7053, "Pretrain/Step Time": 8.518607877194881} +{"Pretrain/Learning Rate": 8.373351233162362e-06, "Pretrain/Loss": 2.019526958465576, "Pretrain/Loss (Raw)": 2.006699323654175, "Pretrain/Step": 7054, "Pretrain/Step Time": 8.525229698047042} +{"Pretrain/Learning Rate": 8.367012085264042e-06, "Pretrain/Loss": 2.020388603210449, "Pretrain/Loss (Raw)": 2.1033096313476562, "Pretrain/Step": 7055, "Pretrain/Step Time": 8.526505948975682} +{"Pretrain/Learning Rate": 8.360674855560274e-06, "Pretrain/Loss": 2.021711826324463, "Pretrain/Loss (Raw)": 2.1407840251922607, "Pretrain/Step": 7056, "Pretrain/Step Time": 8.525611370801926} +{"Pretrain/Learning Rate": 8.354339544781878e-06, "Pretrain/Loss": 2.0216832160949707, "Pretrain/Loss (Raw)": 2.0516390800476074, "Pretrain/Step": 7057, "Pretrain/Step Time": 8.5232057236135} +{"Pretrain/Learning Rate": 8.348006153659502e-06, "Pretrain/Loss": 2.023786783218384, "Pretrain/Loss (Raw)": 2.108736515045166, "Pretrain/Step": 7058, "Pretrain/Step Time": 8.517565099522471} +{"Pretrain/Learning Rate": 8.341674682923503e-06, "Pretrain/Loss": 2.0252439975738525, "Pretrain/Loss (Raw)": 2.1837642192840576, "Pretrain/Step": 7059, "Pretrain/Step Time": 8.525888798758388} +{"Pretrain/Learning Rate": 8.335345133304088e-06, "Pretrain/Loss": 2.0257444381713867, "Pretrain/Loss (Raw)": 1.9873682260513306, "Pretrain/Step": 7060, "Pretrain/Step Time": 8.525667186826468} +{"Pretrain/Learning Rate": 8.329017505531195e-06, "Pretrain/Loss": 2.02357816696167, "Pretrain/Loss (Raw)": 1.7857013940811157, "Pretrain/Step": 7061, "Pretrain/Step Time": 8.525265982374549} +{"Pretrain/Learning Rate": 8.322691800334562e-06, "Pretrain/Loss": 2.0218687057495117, "Pretrain/Loss (Raw)": 1.86592698097229, "Pretrain/Step": 7062, "Pretrain/Step Time": 8.523645317181945} +{"Pretrain/Learning Rate": 8.316368018443688e-06, "Pretrain/Loss": 2.019760847091675, "Pretrain/Loss (Raw)": 1.8695238828659058, "Pretrain/Step": 7063, "Pretrain/Step Time": 8.511271260678768} +{"Pretrain/Learning Rate": 8.310046160587878e-06, "Pretrain/Loss": 2.0178542137145996, "Pretrain/Loss (Raw)": 1.8015681505203247, "Pretrain/Step": 7064, "Pretrain/Step Time": 8.512743616476655} +{"Pretrain/Learning Rate": 8.303726227496191e-06, "Pretrain/Loss": 2.0182857513427734, "Pretrain/Loss (Raw)": 1.9773153066635132, "Pretrain/Step": 7065, "Pretrain/Step Time": 8.514550734311342} +{"Pretrain/Learning Rate": 8.297408219897471e-06, "Pretrain/Loss": 2.0184202194213867, "Pretrain/Loss (Raw)": 2.0161356925964355, "Pretrain/Step": 7066, "Pretrain/Step Time": 8.51501207984984} +{"Pretrain/Learning Rate": 8.291092138520332e-06, "Pretrain/Loss": 2.019294261932373, "Pretrain/Loss (Raw)": 2.1163101196289062, "Pretrain/Step": 7067, "Pretrain/Step Time": 8.515553263947368} +{"Pretrain/Learning Rate": 8.28477798409319e-06, "Pretrain/Loss": 2.0187795162200928, "Pretrain/Loss (Raw)": 1.8768150806427002, "Pretrain/Step": 7068, "Pretrain/Step Time": 8.509891163557768} +{"Pretrain/Learning Rate": 8.278465757344214e-06, "Pretrain/Loss": 2.018792152404785, "Pretrain/Loss (Raw)": 2.094691753387451, "Pretrain/Step": 7069, "Pretrain/Step Time": 8.506579205393791} +{"Pretrain/Learning Rate": 8.272155459001366e-06, "Pretrain/Loss": 2.018308162689209, "Pretrain/Loss (Raw)": 1.836296796798706, "Pretrain/Step": 7070, "Pretrain/Step Time": 8.502421136945486} +{"Pretrain/Learning Rate": 8.265847089792362e-06, "Pretrain/Loss": 2.0205001831054688, "Pretrain/Loss (Raw)": 2.1534488201141357, "Pretrain/Step": 7071, "Pretrain/Step Time": 8.513981049880385} +{"Pretrain/Learning Rate": 8.259540650444736e-06, "Pretrain/Loss": 2.0199201107025146, "Pretrain/Loss (Raw)": 2.074867010116577, "Pretrain/Step": 7072, "Pretrain/Step Time": 8.522113272920251} +{"Pretrain/Learning Rate": 8.253236141685764e-06, "Pretrain/Loss": 2.020503520965576, "Pretrain/Loss (Raw)": 1.8807977437973022, "Pretrain/Step": 7073, "Pretrain/Step Time": 8.52503545023501} +{"Pretrain/Learning Rate": 8.246933564242506e-06, "Pretrain/Loss": 2.02052640914917, "Pretrain/Loss (Raw)": 1.9118224382400513, "Pretrain/Step": 7074, "Pretrain/Step Time": 8.523421600461006} +{"Pretrain/Learning Rate": 8.240632918841823e-06, "Pretrain/Loss": 2.019721508026123, "Pretrain/Loss (Raw)": 2.0370161533355713, "Pretrain/Step": 7075, "Pretrain/Step Time": 8.516460610553622} +{"Pretrain/Learning Rate": 8.234334206210323e-06, "Pretrain/Loss": 2.0190601348876953, "Pretrain/Loss (Raw)": 2.0859456062316895, "Pretrain/Step": 7076, "Pretrain/Step Time": 8.515110416337848} +{"Pretrain/Learning Rate": 8.228037427074403e-06, "Pretrain/Loss": 2.0168604850769043, "Pretrain/Loss (Raw)": 1.6661967039108276, "Pretrain/Step": 7077, "Pretrain/Step Time": 8.521909847855568} +{"Pretrain/Learning Rate": 8.221742582160233e-06, "Pretrain/Loss": 2.017371654510498, "Pretrain/Loss (Raw)": 2.0018951892852783, "Pretrain/Step": 7078, "Pretrain/Step Time": 8.5226621478796} +{"Pretrain/Learning Rate": 8.215449672193776e-06, "Pretrain/Loss": 2.016732692718506, "Pretrain/Loss (Raw)": 2.0177321434020996, "Pretrain/Step": 7079, "Pretrain/Step Time": 8.521347707137465} +{"Pretrain/Learning Rate": 8.209158697900757e-06, "Pretrain/Loss": 2.015859365463257, "Pretrain/Loss (Raw)": 1.7567901611328125, "Pretrain/Step": 7080, "Pretrain/Step Time": 8.52547931484878} +{"Pretrain/Learning Rate": 8.202869660006676e-06, "Pretrain/Loss": 2.0181095600128174, "Pretrain/Loss (Raw)": 2.0031256675720215, "Pretrain/Step": 7081, "Pretrain/Step Time": 8.519918166100979} +{"Pretrain/Learning Rate": 8.19658255923681e-06, "Pretrain/Loss": 2.016545295715332, "Pretrain/Loss (Raw)": 2.043846845626831, "Pretrain/Step": 7082, "Pretrain/Step Time": 8.514188403263688} +{"Pretrain/Learning Rate": 8.19029739631623e-06, "Pretrain/Loss": 2.01851224899292, "Pretrain/Loss (Raw)": 2.122673511505127, "Pretrain/Step": 7083, "Pretrain/Step Time": 8.521178018301725} +{"Pretrain/Learning Rate": 8.184014171969765e-06, "Pretrain/Loss": 2.0204269886016846, "Pretrain/Loss (Raw)": 2.0813567638397217, "Pretrain/Step": 7084, "Pretrain/Step Time": 8.520714035257697} +{"Pretrain/Learning Rate": 8.177732886922023e-06, "Pretrain/Loss": 2.0194783210754395, "Pretrain/Loss (Raw)": 1.825490117073059, "Pretrain/Step": 7085, "Pretrain/Step Time": 8.521387292072177} +{"Pretrain/Learning Rate": 8.17145354189739e-06, "Pretrain/Loss": 2.019474983215332, "Pretrain/Loss (Raw)": 2.0759150981903076, "Pretrain/Step": 7086, "Pretrain/Step Time": 8.517572006210685} +{"Pretrain/Learning Rate": 8.16517613762004e-06, "Pretrain/Loss": 2.0192389488220215, "Pretrain/Loss (Raw)": 2.055755138397217, "Pretrain/Step": 7087, "Pretrain/Step Time": 8.51809248700738} +{"Pretrain/Learning Rate": 8.158900674813904e-06, "Pretrain/Loss": 2.0242855548858643, "Pretrain/Loss (Raw)": 2.5987930297851562, "Pretrain/Step": 7088, "Pretrain/Step Time": 8.507743598893285} +{"Pretrain/Learning Rate": 8.1526271542027e-06, "Pretrain/Loss": 2.023733139038086, "Pretrain/Loss (Raw)": 2.042433738708496, "Pretrain/Step": 7089, "Pretrain/Step Time": 8.51138512417674} +{"Pretrain/Learning Rate": 8.146355576509915e-06, "Pretrain/Loss": 2.0228729248046875, "Pretrain/Loss (Raw)": 1.940909504890442, "Pretrain/Step": 7090, "Pretrain/Step Time": 8.5169661603868} +{"Pretrain/Learning Rate": 8.140085942458828e-06, "Pretrain/Loss": 2.0240795612335205, "Pretrain/Loss (Raw)": 2.043365001678467, "Pretrain/Step": 7091, "Pretrain/Step Time": 8.51161077618599} +{"Pretrain/Learning Rate": 8.133818252772476e-06, "Pretrain/Loss": 2.022244453430176, "Pretrain/Loss (Raw)": 1.8777738809585571, "Pretrain/Step": 7092, "Pretrain/Step Time": 8.510345993563533} +{"Pretrain/Learning Rate": 8.12755250817368e-06, "Pretrain/Loss": 2.0252685546875, "Pretrain/Loss (Raw)": 2.2175257205963135, "Pretrain/Step": 7093, "Pretrain/Step Time": 8.499838322401047} +{"Pretrain/Learning Rate": 8.121288709385025e-06, "Pretrain/Loss": 2.026291847229004, "Pretrain/Loss (Raw)": 2.2386369705200195, "Pretrain/Step": 7094, "Pretrain/Step Time": 8.501508548855782} +{"Pretrain/Learning Rate": 8.11502685712891e-06, "Pretrain/Loss": 2.0262365341186523, "Pretrain/Loss (Raw)": 2.0125458240509033, "Pretrain/Step": 7095, "Pretrain/Step Time": 8.510600350797176} +{"Pretrain/Learning Rate": 8.108766952127445e-06, "Pretrain/Loss": 2.0251660346984863, "Pretrain/Loss (Raw)": 1.9340988397598267, "Pretrain/Step": 7096, "Pretrain/Step Time": 8.514061203226447} +{"Pretrain/Learning Rate": 8.102508995102576e-06, "Pretrain/Loss": 2.0235424041748047, "Pretrain/Loss (Raw)": 1.8524532318115234, "Pretrain/Step": 7097, "Pretrain/Step Time": 8.511703949421644} +{"Pretrain/Learning Rate": 8.096252986775985e-06, "Pretrain/Loss": 2.0230917930603027, "Pretrain/Loss (Raw)": 1.9104000329971313, "Pretrain/Step": 7098, "Pretrain/Step Time": 8.503326922655106} +{"Pretrain/Learning Rate": 8.089998927869172e-06, "Pretrain/Loss": 2.0207786560058594, "Pretrain/Loss (Raw)": 1.7503974437713623, "Pretrain/Step": 7099, "Pretrain/Step Time": 8.498891627416015} +{"Pretrain/Learning Rate": 8.083746819103346e-06, "Pretrain/Loss": 2.0179762840270996, "Pretrain/Loss (Raw)": 1.8720438480377197, "Pretrain/Step": 7100, "Pretrain/Step Time": 8.494702255353332} +{"Pretrain/Learning Rate": 8.077496661199557e-06, "Pretrain/Loss": 2.0202345848083496, "Pretrain/Loss (Raw)": 2.0584287643432617, "Pretrain/Step": 7101, "Pretrain/Step Time": 8.500163009390235} +{"Pretrain/Learning Rate": 8.071248454878596e-06, "Pretrain/Loss": 2.0191898345947266, "Pretrain/Loss (Raw)": 2.0994837284088135, "Pretrain/Step": 7102, "Pretrain/Step Time": 8.501477394253016} +{"Pretrain/Learning Rate": 8.065002200861033e-06, "Pretrain/Loss": 2.018095016479492, "Pretrain/Loss (Raw)": 1.9462461471557617, "Pretrain/Step": 7103, "Pretrain/Step Time": 8.49839791096747} +{"Pretrain/Learning Rate": 8.058757899867209e-06, "Pretrain/Loss": 2.0173792839050293, "Pretrain/Loss (Raw)": 2.0151000022888184, "Pretrain/Step": 7104, "Pretrain/Step Time": 8.49220427684486} +{"Pretrain/Learning Rate": 8.052515552617262e-06, "Pretrain/Loss": 2.014657735824585, "Pretrain/Loss (Raw)": 1.8581626415252686, "Pretrain/Step": 7105, "Pretrain/Step Time": 8.496660267934203} +{"Pretrain/Learning Rate": 8.04627515983108e-06, "Pretrain/Loss": 2.0164108276367188, "Pretrain/Loss (Raw)": 2.2315280437469482, "Pretrain/Step": 7106, "Pretrain/Step Time": 8.501240331679583} +{"Pretrain/Learning Rate": 8.040036722228336e-06, "Pretrain/Loss": 2.015455961227417, "Pretrain/Loss (Raw)": 1.8936586380004883, "Pretrain/Step": 7107, "Pretrain/Step Time": 8.50476292707026} +{"Pretrain/Learning Rate": 8.033800240528466e-06, "Pretrain/Loss": 2.0156073570251465, "Pretrain/Loss (Raw)": 2.136890411376953, "Pretrain/Step": 7108, "Pretrain/Step Time": 8.50827769562602} +{"Pretrain/Learning Rate": 8.027565715450707e-06, "Pretrain/Loss": 2.0151519775390625, "Pretrain/Loss (Raw)": 2.060000419616699, "Pretrain/Step": 7109, "Pretrain/Step Time": 8.508917754516006} +{"Pretrain/Learning Rate": 8.02133314771405e-06, "Pretrain/Loss": 2.017165422439575, "Pretrain/Loss (Raw)": 2.184938430786133, "Pretrain/Step": 7110, "Pretrain/Step Time": 8.50449413061142} +{"Pretrain/Learning Rate": 8.015102538037255e-06, "Pretrain/Loss": 2.0155105590820312, "Pretrain/Loss (Raw)": 1.865234613418579, "Pretrain/Step": 7111, "Pretrain/Step Time": 8.501591397449374} +{"Pretrain/Learning Rate": 8.008873887138868e-06, "Pretrain/Loss": 2.0147318840026855, "Pretrain/Loss (Raw)": 1.8475303649902344, "Pretrain/Step": 7112, "Pretrain/Step Time": 8.506205167621374} +{"Pretrain/Learning Rate": 8.002647195737214e-06, "Pretrain/Loss": 2.0161499977111816, "Pretrain/Loss (Raw)": 2.0657646656036377, "Pretrain/Step": 7113, "Pretrain/Step Time": 8.51038820296526} +{"Pretrain/Learning Rate": 7.996422464550382e-06, "Pretrain/Loss": 2.015261173248291, "Pretrain/Loss (Raw)": 1.852954387664795, "Pretrain/Step": 7114, "Pretrain/Step Time": 8.519773526117206} +{"Pretrain/Learning Rate": 7.990199694296224e-06, "Pretrain/Loss": 2.01481556892395, "Pretrain/Loss (Raw)": 2.006308078765869, "Pretrain/Step": 7115, "Pretrain/Step Time": 8.516091860830784} +{"Pretrain/Learning Rate": 7.9839788856924e-06, "Pretrain/Loss": 2.0139708518981934, "Pretrain/Loss (Raw)": 2.0014865398406982, "Pretrain/Step": 7116, "Pretrain/Step Time": 8.509945388883352} +{"Pretrain/Learning Rate": 7.977760039456313e-06, "Pretrain/Loss": 2.014518976211548, "Pretrain/Loss (Raw)": 1.9726752042770386, "Pretrain/Step": 7117, "Pretrain/Step Time": 8.507456859573722} +{"Pretrain/Learning Rate": 7.97154315630515e-06, "Pretrain/Loss": 2.014667510986328, "Pretrain/Loss (Raw)": 2.1081671714782715, "Pretrain/Step": 7118, "Pretrain/Step Time": 8.510648114606738} +{"Pretrain/Learning Rate": 7.965328236955862e-06, "Pretrain/Loss": 2.0142292976379395, "Pretrain/Loss (Raw)": 2.0976498126983643, "Pretrain/Step": 7119, "Pretrain/Step Time": 8.513301869854331} +{"Pretrain/Learning Rate": 7.959115282125198e-06, "Pretrain/Loss": 2.0131187438964844, "Pretrain/Loss (Raw)": 1.9783653020858765, "Pretrain/Step": 7120, "Pretrain/Step Time": 8.519550187513232} +{"Pretrain/Learning Rate": 7.952904292529661e-06, "Pretrain/Loss": 2.0122597217559814, "Pretrain/Loss (Raw)": 2.010773181915283, "Pretrain/Step": 7121, "Pretrain/Step Time": 8.515919016674161} +{"Pretrain/Learning Rate": 7.946695268885531e-06, "Pretrain/Loss": 2.0088462829589844, "Pretrain/Loss (Raw)": 1.8366152048110962, "Pretrain/Step": 7122, "Pretrain/Step Time": 8.506823468953371} +{"Pretrain/Learning Rate": 7.94048821190885e-06, "Pretrain/Loss": 2.007133960723877, "Pretrain/Loss (Raw)": 1.8324917554855347, "Pretrain/Step": 7123, "Pretrain/Step Time": 8.501476626843214} +{"Pretrain/Learning Rate": 7.934283122315464e-06, "Pretrain/Loss": 2.0041661262512207, "Pretrain/Loss (Raw)": 1.7408684492111206, "Pretrain/Step": 7124, "Pretrain/Step Time": 8.509441556409001} +{"Pretrain/Learning Rate": 7.928080000820968e-06, "Pretrain/Loss": 2.003626823425293, "Pretrain/Loss (Raw)": 1.8356512784957886, "Pretrain/Step": 7125, "Pretrain/Step Time": 8.520644318312407} +{"Pretrain/Learning Rate": 7.921878848140727e-06, "Pretrain/Loss": 2.0053935050964355, "Pretrain/Loss (Raw)": 2.224687337875366, "Pretrain/Step": 7126, "Pretrain/Step Time": 8.521888379007578} +{"Pretrain/Learning Rate": 7.915679664989887e-06, "Pretrain/Loss": 2.0045504570007324, "Pretrain/Loss (Raw)": 2.1444430351257324, "Pretrain/Step": 7127, "Pretrain/Step Time": 8.516794512048364} +{"Pretrain/Learning Rate": 7.909482452083378e-06, "Pretrain/Loss": 2.005739212036133, "Pretrain/Loss (Raw)": 2.2236595153808594, "Pretrain/Step": 7128, "Pretrain/Step Time": 8.514052936807275} +{"Pretrain/Learning Rate": 7.903287210135888e-06, "Pretrain/Loss": 2.0072884559631348, "Pretrain/Loss (Raw)": 2.1446874141693115, "Pretrain/Step": 7129, "Pretrain/Step Time": 8.510092578828335} +{"Pretrain/Learning Rate": 7.897093939861877e-06, "Pretrain/Loss": 2.007071018218994, "Pretrain/Loss (Raw)": 2.062558650970459, "Pretrain/Step": 7130, "Pretrain/Step Time": 8.512701012194157} +{"Pretrain/Learning Rate": 7.890902641975576e-06, "Pretrain/Loss": 2.00604248046875, "Pretrain/Loss (Raw)": 2.0317459106445312, "Pretrain/Step": 7131, "Pretrain/Step Time": 8.516837188974023} +{"Pretrain/Learning Rate": 7.884713317191011e-06, "Pretrain/Loss": 2.007321357727051, "Pretrain/Loss (Raw)": 1.9798119068145752, "Pretrain/Step": 7132, "Pretrain/Step Time": 8.521057389676571} +{"Pretrain/Learning Rate": 7.878525966221958e-06, "Pretrain/Loss": 2.006117343902588, "Pretrain/Loss (Raw)": 1.9407960176467896, "Pretrain/Step": 7133, "Pretrain/Step Time": 8.517091458663344} +{"Pretrain/Learning Rate": 7.87234058978197e-06, "Pretrain/Loss": 2.009537696838379, "Pretrain/Loss (Raw)": 2.3114817142486572, "Pretrain/Step": 7134, "Pretrain/Step Time": 8.514613512903452} +{"Pretrain/Learning Rate": 7.866157188584364e-06, "Pretrain/Loss": 2.0091423988342285, "Pretrain/Loss (Raw)": 1.8119834661483765, "Pretrain/Step": 7135, "Pretrain/Step Time": 8.513529343530536} +{"Pretrain/Learning Rate": 7.859975763342264e-06, "Pretrain/Loss": 2.0050625801086426, "Pretrain/Loss (Raw)": 1.6727752685546875, "Pretrain/Step": 7136, "Pretrain/Step Time": 8.520013658329844} +{"Pretrain/Learning Rate": 7.85379631476851e-06, "Pretrain/Loss": 2.006239891052246, "Pretrain/Loss (Raw)": 2.1206111907958984, "Pretrain/Step": 7137, "Pretrain/Step Time": 8.522257458418608} +{"Pretrain/Learning Rate": 7.847618843575769e-06, "Pretrain/Loss": 2.0029408931732178, "Pretrain/Loss (Raw)": 1.8885306119918823, "Pretrain/Step": 7138, "Pretrain/Step Time": 8.523697040975094} +{"Pretrain/Learning Rate": 7.84144335047644e-06, "Pretrain/Loss": 2.002889394760132, "Pretrain/Loss (Raw)": 2.006192684173584, "Pretrain/Step": 7139, "Pretrain/Step Time": 8.512938709929585} +{"Pretrain/Learning Rate": 7.835269836182733e-06, "Pretrain/Loss": 2.0027153491973877, "Pretrain/Loss (Raw)": 2.066664934158325, "Pretrain/Step": 7140, "Pretrain/Step Time": 8.510190386325121} +{"Pretrain/Learning Rate": 7.829098301406576e-06, "Pretrain/Loss": 2.001246929168701, "Pretrain/Loss (Raw)": 1.955438494682312, "Pretrain/Step": 7141, "Pretrain/Step Time": 8.506400614976883} +{"Pretrain/Learning Rate": 7.82292874685972e-06, "Pretrain/Loss": 1.999966025352478, "Pretrain/Loss (Raw)": 1.9366265535354614, "Pretrain/Step": 7142, "Pretrain/Step Time": 8.513622039929032} +{"Pretrain/Learning Rate": 7.816761173253665e-06, "Pretrain/Loss": 2.001709222793579, "Pretrain/Loss (Raw)": 2.0319015979766846, "Pretrain/Step": 7143, "Pretrain/Step Time": 8.51030744239688} +{"Pretrain/Learning Rate": 7.810595581299681e-06, "Pretrain/Loss": 2.0018861293792725, "Pretrain/Loss (Raw)": 2.1488142013549805, "Pretrain/Step": 7144, "Pretrain/Step Time": 8.510783763602376} +{"Pretrain/Learning Rate": 7.804431971708807e-06, "Pretrain/Loss": 2.0014476776123047, "Pretrain/Loss (Raw)": 2.0329902172088623, "Pretrain/Step": 7145, "Pretrain/Step Time": 8.504418570548296} +{"Pretrain/Learning Rate": 7.798270345191871e-06, "Pretrain/Loss": 1.9991979598999023, "Pretrain/Loss (Raw)": 1.6999218463897705, "Pretrain/Step": 7146, "Pretrain/Step Time": 8.507565962150693} +{"Pretrain/Learning Rate": 7.792110702459456e-06, "Pretrain/Loss": 2.0005106925964355, "Pretrain/Loss (Raw)": 2.195466995239258, "Pretrain/Step": 7147, "Pretrain/Step Time": 8.504725374281406} +{"Pretrain/Learning Rate": 7.785953044221924e-06, "Pretrain/Loss": 1.999903678894043, "Pretrain/Loss (Raw)": 1.9039522409439087, "Pretrain/Step": 7148, "Pretrain/Step Time": 8.515741361305118} +{"Pretrain/Learning Rate": 7.779797371189394e-06, "Pretrain/Loss": 1.9994125366210938, "Pretrain/Loss (Raw)": 1.896370768547058, "Pretrain/Step": 7149, "Pretrain/Step Time": 8.516750873997808} +{"Pretrain/Learning Rate": 7.77364368407178e-06, "Pretrain/Loss": 1.9977236986160278, "Pretrain/Loss (Raw)": 1.9515825510025024, "Pretrain/Step": 7150, "Pretrain/Step Time": 8.518977163359523} +{"Pretrain/Learning Rate": 7.767491983578751e-06, "Pretrain/Loss": 1.99869966506958, "Pretrain/Loss (Raw)": 2.0249288082122803, "Pretrain/Step": 7151, "Pretrain/Step Time": 8.516736716032028} +{"Pretrain/Learning Rate": 7.76134227041975e-06, "Pretrain/Loss": 1.9999468326568604, "Pretrain/Loss (Raw)": 1.999647617340088, "Pretrain/Step": 7152, "Pretrain/Step Time": 8.510264579206705} +{"Pretrain/Learning Rate": 7.755194545303982e-06, "Pretrain/Loss": 2.000919818878174, "Pretrain/Loss (Raw)": 2.0917422771453857, "Pretrain/Step": 7153, "Pretrain/Step Time": 8.513819141313434} +{"Pretrain/Learning Rate": 7.749048808940445e-06, "Pretrain/Loss": 2.003007411956787, "Pretrain/Loss (Raw)": 2.0995450019836426, "Pretrain/Step": 7154, "Pretrain/Step Time": 8.517303541302681} +{"Pretrain/Learning Rate": 7.742905062037891e-06, "Pretrain/Loss": 2.0023460388183594, "Pretrain/Loss (Raw)": 2.042144298553467, "Pretrain/Step": 7155, "Pretrain/Step Time": 8.522012723609805} +{"Pretrain/Learning Rate": 7.736763305304834e-06, "Pretrain/Loss": 2.0022478103637695, "Pretrain/Loss (Raw)": 2.056614637374878, "Pretrain/Step": 7156, "Pretrain/Step Time": 8.527517918497324} +{"Pretrain/Learning Rate": 7.730623539449588e-06, "Pretrain/Loss": 1.9983210563659668, "Pretrain/Loss (Raw)": 1.788869023323059, "Pretrain/Step": 7157, "Pretrain/Step Time": 8.518935203552246} +{"Pretrain/Learning Rate": 7.724485765180212e-06, "Pretrain/Loss": 1.9989134073257446, "Pretrain/Loss (Raw)": 2.300565004348755, "Pretrain/Step": 7158, "Pretrain/Step Time": 8.514116005972028} +{"Pretrain/Learning Rate": 7.71834998320454e-06, "Pretrain/Loss": 1.9993476867675781, "Pretrain/Loss (Raw)": 2.0792019367218018, "Pretrain/Step": 7159, "Pretrain/Step Time": 8.519405676051974} +{"Pretrain/Learning Rate": 7.712216194230177e-06, "Pretrain/Loss": 1.997768759727478, "Pretrain/Loss (Raw)": 1.8454980850219727, "Pretrain/Step": 7160, "Pretrain/Step Time": 8.527940142899752} +{"Pretrain/Learning Rate": 7.70608439896451e-06, "Pretrain/Loss": 1.9970967769622803, "Pretrain/Loss (Raw)": 1.9825313091278076, "Pretrain/Step": 7161, "Pretrain/Step Time": 8.523532068356872} +{"Pretrain/Learning Rate": 7.699954598114684e-06, "Pretrain/Loss": 2.001110553741455, "Pretrain/Loss (Raw)": 2.233192205429077, "Pretrain/Step": 7162, "Pretrain/Step Time": 8.524349642917514} +{"Pretrain/Learning Rate": 7.693826792387613e-06, "Pretrain/Loss": 2.001809597015381, "Pretrain/Loss (Raw)": 2.0387539863586426, "Pretrain/Step": 7163, "Pretrain/Step Time": 8.519033269956708} +{"Pretrain/Learning Rate": 7.68770098248998e-06, "Pretrain/Loss": 2.002293109893799, "Pretrain/Loss (Raw)": 2.0452663898468018, "Pretrain/Step": 7164, "Pretrain/Step Time": 8.51246665045619} +{"Pretrain/Learning Rate": 7.681577169128251e-06, "Pretrain/Loss": 2.0014936923980713, "Pretrain/Loss (Raw)": 2.0075180530548096, "Pretrain/Step": 7165, "Pretrain/Step Time": 8.514167649671435} +{"Pretrain/Learning Rate": 7.675455353008653e-06, "Pretrain/Loss": 2.003552198410034, "Pretrain/Loss (Raw)": 2.2150931358337402, "Pretrain/Step": 7166, "Pretrain/Step Time": 8.514448886737227} +{"Pretrain/Learning Rate": 7.669335534837183e-06, "Pretrain/Loss": 2.003445625305176, "Pretrain/Loss (Raw)": 1.9496827125549316, "Pretrain/Step": 7167, "Pretrain/Step Time": 8.51825794763863} +{"Pretrain/Learning Rate": 7.66321771531959e-06, "Pretrain/Loss": 2.0023932456970215, "Pretrain/Loss (Raw)": 1.7592577934265137, "Pretrain/Step": 7168, "Pretrain/Step Time": 8.51954646781087} +{"Pretrain/Learning Rate": 7.657101895161437e-06, "Pretrain/Loss": 2.00305438041687, "Pretrain/Loss (Raw)": 1.8851051330566406, "Pretrain/Step": 7169, "Pretrain/Step Time": 8.514648320153356} +{"Pretrain/Learning Rate": 7.650988075068011e-06, "Pretrain/Loss": 2.001117706298828, "Pretrain/Loss (Raw)": 2.003532648086548, "Pretrain/Step": 7170, "Pretrain/Step Time": 8.51671164855361} +{"Pretrain/Learning Rate": 7.644876255744393e-06, "Pretrain/Loss": 2.001433849334717, "Pretrain/Loss (Raw)": 1.9971954822540283, "Pretrain/Step": 7171, "Pretrain/Step Time": 8.522686321288347} +{"Pretrain/Learning Rate": 7.63876643789542e-06, "Pretrain/Loss": 1.9998931884765625, "Pretrain/Loss (Raw)": 1.870485782623291, "Pretrain/Step": 7172, "Pretrain/Step Time": 8.515804469585419} +{"Pretrain/Learning Rate": 7.632658622225713e-06, "Pretrain/Loss": 2.000401496887207, "Pretrain/Loss (Raw)": 2.0634984970092773, "Pretrain/Step": 7173, "Pretrain/Step Time": 8.522672101855278} +{"Pretrain/Learning Rate": 7.626552809439655e-06, "Pretrain/Loss": 1.9984018802642822, "Pretrain/Loss (Raw)": 1.7467750310897827, "Pretrain/Step": 7174, "Pretrain/Step Time": 8.52513605542481} +{"Pretrain/Learning Rate": 7.620449000241395e-06, "Pretrain/Loss": 1.9990832805633545, "Pretrain/Loss (Raw)": 2.0208992958068848, "Pretrain/Step": 7175, "Pretrain/Step Time": 8.520590625703335} +{"Pretrain/Learning Rate": 7.614347195334839e-06, "Pretrain/Loss": 2.0003364086151123, "Pretrain/Loss (Raw)": 2.2625246047973633, "Pretrain/Step": 7176, "Pretrain/Step Time": 8.517114751040936} +{"Pretrain/Learning Rate": 7.6082473954237066e-06, "Pretrain/Loss": 2.003068447113037, "Pretrain/Loss (Raw)": 2.1299006938934326, "Pretrain/Step": 7177, "Pretrain/Step Time": 8.520205713808537} +{"Pretrain/Learning Rate": 7.602149601211422e-06, "Pretrain/Loss": 2.0023837089538574, "Pretrain/Loss (Raw)": 1.8739866018295288, "Pretrain/Step": 7178, "Pretrain/Step Time": 8.519587498158216} +{"Pretrain/Learning Rate": 7.596053813401233e-06, "Pretrain/Loss": 2.0041184425354004, "Pretrain/Loss (Raw)": 2.1561028957366943, "Pretrain/Step": 7179, "Pretrain/Step Time": 8.522687388584018} +{"Pretrain/Learning Rate": 7.589960032696122e-06, "Pretrain/Loss": 2.0044994354248047, "Pretrain/Loss (Raw)": 2.1225922107696533, "Pretrain/Step": 7180, "Pretrain/Step Time": 8.521832974627614} +{"Pretrain/Learning Rate": 7.583868259798874e-06, "Pretrain/Loss": 2.006465435028076, "Pretrain/Loss (Raw)": 2.3056182861328125, "Pretrain/Step": 7181, "Pretrain/Step Time": 8.517048908397555} +{"Pretrain/Learning Rate": 7.5777784954119885e-06, "Pretrain/Loss": 2.0072596073150635, "Pretrain/Loss (Raw)": 2.10836124420166, "Pretrain/Step": 7182, "Pretrain/Step Time": 8.50801889412105} +{"Pretrain/Learning Rate": 7.5716907402377915e-06, "Pretrain/Loss": 2.0067687034606934, "Pretrain/Loss (Raw)": 2.0404856204986572, "Pretrain/Step": 7183, "Pretrain/Step Time": 8.506815763190389} +{"Pretrain/Learning Rate": 7.565604994978337e-06, "Pretrain/Loss": 2.006572723388672, "Pretrain/Loss (Raw)": 2.1156721115112305, "Pretrain/Step": 7184, "Pretrain/Step Time": 8.510636862367392} +{"Pretrain/Learning Rate": 7.559521260335483e-06, "Pretrain/Loss": 2.0071394443511963, "Pretrain/Loss (Raw)": 2.124180555343628, "Pretrain/Step": 7185, "Pretrain/Step Time": 8.513359233736992} +{"Pretrain/Learning Rate": 7.553439537010803e-06, "Pretrain/Loss": 2.0060839653015137, "Pretrain/Loss (Raw)": 1.9736411571502686, "Pretrain/Step": 7186, "Pretrain/Step Time": 8.511289240792394} +{"Pretrain/Learning Rate": 7.547359825705696e-06, "Pretrain/Loss": 2.0057544708251953, "Pretrain/Loss (Raw)": 2.1416003704071045, "Pretrain/Step": 7187, "Pretrain/Step Time": 8.50668815150857} +{"Pretrain/Learning Rate": 7.541282127121291e-06, "Pretrain/Loss": 2.004950523376465, "Pretrain/Loss (Raw)": 1.884454607963562, "Pretrain/Step": 7188, "Pretrain/Step Time": 8.508787924423814} +{"Pretrain/Learning Rate": 7.5352064419585e-06, "Pretrain/Loss": 2.0072078704833984, "Pretrain/Loss (Raw)": 2.0746519565582275, "Pretrain/Step": 7189, "Pretrain/Step Time": 8.507209109142423} +{"Pretrain/Learning Rate": 7.529132770917993e-06, "Pretrain/Loss": 2.0094597339630127, "Pretrain/Loss (Raw)": 2.1541576385498047, "Pretrain/Step": 7190, "Pretrain/Step Time": 8.520059114322066} +{"Pretrain/Learning Rate": 7.523061114700228e-06, "Pretrain/Loss": 2.010680675506592, "Pretrain/Loss (Raw)": 2.025819778442383, "Pretrain/Step": 7191, "Pretrain/Step Time": 8.517828088253736} +{"Pretrain/Learning Rate": 7.516991474005408e-06, "Pretrain/Loss": 2.0135302543640137, "Pretrain/Loss (Raw)": 2.1662817001342773, "Pretrain/Step": 7192, "Pretrain/Step Time": 8.52154684253037} +{"Pretrain/Learning Rate": 7.510923849533513e-06, "Pretrain/Loss": 2.0136444568634033, "Pretrain/Loss (Raw)": 1.9919415712356567, "Pretrain/Step": 7193, "Pretrain/Step Time": 8.51460968144238} +{"Pretrain/Learning Rate": 7.504858241984286e-06, "Pretrain/Loss": 2.0147390365600586, "Pretrain/Loss (Raw)": 2.1562507152557373, "Pretrain/Step": 7194, "Pretrain/Step Time": 8.518009116873145} +{"Pretrain/Learning Rate": 7.498794652057251e-06, "Pretrain/Loss": 2.010560989379883, "Pretrain/Loss (Raw)": 1.5815277099609375, "Pretrain/Step": 7195, "Pretrain/Step Time": 8.520268036052585} +{"Pretrain/Learning Rate": 7.492733080451686e-06, "Pretrain/Loss": 2.011023759841919, "Pretrain/Loss (Raw)": 1.9360334873199463, "Pretrain/Step": 7196, "Pretrain/Step Time": 8.51997309923172} +{"Pretrain/Learning Rate": 7.486673527866633e-06, "Pretrain/Loss": 2.0111730098724365, "Pretrain/Loss (Raw)": 2.11381459236145, "Pretrain/Step": 7197, "Pretrain/Step Time": 8.52599130384624} +{"Pretrain/Learning Rate": 7.4806159950009196e-06, "Pretrain/Loss": 2.0107131004333496, "Pretrain/Loss (Raw)": 1.7774090766906738, "Pretrain/Step": 7198, "Pretrain/Step Time": 8.52500743791461} +{"Pretrain/Learning Rate": 7.474560482553125e-06, "Pretrain/Loss": 2.0113487243652344, "Pretrain/Loss (Raw)": 2.2348177433013916, "Pretrain/Step": 7199, "Pretrain/Step Time": 8.517995012924075} +{"Pretrain/Learning Rate": 7.468506991221599e-06, "Pretrain/Loss": 2.011267900466919, "Pretrain/Loss (Raw)": 2.0645253658294678, "Pretrain/Step": 7200, "Pretrain/Step Time": 8.510788215324283} +{"Pretrain/Learning Rate": 7.462455521704448e-06, "Pretrain/Loss": 2.0135035514831543, "Pretrain/Loss (Raw)": 2.1669323444366455, "Pretrain/Step": 7201, "Pretrain/Step Time": 8.510925520211458} +{"Pretrain/Learning Rate": 7.4564060746995765e-06, "Pretrain/Loss": 2.015873670578003, "Pretrain/Loss (Raw)": 2.2152247428894043, "Pretrain/Step": 7202, "Pretrain/Step Time": 8.5206917244941} +{"Pretrain/Learning Rate": 7.450358650904621e-06, "Pretrain/Loss": 2.013244152069092, "Pretrain/Loss (Raw)": 1.7004497051239014, "Pretrain/Step": 7203, "Pretrain/Step Time": 8.5203100964427} +{"Pretrain/Learning Rate": 7.444313251017004e-06, "Pretrain/Loss": 2.008347511291504, "Pretrain/Loss (Raw)": 1.459174394607544, "Pretrain/Step": 7204, "Pretrain/Step Time": 8.51883827149868} +{"Pretrain/Learning Rate": 7.438269875733903e-06, "Pretrain/Loss": 2.0111966133117676, "Pretrain/Loss (Raw)": 2.0308778285980225, "Pretrain/Step": 7205, "Pretrain/Step Time": 8.512618158012629} +{"Pretrain/Learning Rate": 7.432228525752277e-06, "Pretrain/Loss": 2.011176347732544, "Pretrain/Loss (Raw)": 1.9992783069610596, "Pretrain/Step": 7206, "Pretrain/Step Time": 8.51473419368267} +{"Pretrain/Learning Rate": 7.426189201768844e-06, "Pretrain/Loss": 2.0117645263671875, "Pretrain/Loss (Raw)": 2.093017101287842, "Pretrain/Step": 7207, "Pretrain/Step Time": 8.51656568609178} +{"Pretrain/Learning Rate": 7.42015190448008e-06, "Pretrain/Loss": 2.013550281524658, "Pretrain/Loss (Raw)": 1.9853756427764893, "Pretrain/Step": 7208, "Pretrain/Step Time": 8.520422641187906} +{"Pretrain/Learning Rate": 7.4141166345822274e-06, "Pretrain/Loss": 2.010496139526367, "Pretrain/Loss (Raw)": 1.6122074127197266, "Pretrain/Step": 7209, "Pretrain/Step Time": 8.52227451466024} +{"Pretrain/Learning Rate": 7.408083392771323e-06, "Pretrain/Loss": 2.0085325241088867, "Pretrain/Loss (Raw)": 1.7924867868423462, "Pretrain/Step": 7210, "Pretrain/Step Time": 8.521927565336227} +{"Pretrain/Learning Rate": 7.402052179743135e-06, "Pretrain/Loss": 2.0075714588165283, "Pretrain/Loss (Raw)": 1.9996806383132935, "Pretrain/Step": 7211, "Pretrain/Step Time": 8.511853897944093} +{"Pretrain/Learning Rate": 7.396022996193217e-06, "Pretrain/Loss": 2.0074422359466553, "Pretrain/Loss (Raw)": 2.06479549407959, "Pretrain/Step": 7212, "Pretrain/Step Time": 8.51370308920741} +{"Pretrain/Learning Rate": 7.389995842816871e-06, "Pretrain/Loss": 2.008655548095703, "Pretrain/Loss (Raw)": 1.9808034896850586, "Pretrain/Step": 7213, "Pretrain/Step Time": 8.514615265652537} +{"Pretrain/Learning Rate": 7.383970720309191e-06, "Pretrain/Loss": 2.008443832397461, "Pretrain/Loss (Raw)": 2.048811197280884, "Pretrain/Step": 7214, "Pretrain/Step Time": 8.518582306802273} +{"Pretrain/Learning Rate": 7.37794762936502e-06, "Pretrain/Loss": 2.008697032928467, "Pretrain/Loss (Raw)": 2.0881383419036865, "Pretrain/Step": 7215, "Pretrain/Step Time": 8.51881244033575} +{"Pretrain/Learning Rate": 7.371926570678964e-06, "Pretrain/Loss": 2.0028016567230225, "Pretrain/Loss (Raw)": 1.84420907497406, "Pretrain/Step": 7216, "Pretrain/Step Time": 8.51764171756804} +{"Pretrain/Learning Rate": 7.365907544945397e-06, "Pretrain/Loss": 2.0025782585144043, "Pretrain/Loss (Raw)": 2.0138628482818604, "Pretrain/Step": 7217, "Pretrain/Step Time": 8.513555951416492} +{"Pretrain/Learning Rate": 7.359890552858478e-06, "Pretrain/Loss": 2.001483917236328, "Pretrain/Loss (Raw)": 1.8008291721343994, "Pretrain/Step": 7218, "Pretrain/Step Time": 8.508380087092519} +{"Pretrain/Learning Rate": 7.353875595112092e-06, "Pretrain/Loss": 2.002197265625, "Pretrain/Loss (Raw)": 2.134653329849243, "Pretrain/Step": 7219, "Pretrain/Step Time": 8.513136200606823} +{"Pretrain/Learning Rate": 7.347862672399927e-06, "Pretrain/Loss": 2.0028634071350098, "Pretrain/Loss (Raw)": 1.9630584716796875, "Pretrain/Step": 7220, "Pretrain/Step Time": 8.51295955479145} +{"Pretrain/Learning Rate": 7.341851785415415e-06, "Pretrain/Loss": 2.0027010440826416, "Pretrain/Loss (Raw)": 2.196727752685547, "Pretrain/Step": 7221, "Pretrain/Step Time": 8.515676688402891} +{"Pretrain/Learning Rate": 7.335842934851775e-06, "Pretrain/Loss": 1.9991402626037598, "Pretrain/Loss (Raw)": 1.7828396558761597, "Pretrain/Step": 7222, "Pretrain/Step Time": 8.51499710418284} +{"Pretrain/Learning Rate": 7.329836121401951e-06, "Pretrain/Loss": 1.9984924793243408, "Pretrain/Loss (Raw)": 1.92964768409729, "Pretrain/Step": 7223, "Pretrain/Step Time": 8.503284549340606} +{"Pretrain/Learning Rate": 7.323831345758697e-06, "Pretrain/Loss": 1.998343586921692, "Pretrain/Loss (Raw)": 1.9150317907333374, "Pretrain/Step": 7224, "Pretrain/Step Time": 8.504625178873539} +{"Pretrain/Learning Rate": 7.317828608614496e-06, "Pretrain/Loss": 1.9986605644226074, "Pretrain/Loss (Raw)": 1.8930217027664185, "Pretrain/Step": 7225, "Pretrain/Step Time": 8.513079673051834} +{"Pretrain/Learning Rate": 7.311827910661639e-06, "Pretrain/Loss": 1.9992960691452026, "Pretrain/Loss (Raw)": 1.9917608499526978, "Pretrain/Step": 7226, "Pretrain/Step Time": 8.519266409799457} +{"Pretrain/Learning Rate": 7.3058292525921195e-06, "Pretrain/Loss": 1.9989080429077148, "Pretrain/Loss (Raw)": 1.700717806816101, "Pretrain/Step": 7227, "Pretrain/Step Time": 8.517690189182758} +{"Pretrain/Learning Rate": 7.299832635097756e-06, "Pretrain/Loss": 2.003465175628662, "Pretrain/Loss (Raw)": 2.455368757247925, "Pretrain/Step": 7228, "Pretrain/Step Time": 8.519165312871337} +{"Pretrain/Learning Rate": 7.293838058870098e-06, "Pretrain/Loss": 2.0029349327087402, "Pretrain/Loss (Raw)": 1.990559458732605, "Pretrain/Step": 7229, "Pretrain/Step Time": 8.510384684428573} +{"Pretrain/Learning Rate": 7.2878455246004704e-06, "Pretrain/Loss": 2.003612995147705, "Pretrain/Loss (Raw)": 2.1862378120422363, "Pretrain/Step": 7230, "Pretrain/Step Time": 8.514591654762626} +{"Pretrain/Learning Rate": 7.281855032979954e-06, "Pretrain/Loss": 2.003873825073242, "Pretrain/Loss (Raw)": 1.979671835899353, "Pretrain/Step": 7231, "Pretrain/Step Time": 8.518896501511335} +{"Pretrain/Learning Rate": 7.275866584699409e-06, "Pretrain/Loss": 2.0022549629211426, "Pretrain/Loss (Raw)": 1.8078460693359375, "Pretrain/Step": 7232, "Pretrain/Step Time": 8.528922593221068} +{"Pretrain/Learning Rate": 7.269880180449451e-06, "Pretrain/Loss": 2.004573345184326, "Pretrain/Loss (Raw)": 2.15494704246521, "Pretrain/Step": 7233, "Pretrain/Step Time": 8.530074167996645} +{"Pretrain/Learning Rate": 7.263895820920458e-06, "Pretrain/Loss": 2.0049595832824707, "Pretrain/Loss (Raw)": 2.280959129333496, "Pretrain/Step": 7234, "Pretrain/Step Time": 8.525231916457415} +{"Pretrain/Learning Rate": 7.257913506802566e-06, "Pretrain/Loss": 2.0043952465057373, "Pretrain/Loss (Raw)": 1.8214282989501953, "Pretrain/Step": 7235, "Pretrain/Step Time": 8.525528771802783} +{"Pretrain/Learning Rate": 7.251933238785699e-06, "Pretrain/Loss": 2.0025525093078613, "Pretrain/Loss (Raw)": 1.9010261297225952, "Pretrain/Step": 7236, "Pretrain/Step Time": 8.523584241047502} +{"Pretrain/Learning Rate": 7.245955017559522e-06, "Pretrain/Loss": 2.0024263858795166, "Pretrain/Loss (Raw)": 2.0438363552093506, "Pretrain/Step": 7237, "Pretrain/Step Time": 8.52641512453556} +{"Pretrain/Learning Rate": 7.2399788438134665e-06, "Pretrain/Loss": 2.0027809143066406, "Pretrain/Loss (Raw)": 2.2303197383880615, "Pretrain/Step": 7238, "Pretrain/Step Time": 8.528656788170338} +{"Pretrain/Learning Rate": 7.234004718236745e-06, "Pretrain/Loss": 2.0031800270080566, "Pretrain/Loss (Raw)": 1.9163405895233154, "Pretrain/Step": 7239, "Pretrain/Step Time": 8.536698611453176} +{"Pretrain/Learning Rate": 7.228032641518315e-06, "Pretrain/Loss": 2.0036754608154297, "Pretrain/Loss (Raw)": 1.9109500646591187, "Pretrain/Step": 7240, "Pretrain/Step Time": 8.530288005247712} +{"Pretrain/Learning Rate": 7.222062614346906e-06, "Pretrain/Loss": 2.003729820251465, "Pretrain/Loss (Raw)": 2.072697401046753, "Pretrain/Step": 7241, "Pretrain/Step Time": 8.527984181419015} +{"Pretrain/Learning Rate": 7.216094637411e-06, "Pretrain/Loss": 2.0046181678771973, "Pretrain/Loss (Raw)": 1.9666787385940552, "Pretrain/Step": 7242, "Pretrain/Step Time": 8.523444287478924} +{"Pretrain/Learning Rate": 7.21012871139887e-06, "Pretrain/Loss": 2.0043749809265137, "Pretrain/Loss (Raw)": 1.975163221359253, "Pretrain/Step": 7243, "Pretrain/Step Time": 8.521876929327846} +{"Pretrain/Learning Rate": 7.204164836998523e-06, "Pretrain/Loss": 2.003167152404785, "Pretrain/Loss (Raw)": 1.846888780593872, "Pretrain/Step": 7244, "Pretrain/Step Time": 8.533274440094829} +{"Pretrain/Learning Rate": 7.1982030148977474e-06, "Pretrain/Loss": 2.002863645553589, "Pretrain/Loss (Raw)": 1.9338407516479492, "Pretrain/Step": 7245, "Pretrain/Step Time": 8.534670012071729} +{"Pretrain/Learning Rate": 7.192243245784075e-06, "Pretrain/Loss": 2.001936674118042, "Pretrain/Loss (Raw)": 1.9895027875900269, "Pretrain/Step": 7246, "Pretrain/Step Time": 8.528271855786443} +{"Pretrain/Learning Rate": 7.186285530344833e-06, "Pretrain/Loss": 1.999467134475708, "Pretrain/Loss (Raw)": 1.781545639038086, "Pretrain/Step": 7247, "Pretrain/Step Time": 8.52697136811912} +{"Pretrain/Learning Rate": 7.1803298692670825e-06, "Pretrain/Loss": 2.000629425048828, "Pretrain/Loss (Raw)": 2.1271440982818604, "Pretrain/Step": 7248, "Pretrain/Step Time": 8.520991815254092} +{"Pretrain/Learning Rate": 7.174376263237664e-06, "Pretrain/Loss": 2.0021634101867676, "Pretrain/Loss (Raw)": 2.2071187496185303, "Pretrain/Step": 7249, "Pretrain/Step Time": 8.5316880941391} +{"Pretrain/Learning Rate": 7.1684247129431616e-06, "Pretrain/Loss": 2.00315523147583, "Pretrain/Loss (Raw)": 1.9635940790176392, "Pretrain/Step": 7250, "Pretrain/Step Time": 8.540003828704357} +{"Pretrain/Learning Rate": 7.162475219069956e-06, "Pretrain/Loss": 2.004647731781006, "Pretrain/Loss (Raw)": 2.023528814315796, "Pretrain/Step": 7251, "Pretrain/Step Time": 8.540048390626907} +{"Pretrain/Learning Rate": 7.1565277823041596e-06, "Pretrain/Loss": 2.0072107315063477, "Pretrain/Loss (Raw)": 2.068915605545044, "Pretrain/Step": 7252, "Pretrain/Step Time": 8.530220346525311} +{"Pretrain/Learning Rate": 7.1505824033316596e-06, "Pretrain/Loss": 2.0071659088134766, "Pretrain/Loss (Raw)": 1.829902172088623, "Pretrain/Step": 7253, "Pretrain/Step Time": 8.519006859511137} +{"Pretrain/Learning Rate": 7.1446390828381e-06, "Pretrain/Loss": 2.0055360794067383, "Pretrain/Loss (Raw)": 2.016083002090454, "Pretrain/Step": 7254, "Pretrain/Step Time": 8.519030153751373} +{"Pretrain/Learning Rate": 7.138697821508908e-06, "Pretrain/Loss": 2.004934310913086, "Pretrain/Loss (Raw)": 2.0674331188201904, "Pretrain/Step": 7255, "Pretrain/Step Time": 8.522950867190957} +{"Pretrain/Learning Rate": 7.132758620029248e-06, "Pretrain/Loss": 2.003387451171875, "Pretrain/Loss (Raw)": 2.025622844696045, "Pretrain/Step": 7256, "Pretrain/Step Time": 8.520039262250066} +{"Pretrain/Learning Rate": 7.126821479084056e-06, "Pretrain/Loss": 2.0021469593048096, "Pretrain/Loss (Raw)": 1.9859213829040527, "Pretrain/Step": 7257, "Pretrain/Step Time": 8.523260464891791} +{"Pretrain/Learning Rate": 7.120886399358023e-06, "Pretrain/Loss": 2.001716136932373, "Pretrain/Loss (Raw)": 2.007406711578369, "Pretrain/Step": 7258, "Pretrain/Step Time": 8.520999746397138} +{"Pretrain/Learning Rate": 7.114953381535627e-06, "Pretrain/Loss": 2.0032176971435547, "Pretrain/Loss (Raw)": 2.223964214324951, "Pretrain/Step": 7259, "Pretrain/Step Time": 8.515251871198416} +{"Pretrain/Learning Rate": 7.109022426301087e-06, "Pretrain/Loss": 2.003786563873291, "Pretrain/Loss (Raw)": 2.0526504516601562, "Pretrain/Step": 7260, "Pretrain/Step Time": 8.518237175419927} +{"Pretrain/Learning Rate": 7.103093534338384e-06, "Pretrain/Loss": 2.0037825107574463, "Pretrain/Loss (Raw)": 1.9402471780776978, "Pretrain/Step": 7261, "Pretrain/Step Time": 8.52241887897253} +{"Pretrain/Learning Rate": 7.0971667063312624e-06, "Pretrain/Loss": 2.0039544105529785, "Pretrain/Loss (Raw)": 2.3334856033325195, "Pretrain/Step": 7262, "Pretrain/Step Time": 8.520009063184261} +{"Pretrain/Learning Rate": 7.091241942963251e-06, "Pretrain/Loss": 2.00518798828125, "Pretrain/Loss (Raw)": 1.9698643684387207, "Pretrain/Step": 7263, "Pretrain/Step Time": 8.526305563747883} +{"Pretrain/Learning Rate": 7.0853192449175905e-06, "Pretrain/Loss": 2.0079100131988525, "Pretrain/Loss (Raw)": 2.0212182998657227, "Pretrain/Step": 7264, "Pretrain/Step Time": 8.521731417626143} +{"Pretrain/Learning Rate": 7.0793986128773415e-06, "Pretrain/Loss": 2.0064644813537598, "Pretrain/Loss (Raw)": 1.9355535507202148, "Pretrain/Step": 7265, "Pretrain/Step Time": 8.51761108636856} +{"Pretrain/Learning Rate": 7.07348004752528e-06, "Pretrain/Loss": 2.0081677436828613, "Pretrain/Loss (Raw)": 2.106564998626709, "Pretrain/Step": 7266, "Pretrain/Step Time": 8.520397650077939} +{"Pretrain/Learning Rate": 7.067563549543987e-06, "Pretrain/Loss": 2.0079822540283203, "Pretrain/Loss (Raw)": 1.9824581146240234, "Pretrain/Step": 7267, "Pretrain/Step Time": 8.524498693645} +{"Pretrain/Learning Rate": 7.061649119615752e-06, "Pretrain/Loss": 2.0061089992523193, "Pretrain/Loss (Raw)": 1.8269017934799194, "Pretrain/Step": 7268, "Pretrain/Step Time": 8.528171053156257} +{"Pretrain/Learning Rate": 7.055736758422676e-06, "Pretrain/Loss": 2.0069663524627686, "Pretrain/Loss (Raw)": 2.065168619155884, "Pretrain/Step": 7269, "Pretrain/Step Time": 8.5283387247473} +{"Pretrain/Learning Rate": 7.049826466646592e-06, "Pretrain/Loss": 2.007462501525879, "Pretrain/Loss (Raw)": 2.0001280307769775, "Pretrain/Step": 7270, "Pretrain/Step Time": 8.519136682152748} +{"Pretrain/Learning Rate": 7.043918244969106e-06, "Pretrain/Loss": 2.0078177452087402, "Pretrain/Loss (Raw)": 2.0773539543151855, "Pretrain/Step": 7271, "Pretrain/Step Time": 8.517704805359244} +{"Pretrain/Learning Rate": 7.038012094071572e-06, "Pretrain/Loss": 2.006592273712158, "Pretrain/Loss (Raw)": 1.9919557571411133, "Pretrain/Step": 7272, "Pretrain/Step Time": 8.522886967286468} +{"Pretrain/Learning Rate": 7.032108014635128e-06, "Pretrain/Loss": 2.0063817501068115, "Pretrain/Loss (Raw)": 2.006047248840332, "Pretrain/Step": 7273, "Pretrain/Step Time": 8.526909222826362} +{"Pretrain/Learning Rate": 7.026206007340658e-06, "Pretrain/Loss": 2.0100011825561523, "Pretrain/Loss (Raw)": 2.1632437705993652, "Pretrain/Step": 7274, "Pretrain/Step Time": 8.52656303346157} +{"Pretrain/Learning Rate": 7.020306072868804e-06, "Pretrain/Loss": 2.007432460784912, "Pretrain/Loss (Raw)": 1.866649866104126, "Pretrain/Step": 7275, "Pretrain/Step Time": 8.529667653143406} +{"Pretrain/Learning Rate": 7.014408211899973e-06, "Pretrain/Loss": 2.006822347640991, "Pretrain/Loss (Raw)": 1.8258638381958008, "Pretrain/Step": 7276, "Pretrain/Step Time": 8.521669005975127} +{"Pretrain/Learning Rate": 7.008512425114333e-06, "Pretrain/Loss": 2.008445978164673, "Pretrain/Loss (Raw)": 2.104194402694702, "Pretrain/Step": 7277, "Pretrain/Step Time": 8.519340824335814} +{"Pretrain/Learning Rate": 7.002618713191839e-06, "Pretrain/Loss": 2.008141040802002, "Pretrain/Loss (Raw)": 1.9125518798828125, "Pretrain/Step": 7278, "Pretrain/Step Time": 8.51675744727254} +{"Pretrain/Learning Rate": 6.996727076812143e-06, "Pretrain/Loss": 2.0088284015655518, "Pretrain/Loss (Raw)": 2.1128952503204346, "Pretrain/Step": 7279, "Pretrain/Step Time": 8.51749244518578} +{"Pretrain/Learning Rate": 6.990837516654722e-06, "Pretrain/Loss": 2.0065152645111084, "Pretrain/Loss (Raw)": 1.7035902738571167, "Pretrain/Step": 7280, "Pretrain/Step Time": 8.520723236724734} +{"Pretrain/Learning Rate": 6.984950033398782e-06, "Pretrain/Loss": 2.006053924560547, "Pretrain/Loss (Raw)": 2.0326852798461914, "Pretrain/Step": 7281, "Pretrain/Step Time": 8.52657556347549} +{"Pretrain/Learning Rate": 6.979064627723292e-06, "Pretrain/Loss": 2.0048680305480957, "Pretrain/Loss (Raw)": 1.9477548599243164, "Pretrain/Step": 7282, "Pretrain/Step Time": 8.521078240126371} +{"Pretrain/Learning Rate": 6.97318130030698e-06, "Pretrain/Loss": 2.0052378177642822, "Pretrain/Loss (Raw)": 2.0894672870635986, "Pretrain/Step": 7283, "Pretrain/Step Time": 8.515444535762072} +{"Pretrain/Learning Rate": 6.967300051828355e-06, "Pretrain/Loss": 2.0058982372283936, "Pretrain/Loss (Raw)": 2.141160488128662, "Pretrain/Step": 7284, "Pretrain/Step Time": 8.517224190756679} +{"Pretrain/Learning Rate": 6.961420882965661e-06, "Pretrain/Loss": 2.0105133056640625, "Pretrain/Loss (Raw)": 2.379596710205078, "Pretrain/Step": 7285, "Pretrain/Step Time": 8.522243170067668} +{"Pretrain/Learning Rate": 6.9555437943969095e-06, "Pretrain/Loss": 2.006526231765747, "Pretrain/Loss (Raw)": 1.7901982069015503, "Pretrain/Step": 7286, "Pretrain/Step Time": 8.527151990681887} +{"Pretrain/Learning Rate": 6.949668786799867e-06, "Pretrain/Loss": 2.0067973136901855, "Pretrain/Loss (Raw)": 2.1138837337493896, "Pretrain/Step": 7287, "Pretrain/Step Time": 8.520683862268925} +{"Pretrain/Learning Rate": 6.943795860852087e-06, "Pretrain/Loss": 2.008582353591919, "Pretrain/Loss (Raw)": 2.0739917755126953, "Pretrain/Step": 7288, "Pretrain/Step Time": 8.512047108262777} +{"Pretrain/Learning Rate": 6.937925017230848e-06, "Pretrain/Loss": 2.0098400115966797, "Pretrain/Loss (Raw)": 2.1435189247131348, "Pretrain/Step": 7289, "Pretrain/Step Time": 8.51382715627551} +{"Pretrain/Learning Rate": 6.932056256613209e-06, "Pretrain/Loss": 2.008605480194092, "Pretrain/Loss (Raw)": 2.075191020965576, "Pretrain/Step": 7290, "Pretrain/Step Time": 8.519481858238578} +{"Pretrain/Learning Rate": 6.926189579675977e-06, "Pretrain/Loss": 2.0087497234344482, "Pretrain/Loss (Raw)": 2.0571951866149902, "Pretrain/Step": 7291, "Pretrain/Step Time": 8.520639630034566} +{"Pretrain/Learning Rate": 6.920324987095733e-06, "Pretrain/Loss": 2.0082781314849854, "Pretrain/Loss (Raw)": 1.984915018081665, "Pretrain/Step": 7292, "Pretrain/Step Time": 8.523971170186996} +{"Pretrain/Learning Rate": 6.914462479548806e-06, "Pretrain/Loss": 2.009125232696533, "Pretrain/Loss (Raw)": 2.115952730178833, "Pretrain/Step": 7293, "Pretrain/Step Time": 8.517400434240699} +{"Pretrain/Learning Rate": 6.908602057711289e-06, "Pretrain/Loss": 2.0106852054595947, "Pretrain/Loss (Raw)": 2.4147603511810303, "Pretrain/Step": 7294, "Pretrain/Step Time": 8.513511311262846} +{"Pretrain/Learning Rate": 6.902743722259025e-06, "Pretrain/Loss": 2.011202812194824, "Pretrain/Loss (Raw)": 2.0159285068511963, "Pretrain/Step": 7295, "Pretrain/Step Time": 8.509726708754897} +{"Pretrain/Learning Rate": 6.8968874738676385e-06, "Pretrain/Loss": 2.0137970447540283, "Pretrain/Loss (Raw)": 2.0913453102111816, "Pretrain/Step": 7296, "Pretrain/Step Time": 8.509107096120715} +{"Pretrain/Learning Rate": 6.891033313212494e-06, "Pretrain/Loss": 2.0129809379577637, "Pretrain/Loss (Raw)": 1.7806429862976074, "Pretrain/Step": 7297, "Pretrain/Step Time": 8.51645790785551} +{"Pretrain/Learning Rate": 6.885181240968719e-06, "Pretrain/Loss": 2.011874198913574, "Pretrain/Loss (Raw)": 1.861849308013916, "Pretrain/Step": 7298, "Pretrain/Step Time": 8.511980265378952} +{"Pretrain/Learning Rate": 6.879331257811195e-06, "Pretrain/Loss": 2.0124902725219727, "Pretrain/Loss (Raw)": 2.076078414916992, "Pretrain/Step": 7299, "Pretrain/Step Time": 8.50166897289455} +{"Pretrain/Learning Rate": 6.873483364414588e-06, "Pretrain/Loss": 2.0129947662353516, "Pretrain/Loss (Raw)": 1.935032606124878, "Pretrain/Step": 7300, "Pretrain/Step Time": 8.50267625041306} +{"Pretrain/Learning Rate": 6.867637561453291e-06, "Pretrain/Loss": 2.010650634765625, "Pretrain/Loss (Raw)": 1.7634506225585938, "Pretrain/Step": 7301, "Pretrain/Step Time": 8.500589035451412} +{"Pretrain/Learning Rate": 6.861793849601475e-06, "Pretrain/Loss": 2.011720657348633, "Pretrain/Loss (Raw)": 1.8837413787841797, "Pretrain/Step": 7302, "Pretrain/Step Time": 8.505940413102508} +{"Pretrain/Learning Rate": 6.855952229533055e-06, "Pretrain/Loss": 2.01100492477417, "Pretrain/Loss (Raw)": 1.929275393486023, "Pretrain/Step": 7303, "Pretrain/Step Time": 8.511142563074827} +{"Pretrain/Learning Rate": 6.8501127019217346e-06, "Pretrain/Loss": 2.013054370880127, "Pretrain/Loss (Raw)": 2.5248606204986572, "Pretrain/Step": 7304, "Pretrain/Step Time": 8.515379220247269} +{"Pretrain/Learning Rate": 6.844275267440931e-06, "Pretrain/Loss": 2.0147812366485596, "Pretrain/Loss (Raw)": 2.3509576320648193, "Pretrain/Step": 7305, "Pretrain/Step Time": 8.506770828738809} +{"Pretrain/Learning Rate": 6.838439926763859e-06, "Pretrain/Loss": 2.017024517059326, "Pretrain/Loss (Raw)": 2.1611204147338867, "Pretrain/Step": 7306, "Pretrain/Step Time": 8.507058249786496} +{"Pretrain/Learning Rate": 6.832606680563472e-06, "Pretrain/Loss": 2.0152478218078613, "Pretrain/Loss (Raw)": 1.9286813735961914, "Pretrain/Step": 7307, "Pretrain/Step Time": 8.503264470025897} +{"Pretrain/Learning Rate": 6.8267755295125024e-06, "Pretrain/Loss": 2.0144739151000977, "Pretrain/Loss (Raw)": 2.0235369205474854, "Pretrain/Step": 7308, "Pretrain/Step Time": 8.503023356199265} +{"Pretrain/Learning Rate": 6.820946474283399e-06, "Pretrain/Loss": 2.0119383335113525, "Pretrain/Loss (Raw)": 1.9810576438903809, "Pretrain/Step": 7309, "Pretrain/Step Time": 8.513549640774727} +{"Pretrain/Learning Rate": 6.815119515548418e-06, "Pretrain/Loss": 2.009585380554199, "Pretrain/Loss (Raw)": 1.807178258895874, "Pretrain/Step": 7310, "Pretrain/Step Time": 8.522263927385211} +{"Pretrain/Learning Rate": 6.809294653979545e-06, "Pretrain/Loss": 2.0110647678375244, "Pretrain/Loss (Raw)": 2.229872941970825, "Pretrain/Step": 7311, "Pretrain/Step Time": 8.525579120963812} +{"Pretrain/Learning Rate": 6.803471890248531e-06, "Pretrain/Loss": 2.0111587047576904, "Pretrain/Loss (Raw)": 2.127678155899048, "Pretrain/Step": 7312, "Pretrain/Step Time": 8.517424862831831} +{"Pretrain/Learning Rate": 6.797651225026874e-06, "Pretrain/Loss": 2.01129150390625, "Pretrain/Loss (Raw)": 2.141155242919922, "Pretrain/Step": 7313, "Pretrain/Step Time": 8.515129631385207} +{"Pretrain/Learning Rate": 6.791832658985859e-06, "Pretrain/Loss": 2.011007308959961, "Pretrain/Loss (Raw)": 1.9372979402542114, "Pretrain/Step": 7314, "Pretrain/Step Time": 8.52254930883646} +{"Pretrain/Learning Rate": 6.786016192796499e-06, "Pretrain/Loss": 2.010751724243164, "Pretrain/Loss (Raw)": 2.1088922023773193, "Pretrain/Step": 7315, "Pretrain/Step Time": 8.527114590629935} +{"Pretrain/Learning Rate": 6.7802018271295815e-06, "Pretrain/Loss": 2.01174259185791, "Pretrain/Loss (Raw)": 2.011273145675659, "Pretrain/Step": 7316, "Pretrain/Step Time": 8.524059472605586} +{"Pretrain/Learning Rate": 6.774389562655634e-06, "Pretrain/Loss": 2.0113205909729004, "Pretrain/Loss (Raw)": 2.0206146240234375, "Pretrain/Step": 7317, "Pretrain/Step Time": 8.529468074440956} +{"Pretrain/Learning Rate": 6.768579400044966e-06, "Pretrain/Loss": 2.0090150833129883, "Pretrain/Loss (Raw)": 1.8590744733810425, "Pretrain/Step": 7318, "Pretrain/Step Time": 8.517953025177121} +{"Pretrain/Learning Rate": 6.762771339967644e-06, "Pretrain/Loss": 2.00765323638916, "Pretrain/Loss (Raw)": 1.8514904975891113, "Pretrain/Step": 7319, "Pretrain/Step Time": 8.522360322996974} +{"Pretrain/Learning Rate": 6.756965383093455e-06, "Pretrain/Loss": 2.010526180267334, "Pretrain/Loss (Raw)": 2.534013271331787, "Pretrain/Step": 7320, "Pretrain/Step Time": 8.527442764490843} +{"Pretrain/Learning Rate": 6.751161530091988e-06, "Pretrain/Loss": 2.0134034156799316, "Pretrain/Loss (Raw)": 2.360248327255249, "Pretrain/Step": 7321, "Pretrain/Step Time": 8.53298637084663} +{"Pretrain/Learning Rate": 6.745359781632565e-06, "Pretrain/Loss": 2.0132944583892822, "Pretrain/Loss (Raw)": 2.1422882080078125, "Pretrain/Step": 7322, "Pretrain/Step Time": 8.533558959141374} +{"Pretrain/Learning Rate": 6.739560138384271e-06, "Pretrain/Loss": 2.016716480255127, "Pretrain/Loss (Raw)": 2.019569158554077, "Pretrain/Step": 7323, "Pretrain/Step Time": 8.534946847707033} +{"Pretrain/Learning Rate": 6.733762601015942e-06, "Pretrain/Loss": 2.017958879470825, "Pretrain/Loss (Raw)": 2.09505558013916, "Pretrain/Step": 7324, "Pretrain/Step Time": 8.534221919253469} +{"Pretrain/Learning Rate": 6.727967170196186e-06, "Pretrain/Loss": 2.0167245864868164, "Pretrain/Loss (Raw)": 1.9558119773864746, "Pretrain/Step": 7325, "Pretrain/Step Time": 8.528676433488727} +{"Pretrain/Learning Rate": 6.72217384659336e-06, "Pretrain/Loss": 2.018488645553589, "Pretrain/Loss (Raw)": 2.0032155513763428, "Pretrain/Step": 7326, "Pretrain/Step Time": 8.535157414153218} +{"Pretrain/Learning Rate": 6.7163826308755725e-06, "Pretrain/Loss": 2.0162222385406494, "Pretrain/Loss (Raw)": 1.9447232484817505, "Pretrain/Step": 7327, "Pretrain/Step Time": 8.538200218230486} +{"Pretrain/Learning Rate": 6.7105935237106895e-06, "Pretrain/Loss": 2.0161659717559814, "Pretrain/Loss (Raw)": 2.0573225021362305, "Pretrain/Step": 7328, "Pretrain/Step Time": 8.53829468600452} +{"Pretrain/Learning Rate": 6.704806525766353e-06, "Pretrain/Loss": 2.0154032707214355, "Pretrain/Loss (Raw)": 2.069284200668335, "Pretrain/Step": 7329, "Pretrain/Step Time": 8.537196358665824} +{"Pretrain/Learning Rate": 6.699021637709935e-06, "Pretrain/Loss": 2.0136241912841797, "Pretrain/Loss (Raw)": 1.9875342845916748, "Pretrain/Step": 7330, "Pretrain/Step Time": 8.526719719171524} +{"Pretrain/Learning Rate": 6.693238860208578e-06, "Pretrain/Loss": 2.015486717224121, "Pretrain/Loss (Raw)": 1.9388506412506104, "Pretrain/Step": 7331, "Pretrain/Step Time": 8.525875519961119} +{"Pretrain/Learning Rate": 6.687458193929172e-06, "Pretrain/Loss": 2.020534038543701, "Pretrain/Loss (Raw)": 2.1052322387695312, "Pretrain/Step": 7332, "Pretrain/Step Time": 8.529545664787292} +{"Pretrain/Learning Rate": 6.681679639538388e-06, "Pretrain/Loss": 2.020850896835327, "Pretrain/Loss (Raw)": 2.071420431137085, "Pretrain/Step": 7333, "Pretrain/Step Time": 8.53595951013267} +{"Pretrain/Learning Rate": 6.675903197702627e-06, "Pretrain/Loss": 2.0224549770355225, "Pretrain/Loss (Raw)": 2.204615592956543, "Pretrain/Step": 7334, "Pretrain/Step Time": 8.534540450200438} +{"Pretrain/Learning Rate": 6.6701288690880545e-06, "Pretrain/Loss": 2.0242197513580322, "Pretrain/Loss (Raw)": 2.3188982009887695, "Pretrain/Step": 7335, "Pretrain/Step Time": 8.534476548433304} +{"Pretrain/Learning Rate": 6.664356654360588e-06, "Pretrain/Loss": 2.0241336822509766, "Pretrain/Loss (Raw)": 1.9743353128433228, "Pretrain/Step": 7336, "Pretrain/Step Time": 8.524314496666193} +{"Pretrain/Learning Rate": 6.658586554185916e-06, "Pretrain/Loss": 2.0277154445648193, "Pretrain/Loss (Raw)": 2.0706915855407715, "Pretrain/Step": 7337, "Pretrain/Step Time": 8.522855820134282} +{"Pretrain/Learning Rate": 6.652818569229474e-06, "Pretrain/Loss": 2.0306107997894287, "Pretrain/Loss (Raw)": 2.1631054878234863, "Pretrain/Step": 7338, "Pretrain/Step Time": 8.532080963253975} +{"Pretrain/Learning Rate": 6.647052700156447e-06, "Pretrain/Loss": 2.0300958156585693, "Pretrain/Loss (Raw)": 1.933754801750183, "Pretrain/Step": 7339, "Pretrain/Step Time": 8.53725559823215} +{"Pretrain/Learning Rate": 6.6412889476317765e-06, "Pretrain/Loss": 2.0305962562561035, "Pretrain/Loss (Raw)": 2.1288483142852783, "Pretrain/Step": 7340, "Pretrain/Step Time": 8.53676282428205} +{"Pretrain/Learning Rate": 6.635527312320183e-06, "Pretrain/Loss": 2.031601905822754, "Pretrain/Loss (Raw)": 2.1095287799835205, "Pretrain/Step": 7341, "Pretrain/Step Time": 8.536341177299619} +{"Pretrain/Learning Rate": 6.629767794886116e-06, "Pretrain/Loss": 2.0314910411834717, "Pretrain/Loss (Raw)": 2.0346169471740723, "Pretrain/Step": 7342, "Pretrain/Step Time": 8.539117524400353} +{"Pretrain/Learning Rate": 6.624010395993791e-06, "Pretrain/Loss": 2.0299291610717773, "Pretrain/Loss (Raw)": 1.8882049322128296, "Pretrain/Step": 7343, "Pretrain/Step Time": 8.53500852920115} +{"Pretrain/Learning Rate": 6.618255116307171e-06, "Pretrain/Loss": 2.030820369720459, "Pretrain/Loss (Raw)": 1.9583220481872559, "Pretrain/Step": 7344, "Pretrain/Step Time": 8.533722100779414} +{"Pretrain/Learning Rate": 6.61250195649e-06, "Pretrain/Loss": 2.029723644256592, "Pretrain/Loss (Raw)": 1.873454213142395, "Pretrain/Step": 7345, "Pretrain/Step Time": 8.539968706667423} +{"Pretrain/Learning Rate": 6.606750917205734e-06, "Pretrain/Loss": 2.0291733741760254, "Pretrain/Loss (Raw)": 1.7304129600524902, "Pretrain/Step": 7346, "Pretrain/Step Time": 8.541042605414987} +{"Pretrain/Learning Rate": 6.601001999117634e-06, "Pretrain/Loss": 2.0314579010009766, "Pretrain/Loss (Raw)": 2.4270710945129395, "Pretrain/Step": 7347, "Pretrain/Step Time": 8.537783475592732} +{"Pretrain/Learning Rate": 6.595255202888672e-06, "Pretrain/Loss": 2.0314669609069824, "Pretrain/Loss (Raw)": 1.9642139673233032, "Pretrain/Step": 7348, "Pretrain/Step Time": 8.538484198972583} +{"Pretrain/Learning Rate": 6.589510529181622e-06, "Pretrain/Loss": 2.0298054218292236, "Pretrain/Loss (Raw)": 1.9840307235717773, "Pretrain/Step": 7349, "Pretrain/Step Time": 8.535096552222967} +{"Pretrain/Learning Rate": 6.583767978658959e-06, "Pretrain/Loss": 2.0314769744873047, "Pretrain/Loss (Raw)": 1.996813178062439, "Pretrain/Step": 7350, "Pretrain/Step Time": 8.540351936593652} +{"Pretrain/Learning Rate": 6.578027551982957e-06, "Pretrain/Loss": 2.032121419906616, "Pretrain/Loss (Raw)": 2.0121355056762695, "Pretrain/Step": 7351, "Pretrain/Step Time": 8.54098760150373} +{"Pretrain/Learning Rate": 6.5722892498156165e-06, "Pretrain/Loss": 2.0345091819763184, "Pretrain/Loss (Raw)": 2.220665454864502, "Pretrain/Step": 7352, "Pretrain/Step Time": 8.536790838465095} +{"Pretrain/Learning Rate": 6.566553072818729e-06, "Pretrain/Loss": 2.0337929725646973, "Pretrain/Loss (Raw)": 1.8013381958007812, "Pretrain/Step": 7353, "Pretrain/Step Time": 8.530259173363447} +{"Pretrain/Learning Rate": 6.560819021653791e-06, "Pretrain/Loss": 2.0333056449890137, "Pretrain/Loss (Raw)": 1.9294184446334839, "Pretrain/Step": 7354, "Pretrain/Step Time": 8.528291836380959} +{"Pretrain/Learning Rate": 6.555087096982096e-06, "Pretrain/Loss": 2.035334587097168, "Pretrain/Loss (Raw)": 1.9603683948516846, "Pretrain/Step": 7355, "Pretrain/Step Time": 8.526070728898048} +{"Pretrain/Learning Rate": 6.549357299464673e-06, "Pretrain/Loss": 2.0327181816101074, "Pretrain/Loss (Raw)": 2.1204910278320312, "Pretrain/Step": 7356, "Pretrain/Step Time": 8.52839483693242} +{"Pretrain/Learning Rate": 6.54362962976231e-06, "Pretrain/Loss": 2.0328729152679443, "Pretrain/Loss (Raw)": 2.0103673934936523, "Pretrain/Step": 7357, "Pretrain/Step Time": 8.541142091155052} +{"Pretrain/Learning Rate": 6.5379040885355376e-06, "Pretrain/Loss": 2.0315678119659424, "Pretrain/Loss (Raw)": 2.0191831588745117, "Pretrain/Step": 7358, "Pretrain/Step Time": 8.53697419166565} +{"Pretrain/Learning Rate": 6.532180676444663e-06, "Pretrain/Loss": 2.0310420989990234, "Pretrain/Loss (Raw)": 1.9123605489730835, "Pretrain/Step": 7359, "Pretrain/Step Time": 8.534246290102601} +{"Pretrain/Learning Rate": 6.52645939414975e-06, "Pretrain/Loss": 2.032040596008301, "Pretrain/Loss (Raw)": 1.935671329498291, "Pretrain/Step": 7360, "Pretrain/Step Time": 8.525073694065213} +{"Pretrain/Learning Rate": 6.5207402423105775e-06, "Pretrain/Loss": 2.030290126800537, "Pretrain/Loss (Raw)": 1.9309076070785522, "Pretrain/Step": 7361, "Pretrain/Step Time": 8.520139588043094} +{"Pretrain/Learning Rate": 6.515023221586722e-06, "Pretrain/Loss": 2.026968002319336, "Pretrain/Loss (Raw)": 1.8557168245315552, "Pretrain/Step": 7362, "Pretrain/Step Time": 8.526474745944142} +{"Pretrain/Learning Rate": 6.5093083326374954e-06, "Pretrain/Loss": 2.0281999111175537, "Pretrain/Loss (Raw)": 1.9790964126586914, "Pretrain/Step": 7363, "Pretrain/Step Time": 8.518358564004302} +{"Pretrain/Learning Rate": 6.50359557612196e-06, "Pretrain/Loss": 2.028940439224243, "Pretrain/Loss (Raw)": 1.995830774307251, "Pretrain/Step": 7364, "Pretrain/Step Time": 8.525524662807584} +{"Pretrain/Learning Rate": 6.497884952698935e-06, "Pretrain/Loss": 2.0292205810546875, "Pretrain/Loss (Raw)": 2.0796608924865723, "Pretrain/Step": 7365, "Pretrain/Step Time": 8.517712578177452} +{"Pretrain/Learning Rate": 6.492176463027009e-06, "Pretrain/Loss": 2.027219295501709, "Pretrain/Loss (Raw)": 1.9741957187652588, "Pretrain/Step": 7366, "Pretrain/Step Time": 8.516508614644408} +{"Pretrain/Learning Rate": 6.486470107764505e-06, "Pretrain/Loss": 2.028730869293213, "Pretrain/Loss (Raw)": 2.109819173812866, "Pretrain/Step": 7367, "Pretrain/Step Time": 8.517036417499185} +{"Pretrain/Learning Rate": 6.480765887569506e-06, "Pretrain/Loss": 2.0297961235046387, "Pretrain/Loss (Raw)": 2.0472962856292725, "Pretrain/Step": 7368, "Pretrain/Step Time": 8.523241519927979} +{"Pretrain/Learning Rate": 6.475063803099846e-06, "Pretrain/Loss": 2.030599594116211, "Pretrain/Loss (Raw)": 2.175548791885376, "Pretrain/Step": 7369, "Pretrain/Step Time": 8.517154665663838} +{"Pretrain/Learning Rate": 6.469363855013125e-06, "Pretrain/Loss": 2.031200408935547, "Pretrain/Loss (Raw)": 2.043562412261963, "Pretrain/Step": 7370, "Pretrain/Step Time": 8.517015680670738} +{"Pretrain/Learning Rate": 6.463666043966685e-06, "Pretrain/Loss": 2.030665874481201, "Pretrain/Loss (Raw)": 1.9067230224609375, "Pretrain/Step": 7371, "Pretrain/Step Time": 8.51835085824132} +{"Pretrain/Learning Rate": 6.457970370617622e-06, "Pretrain/Loss": 2.031602382659912, "Pretrain/Loss (Raw)": 1.9668093919754028, "Pretrain/Step": 7372, "Pretrain/Step Time": 8.507769133895636} +{"Pretrain/Learning Rate": 6.452276835622781e-06, "Pretrain/Loss": 2.0324578285217285, "Pretrain/Loss (Raw)": 2.0433108806610107, "Pretrain/Step": 7373, "Pretrain/Step Time": 8.513055872172117} +{"Pretrain/Learning Rate": 6.446585439638783e-06, "Pretrain/Loss": 2.03371262550354, "Pretrain/Loss (Raw)": 2.150127410888672, "Pretrain/Step": 7374, "Pretrain/Step Time": 8.519623517990112} +{"Pretrain/Learning Rate": 6.440896183321979e-06, "Pretrain/Loss": 2.0351943969726562, "Pretrain/Loss (Raw)": 1.9712018966674805, "Pretrain/Step": 7375, "Pretrain/Step Time": 8.516761662438512} +{"Pretrain/Learning Rate": 6.435209067328479e-06, "Pretrain/Loss": 2.0332555770874023, "Pretrain/Loss (Raw)": 1.8789621591567993, "Pretrain/Step": 7376, "Pretrain/Step Time": 8.522866545245051} +{"Pretrain/Learning Rate": 6.429524092314143e-06, "Pretrain/Loss": 2.032081127166748, "Pretrain/Loss (Raw)": 2.056825876235962, "Pretrain/Step": 7377, "Pretrain/Step Time": 8.515918610617518} +{"Pretrain/Learning Rate": 6.423841258934604e-06, "Pretrain/Loss": 2.031881332397461, "Pretrain/Loss (Raw)": 1.9380314350128174, "Pretrain/Step": 7378, "Pretrain/Step Time": 8.50733538158238} +{"Pretrain/Learning Rate": 6.418160567845224e-06, "Pretrain/Loss": 2.0328001976013184, "Pretrain/Loss (Raw)": 2.141096353530884, "Pretrain/Step": 7379, "Pretrain/Step Time": 8.515541145578027} +{"Pretrain/Learning Rate": 6.412482019701127e-06, "Pretrain/Loss": 2.030944585800171, "Pretrain/Loss (Raw)": 1.8314142227172852, "Pretrain/Step": 7380, "Pretrain/Step Time": 8.521617885679007} +{"Pretrain/Learning Rate": 6.4068056151571855e-06, "Pretrain/Loss": 2.0315351486206055, "Pretrain/Loss (Raw)": 1.905498743057251, "Pretrain/Step": 7381, "Pretrain/Step Time": 8.52190301939845} +{"Pretrain/Learning Rate": 6.40113135486804e-06, "Pretrain/Loss": 2.0301332473754883, "Pretrain/Loss (Raw)": 1.8366222381591797, "Pretrain/Step": 7382, "Pretrain/Step Time": 8.517866007983685} +{"Pretrain/Learning Rate": 6.395459239488069e-06, "Pretrain/Loss": 2.0307888984680176, "Pretrain/Loss (Raw)": 2.151353359222412, "Pretrain/Step": 7383, "Pretrain/Step Time": 8.513098273426294} +{"Pretrain/Learning Rate": 6.389789269671403e-06, "Pretrain/Loss": 2.030599355697632, "Pretrain/Loss (Raw)": 2.001376152038574, "Pretrain/Step": 7384, "Pretrain/Step Time": 8.512856723740697} +{"Pretrain/Learning Rate": 6.384121446071928e-06, "Pretrain/Loss": 2.029439926147461, "Pretrain/Loss (Raw)": 1.8375005722045898, "Pretrain/Step": 7385, "Pretrain/Step Time": 8.510159390047193} +{"Pretrain/Learning Rate": 6.378455769343302e-06, "Pretrain/Loss": 2.029545307159424, "Pretrain/Loss (Raw)": 2.0209028720855713, "Pretrain/Step": 7386, "Pretrain/Step Time": 8.519276142120361} +{"Pretrain/Learning Rate": 6.372792240138891e-06, "Pretrain/Loss": 2.0278077125549316, "Pretrain/Loss (Raw)": 2.0015463829040527, "Pretrain/Step": 7387, "Pretrain/Step Time": 8.521936692297459} +{"Pretrain/Learning Rate": 6.3671308591118615e-06, "Pretrain/Loss": 2.0266900062561035, "Pretrain/Loss (Raw)": 1.909602403640747, "Pretrain/Step": 7388, "Pretrain/Step Time": 8.517554374411702} +{"Pretrain/Learning Rate": 6.361471626915091e-06, "Pretrain/Loss": 2.027719020843506, "Pretrain/Loss (Raw)": 2.071953296661377, "Pretrain/Step": 7389, "Pretrain/Step Time": 8.514097794890404} +{"Pretrain/Learning Rate": 6.355814544201258e-06, "Pretrain/Loss": 2.023575782775879, "Pretrain/Loss (Raw)": 1.8031669855117798, "Pretrain/Step": 7390, "Pretrain/Step Time": 8.512284079566598} +{"Pretrain/Learning Rate": 6.35015961162273e-06, "Pretrain/Loss": 2.0237998962402344, "Pretrain/Loss (Raw)": 1.9985301494598389, "Pretrain/Step": 7391, "Pretrain/Step Time": 8.507307408377528} +{"Pretrain/Learning Rate": 6.344506829831684e-06, "Pretrain/Loss": 2.024540424346924, "Pretrain/Loss (Raw)": 2.1160125732421875, "Pretrain/Step": 7392, "Pretrain/Step Time": 8.50969341956079} +{"Pretrain/Learning Rate": 6.3388561994800115e-06, "Pretrain/Loss": 2.025700569152832, "Pretrain/Loss (Raw)": 2.084066390991211, "Pretrain/Step": 7393, "Pretrain/Step Time": 8.512617405503988} +{"Pretrain/Learning Rate": 6.333207721219389e-06, "Pretrain/Loss": 2.0256996154785156, "Pretrain/Loss (Raw)": 2.1064627170562744, "Pretrain/Step": 7394, "Pretrain/Step Time": 8.525046462193131} +{"Pretrain/Learning Rate": 6.327561395701201e-06, "Pretrain/Loss": 2.0266854763031006, "Pretrain/Loss (Raw)": 2.1086063385009766, "Pretrain/Step": 7395, "Pretrain/Step Time": 8.524628488346934} +{"Pretrain/Learning Rate": 6.321917223576626e-06, "Pretrain/Loss": 2.0286998748779297, "Pretrain/Loss (Raw)": 2.084749460220337, "Pretrain/Step": 7396, "Pretrain/Step Time": 8.524777807295322} +{"Pretrain/Learning Rate": 6.316275205496572e-06, "Pretrain/Loss": 2.030177116394043, "Pretrain/Loss (Raw)": 2.2542643547058105, "Pretrain/Step": 7397, "Pretrain/Step Time": 8.524805033579469} +{"Pretrain/Learning Rate": 6.310635342111701e-06, "Pretrain/Loss": 2.0298819541931152, "Pretrain/Loss (Raw)": 1.9623546600341797, "Pretrain/Step": 7398, "Pretrain/Step Time": 8.523422500118613} +{"Pretrain/Learning Rate": 6.304997634072421e-06, "Pretrain/Loss": 2.0278592109680176, "Pretrain/Loss (Raw)": 1.8184329271316528, "Pretrain/Step": 7399, "Pretrain/Step Time": 8.536246865987778} +{"Pretrain/Learning Rate": 6.299362082028909e-06, "Pretrain/Loss": 2.028014659881592, "Pretrain/Loss (Raw)": 2.0118556022644043, "Pretrain/Step": 7400, "Pretrain/Step Time": 8.53325585834682} +{"Pretrain/Learning Rate": 6.293728686631095e-06, "Pretrain/Loss": 2.0270533561706543, "Pretrain/Loss (Raw)": 1.8829923868179321, "Pretrain/Step": 7401, "Pretrain/Step Time": 8.528616381809115} +{"Pretrain/Learning Rate": 6.288097448528624e-06, "Pretrain/Loss": 2.025574207305908, "Pretrain/Loss (Raw)": 1.9739058017730713, "Pretrain/Step": 7402, "Pretrain/Step Time": 8.52699002623558} +{"Pretrain/Learning Rate": 6.2824683683709335e-06, "Pretrain/Loss": 2.0255208015441895, "Pretrain/Loss (Raw)": 1.8598366975784302, "Pretrain/Step": 7403, "Pretrain/Step Time": 8.525273406878114} +{"Pretrain/Learning Rate": 6.2768414468071915e-06, "Pretrain/Loss": 2.026665210723877, "Pretrain/Loss (Raw)": 1.972371220588684, "Pretrain/Step": 7404, "Pretrain/Step Time": 8.52225081063807} +{"Pretrain/Learning Rate": 6.27121668448632e-06, "Pretrain/Loss": 2.023400068283081, "Pretrain/Loss (Raw)": 1.6862237453460693, "Pretrain/Step": 7405, "Pretrain/Step Time": 8.532202057540417} +{"Pretrain/Learning Rate": 6.265594082056986e-06, "Pretrain/Loss": 2.0238747596740723, "Pretrain/Loss (Raw)": 1.9733169078826904, "Pretrain/Step": 7406, "Pretrain/Step Time": 8.538423841819167} +{"Pretrain/Learning Rate": 6.25997364016763e-06, "Pretrain/Loss": 2.021986246109009, "Pretrain/Loss (Raw)": 1.871166467666626, "Pretrain/Step": 7407, "Pretrain/Step Time": 8.532565351575613} +{"Pretrain/Learning Rate": 6.254355359466418e-06, "Pretrain/Loss": 2.0249392986297607, "Pretrain/Loss (Raw)": 2.081583023071289, "Pretrain/Step": 7408, "Pretrain/Step Time": 8.529387453570962} +{"Pretrain/Learning Rate": 6.248739240601282e-06, "Pretrain/Loss": 2.0257019996643066, "Pretrain/Loss (Raw)": 2.1303017139434814, "Pretrain/Step": 7409, "Pretrain/Step Time": 8.520838428288698} +{"Pretrain/Learning Rate": 6.243125284219883e-06, "Pretrain/Loss": 2.0246224403381348, "Pretrain/Loss (Raw)": 1.8095635175704956, "Pretrain/Step": 7410, "Pretrain/Step Time": 8.525818169116974} +{"Pretrain/Learning Rate": 6.237513490969674e-06, "Pretrain/Loss": 2.023494243621826, "Pretrain/Loss (Raw)": 1.9450786113739014, "Pretrain/Step": 7411, "Pretrain/Step Time": 8.531457252800465} +{"Pretrain/Learning Rate": 6.231903861497817e-06, "Pretrain/Loss": 2.02272367477417, "Pretrain/Loss (Raw)": 2.042550563812256, "Pretrain/Step": 7412, "Pretrain/Step Time": 8.534473426640034} +{"Pretrain/Learning Rate": 6.226296396451245e-06, "Pretrain/Loss": 2.019322395324707, "Pretrain/Loss (Raw)": 1.9441823959350586, "Pretrain/Step": 7413, "Pretrain/Step Time": 8.529939372092485} +{"Pretrain/Learning Rate": 6.2206910964766325e-06, "Pretrain/Loss": 2.0213968753814697, "Pretrain/Loss (Raw)": 2.0557665824890137, "Pretrain/Step": 7414, "Pretrain/Step Time": 8.530224658548832} +{"Pretrain/Learning Rate": 6.21508796222042e-06, "Pretrain/Loss": 2.0204834938049316, "Pretrain/Loss (Raw)": 1.9969427585601807, "Pretrain/Step": 7415, "Pretrain/Step Time": 8.528983840718865} +{"Pretrain/Learning Rate": 6.2094869943287805e-06, "Pretrain/Loss": 2.0201339721679688, "Pretrain/Loss (Raw)": 2.029264450073242, "Pretrain/Step": 7416, "Pretrain/Step Time": 8.530892049893737} +{"Pretrain/Learning Rate": 6.203888193447646e-06, "Pretrain/Loss": 2.022843599319458, "Pretrain/Loss (Raw)": 2.4903459548950195, "Pretrain/Step": 7417, "Pretrain/Step Time": 8.538950711488724} +{"Pretrain/Learning Rate": 6.198291560222685e-06, "Pretrain/Loss": 2.0212106704711914, "Pretrain/Loss (Raw)": 1.8662036657333374, "Pretrain/Step": 7418, "Pretrain/Step Time": 8.53781507536769} +{"Pretrain/Learning Rate": 6.192697095299349e-06, "Pretrain/Loss": 2.020859956741333, "Pretrain/Loss (Raw)": 2.012295961380005, "Pretrain/Step": 7419, "Pretrain/Step Time": 8.534724911674857} +{"Pretrain/Learning Rate": 6.187104799322804e-06, "Pretrain/Loss": 2.020872116088867, "Pretrain/Loss (Raw)": 1.9864928722381592, "Pretrain/Step": 7420, "Pretrain/Step Time": 8.529697811231017} +{"Pretrain/Learning Rate": 6.1815146729379855e-06, "Pretrain/Loss": 2.0222620964050293, "Pretrain/Loss (Raw)": 2.293833017349243, "Pretrain/Step": 7421, "Pretrain/Step Time": 8.53401805832982} +{"Pretrain/Learning Rate": 6.17592671678956e-06, "Pretrain/Loss": 2.0178332328796387, "Pretrain/Loss (Raw)": 1.8478782176971436, "Pretrain/Step": 7422, "Pretrain/Step Time": 8.54420149512589} +{"Pretrain/Learning Rate": 6.170340931521976e-06, "Pretrain/Loss": 2.0181148052215576, "Pretrain/Loss (Raw)": 2.0519604682922363, "Pretrain/Step": 7423, "Pretrain/Step Time": 8.54640487767756} +{"Pretrain/Learning Rate": 6.164757317779404e-06, "Pretrain/Loss": 2.0185770988464355, "Pretrain/Loss (Raw)": 2.150517463684082, "Pretrain/Step": 7424, "Pretrain/Step Time": 8.54960242845118} +{"Pretrain/Learning Rate": 6.159175876205775e-06, "Pretrain/Loss": 2.019023895263672, "Pretrain/Loss (Raw)": 1.8378173112869263, "Pretrain/Step": 7425, "Pretrain/Step Time": 8.543849498033524} +{"Pretrain/Learning Rate": 6.153596607444756e-06, "Pretrain/Loss": 2.0204172134399414, "Pretrain/Loss (Raw)": 2.040200710296631, "Pretrain/Step": 7426, "Pretrain/Step Time": 8.5434361230582} +{"Pretrain/Learning Rate": 6.148019512139797e-06, "Pretrain/Loss": 2.019434690475464, "Pretrain/Loss (Raw)": 1.9503182172775269, "Pretrain/Step": 7427, "Pretrain/Step Time": 8.543648347258568} +{"Pretrain/Learning Rate": 6.142444590934046e-06, "Pretrain/Loss": 2.020442485809326, "Pretrain/Loss (Raw)": 2.0640480518341064, "Pretrain/Step": 7428, "Pretrain/Step Time": 8.544480280950665} +{"Pretrain/Learning Rate": 6.136871844470454e-06, "Pretrain/Loss": 2.022343158721924, "Pretrain/Loss (Raw)": 2.0067098140716553, "Pretrain/Step": 7429, "Pretrain/Step Time": 8.54304002597928} +{"Pretrain/Learning Rate": 6.131301273391679e-06, "Pretrain/Loss": 2.024571180343628, "Pretrain/Loss (Raw)": 2.1689345836639404, "Pretrain/Step": 7430, "Pretrain/Step Time": 8.54319728910923} +{"Pretrain/Learning Rate": 6.125732878340168e-06, "Pretrain/Loss": 2.0255064964294434, "Pretrain/Loss (Raw)": 2.049006223678589, "Pretrain/Step": 7431, "Pretrain/Step Time": 8.536610970273614} +{"Pretrain/Learning Rate": 6.120166659958065e-06, "Pretrain/Loss": 2.020153284072876, "Pretrain/Loss (Raw)": 1.8396652936935425, "Pretrain/Step": 7432, "Pretrain/Step Time": 8.532699855044484} +{"Pretrain/Learning Rate": 6.1146026188873134e-06, "Pretrain/Loss": 2.016552209854126, "Pretrain/Loss (Raw)": 1.8900024890899658, "Pretrain/Step": 7433, "Pretrain/Step Time": 8.53918768465519} +{"Pretrain/Learning Rate": 6.1090407557695735e-06, "Pretrain/Loss": 2.0156774520874023, "Pretrain/Loss (Raw)": 2.0491437911987305, "Pretrain/Step": 7434, "Pretrain/Step Time": 8.548393175005913} +{"Pretrain/Learning Rate": 6.103481071246284e-06, "Pretrain/Loss": 2.0148508548736572, "Pretrain/Loss (Raw)": 1.8228815793991089, "Pretrain/Step": 7435, "Pretrain/Step Time": 8.54726404324174} +{"Pretrain/Learning Rate": 6.097923565958588e-06, "Pretrain/Loss": 2.013686180114746, "Pretrain/Loss (Raw)": 1.8744564056396484, "Pretrain/Step": 7436, "Pretrain/Step Time": 8.54804209060967} +{"Pretrain/Learning Rate": 6.092368240547422e-06, "Pretrain/Loss": 2.013587236404419, "Pretrain/Loss (Raw)": 1.9684064388275146, "Pretrain/Step": 7437, "Pretrain/Step Time": 8.538415493443608} +{"Pretrain/Learning Rate": 6.0868150956534445e-06, "Pretrain/Loss": 2.0151548385620117, "Pretrain/Loss (Raw)": 2.007838010787964, "Pretrain/Step": 7438, "Pretrain/Step Time": 8.531557206064463} +{"Pretrain/Learning Rate": 6.081264131917075e-06, "Pretrain/Loss": 2.0138847827911377, "Pretrain/Loss (Raw)": 2.067293405532837, "Pretrain/Step": 7439, "Pretrain/Step Time": 8.531067410483956} +{"Pretrain/Learning Rate": 6.075715349978464e-06, "Pretrain/Loss": 2.011587142944336, "Pretrain/Loss (Raw)": 1.8335902690887451, "Pretrain/Step": 7440, "Pretrain/Step Time": 8.539191262796521} +{"Pretrain/Learning Rate": 6.070168750477534e-06, "Pretrain/Loss": 2.0093612670898438, "Pretrain/Loss (Raw)": 1.8562335968017578, "Pretrain/Step": 7441, "Pretrain/Step Time": 8.53672032430768} +{"Pretrain/Learning Rate": 6.0646243340539584e-06, "Pretrain/Loss": 2.008934497833252, "Pretrain/Loss (Raw)": 1.8826563358306885, "Pretrain/Step": 7442, "Pretrain/Step Time": 8.531271142885089} +{"Pretrain/Learning Rate": 6.059082101347119e-06, "Pretrain/Loss": 2.008681058883667, "Pretrain/Loss (Raw)": 2.076443910598755, "Pretrain/Step": 7443, "Pretrain/Step Time": 8.524298295378685} +{"Pretrain/Learning Rate": 6.053542052996189e-06, "Pretrain/Loss": 2.0075507164001465, "Pretrain/Loss (Raw)": 1.8666181564331055, "Pretrain/Step": 7444, "Pretrain/Step Time": 8.523422257974744} +{"Pretrain/Learning Rate": 6.048004189640061e-06, "Pretrain/Loss": 2.008005142211914, "Pretrain/Loss (Raw)": 2.0787813663482666, "Pretrain/Step": 7445, "Pretrain/Step Time": 8.52423950843513} +{"Pretrain/Learning Rate": 6.0424685119174095e-06, "Pretrain/Loss": 2.0088298320770264, "Pretrain/Loss (Raw)": 1.9646120071411133, "Pretrain/Step": 7446, "Pretrain/Step Time": 8.529320295900106} +{"Pretrain/Learning Rate": 6.036935020466605e-06, "Pretrain/Loss": 2.0091805458068848, "Pretrain/Loss (Raw)": 1.8964039087295532, "Pretrain/Step": 7447, "Pretrain/Step Time": 8.528189469128847} +{"Pretrain/Learning Rate": 6.031403715925818e-06, "Pretrain/Loss": 2.0028116703033447, "Pretrain/Loss (Raw)": 1.7188091278076172, "Pretrain/Step": 7448, "Pretrain/Step Time": 8.517734818160534} +{"Pretrain/Learning Rate": 6.025874598932937e-06, "Pretrain/Loss": 2.000012159347534, "Pretrain/Loss (Raw)": 2.0018842220306396, "Pretrain/Step": 7449, "Pretrain/Step Time": 8.51894274353981} +{"Pretrain/Learning Rate": 6.020347670125606e-06, "Pretrain/Loss": 2.000725269317627, "Pretrain/Loss (Raw)": 2.2335827350616455, "Pretrain/Step": 7450, "Pretrain/Step Time": 8.511298723518848} +{"Pretrain/Learning Rate": 6.014822930141212e-06, "Pretrain/Loss": 2.0007710456848145, "Pretrain/Loss (Raw)": 2.02541184425354, "Pretrain/Step": 7451, "Pretrain/Step Time": 8.506931565701962} +{"Pretrain/Learning Rate": 6.0093003796169026e-06, "Pretrain/Loss": 2.0005595684051514, "Pretrain/Loss (Raw)": 2.0679972171783447, "Pretrain/Step": 7452, "Pretrain/Step Time": 8.519552450627089} +{"Pretrain/Learning Rate": 6.003780019189565e-06, "Pretrain/Loss": 2.001920223236084, "Pretrain/Loss (Raw)": 2.1299705505371094, "Pretrain/Step": 7453, "Pretrain/Step Time": 8.521009111776948} +{"Pretrain/Learning Rate": 5.998261849495826e-06, "Pretrain/Loss": 2.0019869804382324, "Pretrain/Loss (Raw)": 2.011765480041504, "Pretrain/Step": 7454, "Pretrain/Step Time": 8.513689547777176} +{"Pretrain/Learning Rate": 5.9927458711720615e-06, "Pretrain/Loss": 2.0001206398010254, "Pretrain/Loss (Raw)": 1.7058289051055908, "Pretrain/Step": 7455, "Pretrain/Step Time": 8.510843817144632} +{"Pretrain/Learning Rate": 5.9872320848544165e-06, "Pretrain/Loss": 1.9989442825317383, "Pretrain/Loss (Raw)": 1.9067500829696655, "Pretrain/Step": 7456, "Pretrain/Step Time": 8.508981859311461} +{"Pretrain/Learning Rate": 5.9817204911787576e-06, "Pretrain/Loss": 1.998224139213562, "Pretrain/Loss (Raw)": 1.9771113395690918, "Pretrain/Step": 7457, "Pretrain/Step Time": 8.51427948102355} +{"Pretrain/Learning Rate": 5.976211090780712e-06, "Pretrain/Loss": 1.9981950521469116, "Pretrain/Loss (Raw)": 1.983801245689392, "Pretrain/Step": 7458, "Pretrain/Step Time": 8.515931509435177} +{"Pretrain/Learning Rate": 5.970703884295636e-06, "Pretrain/Loss": 1.998844861984253, "Pretrain/Loss (Raw)": 2.022012233734131, "Pretrain/Step": 7459, "Pretrain/Step Time": 8.517139611765742} +{"Pretrain/Learning Rate": 5.965198872358665e-06, "Pretrain/Loss": 1.998931884765625, "Pretrain/Loss (Raw)": 2.116382360458374, "Pretrain/Step": 7460, "Pretrain/Step Time": 8.513802122324705} +{"Pretrain/Learning Rate": 5.959696055604655e-06, "Pretrain/Loss": 1.9991542100906372, "Pretrain/Loss (Raw)": 2.0998942852020264, "Pretrain/Step": 7461, "Pretrain/Step Time": 8.509485566988587} +{"Pretrain/Learning Rate": 5.9541954346682165e-06, "Pretrain/Loss": 1.9968010187149048, "Pretrain/Loss (Raw)": 1.9033966064453125, "Pretrain/Step": 7462, "Pretrain/Step Time": 8.509376155212522} +{"Pretrain/Learning Rate": 5.948697010183701e-06, "Pretrain/Loss": 1.9985605478286743, "Pretrain/Loss (Raw)": 2.5441064834594727, "Pretrain/Step": 7463, "Pretrain/Step Time": 8.513218741863966} +{"Pretrain/Learning Rate": 5.943200782785227e-06, "Pretrain/Loss": 1.997546672821045, "Pretrain/Loss (Raw)": 1.844573736190796, "Pretrain/Step": 7464, "Pretrain/Step Time": 8.513043025508523} +{"Pretrain/Learning Rate": 5.937706753106634e-06, "Pretrain/Loss": 1.9970018863677979, "Pretrain/Loss (Raw)": 2.000962257385254, "Pretrain/Step": 7465, "Pretrain/Step Time": 8.513443941250443} +{"Pretrain/Learning Rate": 5.932214921781526e-06, "Pretrain/Loss": 1.9948022365570068, "Pretrain/Loss (Raw)": 1.8815325498580933, "Pretrain/Step": 7466, "Pretrain/Step Time": 8.505626935511827} +{"Pretrain/Learning Rate": 5.9267252894432355e-06, "Pretrain/Loss": 1.994774580001831, "Pretrain/Loss (Raw)": 1.9302055835723877, "Pretrain/Step": 7467, "Pretrain/Step Time": 8.498611966148019} +{"Pretrain/Learning Rate": 5.921237856724867e-06, "Pretrain/Loss": 1.9939494132995605, "Pretrain/Loss (Raw)": 2.0232491493225098, "Pretrain/Step": 7468, "Pretrain/Step Time": 8.500873243436217} +{"Pretrain/Learning Rate": 5.915752624259252e-06, "Pretrain/Loss": 1.9922057390213013, "Pretrain/Loss (Raw)": 1.8863372802734375, "Pretrain/Step": 7469, "Pretrain/Step Time": 8.499855814501643} +{"Pretrain/Learning Rate": 5.910269592678971e-06, "Pretrain/Loss": 1.9913583993911743, "Pretrain/Loss (Raw)": 1.9261564016342163, "Pretrain/Step": 7470, "Pretrain/Step Time": 8.497657161206007} +{"Pretrain/Learning Rate": 5.904788762616348e-06, "Pretrain/Loss": 1.990473985671997, "Pretrain/Loss (Raw)": 1.7749903202056885, "Pretrain/Step": 7471, "Pretrain/Step Time": 8.504386752843857} +{"Pretrain/Learning Rate": 5.899310134703479e-06, "Pretrain/Loss": 1.990919828414917, "Pretrain/Loss (Raw)": 2.015397548675537, "Pretrain/Step": 7472, "Pretrain/Step Time": 8.515462655574083} +{"Pretrain/Learning Rate": 5.893833709572155e-06, "Pretrain/Loss": 1.9913092851638794, "Pretrain/Loss (Raw)": 1.9233042001724243, "Pretrain/Step": 7473, "Pretrain/Step Time": 8.506280779838562} +{"Pretrain/Learning Rate": 5.88835948785397e-06, "Pretrain/Loss": 1.991686224937439, "Pretrain/Loss (Raw)": 1.7786600589752197, "Pretrain/Step": 7474, "Pretrain/Step Time": 8.504561530426145} +{"Pretrain/Learning Rate": 5.882887470180215e-06, "Pretrain/Loss": 1.9879910945892334, "Pretrain/Loss (Raw)": 1.9541000127792358, "Pretrain/Step": 7475, "Pretrain/Step Time": 8.50827681273222} +{"Pretrain/Learning Rate": 5.877417657181975e-06, "Pretrain/Loss": 1.9898686408996582, "Pretrain/Loss (Raw)": 2.2045257091522217, "Pretrain/Step": 7476, "Pretrain/Step Time": 8.508296817541122} +{"Pretrain/Learning Rate": 5.871950049490024e-06, "Pretrain/Loss": 1.9897130727767944, "Pretrain/Loss (Raw)": 1.9641391038894653, "Pretrain/Step": 7477, "Pretrain/Step Time": 8.514897657558322} +{"Pretrain/Learning Rate": 5.866484647734935e-06, "Pretrain/Loss": 1.9903827905654907, "Pretrain/Loss (Raw)": 2.0825304985046387, "Pretrain/Step": 7478, "Pretrain/Step Time": 8.510263031348586} +{"Pretrain/Learning Rate": 5.861021452546997e-06, "Pretrain/Loss": 1.9903217554092407, "Pretrain/Loss (Raw)": 2.0043156147003174, "Pretrain/Step": 7479, "Pretrain/Step Time": 8.510465919971466} +{"Pretrain/Learning Rate": 5.855560464556253e-06, "Pretrain/Loss": 1.9882845878601074, "Pretrain/Loss (Raw)": 1.9599087238311768, "Pretrain/Step": 7480, "Pretrain/Step Time": 8.510280242189765} +{"Pretrain/Learning Rate": 5.8501016843924785e-06, "Pretrain/Loss": 1.990821361541748, "Pretrain/Loss (Raw)": 2.126046895980835, "Pretrain/Step": 7481, "Pretrain/Step Time": 8.51618019118905} +{"Pretrain/Learning Rate": 5.844645112685215e-06, "Pretrain/Loss": 1.9916157722473145, "Pretrain/Loss (Raw)": 2.031096935272217, "Pretrain/Step": 7482, "Pretrain/Step Time": 8.517422616481781} +{"Pretrain/Learning Rate": 5.839190750063756e-06, "Pretrain/Loss": 1.9923162460327148, "Pretrain/Loss (Raw)": 2.0500266551971436, "Pretrain/Step": 7483, "Pretrain/Step Time": 8.518933948129416} +{"Pretrain/Learning Rate": 5.833738597157093e-06, "Pretrain/Loss": 1.9935845136642456, "Pretrain/Loss (Raw)": 2.282841920852661, "Pretrain/Step": 7484, "Pretrain/Step Time": 8.52082847058773} +{"Pretrain/Learning Rate": 5.828288654594016e-06, "Pretrain/Loss": 1.9943822622299194, "Pretrain/Loss (Raw)": 2.1124823093414307, "Pretrain/Step": 7485, "Pretrain/Step Time": 8.510252933949232} +{"Pretrain/Learning Rate": 5.822840923003023e-06, "Pretrain/Loss": 1.993888258934021, "Pretrain/Loss (Raw)": 1.95595121383667, "Pretrain/Step": 7486, "Pretrain/Step Time": 8.508833855390549} +{"Pretrain/Learning Rate": 5.817395403012396e-06, "Pretrain/Loss": 1.9949136972427368, "Pretrain/Loss (Raw)": 2.043605089187622, "Pretrain/Step": 7487, "Pretrain/Step Time": 8.512231020256877} +{"Pretrain/Learning Rate": 5.8119520952501085e-06, "Pretrain/Loss": 1.995296835899353, "Pretrain/Loss (Raw)": 1.9847153425216675, "Pretrain/Step": 7488, "Pretrain/Step Time": 8.516602901741862} +{"Pretrain/Learning Rate": 5.806511000343931e-06, "Pretrain/Loss": 1.9967479705810547, "Pretrain/Loss (Raw)": 2.116645336151123, "Pretrain/Step": 7489, "Pretrain/Step Time": 8.520757539197803} +{"Pretrain/Learning Rate": 5.801072118921347e-06, "Pretrain/Loss": 1.9961944818496704, "Pretrain/Loss (Raw)": 1.7848834991455078, "Pretrain/Step": 7490, "Pretrain/Step Time": 8.524029524996877} +{"Pretrain/Learning Rate": 5.7956354516095935e-06, "Pretrain/Loss": 1.99767005443573, "Pretrain/Loss (Raw)": 2.1679651737213135, "Pretrain/Step": 7491, "Pretrain/Step Time": 8.524163164198399} +{"Pretrain/Learning Rate": 5.790200999035647e-06, "Pretrain/Loss": 1.9981715679168701, "Pretrain/Loss (Raw)": 2.0600361824035645, "Pretrain/Step": 7492, "Pretrain/Step Time": 8.517179248854518} +{"Pretrain/Learning Rate": 5.784768761826248e-06, "Pretrain/Loss": 1.9979609251022339, "Pretrain/Loss (Raw)": 2.0526816844940186, "Pretrain/Step": 7493, "Pretrain/Step Time": 8.519572330638766} +{"Pretrain/Learning Rate": 5.779338740607859e-06, "Pretrain/Loss": 1.9979307651519775, "Pretrain/Loss (Raw)": 1.970349669456482, "Pretrain/Step": 7494, "Pretrain/Step Time": 8.519520977512002} +{"Pretrain/Learning Rate": 5.773910936006699e-06, "Pretrain/Loss": 1.9959492683410645, "Pretrain/Loss (Raw)": 1.8561757802963257, "Pretrain/Step": 7495, "Pretrain/Step Time": 8.516101691871881} +{"Pretrain/Learning Rate": 5.768485348648719e-06, "Pretrain/Loss": 1.9954869747161865, "Pretrain/Loss (Raw)": 1.9881203174591064, "Pretrain/Step": 7496, "Pretrain/Step Time": 8.52063025534153} +{"Pretrain/Learning Rate": 5.763061979159637e-06, "Pretrain/Loss": 1.991551399230957, "Pretrain/Loss (Raw)": 1.6718052625656128, "Pretrain/Step": 7497, "Pretrain/Step Time": 8.526224050670862} +{"Pretrain/Learning Rate": 5.757640828164895e-06, "Pretrain/Loss": 1.9922902584075928, "Pretrain/Loss (Raw)": 2.1381404399871826, "Pretrain/Step": 7498, "Pretrain/Step Time": 8.521360510960221} +{"Pretrain/Learning Rate": 5.7522218962896865e-06, "Pretrain/Loss": 1.9943252801895142, "Pretrain/Loss (Raw)": 2.1672112941741943, "Pretrain/Step": 7499, "Pretrain/Step Time": 8.520326932892203} +{"Pretrain/Learning Rate": 5.746805184158941e-06, "Pretrain/Loss": 1.9949499368667603, "Pretrain/Loss (Raw)": 2.046754837036133, "Pretrain/Step": 7500, "Pretrain/Step Time": 8.52638704329729} +{"Pretrain/Learning Rate": 5.74139069239735e-06, "Pretrain/Loss": 1.9918642044067383, "Pretrain/Loss (Raw)": 1.6483395099639893, "Pretrain/Step": 7501, "Pretrain/Step Time": 8.5247093886137} +{"Pretrain/Learning Rate": 5.735978421629337e-06, "Pretrain/Loss": 1.9903558492660522, "Pretrain/Loss (Raw)": 1.9570685625076294, "Pretrain/Step": 7502, "Pretrain/Step Time": 8.522827845066786} +{"Pretrain/Learning Rate": 5.730568372479064e-06, "Pretrain/Loss": 1.9908726215362549, "Pretrain/Loss (Raw)": 2.037341356277466, "Pretrain/Step": 7503, "Pretrain/Step Time": 8.522559756413102} +{"Pretrain/Learning Rate": 5.725160545570443e-06, "Pretrain/Loss": 1.992348551750183, "Pretrain/Loss (Raw)": 2.0678751468658447, "Pretrain/Step": 7504, "Pretrain/Step Time": 8.51707729883492} +{"Pretrain/Learning Rate": 5.719754941527139e-06, "Pretrain/Loss": 1.9905837774276733, "Pretrain/Loss (Raw)": 1.8309221267700195, "Pretrain/Step": 7505, "Pretrain/Step Time": 8.516971280798316} +{"Pretrain/Learning Rate": 5.7143515609725475e-06, "Pretrain/Loss": 1.9909083843231201, "Pretrain/Loss (Raw)": 1.9796007871627808, "Pretrain/Step": 7506, "Pretrain/Step Time": 8.525908818468451} +{"Pretrain/Learning Rate": 5.7089504045298115e-06, "Pretrain/Loss": 1.989971399307251, "Pretrain/Loss (Raw)": 2.0211586952209473, "Pretrain/Step": 7507, "Pretrain/Step Time": 8.519483802840114} +{"Pretrain/Learning Rate": 5.703551472821808e-06, "Pretrain/Loss": 1.9918094873428345, "Pretrain/Loss (Raw)": 2.0666983127593994, "Pretrain/Step": 7508, "Pretrain/Step Time": 8.523262191563845} +{"Pretrain/Learning Rate": 5.698154766471186e-06, "Pretrain/Loss": 1.9909627437591553, "Pretrain/Loss (Raw)": 1.7970904111862183, "Pretrain/Step": 7509, "Pretrain/Step Time": 8.529891425743699} +{"Pretrain/Learning Rate": 5.692760286100307e-06, "Pretrain/Loss": 1.9935882091522217, "Pretrain/Loss (Raw)": 2.1727092266082764, "Pretrain/Step": 7510, "Pretrain/Step Time": 8.529118435457349} +{"Pretrain/Learning Rate": 5.6873680323312916e-06, "Pretrain/Loss": 1.9937936067581177, "Pretrain/Loss (Raw)": 2.1776225566864014, "Pretrain/Step": 7511, "Pretrain/Step Time": 8.533555287867785} +{"Pretrain/Learning Rate": 5.681978005785993e-06, "Pretrain/Loss": 1.994642972946167, "Pretrain/Loss (Raw)": 2.110093355178833, "Pretrain/Step": 7512, "Pretrain/Step Time": 8.53962529450655} +{"Pretrain/Learning Rate": 5.676590207086035e-06, "Pretrain/Loss": 1.9964473247528076, "Pretrain/Loss (Raw)": 2.0684592723846436, "Pretrain/Step": 7513, "Pretrain/Step Time": 8.544447906315327} +{"Pretrain/Learning Rate": 5.671204636852734e-06, "Pretrain/Loss": 1.9979296922683716, "Pretrain/Loss (Raw)": 2.2106544971466064, "Pretrain/Step": 7514, "Pretrain/Step Time": 8.53311382420361} +{"Pretrain/Learning Rate": 5.6658212957071995e-06, "Pretrain/Loss": 1.9981111288070679, "Pretrain/Loss (Raw)": 2.0247862339019775, "Pretrain/Step": 7515, "Pretrain/Step Time": 8.53137150220573} +{"Pretrain/Learning Rate": 5.6604401842702545e-06, "Pretrain/Loss": 1.9987683296203613, "Pretrain/Loss (Raw)": 1.9937059879302979, "Pretrain/Step": 7516, "Pretrain/Step Time": 8.528835883364081} +{"Pretrain/Learning Rate": 5.6550613031624925e-06, "Pretrain/Loss": 1.998008370399475, "Pretrain/Loss (Raw)": 1.9746875762939453, "Pretrain/Step": 7517, "Pretrain/Step Time": 8.53160315938294} +{"Pretrain/Learning Rate": 5.649684653004203e-06, "Pretrain/Loss": 1.9990650415420532, "Pretrain/Loss (Raw)": 1.938425064086914, "Pretrain/Step": 7518, "Pretrain/Step Time": 8.542549194768071} +{"Pretrain/Learning Rate": 5.644310234415467e-06, "Pretrain/Loss": 2.0010814666748047, "Pretrain/Loss (Raw)": 2.25661563873291, "Pretrain/Step": 7519, "Pretrain/Step Time": 8.541753441095352} +{"Pretrain/Learning Rate": 5.638938048016082e-06, "Pretrain/Loss": 1.9981640577316284, "Pretrain/Loss (Raw)": 1.7425895929336548, "Pretrain/Step": 7520, "Pretrain/Step Time": 8.535062370821834} +{"Pretrain/Learning Rate": 5.633568094425593e-06, "Pretrain/Loss": 1.9969614744186401, "Pretrain/Loss (Raw)": 1.9301284551620483, "Pretrain/Step": 7521, "Pretrain/Step Time": 8.532630167901516} +{"Pretrain/Learning Rate": 5.6282003742632846e-06, "Pretrain/Loss": 1.996649146080017, "Pretrain/Loss (Raw)": 2.0665066242218018, "Pretrain/Step": 7522, "Pretrain/Step Time": 8.51808019168675} +{"Pretrain/Learning Rate": 5.622834888148188e-06, "Pretrain/Loss": 1.9956307411193848, "Pretrain/Loss (Raw)": 1.9782559871673584, "Pretrain/Step": 7523, "Pretrain/Step Time": 8.520372536033392} +{"Pretrain/Learning Rate": 5.617471636699098e-06, "Pretrain/Loss": 1.9954673051834106, "Pretrain/Loss (Raw)": 2.0638082027435303, "Pretrain/Step": 7524, "Pretrain/Step Time": 8.529804868623614} +{"Pretrain/Learning Rate": 5.612110620534497e-06, "Pretrain/Loss": 1.9931607246398926, "Pretrain/Loss (Raw)": 1.9590232372283936, "Pretrain/Step": 7525, "Pretrain/Step Time": 8.52616572380066} +{"Pretrain/Learning Rate": 5.606751840272664e-06, "Pretrain/Loss": 1.9950075149536133, "Pretrain/Loss (Raw)": 2.1987297534942627, "Pretrain/Step": 7526, "Pretrain/Step Time": 8.525608237832785} +{"Pretrain/Learning Rate": 5.601395296531586e-06, "Pretrain/Loss": 1.9951881170272827, "Pretrain/Loss (Raw)": 1.8415648937225342, "Pretrain/Step": 7527, "Pretrain/Step Time": 8.519351243972778} +{"Pretrain/Learning Rate": 5.596040989929027e-06, "Pretrain/Loss": 1.9981857538223267, "Pretrain/Loss (Raw)": 2.39555287361145, "Pretrain/Step": 7528, "Pretrain/Step Time": 8.516263803467155} +{"Pretrain/Learning Rate": 5.5906889210824405e-06, "Pretrain/Loss": 2.0000319480895996, "Pretrain/Loss (Raw)": 2.1192996501922607, "Pretrain/Step": 7529, "Pretrain/Step Time": 8.517546959221363} +{"Pretrain/Learning Rate": 5.585339090609073e-06, "Pretrain/Loss": 2.00045108795166, "Pretrain/Loss (Raw)": 2.0275864601135254, "Pretrain/Step": 7530, "Pretrain/Step Time": 8.525062557309866} +{"Pretrain/Learning Rate": 5.579991499125889e-06, "Pretrain/Loss": 1.9991087913513184, "Pretrain/Loss (Raw)": 1.688000202178955, "Pretrain/Step": 7531, "Pretrain/Step Time": 8.526867352426052} +{"Pretrain/Learning Rate": 5.574646147249596e-06, "Pretrain/Loss": 2.0006892681121826, "Pretrain/Loss (Raw)": 2.174684524536133, "Pretrain/Step": 7532, "Pretrain/Step Time": 8.527664395049214} +{"Pretrain/Learning Rate": 5.569303035596635e-06, "Pretrain/Loss": 2.0028305053710938, "Pretrain/Loss (Raw)": 1.9602844715118408, "Pretrain/Step": 7533, "Pretrain/Step Time": 8.514719491824508} +{"Pretrain/Learning Rate": 5.563962164783215e-06, "Pretrain/Loss": 2.0037693977355957, "Pretrain/Loss (Raw)": 2.09348201751709, "Pretrain/Step": 7534, "Pretrain/Step Time": 8.509510677307844} +{"Pretrain/Learning Rate": 5.558623535425267e-06, "Pretrain/Loss": 2.0056934356689453, "Pretrain/Loss (Raw)": 2.117464780807495, "Pretrain/Step": 7535, "Pretrain/Step Time": 8.518328752368689} +{"Pretrain/Learning Rate": 5.553287148138461e-06, "Pretrain/Loss": 2.0060691833496094, "Pretrain/Loss (Raw)": 2.1296632289886475, "Pretrain/Step": 7536, "Pretrain/Step Time": 8.52580737695098} +{"Pretrain/Learning Rate": 5.5479530035382115e-06, "Pretrain/Loss": 2.004988193511963, "Pretrain/Loss (Raw)": 1.9919471740722656, "Pretrain/Step": 7537, "Pretrain/Step Time": 8.529294492676854} +{"Pretrain/Learning Rate": 5.542621102239686e-06, "Pretrain/Loss": 2.0067920684814453, "Pretrain/Loss (Raw)": 2.040459632873535, "Pretrain/Step": 7538, "Pretrain/Step Time": 8.524740500375628} +{"Pretrain/Learning Rate": 5.537291444857787e-06, "Pretrain/Loss": 2.0084779262542725, "Pretrain/Loss (Raw)": 2.1608870029449463, "Pretrain/Step": 7539, "Pretrain/Step Time": 8.521993428468704} +{"Pretrain/Learning Rate": 5.531964032007144e-06, "Pretrain/Loss": 2.008779287338257, "Pretrain/Loss (Raw)": 2.081113338470459, "Pretrain/Step": 7540, "Pretrain/Step Time": 8.513185702264309} +{"Pretrain/Learning Rate": 5.526638864302144e-06, "Pretrain/Loss": 2.010770082473755, "Pretrain/Loss (Raw)": 2.1989943981170654, "Pretrain/Step": 7541, "Pretrain/Step Time": 8.519352769479156} +{"Pretrain/Learning Rate": 5.521315942356914e-06, "Pretrain/Loss": 2.010342597961426, "Pretrain/Loss (Raw)": 2.0010249614715576, "Pretrain/Step": 7542, "Pretrain/Step Time": 8.519605662673712} +{"Pretrain/Learning Rate": 5.5159952667853204e-06, "Pretrain/Loss": 2.0102312564849854, "Pretrain/Loss (Raw)": 1.9827163219451904, "Pretrain/Step": 7543, "Pretrain/Step Time": 8.521678978577256} +{"Pretrain/Learning Rate": 5.510676838200959e-06, "Pretrain/Loss": 2.0101091861724854, "Pretrain/Loss (Raw)": 2.0136516094207764, "Pretrain/Step": 7544, "Pretrain/Step Time": 8.520255886018276} +{"Pretrain/Learning Rate": 5.505360657217179e-06, "Pretrain/Loss": 2.006361484527588, "Pretrain/Loss (Raw)": 2.0106165409088135, "Pretrain/Step": 7545, "Pretrain/Step Time": 8.51277181878686} +{"Pretrain/Learning Rate": 5.5000467244470745e-06, "Pretrain/Loss": 2.007746696472168, "Pretrain/Loss (Raw)": 2.043513774871826, "Pretrain/Step": 7546, "Pretrain/Step Time": 8.513269245624542} +{"Pretrain/Learning Rate": 5.494735040503468e-06, "Pretrain/Loss": 2.0074760913848877, "Pretrain/Loss (Raw)": 1.9776664972305298, "Pretrain/Step": 7547, "Pretrain/Step Time": 8.52552580460906} +{"Pretrain/Learning Rate": 5.48942560599893e-06, "Pretrain/Loss": 2.007984161376953, "Pretrain/Loss (Raw)": 2.0515520572662354, "Pretrain/Step": 7548, "Pretrain/Step Time": 8.524489805102348} +{"Pretrain/Learning Rate": 5.4841184215457615e-06, "Pretrain/Loss": 2.007493019104004, "Pretrain/Loss (Raw)": 2.2309176921844482, "Pretrain/Step": 7549, "Pretrain/Step Time": 8.524922823533416} +{"Pretrain/Learning Rate": 5.478813487756024e-06, "Pretrain/Loss": 2.008223056793213, "Pretrain/Loss (Raw)": 1.9413166046142578, "Pretrain/Step": 7550, "Pretrain/Step Time": 8.515187749639153} +{"Pretrain/Learning Rate": 5.473510805241502e-06, "Pretrain/Loss": 2.008232831954956, "Pretrain/Loss (Raw)": 2.0532379150390625, "Pretrain/Step": 7551, "Pretrain/Step Time": 8.509713109582663} +{"Pretrain/Learning Rate": 5.468210374613727e-06, "Pretrain/Loss": 2.0081424713134766, "Pretrain/Loss (Raw)": 2.1389408111572266, "Pretrain/Step": 7552, "Pretrain/Step Time": 8.507905714213848} +{"Pretrain/Learning Rate": 5.46291219648396e-06, "Pretrain/Loss": 2.0098633766174316, "Pretrain/Loss (Raw)": 2.058089256286621, "Pretrain/Step": 7553, "Pretrain/Step Time": 8.509731564670801} +{"Pretrain/Learning Rate": 5.457616271463234e-06, "Pretrain/Loss": 2.008613109588623, "Pretrain/Loss (Raw)": 1.8801873922348022, "Pretrain/Step": 7554, "Pretrain/Step Time": 8.513109816238284} +{"Pretrain/Learning Rate": 5.452322600162274e-06, "Pretrain/Loss": 2.0089735984802246, "Pretrain/Loss (Raw)": 1.996461033821106, "Pretrain/Step": 7555, "Pretrain/Step Time": 8.51395695656538} +{"Pretrain/Learning Rate": 5.447031183191589e-06, "Pretrain/Loss": 2.0060195922851562, "Pretrain/Loss (Raw)": 1.6859490871429443, "Pretrain/Step": 7556, "Pretrain/Step Time": 8.510475059971213} +{"Pretrain/Learning Rate": 5.441742021161398e-06, "Pretrain/Loss": 2.006392002105713, "Pretrain/Loss (Raw)": 2.0543553829193115, "Pretrain/Step": 7557, "Pretrain/Step Time": 8.507268195971847} +{"Pretrain/Learning Rate": 5.436455114681693e-06, "Pretrain/Loss": 2.0050840377807617, "Pretrain/Loss (Raw)": 2.0015084743499756, "Pretrain/Step": 7558, "Pretrain/Step Time": 8.506594076752663} +{"Pretrain/Learning Rate": 5.431170464362157e-06, "Pretrain/Loss": 2.0050528049468994, "Pretrain/Loss (Raw)": 2.045013904571533, "Pretrain/Step": 7559, "Pretrain/Step Time": 8.51904365234077} +{"Pretrain/Learning Rate": 5.42588807081226e-06, "Pretrain/Loss": 2.007399320602417, "Pretrain/Loss (Raw)": 2.1400182247161865, "Pretrain/Step": 7560, "Pretrain/Step Time": 8.517378691583872} +{"Pretrain/Learning Rate": 5.420607934641181e-06, "Pretrain/Loss": 2.008540630340576, "Pretrain/Loss (Raw)": 2.0360825061798096, "Pretrain/Step": 7561, "Pretrain/Step Time": 8.51233740337193} +{"Pretrain/Learning Rate": 5.415330056457871e-06, "Pretrain/Loss": 2.0063560009002686, "Pretrain/Loss (Raw)": 1.7695274353027344, "Pretrain/Step": 7562, "Pretrain/Step Time": 8.503218218684196} +{"Pretrain/Learning Rate": 5.410054436870968e-06, "Pretrain/Loss": 2.013066530227661, "Pretrain/Loss (Raw)": 2.6818387508392334, "Pretrain/Step": 7563, "Pretrain/Step Time": 8.507427318021655} +{"Pretrain/Learning Rate": 5.404781076488901e-06, "Pretrain/Loss": 2.0142552852630615, "Pretrain/Loss (Raw)": 2.026616334915161, "Pretrain/Step": 7564, "Pretrain/Step Time": 8.50950837880373} +{"Pretrain/Learning Rate": 5.399509975919828e-06, "Pretrain/Loss": 2.013652801513672, "Pretrain/Loss (Raw)": 1.8912794589996338, "Pretrain/Step": 7565, "Pretrain/Step Time": 8.514736387878656} +{"Pretrain/Learning Rate": 5.394241135771613e-06, "Pretrain/Loss": 2.0140116214752197, "Pretrain/Loss (Raw)": 2.0537562370300293, "Pretrain/Step": 7566, "Pretrain/Step Time": 8.514041753485799} +{"Pretrain/Learning Rate": 5.388974556651902e-06, "Pretrain/Loss": 2.0144383907318115, "Pretrain/Loss (Raw)": 2.12192964553833, "Pretrain/Step": 7567, "Pretrain/Step Time": 8.510062700137496} +{"Pretrain/Learning Rate": 5.3837102391680465e-06, "Pretrain/Loss": 2.0152549743652344, "Pretrain/Loss (Raw)": 1.9381235837936401, "Pretrain/Step": 7568, "Pretrain/Step Time": 8.50092483125627} +{"Pretrain/Learning Rate": 5.378448183927176e-06, "Pretrain/Loss": 2.017192840576172, "Pretrain/Loss (Raw)": 2.104285717010498, "Pretrain/Step": 7569, "Pretrain/Step Time": 8.502753349021077} +{"Pretrain/Learning Rate": 5.373188391536108e-06, "Pretrain/Loss": 2.0197019577026367, "Pretrain/Loss (Raw)": 2.203800916671753, "Pretrain/Step": 7570, "Pretrain/Step Time": 8.504927100613713} +{"Pretrain/Learning Rate": 5.3679308626014445e-06, "Pretrain/Loss": 2.018857002258301, "Pretrain/Loss (Raw)": 1.9682916402816772, "Pretrain/Step": 7571, "Pretrain/Step Time": 8.511551808565855} +{"Pretrain/Learning Rate": 5.362675597729505e-06, "Pretrain/Loss": 2.0195131301879883, "Pretrain/Loss (Raw)": 1.9506092071533203, "Pretrain/Step": 7572, "Pretrain/Step Time": 8.511467594653368} +{"Pretrain/Learning Rate": 5.357422597526349e-06, "Pretrain/Loss": 2.0173585414886475, "Pretrain/Loss (Raw)": 1.8030015230178833, "Pretrain/Step": 7573, "Pretrain/Step Time": 8.513071920722723} +{"Pretrain/Learning Rate": 5.3521718625977715e-06, "Pretrain/Loss": 2.0191707611083984, "Pretrain/Loss (Raw)": 2.196542739868164, "Pretrain/Step": 7574, "Pretrain/Step Time": 8.502010513097048} +{"Pretrain/Learning Rate": 5.346923393549325e-06, "Pretrain/Loss": 2.0213329792022705, "Pretrain/Loss (Raw)": 2.1731972694396973, "Pretrain/Step": 7575, "Pretrain/Step Time": 8.504184111952782} +{"Pretrain/Learning Rate": 5.34167719098628e-06, "Pretrain/Loss": 2.0231680870056152, "Pretrain/Loss (Raw)": 1.9536869525909424, "Pretrain/Step": 7576, "Pretrain/Step Time": 8.509295539930463} +{"Pretrain/Learning Rate": 5.336433255513656e-06, "Pretrain/Loss": 2.022775173187256, "Pretrain/Loss (Raw)": 1.9516087770462036, "Pretrain/Step": 7577, "Pretrain/Step Time": 8.512120481580496} +{"Pretrain/Learning Rate": 5.331191587736198e-06, "Pretrain/Loss": 2.0212061405181885, "Pretrain/Loss (Raw)": 2.032738208770752, "Pretrain/Step": 7578, "Pretrain/Step Time": 8.513561841100454} +{"Pretrain/Learning Rate": 5.325952188258418e-06, "Pretrain/Loss": 2.0215022563934326, "Pretrain/Loss (Raw)": 2.063326120376587, "Pretrain/Step": 7579, "Pretrain/Step Time": 8.51598042063415} +{"Pretrain/Learning Rate": 5.320715057684536e-06, "Pretrain/Loss": 2.0197629928588867, "Pretrain/Loss (Raw)": 1.8453600406646729, "Pretrain/Step": 7580, "Pretrain/Step Time": 8.504278333857656} +{"Pretrain/Learning Rate": 5.315480196618527e-06, "Pretrain/Loss": 2.018195629119873, "Pretrain/Loss (Raw)": 1.9293510913848877, "Pretrain/Step": 7581, "Pretrain/Step Time": 8.502043072134256} +{"Pretrain/Learning Rate": 5.310247605664093e-06, "Pretrain/Loss": 2.016890048980713, "Pretrain/Loss (Raw)": 1.844665765762329, "Pretrain/Step": 7582, "Pretrain/Step Time": 8.503224870190024} +{"Pretrain/Learning Rate": 5.30501728542469e-06, "Pretrain/Loss": 2.0205957889556885, "Pretrain/Loss (Raw)": 2.180166482925415, "Pretrain/Step": 7583, "Pretrain/Step Time": 8.509714778512716} +{"Pretrain/Learning Rate": 5.299789236503503e-06, "Pretrain/Loss": 2.0197722911834717, "Pretrain/Loss (Raw)": 1.801322102546692, "Pretrain/Step": 7584, "Pretrain/Step Time": 8.509629031643271} +{"Pretrain/Learning Rate": 5.294563459503449e-06, "Pretrain/Loss": 2.0187249183654785, "Pretrain/Loss (Raw)": 1.843029499053955, "Pretrain/Step": 7585, "Pretrain/Step Time": 8.517951468005776} +{"Pretrain/Learning Rate": 5.2893399550271835e-06, "Pretrain/Loss": 2.0188097953796387, "Pretrain/Loss (Raw)": 1.994688868522644, "Pretrain/Step": 7586, "Pretrain/Step Time": 8.514023000374436} +{"Pretrain/Learning Rate": 5.2841187236771226e-06, "Pretrain/Loss": 2.0175981521606445, "Pretrain/Loss (Raw)": 1.8669233322143555, "Pretrain/Step": 7587, "Pretrain/Step Time": 8.513691045343876} +{"Pretrain/Learning Rate": 5.278899766055395e-06, "Pretrain/Loss": 2.0157740116119385, "Pretrain/Loss (Raw)": 1.8828834295272827, "Pretrain/Step": 7588, "Pretrain/Step Time": 8.511301627382636} +{"Pretrain/Learning Rate": 5.273683082763875e-06, "Pretrain/Loss": 2.0166666507720947, "Pretrain/Loss (Raw)": 2.214155673980713, "Pretrain/Step": 7589, "Pretrain/Step Time": 8.512019645422697} +{"Pretrain/Learning Rate": 5.26846867440417e-06, "Pretrain/Loss": 2.0145881175994873, "Pretrain/Loss (Raw)": 1.637339472770691, "Pretrain/Step": 7590, "Pretrain/Step Time": 8.52461377903819} +{"Pretrain/Learning Rate": 5.263256541577641e-06, "Pretrain/Loss": 2.0098066329956055, "Pretrain/Loss (Raw)": 1.932082176208496, "Pretrain/Step": 7591, "Pretrain/Step Time": 8.519974768161774} +{"Pretrain/Learning Rate": 5.25804668488537e-06, "Pretrain/Loss": 2.0099730491638184, "Pretrain/Loss (Raw)": 1.865858793258667, "Pretrain/Step": 7592, "Pretrain/Step Time": 8.52076411806047} +{"Pretrain/Learning Rate": 5.252839104928184e-06, "Pretrain/Loss": 2.0113208293914795, "Pretrain/Loss (Raw)": 2.1734862327575684, "Pretrain/Step": 7593, "Pretrain/Step Time": 8.520181972533464} +{"Pretrain/Learning Rate": 5.247633802306637e-06, "Pretrain/Loss": 2.0131475925445557, "Pretrain/Loss (Raw)": 2.115370512008667, "Pretrain/Step": 7594, "Pretrain/Step Time": 8.516809176653624} +{"Pretrain/Learning Rate": 5.242430777621049e-06, "Pretrain/Loss": 2.0126943588256836, "Pretrain/Loss (Raw)": 1.8721767663955688, "Pretrain/Step": 7595, "Pretrain/Step Time": 8.525891158729792} +{"Pretrain/Learning Rate": 5.2372300314714295e-06, "Pretrain/Loss": 2.013676166534424, "Pretrain/Loss (Raw)": 2.1489439010620117, "Pretrain/Step": 7596, "Pretrain/Step Time": 8.531740063801408} +{"Pretrain/Learning Rate": 5.232031564457576e-06, "Pretrain/Loss": 2.0153775215148926, "Pretrain/Loss (Raw)": 2.1040968894958496, "Pretrain/Step": 7597, "Pretrain/Step Time": 8.532086119055748} +{"Pretrain/Learning Rate": 5.226835377178984e-06, "Pretrain/Loss": 2.0162758827209473, "Pretrain/Loss (Raw)": 2.041163682937622, "Pretrain/Step": 7598, "Pretrain/Step Time": 8.533634891733527} +{"Pretrain/Learning Rate": 5.221641470234928e-06, "Pretrain/Loss": 2.016019821166992, "Pretrain/Loss (Raw)": 1.7421945333480835, "Pretrain/Step": 7599, "Pretrain/Step Time": 8.530505634844303} +{"Pretrain/Learning Rate": 5.216449844224358e-06, "Pretrain/Loss": 2.0163750648498535, "Pretrain/Loss (Raw)": 2.0608487129211426, "Pretrain/Step": 7600, "Pretrain/Step Time": 8.516257865354419} +{"Pretrain/Learning Rate": 5.211260499746026e-06, "Pretrain/Loss": 2.0160725116729736, "Pretrain/Loss (Raw)": 1.8845957517623901, "Pretrain/Step": 7601, "Pretrain/Step Time": 8.526326067745686} +{"Pretrain/Learning Rate": 5.206073437398371e-06, "Pretrain/Loss": 2.018303155899048, "Pretrain/Loss (Raw)": 2.064180374145508, "Pretrain/Step": 7602, "Pretrain/Step Time": 8.527579706162214} +{"Pretrain/Learning Rate": 5.200888657779615e-06, "Pretrain/Loss": 2.018954038619995, "Pretrain/Loss (Raw)": 2.0374224185943604, "Pretrain/Step": 7603, "Pretrain/Step Time": 8.530243750661612} +{"Pretrain/Learning Rate": 5.19570616148766e-06, "Pretrain/Loss": 2.0171589851379395, "Pretrain/Loss (Raw)": 1.974769949913025, "Pretrain/Step": 7604, "Pretrain/Step Time": 8.52694384381175} +{"Pretrain/Learning Rate": 5.190525949120193e-06, "Pretrain/Loss": 2.01639461517334, "Pretrain/Loss (Raw)": 1.8662562370300293, "Pretrain/Step": 7605, "Pretrain/Step Time": 8.523599699139595} +{"Pretrain/Learning Rate": 5.18534802127463e-06, "Pretrain/Loss": 2.0192995071411133, "Pretrain/Loss (Raw)": 2.4544150829315186, "Pretrain/Step": 7606, "Pretrain/Step Time": 8.520925989374518} +{"Pretrain/Learning Rate": 5.1801723785480925e-06, "Pretrain/Loss": 2.018759250640869, "Pretrain/Loss (Raw)": 1.9351098537445068, "Pretrain/Step": 7607, "Pretrain/Step Time": 8.527294786646962} +{"Pretrain/Learning Rate": 5.174999021537475e-06, "Pretrain/Loss": 2.0193674564361572, "Pretrain/Loss (Raw)": 2.037790060043335, "Pretrain/Step": 7608, "Pretrain/Step Time": 8.530201697722077} +{"Pretrain/Learning Rate": 5.169827950839384e-06, "Pretrain/Loss": 2.0191092491149902, "Pretrain/Loss (Raw)": 2.0930094718933105, "Pretrain/Step": 7609, "Pretrain/Step Time": 8.526185503229499} +{"Pretrain/Learning Rate": 5.164659167050187e-06, "Pretrain/Loss": 2.0194334983825684, "Pretrain/Loss (Raw)": 2.0725791454315186, "Pretrain/Step": 7610, "Pretrain/Step Time": 8.524276375770569} +{"Pretrain/Learning Rate": 5.15949267076595e-06, "Pretrain/Loss": 2.018620491027832, "Pretrain/Loss (Raw)": 1.9459648132324219, "Pretrain/Step": 7611, "Pretrain/Step Time": 8.527812972664833} +{"Pretrain/Learning Rate": 5.1543284625825165e-06, "Pretrain/Loss": 2.0170884132385254, "Pretrain/Loss (Raw)": 2.086710214614868, "Pretrain/Step": 7612, "Pretrain/Step Time": 8.519358724355698} +{"Pretrain/Learning Rate": 5.149166543095444e-06, "Pretrain/Loss": 2.014092445373535, "Pretrain/Loss (Raw)": 1.7290033102035522, "Pretrain/Step": 7613, "Pretrain/Step Time": 8.530623590573668} +{"Pretrain/Learning Rate": 5.144006912900021e-06, "Pretrain/Loss": 2.011063575744629, "Pretrain/Loss (Raw)": 1.568284273147583, "Pretrain/Step": 7614, "Pretrain/Step Time": 8.53335596434772} +{"Pretrain/Learning Rate": 5.138849572591281e-06, "Pretrain/Loss": 2.0142366886138916, "Pretrain/Loss (Raw)": 2.449753522872925, "Pretrain/Step": 7615, "Pretrain/Step Time": 8.531298466026783} +{"Pretrain/Learning Rate": 5.133694522764002e-06, "Pretrain/Loss": 2.0153908729553223, "Pretrain/Loss (Raw)": 2.1324660778045654, "Pretrain/Step": 7616, "Pretrain/Step Time": 8.525446036830544} +{"Pretrain/Learning Rate": 5.128541764012687e-06, "Pretrain/Loss": 2.013472557067871, "Pretrain/Loss (Raw)": 1.8710638284683228, "Pretrain/Step": 7617, "Pretrain/Step Time": 8.523569276556373} +{"Pretrain/Learning Rate": 5.123391296931571e-06, "Pretrain/Loss": 2.013948917388916, "Pretrain/Loss (Raw)": 1.8458880186080933, "Pretrain/Step": 7618, "Pretrain/Step Time": 8.51509009487927} +{"Pretrain/Learning Rate": 5.118243122114625e-06, "Pretrain/Loss": 2.0130984783172607, "Pretrain/Loss (Raw)": 2.059096336364746, "Pretrain/Step": 7619, "Pretrain/Step Time": 8.518445687368512} +{"Pretrain/Learning Rate": 5.113097240155576e-06, "Pretrain/Loss": 2.011842727661133, "Pretrain/Loss (Raw)": 1.8992958068847656, "Pretrain/Step": 7620, "Pretrain/Step Time": 8.525975175201893} +{"Pretrain/Learning Rate": 5.107953651647862e-06, "Pretrain/Loss": 2.010857582092285, "Pretrain/Loss (Raw)": 1.9265986680984497, "Pretrain/Step": 7621, "Pretrain/Step Time": 8.533250829204917} +{"Pretrain/Learning Rate": 5.10281235718467e-06, "Pretrain/Loss": 2.010871410369873, "Pretrain/Loss (Raw)": 1.9721112251281738, "Pretrain/Step": 7622, "Pretrain/Step Time": 8.530257878825068} +{"Pretrain/Learning Rate": 5.097673357358907e-06, "Pretrain/Loss": 2.0120625495910645, "Pretrain/Loss (Raw)": 2.0086405277252197, "Pretrain/Step": 7623, "Pretrain/Step Time": 8.526810564100742} +{"Pretrain/Learning Rate": 5.092536652763241e-06, "Pretrain/Loss": 2.011838436126709, "Pretrain/Loss (Raw)": 1.9594321250915527, "Pretrain/Step": 7624, "Pretrain/Step Time": 8.519235670566559} +{"Pretrain/Learning Rate": 5.087402243990056e-06, "Pretrain/Loss": 2.0133321285247803, "Pretrain/Loss (Raw)": 1.8630073070526123, "Pretrain/Step": 7625, "Pretrain/Step Time": 8.523139744997025} +{"Pretrain/Learning Rate": 5.0822701316314755e-06, "Pretrain/Loss": 2.0115580558776855, "Pretrain/Loss (Raw)": 1.911050796508789, "Pretrain/Step": 7626, "Pretrain/Step Time": 8.526733359321952} +{"Pretrain/Learning Rate": 5.0771403162793525e-06, "Pretrain/Loss": 2.009676218032837, "Pretrain/Loss (Raw)": 1.9263347387313843, "Pretrain/Step": 7627, "Pretrain/Step Time": 8.527128271758556} +{"Pretrain/Learning Rate": 5.072012798525294e-06, "Pretrain/Loss": 2.0096628665924072, "Pretrain/Loss (Raw)": 2.045048952102661, "Pretrain/Step": 7628, "Pretrain/Step Time": 8.521104419603944} +{"Pretrain/Learning Rate": 5.0668875789606245e-06, "Pretrain/Loss": 2.0109219551086426, "Pretrain/Loss (Raw)": 1.8095091581344604, "Pretrain/Step": 7629, "Pretrain/Step Time": 8.519942604005337} +{"Pretrain/Learning Rate": 5.061764658176407e-06, "Pretrain/Loss": 2.0127477645874023, "Pretrain/Loss (Raw)": 2.190772771835327, "Pretrain/Step": 7630, "Pretrain/Step Time": 8.514833327382803} +{"Pretrain/Learning Rate": 5.056644036763433e-06, "Pretrain/Loss": 2.0129847526550293, "Pretrain/Loss (Raw)": 2.067676305770874, "Pretrain/Step": 7631, "Pretrain/Step Time": 8.523967944085598} +{"Pretrain/Learning Rate": 5.051525715312253e-06, "Pretrain/Loss": 2.012199640274048, "Pretrain/Loss (Raw)": 1.9673768281936646, "Pretrain/Step": 7632, "Pretrain/Step Time": 8.526938430964947} +{"Pretrain/Learning Rate": 5.046409694413129e-06, "Pretrain/Loss": 2.0146913528442383, "Pretrain/Loss (Raw)": 2.1498310565948486, "Pretrain/Step": 7633, "Pretrain/Step Time": 8.524663342162967} +{"Pretrain/Learning Rate": 5.04129597465606e-06, "Pretrain/Loss": 2.0145835876464844, "Pretrain/Loss (Raw)": 1.9658496379852295, "Pretrain/Step": 7634, "Pretrain/Step Time": 8.51780410297215} +{"Pretrain/Learning Rate": 5.0361845566307825e-06, "Pretrain/Loss": 2.0122783184051514, "Pretrain/Loss (Raw)": 1.7260661125183105, "Pretrain/Step": 7635, "Pretrain/Step Time": 8.513051740825176} +{"Pretrain/Learning Rate": 5.0310754409267886e-06, "Pretrain/Loss": 2.0112967491149902, "Pretrain/Loss (Raw)": 1.9410645961761475, "Pretrain/Step": 7636, "Pretrain/Step Time": 8.508491568267345} +{"Pretrain/Learning Rate": 5.025968628133259e-06, "Pretrain/Loss": 2.0140180587768555, "Pretrain/Loss (Raw)": 2.145402669906616, "Pretrain/Step": 7637, "Pretrain/Step Time": 8.513979153707623} +{"Pretrain/Learning Rate": 5.020864118839152e-06, "Pretrain/Loss": 2.0114922523498535, "Pretrain/Loss (Raw)": 1.8494354486465454, "Pretrain/Step": 7638, "Pretrain/Step Time": 8.51510870270431} +{"Pretrain/Learning Rate": 5.015761913633135e-06, "Pretrain/Loss": 2.010164976119995, "Pretrain/Loss (Raw)": 2.0077035427093506, "Pretrain/Step": 7639, "Pretrain/Step Time": 8.513274628669024} +{"Pretrain/Learning Rate": 5.010662013103637e-06, "Pretrain/Loss": 2.009127616882324, "Pretrain/Loss (Raw)": 1.9773186445236206, "Pretrain/Step": 7640, "Pretrain/Step Time": 8.507791448384523} +{"Pretrain/Learning Rate": 5.0055644178387735e-06, "Pretrain/Loss": 2.008288860321045, "Pretrain/Loss (Raw)": 1.9610835313796997, "Pretrain/Step": 7641, "Pretrain/Step Time": 8.503079514950514} +{"Pretrain/Learning Rate": 5.0004691284264435e-06, "Pretrain/Loss": 2.007174015045166, "Pretrain/Loss (Raw)": 2.067983388900757, "Pretrain/Step": 7642, "Pretrain/Step Time": 8.514502642676234} +{"Pretrain/Learning Rate": 4.99537614545425e-06, "Pretrain/Loss": 2.0083987712860107, "Pretrain/Loss (Raw)": 2.1815412044525146, "Pretrain/Step": 7643, "Pretrain/Step Time": 8.511312136426568} +{"Pretrain/Learning Rate": 4.990285469509559e-06, "Pretrain/Loss": 2.007099151611328, "Pretrain/Loss (Raw)": 1.8273636102676392, "Pretrain/Step": 7644, "Pretrain/Step Time": 8.512049650773406} +{"Pretrain/Learning Rate": 4.98519710117942e-06, "Pretrain/Loss": 2.006974458694458, "Pretrain/Loss (Raw)": 1.9587242603302002, "Pretrain/Step": 7645, "Pretrain/Step Time": 8.50983482785523} +{"Pretrain/Learning Rate": 4.980111041050667e-06, "Pretrain/Loss": 2.0056262016296387, "Pretrain/Loss (Raw)": 1.7658445835113525, "Pretrain/Step": 7646, "Pretrain/Step Time": 8.500212371349335} +{"Pretrain/Learning Rate": 4.975027289709855e-06, "Pretrain/Loss": 2.0045852661132812, "Pretrain/Loss (Raw)": 2.1233766078948975, "Pretrain/Step": 7647, "Pretrain/Step Time": 8.504722313955426} +{"Pretrain/Learning Rate": 4.969945847743246e-06, "Pretrain/Loss": 2.006899833679199, "Pretrain/Loss (Raw)": 2.03885817527771, "Pretrain/Step": 7648, "Pretrain/Step Time": 8.509604599326849} +{"Pretrain/Learning Rate": 4.964866715736874e-06, "Pretrain/Loss": 2.0084803104400635, "Pretrain/Loss (Raw)": 2.1324048042297363, "Pretrain/Step": 7649, "Pretrain/Step Time": 8.514103440567851} +{"Pretrain/Learning Rate": 4.959789894276473e-06, "Pretrain/Loss": 2.0081255435943604, "Pretrain/Loss (Raw)": 2.021123170852661, "Pretrain/Step": 7650, "Pretrain/Step Time": 8.5115972943604} +{"Pretrain/Learning Rate": 4.9547153839475476e-06, "Pretrain/Loss": 2.007922649383545, "Pretrain/Loss (Raw)": 1.952274203300476, "Pretrain/Step": 7651, "Pretrain/Step Time": 8.504943553358316} +{"Pretrain/Learning Rate": 4.949643185335287e-06, "Pretrain/Loss": 2.008173942565918, "Pretrain/Loss (Raw)": 2.0959620475769043, "Pretrain/Step": 7652, "Pretrain/Step Time": 8.490326063707471} +{"Pretrain/Learning Rate": 4.944573299024663e-06, "Pretrain/Loss": 2.0066323280334473, "Pretrain/Loss (Raw)": 1.7616996765136719, "Pretrain/Step": 7653, "Pretrain/Step Time": 8.496807070448995} +{"Pretrain/Learning Rate": 4.939505725600341e-06, "Pretrain/Loss": 2.0051651000976562, "Pretrain/Loss (Raw)": 2.0109403133392334, "Pretrain/Step": 7654, "Pretrain/Step Time": 8.504945473745465} +{"Pretrain/Learning Rate": 4.934440465646762e-06, "Pretrain/Loss": 2.0066781044006348, "Pretrain/Loss (Raw)": 2.0352094173431396, "Pretrain/Step": 7655, "Pretrain/Step Time": 8.498952081426978} +{"Pretrain/Learning Rate": 4.929377519748046e-06, "Pretrain/Loss": 2.004304885864258, "Pretrain/Loss (Raw)": 2.0918264389038086, "Pretrain/Step": 7656, "Pretrain/Step Time": 8.502331513911486} +{"Pretrain/Learning Rate": 4.924316888488098e-06, "Pretrain/Loss": 2.003980875015259, "Pretrain/Loss (Raw)": 2.077780246734619, "Pretrain/Step": 7657, "Pretrain/Step Time": 8.501525141298771} +{"Pretrain/Learning Rate": 4.919258572450527e-06, "Pretrain/Loss": 2.0046744346618652, "Pretrain/Loss (Raw)": 2.116391181945801, "Pretrain/Step": 7658, "Pretrain/Step Time": 8.49540819786489} +{"Pretrain/Learning Rate": 4.914202572218679e-06, "Pretrain/Loss": 2.007004737854004, "Pretrain/Loss (Raw)": 1.9862428903579712, "Pretrain/Step": 7659, "Pretrain/Step Time": 8.49772322922945} +{"Pretrain/Learning Rate": 4.909148888375631e-06, "Pretrain/Loss": 2.0075364112854004, "Pretrain/Loss (Raw)": 2.242758274078369, "Pretrain/Step": 7660, "Pretrain/Step Time": 8.501789392903447} +{"Pretrain/Learning Rate": 4.904097521504214e-06, "Pretrain/Loss": 2.0065603256225586, "Pretrain/Loss (Raw)": 1.83535897731781, "Pretrain/Step": 7661, "Pretrain/Step Time": 8.504576353356242} +{"Pretrain/Learning Rate": 4.899048472186962e-06, "Pretrain/Loss": 2.0028703212738037, "Pretrain/Loss (Raw)": 1.6211519241333008, "Pretrain/Step": 7662, "Pretrain/Step Time": 8.50871174968779} +{"Pretrain/Learning Rate": 4.8940017410061625e-06, "Pretrain/Loss": 2.001880168914795, "Pretrain/Loss (Raw)": 1.9907323122024536, "Pretrain/Step": 7663, "Pretrain/Step Time": 8.500673942267895} +{"Pretrain/Learning Rate": 4.888957328543817e-06, "Pretrain/Loss": 2.001164197921753, "Pretrain/Loss (Raw)": 2.0380067825317383, "Pretrain/Step": 7664, "Pretrain/Step Time": 8.49521428719163} +{"Pretrain/Learning Rate": 4.8839152353816835e-06, "Pretrain/Loss": 2.005819320678711, "Pretrain/Loss (Raw)": 2.587782144546509, "Pretrain/Step": 7665, "Pretrain/Step Time": 8.494503647089005} +{"Pretrain/Learning Rate": 4.8788754621012375e-06, "Pretrain/Loss": 2.005919933319092, "Pretrain/Loss (Raw)": 2.0533649921417236, "Pretrain/Step": 7666, "Pretrain/Step Time": 8.501676890999079} +{"Pretrain/Learning Rate": 4.873838009283685e-06, "Pretrain/Loss": 2.0049734115600586, "Pretrain/Loss (Raw)": 2.0397531986236572, "Pretrain/Step": 7667, "Pretrain/Step Time": 8.503637310117483} +{"Pretrain/Learning Rate": 4.868802877509965e-06, "Pretrain/Loss": 2.0059757232666016, "Pretrain/Loss (Raw)": 2.2094171047210693, "Pretrain/Step": 7668, "Pretrain/Step Time": 8.508213302120566} +{"Pretrain/Learning Rate": 4.863770067360765e-06, "Pretrain/Loss": 2.004439115524292, "Pretrain/Loss (Raw)": 2.0022754669189453, "Pretrain/Step": 7669, "Pretrain/Step Time": 8.498828554525971} +{"Pretrain/Learning Rate": 4.858739579416488e-06, "Pretrain/Loss": 2.005825996398926, "Pretrain/Loss (Raw)": 2.1785287857055664, "Pretrain/Step": 7670, "Pretrain/Step Time": 8.493839468806982} +{"Pretrain/Learning Rate": 4.85371141425727e-06, "Pretrain/Loss": 2.004997968673706, "Pretrain/Loss (Raw)": 1.8767589330673218, "Pretrain/Step": 7671, "Pretrain/Step Time": 8.495641643181443} +{"Pretrain/Learning Rate": 4.848685572462977e-06, "Pretrain/Loss": 2.005404233932495, "Pretrain/Loss (Raw)": 2.0656368732452393, "Pretrain/Step": 7672, "Pretrain/Step Time": 8.499387403950095} +{"Pretrain/Learning Rate": 4.843662054613227e-06, "Pretrain/Loss": 2.004218578338623, "Pretrain/Loss (Raw)": 1.8588550090789795, "Pretrain/Step": 7673, "Pretrain/Step Time": 8.508238455280662} +{"Pretrain/Learning Rate": 4.838640861287347e-06, "Pretrain/Loss": 2.006120443344116, "Pretrain/Loss (Raw)": 2.2869462966918945, "Pretrain/Step": 7674, "Pretrain/Step Time": 8.507498946040869} +{"Pretrain/Learning Rate": 4.833621993064408e-06, "Pretrain/Loss": 2.0060949325561523, "Pretrain/Loss (Raw)": 1.974419355392456, "Pretrain/Step": 7675, "Pretrain/Step Time": 8.500467773526907} +{"Pretrain/Learning Rate": 4.8286054505231994e-06, "Pretrain/Loss": 2.0055084228515625, "Pretrain/Loss (Raw)": 1.9764633178710938, "Pretrain/Step": 7676, "Pretrain/Step Time": 8.499756874516606} +{"Pretrain/Learning Rate": 4.823591234242269e-06, "Pretrain/Loss": 2.003693103790283, "Pretrain/Loss (Raw)": 1.9985406398773193, "Pretrain/Step": 7677, "Pretrain/Step Time": 8.50305100902915} +{"Pretrain/Learning Rate": 4.818579344799873e-06, "Pretrain/Loss": 2.004323720932007, "Pretrain/Loss (Raw)": 2.0220537185668945, "Pretrain/Step": 7678, "Pretrain/Step Time": 8.51117398403585} +{"Pretrain/Learning Rate": 4.813569782774005e-06, "Pretrain/Loss": 2.0050032138824463, "Pretrain/Loss (Raw)": 2.1402182579040527, "Pretrain/Step": 7679, "Pretrain/Step Time": 8.514177404344082} +{"Pretrain/Learning Rate": 4.808562548742382e-06, "Pretrain/Loss": 2.0046417713165283, "Pretrain/Loss (Raw)": 2.0926871299743652, "Pretrain/Step": 7680, "Pretrain/Step Time": 8.511255932971835} +{"Pretrain/Learning Rate": 4.803557643282486e-06, "Pretrain/Loss": 2.0040574073791504, "Pretrain/Loss (Raw)": 1.9833039045333862, "Pretrain/Step": 7681, "Pretrain/Step Time": 8.511052491143346} +{"Pretrain/Learning Rate": 4.798555066971478e-06, "Pretrain/Loss": 2.005404233932495, "Pretrain/Loss (Raw)": 2.0525665283203125, "Pretrain/Step": 7682, "Pretrain/Step Time": 8.506081342697144} +{"Pretrain/Learning Rate": 4.793554820386298e-06, "Pretrain/Loss": 2.0066747665405273, "Pretrain/Loss (Raw)": 2.1590874195098877, "Pretrain/Step": 7683, "Pretrain/Step Time": 8.504447557032108} +{"Pretrain/Learning Rate": 4.788556904103586e-06, "Pretrain/Loss": 2.007582187652588, "Pretrain/Loss (Raw)": 1.802098274230957, "Pretrain/Step": 7684, "Pretrain/Step Time": 8.507593167945743} +{"Pretrain/Learning Rate": 4.783561318699745e-06, "Pretrain/Loss": 2.006610870361328, "Pretrain/Loss (Raw)": 1.9300287961959839, "Pretrain/Step": 7685, "Pretrain/Step Time": 8.515983384102583} +{"Pretrain/Learning Rate": 4.778568064750863e-06, "Pretrain/Loss": 2.006866931915283, "Pretrain/Loss (Raw)": 2.034252643585205, "Pretrain/Step": 7686, "Pretrain/Step Time": 8.518093867227435} +{"Pretrain/Learning Rate": 4.773577142832797e-06, "Pretrain/Loss": 2.0074052810668945, "Pretrain/Loss (Raw)": 2.1139559745788574, "Pretrain/Step": 7687, "Pretrain/Step Time": 8.505347143858671} +{"Pretrain/Learning Rate": 4.768588553521136e-06, "Pretrain/Loss": 2.006180763244629, "Pretrain/Loss (Raw)": 1.9832454919815063, "Pretrain/Step": 7688, "Pretrain/Step Time": 8.50423738732934} +{"Pretrain/Learning Rate": 4.763602297391167e-06, "Pretrain/Loss": 2.0028233528137207, "Pretrain/Loss (Raw)": 1.6063451766967773, "Pretrain/Step": 7689, "Pretrain/Step Time": 8.509326748549938} +{"Pretrain/Learning Rate": 4.758618375017943e-06, "Pretrain/Loss": 2.0052883625030518, "Pretrain/Loss (Raw)": 2.085073232650757, "Pretrain/Step": 7690, "Pretrain/Step Time": 8.513561991974711} +{"Pretrain/Learning Rate": 4.753636786976223e-06, "Pretrain/Loss": 1.9999513626098633, "Pretrain/Loss (Raw)": 1.9986903667449951, "Pretrain/Step": 7691, "Pretrain/Step Time": 8.51730653271079} +{"Pretrain/Learning Rate": 4.748657533840525e-06, "Pretrain/Loss": 2.0009474754333496, "Pretrain/Loss (Raw)": 2.154104471206665, "Pretrain/Step": 7692, "Pretrain/Step Time": 8.516429087147117} +{"Pretrain/Learning Rate": 4.743680616185053e-06, "Pretrain/Loss": 2.001718521118164, "Pretrain/Loss (Raw)": 1.9899747371673584, "Pretrain/Step": 7693, "Pretrain/Step Time": 8.511071886867285} +{"Pretrain/Learning Rate": 4.738706034583793e-06, "Pretrain/Loss": 2.001249074935913, "Pretrain/Loss (Raw)": 1.993681788444519, "Pretrain/Step": 7694, "Pretrain/Step Time": 8.523746471852064} +{"Pretrain/Learning Rate": 4.73373378961042e-06, "Pretrain/Loss": 2.000713586807251, "Pretrain/Loss (Raw)": 2.053382158279419, "Pretrain/Step": 7695, "Pretrain/Step Time": 8.522135401144624} +{"Pretrain/Learning Rate": 4.728763881838375e-06, "Pretrain/Loss": 2.0017359256744385, "Pretrain/Loss (Raw)": 2.0689964294433594, "Pretrain/Step": 7696, "Pretrain/Step Time": 8.529240239411592} +{"Pretrain/Learning Rate": 4.723796311840789e-06, "Pretrain/Loss": 2.0019328594207764, "Pretrain/Loss (Raw)": 2.1294915676116943, "Pretrain/Step": 7697, "Pretrain/Step Time": 8.531408494338393} +{"Pretrain/Learning Rate": 4.7188310801905635e-06, "Pretrain/Loss": 2.000856637954712, "Pretrain/Loss (Raw)": 2.0660512447357178, "Pretrain/Step": 7698, "Pretrain/Step Time": 8.53810779005289} +{"Pretrain/Learning Rate": 4.713868187460307e-06, "Pretrain/Loss": 2.0012292861938477, "Pretrain/Loss (Raw)": 2.0159590244293213, "Pretrain/Step": 7699, "Pretrain/Step Time": 8.529065001755953} +{"Pretrain/Learning Rate": 4.708907634222359e-06, "Pretrain/Loss": 2.002631187438965, "Pretrain/Loss (Raw)": 2.1300766468048096, "Pretrain/Step": 7700, "Pretrain/Step Time": 8.52988083846867} +{"Pretrain/Learning Rate": 4.703949421048795e-06, "Pretrain/Loss": 2.0054125785827637, "Pretrain/Loss (Raw)": 2.159010887145996, "Pretrain/Step": 7701, "Pretrain/Step Time": 8.524741349741817} +{"Pretrain/Learning Rate": 4.698993548511427e-06, "Pretrain/Loss": 2.005434513092041, "Pretrain/Loss (Raw)": 2.1993801593780518, "Pretrain/Step": 7702, "Pretrain/Step Time": 8.535295637324452} +{"Pretrain/Learning Rate": 4.6940400171817835e-06, "Pretrain/Loss": 2.005375862121582, "Pretrain/Loss (Raw)": 2.165672540664673, "Pretrain/Step": 7703, "Pretrain/Step Time": 8.532741786912084} +{"Pretrain/Learning Rate": 4.68908882763113e-06, "Pretrain/Loss": 2.00539493560791, "Pretrain/Loss (Raw)": 1.956107258796692, "Pretrain/Step": 7704, "Pretrain/Step Time": 8.53173398412764} +{"Pretrain/Learning Rate": 4.684139980430455e-06, "Pretrain/Loss": 2.006798267364502, "Pretrain/Loss (Raw)": 2.1312601566314697, "Pretrain/Step": 7705, "Pretrain/Step Time": 8.525258082896471} +{"Pretrain/Learning Rate": 4.679193476150495e-06, "Pretrain/Loss": 2.007479667663574, "Pretrain/Loss (Raw)": 2.1199519634246826, "Pretrain/Step": 7706, "Pretrain/Step Time": 8.523365525528789} +{"Pretrain/Learning Rate": 4.674249315361698e-06, "Pretrain/Loss": 2.0075581073760986, "Pretrain/Loss (Raw)": 2.073364734649658, "Pretrain/Step": 7707, "Pretrain/Step Time": 8.524103488773108} +{"Pretrain/Learning Rate": 4.669307498634251e-06, "Pretrain/Loss": 2.0092148780822754, "Pretrain/Loss (Raw)": 2.057424306869507, "Pretrain/Step": 7708, "Pretrain/Step Time": 8.534168360754848} +{"Pretrain/Learning Rate": 4.664368026538054e-06, "Pretrain/Loss": 2.01009464263916, "Pretrain/Loss (Raw)": 2.0419700145721436, "Pretrain/Step": 7709, "Pretrain/Step Time": 8.537362296134233} +{"Pretrain/Learning Rate": 4.6594308996427694e-06, "Pretrain/Loss": 2.012429714202881, "Pretrain/Loss (Raw)": 2.143542528152466, "Pretrain/Step": 7710, "Pretrain/Step Time": 8.536641385406256} +{"Pretrain/Learning Rate": 4.654496118517762e-06, "Pretrain/Loss": 2.0086824893951416, "Pretrain/Loss (Raw)": 1.700524926185608, "Pretrain/Step": 7711, "Pretrain/Step Time": 8.528001300990582} +{"Pretrain/Learning Rate": 4.64956368373213e-06, "Pretrain/Loss": 2.0100789070129395, "Pretrain/Loss (Raw)": 1.9800481796264648, "Pretrain/Step": 7712, "Pretrain/Step Time": 8.532690107822418} +{"Pretrain/Learning Rate": 4.644633595854706e-06, "Pretrain/Loss": 2.0116944313049316, "Pretrain/Loss (Raw)": 2.0498039722442627, "Pretrain/Step": 7713, "Pretrain/Step Time": 8.527415584772825} +{"Pretrain/Learning Rate": 4.6397058554540575e-06, "Pretrain/Loss": 2.0111987590789795, "Pretrain/Loss (Raw)": 1.9312772750854492, "Pretrain/Step": 7714, "Pretrain/Step Time": 8.532054796814919} +{"Pretrain/Learning Rate": 4.6347804630984735e-06, "Pretrain/Loss": 2.0116748809814453, "Pretrain/Loss (Raw)": 1.9278391599655151, "Pretrain/Step": 7715, "Pretrain/Step Time": 8.538970461115241} +{"Pretrain/Learning Rate": 4.629857419355968e-06, "Pretrain/Loss": 2.0118184089660645, "Pretrain/Loss (Raw)": 1.9012675285339355, "Pretrain/Step": 7716, "Pretrain/Step Time": 8.540233423933387} +{"Pretrain/Learning Rate": 4.624936724794285e-06, "Pretrain/Loss": 2.0100340843200684, "Pretrain/Loss (Raw)": 1.9857807159423828, "Pretrain/Step": 7717, "Pretrain/Step Time": 8.538480091840029} +{"Pretrain/Learning Rate": 4.620018379980917e-06, "Pretrain/Loss": 2.0146377086639404, "Pretrain/Loss (Raw)": 2.226597547531128, "Pretrain/Step": 7718, "Pretrain/Step Time": 8.52197784371674} +{"Pretrain/Learning Rate": 4.6151023854830635e-06, "Pretrain/Loss": 2.012502431869507, "Pretrain/Loss (Raw)": 1.6587649583816528, "Pretrain/Step": 7719, "Pretrain/Step Time": 8.526221886277199} +{"Pretrain/Learning Rate": 4.610188741867657e-06, "Pretrain/Loss": 2.014029026031494, "Pretrain/Loss (Raw)": 2.061267137527466, "Pretrain/Step": 7720, "Pretrain/Step Time": 8.532239640131593} +{"Pretrain/Learning Rate": 4.6052774497013615e-06, "Pretrain/Loss": 2.011692762374878, "Pretrain/Loss (Raw)": 1.8744386434555054, "Pretrain/Step": 7721, "Pretrain/Step Time": 8.536605961620808} +{"Pretrain/Learning Rate": 4.600368509550584e-06, "Pretrain/Loss": 2.0095088481903076, "Pretrain/Loss (Raw)": 1.835816740989685, "Pretrain/Step": 7722, "Pretrain/Step Time": 8.540064366534352} +{"Pretrain/Learning Rate": 4.5954619219814254e-06, "Pretrain/Loss": 2.01356840133667, "Pretrain/Loss (Raw)": 2.3917980194091797, "Pretrain/Step": 7723, "Pretrain/Step Time": 8.533094672486186} +{"Pretrain/Learning Rate": 4.590557687559754e-06, "Pretrain/Loss": 2.010709762573242, "Pretrain/Loss (Raw)": 1.7830688953399658, "Pretrain/Step": 7724, "Pretrain/Step Time": 8.530292429029942} +{"Pretrain/Learning Rate": 4.585655806851136e-06, "Pretrain/Loss": 2.0087099075317383, "Pretrain/Loss (Raw)": 1.8481011390686035, "Pretrain/Step": 7725, "Pretrain/Step Time": 8.530394338071346} +{"Pretrain/Learning Rate": 4.5807562804208975e-06, "Pretrain/Loss": 2.0073513984680176, "Pretrain/Loss (Raw)": 1.8672831058502197, "Pretrain/Step": 7726, "Pretrain/Step Time": 8.526543417945504} +{"Pretrain/Learning Rate": 4.575859108834049e-06, "Pretrain/Loss": 2.0091097354888916, "Pretrain/Loss (Raw)": 1.9672402143478394, "Pretrain/Step": 7727, "Pretrain/Step Time": 8.528867967426777} +{"Pretrain/Learning Rate": 4.570964292655372e-06, "Pretrain/Loss": 2.0082902908325195, "Pretrain/Loss (Raw)": 1.9559682607650757, "Pretrain/Step": 7728, "Pretrain/Step Time": 8.529216354712844} +{"Pretrain/Learning Rate": 4.56607183244937e-06, "Pretrain/Loss": 2.0096094608306885, "Pretrain/Loss (Raw)": 2.0534393787384033, "Pretrain/Step": 7729, "Pretrain/Step Time": 8.519765101373196} +{"Pretrain/Learning Rate": 4.56118172878024e-06, "Pretrain/Loss": 2.009911298751831, "Pretrain/Loss (Raw)": 2.102816104888916, "Pretrain/Step": 7730, "Pretrain/Step Time": 8.528111593797803} +{"Pretrain/Learning Rate": 4.556293982211951e-06, "Pretrain/Loss": 2.0104446411132812, "Pretrain/Loss (Raw)": 2.105680227279663, "Pretrain/Step": 7731, "Pretrain/Step Time": 8.5289556812495} +{"Pretrain/Learning Rate": 4.551408593308165e-06, "Pretrain/Loss": 2.011112689971924, "Pretrain/Loss (Raw)": 2.0603091716766357, "Pretrain/Step": 7732, "Pretrain/Step Time": 8.529991718009114} +{"Pretrain/Learning Rate": 4.5465255626323116e-06, "Pretrain/Loss": 2.0125041007995605, "Pretrain/Loss (Raw)": 2.044316530227661, "Pretrain/Step": 7733, "Pretrain/Step Time": 8.526686558499932} +{"Pretrain/Learning Rate": 4.541644890747495e-06, "Pretrain/Loss": 2.0114166736602783, "Pretrain/Loss (Raw)": 2.315253496170044, "Pretrain/Step": 7734, "Pretrain/Step Time": 8.52498191036284} +{"Pretrain/Learning Rate": 4.536766578216603e-06, "Pretrain/Loss": 2.0123181343078613, "Pretrain/Loss (Raw)": 2.050473690032959, "Pretrain/Step": 7735, "Pretrain/Step Time": 8.522120397537947} +{"Pretrain/Learning Rate": 4.531890625602206e-06, "Pretrain/Loss": 2.0119142532348633, "Pretrain/Loss (Raw)": 1.9861023426055908, "Pretrain/Step": 7736, "Pretrain/Step Time": 8.526635067537427} +{"Pretrain/Learning Rate": 4.5270170334666435e-06, "Pretrain/Loss": 2.0106730461120605, "Pretrain/Loss (Raw)": 1.9341216087341309, "Pretrain/Step": 7737, "Pretrain/Step Time": 8.529673272743821} +{"Pretrain/Learning Rate": 4.522145802371936e-06, "Pretrain/Loss": 2.009880304336548, "Pretrain/Loss (Raw)": 1.9711151123046875, "Pretrain/Step": 7738, "Pretrain/Step Time": 8.533729244023561} +{"Pretrain/Learning Rate": 4.517276932879877e-06, "Pretrain/Loss": 2.0097529888153076, "Pretrain/Loss (Raw)": 1.9296610355377197, "Pretrain/Step": 7739, "Pretrain/Step Time": 8.530303439125419} +{"Pretrain/Learning Rate": 4.512410425551958e-06, "Pretrain/Loss": 2.0098912715911865, "Pretrain/Loss (Raw)": 2.104447841644287, "Pretrain/Step": 7740, "Pretrain/Step Time": 8.533517075702548} +{"Pretrain/Learning Rate": 4.507546280949413e-06, "Pretrain/Loss": 2.012894630432129, "Pretrain/Loss (Raw)": 2.1134254932403564, "Pretrain/Step": 7741, "Pretrain/Step Time": 8.520964765921235} +{"Pretrain/Learning Rate": 4.502684499633183e-06, "Pretrain/Loss": 2.016444683074951, "Pretrain/Loss (Raw)": 2.0226638317108154, "Pretrain/Step": 7742, "Pretrain/Step Time": 8.524543004110456} +{"Pretrain/Learning Rate": 4.4978250821639725e-06, "Pretrain/Loss": 2.010298252105713, "Pretrain/Loss (Raw)": 1.6630111932754517, "Pretrain/Step": 7743, "Pretrain/Step Time": 8.525723090395331} +{"Pretrain/Learning Rate": 4.492968029102182e-06, "Pretrain/Loss": 2.0098791122436523, "Pretrain/Loss (Raw)": 2.078841209411621, "Pretrain/Step": 7744, "Pretrain/Step Time": 8.525684740394354} +{"Pretrain/Learning Rate": 4.488113341007951e-06, "Pretrain/Loss": 2.008845329284668, "Pretrain/Loss (Raw)": 1.73874032497406, "Pretrain/Step": 7745, "Pretrain/Step Time": 8.527164006605744} +{"Pretrain/Learning Rate": 4.48326101844114e-06, "Pretrain/Loss": 2.006650924682617, "Pretrain/Loss (Raw)": 1.5649832487106323, "Pretrain/Step": 7746, "Pretrain/Step Time": 8.524382542818785} +{"Pretrain/Learning Rate": 4.4784110619613514e-06, "Pretrain/Loss": 2.0078225135803223, "Pretrain/Loss (Raw)": 2.2090697288513184, "Pretrain/Step": 7747, "Pretrain/Step Time": 8.52562895976007} +{"Pretrain/Learning Rate": 4.473563472127898e-06, "Pretrain/Loss": 2.0098767280578613, "Pretrain/Loss (Raw)": 2.1622400283813477, "Pretrain/Step": 7748, "Pretrain/Step Time": 8.51786814071238} +{"Pretrain/Learning Rate": 4.468718249499831e-06, "Pretrain/Loss": 2.010375499725342, "Pretrain/Loss (Raw)": 1.9904600381851196, "Pretrain/Step": 7749, "Pretrain/Step Time": 8.515666048973799} +{"Pretrain/Learning Rate": 4.463875394635916e-06, "Pretrain/Loss": 2.0136334896087646, "Pretrain/Loss (Raw)": 2.3891196250915527, "Pretrain/Step": 7750, "Pretrain/Step Time": 8.523162985220551} +{"Pretrain/Learning Rate": 4.459034908094664e-06, "Pretrain/Loss": 2.0128486156463623, "Pretrain/Loss (Raw)": 1.9081648588180542, "Pretrain/Step": 7751, "Pretrain/Step Time": 8.52845723927021} +{"Pretrain/Learning Rate": 4.454196790434301e-06, "Pretrain/Loss": 2.012946844100952, "Pretrain/Loss (Raw)": 1.9720125198364258, "Pretrain/Step": 7752, "Pretrain/Step Time": 8.526534605771303} +{"Pretrain/Learning Rate": 4.44936104221278e-06, "Pretrain/Loss": 2.0137739181518555, "Pretrain/Loss (Raw)": 1.9688507318496704, "Pretrain/Step": 7753, "Pretrain/Step Time": 8.518432883545756} +{"Pretrain/Learning Rate": 4.444527663987771e-06, "Pretrain/Loss": 2.0154995918273926, "Pretrain/Loss (Raw)": 2.131948709487915, "Pretrain/Step": 7754, "Pretrain/Step Time": 8.520930252969265} +{"Pretrain/Learning Rate": 4.439696656316703e-06, "Pretrain/Loss": 2.016827344894409, "Pretrain/Loss (Raw)": 2.096273899078369, "Pretrain/Step": 7755, "Pretrain/Step Time": 8.52939566411078} +{"Pretrain/Learning Rate": 4.434868019756697e-06, "Pretrain/Loss": 2.0163145065307617, "Pretrain/Loss (Raw)": 1.979457974433899, "Pretrain/Step": 7756, "Pretrain/Step Time": 8.529120242223144} +{"Pretrain/Learning Rate": 4.430041754864617e-06, "Pretrain/Loss": 2.016451358795166, "Pretrain/Loss (Raw)": 1.826980471611023, "Pretrain/Step": 7757, "Pretrain/Step Time": 8.527257984504104} +{"Pretrain/Learning Rate": 4.4252178621970455e-06, "Pretrain/Loss": 2.0140645503997803, "Pretrain/Loss (Raw)": 1.8852591514587402, "Pretrain/Step": 7758, "Pretrain/Step Time": 8.528064157813787} +{"Pretrain/Learning Rate": 4.420396342310309e-06, "Pretrain/Loss": 2.0126452445983887, "Pretrain/Loss (Raw)": 1.8860105276107788, "Pretrain/Step": 7759, "Pretrain/Step Time": 8.521930281072855} +{"Pretrain/Learning Rate": 4.41557719576044e-06, "Pretrain/Loss": 2.0133211612701416, "Pretrain/Loss (Raw)": 2.0539066791534424, "Pretrain/Step": 7760, "Pretrain/Step Time": 8.519356681033969} +{"Pretrain/Learning Rate": 4.410760423103205e-06, "Pretrain/Loss": 2.0130114555358887, "Pretrain/Loss (Raw)": 2.1101901531219482, "Pretrain/Step": 7761, "Pretrain/Step Time": 8.52798905596137} +{"Pretrain/Learning Rate": 4.405946024894092e-06, "Pretrain/Loss": 2.0134615898132324, "Pretrain/Loss (Raw)": 2.0234622955322266, "Pretrain/Step": 7762, "Pretrain/Step Time": 8.52374085597694} +{"Pretrain/Learning Rate": 4.401134001688337e-06, "Pretrain/Loss": 2.016145706176758, "Pretrain/Loss (Raw)": 2.0696136951446533, "Pretrain/Step": 7763, "Pretrain/Step Time": 8.529031310230494} +{"Pretrain/Learning Rate": 4.396324354040862e-06, "Pretrain/Loss": 2.017505168914795, "Pretrain/Loss (Raw)": 2.115089178085327, "Pretrain/Step": 7764, "Pretrain/Step Time": 8.52696505561471} +{"Pretrain/Learning Rate": 4.391517082506358e-06, "Pretrain/Loss": 2.0202291011810303, "Pretrain/Loss (Raw)": 2.4940855503082275, "Pretrain/Step": 7765, "Pretrain/Step Time": 8.516115061938763} +{"Pretrain/Learning Rate": 4.386712187639205e-06, "Pretrain/Loss": 2.020752429962158, "Pretrain/Loss (Raw)": 1.9164021015167236, "Pretrain/Step": 7766, "Pretrain/Step Time": 8.517013400793076} +{"Pretrain/Learning Rate": 4.38190966999355e-06, "Pretrain/Loss": 2.0210914611816406, "Pretrain/Loss (Raw)": 2.0510966777801514, "Pretrain/Step": 7767, "Pretrain/Step Time": 8.519167374819517} +{"Pretrain/Learning Rate": 4.377109530123217e-06, "Pretrain/Loss": 2.0183286666870117, "Pretrain/Loss (Raw)": 1.6236969232559204, "Pretrain/Step": 7768, "Pretrain/Step Time": 8.52353416197002} +{"Pretrain/Learning Rate": 4.372311768581794e-06, "Pretrain/Loss": 2.0200705528259277, "Pretrain/Loss (Raw)": 2.184065580368042, "Pretrain/Step": 7769, "Pretrain/Step Time": 8.525101438164711} +{"Pretrain/Learning Rate": 4.367516385922574e-06, "Pretrain/Loss": 2.0181212425231934, "Pretrain/Loss (Raw)": 1.8184638023376465, "Pretrain/Step": 7770, "Pretrain/Step Time": 8.520304899662733} +{"Pretrain/Learning Rate": 4.362723382698594e-06, "Pretrain/Loss": 2.0185279846191406, "Pretrain/Loss (Raw)": 2.2335870265960693, "Pretrain/Step": 7771, "Pretrain/Step Time": 8.522539546713233} +{"Pretrain/Learning Rate": 4.357932759462599e-06, "Pretrain/Loss": 2.0184555053710938, "Pretrain/Loss (Raw)": 1.818082332611084, "Pretrain/Step": 7772, "Pretrain/Step Time": 8.522728905081749} +{"Pretrain/Learning Rate": 4.35314451676706e-06, "Pretrain/Loss": 2.0186586380004883, "Pretrain/Loss (Raw)": 1.9847487211227417, "Pretrain/Step": 7773, "Pretrain/Step Time": 8.523843090981245} +{"Pretrain/Learning Rate": 4.348358655164203e-06, "Pretrain/Loss": 2.023608922958374, "Pretrain/Loss (Raw)": 2.399451494216919, "Pretrain/Step": 7774, "Pretrain/Step Time": 8.532667519524693} +{"Pretrain/Learning Rate": 4.343575175205922e-06, "Pretrain/Loss": 2.0235819816589355, "Pretrain/Loss (Raw)": 2.1199471950531006, "Pretrain/Step": 7775, "Pretrain/Step Time": 8.527264025062323} +{"Pretrain/Learning Rate": 4.338794077443897e-06, "Pretrain/Loss": 2.027564287185669, "Pretrain/Loss (Raw)": 2.5485992431640625, "Pretrain/Step": 7776, "Pretrain/Step Time": 8.523109085857868} +{"Pretrain/Learning Rate": 4.334015362429491e-06, "Pretrain/Loss": 2.027374267578125, "Pretrain/Loss (Raw)": 2.1080615520477295, "Pretrain/Step": 7777, "Pretrain/Step Time": 8.523077694699168} +{"Pretrain/Learning Rate": 4.329239030713827e-06, "Pretrain/Loss": 2.028406858444214, "Pretrain/Loss (Raw)": 2.1533050537109375, "Pretrain/Step": 7778, "Pretrain/Step Time": 8.523942461237311} +{"Pretrain/Learning Rate": 4.3244650828477114e-06, "Pretrain/Loss": 2.026785373687744, "Pretrain/Loss (Raw)": 1.7447339296340942, "Pretrain/Step": 7779, "Pretrain/Step Time": 8.526192504912615} +{"Pretrain/Learning Rate": 4.319693519381712e-06, "Pretrain/Loss": 2.0292558670043945, "Pretrain/Loss (Raw)": 2.412186861038208, "Pretrain/Step": 7780, "Pretrain/Step Time": 8.535065738484263} +{"Pretrain/Learning Rate": 4.314924340866105e-06, "Pretrain/Loss": 2.0297458171844482, "Pretrain/Loss (Raw)": 1.8243920803070068, "Pretrain/Step": 7781, "Pretrain/Step Time": 8.531962620094419} +{"Pretrain/Learning Rate": 4.310157547850896e-06, "Pretrain/Loss": 2.0288052558898926, "Pretrain/Loss (Raw)": 1.890537142753601, "Pretrain/Step": 7782, "Pretrain/Step Time": 8.527857581153512} +{"Pretrain/Learning Rate": 4.3053931408858055e-06, "Pretrain/Loss": 2.029388666152954, "Pretrain/Loss (Raw)": 2.1099133491516113, "Pretrain/Step": 7783, "Pretrain/Step Time": 8.52851552888751} +{"Pretrain/Learning Rate": 4.300631120520301e-06, "Pretrain/Loss": 2.0283212661743164, "Pretrain/Loss (Raw)": 1.9551947116851807, "Pretrain/Step": 7784, "Pretrain/Step Time": 8.52286747470498} +{"Pretrain/Learning Rate": 4.295871487303554e-06, "Pretrain/Loss": 2.028125762939453, "Pretrain/Loss (Raw)": 2.052738904953003, "Pretrain/Step": 7785, "Pretrain/Step Time": 8.530190415680408} +{"Pretrain/Learning Rate": 4.291114241784467e-06, "Pretrain/Loss": 2.0269198417663574, "Pretrain/Loss (Raw)": 1.962060570716858, "Pretrain/Step": 7786, "Pretrain/Step Time": 8.53172117099166} +{"Pretrain/Learning Rate": 4.286359384511662e-06, "Pretrain/Loss": 2.0279643535614014, "Pretrain/Loss (Raw)": 2.119922637939453, "Pretrain/Step": 7787, "Pretrain/Step Time": 8.538153743371367} +{"Pretrain/Learning Rate": 4.281606916033507e-06, "Pretrain/Loss": 2.025890350341797, "Pretrain/Loss (Raw)": 1.977312684059143, "Pretrain/Step": 7788, "Pretrain/Step Time": 8.538308354094625} +{"Pretrain/Learning Rate": 4.276856836898072e-06, "Pretrain/Loss": 2.0246357917785645, "Pretrain/Loss (Raw)": 1.6747666597366333, "Pretrain/Step": 7789, "Pretrain/Step Time": 8.537738487124443} +{"Pretrain/Learning Rate": 4.272109147653155e-06, "Pretrain/Loss": 2.026695728302002, "Pretrain/Loss (Raw)": 1.8847993612289429, "Pretrain/Step": 7790, "Pretrain/Step Time": 8.53779772669077} +{"Pretrain/Learning Rate": 4.267363848846278e-06, "Pretrain/Loss": 2.0269615650177, "Pretrain/Loss (Raw)": 2.0247747898101807, "Pretrain/Step": 7791, "Pretrain/Step Time": 8.538055013865232} +{"Pretrain/Learning Rate": 4.262620941024703e-06, "Pretrain/Loss": 2.025542974472046, "Pretrain/Loss (Raw)": 1.8564268350601196, "Pretrain/Step": 7792, "Pretrain/Step Time": 8.545784706249833} +{"Pretrain/Learning Rate": 4.2578804247353996e-06, "Pretrain/Loss": 2.0219478607177734, "Pretrain/Loss (Raw)": 2.127603769302368, "Pretrain/Step": 7793, "Pretrain/Step Time": 8.547381214797497} +{"Pretrain/Learning Rate": 4.253142300525068e-06, "Pretrain/Loss": 2.0229263305664062, "Pretrain/Loss (Raw)": 2.1786246299743652, "Pretrain/Step": 7794, "Pretrain/Step Time": 8.541294991970062} +{"Pretrain/Learning Rate": 4.248406568940119e-06, "Pretrain/Loss": 2.021901845932007, "Pretrain/Loss (Raw)": 1.9086037874221802, "Pretrain/Step": 7795, "Pretrain/Step Time": 8.542045000940561} +{"Pretrain/Learning Rate": 4.243673230526715e-06, "Pretrain/Loss": 2.021066427230835, "Pretrain/Loss (Raw)": 2.1024906635284424, "Pretrain/Step": 7796, "Pretrain/Step Time": 8.535916328430176} +{"Pretrain/Learning Rate": 4.238942285830724e-06, "Pretrain/Loss": 2.022554874420166, "Pretrain/Loss (Raw)": 2.1927802562713623, "Pretrain/Step": 7797, "Pretrain/Step Time": 8.540441675111651} +{"Pretrain/Learning Rate": 4.234213735397738e-06, "Pretrain/Loss": 2.0232701301574707, "Pretrain/Loss (Raw)": 2.270076274871826, "Pretrain/Step": 7798, "Pretrain/Step Time": 8.550596822053194} +{"Pretrain/Learning Rate": 4.229487579773067e-06, "Pretrain/Loss": 2.022965431213379, "Pretrain/Loss (Raw)": 1.8377885818481445, "Pretrain/Step": 7799, "Pretrain/Step Time": 8.548140680417418} +{"Pretrain/Learning Rate": 4.22476381950177e-06, "Pretrain/Loss": 2.0208845138549805, "Pretrain/Loss (Raw)": 1.7992744445800781, "Pretrain/Step": 7800, "Pretrain/Step Time": 8.54300000704825} +{"Pretrain/Learning Rate": 4.220042455128603e-06, "Pretrain/Loss": 2.023533582687378, "Pretrain/Loss (Raw)": 2.1979143619537354, "Pretrain/Step": 7801, "Pretrain/Step Time": 8.532324014231563} +{"Pretrain/Learning Rate": 4.215323487198061e-06, "Pretrain/Loss": 2.018491744995117, "Pretrain/Loss (Raw)": 1.6415966749191284, "Pretrain/Step": 7802, "Pretrain/Step Time": 8.528654046356678} +{"Pretrain/Learning Rate": 4.210606916254348e-06, "Pretrain/Loss": 2.026675224304199, "Pretrain/Loss (Raw)": 3.0218873023986816, "Pretrain/Step": 7803, "Pretrain/Step Time": 8.525568837299943} +{"Pretrain/Learning Rate": 4.205892742841422e-06, "Pretrain/Loss": 2.0265824794769287, "Pretrain/Loss (Raw)": 1.9646217823028564, "Pretrain/Step": 7804, "Pretrain/Step Time": 8.535739922896028} +{"Pretrain/Learning Rate": 4.2011809675029154e-06, "Pretrain/Loss": 2.0273072719573975, "Pretrain/Loss (Raw)": 2.091298818588257, "Pretrain/Step": 7805, "Pretrain/Step Time": 8.531847076490521} +{"Pretrain/Learning Rate": 4.196471590782236e-06, "Pretrain/Loss": 2.0272750854492188, "Pretrain/Loss (Raw)": 2.017958402633667, "Pretrain/Step": 7806, "Pretrain/Step Time": 8.526504784822464} +{"Pretrain/Learning Rate": 4.191764613222474e-06, "Pretrain/Loss": 2.025679111480713, "Pretrain/Loss (Raw)": 1.9359196424484253, "Pretrain/Step": 7807, "Pretrain/Step Time": 8.523934440687299} +{"Pretrain/Learning Rate": 4.18706003536648e-06, "Pretrain/Loss": 2.0255134105682373, "Pretrain/Loss (Raw)": 2.0714805126190186, "Pretrain/Step": 7808, "Pretrain/Step Time": 8.521565645933151} +{"Pretrain/Learning Rate": 4.182357857756786e-06, "Pretrain/Loss": 2.0266833305358887, "Pretrain/Loss (Raw)": 2.1330442428588867, "Pretrain/Step": 7809, "Pretrain/Step Time": 8.521786691620946} +{"Pretrain/Learning Rate": 4.1776580809356845e-06, "Pretrain/Loss": 2.026632308959961, "Pretrain/Loss (Raw)": 2.0460259914398193, "Pretrain/Step": 7810, "Pretrain/Step Time": 8.534602740779519} +{"Pretrain/Learning Rate": 4.172960705445164e-06, "Pretrain/Loss": 2.027717351913452, "Pretrain/Loss (Raw)": 2.297987461090088, "Pretrain/Step": 7811, "Pretrain/Step Time": 8.541538970544934} +{"Pretrain/Learning Rate": 4.168265731826965e-06, "Pretrain/Loss": 2.0267415046691895, "Pretrain/Loss (Raw)": 1.6771764755249023, "Pretrain/Step": 7812, "Pretrain/Step Time": 8.539852399379015} +{"Pretrain/Learning Rate": 4.163573160622522e-06, "Pretrain/Loss": 2.0276355743408203, "Pretrain/Loss (Raw)": 2.044466257095337, "Pretrain/Step": 7813, "Pretrain/Step Time": 8.532046044245362} +{"Pretrain/Learning Rate": 4.1588829923730005e-06, "Pretrain/Loss": 2.027038812637329, "Pretrain/Loss (Raw)": 1.957869529724121, "Pretrain/Step": 7814, "Pretrain/Step Time": 8.529167897999287} +{"Pretrain/Learning Rate": 4.1541952276193095e-06, "Pretrain/Loss": 2.0261142253875732, "Pretrain/Loss (Raw)": 1.99562406539917, "Pretrain/Step": 7815, "Pretrain/Step Time": 8.530687510967255} +{"Pretrain/Learning Rate": 4.149509866902043e-06, "Pretrain/Loss": 2.0262789726257324, "Pretrain/Loss (Raw)": 2.004312038421631, "Pretrain/Step": 7816, "Pretrain/Step Time": 8.544387781992555} +{"Pretrain/Learning Rate": 4.144826910761556e-06, "Pretrain/Loss": 2.029646873474121, "Pretrain/Loss (Raw)": 2.0374443531036377, "Pretrain/Step": 7817, "Pretrain/Step Time": 8.540558200329542} +{"Pretrain/Learning Rate": 4.140146359737895e-06, "Pretrain/Loss": 2.029574394226074, "Pretrain/Loss (Raw)": 2.0757896900177, "Pretrain/Step": 7818, "Pretrain/Step Time": 8.534939102828503} +{"Pretrain/Learning Rate": 4.135468214370864e-06, "Pretrain/Loss": 2.029153823852539, "Pretrain/Loss (Raw)": 1.9449033737182617, "Pretrain/Step": 7819, "Pretrain/Step Time": 8.526898885145783} +{"Pretrain/Learning Rate": 4.130792475199943e-06, "Pretrain/Loss": 2.026211738586426, "Pretrain/Loss (Raw)": 1.777470350265503, "Pretrain/Step": 7820, "Pretrain/Step Time": 8.52617339976132} +{"Pretrain/Learning Rate": 4.126119142764379e-06, "Pretrain/Loss": 2.0248823165893555, "Pretrain/Loss (Raw)": 1.8198107481002808, "Pretrain/Step": 7821, "Pretrain/Step Time": 8.526763448491693} +{"Pretrain/Learning Rate": 4.121448217603116e-06, "Pretrain/Loss": 2.0238125324249268, "Pretrain/Loss (Raw)": 1.856752872467041, "Pretrain/Step": 7822, "Pretrain/Step Time": 8.521157253533602} +{"Pretrain/Learning Rate": 4.116779700254828e-06, "Pretrain/Loss": 2.024171829223633, "Pretrain/Loss (Raw)": 2.0993685722351074, "Pretrain/Step": 7823, "Pretrain/Step Time": 8.526122694835067} +{"Pretrain/Learning Rate": 4.1121135912579044e-06, "Pretrain/Loss": 2.023346424102783, "Pretrain/Loss (Raw)": 1.963357925415039, "Pretrain/Step": 7824, "Pretrain/Step Time": 8.525222834199667} +{"Pretrain/Learning Rate": 4.1074498911504725e-06, "Pretrain/Loss": 2.0229995250701904, "Pretrain/Loss (Raw)": 2.0850882530212402, "Pretrain/Step": 7825, "Pretrain/Step Time": 8.520164577290416} +{"Pretrain/Learning Rate": 4.102788600470369e-06, "Pretrain/Loss": 2.0241241455078125, "Pretrain/Loss (Raw)": 2.210020065307617, "Pretrain/Step": 7826, "Pretrain/Step Time": 8.511878026649356} +{"Pretrain/Learning Rate": 4.098129719755156e-06, "Pretrain/Loss": 2.02411150932312, "Pretrain/Loss (Raw)": 2.014322280883789, "Pretrain/Step": 7827, "Pretrain/Step Time": 8.517846297472715} +{"Pretrain/Learning Rate": 4.093473249542109e-06, "Pretrain/Loss": 2.0239574909210205, "Pretrain/Loss (Raw)": 2.1103713512420654, "Pretrain/Step": 7828, "Pretrain/Step Time": 8.528297552838922} +{"Pretrain/Learning Rate": 4.0888191903682485e-06, "Pretrain/Loss": 2.0215020179748535, "Pretrain/Loss (Raw)": 1.8447009325027466, "Pretrain/Step": 7829, "Pretrain/Step Time": 8.529770074412227} +{"Pretrain/Learning Rate": 4.084167542770295e-06, "Pretrain/Loss": 2.022064685821533, "Pretrain/Loss (Raw)": 2.271409273147583, "Pretrain/Step": 7830, "Pretrain/Step Time": 8.520870078355074} +{"Pretrain/Learning Rate": 4.079518307284699e-06, "Pretrain/Loss": 2.020956516265869, "Pretrain/Loss (Raw)": 2.02382230758667, "Pretrain/Step": 7831, "Pretrain/Step Time": 8.521392170339823} +{"Pretrain/Learning Rate": 4.074871484447626e-06, "Pretrain/Loss": 2.019508123397827, "Pretrain/Loss (Raw)": 1.7707144021987915, "Pretrain/Step": 7832, "Pretrain/Step Time": 8.518684409558773} +{"Pretrain/Learning Rate": 4.070227074794983e-06, "Pretrain/Loss": 2.0195913314819336, "Pretrain/Loss (Raw)": 2.1418888568878174, "Pretrain/Step": 7833, "Pretrain/Step Time": 8.520817246288061} +{"Pretrain/Learning Rate": 4.06558507886238e-06, "Pretrain/Loss": 2.0165112018585205, "Pretrain/Loss (Raw)": 1.725718379020691, "Pretrain/Step": 7834, "Pretrain/Step Time": 8.527196984738111} +{"Pretrain/Learning Rate": 4.0609454971851476e-06, "Pretrain/Loss": 2.017112970352173, "Pretrain/Loss (Raw)": 2.1503915786743164, "Pretrain/Step": 7835, "Pretrain/Step Time": 8.524776734411716} +{"Pretrain/Learning Rate": 4.0563083302983444e-06, "Pretrain/Loss": 2.015598773956299, "Pretrain/Loss (Raw)": 1.863602876663208, "Pretrain/Step": 7836, "Pretrain/Step Time": 8.516394978389144} +{"Pretrain/Learning Rate": 4.051673578736761e-06, "Pretrain/Loss": 2.0146372318267822, "Pretrain/Loss (Raw)": 1.9188957214355469, "Pretrain/Step": 7837, "Pretrain/Step Time": 8.5161257609725} +{"Pretrain/Learning Rate": 4.047041243034894e-06, "Pretrain/Loss": 2.011528253555298, "Pretrain/Loss (Raw)": 1.7455931901931763, "Pretrain/Step": 7838, "Pretrain/Step Time": 8.524669628590345} +{"Pretrain/Learning Rate": 4.04241132372696e-06, "Pretrain/Loss": 2.015042781829834, "Pretrain/Loss (Raw)": 2.150377035140991, "Pretrain/Step": 7839, "Pretrain/Step Time": 8.531048282980919} +{"Pretrain/Learning Rate": 4.037783821346905e-06, "Pretrain/Loss": 2.0138025283813477, "Pretrain/Loss (Raw)": 1.8213027715682983, "Pretrain/Step": 7840, "Pretrain/Step Time": 8.526039231568575} +{"Pretrain/Learning Rate": 4.033158736428402e-06, "Pretrain/Loss": 2.0131006240844727, "Pretrain/Loss (Raw)": 1.9599804878234863, "Pretrain/Step": 7841, "Pretrain/Step Time": 8.51959560252726} +{"Pretrain/Learning Rate": 4.0285360695048316e-06, "Pretrain/Loss": 2.016080379486084, "Pretrain/Loss (Raw)": 2.3126516342163086, "Pretrain/Step": 7842, "Pretrain/Step Time": 8.51544950902462} +{"Pretrain/Learning Rate": 4.023915821109306e-06, "Pretrain/Loss": 2.017409324645996, "Pretrain/Loss (Raw)": 2.09796142578125, "Pretrain/Step": 7843, "Pretrain/Step Time": 8.510313585400581} +{"Pretrain/Learning Rate": 4.01929799177464e-06, "Pretrain/Loss": 2.0183331966400146, "Pretrain/Loss (Raw)": 2.019508123397827, "Pretrain/Step": 7844, "Pretrain/Step Time": 8.514113005250692} +{"Pretrain/Learning Rate": 4.014682582033407e-06, "Pretrain/Loss": 2.018444061279297, "Pretrain/Loss (Raw)": 1.9999558925628662, "Pretrain/Step": 7845, "Pretrain/Step Time": 8.518880980089307} +{"Pretrain/Learning Rate": 4.010069592417853e-06, "Pretrain/Loss": 2.0143017768859863, "Pretrain/Loss (Raw)": 1.6964341402053833, "Pretrain/Step": 7846, "Pretrain/Step Time": 8.521217247471213} +{"Pretrain/Learning Rate": 4.00545902345999e-06, "Pretrain/Loss": 2.018984317779541, "Pretrain/Loss (Raw)": 2.2580997943878174, "Pretrain/Step": 7847, "Pretrain/Step Time": 8.516664346680045} +{"Pretrain/Learning Rate": 4.000850875691514e-06, "Pretrain/Loss": 2.019376277923584, "Pretrain/Loss (Raw)": 2.111440658569336, "Pretrain/Step": 7848, "Pretrain/Step Time": 8.511888448148966} +{"Pretrain/Learning Rate": 3.9962451496438765e-06, "Pretrain/Loss": 2.020163059234619, "Pretrain/Loss (Raw)": 1.9751362800598145, "Pretrain/Step": 7849, "Pretrain/Step Time": 8.506813783198595} +{"Pretrain/Learning Rate": 3.99164184584821e-06, "Pretrain/Loss": 2.01971435546875, "Pretrain/Loss (Raw)": 1.7784197330474854, "Pretrain/Step": 7850, "Pretrain/Step Time": 8.515081180259585} +{"Pretrain/Learning Rate": 3.987040964835409e-06, "Pretrain/Loss": 2.017362117767334, "Pretrain/Loss (Raw)": 2.0906805992126465, "Pretrain/Step": 7851, "Pretrain/Step Time": 8.517093732953072} +{"Pretrain/Learning Rate": 3.9824425071360525e-06, "Pretrain/Loss": 2.0198843479156494, "Pretrain/Loss (Raw)": 2.1059303283691406, "Pretrain/Step": 7852, "Pretrain/Step Time": 8.51457654684782} +{"Pretrain/Learning Rate": 3.977846473280469e-06, "Pretrain/Loss": 2.0208256244659424, "Pretrain/Loss (Raw)": 1.9685711860656738, "Pretrain/Step": 7853, "Pretrain/Step Time": 8.513820458203554} +{"Pretrain/Learning Rate": 3.973252863798691e-06, "Pretrain/Loss": 2.022172451019287, "Pretrain/Loss (Raw)": 2.039687395095825, "Pretrain/Step": 7854, "Pretrain/Step Time": 8.51536045782268} +{"Pretrain/Learning Rate": 3.968661679220468e-06, "Pretrain/Loss": 2.021564245223999, "Pretrain/Loss (Raw)": 1.8893847465515137, "Pretrain/Step": 7855, "Pretrain/Step Time": 8.512834414839745} +{"Pretrain/Learning Rate": 3.964072920075296e-06, "Pretrain/Loss": 2.0198962688446045, "Pretrain/Loss (Raw)": 1.7424697875976562, "Pretrain/Step": 7856, "Pretrain/Step Time": 8.515377616509795} +{"Pretrain/Learning Rate": 3.959486586892344e-06, "Pretrain/Loss": 2.0191826820373535, "Pretrain/Loss (Raw)": 1.9621050357818604, "Pretrain/Step": 7857, "Pretrain/Step Time": 8.523892909288406} +{"Pretrain/Learning Rate": 3.954902680200553e-06, "Pretrain/Loss": 2.0200648307800293, "Pretrain/Loss (Raw)": 2.2157230377197266, "Pretrain/Step": 7858, "Pretrain/Step Time": 8.514886669814587} +{"Pretrain/Learning Rate": 3.950321200528548e-06, "Pretrain/Loss": 2.0190346240997314, "Pretrain/Loss (Raw)": 1.9738043546676636, "Pretrain/Step": 7859, "Pretrain/Step Time": 8.507973421365023} +{"Pretrain/Learning Rate": 3.9457421484047015e-06, "Pretrain/Loss": 2.017118215560913, "Pretrain/Loss (Raw)": 1.815000057220459, "Pretrain/Step": 7860, "Pretrain/Step Time": 8.50829111598432} +{"Pretrain/Learning Rate": 3.941165524357071e-06, "Pretrain/Loss": 2.0159051418304443, "Pretrain/Loss (Raw)": 1.889066457748413, "Pretrain/Step": 7861, "Pretrain/Step Time": 8.509726762771606} +{"Pretrain/Learning Rate": 3.936591328913472e-06, "Pretrain/Loss": 2.013216495513916, "Pretrain/Loss (Raw)": 1.971139669418335, "Pretrain/Step": 7862, "Pretrain/Step Time": 8.510946227237582} +{"Pretrain/Learning Rate": 3.932019562601405e-06, "Pretrain/Loss": 2.010000467300415, "Pretrain/Loss (Raw)": 1.638788104057312, "Pretrain/Step": 7863, "Pretrain/Step Time": 8.510703701525927} +{"Pretrain/Learning Rate": 3.927450225948132e-06, "Pretrain/Loss": 2.0117764472961426, "Pretrain/Loss (Raw)": 2.213416337966919, "Pretrain/Step": 7864, "Pretrain/Step Time": 8.511736236512661} +{"Pretrain/Learning Rate": 3.922883319480586e-06, "Pretrain/Loss": 2.011948347091675, "Pretrain/Loss (Raw)": 1.9561467170715332, "Pretrain/Step": 7865, "Pretrain/Step Time": 8.513051062822342} +{"Pretrain/Learning Rate": 3.9183188437254576e-06, "Pretrain/Loss": 2.0133719444274902, "Pretrain/Loss (Raw)": 2.153337001800537, "Pretrain/Step": 7866, "Pretrain/Step Time": 8.507138308137655} +{"Pretrain/Learning Rate": 3.9137567992091394e-06, "Pretrain/Loss": 2.0145931243896484, "Pretrain/Loss (Raw)": 2.0859482288360596, "Pretrain/Step": 7867, "Pretrain/Step Time": 8.506752248853445} +{"Pretrain/Learning Rate": 3.90919718645775e-06, "Pretrain/Loss": 2.0140178203582764, "Pretrain/Loss (Raw)": 2.0308120250701904, "Pretrain/Step": 7868, "Pretrain/Step Time": 8.505942029878497} +{"Pretrain/Learning Rate": 3.904640005997118e-06, "Pretrain/Loss": 2.0122828483581543, "Pretrain/Loss (Raw)": 1.8913493156433105, "Pretrain/Step": 7869, "Pretrain/Step Time": 8.515019161626697} +{"Pretrain/Learning Rate": 3.900085258352812e-06, "Pretrain/Loss": 2.0113749504089355, "Pretrain/Loss (Raw)": 1.9064676761627197, "Pretrain/Step": 7870, "Pretrain/Step Time": 8.519663678482175} +{"Pretrain/Learning Rate": 3.895532944050098e-06, "Pretrain/Loss": 2.014963150024414, "Pretrain/Loss (Raw)": 2.1222872734069824, "Pretrain/Step": 7871, "Pretrain/Step Time": 8.519036872312427} +{"Pretrain/Learning Rate": 3.890983063613976e-06, "Pretrain/Loss": 2.0140295028686523, "Pretrain/Loss (Raw)": 1.9593359231948853, "Pretrain/Step": 7872, "Pretrain/Step Time": 8.519490050151944} +{"Pretrain/Learning Rate": 3.886435617569148e-06, "Pretrain/Loss": 2.0154621601104736, "Pretrain/Loss (Raw)": 1.9221326112747192, "Pretrain/Step": 7873, "Pretrain/Step Time": 8.517997112125158} +{"Pretrain/Learning Rate": 3.881890606440058e-06, "Pretrain/Loss": 2.0184099674224854, "Pretrain/Loss (Raw)": 1.9422881603240967, "Pretrain/Step": 7874, "Pretrain/Step Time": 8.52519030123949} +{"Pretrain/Learning Rate": 3.87734803075086e-06, "Pretrain/Loss": 2.015944004058838, "Pretrain/Loss (Raw)": 1.8934544324874878, "Pretrain/Step": 7875, "Pretrain/Step Time": 8.523567045107484} +{"Pretrain/Learning Rate": 3.872807891025418e-06, "Pretrain/Loss": 2.0141332149505615, "Pretrain/Loss (Raw)": 1.9304449558258057, "Pretrain/Step": 7876, "Pretrain/Step Time": 8.531190741807222} +{"Pretrain/Learning Rate": 3.868270187787318e-06, "Pretrain/Loss": 2.0141067504882812, "Pretrain/Loss (Raw)": 1.987094759941101, "Pretrain/Step": 7877, "Pretrain/Step Time": 8.526354247704148} +{"Pretrain/Learning Rate": 3.863734921559884e-06, "Pretrain/Loss": 2.0119662284851074, "Pretrain/Loss (Raw)": 2.1151373386383057, "Pretrain/Step": 7878, "Pretrain/Step Time": 8.51978169940412} +{"Pretrain/Learning Rate": 3.859202092866135e-06, "Pretrain/Loss": 2.011807441711426, "Pretrain/Loss (Raw)": 1.887816309928894, "Pretrain/Step": 7879, "Pretrain/Step Time": 8.51392274722457} +{"Pretrain/Learning Rate": 3.854671702228818e-06, "Pretrain/Loss": 2.010789632797241, "Pretrain/Loss (Raw)": 1.8417224884033203, "Pretrain/Step": 7880, "Pretrain/Step Time": 8.520898249000311} +{"Pretrain/Learning Rate": 3.850143750170395e-06, "Pretrain/Loss": 2.0121428966522217, "Pretrain/Loss (Raw)": 2.1420538425445557, "Pretrain/Step": 7881, "Pretrain/Step Time": 8.530566105619073} +{"Pretrain/Learning Rate": 3.8456182372130636e-06, "Pretrain/Loss": 2.0106749534606934, "Pretrain/Loss (Raw)": 1.9440780878067017, "Pretrain/Step": 7882, "Pretrain/Step Time": 8.528178721666336} +{"Pretrain/Learning Rate": 3.841095163878719e-06, "Pretrain/Loss": 2.0102853775024414, "Pretrain/Loss (Raw)": 2.0464134216308594, "Pretrain/Step": 7883, "Pretrain/Step Time": 8.521183732897043} +{"Pretrain/Learning Rate": 3.836574530688983e-06, "Pretrain/Loss": 2.0095348358154297, "Pretrain/Loss (Raw)": 1.8833578824996948, "Pretrain/Step": 7884, "Pretrain/Step Time": 8.523719316348433} +{"Pretrain/Learning Rate": 3.832056338165193e-06, "Pretrain/Loss": 2.0100255012512207, "Pretrain/Loss (Raw)": 1.8898365497589111, "Pretrain/Step": 7885, "Pretrain/Step Time": 8.520214680582285} +{"Pretrain/Learning Rate": 3.827540586828418e-06, "Pretrain/Loss": 2.0090532302856445, "Pretrain/Loss (Raw)": 1.7607978582382202, "Pretrain/Step": 7886, "Pretrain/Step Time": 8.527125537395477} +{"Pretrain/Learning Rate": 3.823027277199432e-06, "Pretrain/Loss": 2.01088809967041, "Pretrain/Loss (Raw)": 2.120847702026367, "Pretrain/Step": 7887, "Pretrain/Step Time": 8.526173183694482} +{"Pretrain/Learning Rate": 3.818516409798728e-06, "Pretrain/Loss": 2.0105113983154297, "Pretrain/Loss (Raw)": 2.005699396133423, "Pretrain/Step": 7888, "Pretrain/Step Time": 8.537281952798367} +{"Pretrain/Learning Rate": 3.814007985146517e-06, "Pretrain/Loss": 2.011223316192627, "Pretrain/Loss (Raw)": 2.201317310333252, "Pretrain/Step": 7889, "Pretrain/Step Time": 8.5290417522192} +{"Pretrain/Learning Rate": 3.8095020037627467e-06, "Pretrain/Loss": 2.01084303855896, "Pretrain/Loss (Raw)": 1.9747867584228516, "Pretrain/Step": 7890, "Pretrain/Step Time": 8.529837464913726} +{"Pretrain/Learning Rate": 3.8049984661670477e-06, "Pretrain/Loss": 2.01202654838562, "Pretrain/Loss (Raw)": 2.221108913421631, "Pretrain/Step": 7891, "Pretrain/Step Time": 8.528783457353711} +{"Pretrain/Learning Rate": 3.8004973728788057e-06, "Pretrain/Loss": 2.011014938354492, "Pretrain/Loss (Raw)": 1.985597848892212, "Pretrain/Step": 7892, "Pretrain/Step Time": 8.529716301709414} +{"Pretrain/Learning Rate": 3.795998724417096e-06, "Pretrain/Loss": 2.006002187728882, "Pretrain/Loss (Raw)": 1.85245943069458, "Pretrain/Step": 7893, "Pretrain/Step Time": 8.537385165691376} +{"Pretrain/Learning Rate": 3.7915025213007354e-06, "Pretrain/Loss": 2.007185935974121, "Pretrain/Loss (Raw)": 2.0678861141204834, "Pretrain/Step": 7894, "Pretrain/Step Time": 8.535489682108164} +{"Pretrain/Learning Rate": 3.7870087640482444e-06, "Pretrain/Loss": 2.005415916442871, "Pretrain/Loss (Raw)": 1.824538230895996, "Pretrain/Step": 7895, "Pretrain/Step Time": 8.533482249826193} +{"Pretrain/Learning Rate": 3.782517453177853e-06, "Pretrain/Loss": 2.0085296630859375, "Pretrain/Loss (Raw)": 2.02228045463562, "Pretrain/Step": 7896, "Pretrain/Step Time": 8.533235969021916} +{"Pretrain/Learning Rate": 3.778028589207541e-06, "Pretrain/Loss": 2.0077829360961914, "Pretrain/Loss (Raw)": 2.088467597961426, "Pretrain/Step": 7897, "Pretrain/Step Time": 8.530579317361116} +{"Pretrain/Learning Rate": 3.773542172654962e-06, "Pretrain/Loss": 2.0088608264923096, "Pretrain/Loss (Raw)": 1.9564543962478638, "Pretrain/Step": 7898, "Pretrain/Step Time": 8.525094233453274} +{"Pretrain/Learning Rate": 3.769058204037526e-06, "Pretrain/Loss": 2.0073695182800293, "Pretrain/Loss (Raw)": 2.042715549468994, "Pretrain/Step": 7899, "Pretrain/Step Time": 8.527323560789227} +{"Pretrain/Learning Rate": 3.7645766838723395e-06, "Pretrain/Loss": 2.008436679840088, "Pretrain/Loss (Raw)": 1.954652190208435, "Pretrain/Step": 7900, "Pretrain/Step Time": 8.528611088171601} +{"Pretrain/Learning Rate": 3.7600976126762415e-06, "Pretrain/Loss": 2.009119749069214, "Pretrain/Loss (Raw)": 2.0721917152404785, "Pretrain/Step": 7901, "Pretrain/Step Time": 8.53076422587037} +{"Pretrain/Learning Rate": 3.7556209909657635e-06, "Pretrain/Loss": 2.0069613456726074, "Pretrain/Loss (Raw)": 2.1231770515441895, "Pretrain/Step": 7902, "Pretrain/Step Time": 8.524096198379993} +{"Pretrain/Learning Rate": 3.751146819257187e-06, "Pretrain/Loss": 2.0066938400268555, "Pretrain/Loss (Raw)": 2.085700750350952, "Pretrain/Step": 7903, "Pretrain/Step Time": 8.525174994021654} +{"Pretrain/Learning Rate": 3.7466750980664795e-06, "Pretrain/Loss": 2.001268148422241, "Pretrain/Loss (Raw)": 1.85409677028656, "Pretrain/Step": 7904, "Pretrain/Step Time": 8.533457417041063} +{"Pretrain/Learning Rate": 3.7422058279093593e-06, "Pretrain/Loss": 2.0012598037719727, "Pretrain/Loss (Raw)": 2.106987476348877, "Pretrain/Step": 7905, "Pretrain/Step Time": 8.539948366582394} +{"Pretrain/Learning Rate": 3.737739009301222e-06, "Pretrain/Loss": 2.0000901222229004, "Pretrain/Loss (Raw)": 2.003622531890869, "Pretrain/Step": 7906, "Pretrain/Step Time": 8.53944399021566} +{"Pretrain/Learning Rate": 3.73327464275722e-06, "Pretrain/Loss": 2.0016980171203613, "Pretrain/Loss (Raw)": 1.9505292177200317, "Pretrain/Step": 7907, "Pretrain/Step Time": 8.537365345284343} +{"Pretrain/Learning Rate": 3.728812728792197e-06, "Pretrain/Loss": 1.9978129863739014, "Pretrain/Loss (Raw)": 1.9148751497268677, "Pretrain/Step": 7908, "Pretrain/Step Time": 8.53178302012384} +{"Pretrain/Learning Rate": 3.7243532679207242e-06, "Pretrain/Loss": 1.9993066787719727, "Pretrain/Loss (Raw)": 2.015608310699463, "Pretrain/Step": 7909, "Pretrain/Step Time": 8.526138786226511} +{"Pretrain/Learning Rate": 3.7198962606570826e-06, "Pretrain/Loss": 1.9996225833892822, "Pretrain/Loss (Raw)": 1.9309766292572021, "Pretrain/Step": 7910, "Pretrain/Step Time": 8.530055584385991} +{"Pretrain/Learning Rate": 3.7154417075152826e-06, "Pretrain/Loss": 1.999001145362854, "Pretrain/Loss (Raw)": 2.0303494930267334, "Pretrain/Step": 7911, "Pretrain/Step Time": 8.53487958572805} +{"Pretrain/Learning Rate": 3.7109896090090413e-06, "Pretrain/Loss": 1.9990663528442383, "Pretrain/Loss (Raw)": 1.9635344743728638, "Pretrain/Step": 7912, "Pretrain/Step Time": 8.539070101454854} +{"Pretrain/Learning Rate": 3.7065399656517953e-06, "Pretrain/Loss": 1.998195767402649, "Pretrain/Loss (Raw)": 1.9413352012634277, "Pretrain/Step": 7913, "Pretrain/Step Time": 8.530853362753987} +{"Pretrain/Learning Rate": 3.702092777956692e-06, "Pretrain/Loss": 2.0006494522094727, "Pretrain/Loss (Raw)": 2.2761340141296387, "Pretrain/Step": 7914, "Pretrain/Step Time": 8.526746354997158} +{"Pretrain/Learning Rate": 3.6976480464366162e-06, "Pretrain/Loss": 2.0001258850097656, "Pretrain/Loss (Raw)": 2.052872896194458, "Pretrain/Step": 7915, "Pretrain/Step Time": 8.518036780878901} +{"Pretrain/Learning Rate": 3.693205771604147e-06, "Pretrain/Loss": 1.999934196472168, "Pretrain/Loss (Raw)": 1.9527885913848877, "Pretrain/Step": 7916, "Pretrain/Step Time": 8.511746652424335} +{"Pretrain/Learning Rate": 3.68876595397159e-06, "Pretrain/Loss": 2.0022294521331787, "Pretrain/Loss (Raw)": 1.9685618877410889, "Pretrain/Step": 7917, "Pretrain/Step Time": 8.520253317430615} +{"Pretrain/Learning Rate": 3.6843285940509594e-06, "Pretrain/Loss": 2.0024352073669434, "Pretrain/Loss (Raw)": 1.9111518859863281, "Pretrain/Step": 7918, "Pretrain/Step Time": 8.51665060594678} +{"Pretrain/Learning Rate": 3.6798936923540027e-06, "Pretrain/Loss": 2.002326488494873, "Pretrain/Loss (Raw)": 2.010857343673706, "Pretrain/Step": 7919, "Pretrain/Step Time": 8.51828133687377} +{"Pretrain/Learning Rate": 3.6754612493921675e-06, "Pretrain/Loss": 2.0043249130249023, "Pretrain/Loss (Raw)": 2.112189531326294, "Pretrain/Step": 7920, "Pretrain/Step Time": 8.510791644454002} +{"Pretrain/Learning Rate": 3.6710312656766276e-06, "Pretrain/Loss": 2.0032083988189697, "Pretrain/Loss (Raw)": 1.9847095012664795, "Pretrain/Step": 7921, "Pretrain/Step Time": 8.509444151073694} +{"Pretrain/Learning Rate": 3.6666037417182607e-06, "Pretrain/Loss": 2.0015769004821777, "Pretrain/Loss (Raw)": 1.9698137044906616, "Pretrain/Step": 7922, "Pretrain/Step Time": 8.509476464241743} +{"Pretrain/Learning Rate": 3.6621786780276834e-06, "Pretrain/Loss": 2.0019381046295166, "Pretrain/Loss (Raw)": 1.9548230171203613, "Pretrain/Step": 7923, "Pretrain/Step Time": 8.515121502801776} +{"Pretrain/Learning Rate": 3.6577560751152096e-06, "Pretrain/Loss": 1.9992964267730713, "Pretrain/Loss (Raw)": 1.7643437385559082, "Pretrain/Step": 7924, "Pretrain/Step Time": 8.517279662191868} +{"Pretrain/Learning Rate": 3.65333593349087e-06, "Pretrain/Loss": 1.998302936553955, "Pretrain/Loss (Raw)": 2.0656356811523438, "Pretrain/Step": 7925, "Pretrain/Step Time": 8.513779573142529} +{"Pretrain/Learning Rate": 3.6489182536644156e-06, "Pretrain/Loss": 1.9951289892196655, "Pretrain/Loss (Raw)": 1.8638032674789429, "Pretrain/Step": 7926, "Pretrain/Step Time": 8.505873741582036} +{"Pretrain/Learning Rate": 3.644503036145322e-06, "Pretrain/Loss": 1.9953889846801758, "Pretrain/Loss (Raw)": 1.8710490465164185, "Pretrain/Step": 7927, "Pretrain/Step Time": 8.505572471767664} +{"Pretrain/Learning Rate": 3.6400902814427707e-06, "Pretrain/Loss": 1.9969701766967773, "Pretrain/Loss (Raw)": 2.0016603469848633, "Pretrain/Step": 7928, "Pretrain/Step Time": 8.510608475655317} +{"Pretrain/Learning Rate": 3.6356799900656576e-06, "Pretrain/Loss": 1.994752049446106, "Pretrain/Loss (Raw)": 1.9140264987945557, "Pretrain/Step": 7929, "Pretrain/Step Time": 8.519601676613092} +{"Pretrain/Learning Rate": 3.6312721625225947e-06, "Pretrain/Loss": 1.99907386302948, "Pretrain/Loss (Raw)": 2.1947877407073975, "Pretrain/Step": 7930, "Pretrain/Step Time": 8.51729897223413} +{"Pretrain/Learning Rate": 3.626866799321929e-06, "Pretrain/Loss": 1.9926682710647583, "Pretrain/Loss (Raw)": 2.2019591331481934, "Pretrain/Step": 7931, "Pretrain/Step Time": 8.515367958694696} +{"Pretrain/Learning Rate": 3.622463900971687e-06, "Pretrain/Loss": 1.993867039680481, "Pretrain/Loss (Raw)": 2.118068218231201, "Pretrain/Step": 7932, "Pretrain/Step Time": 8.505609441548586} +{"Pretrain/Learning Rate": 3.618063467979649e-06, "Pretrain/Loss": 1.9935778379440308, "Pretrain/Loss (Raw)": 2.054288864135742, "Pretrain/Step": 7933, "Pretrain/Step Time": 8.514768831431866} +{"Pretrain/Learning Rate": 3.6136655008532807e-06, "Pretrain/Loss": 1.9936827421188354, "Pretrain/Loss (Raw)": 2.0313825607299805, "Pretrain/Step": 7934, "Pretrain/Step Time": 8.516953933984041} +{"Pretrain/Learning Rate": 3.6092700000997876e-06, "Pretrain/Loss": 1.9949487447738647, "Pretrain/Loss (Raw)": 2.097954034805298, "Pretrain/Step": 7935, "Pretrain/Step Time": 8.517522679641843} +{"Pretrain/Learning Rate": 3.6048769662260757e-06, "Pretrain/Loss": 1.9924867153167725, "Pretrain/Loss (Raw)": 1.7563416957855225, "Pretrain/Step": 7936, "Pretrain/Step Time": 8.520302394405007} +{"Pretrain/Learning Rate": 3.600486399738762e-06, "Pretrain/Loss": 1.9911401271820068, "Pretrain/Loss (Raw)": 1.960692048072815, "Pretrain/Step": 7937, "Pretrain/Step Time": 8.520212946459651} +{"Pretrain/Learning Rate": 3.596098301144207e-06, "Pretrain/Loss": 1.9921865463256836, "Pretrain/Loss (Raw)": 2.1799678802490234, "Pretrain/Step": 7938, "Pretrain/Step Time": 8.506108809262514} +{"Pretrain/Learning Rate": 3.591712670948444e-06, "Pretrain/Loss": 1.9900803565979004, "Pretrain/Loss (Raw)": 2.028391122817993, "Pretrain/Step": 7939, "Pretrain/Step Time": 8.49897882156074} +{"Pretrain/Learning Rate": 3.5873295096572583e-06, "Pretrain/Loss": 1.9936461448669434, "Pretrain/Loss (Raw)": 2.133594274520874, "Pretrain/Step": 7940, "Pretrain/Step Time": 8.503585753962398} +{"Pretrain/Learning Rate": 3.58294881777613e-06, "Pretrain/Loss": 1.9949607849121094, "Pretrain/Loss (Raw)": 2.2127633094787598, "Pretrain/Step": 7941, "Pretrain/Step Time": 8.510819485411048} +{"Pretrain/Learning Rate": 3.578570595810274e-06, "Pretrain/Loss": 1.9969606399536133, "Pretrain/Loss (Raw)": 2.2138564586639404, "Pretrain/Step": 7942, "Pretrain/Step Time": 8.513573955744505} +{"Pretrain/Learning Rate": 3.5741948442645864e-06, "Pretrain/Loss": 1.9973480701446533, "Pretrain/Loss (Raw)": 2.0451772212982178, "Pretrain/Step": 7943, "Pretrain/Step Time": 8.515740593895316} +{"Pretrain/Learning Rate": 3.569821563643719e-06, "Pretrain/Loss": 1.998964786529541, "Pretrain/Loss (Raw)": 2.2112598419189453, "Pretrain/Step": 7944, "Pretrain/Step Time": 8.503270126879215} +{"Pretrain/Learning Rate": 3.5654507544520016e-06, "Pretrain/Loss": 1.9984058141708374, "Pretrain/Loss (Raw)": 1.9658982753753662, "Pretrain/Step": 7945, "Pretrain/Step Time": 8.503002036362886} +{"Pretrain/Learning Rate": 3.5610824171935205e-06, "Pretrain/Loss": 1.99791419506073, "Pretrain/Loss (Raw)": 2.012874126434326, "Pretrain/Step": 7946, "Pretrain/Step Time": 8.510047936812043} +{"Pretrain/Learning Rate": 3.5567165523720275e-06, "Pretrain/Loss": 1.9988895654678345, "Pretrain/Loss (Raw)": 2.069736957550049, "Pretrain/Step": 7947, "Pretrain/Step Time": 8.51910788193345} +{"Pretrain/Learning Rate": 3.552353160491029e-06, "Pretrain/Loss": 2.000241279602051, "Pretrain/Loss (Raw)": 1.9504921436309814, "Pretrain/Step": 7948, "Pretrain/Step Time": 8.524172289296985} +{"Pretrain/Learning Rate": 3.54799224205373e-06, "Pretrain/Loss": 2.000577449798584, "Pretrain/Loss (Raw)": 1.8628472089767456, "Pretrain/Step": 7949, "Pretrain/Step Time": 8.524373343214393} +{"Pretrain/Learning Rate": 3.5436337975630536e-06, "Pretrain/Loss": 1.9996130466461182, "Pretrain/Loss (Raw)": 1.733302354812622, "Pretrain/Step": 7950, "Pretrain/Step Time": 8.515460669994354} +{"Pretrain/Learning Rate": 3.5392778275216227e-06, "Pretrain/Loss": 1.9990004301071167, "Pretrain/Loss (Raw)": 2.0209431648254395, "Pretrain/Step": 7951, "Pretrain/Step Time": 8.510911121964455} +{"Pretrain/Learning Rate": 3.5349243324318076e-06, "Pretrain/Loss": 1.9987878799438477, "Pretrain/Loss (Raw)": 1.9361696243286133, "Pretrain/Step": 7952, "Pretrain/Step Time": 8.505714062601328} +{"Pretrain/Learning Rate": 3.5305733127956654e-06, "Pretrain/Loss": 1.99891996383667, "Pretrain/Loss (Raw)": 2.1019811630249023, "Pretrain/Step": 7953, "Pretrain/Step Time": 8.507426416501403} +{"Pretrain/Learning Rate": 3.5262247691149747e-06, "Pretrain/Loss": 1.9969744682312012, "Pretrain/Loss (Raw)": 1.961006760597229, "Pretrain/Step": 7954, "Pretrain/Step Time": 8.518573047593236} +{"Pretrain/Learning Rate": 3.5218787018912263e-06, "Pretrain/Loss": 1.9976377487182617, "Pretrain/Loss (Raw)": 2.0992319583892822, "Pretrain/Step": 7955, "Pretrain/Step Time": 8.51979518122971} +{"Pretrain/Learning Rate": 3.517535111625639e-06, "Pretrain/Loss": 1.9965314865112305, "Pretrain/Loss (Raw)": 1.9687520265579224, "Pretrain/Step": 7956, "Pretrain/Step Time": 8.509854363277555} +{"Pretrain/Learning Rate": 3.5131939988191335e-06, "Pretrain/Loss": 1.9981032609939575, "Pretrain/Loss (Raw)": 2.0459108352661133, "Pretrain/Step": 7957, "Pretrain/Step Time": 8.50903706625104} +{"Pretrain/Learning Rate": 3.508855363972344e-06, "Pretrain/Loss": 1.9961214065551758, "Pretrain/Loss (Raw)": 2.0177268981933594, "Pretrain/Step": 7958, "Pretrain/Step Time": 8.513540038838983} +{"Pretrain/Learning Rate": 3.5045192075856186e-06, "Pretrain/Loss": 1.9966456890106201, "Pretrain/Loss (Raw)": 2.0909156799316406, "Pretrain/Step": 7959, "Pretrain/Step Time": 8.515878889709711} +{"Pretrain/Learning Rate": 3.5001855301590336e-06, "Pretrain/Loss": 1.9975650310516357, "Pretrain/Loss (Raw)": 1.8883917331695557, "Pretrain/Step": 7960, "Pretrain/Step Time": 8.521464925259352} +{"Pretrain/Learning Rate": 3.495854332192361e-06, "Pretrain/Loss": 1.9967072010040283, "Pretrain/Loss (Raw)": 2.0320911407470703, "Pretrain/Step": 7961, "Pretrain/Step Time": 8.522887168452144} +{"Pretrain/Learning Rate": 3.491525614185101e-06, "Pretrain/Loss": 2.0005578994750977, "Pretrain/Loss (Raw)": 2.2186005115509033, "Pretrain/Step": 7962, "Pretrain/Step Time": 8.517600134015083} +{"Pretrain/Learning Rate": 3.4871993766364518e-06, "Pretrain/Loss": 2.0008130073547363, "Pretrain/Loss (Raw)": 2.183032512664795, "Pretrain/Step": 7963, "Pretrain/Step Time": 8.518202729523182} +{"Pretrain/Learning Rate": 3.482875620045348e-06, "Pretrain/Loss": 2.0020499229431152, "Pretrain/Loss (Raw)": 2.0219521522521973, "Pretrain/Step": 7964, "Pretrain/Step Time": 8.51754798553884} +{"Pretrain/Learning Rate": 3.4785543449104173e-06, "Pretrain/Loss": 2.0020108222961426, "Pretrain/Loss (Raw)": 1.9138896465301514, "Pretrain/Step": 7965, "Pretrain/Step Time": 8.523947201669216} +{"Pretrain/Learning Rate": 3.474235551730015e-06, "Pretrain/Loss": 2.0040600299835205, "Pretrain/Loss (Raw)": 2.0078861713409424, "Pretrain/Step": 7966, "Pretrain/Step Time": 8.519110402092338} +{"Pretrain/Learning Rate": 3.4699192410021953e-06, "Pretrain/Loss": 2.0023787021636963, "Pretrain/Loss (Raw)": 1.935162901878357, "Pretrain/Step": 7967, "Pretrain/Step Time": 8.513711273670197} +{"Pretrain/Learning Rate": 3.4656054132247483e-06, "Pretrain/Loss": 2.003049850463867, "Pretrain/Loss (Raw)": 1.907232403755188, "Pretrain/Step": 7968, "Pretrain/Step Time": 8.518107708543539} +{"Pretrain/Learning Rate": 3.4612940688951574e-06, "Pretrain/Loss": 2.003819704055786, "Pretrain/Loss (Raw)": 2.0585055351257324, "Pretrain/Step": 7969, "Pretrain/Step Time": 8.51303149946034} +{"Pretrain/Learning Rate": 3.456985208510627e-06, "Pretrain/Loss": 2.0009078979492188, "Pretrain/Loss (Raw)": 1.939910888671875, "Pretrain/Step": 7970, "Pretrain/Step Time": 8.51645753160119} +{"Pretrain/Learning Rate": 3.452678832568071e-06, "Pretrain/Loss": 1.9992554187774658, "Pretrain/Loss (Raw)": 1.8864778280258179, "Pretrain/Step": 7971, "Pretrain/Step Time": 8.522318623960018} +{"Pretrain/Learning Rate": 3.448374941564139e-06, "Pretrain/Loss": 1.9992387294769287, "Pretrain/Loss (Raw)": 2.0173592567443848, "Pretrain/Step": 7972, "Pretrain/Step Time": 8.522582480683923} +{"Pretrain/Learning Rate": 3.4440735359951515e-06, "Pretrain/Loss": 1.998721957206726, "Pretrain/Loss (Raw)": 1.9338183403015137, "Pretrain/Step": 7973, "Pretrain/Step Time": 8.518100226297975} +{"Pretrain/Learning Rate": 3.439774616357183e-06, "Pretrain/Loss": 2.000912666320801, "Pretrain/Loss (Raw)": 1.9768173694610596, "Pretrain/Step": 7974, "Pretrain/Step Time": 8.518891355022788} +{"Pretrain/Learning Rate": 3.4354781831459985e-06, "Pretrain/Loss": 1.997657299041748, "Pretrain/Loss (Raw)": 1.841436743736267, "Pretrain/Step": 7975, "Pretrain/Step Time": 8.518025679513812} +{"Pretrain/Learning Rate": 3.431184236857088e-06, "Pretrain/Loss": 1.9957435131072998, "Pretrain/Loss (Raw)": 1.8664684295654297, "Pretrain/Step": 7976, "Pretrain/Step Time": 8.52459136582911} +{"Pretrain/Learning Rate": 3.426892777985646e-06, "Pretrain/Loss": 1.996605396270752, "Pretrain/Loss (Raw)": 2.0854785442352295, "Pretrain/Step": 7977, "Pretrain/Step Time": 8.535200919955969} +{"Pretrain/Learning Rate": 3.4226038070265837e-06, "Pretrain/Loss": 1.9988007545471191, "Pretrain/Loss (Raw)": 2.05938982963562, "Pretrain/Step": 7978, "Pretrain/Step Time": 8.527725810185075} +{"Pretrain/Learning Rate": 3.418317324474529e-06, "Pretrain/Loss": 1.9971485137939453, "Pretrain/Loss (Raw)": 1.8792202472686768, "Pretrain/Step": 7979, "Pretrain/Step Time": 8.524852784350514} +{"Pretrain/Learning Rate": 3.414033330823815e-06, "Pretrain/Loss": 1.995302438735962, "Pretrain/Loss (Raw)": 1.8696140050888062, "Pretrain/Step": 7980, "Pretrain/Step Time": 8.519256120547652} +{"Pretrain/Learning Rate": 3.409751826568497e-06, "Pretrain/Loss": 1.9969327449798584, "Pretrain/Loss (Raw)": 2.177260160446167, "Pretrain/Step": 7981, "Pretrain/Step Time": 8.517518183216453} +{"Pretrain/Learning Rate": 3.405472812202326e-06, "Pretrain/Loss": 1.9965327978134155, "Pretrain/Loss (Raw)": 1.988499402999878, "Pretrain/Step": 7982, "Pretrain/Step Time": 8.518783511593938} +{"Pretrain/Learning Rate": 3.4011962882188024e-06, "Pretrain/Loss": 1.9976277351379395, "Pretrain/Loss (Raw)": 2.0295426845550537, "Pretrain/Step": 7983, "Pretrain/Step Time": 8.527772709727287} +{"Pretrain/Learning Rate": 3.3969222551110845e-06, "Pretrain/Loss": 1.9994463920593262, "Pretrain/Loss (Raw)": 1.975253939628601, "Pretrain/Step": 7984, "Pretrain/Step Time": 8.5284543056041} +{"Pretrain/Learning Rate": 3.3926507133720973e-06, "Pretrain/Loss": 1.9985071420669556, "Pretrain/Loss (Raw)": 1.8418844938278198, "Pretrain/Step": 7985, "Pretrain/Step Time": 8.521437687799335} +{"Pretrain/Learning Rate": 3.3883816634944416e-06, "Pretrain/Loss": 1.995243787765503, "Pretrain/Loss (Raw)": 1.7980057001113892, "Pretrain/Step": 7986, "Pretrain/Step Time": 8.518449813127518} +{"Pretrain/Learning Rate": 3.384115105970459e-06, "Pretrain/Loss": 1.9962987899780273, "Pretrain/Loss (Raw)": 2.1088616847991943, "Pretrain/Step": 7987, "Pretrain/Step Time": 8.52485634572804} +{"Pretrain/Learning Rate": 3.3798510412921702e-06, "Pretrain/Loss": 1.9966762065887451, "Pretrain/Loss (Raw)": 1.8632842302322388, "Pretrain/Step": 7988, "Pretrain/Step Time": 8.52618670463562} +{"Pretrain/Learning Rate": 3.37558946995134e-06, "Pretrain/Loss": 1.9957199096679688, "Pretrain/Loss (Raw)": 1.7666739225387573, "Pretrain/Step": 7989, "Pretrain/Step Time": 8.523675430566072} +{"Pretrain/Learning Rate": 3.371330392439434e-06, "Pretrain/Loss": 1.9958045482635498, "Pretrain/Loss (Raw)": 1.9819713830947876, "Pretrain/Step": 7990, "Pretrain/Step Time": 8.526022410020232} +{"Pretrain/Learning Rate": 3.36707380924762e-06, "Pretrain/Loss": 1.9988768100738525, "Pretrain/Loss (Raw)": 2.032046318054199, "Pretrain/Step": 7991, "Pretrain/Step Time": 8.522860756143928} +{"Pretrain/Learning Rate": 3.362819720866789e-06, "Pretrain/Loss": 1.9984707832336426, "Pretrain/Loss (Raw)": 2.1614279747009277, "Pretrain/Step": 7992, "Pretrain/Step Time": 8.518179193139076} +{"Pretrain/Learning Rate": 3.358568127787551e-06, "Pretrain/Loss": 2.001434803009033, "Pretrain/Loss (Raw)": 2.3355677127838135, "Pretrain/Step": 7993, "Pretrain/Step Time": 8.514416182413697} +{"Pretrain/Learning Rate": 3.3543190305002136e-06, "Pretrain/Loss": 2.0003275871276855, "Pretrain/Loss (Raw)": 2.011591911315918, "Pretrain/Step": 7994, "Pretrain/Step Time": 8.522084834054112} +{"Pretrain/Learning Rate": 3.350072429494805e-06, "Pretrain/Loss": 2.000109910964966, "Pretrain/Loss (Raw)": 2.0580997467041016, "Pretrain/Step": 7995, "Pretrain/Step Time": 8.521767722442746} +{"Pretrain/Learning Rate": 3.345828325261055e-06, "Pretrain/Loss": 1.9999754428863525, "Pretrain/Loss (Raw)": 2.0135974884033203, "Pretrain/Step": 7996, "Pretrain/Step Time": 8.525740627199411} +{"Pretrain/Learning Rate": 3.341586718288425e-06, "Pretrain/Loss": 2.0002694129943848, "Pretrain/Loss (Raw)": 1.928955316543579, "Pretrain/Step": 7997, "Pretrain/Step Time": 8.519677055999637} +{"Pretrain/Learning Rate": 3.3373476090660745e-06, "Pretrain/Loss": 2.001286029815674, "Pretrain/Loss (Raw)": 2.0366039276123047, "Pretrain/Step": 7998, "Pretrain/Step Time": 8.51106720790267} +{"Pretrain/Learning Rate": 3.333110998082875e-06, "Pretrain/Loss": 1.9986705780029297, "Pretrain/Loss (Raw)": 1.7875220775604248, "Pretrain/Step": 7999, "Pretrain/Step Time": 8.513224843889475} +{"Pretrain/Learning Rate": 3.3288768858274063e-06, "Pretrain/Loss": 1.998465895652771, "Pretrain/Loss (Raw)": 1.9331237077713013, "Pretrain/Step": 8000, "Pretrain/Step Time": 8.521830379962921} +{"Pretrain/Learning Rate": 3.3246452727879797e-06, "Pretrain/Loss": 1.9973748922348022, "Pretrain/Loss (Raw)": 1.7824890613555908, "Pretrain/Step": 8001, "Pretrain/Step Time": 8.520028796046972} +{"Pretrain/Learning Rate": 3.3204161594525967e-06, "Pretrain/Loss": 1.998517394065857, "Pretrain/Loss (Raw)": 2.0885374546051025, "Pretrain/Step": 8002, "Pretrain/Step Time": 8.516403278335929} +{"Pretrain/Learning Rate": 3.3161895463089787e-06, "Pretrain/Loss": 1.9995536804199219, "Pretrain/Loss (Raw)": 2.026088237762451, "Pretrain/Step": 8003, "Pretrain/Step Time": 8.51452500373125} +{"Pretrain/Learning Rate": 3.311965433844555e-06, "Pretrain/Loss": 2.001095771789551, "Pretrain/Loss (Raw)": 2.1278364658355713, "Pretrain/Step": 8004, "Pretrain/Step Time": 8.506889434531331} +{"Pretrain/Learning Rate": 3.3077438225464803e-06, "Pretrain/Loss": 2.002321481704712, "Pretrain/Loss (Raw)": 2.1439783573150635, "Pretrain/Step": 8005, "Pretrain/Step Time": 8.5091633182019} +{"Pretrain/Learning Rate": 3.3035247129016065e-06, "Pretrain/Loss": 2.000898838043213, "Pretrain/Loss (Raw)": 1.933072805404663, "Pretrain/Step": 8006, "Pretrain/Step Time": 8.514162693172693} +{"Pretrain/Learning Rate": 3.2993081053964982e-06, "Pretrain/Loss": 2.000411033630371, "Pretrain/Loss (Raw)": 1.8253511190414429, "Pretrain/Step": 8007, "Pretrain/Step Time": 8.519374253228307} +{"Pretrain/Learning Rate": 3.295094000517432e-06, "Pretrain/Loss": 2.001706600189209, "Pretrain/Loss (Raw)": 2.0075676441192627, "Pretrain/Step": 8008, "Pretrain/Step Time": 8.5102100931108} +{"Pretrain/Learning Rate": 3.2908823987504085e-06, "Pretrain/Loss": 1.9997563362121582, "Pretrain/Loss (Raw)": 1.8924120664596558, "Pretrain/Step": 8009, "Pretrain/Step Time": 8.50048041343689} +{"Pretrain/Learning Rate": 3.286673300581122e-06, "Pretrain/Loss": 2.0003864765167236, "Pretrain/Loss (Raw)": 2.024721145629883, "Pretrain/Step": 8010, "Pretrain/Step Time": 8.499420456588268} +{"Pretrain/Learning Rate": 3.2824667064949883e-06, "Pretrain/Loss": 1.9985957145690918, "Pretrain/Loss (Raw)": 1.817209243774414, "Pretrain/Step": 8011, "Pretrain/Step Time": 8.501741351559758} +{"Pretrain/Learning Rate": 3.2782626169771236e-06, "Pretrain/Loss": 2.000194549560547, "Pretrain/Loss (Raw)": 2.088026523590088, "Pretrain/Step": 8012, "Pretrain/Step Time": 8.497884580865502} +{"Pretrain/Learning Rate": 3.2740610325123823e-06, "Pretrain/Loss": 2.003432035446167, "Pretrain/Loss (Raw)": 2.3042056560516357, "Pretrain/Step": 8013, "Pretrain/Step Time": 8.504303319379687} +{"Pretrain/Learning Rate": 3.2698619535852877e-06, "Pretrain/Loss": 2.0057623386383057, "Pretrain/Loss (Raw)": 2.059082269668579, "Pretrain/Step": 8014, "Pretrain/Step Time": 8.502820398658514} +{"Pretrain/Learning Rate": 3.2656653806801134e-06, "Pretrain/Loss": 2.008270263671875, "Pretrain/Loss (Raw)": 2.441884994506836, "Pretrain/Step": 8015, "Pretrain/Step Time": 8.499765546992421} +{"Pretrain/Learning Rate": 3.261471314280817e-06, "Pretrain/Loss": 2.008406400680542, "Pretrain/Loss (Raw)": 2.0230841636657715, "Pretrain/Step": 8016, "Pretrain/Step Time": 8.489883821457624} +{"Pretrain/Learning Rate": 3.2572797548710897e-06, "Pretrain/Loss": 2.0057640075683594, "Pretrain/Loss (Raw)": 1.8631038665771484, "Pretrain/Step": 8017, "Pretrain/Step Time": 8.49498582072556} +{"Pretrain/Learning Rate": 3.2530907029343165e-06, "Pretrain/Loss": 2.004685163497925, "Pretrain/Loss (Raw)": 1.8366843461990356, "Pretrain/Step": 8018, "Pretrain/Step Time": 8.502370096743107} +{"Pretrain/Learning Rate": 3.2489041589535948e-06, "Pretrain/Loss": 2.0032591819763184, "Pretrain/Loss (Raw)": 2.038609504699707, "Pretrain/Step": 8019, "Pretrain/Step Time": 8.506484845653176} +{"Pretrain/Learning Rate": 3.244720123411743e-06, "Pretrain/Loss": 2.0044147968292236, "Pretrain/Loss (Raw)": 2.13350510597229, "Pretrain/Step": 8020, "Pretrain/Step Time": 8.508006170392036} +{"Pretrain/Learning Rate": 3.2405385967912787e-06, "Pretrain/Loss": 2.0057613849639893, "Pretrain/Loss (Raw)": 2.0248212814331055, "Pretrain/Step": 8021, "Pretrain/Step Time": 8.501690123230219} +{"Pretrain/Learning Rate": 3.2363595795744413e-06, "Pretrain/Loss": 2.0073704719543457, "Pretrain/Loss (Raw)": 2.273841381072998, "Pretrain/Step": 8022, "Pretrain/Step Time": 8.500583721324801} +{"Pretrain/Learning Rate": 3.232183072243164e-06, "Pretrain/Loss": 2.0041513442993164, "Pretrain/Loss (Raw)": 1.4125138521194458, "Pretrain/Step": 8023, "Pretrain/Step Time": 8.511591084301472} +{"Pretrain/Learning Rate": 3.2280090752791175e-06, "Pretrain/Loss": 2.0044667720794678, "Pretrain/Loss (Raw)": 2.0626420974731445, "Pretrain/Step": 8024, "Pretrain/Step Time": 8.5094097815454} +{"Pretrain/Learning Rate": 3.2238375891636504e-06, "Pretrain/Loss": 2.0044925212860107, "Pretrain/Loss (Raw)": 2.0917747020721436, "Pretrain/Step": 8025, "Pretrain/Step Time": 8.50639820843935} +{"Pretrain/Learning Rate": 3.2196686143778467e-06, "Pretrain/Loss": 2.0025551319122314, "Pretrain/Loss (Raw)": 1.7084527015686035, "Pretrain/Step": 8026, "Pretrain/Step Time": 8.50867079384625} +{"Pretrain/Learning Rate": 3.2155021514024857e-06, "Pretrain/Loss": 2.0030832290649414, "Pretrain/Loss (Raw)": 2.110299587249756, "Pretrain/Step": 8027, "Pretrain/Step Time": 8.507529688999057} +{"Pretrain/Learning Rate": 3.211338200718081e-06, "Pretrain/Loss": 2.0023908615112305, "Pretrain/Loss (Raw)": 1.8660223484039307, "Pretrain/Step": 8028, "Pretrain/Step Time": 8.502168837934732} +{"Pretrain/Learning Rate": 3.2071767628048145e-06, "Pretrain/Loss": 2.0041987895965576, "Pretrain/Loss (Raw)": 2.303640127182007, "Pretrain/Step": 8029, "Pretrain/Step Time": 8.506825596094131} +{"Pretrain/Learning Rate": 3.203017838142622e-06, "Pretrain/Loss": 2.0029871463775635, "Pretrain/Loss (Raw)": 1.968064308166504, "Pretrain/Step": 8030, "Pretrain/Step Time": 8.507915582507849} +{"Pretrain/Learning Rate": 3.198861427211122e-06, "Pretrain/Loss": 2.0016632080078125, "Pretrain/Loss (Raw)": 1.9162410497665405, "Pretrain/Step": 8031, "Pretrain/Step Time": 8.512173533439636} +{"Pretrain/Learning Rate": 3.1947075304896516e-06, "Pretrain/Loss": 2.002357006072998, "Pretrain/Loss (Raw)": 1.9428868293762207, "Pretrain/Step": 8032, "Pretrain/Step Time": 8.505777217447758} +{"Pretrain/Learning Rate": 3.190556148457255e-06, "Pretrain/Loss": 2.0001275539398193, "Pretrain/Loss (Raw)": 1.8216311931610107, "Pretrain/Step": 8033, "Pretrain/Step Time": 8.499914890155196} +{"Pretrain/Learning Rate": 3.1864072815926988e-06, "Pretrain/Loss": 2.0022029876708984, "Pretrain/Loss (Raw)": 2.2692697048187256, "Pretrain/Step": 8034, "Pretrain/Step Time": 8.50274271145463} +{"Pretrain/Learning Rate": 3.1822609303744423e-06, "Pretrain/Loss": 2.002906560897827, "Pretrain/Loss (Raw)": 2.0405919551849365, "Pretrain/Step": 8035, "Pretrain/Step Time": 8.507523879408836} +{"Pretrain/Learning Rate": 3.178117095280664e-06, "Pretrain/Loss": 2.0042929649353027, "Pretrain/Loss (Raw)": 2.0923471450805664, "Pretrain/Step": 8036, "Pretrain/Step Time": 8.512752054259181} +{"Pretrain/Learning Rate": 3.173975776789245e-06, "Pretrain/Loss": 2.0048091411590576, "Pretrain/Loss (Raw)": 2.0816917419433594, "Pretrain/Step": 8037, "Pretrain/Step Time": 8.515412956476212} +{"Pretrain/Learning Rate": 3.1698369753777933e-06, "Pretrain/Loss": 2.0052785873413086, "Pretrain/Loss (Raw)": 1.9910624027252197, "Pretrain/Step": 8038, "Pretrain/Step Time": 8.510370256379247} +{"Pretrain/Learning Rate": 3.165700691523607e-06, "Pretrain/Loss": 2.005805015563965, "Pretrain/Loss (Raw)": 2.097719669342041, "Pretrain/Step": 8039, "Pretrain/Step Time": 8.50750476308167} +{"Pretrain/Learning Rate": 3.1615669257037045e-06, "Pretrain/Loss": 2.006413221359253, "Pretrain/Loss (Raw)": 2.0413665771484375, "Pretrain/Step": 8040, "Pretrain/Step Time": 8.506692074239254} +{"Pretrain/Learning Rate": 3.1574356783948047e-06, "Pretrain/Loss": 2.0081355571746826, "Pretrain/Loss (Raw)": 2.1618287563323975, "Pretrain/Step": 8041, "Pretrain/Step Time": 8.509020386263728} +{"Pretrain/Learning Rate": 3.1533069500733534e-06, "Pretrain/Loss": 2.005753517150879, "Pretrain/Loss (Raw)": 1.9712212085723877, "Pretrain/Step": 8042, "Pretrain/Step Time": 8.520365081727505} +{"Pretrain/Learning Rate": 3.1491807412154905e-06, "Pretrain/Loss": 2.0043649673461914, "Pretrain/Loss (Raw)": 1.875117540359497, "Pretrain/Step": 8043, "Pretrain/Step Time": 8.518854014575481} +{"Pretrain/Learning Rate": 3.145057052297068e-06, "Pretrain/Loss": 2.0040040016174316, "Pretrain/Loss (Raw)": 1.9065839052200317, "Pretrain/Step": 8044, "Pretrain/Step Time": 8.52076922915876} +{"Pretrain/Learning Rate": 3.140935883793644e-06, "Pretrain/Loss": 2.0039615631103516, "Pretrain/Loss (Raw)": 1.963144063949585, "Pretrain/Step": 8045, "Pretrain/Step Time": 8.51033654436469} +{"Pretrain/Learning Rate": 3.136817236180503e-06, "Pretrain/Loss": 2.0043983459472656, "Pretrain/Loss (Raw)": 1.9670625925064087, "Pretrain/Step": 8046, "Pretrain/Step Time": 8.511349610984325} +{"Pretrain/Learning Rate": 3.1327011099326233e-06, "Pretrain/Loss": 2.006761074066162, "Pretrain/Loss (Raw)": 2.3133010864257812, "Pretrain/Step": 8047, "Pretrain/Step Time": 8.512809226289392} +{"Pretrain/Learning Rate": 3.128587505524691e-06, "Pretrain/Loss": 2.0030479431152344, "Pretrain/Loss (Raw)": 1.6368995904922485, "Pretrain/Step": 8048, "Pretrain/Step Time": 8.519721740856767} +{"Pretrain/Learning Rate": 3.124476423431105e-06, "Pretrain/Loss": 2.003925323486328, "Pretrain/Loss (Raw)": 2.0970113277435303, "Pretrain/Step": 8049, "Pretrain/Step Time": 8.519006194546819} +{"Pretrain/Learning Rate": 3.1203678641259836e-06, "Pretrain/Loss": 2.006028890609741, "Pretrain/Loss (Raw)": 2.2390694618225098, "Pretrain/Step": 8050, "Pretrain/Step Time": 8.525287739932537} +{"Pretrain/Learning Rate": 3.116261828083139e-06, "Pretrain/Loss": 2.0053861141204834, "Pretrain/Loss (Raw)": 1.8725264072418213, "Pretrain/Step": 8051, "Pretrain/Step Time": 8.518826704472303} +{"Pretrain/Learning Rate": 3.112158315776104e-06, "Pretrain/Loss": 2.007009983062744, "Pretrain/Loss (Raw)": 1.972227692604065, "Pretrain/Step": 8052, "Pretrain/Step Time": 8.515586884692311} +{"Pretrain/Learning Rate": 3.108057327678102e-06, "Pretrain/Loss": 2.007197380065918, "Pretrain/Loss (Raw)": 2.0896143913269043, "Pretrain/Step": 8053, "Pretrain/Step Time": 8.523192346096039} +{"Pretrain/Learning Rate": 3.1039588642620937e-06, "Pretrain/Loss": 2.0099329948425293, "Pretrain/Loss (Raw)": 2.213977098464966, "Pretrain/Step": 8054, "Pretrain/Step Time": 8.52858224324882} +{"Pretrain/Learning Rate": 3.099862926000724e-06, "Pretrain/Loss": 2.01063871383667, "Pretrain/Loss (Raw)": 1.961372971534729, "Pretrain/Step": 8055, "Pretrain/Step Time": 8.532400911673903} +{"Pretrain/Learning Rate": 3.0957695133663616e-06, "Pretrain/Loss": 2.01189923286438, "Pretrain/Loss (Raw)": 2.1629858016967773, "Pretrain/Step": 8056, "Pretrain/Step Time": 8.52844007499516} +{"Pretrain/Learning Rate": 3.091678626831071e-06, "Pretrain/Loss": 2.013228416442871, "Pretrain/Loss (Raw)": 2.0841546058654785, "Pretrain/Step": 8057, "Pretrain/Step Time": 8.521613286808133} +{"Pretrain/Learning Rate": 3.0875902668666383e-06, "Pretrain/Loss": 2.0131304264068604, "Pretrain/Loss (Raw)": 2.182267665863037, "Pretrain/Step": 8058, "Pretrain/Step Time": 8.52132417075336} +{"Pretrain/Learning Rate": 3.0835044339445536e-06, "Pretrain/Loss": 2.0096163749694824, "Pretrain/Loss (Raw)": 1.7521671056747437, "Pretrain/Step": 8059, "Pretrain/Step Time": 8.528209619224072} +{"Pretrain/Learning Rate": 3.079421128536003e-06, "Pretrain/Loss": 2.0084714889526367, "Pretrain/Loss (Raw)": 1.9715063571929932, "Pretrain/Step": 8060, "Pretrain/Step Time": 8.535582521930337} +{"Pretrain/Learning Rate": 3.075340351111908e-06, "Pretrain/Loss": 2.0058717727661133, "Pretrain/Loss (Raw)": 1.7215317487716675, "Pretrain/Step": 8061, "Pretrain/Step Time": 8.527987696230412} +{"Pretrain/Learning Rate": 3.071262102142877e-06, "Pretrain/Loss": 2.006962299346924, "Pretrain/Loss (Raw)": 2.170973300933838, "Pretrain/Step": 8062, "Pretrain/Step Time": 8.523379569873214} +{"Pretrain/Learning Rate": 3.0671863820992324e-06, "Pretrain/Loss": 2.0038435459136963, "Pretrain/Loss (Raw)": 1.6987468004226685, "Pretrain/Step": 8063, "Pretrain/Step Time": 8.525145318359137} +{"Pretrain/Learning Rate": 3.0631131914509977e-06, "Pretrain/Loss": 2.0066184997558594, "Pretrain/Loss (Raw)": 2.1115291118621826, "Pretrain/Step": 8064, "Pretrain/Step Time": 8.522978123277426} +{"Pretrain/Learning Rate": 3.0590425306679327e-06, "Pretrain/Loss": 2.0058085918426514, "Pretrain/Loss (Raw)": 1.8570153713226318, "Pretrain/Step": 8065, "Pretrain/Step Time": 8.528579130768776} +{"Pretrain/Learning Rate": 3.0549744002194597e-06, "Pretrain/Loss": 2.0050697326660156, "Pretrain/Loss (Raw)": 2.0854125022888184, "Pretrain/Step": 8066, "Pretrain/Step Time": 8.529432771727443} +{"Pretrain/Learning Rate": 3.0509088005747534e-06, "Pretrain/Loss": 2.005251169204712, "Pretrain/Loss (Raw)": 2.051616668701172, "Pretrain/Step": 8067, "Pretrain/Step Time": 8.534131897613406} +{"Pretrain/Learning Rate": 3.0468457322026663e-06, "Pretrain/Loss": 2.0052430629730225, "Pretrain/Loss (Raw)": 2.132556676864624, "Pretrain/Step": 8068, "Pretrain/Step Time": 8.529606606811285} +{"Pretrain/Learning Rate": 3.0427851955717846e-06, "Pretrain/Loss": 2.0049405097961426, "Pretrain/Loss (Raw)": 2.174029588699341, "Pretrain/Step": 8069, "Pretrain/Step Time": 8.527965813875198} +{"Pretrain/Learning Rate": 3.0387271911503728e-06, "Pretrain/Loss": 2.002474784851074, "Pretrain/Loss (Raw)": 1.8982466459274292, "Pretrain/Step": 8070, "Pretrain/Step Time": 8.521284507587552} +{"Pretrain/Learning Rate": 3.034671719406429e-06, "Pretrain/Loss": 2.0021615028381348, "Pretrain/Loss (Raw)": 2.005103588104248, "Pretrain/Step": 8071, "Pretrain/Step Time": 8.520722411572933} +{"Pretrain/Learning Rate": 3.0306187808076423e-06, "Pretrain/Loss": 2.002488136291504, "Pretrain/Loss (Raw)": 2.2530324459075928, "Pretrain/Step": 8072, "Pretrain/Step Time": 8.533482491970062} +{"Pretrain/Learning Rate": 3.0265683758214315e-06, "Pretrain/Loss": 2.0019195079803467, "Pretrain/Loss (Raw)": 1.8931306600570679, "Pretrain/Step": 8073, "Pretrain/Step Time": 8.53895876929164} +{"Pretrain/Learning Rate": 3.022520504914886e-06, "Pretrain/Loss": 2.0031847953796387, "Pretrain/Loss (Raw)": 2.174811363220215, "Pretrain/Step": 8074, "Pretrain/Step Time": 8.531079543754458} +{"Pretrain/Learning Rate": 3.0184751685548435e-06, "Pretrain/Loss": 2.0041415691375732, "Pretrain/Loss (Raw)": 2.1922366619110107, "Pretrain/Step": 8075, "Pretrain/Step Time": 8.522795017808676} +{"Pretrain/Learning Rate": 3.0144323672078256e-06, "Pretrain/Loss": 2.0083789825439453, "Pretrain/Loss (Raw)": 2.492849588394165, "Pretrain/Step": 8076, "Pretrain/Step Time": 8.516250405460596} +{"Pretrain/Learning Rate": 3.0103921013400647e-06, "Pretrain/Loss": 2.0087571144104004, "Pretrain/Loss (Raw)": 1.9112555980682373, "Pretrain/Step": 8077, "Pretrain/Step Time": 8.5181550309062} +{"Pretrain/Learning Rate": 3.0063543714175024e-06, "Pretrain/Loss": 2.0111641883850098, "Pretrain/Loss (Raw)": 2.0414299964904785, "Pretrain/Step": 8078, "Pretrain/Step Time": 8.520828660577536} +{"Pretrain/Learning Rate": 3.0023191779057963e-06, "Pretrain/Loss": 2.0106215476989746, "Pretrain/Loss (Raw)": 1.9514775276184082, "Pretrain/Step": 8079, "Pretrain/Step Time": 8.526470011100173} +{"Pretrain/Learning Rate": 2.9982865212702965e-06, "Pretrain/Loss": 2.011430501937866, "Pretrain/Loss (Raw)": 2.0397121906280518, "Pretrain/Step": 8080, "Pretrain/Step Time": 8.526477305218577} +{"Pretrain/Learning Rate": 2.994256401976073e-06, "Pretrain/Loss": 2.0098254680633545, "Pretrain/Loss (Raw)": 1.896531105041504, "Pretrain/Step": 8081, "Pretrain/Step Time": 8.52955923229456} +{"Pretrain/Learning Rate": 2.9902288204878894e-06, "Pretrain/Loss": 2.007871627807617, "Pretrain/Loss (Raw)": 1.7109031677246094, "Pretrain/Step": 8082, "Pretrain/Step Time": 8.520420331507921} +{"Pretrain/Learning Rate": 2.9862037772702356e-06, "Pretrain/Loss": 2.008756399154663, "Pretrain/Loss (Raw)": 2.2125203609466553, "Pretrain/Step": 8083, "Pretrain/Step Time": 8.517018714919686} +{"Pretrain/Learning Rate": 2.982181272787296e-06, "Pretrain/Loss": 2.009460210800171, "Pretrain/Loss (Raw)": 2.058814764022827, "Pretrain/Step": 8084, "Pretrain/Step Time": 8.523202158510685} +{"Pretrain/Learning Rate": 2.9781613075029636e-06, "Pretrain/Loss": 2.0090582370758057, "Pretrain/Loss (Raw)": 1.994471549987793, "Pretrain/Step": 8085, "Pretrain/Step Time": 8.519118243828416} +{"Pretrain/Learning Rate": 2.9741438818808366e-06, "Pretrain/Loss": 2.0099024772644043, "Pretrain/Loss (Raw)": 2.1257686614990234, "Pretrain/Step": 8086, "Pretrain/Step Time": 8.517368024215102} +{"Pretrain/Learning Rate": 2.9701289963842276e-06, "Pretrain/Loss": 2.0110883712768555, "Pretrain/Loss (Raw)": 2.24273419380188, "Pretrain/Step": 8087, "Pretrain/Step Time": 8.51280028000474} +{"Pretrain/Learning Rate": 2.966116651476153e-06, "Pretrain/Loss": 2.0124263763427734, "Pretrain/Loss (Raw)": 2.0596492290496826, "Pretrain/Step": 8088, "Pretrain/Step Time": 8.510074723511934} +{"Pretrain/Learning Rate": 2.9621068476193335e-06, "Pretrain/Loss": 2.013019323348999, "Pretrain/Loss (Raw)": 2.1079659461975098, "Pretrain/Step": 8089, "Pretrain/Step Time": 8.512377325445414} +{"Pretrain/Learning Rate": 2.958099585276192e-06, "Pretrain/Loss": 2.010683059692383, "Pretrain/Loss (Raw)": 1.9195795059204102, "Pretrain/Step": 8090, "Pretrain/Step Time": 8.518992619588971} +{"Pretrain/Learning Rate": 2.9540948649088767e-06, "Pretrain/Loss": 2.010103702545166, "Pretrain/Loss (Raw)": 2.108889102935791, "Pretrain/Step": 8091, "Pretrain/Step Time": 8.51893600076437} +{"Pretrain/Learning Rate": 2.950092686979225e-06, "Pretrain/Loss": 2.0105059146881104, "Pretrain/Loss (Raw)": 2.07342267036438, "Pretrain/Step": 8092, "Pretrain/Step Time": 8.522961298003793} +{"Pretrain/Learning Rate": 2.9460930519487865e-06, "Pretrain/Loss": 2.013486862182617, "Pretrain/Loss (Raw)": 2.2954492568969727, "Pretrain/Step": 8093, "Pretrain/Step Time": 8.514435451477766} +{"Pretrain/Learning Rate": 2.942095960278815e-06, "Pretrain/Loss": 2.014089345932007, "Pretrain/Loss (Raw)": 2.084994316101074, "Pretrain/Step": 8094, "Pretrain/Step Time": 8.515156656503677} +{"Pretrain/Learning Rate": 2.938101412430283e-06, "Pretrain/Loss": 2.0136117935180664, "Pretrain/Loss (Raw)": 1.8740328550338745, "Pretrain/Step": 8095, "Pretrain/Step Time": 8.518970368430018} +{"Pretrain/Learning Rate": 2.9341094088638527e-06, "Pretrain/Loss": 2.014669418334961, "Pretrain/Loss (Raw)": 2.042630434036255, "Pretrain/Step": 8096, "Pretrain/Step Time": 8.515318781137466} +{"Pretrain/Learning Rate": 2.9301199500399057e-06, "Pretrain/Loss": 2.0130748748779297, "Pretrain/Loss (Raw)": 1.8543752431869507, "Pretrain/Step": 8097, "Pretrain/Step Time": 8.516334857791662} +{"Pretrain/Learning Rate": 2.9261330364185184e-06, "Pretrain/Loss": 2.0150840282440186, "Pretrain/Loss (Raw)": 2.1970930099487305, "Pretrain/Step": 8098, "Pretrain/Step Time": 8.51574619859457} +{"Pretrain/Learning Rate": 2.9221486684594873e-06, "Pretrain/Loss": 2.015648365020752, "Pretrain/Loss (Raw)": 1.9587385654449463, "Pretrain/Step": 8099, "Pretrain/Step Time": 8.509276257827878} +{"Pretrain/Learning Rate": 2.9181668466223084e-06, "Pretrain/Loss": 2.017324924468994, "Pretrain/Loss (Raw)": 2.231945037841797, "Pretrain/Step": 8100, "Pretrain/Step Time": 8.50479131564498} +{"Pretrain/Learning Rate": 2.914187571366175e-06, "Pretrain/Loss": 2.0183067321777344, "Pretrain/Loss (Raw)": 2.059473752975464, "Pretrain/Step": 8101, "Pretrain/Step Time": 8.510656040161848} +{"Pretrain/Learning Rate": 2.9102108431500076e-06, "Pretrain/Loss": 2.017861843109131, "Pretrain/Loss (Raw)": 1.919876217842102, "Pretrain/Step": 8102, "Pretrain/Step Time": 8.512891883030534} +{"Pretrain/Learning Rate": 2.9062366624324154e-06, "Pretrain/Loss": 2.0207128524780273, "Pretrain/Loss (Raw)": 2.206390380859375, "Pretrain/Step": 8103, "Pretrain/Step Time": 8.515381483361125} +{"Pretrain/Learning Rate": 2.9022650296717245e-06, "Pretrain/Loss": 2.0243735313415527, "Pretrain/Loss (Raw)": 2.335045099258423, "Pretrain/Step": 8104, "Pretrain/Step Time": 8.507164493203163} +{"Pretrain/Learning Rate": 2.898295945325949e-06, "Pretrain/Loss": 2.024327039718628, "Pretrain/Loss (Raw)": 2.079484462738037, "Pretrain/Step": 8105, "Pretrain/Step Time": 8.49419941008091} +{"Pretrain/Learning Rate": 2.8943294098528447e-06, "Pretrain/Loss": 2.025290012359619, "Pretrain/Loss (Raw)": 2.1826701164245605, "Pretrain/Step": 8106, "Pretrain/Step Time": 8.496186574921012} +{"Pretrain/Learning Rate": 2.890365423709826e-06, "Pretrain/Loss": 2.025911808013916, "Pretrain/Loss (Raw)": 1.958791971206665, "Pretrain/Step": 8107, "Pretrain/Step Time": 8.503512993454933} +{"Pretrain/Learning Rate": 2.8864039873540583e-06, "Pretrain/Loss": 2.026520252227783, "Pretrain/Loss (Raw)": 1.947513222694397, "Pretrain/Step": 8108, "Pretrain/Step Time": 8.512426815927029} +{"Pretrain/Learning Rate": 2.8824451012423786e-06, "Pretrain/Loss": 2.0239484310150146, "Pretrain/Loss (Raw)": 1.8480558395385742, "Pretrain/Step": 8109, "Pretrain/Step Time": 8.515395583584905} +{"Pretrain/Learning Rate": 2.878488765831361e-06, "Pretrain/Loss": 2.0232484340667725, "Pretrain/Loss (Raw)": 1.8989057540893555, "Pretrain/Step": 8110, "Pretrain/Step Time": 8.510692307725549} +{"Pretrain/Learning Rate": 2.874534981577248e-06, "Pretrain/Loss": 2.0243022441864014, "Pretrain/Loss (Raw)": 2.1644294261932373, "Pretrain/Step": 8111, "Pretrain/Step Time": 8.503049513325095} +{"Pretrain/Learning Rate": 2.870583748936026e-06, "Pretrain/Loss": 2.025613784790039, "Pretrain/Loss (Raw)": 2.143160343170166, "Pretrain/Step": 8112, "Pretrain/Step Time": 8.51074574328959} +{"Pretrain/Learning Rate": 2.8666350683633576e-06, "Pretrain/Loss": 2.028242349624634, "Pretrain/Loss (Raw)": 2.178295612335205, "Pretrain/Step": 8113, "Pretrain/Step Time": 8.514758192002773} +{"Pretrain/Learning Rate": 2.8626889403146395e-06, "Pretrain/Loss": 2.0303733348846436, "Pretrain/Loss (Raw)": 2.070789337158203, "Pretrain/Step": 8114, "Pretrain/Step Time": 8.517946427688003} +{"Pretrain/Learning Rate": 2.8587453652449386e-06, "Pretrain/Loss": 2.030914306640625, "Pretrain/Loss (Raw)": 2.1781184673309326, "Pretrain/Step": 8115, "Pretrain/Step Time": 8.511513222008944} +{"Pretrain/Learning Rate": 2.8548043436090577e-06, "Pretrain/Loss": 2.031906843185425, "Pretrain/Loss (Raw)": 1.9903377294540405, "Pretrain/Step": 8116, "Pretrain/Step Time": 8.50843359529972} +{"Pretrain/Learning Rate": 2.8508658758614944e-06, "Pretrain/Loss": 2.034428834915161, "Pretrain/Loss (Raw)": 2.08945894241333, "Pretrain/Step": 8117, "Pretrain/Step Time": 8.510809818282723} +{"Pretrain/Learning Rate": 2.846929962456446e-06, "Pretrain/Loss": 2.035207748413086, "Pretrain/Loss (Raw)": 2.0816709995269775, "Pretrain/Step": 8118, "Pretrain/Step Time": 8.51757107116282} +{"Pretrain/Learning Rate": 2.8429966038478196e-06, "Pretrain/Loss": 2.0340821743011475, "Pretrain/Loss (Raw)": 1.8879899978637695, "Pretrain/Step": 8119, "Pretrain/Step Time": 8.517311135306954} +{"Pretrain/Learning Rate": 2.839065800489235e-06, "Pretrain/Loss": 2.034525156021118, "Pretrain/Loss (Raw)": 2.218146562576294, "Pretrain/Step": 8120, "Pretrain/Step Time": 8.515547960996628} +{"Pretrain/Learning Rate": 2.835137552834008e-06, "Pretrain/Loss": 2.0331687927246094, "Pretrain/Loss (Raw)": 2.161926507949829, "Pretrain/Step": 8121, "Pretrain/Step Time": 8.51392463222146} +{"Pretrain/Learning Rate": 2.8312118613351644e-06, "Pretrain/Loss": 2.0336012840270996, "Pretrain/Loss (Raw)": 2.0669376850128174, "Pretrain/Step": 8122, "Pretrain/Step Time": 8.506331695243716} +{"Pretrain/Learning Rate": 2.8272887264454262e-06, "Pretrain/Loss": 2.033748149871826, "Pretrain/Loss (Raw)": 2.0769107341766357, "Pretrain/Step": 8123, "Pretrain/Step Time": 8.503976048901677} +{"Pretrain/Learning Rate": 2.8233681486172393e-06, "Pretrain/Loss": 2.0332961082458496, "Pretrain/Loss (Raw)": 1.9557206630706787, "Pretrain/Step": 8124, "Pretrain/Step Time": 8.502599889412522} +{"Pretrain/Learning Rate": 2.8194501283027366e-06, "Pretrain/Loss": 2.034168243408203, "Pretrain/Loss (Raw)": 2.040609359741211, "Pretrain/Step": 8125, "Pretrain/Step Time": 8.514333095401525} +{"Pretrain/Learning Rate": 2.815534665953762e-06, "Pretrain/Loss": 2.0334134101867676, "Pretrain/Loss (Raw)": 1.9400051832199097, "Pretrain/Step": 8126, "Pretrain/Step Time": 8.514159509912133} +{"Pretrain/Learning Rate": 2.8116217620218626e-06, "Pretrain/Loss": 2.0359463691711426, "Pretrain/Loss (Raw)": 2.1117100715637207, "Pretrain/Step": 8127, "Pretrain/Step Time": 8.51765450462699} +{"Pretrain/Learning Rate": 2.8077114169583e-06, "Pretrain/Loss": 2.037108898162842, "Pretrain/Loss (Raw)": 2.0819480419158936, "Pretrain/Step": 8128, "Pretrain/Step Time": 8.509199939668179} +{"Pretrain/Learning Rate": 2.8038036312140333e-06, "Pretrain/Loss": 2.0388424396514893, "Pretrain/Loss (Raw)": 2.0043540000915527, "Pretrain/Step": 8129, "Pretrain/Step Time": 8.509246429428458} +{"Pretrain/Learning Rate": 2.79989840523972e-06, "Pretrain/Loss": 2.038658857345581, "Pretrain/Loss (Raw)": 2.065042018890381, "Pretrain/Step": 8130, "Pretrain/Step Time": 8.513243291527033} +{"Pretrain/Learning Rate": 2.795995739485732e-06, "Pretrain/Loss": 2.0381758213043213, "Pretrain/Loss (Raw)": 1.9642670154571533, "Pretrain/Step": 8131, "Pretrain/Step Time": 8.515811195597053} +{"Pretrain/Learning Rate": 2.7920956344021475e-06, "Pretrain/Loss": 2.035987377166748, "Pretrain/Loss (Raw)": 1.8477239608764648, "Pretrain/Step": 8132, "Pretrain/Step Time": 8.524600498378277} +{"Pretrain/Learning Rate": 2.78819809043874e-06, "Pretrain/Loss": 2.034719944000244, "Pretrain/Loss (Raw)": 1.9817581176757812, "Pretrain/Step": 8133, "Pretrain/Step Time": 8.520594919100404} +{"Pretrain/Learning Rate": 2.7843031080449944e-06, "Pretrain/Loss": 2.034287214279175, "Pretrain/Loss (Raw)": 1.877671241760254, "Pretrain/Step": 8134, "Pretrain/Step Time": 8.517290197312832} +{"Pretrain/Learning Rate": 2.780410687670096e-06, "Pretrain/Loss": 2.035506248474121, "Pretrain/Loss (Raw)": 1.981399655342102, "Pretrain/Step": 8135, "Pretrain/Step Time": 8.511842491105199} +{"Pretrain/Learning Rate": 2.776520829762941e-06, "Pretrain/Loss": 2.0365958213806152, "Pretrain/Loss (Raw)": 2.1470367908477783, "Pretrain/Step": 8136, "Pretrain/Step Time": 8.517294809222221} +{"Pretrain/Learning Rate": 2.7726335347721263e-06, "Pretrain/Loss": 2.039177417755127, "Pretrain/Loss (Raw)": 2.222834587097168, "Pretrain/Step": 8137, "Pretrain/Step Time": 8.523123115301132} +{"Pretrain/Learning Rate": 2.7687488031459484e-06, "Pretrain/Loss": 2.0393104553222656, "Pretrain/Loss (Raw)": 2.0417673587799072, "Pretrain/Step": 8138, "Pretrain/Step Time": 8.527758238837123} +{"Pretrain/Learning Rate": 2.7648666353324136e-06, "Pretrain/Loss": 2.0428011417388916, "Pretrain/Loss (Raw)": 2.264000177383423, "Pretrain/Step": 8139, "Pretrain/Step Time": 8.524965565651655} +{"Pretrain/Learning Rate": 2.7609870317792385e-06, "Pretrain/Loss": 2.0415802001953125, "Pretrain/Loss (Raw)": 1.9317518472671509, "Pretrain/Step": 8140, "Pretrain/Step Time": 8.525824382901192} +{"Pretrain/Learning Rate": 2.757109992933832e-06, "Pretrain/Loss": 2.0382003784179688, "Pretrain/Loss (Raw)": 1.8715726137161255, "Pretrain/Step": 8141, "Pretrain/Step Time": 8.52005104534328} +{"Pretrain/Learning Rate": 2.753235519243308e-06, "Pretrain/Loss": 2.0390915870666504, "Pretrain/Loss (Raw)": 2.17317795753479, "Pretrain/Step": 8142, "Pretrain/Step Time": 8.524916494265199} +{"Pretrain/Learning Rate": 2.7493636111544985e-06, "Pretrain/Loss": 2.03373384475708, "Pretrain/Loss (Raw)": 1.7560960054397583, "Pretrain/Step": 8143, "Pretrain/Step Time": 8.532572453841567} +{"Pretrain/Learning Rate": 2.745494269113927e-06, "Pretrain/Loss": 2.0352911949157715, "Pretrain/Loss (Raw)": 2.2224068641662598, "Pretrain/Step": 8144, "Pretrain/Step Time": 8.533204562962055} +{"Pretrain/Learning Rate": 2.741627493567822e-06, "Pretrain/Loss": 2.03633975982666, "Pretrain/Loss (Raw)": 1.9973235130310059, "Pretrain/Step": 8145, "Pretrain/Step Time": 8.533321589231491} +{"Pretrain/Learning Rate": 2.7377632849621164e-06, "Pretrain/Loss": 2.0374248027801514, "Pretrain/Loss (Raw)": 1.9755781888961792, "Pretrain/Step": 8146, "Pretrain/Step Time": 8.530528966337442} +{"Pretrain/Learning Rate": 2.7339016437424535e-06, "Pretrain/Loss": 2.0375101566314697, "Pretrain/Loss (Raw)": 2.0495212078094482, "Pretrain/Step": 8147, "Pretrain/Step Time": 8.52590194530785} +{"Pretrain/Learning Rate": 2.7300425703541773e-06, "Pretrain/Loss": 2.0363426208496094, "Pretrain/Loss (Raw)": 1.9840774536132812, "Pretrain/Step": 8148, "Pretrain/Step Time": 8.527359766885638} +{"Pretrain/Learning Rate": 2.726186065242331e-06, "Pretrain/Loss": 2.0362675189971924, "Pretrain/Loss (Raw)": 2.0152039527893066, "Pretrain/Step": 8149, "Pretrain/Step Time": 8.529084511101246} +{"Pretrain/Learning Rate": 2.7223321288516597e-06, "Pretrain/Loss": 2.0341155529022217, "Pretrain/Loss (Raw)": 1.998387098312378, "Pretrain/Step": 8150, "Pretrain/Step Time": 8.534769112244248} +{"Pretrain/Learning Rate": 2.7184807616266323e-06, "Pretrain/Loss": 2.0398268699645996, "Pretrain/Loss (Raw)": 2.1435813903808594, "Pretrain/Step": 8151, "Pretrain/Step Time": 8.52022597566247} +{"Pretrain/Learning Rate": 2.714631964011388e-06, "Pretrain/Loss": 2.0407347679138184, "Pretrain/Loss (Raw)": 2.1788268089294434, "Pretrain/Step": 8152, "Pretrain/Step Time": 8.517842795699835} +{"Pretrain/Learning Rate": 2.7107857364498027e-06, "Pretrain/Loss": 2.0394067764282227, "Pretrain/Loss (Raw)": 1.9217990636825562, "Pretrain/Step": 8153, "Pretrain/Step Time": 8.524513451382518} +{"Pretrain/Learning Rate": 2.7069420793854298e-06, "Pretrain/Loss": 2.041810989379883, "Pretrain/Loss (Raw)": 2.016195297241211, "Pretrain/Step": 8154, "Pretrain/Step Time": 8.524153446778655} +{"Pretrain/Learning Rate": 2.7031009932615563e-06, "Pretrain/Loss": 2.040367841720581, "Pretrain/Loss (Raw)": 1.9255658388137817, "Pretrain/Step": 8155, "Pretrain/Step Time": 8.527027696371078} +{"Pretrain/Learning Rate": 2.6992624785211334e-06, "Pretrain/Loss": 2.041050434112549, "Pretrain/Loss (Raw)": 1.9534261226654053, "Pretrain/Step": 8156, "Pretrain/Step Time": 8.532667616382241} +{"Pretrain/Learning Rate": 2.6954265356068515e-06, "Pretrain/Loss": 2.038937568664551, "Pretrain/Loss (Raw)": 2.033142566680908, "Pretrain/Step": 8157, "Pretrain/Step Time": 8.522016385570168} +{"Pretrain/Learning Rate": 2.691593164961084e-06, "Pretrain/Loss": 2.038637161254883, "Pretrain/Loss (Raw)": 1.9296225309371948, "Pretrain/Step": 8158, "Pretrain/Step Time": 8.521208487451077} +{"Pretrain/Learning Rate": 2.6877623670259115e-06, "Pretrain/Loss": 2.0409908294677734, "Pretrain/Loss (Raw)": 2.2175302505493164, "Pretrain/Step": 8159, "Pretrain/Step Time": 8.51937823370099} +{"Pretrain/Learning Rate": 2.6839341422431165e-06, "Pretrain/Loss": 2.0415234565734863, "Pretrain/Loss (Raw)": 2.0110692977905273, "Pretrain/Step": 8160, "Pretrain/Step Time": 8.515949944034219} +{"Pretrain/Learning Rate": 2.6801084910542008e-06, "Pretrain/Loss": 2.0433013439178467, "Pretrain/Loss (Raw)": 2.0492029190063477, "Pretrain/Step": 8161, "Pretrain/Step Time": 8.522705474868417} +{"Pretrain/Learning Rate": 2.6762854139003452e-06, "Pretrain/Loss": 2.039644479751587, "Pretrain/Loss (Raw)": 1.8011952638626099, "Pretrain/Step": 8162, "Pretrain/Step Time": 8.522429237142205} +{"Pretrain/Learning Rate": 2.6724649112224496e-06, "Pretrain/Loss": 2.040417194366455, "Pretrain/Loss (Raw)": 2.139500379562378, "Pretrain/Step": 8163, "Pretrain/Step Time": 8.517083698883653} +{"Pretrain/Learning Rate": 2.6686469834611066e-06, "Pretrain/Loss": 2.0389468669891357, "Pretrain/Loss (Raw)": 1.9041368961334229, "Pretrain/Step": 8164, "Pretrain/Step Time": 8.509992288425565} +{"Pretrain/Learning Rate": 2.66483163105663e-06, "Pretrain/Loss": 2.03910231590271, "Pretrain/Loss (Raw)": 2.101574659347534, "Pretrain/Step": 8165, "Pretrain/Step Time": 8.517427451908588} +{"Pretrain/Learning Rate": 2.6610188544490126e-06, "Pretrain/Loss": 2.0406527519226074, "Pretrain/Loss (Raw)": 2.1895434856414795, "Pretrain/Step": 8166, "Pretrain/Step Time": 8.520482763648033} +{"Pretrain/Learning Rate": 2.657208654077967e-06, "Pretrain/Loss": 2.03950834274292, "Pretrain/Loss (Raw)": 1.9512196779251099, "Pretrain/Step": 8167, "Pretrain/Step Time": 8.523956015706062} +{"Pretrain/Learning Rate": 2.653401030382896e-06, "Pretrain/Loss": 2.0384812355041504, "Pretrain/Loss (Raw)": 1.9099009037017822, "Pretrain/Step": 8168, "Pretrain/Step Time": 8.52228264324367} +{"Pretrain/Learning Rate": 2.649595983802927e-06, "Pretrain/Loss": 2.038239002227783, "Pretrain/Loss (Raw)": 2.130812644958496, "Pretrain/Step": 8169, "Pretrain/Step Time": 8.52269995957613} +{"Pretrain/Learning Rate": 2.645793514776865e-06, "Pretrain/Loss": 2.038553237915039, "Pretrain/Loss (Raw)": 2.0114381313323975, "Pretrain/Step": 8170, "Pretrain/Step Time": 8.51364753395319} +{"Pretrain/Learning Rate": 2.64199362374323e-06, "Pretrain/Loss": 2.03888201713562, "Pretrain/Loss (Raw)": 1.917216420173645, "Pretrain/Step": 8171, "Pretrain/Step Time": 8.515944747254252} +{"Pretrain/Learning Rate": 2.6381963111402423e-06, "Pretrain/Loss": 2.039588451385498, "Pretrain/Loss (Raw)": 1.997002363204956, "Pretrain/Step": 8172, "Pretrain/Step Time": 8.516335647553205} +{"Pretrain/Learning Rate": 2.6344015774058345e-06, "Pretrain/Loss": 2.039769411087036, "Pretrain/Loss (Raw)": 1.986305832862854, "Pretrain/Step": 8173, "Pretrain/Step Time": 8.518777415156364} +{"Pretrain/Learning Rate": 2.630609422977623e-06, "Pretrain/Loss": 2.0382862091064453, "Pretrain/Loss (Raw)": 1.7771990299224854, "Pretrain/Step": 8174, "Pretrain/Step Time": 8.523989776149392} +{"Pretrain/Learning Rate": 2.6268198482929442e-06, "Pretrain/Loss": 2.0364060401916504, "Pretrain/Loss (Raw)": 2.072662591934204, "Pretrain/Step": 8175, "Pretrain/Step Time": 8.52275600284338} +{"Pretrain/Learning Rate": 2.6230328537888204e-06, "Pretrain/Loss": 2.039278984069824, "Pretrain/Loss (Raw)": 2.0046463012695312, "Pretrain/Step": 8176, "Pretrain/Step Time": 8.51385392807424} +{"Pretrain/Learning Rate": 2.6192484399019947e-06, "Pretrain/Loss": 2.0395290851593018, "Pretrain/Loss (Raw)": 2.128999948501587, "Pretrain/Step": 8177, "Pretrain/Step Time": 8.52239920757711} +{"Pretrain/Learning Rate": 2.615466607068903e-06, "Pretrain/Loss": 2.038086414337158, "Pretrain/Loss (Raw)": 2.0544068813323975, "Pretrain/Step": 8178, "Pretrain/Step Time": 8.51688282750547} +{"Pretrain/Learning Rate": 2.611687355725681e-06, "Pretrain/Loss": 2.0394787788391113, "Pretrain/Loss (Raw)": 2.050776720046997, "Pretrain/Step": 8179, "Pretrain/Step Time": 8.515840612351894} +{"Pretrain/Learning Rate": 2.6079106863081655e-06, "Pretrain/Loss": 2.0392708778381348, "Pretrain/Loss (Raw)": 1.9455931186676025, "Pretrain/Step": 8180, "Pretrain/Step Time": 8.51939175836742} +{"Pretrain/Learning Rate": 2.604136599251908e-06, "Pretrain/Loss": 2.0381205081939697, "Pretrain/Loss (Raw)": 1.9423584938049316, "Pretrain/Step": 8181, "Pretrain/Step Time": 8.510370966047049} +{"Pretrain/Learning Rate": 2.600365094992152e-06, "Pretrain/Loss": 2.035780429840088, "Pretrain/Loss (Raw)": 1.9144659042358398, "Pretrain/Step": 8182, "Pretrain/Step Time": 8.506663715466857} +{"Pretrain/Learning Rate": 2.596596173963839e-06, "Pretrain/Loss": 2.035459041595459, "Pretrain/Loss (Raw)": 1.9202238321304321, "Pretrain/Step": 8183, "Pretrain/Step Time": 8.506559036672115} +{"Pretrain/Learning Rate": 2.592829836601629e-06, "Pretrain/Loss": 2.0347280502319336, "Pretrain/Loss (Raw)": 2.069424867630005, "Pretrain/Step": 8184, "Pretrain/Step Time": 8.510412808507681} +{"Pretrain/Learning Rate": 2.5890660833398667e-06, "Pretrain/Loss": 2.0337588787078857, "Pretrain/Loss (Raw)": 1.960081934928894, "Pretrain/Step": 8185, "Pretrain/Step Time": 8.516028609126806} +{"Pretrain/Learning Rate": 2.5853049146126076e-06, "Pretrain/Loss": 2.03155779838562, "Pretrain/Loss (Raw)": 1.9005458354949951, "Pretrain/Step": 8186, "Pretrain/Step Time": 8.523210283368826} +{"Pretrain/Learning Rate": 2.581546330853604e-06, "Pretrain/Loss": 2.0354607105255127, "Pretrain/Loss (Raw)": 2.2517573833465576, "Pretrain/Step": 8187, "Pretrain/Step Time": 8.5183762088418} +{"Pretrain/Learning Rate": 2.5777903324963187e-06, "Pretrain/Loss": 2.036324977874756, "Pretrain/Loss (Raw)": 2.0821218490600586, "Pretrain/Step": 8188, "Pretrain/Step Time": 8.511062685400248} +{"Pretrain/Learning Rate": 2.574036919973913e-06, "Pretrain/Loss": 2.038661479949951, "Pretrain/Loss (Raw)": 2.020617723464966, "Pretrain/Step": 8189, "Pretrain/Step Time": 8.512250274419785} +{"Pretrain/Learning Rate": 2.5702860937192403e-06, "Pretrain/Loss": 2.0378098487854004, "Pretrain/Loss (Raw)": 2.0619375705718994, "Pretrain/Step": 8190, "Pretrain/Step Time": 8.520849401131272} +{"Pretrain/Learning Rate": 2.566537854164866e-06, "Pretrain/Loss": 2.0398097038269043, "Pretrain/Loss (Raw)": 1.9547516107559204, "Pretrain/Step": 8191, "Pretrain/Step Time": 8.519825277850032} +{"Pretrain/Learning Rate": 2.5627922017430637e-06, "Pretrain/Loss": 2.040266990661621, "Pretrain/Loss (Raw)": 2.170034885406494, "Pretrain/Step": 8192, "Pretrain/Step Time": 8.518528105691075} +{"Pretrain/Learning Rate": 2.559049136885783e-06, "Pretrain/Loss": 2.0414981842041016, "Pretrain/Loss (Raw)": 2.0146236419677734, "Pretrain/Step": 8193, "Pretrain/Step Time": 8.510747300460935} +{"Pretrain/Learning Rate": 2.555308660024708e-06, "Pretrain/Loss": 2.0407958030700684, "Pretrain/Loss (Raw)": 1.9954992532730103, "Pretrain/Step": 8194, "Pretrain/Step Time": 8.51282918639481} +{"Pretrain/Learning Rate": 2.551570771591194e-06, "Pretrain/Loss": 2.040614604949951, "Pretrain/Loss (Raw)": 2.0284221172332764, "Pretrain/Step": 8195, "Pretrain/Step Time": 8.51245073787868} +{"Pretrain/Learning Rate": 2.54783547201633e-06, "Pretrain/Loss": 2.040306568145752, "Pretrain/Loss (Raw)": 2.093162775039673, "Pretrain/Step": 8196, "Pretrain/Step Time": 8.514778876677155} +{"Pretrain/Learning Rate": 2.5441027617308684e-06, "Pretrain/Loss": 2.0398874282836914, "Pretrain/Loss (Raw)": 2.120335340499878, "Pretrain/Step": 8197, "Pretrain/Step Time": 8.51345763169229} +{"Pretrain/Learning Rate": 2.540372641165295e-06, "Pretrain/Loss": 2.0417816638946533, "Pretrain/Loss (Raw)": 2.140721082687378, "Pretrain/Step": 8198, "Pretrain/Step Time": 8.515218369662762} +{"Pretrain/Learning Rate": 2.536645110749783e-06, "Pretrain/Loss": 2.0414021015167236, "Pretrain/Loss (Raw)": 1.9565227031707764, "Pretrain/Step": 8199, "Pretrain/Step Time": 8.511378491297364} +{"Pretrain/Learning Rate": 2.5329201709142074e-06, "Pretrain/Loss": 2.0385279655456543, "Pretrain/Loss (Raw)": 1.8851449489593506, "Pretrain/Step": 8200, "Pretrain/Step Time": 8.500412123277783} +{"Pretrain/Learning Rate": 2.5291978220881416e-06, "Pretrain/Loss": 2.0398921966552734, "Pretrain/Loss (Raw)": 2.0677523612976074, "Pretrain/Step": 8201, "Pretrain/Step Time": 8.502593969926238} +{"Pretrain/Learning Rate": 2.525478064700873e-06, "Pretrain/Loss": 2.0391054153442383, "Pretrain/Loss (Raw)": 2.0741193294525146, "Pretrain/Step": 8202, "Pretrain/Step Time": 8.510075736790895} +{"Pretrain/Learning Rate": 2.5217608991813776e-06, "Pretrain/Loss": 2.0384128093719482, "Pretrain/Loss (Raw)": 2.1035749912261963, "Pretrain/Step": 8203, "Pretrain/Step Time": 8.51242245733738} +{"Pretrain/Learning Rate": 2.5180463259583344e-06, "Pretrain/Loss": 2.0351028442382812, "Pretrain/Loss (Raw)": 2.069148302078247, "Pretrain/Step": 8204, "Pretrain/Step Time": 8.516907749697566} +{"Pretrain/Learning Rate": 2.514334345460126e-06, "Pretrain/Loss": 2.037639856338501, "Pretrain/Loss (Raw)": 2.2360262870788574, "Pretrain/Step": 8205, "Pretrain/Step Time": 8.51860305480659} +{"Pretrain/Learning Rate": 2.5106249581148406e-06, "Pretrain/Loss": 2.0371670722961426, "Pretrain/Loss (Raw)": 1.980918526649475, "Pretrain/Step": 8206, "Pretrain/Step Time": 8.516833191737533} +{"Pretrain/Learning Rate": 2.5069181643502552e-06, "Pretrain/Loss": 2.0385966300964355, "Pretrain/Loss (Raw)": 2.1344335079193115, "Pretrain/Step": 8207, "Pretrain/Step Time": 8.515024235472083} +{"Pretrain/Learning Rate": 2.503213964593862e-06, "Pretrain/Loss": 2.0406546592712402, "Pretrain/Loss (Raw)": 2.3031365871429443, "Pretrain/Step": 8208, "Pretrain/Step Time": 8.524345435202122} +{"Pretrain/Learning Rate": 2.4995123592728374e-06, "Pretrain/Loss": 2.0413873195648193, "Pretrain/Loss (Raw)": 1.9903427362442017, "Pretrain/Step": 8209, "Pretrain/Step Time": 8.519220909103751} +{"Pretrain/Learning Rate": 2.495813348814077e-06, "Pretrain/Loss": 2.0422215461730957, "Pretrain/Loss (Raw)": 1.8176827430725098, "Pretrain/Step": 8210, "Pretrain/Step Time": 8.51612707413733} +{"Pretrain/Learning Rate": 2.4921169336441645e-06, "Pretrain/Loss": 2.0416083335876465, "Pretrain/Loss (Raw)": 2.134019374847412, "Pretrain/Step": 8211, "Pretrain/Step Time": 8.514531204476953} +{"Pretrain/Learning Rate": 2.4884231141893864e-06, "Pretrain/Loss": 2.042250156402588, "Pretrain/Loss (Raw)": 2.140956163406372, "Pretrain/Step": 8212, "Pretrain/Step Time": 8.50666026212275} +{"Pretrain/Learning Rate": 2.48473189087573e-06, "Pretrain/Loss": 2.0420327186584473, "Pretrain/Loss (Raw)": 1.9666281938552856, "Pretrain/Step": 8213, "Pretrain/Step Time": 8.51197935640812} +{"Pretrain/Learning Rate": 2.4810432641288933e-06, "Pretrain/Loss": 2.0386202335357666, "Pretrain/Loss (Raw)": 1.688997507095337, "Pretrain/Step": 8214, "Pretrain/Step Time": 8.515436604619026} +{"Pretrain/Learning Rate": 2.4773572343742584e-06, "Pretrain/Loss": 2.037574291229248, "Pretrain/Loss (Raw)": 2.1088290214538574, "Pretrain/Step": 8215, "Pretrain/Step Time": 8.516545401886106} +{"Pretrain/Learning Rate": 2.473673802036916e-06, "Pretrain/Loss": 2.038151502609253, "Pretrain/Loss (Raw)": 2.1335301399230957, "Pretrain/Step": 8216, "Pretrain/Step Time": 8.51860942132771} +{"Pretrain/Learning Rate": 2.4699929675416565e-06, "Pretrain/Loss": 2.036635637283325, "Pretrain/Loss (Raw)": 1.9139553308486938, "Pretrain/Step": 8217, "Pretrain/Step Time": 8.513566132634878} +{"Pretrain/Learning Rate": 2.466314731312977e-06, "Pretrain/Loss": 2.039538621902466, "Pretrain/Loss (Raw)": 2.291167974472046, "Pretrain/Step": 8218, "Pretrain/Step Time": 8.509057013317943} +{"Pretrain/Learning Rate": 2.4626390937750624e-06, "Pretrain/Loss": 2.039618492126465, "Pretrain/Loss (Raw)": 2.119107723236084, "Pretrain/Step": 8219, "Pretrain/Step Time": 8.505211398005486} +{"Pretrain/Learning Rate": 2.4589660553518108e-06, "Pretrain/Loss": 2.0388646125793457, "Pretrain/Loss (Raw)": 1.976942539215088, "Pretrain/Step": 8220, "Pretrain/Step Time": 8.509039007127285} +{"Pretrain/Learning Rate": 2.4552956164668018e-06, "Pretrain/Loss": 2.0367369651794434, "Pretrain/Loss (Raw)": 2.023111581802368, "Pretrain/Step": 8221, "Pretrain/Step Time": 8.518726252019405} +{"Pretrain/Learning Rate": 2.4516277775433443e-06, "Pretrain/Loss": 2.036876678466797, "Pretrain/Loss (Raw)": 2.1028764247894287, "Pretrain/Step": 8222, "Pretrain/Step Time": 8.520742068067193} +{"Pretrain/Learning Rate": 2.4479625390044226e-06, "Pretrain/Loss": 2.038853883743286, "Pretrain/Loss (Raw)": 2.1270840167999268, "Pretrain/Step": 8223, "Pretrain/Step Time": 8.515976455062628} +{"Pretrain/Learning Rate": 2.444299901272723e-06, "Pretrain/Loss": 2.038147449493408, "Pretrain/Loss (Raw)": 1.952202320098877, "Pretrain/Step": 8224, "Pretrain/Step Time": 8.521051352843642} +{"Pretrain/Learning Rate": 2.4406398647706523e-06, "Pretrain/Loss": 2.038055181503296, "Pretrain/Loss (Raw)": 1.8425887823104858, "Pretrain/Step": 8225, "Pretrain/Step Time": 8.523127319291234} +{"Pretrain/Learning Rate": 2.4369824299202926e-06, "Pretrain/Loss": 2.0343573093414307, "Pretrain/Loss (Raw)": 1.723763108253479, "Pretrain/Step": 8226, "Pretrain/Step Time": 8.526366885751486} +{"Pretrain/Learning Rate": 2.433327597143442e-06, "Pretrain/Loss": 2.0346455574035645, "Pretrain/Loss (Raw)": 1.9956121444702148, "Pretrain/Step": 8227, "Pretrain/Step Time": 8.525016596540809} +{"Pretrain/Learning Rate": 2.4296753668615833e-06, "Pretrain/Loss": 2.0335001945495605, "Pretrain/Loss (Raw)": 2.085341691970825, "Pretrain/Step": 8228, "Pretrain/Step Time": 8.523854311555624} +{"Pretrain/Learning Rate": 2.4260257394959213e-06, "Pretrain/Loss": 2.03385591506958, "Pretrain/Loss (Raw)": 2.10498309135437, "Pretrain/Step": 8229, "Pretrain/Step Time": 8.517442155629396} +{"Pretrain/Learning Rate": 2.422378715467344e-06, "Pretrain/Loss": 2.0337910652160645, "Pretrain/Loss (Raw)": 1.911607265472412, "Pretrain/Step": 8230, "Pretrain/Step Time": 8.514867648482323} +{"Pretrain/Learning Rate": 2.4187342951964424e-06, "Pretrain/Loss": 2.0331177711486816, "Pretrain/Loss (Raw)": 2.120217800140381, "Pretrain/Step": 8231, "Pretrain/Step Time": 8.514244494959712} +{"Pretrain/Learning Rate": 2.4150924791035035e-06, "Pretrain/Loss": 2.030745029449463, "Pretrain/Loss (Raw)": 2.0313191413879395, "Pretrain/Step": 8232, "Pretrain/Step Time": 8.52551251091063} +{"Pretrain/Learning Rate": 2.411453267608535e-06, "Pretrain/Loss": 2.0298359394073486, "Pretrain/Loss (Raw)": 1.963125467300415, "Pretrain/Step": 8233, "Pretrain/Step Time": 8.527271255850792} +{"Pretrain/Learning Rate": 2.4078166611312044e-06, "Pretrain/Loss": 2.0264840126037598, "Pretrain/Loss (Raw)": 1.7536331415176392, "Pretrain/Step": 8234, "Pretrain/Step Time": 8.52203587628901} +{"Pretrain/Learning Rate": 2.40418266009092e-06, "Pretrain/Loss": 2.0261688232421875, "Pretrain/Loss (Raw)": 1.9184513092041016, "Pretrain/Step": 8235, "Pretrain/Step Time": 8.5192192196846} +{"Pretrain/Learning Rate": 2.4005512649067612e-06, "Pretrain/Loss": 2.028278350830078, "Pretrain/Loss (Raw)": 2.217539072036743, "Pretrain/Step": 8236, "Pretrain/Step Time": 8.5106565002352} +{"Pretrain/Learning Rate": 2.396922475997532e-06, "Pretrain/Loss": 2.0298266410827637, "Pretrain/Loss (Raw)": 2.0462088584899902, "Pretrain/Step": 8237, "Pretrain/Step Time": 8.510349256917834} +{"Pretrain/Learning Rate": 2.393296293781702e-06, "Pretrain/Loss": 2.031724452972412, "Pretrain/Loss (Raw)": 2.1418263912200928, "Pretrain/Step": 8238, "Pretrain/Step Time": 8.525455504655838} +{"Pretrain/Learning Rate": 2.3896727186774744e-06, "Pretrain/Loss": 2.028801918029785, "Pretrain/Loss (Raw)": 1.7903202772140503, "Pretrain/Step": 8239, "Pretrain/Step Time": 8.5239187926054} +{"Pretrain/Learning Rate": 2.386051751102733e-06, "Pretrain/Loss": 2.0282809734344482, "Pretrain/Loss (Raw)": 2.0765042304992676, "Pretrain/Step": 8240, "Pretrain/Step Time": 8.51671545021236} +{"Pretrain/Learning Rate": 2.382433391475064e-06, "Pretrain/Loss": 2.026218891143799, "Pretrain/Loss (Raw)": 1.9143449068069458, "Pretrain/Step": 8241, "Pretrain/Step Time": 8.516095124185085} +{"Pretrain/Learning Rate": 2.3788176402117502e-06, "Pretrain/Loss": 2.026939868927002, "Pretrain/Loss (Raw)": 2.163064479827881, "Pretrain/Step": 8242, "Pretrain/Step Time": 8.511647161096334} +{"Pretrain/Learning Rate": 2.3752044977297827e-06, "Pretrain/Loss": 2.0261993408203125, "Pretrain/Loss (Raw)": 2.083334445953369, "Pretrain/Step": 8243, "Pretrain/Step Time": 8.519529091194272} +{"Pretrain/Learning Rate": 2.371593964445845e-06, "Pretrain/Loss": 2.0268588066101074, "Pretrain/Loss (Raw)": 2.0747463703155518, "Pretrain/Step": 8244, "Pretrain/Step Time": 8.52269435301423} +{"Pretrain/Learning Rate": 2.367986040776321e-06, "Pretrain/Loss": 2.025460720062256, "Pretrain/Loss (Raw)": 1.9104868173599243, "Pretrain/Step": 8245, "Pretrain/Step Time": 8.530074244365096} +{"Pretrain/Learning Rate": 2.3643807271372886e-06, "Pretrain/Loss": 2.024113416671753, "Pretrain/Loss (Raw)": 1.9092516899108887, "Pretrain/Step": 8246, "Pretrain/Step Time": 8.519424673169851} +{"Pretrain/Learning Rate": 2.360778023944535e-06, "Pretrain/Loss": 2.0257513523101807, "Pretrain/Loss (Raw)": 2.097635269165039, "Pretrain/Step": 8247, "Pretrain/Step Time": 8.518990609794855} +{"Pretrain/Learning Rate": 2.3571779316135413e-06, "Pretrain/Loss": 2.0225818157196045, "Pretrain/Loss (Raw)": 1.8124463558197021, "Pretrain/Step": 8248, "Pretrain/Step Time": 8.51920091547072} +{"Pretrain/Learning Rate": 2.3535804505594837e-06, "Pretrain/Loss": 2.0208098888397217, "Pretrain/Loss (Raw)": 1.935128927230835, "Pretrain/Step": 8249, "Pretrain/Step Time": 8.518588811159134} +{"Pretrain/Learning Rate": 2.3499855811972393e-06, "Pretrain/Loss": 2.020599365234375, "Pretrain/Loss (Raw)": 2.0399885177612305, "Pretrain/Step": 8250, "Pretrain/Step Time": 8.527871487662196} +{"Pretrain/Learning Rate": 2.34639332394139e-06, "Pretrain/Loss": 2.0216026306152344, "Pretrain/Loss (Raw)": 2.205331325531006, "Pretrain/Step": 8251, "Pretrain/Step Time": 8.532842928543687} +{"Pretrain/Learning Rate": 2.3428036792062124e-06, "Pretrain/Loss": 2.0221190452575684, "Pretrain/Loss (Raw)": 2.021839141845703, "Pretrain/Step": 8252, "Pretrain/Step Time": 8.529076877981424} +{"Pretrain/Learning Rate": 2.3392166474056758e-06, "Pretrain/Loss": 2.0210185050964355, "Pretrain/Loss (Raw)": 1.8997318744659424, "Pretrain/Step": 8253, "Pretrain/Step Time": 8.51643394306302} +{"Pretrain/Learning Rate": 2.3356322289534547e-06, "Pretrain/Loss": 2.022346019744873, "Pretrain/Loss (Raw)": 2.109910488128662, "Pretrain/Step": 8254, "Pretrain/Step Time": 8.513631163164973} +{"Pretrain/Learning Rate": 2.332050424262927e-06, "Pretrain/Loss": 2.0217714309692383, "Pretrain/Loss (Raw)": 2.038154363632202, "Pretrain/Step": 8255, "Pretrain/Step Time": 8.505689593032002} +{"Pretrain/Learning Rate": 2.3284712337471593e-06, "Pretrain/Loss": 2.0199060440063477, "Pretrain/Loss (Raw)": 1.8431798219680786, "Pretrain/Step": 8256, "Pretrain/Step Time": 8.515971755608916} +{"Pretrain/Learning Rate": 2.3248946578189186e-06, "Pretrain/Loss": 2.019275665283203, "Pretrain/Loss (Raw)": 1.9236984252929688, "Pretrain/Step": 8257, "Pretrain/Step Time": 8.52064017765224} +{"Pretrain/Learning Rate": 2.321320696890672e-06, "Pretrain/Loss": 2.0226340293884277, "Pretrain/Loss (Raw)": 2.4949138164520264, "Pretrain/Step": 8258, "Pretrain/Step Time": 8.513954112306237} +{"Pretrain/Learning Rate": 2.317749351374593e-06, "Pretrain/Loss": 2.0195412635803223, "Pretrain/Loss (Raw)": 1.5683724880218506, "Pretrain/Step": 8259, "Pretrain/Step Time": 8.514865189790726} +{"Pretrain/Learning Rate": 2.3141806216825405e-06, "Pretrain/Loss": 2.0221590995788574, "Pretrain/Loss (Raw)": 2.18280029296875, "Pretrain/Step": 8260, "Pretrain/Step Time": 8.508739499375224} +{"Pretrain/Learning Rate": 2.310614508226078e-06, "Pretrain/Loss": 2.0217528343200684, "Pretrain/Loss (Raw)": 1.9297277927398682, "Pretrain/Step": 8261, "Pretrain/Step Time": 8.51147985085845} +{"Pretrain/Learning Rate": 2.3070510114164613e-06, "Pretrain/Loss": 2.022761821746826, "Pretrain/Loss (Raw)": 2.006869316101074, "Pretrain/Step": 8262, "Pretrain/Step Time": 8.519308092072606} +{"Pretrain/Learning Rate": 2.303490131664657e-06, "Pretrain/Loss": 2.0233452320098877, "Pretrain/Loss (Raw)": 2.0560503005981445, "Pretrain/Step": 8263, "Pretrain/Step Time": 8.523390026763082} +{"Pretrain/Learning Rate": 2.299931869381322e-06, "Pretrain/Loss": 2.0224084854125977, "Pretrain/Loss (Raw)": 2.0271456241607666, "Pretrain/Step": 8264, "Pretrain/Step Time": 8.51946560665965} +{"Pretrain/Learning Rate": 2.2963762249768067e-06, "Pretrain/Loss": 2.021303653717041, "Pretrain/Loss (Raw)": 2.0814208984375, "Pretrain/Step": 8265, "Pretrain/Step Time": 8.512470532208681} +{"Pretrain/Learning Rate": 2.2928231988611716e-06, "Pretrain/Loss": 2.019033908843994, "Pretrain/Loss (Raw)": 1.751230001449585, "Pretrain/Step": 8266, "Pretrain/Step Time": 8.506822399795055} +{"Pretrain/Learning Rate": 2.289272791444166e-06, "Pretrain/Loss": 2.0142998695373535, "Pretrain/Loss (Raw)": 1.6580480337142944, "Pretrain/Step": 8267, "Pretrain/Step Time": 8.508062893524766} +{"Pretrain/Learning Rate": 2.285725003135239e-06, "Pretrain/Loss": 2.0133113861083984, "Pretrain/Loss (Raw)": 1.8052089214324951, "Pretrain/Step": 8268, "Pretrain/Step Time": 8.515005446970463} +{"Pretrain/Learning Rate": 2.2821798343435314e-06, "Pretrain/Loss": 2.014096736907959, "Pretrain/Loss (Raw)": 1.972129225730896, "Pretrain/Step": 8269, "Pretrain/Step Time": 8.520729137584567} +{"Pretrain/Learning Rate": 2.2786372854779e-06, "Pretrain/Loss": 2.0123131275177, "Pretrain/Loss (Raw)": 1.9448641538619995, "Pretrain/Step": 8270, "Pretrain/Step Time": 8.515034014359117} +{"Pretrain/Learning Rate": 2.2750973569468843e-06, "Pretrain/Loss": 2.013864517211914, "Pretrain/Loss (Raw)": 1.9546611309051514, "Pretrain/Step": 8271, "Pretrain/Step Time": 8.508995762094855} +{"Pretrain/Learning Rate": 2.2715600491587245e-06, "Pretrain/Loss": 2.013110637664795, "Pretrain/Loss (Raw)": 2.125908851623535, "Pretrain/Step": 8272, "Pretrain/Step Time": 8.505964813753963} +{"Pretrain/Learning Rate": 2.268025362521353e-06, "Pretrain/Loss": 2.0118415355682373, "Pretrain/Loss (Raw)": 1.8348944187164307, "Pretrain/Step": 8273, "Pretrain/Step Time": 8.500709602609277} +{"Pretrain/Learning Rate": 2.264493297442424e-06, "Pretrain/Loss": 2.013120651245117, "Pretrain/Loss (Raw)": 2.1393253803253174, "Pretrain/Step": 8274, "Pretrain/Step Time": 8.506600299850106} +{"Pretrain/Learning Rate": 2.260963854329254e-06, "Pretrain/Loss": 2.012287139892578, "Pretrain/Loss (Raw)": 1.9427944421768188, "Pretrain/Step": 8275, "Pretrain/Step Time": 8.51057987473905} +{"Pretrain/Learning Rate": 2.2574370335888854e-06, "Pretrain/Loss": 2.0140843391418457, "Pretrain/Loss (Raw)": 2.2141354084014893, "Pretrain/Step": 8276, "Pretrain/Step Time": 8.505056455731392} +{"Pretrain/Learning Rate": 2.2539128356280387e-06, "Pretrain/Loss": 2.0145914554595947, "Pretrain/Loss (Raw)": 2.0800960063934326, "Pretrain/Step": 8277, "Pretrain/Step Time": 8.502586415037513} +{"Pretrain/Learning Rate": 2.2503912608531576e-06, "Pretrain/Loss": 2.0157339572906494, "Pretrain/Loss (Raw)": 2.1446433067321777, "Pretrain/Step": 8278, "Pretrain/Step Time": 8.502824114635587} +{"Pretrain/Learning Rate": 2.2468723096703447e-06, "Pretrain/Loss": 2.0157387256622314, "Pretrain/Loss (Raw)": 2.1441760063171387, "Pretrain/Step": 8279, "Pretrain/Step Time": 8.509538065642118} +{"Pretrain/Learning Rate": 2.24335598248544e-06, "Pretrain/Loss": 2.0129165649414062, "Pretrain/Loss (Raw)": 1.8176003694534302, "Pretrain/Step": 8280, "Pretrain/Step Time": 8.512373927980661} +{"Pretrain/Learning Rate": 2.239842279703952e-06, "Pretrain/Loss": 2.0115489959716797, "Pretrain/Loss (Raw)": 1.74674391746521, "Pretrain/Step": 8281, "Pretrain/Step Time": 8.516070071607828} +{"Pretrain/Learning Rate": 2.2363312017311094e-06, "Pretrain/Loss": 2.012214422225952, "Pretrain/Loss (Raw)": 2.101374626159668, "Pretrain/Step": 8282, "Pretrain/Step Time": 8.516298772767186} +{"Pretrain/Learning Rate": 2.2328227489718106e-06, "Pretrain/Loss": 2.0130772590637207, "Pretrain/Loss (Raw)": 2.036024332046509, "Pretrain/Step": 8283, "Pretrain/Step Time": 8.513244088739157} +{"Pretrain/Learning Rate": 2.229316921830679e-06, "Pretrain/Loss": 2.0148544311523438, "Pretrain/Loss (Raw)": 2.180901050567627, "Pretrain/Step": 8284, "Pretrain/Step Time": 8.510959777981043} +{"Pretrain/Learning Rate": 2.2258137207120165e-06, "Pretrain/Loss": 2.0166497230529785, "Pretrain/Loss (Raw)": 2.262913942337036, "Pretrain/Step": 8285, "Pretrain/Step Time": 8.520076360553503} +{"Pretrain/Learning Rate": 2.222313146019833e-06, "Pretrain/Loss": 2.016199827194214, "Pretrain/Loss (Raw)": 1.8720580339431763, "Pretrain/Step": 8286, "Pretrain/Step Time": 8.514966668561101} +{"Pretrain/Learning Rate": 2.2188151981578252e-06, "Pretrain/Loss": 2.0142223834991455, "Pretrain/Loss (Raw)": 1.96442711353302, "Pretrain/Step": 8287, "Pretrain/Step Time": 8.51331676542759} +{"Pretrain/Learning Rate": 2.215319877529404e-06, "Pretrain/Loss": 2.015725612640381, "Pretrain/Loss (Raw)": 2.2034783363342285, "Pretrain/Step": 8288, "Pretrain/Step Time": 8.51266816817224} +{"Pretrain/Learning Rate": 2.211827184537657e-06, "Pretrain/Loss": 2.0160322189331055, "Pretrain/Loss (Raw)": 2.088456153869629, "Pretrain/Step": 8289, "Pretrain/Step Time": 8.502645913511515} +{"Pretrain/Learning Rate": 2.2083371195853796e-06, "Pretrain/Loss": 2.0211052894592285, "Pretrain/Loss (Raw)": 2.450528621673584, "Pretrain/Step": 8290, "Pretrain/Step Time": 8.505411537364125} +{"Pretrain/Learning Rate": 2.204849683075061e-06, "Pretrain/Loss": 2.020573616027832, "Pretrain/Loss (Raw)": 2.0714638233184814, "Pretrain/Step": 8291, "Pretrain/Step Time": 8.512528521940112} +{"Pretrain/Learning Rate": 2.2013648754088954e-06, "Pretrain/Loss": 2.0220088958740234, "Pretrain/Loss (Raw)": 2.0878639221191406, "Pretrain/Step": 8292, "Pretrain/Step Time": 8.510323949158192} +{"Pretrain/Learning Rate": 2.1978826969887624e-06, "Pretrain/Loss": 2.0215609073638916, "Pretrain/Loss (Raw)": 2.044203519821167, "Pretrain/Step": 8293, "Pretrain/Step Time": 8.508716452866793} +{"Pretrain/Learning Rate": 2.1944031482162425e-06, "Pretrain/Loss": 2.0202975273132324, "Pretrain/Loss (Raw)": 2.0278213024139404, "Pretrain/Step": 8294, "Pretrain/Step Time": 8.505046362057328} +{"Pretrain/Learning Rate": 2.1909262294926126e-06, "Pretrain/Loss": 2.019303321838379, "Pretrain/Loss (Raw)": 1.823984146118164, "Pretrain/Step": 8295, "Pretrain/Step Time": 8.500211700797081} +{"Pretrain/Learning Rate": 2.1874519412188545e-06, "Pretrain/Loss": 2.018393039703369, "Pretrain/Loss (Raw)": 1.7933942079544067, "Pretrain/Step": 8296, "Pretrain/Step Time": 8.500822320580482} +{"Pretrain/Learning Rate": 2.1839802837956336e-06, "Pretrain/Loss": 2.018260955810547, "Pretrain/Loss (Raw)": 2.1139116287231445, "Pretrain/Step": 8297, "Pretrain/Step Time": 8.496212722733617} +{"Pretrain/Learning Rate": 2.180511257623319e-06, "Pretrain/Loss": 2.0182580947875977, "Pretrain/Loss (Raw)": 2.0110507011413574, "Pretrain/Step": 8298, "Pretrain/Step Time": 8.511735307052732} +{"Pretrain/Learning Rate": 2.1770448631019708e-06, "Pretrain/Loss": 2.018714666366577, "Pretrain/Loss (Raw)": 1.9756641387939453, "Pretrain/Step": 8299, "Pretrain/Step Time": 8.517395785078406} +{"Pretrain/Learning Rate": 2.1735811006313583e-06, "Pretrain/Loss": 2.0167222023010254, "Pretrain/Loss (Raw)": 1.7419556379318237, "Pretrain/Step": 8300, "Pretrain/Step Time": 8.515776982530951} +{"Pretrain/Learning Rate": 2.170119970610937e-06, "Pretrain/Loss": 2.015604019165039, "Pretrain/Loss (Raw)": 1.843174934387207, "Pretrain/Step": 8301, "Pretrain/Step Time": 8.515678010880947} +{"Pretrain/Learning Rate": 2.1666614734398573e-06, "Pretrain/Loss": 2.017726421356201, "Pretrain/Loss (Raw)": 2.0488808155059814, "Pretrain/Step": 8302, "Pretrain/Step Time": 8.507499903440475} +{"Pretrain/Learning Rate": 2.163205609516966e-06, "Pretrain/Loss": 2.0169947147369385, "Pretrain/Loss (Raw)": 1.9790019989013672, "Pretrain/Step": 8303, "Pretrain/Step Time": 8.516444310545921} +{"Pretrain/Learning Rate": 2.1597523792408176e-06, "Pretrain/Loss": 2.017285108566284, "Pretrain/Loss (Raw)": 2.04182767868042, "Pretrain/Step": 8304, "Pretrain/Step Time": 8.519061172381043} +{"Pretrain/Learning Rate": 2.156301783009654e-06, "Pretrain/Loss": 2.0153932571411133, "Pretrain/Loss (Raw)": 1.8868192434310913, "Pretrain/Step": 8305, "Pretrain/Step Time": 8.512145187705755} +{"Pretrain/Learning Rate": 2.1528538212214066e-06, "Pretrain/Loss": 2.014636993408203, "Pretrain/Loss (Raw)": 1.9576081037521362, "Pretrain/Step": 8306, "Pretrain/Step Time": 8.511302337050438} +{"Pretrain/Learning Rate": 2.1494084942737193e-06, "Pretrain/Loss": 2.0156381130218506, "Pretrain/Loss (Raw)": 2.1789355278015137, "Pretrain/Step": 8307, "Pretrain/Step Time": 8.50827956572175} +{"Pretrain/Learning Rate": 2.1459658025639208e-06, "Pretrain/Loss": 2.0168933868408203, "Pretrain/Loss (Raw)": 2.1062510013580322, "Pretrain/Step": 8308, "Pretrain/Step Time": 8.513295445591211} +{"Pretrain/Learning Rate": 2.142525746489038e-06, "Pretrain/Loss": 2.016657829284668, "Pretrain/Loss (Raw)": 1.9122267961502075, "Pretrain/Step": 8309, "Pretrain/Step Time": 8.523185843601823} +{"Pretrain/Learning Rate": 2.1390883264457903e-06, "Pretrain/Loss": 2.016787052154541, "Pretrain/Loss (Raw)": 1.9309810400009155, "Pretrain/Step": 8310, "Pretrain/Step Time": 8.520889328792691} +{"Pretrain/Learning Rate": 2.135653542830604e-06, "Pretrain/Loss": 2.017256498336792, "Pretrain/Loss (Raw)": 1.9803266525268555, "Pretrain/Step": 8311, "Pretrain/Step Time": 8.516542686149478} +{"Pretrain/Learning Rate": 2.132221396039591e-06, "Pretrain/Loss": 2.0176758766174316, "Pretrain/Loss (Raw)": 2.123121738433838, "Pretrain/Step": 8312, "Pretrain/Step Time": 8.511212198063731} +{"Pretrain/Learning Rate": 2.1287918864685645e-06, "Pretrain/Loss": 2.0194790363311768, "Pretrain/Loss (Raw)": 2.190880537033081, "Pretrain/Step": 8313, "Pretrain/Step Time": 8.504093548282981} +{"Pretrain/Learning Rate": 2.1253650145130254e-06, "Pretrain/Loss": 2.0210373401641846, "Pretrain/Loss (Raw)": 2.0999977588653564, "Pretrain/Step": 8314, "Pretrain/Step Time": 8.501465955749154} +{"Pretrain/Learning Rate": 2.121940780568188e-06, "Pretrain/Loss": 2.0186681747436523, "Pretrain/Loss (Raw)": 1.9485238790512085, "Pretrain/Step": 8315, "Pretrain/Step Time": 8.504509050399065} +{"Pretrain/Learning Rate": 2.1185191850289386e-06, "Pretrain/Loss": 2.0215158462524414, "Pretrain/Loss (Raw)": 2.446593999862671, "Pretrain/Step": 8316, "Pretrain/Step Time": 8.511385053396225} +{"Pretrain/Learning Rate": 2.115100228289882e-06, "Pretrain/Loss": 2.0241966247558594, "Pretrain/Loss (Raw)": 2.363738775253296, "Pretrain/Step": 8317, "Pretrain/Step Time": 8.514342153444886} +{"Pretrain/Learning Rate": 2.111683910745299e-06, "Pretrain/Loss": 2.024458408355713, "Pretrain/Loss (Raw)": 2.095468282699585, "Pretrain/Step": 8318, "Pretrain/Step Time": 8.507650528103113} +{"Pretrain/Learning Rate": 2.108270232789192e-06, "Pretrain/Loss": 2.0252208709716797, "Pretrain/Loss (Raw)": 2.0523345470428467, "Pretrain/Step": 8319, "Pretrain/Step Time": 8.508418487384915} +{"Pretrain/Learning Rate": 2.10485919481522e-06, "Pretrain/Loss": 2.0248541831970215, "Pretrain/Loss (Raw)": 2.123126745223999, "Pretrain/Step": 8320, "Pretrain/Step Time": 8.516961924731731} +{"Pretrain/Learning Rate": 2.101450797216775e-06, "Pretrain/Loss": 2.0222344398498535, "Pretrain/Loss (Raw)": 1.6793129444122314, "Pretrain/Step": 8321, "Pretrain/Step Time": 8.52648040652275} +{"Pretrain/Learning Rate": 2.098045040386923e-06, "Pretrain/Loss": 2.0194244384765625, "Pretrain/Loss (Raw)": 1.6357758045196533, "Pretrain/Step": 8322, "Pretrain/Step Time": 8.523757791146636} +{"Pretrain/Learning Rate": 2.0946419247184435e-06, "Pretrain/Loss": 2.0189900398254395, "Pretrain/Loss (Raw)": 1.9728212356567383, "Pretrain/Step": 8323, "Pretrain/Step Time": 8.519803585484624} +{"Pretrain/Learning Rate": 2.0912414506037814e-06, "Pretrain/Loss": 2.020308017730713, "Pretrain/Loss (Raw)": 2.2618939876556396, "Pretrain/Step": 8324, "Pretrain/Step Time": 8.515500554814935} +{"Pretrain/Learning Rate": 2.087843618435109e-06, "Pretrain/Loss": 2.017545700073242, "Pretrain/Loss (Raw)": 1.7667399644851685, "Pretrain/Step": 8325, "Pretrain/Step Time": 8.514649173244834} +{"Pretrain/Learning Rate": 2.0844484286042744e-06, "Pretrain/Loss": 2.0170910358428955, "Pretrain/Loss (Raw)": 2.0825235843658447, "Pretrain/Step": 8326, "Pretrain/Step Time": 8.515500877052546} +{"Pretrain/Learning Rate": 2.0810558815028303e-06, "Pretrain/Loss": 2.017775058746338, "Pretrain/Loss (Raw)": 2.0440685749053955, "Pretrain/Step": 8327, "Pretrain/Step Time": 8.519466368481517} +{"Pretrain/Learning Rate": 2.077665977522017e-06, "Pretrain/Loss": 2.0199689865112305, "Pretrain/Loss (Raw)": 2.1659746170043945, "Pretrain/Step": 8328, "Pretrain/Step Time": 8.524899024516344} +{"Pretrain/Learning Rate": 2.07427871705278e-06, "Pretrain/Loss": 2.0186967849731445, "Pretrain/Loss (Raw)": 1.9049122333526611, "Pretrain/Step": 8329, "Pretrain/Step Time": 8.518329914659262} +{"Pretrain/Learning Rate": 2.0708941004857485e-06, "Pretrain/Loss": 2.01861572265625, "Pretrain/Loss (Raw)": 2.0637576580047607, "Pretrain/Step": 8330, "Pretrain/Step Time": 8.512181714177132} +{"Pretrain/Learning Rate": 2.0675121282112577e-06, "Pretrain/Loss": 2.0178298950195312, "Pretrain/Loss (Raw)": 2.002986192703247, "Pretrain/Step": 8331, "Pretrain/Step Time": 8.509995687752962} +{"Pretrain/Learning Rate": 2.064132800619323e-06, "Pretrain/Loss": 2.01641845703125, "Pretrain/Loss (Raw)": 1.8884553909301758, "Pretrain/Step": 8332, "Pretrain/Step Time": 8.517077235504985} +{"Pretrain/Learning Rate": 2.0607561180996772e-06, "Pretrain/Loss": 2.0127224922180176, "Pretrain/Loss (Raw)": 1.7629501819610596, "Pretrain/Step": 8333, "Pretrain/Step Time": 8.521968455985188} +{"Pretrain/Learning Rate": 2.0573820810417283e-06, "Pretrain/Loss": 2.0137271881103516, "Pretrain/Loss (Raw)": 2.109532117843628, "Pretrain/Step": 8334, "Pretrain/Step Time": 8.524130679666996} +{"Pretrain/Learning Rate": 2.0540106898345874e-06, "Pretrain/Loss": 2.0121893882751465, "Pretrain/Loss (Raw)": 1.9376057386398315, "Pretrain/Step": 8335, "Pretrain/Step Time": 8.52229997701943} +{"Pretrain/Learning Rate": 2.0506419448670543e-06, "Pretrain/Loss": 2.011949062347412, "Pretrain/Loss (Raw)": 2.2723662853240967, "Pretrain/Step": 8336, "Pretrain/Step Time": 8.517558513209224} +{"Pretrain/Learning Rate": 2.047275846527638e-06, "Pretrain/Loss": 2.012387275695801, "Pretrain/Loss (Raw)": 2.0464584827423096, "Pretrain/Step": 8337, "Pretrain/Step Time": 8.517997864633799} +{"Pretrain/Learning Rate": 2.043912395204525e-06, "Pretrain/Loss": 2.0136334896087646, "Pretrain/Loss (Raw)": 1.9771705865859985, "Pretrain/Step": 8338, "Pretrain/Step Time": 8.520219402387738} +{"Pretrain/Learning Rate": 2.040551591285611e-06, "Pretrain/Loss": 2.011521339416504, "Pretrain/Loss (Raw)": 1.8636585474014282, "Pretrain/Step": 8339, "Pretrain/Step Time": 8.524734534323215} +{"Pretrain/Learning Rate": 2.0371934351584716e-06, "Pretrain/Loss": 2.0105624198913574, "Pretrain/Loss (Raw)": 2.018216133117676, "Pretrain/Step": 8340, "Pretrain/Step Time": 8.530542807653546} +{"Pretrain/Learning Rate": 2.0338379272103915e-06, "Pretrain/Loss": 2.011734962463379, "Pretrain/Loss (Raw)": 2.116727352142334, "Pretrain/Step": 8341, "Pretrain/Step Time": 8.527870621532202} +{"Pretrain/Learning Rate": 2.0304850678283415e-06, "Pretrain/Loss": 2.014296293258667, "Pretrain/Loss (Raw)": 2.016839027404785, "Pretrain/Step": 8342, "Pretrain/Step Time": 8.525681257247925} +{"Pretrain/Learning Rate": 2.027134857398991e-06, "Pretrain/Loss": 2.013688564300537, "Pretrain/Loss (Raw)": 2.031031847000122, "Pretrain/Step": 8343, "Pretrain/Step Time": 8.523081608116627} +{"Pretrain/Learning Rate": 2.023787296308696e-06, "Pretrain/Loss": 2.0114569664001465, "Pretrain/Loss (Raw)": 1.8478991985321045, "Pretrain/Step": 8344, "Pretrain/Step Time": 8.524451890960336} +{"Pretrain/Learning Rate": 2.0204423849435216e-06, "Pretrain/Loss": 2.0149524211883545, "Pretrain/Loss (Raw)": 2.3613646030426025, "Pretrain/Step": 8345, "Pretrain/Step Time": 8.525027772411704} +{"Pretrain/Learning Rate": 2.017100123689214e-06, "Pretrain/Loss": 2.013211250305176, "Pretrain/Loss (Raw)": 2.0683035850524902, "Pretrain/Step": 8346, "Pretrain/Step Time": 8.523977659642696} +{"Pretrain/Learning Rate": 2.013760512931215e-06, "Pretrain/Loss": 2.0129318237304688, "Pretrain/Loss (Raw)": 2.083329200744629, "Pretrain/Step": 8347, "Pretrain/Step Time": 8.52971257828176} +{"Pretrain/Learning Rate": 2.0104235530546743e-06, "Pretrain/Loss": 2.015439748764038, "Pretrain/Loss (Raw)": 2.297957181930542, "Pretrain/Step": 8348, "Pretrain/Step Time": 8.520712023600936} +{"Pretrain/Learning Rate": 2.0070892444444185e-06, "Pretrain/Loss": 2.015244960784912, "Pretrain/Loss (Raw)": 1.9982175827026367, "Pretrain/Step": 8349, "Pretrain/Step Time": 8.510129362344742} +{"Pretrain/Learning Rate": 2.0037575874849753e-06, "Pretrain/Loss": 2.016252279281616, "Pretrain/Loss (Raw)": 2.2318015098571777, "Pretrain/Step": 8350, "Pretrain/Step Time": 8.507185919210315} +{"Pretrain/Learning Rate": 2.0004285825605677e-06, "Pretrain/Loss": 2.016047239303589, "Pretrain/Loss (Raw)": 2.100837469100952, "Pretrain/Step": 8351, "Pretrain/Step Time": 8.508243711665273} +{"Pretrain/Learning Rate": 1.9971022300551174e-06, "Pretrain/Loss": 2.016587734222412, "Pretrain/Loss (Raw)": 2.0213613510131836, "Pretrain/Step": 8352, "Pretrain/Step Time": 8.508451756089926} +{"Pretrain/Learning Rate": 1.9937785303522303e-06, "Pretrain/Loss": 2.0175015926361084, "Pretrain/Loss (Raw)": 1.9595829248428345, "Pretrain/Step": 8353, "Pretrain/Step Time": 8.509313087910414} +{"Pretrain/Learning Rate": 1.990457483835212e-06, "Pretrain/Loss": 2.019169569015503, "Pretrain/Loss (Raw)": 1.9372620582580566, "Pretrain/Step": 8354, "Pretrain/Step Time": 8.504344826564193} +{"Pretrain/Learning Rate": 1.9871390908870554e-06, "Pretrain/Loss": 2.0182621479034424, "Pretrain/Loss (Raw)": 1.8794444799423218, "Pretrain/Step": 8355, "Pretrain/Step Time": 8.507194619625807} +{"Pretrain/Learning Rate": 1.9838233518904655e-06, "Pretrain/Loss": 2.0174942016601562, "Pretrain/Loss (Raw)": 1.9870448112487793, "Pretrain/Step": 8356, "Pretrain/Step Time": 8.512539234012365} +{"Pretrain/Learning Rate": 1.9805102672278226e-06, "Pretrain/Loss": 2.016164779663086, "Pretrain/Loss (Raw)": 1.9348384141921997, "Pretrain/Step": 8357, "Pretrain/Step Time": 8.515703918412328} +{"Pretrain/Learning Rate": 1.9771998372812044e-06, "Pretrain/Loss": 2.016315221786499, "Pretrain/Loss (Raw)": 1.9308485984802246, "Pretrain/Step": 8358, "Pretrain/Step Time": 8.520797405391932} +{"Pretrain/Learning Rate": 1.9738920624323862e-06, "Pretrain/Loss": 2.0144543647766113, "Pretrain/Loss (Raw)": 1.8820561170578003, "Pretrain/Step": 8359, "Pretrain/Step Time": 8.51874328404665} +{"Pretrain/Learning Rate": 1.9705869430628465e-06, "Pretrain/Loss": 2.013688564300537, "Pretrain/Loss (Raw)": 1.9332709312438965, "Pretrain/Step": 8360, "Pretrain/Step Time": 8.511536467820406} +{"Pretrain/Learning Rate": 1.96728447955373e-06, "Pretrain/Loss": 2.014943838119507, "Pretrain/Loss (Raw)": 2.1238162517547607, "Pretrain/Step": 8361, "Pretrain/Step Time": 8.51659388653934} +{"Pretrain/Learning Rate": 1.963984672285904e-06, "Pretrain/Loss": 2.0192806720733643, "Pretrain/Loss (Raw)": 2.30875301361084, "Pretrain/Step": 8362, "Pretrain/Step Time": 8.52465588413179} +{"Pretrain/Learning Rate": 1.960687521639912e-06, "Pretrain/Loss": 2.0202488899230957, "Pretrain/Loss (Raw)": 2.042351245880127, "Pretrain/Step": 8363, "Pretrain/Step Time": 8.51993803679943} +{"Pretrain/Learning Rate": 1.9573930279960073e-06, "Pretrain/Loss": 2.0149662494659424, "Pretrain/Loss (Raw)": 1.5413627624511719, "Pretrain/Step": 8364, "Pretrain/Step Time": 8.523135796189308} +{"Pretrain/Learning Rate": 1.954101191734112e-06, "Pretrain/Loss": 2.0144667625427246, "Pretrain/Loss (Raw)": 1.9822828769683838, "Pretrain/Step": 8365, "Pretrain/Step Time": 8.521848423406482} +{"Pretrain/Learning Rate": 1.9508120132338657e-06, "Pretrain/Loss": 2.0131235122680664, "Pretrain/Loss (Raw)": 1.9699060916900635, "Pretrain/Step": 8366, "Pretrain/Step Time": 8.506286334246397} +{"Pretrain/Learning Rate": 1.9475254928745883e-06, "Pretrain/Loss": 2.017515182495117, "Pretrain/Loss (Raw)": 2.3524410724639893, "Pretrain/Step": 8367, "Pretrain/Step Time": 8.515752153471112} +{"Pretrain/Learning Rate": 1.9442416310353012e-06, "Pretrain/Loss": 2.0164928436279297, "Pretrain/Loss (Raw)": 1.9456442594528198, "Pretrain/Step": 8368, "Pretrain/Step Time": 8.513941263779998} +{"Pretrain/Learning Rate": 1.940960428094704e-06, "Pretrain/Loss": 2.0159919261932373, "Pretrain/Loss (Raw)": 1.8502267599105835, "Pretrain/Step": 8369, "Pretrain/Step Time": 8.509939989075065} +{"Pretrain/Learning Rate": 1.937681884431214e-06, "Pretrain/Loss": 2.015301465988159, "Pretrain/Loss (Raw)": 2.0746891498565674, "Pretrain/Step": 8370, "Pretrain/Step Time": 8.5108454041183} +{"Pretrain/Learning Rate": 1.9344060004229225e-06, "Pretrain/Loss": 2.015108108520508, "Pretrain/Loss (Raw)": 2.0585885047912598, "Pretrain/Step": 8371, "Pretrain/Step Time": 8.505993250757456} +{"Pretrain/Learning Rate": 1.9311327764476196e-06, "Pretrain/Loss": 2.0174269676208496, "Pretrain/Loss (Raw)": 2.3715806007385254, "Pretrain/Step": 8372, "Pretrain/Step Time": 8.500738225877285} +{"Pretrain/Learning Rate": 1.927862212882783e-06, "Pretrain/Loss": 2.0202150344848633, "Pretrain/Loss (Raw)": 2.2673263549804688, "Pretrain/Step": 8373, "Pretrain/Step Time": 8.500946456566453} +{"Pretrain/Learning Rate": 1.9245943101056014e-06, "Pretrain/Loss": 2.0206339359283447, "Pretrain/Loss (Raw)": 1.9628745317459106, "Pretrain/Step": 8374, "Pretrain/Step Time": 8.505638040602207} +{"Pretrain/Learning Rate": 1.9213290684929386e-06, "Pretrain/Loss": 2.0207419395446777, "Pretrain/Loss (Raw)": 2.1114847660064697, "Pretrain/Step": 8375, "Pretrain/Step Time": 8.50591510348022} +{"Pretrain/Learning Rate": 1.9180664884213577e-06, "Pretrain/Loss": 2.0216805934906006, "Pretrain/Loss (Raw)": 1.9325711727142334, "Pretrain/Step": 8376, "Pretrain/Step Time": 8.507976166903973} +{"Pretrain/Learning Rate": 1.9148065702671108e-06, "Pretrain/Loss": 2.0232388973236084, "Pretrain/Loss (Raw)": 2.134589910507202, "Pretrain/Step": 8377, "Pretrain/Step Time": 8.507477948442101} +{"Pretrain/Learning Rate": 1.9115493144061555e-06, "Pretrain/Loss": 2.023360252380371, "Pretrain/Loss (Raw)": 2.055535078048706, "Pretrain/Step": 8378, "Pretrain/Step Time": 8.497134292498231} +{"Pretrain/Learning Rate": 1.9082947212141293e-06, "Pretrain/Loss": 2.021557569503784, "Pretrain/Loss (Raw)": 1.974570393562317, "Pretrain/Step": 8379, "Pretrain/Step Time": 8.494001476094127} +{"Pretrain/Learning Rate": 1.9050427910663693e-06, "Pretrain/Loss": 2.022122383117676, "Pretrain/Loss (Raw)": 2.0941474437713623, "Pretrain/Step": 8380, "Pretrain/Step Time": 8.504829660058022} +{"Pretrain/Learning Rate": 1.901793524337897e-06, "Pretrain/Loss": 2.0216822624206543, "Pretrain/Loss (Raw)": 1.8434008359909058, "Pretrain/Step": 8381, "Pretrain/Step Time": 8.509405685588717} +{"Pretrain/Learning Rate": 1.8985469214034407e-06, "Pretrain/Loss": 2.0206663608551025, "Pretrain/Loss (Raw)": 1.9798800945281982, "Pretrain/Step": 8382, "Pretrain/Step Time": 8.517533274367452} +{"Pretrain/Learning Rate": 1.8953029826374119e-06, "Pretrain/Loss": 2.0216100215911865, "Pretrain/Loss (Raw)": 2.1589245796203613, "Pretrain/Step": 8383, "Pretrain/Step Time": 8.515256376937032} +{"Pretrain/Learning Rate": 1.8920617084139142e-06, "Pretrain/Loss": 2.023447036743164, "Pretrain/Loss (Raw)": 2.0783002376556396, "Pretrain/Step": 8384, "Pretrain/Step Time": 8.50418914295733} +{"Pretrain/Learning Rate": 1.8888230991067457e-06, "Pretrain/Loss": 2.024169921875, "Pretrain/Loss (Raw)": 2.0162551403045654, "Pretrain/Step": 8385, "Pretrain/Step Time": 8.508408086374402} +{"Pretrain/Learning Rate": 1.885587155089405e-06, "Pretrain/Loss": 2.020214080810547, "Pretrain/Loss (Raw)": 1.9885693788528442, "Pretrain/Step": 8386, "Pretrain/Step Time": 8.510950684547424} +{"Pretrain/Learning Rate": 1.8823538767350712e-06, "Pretrain/Loss": 2.0222606658935547, "Pretrain/Loss (Raw)": 1.8303335905075073, "Pretrain/Step": 8387, "Pretrain/Step Time": 8.507424622774124} +{"Pretrain/Learning Rate": 1.8791232644166212e-06, "Pretrain/Loss": 2.0209498405456543, "Pretrain/Loss (Raw)": 2.0150110721588135, "Pretrain/Step": 8388, "Pretrain/Step Time": 8.507479716092348} +{"Pretrain/Learning Rate": 1.8758953185066264e-06, "Pretrain/Loss": 2.0227723121643066, "Pretrain/Loss (Raw)": 2.1630020141601562, "Pretrain/Step": 8389, "Pretrain/Step Time": 8.504152156412601} +{"Pretrain/Learning Rate": 1.87267003937735e-06, "Pretrain/Loss": 2.0200047492980957, "Pretrain/Loss (Raw)": 1.6526292562484741, "Pretrain/Step": 8390, "Pretrain/Step Time": 8.498120456933975} +{"Pretrain/Learning Rate": 1.8694474274007417e-06, "Pretrain/Loss": 2.02081298828125, "Pretrain/Loss (Raw)": 2.159515142440796, "Pretrain/Step": 8391, "Pretrain/Step Time": 8.49571400694549} +{"Pretrain/Learning Rate": 1.8662274829484488e-06, "Pretrain/Loss": 2.0186026096343994, "Pretrain/Loss (Raw)": 1.7441807985305786, "Pretrain/Step": 8392, "Pretrain/Step Time": 8.499546501785517} +{"Pretrain/Learning Rate": 1.8630102063918158e-06, "Pretrain/Loss": 2.017648220062256, "Pretrain/Loss (Raw)": 1.9592684507369995, "Pretrain/Step": 8393, "Pretrain/Step Time": 8.512024557217956} +{"Pretrain/Learning Rate": 1.859795598101871e-06, "Pretrain/Loss": 2.017436981201172, "Pretrain/Loss (Raw)": 1.7242014408111572, "Pretrain/Step": 8394, "Pretrain/Step Time": 8.520877512171865} +{"Pretrain/Learning Rate": 1.8565836584493374e-06, "Pretrain/Loss": 2.020017623901367, "Pretrain/Loss (Raw)": 1.9883735179901123, "Pretrain/Step": 8395, "Pretrain/Step Time": 8.517288321629167} +{"Pretrain/Learning Rate": 1.8533743878046295e-06, "Pretrain/Loss": 2.0239758491516113, "Pretrain/Loss (Raw)": 2.311861515045166, "Pretrain/Step": 8396, "Pretrain/Step Time": 8.513093685731292} +{"Pretrain/Learning Rate": 1.8501677865378597e-06, "Pretrain/Loss": 2.0263478755950928, "Pretrain/Loss (Raw)": 2.2757558822631836, "Pretrain/Step": 8397, "Pretrain/Step Time": 8.509851267561316} +{"Pretrain/Learning Rate": 1.8469638550188267e-06, "Pretrain/Loss": 2.025383472442627, "Pretrain/Loss (Raw)": 1.8214112520217896, "Pretrain/Step": 8398, "Pretrain/Step Time": 8.515671089291573} +{"Pretrain/Learning Rate": 1.8437625936170239e-06, "Pretrain/Loss": 2.0239028930664062, "Pretrain/Loss (Raw)": 1.7651556730270386, "Pretrain/Step": 8399, "Pretrain/Step Time": 8.517609372735023} +{"Pretrain/Learning Rate": 1.8405640027016307e-06, "Pretrain/Loss": 2.0239315032958984, "Pretrain/Loss (Raw)": 2.12953519821167, "Pretrain/Step": 8400, "Pretrain/Step Time": 8.520925806835294} +{"Pretrain/Learning Rate": 1.8373680826415358e-06, "Pretrain/Loss": 2.0253143310546875, "Pretrain/Loss (Raw)": 2.011949062347412, "Pretrain/Step": 8401, "Pretrain/Step Time": 8.518987128511071} +{"Pretrain/Learning Rate": 1.8341748338052882e-06, "Pretrain/Loss": 2.0248489379882812, "Pretrain/Loss (Raw)": 2.0797410011291504, "Pretrain/Step": 8402, "Pretrain/Step Time": 8.509395595639944} +{"Pretrain/Learning Rate": 1.8309842565611663e-06, "Pretrain/Loss": 2.0260009765625, "Pretrain/Loss (Raw)": 2.0902204513549805, "Pretrain/Step": 8403, "Pretrain/Step Time": 8.50548742711544} +{"Pretrain/Learning Rate": 1.8277963512771112e-06, "Pretrain/Loss": 2.0242629051208496, "Pretrain/Loss (Raw)": 1.9916659593582153, "Pretrain/Step": 8404, "Pretrain/Step Time": 8.510751785710454} +{"Pretrain/Learning Rate": 1.824611118320782e-06, "Pretrain/Loss": 2.022463798522949, "Pretrain/Loss (Raw)": 1.8498458862304688, "Pretrain/Step": 8405, "Pretrain/Step Time": 8.515039004385471} +{"Pretrain/Learning Rate": 1.8214285580594931e-06, "Pretrain/Loss": 2.021327018737793, "Pretrain/Loss (Raw)": 1.9990935325622559, "Pretrain/Step": 8406, "Pretrain/Step Time": 8.519194446504116} +{"Pretrain/Learning Rate": 1.8182486708602898e-06, "Pretrain/Loss": 2.020886182785034, "Pretrain/Loss (Raw)": 2.0877859592437744, "Pretrain/Step": 8407, "Pretrain/Step Time": 8.512171206995845} +{"Pretrain/Learning Rate": 1.8150714570898868e-06, "Pretrain/Loss": 2.021134614944458, "Pretrain/Loss (Raw)": 1.8493762016296387, "Pretrain/Step": 8408, "Pretrain/Step Time": 8.510870104655623} +{"Pretrain/Learning Rate": 1.8118969171146915e-06, "Pretrain/Loss": 2.0244436264038086, "Pretrain/Loss (Raw)": 2.1703264713287354, "Pretrain/Step": 8409, "Pretrain/Step Time": 8.503184031695127} +{"Pretrain/Learning Rate": 1.8087250513008082e-06, "Pretrain/Loss": 2.0237300395965576, "Pretrain/Loss (Raw)": 2.010014772415161, "Pretrain/Step": 8410, "Pretrain/Step Time": 8.512587090954185} +{"Pretrain/Learning Rate": 1.8055558600140354e-06, "Pretrain/Loss": 2.023575782775879, "Pretrain/Loss (Raw)": 2.0162956714630127, "Pretrain/Step": 8411, "Pretrain/Step Time": 8.521285334601998} +{"Pretrain/Learning Rate": 1.8023893436198592e-06, "Pretrain/Loss": 2.0223052501678467, "Pretrain/Loss (Raw)": 2.018247365951538, "Pretrain/Step": 8412, "Pretrain/Step Time": 8.521885832771659} +{"Pretrain/Learning Rate": 1.7992255024834509e-06, "Pretrain/Loss": 2.020862102508545, "Pretrain/Loss (Raw)": 2.0782036781311035, "Pretrain/Step": 8413, "Pretrain/Step Time": 8.51313673518598} +{"Pretrain/Learning Rate": 1.79606433696968e-06, "Pretrain/Loss": 2.0220789909362793, "Pretrain/Loss (Raw)": 2.02780818939209, "Pretrain/Step": 8414, "Pretrain/Step Time": 8.518541052937508} +{"Pretrain/Learning Rate": 1.792905847443116e-06, "Pretrain/Loss": 2.0233073234558105, "Pretrain/Loss (Raw)": 2.1216554641723633, "Pretrain/Step": 8415, "Pretrain/Step Time": 8.517484271898866} +{"Pretrain/Learning Rate": 1.7897500342680063e-06, "Pretrain/Loss": 2.0220704078674316, "Pretrain/Loss (Raw)": 2.0451464653015137, "Pretrain/Step": 8416, "Pretrain/Step Time": 8.525028321892023} +{"Pretrain/Learning Rate": 1.7865968978082903e-06, "Pretrain/Loss": 2.019702911376953, "Pretrain/Loss (Raw)": 1.7854046821594238, "Pretrain/Step": 8417, "Pretrain/Step Time": 8.526772385463119} +{"Pretrain/Learning Rate": 1.7834464384276022e-06, "Pretrain/Loss": 2.0169265270233154, "Pretrain/Loss (Raw)": 2.0951812267303467, "Pretrain/Step": 8418, "Pretrain/Step Time": 8.525929424911737} +{"Pretrain/Learning Rate": 1.7802986564892737e-06, "Pretrain/Loss": 2.0168237686157227, "Pretrain/Loss (Raw)": 2.058305025100708, "Pretrain/Step": 8419, "Pretrain/Step Time": 8.516938818618655} +{"Pretrain/Learning Rate": 1.7771535523563198e-06, "Pretrain/Loss": 2.0189316272735596, "Pretrain/Loss (Raw)": 2.3576791286468506, "Pretrain/Step": 8420, "Pretrain/Step Time": 8.522405041381717} +{"Pretrain/Learning Rate": 1.7740111263914478e-06, "Pretrain/Loss": 2.016474485397339, "Pretrain/Loss (Raw)": 1.7296900749206543, "Pretrain/Step": 8421, "Pretrain/Step Time": 8.526702303439379} +{"Pretrain/Learning Rate": 1.7708713789570536e-06, "Pretrain/Loss": 2.0169153213500977, "Pretrain/Loss (Raw)": 2.0842432975769043, "Pretrain/Step": 8422, "Pretrain/Step Time": 8.533108910545707} +{"Pretrain/Learning Rate": 1.767734310415234e-06, "Pretrain/Loss": 2.017652988433838, "Pretrain/Loss (Raw)": 1.9184163808822632, "Pretrain/Step": 8423, "Pretrain/Step Time": 8.530828645452857} +{"Pretrain/Learning Rate": 1.7645999211277686e-06, "Pretrain/Loss": 2.020092010498047, "Pretrain/Loss (Raw)": 2.105597734451294, "Pretrain/Step": 8424, "Pretrain/Step Time": 8.533579772338271} +{"Pretrain/Learning Rate": 1.7614682114561298e-06, "Pretrain/Loss": 2.0188136100769043, "Pretrain/Loss (Raw)": 1.9502755403518677, "Pretrain/Step": 8425, "Pretrain/Step Time": 8.534209072589874} +{"Pretrain/Learning Rate": 1.7583391817614757e-06, "Pretrain/Loss": 2.0187742710113525, "Pretrain/Loss (Raw)": 2.0059897899627686, "Pretrain/Step": 8426, "Pretrain/Step Time": 8.517631715163589} +{"Pretrain/Learning Rate": 1.7552128324046707e-06, "Pretrain/Loss": 2.020517349243164, "Pretrain/Loss (Raw)": 2.19879412651062, "Pretrain/Step": 8427, "Pretrain/Step Time": 8.514885231852531} +{"Pretrain/Learning Rate": 1.752089163746254e-06, "Pretrain/Loss": 2.0242018699645996, "Pretrain/Loss (Raw)": 2.213557243347168, "Pretrain/Step": 8428, "Pretrain/Step Time": 8.528850534930825} +{"Pretrain/Learning Rate": 1.7489681761464565e-06, "Pretrain/Loss": 2.0255465507507324, "Pretrain/Loss (Raw)": 2.0153043270111084, "Pretrain/Step": 8429, "Pretrain/Step Time": 8.52687843888998} +{"Pretrain/Learning Rate": 1.7458498699652186e-06, "Pretrain/Loss": 2.0261449813842773, "Pretrain/Loss (Raw)": 2.1254639625549316, "Pretrain/Step": 8430, "Pretrain/Step Time": 8.527449876070023} +{"Pretrain/Learning Rate": 1.7427342455621498e-06, "Pretrain/Loss": 2.025906562805176, "Pretrain/Loss (Raw)": 1.948504090309143, "Pretrain/Step": 8431, "Pretrain/Step Time": 8.51650271192193} +{"Pretrain/Learning Rate": 1.7396213032965597e-06, "Pretrain/Loss": 2.027273178100586, "Pretrain/Loss (Raw)": 2.216724395751953, "Pretrain/Step": 8432, "Pretrain/Step Time": 8.518609231337905} +{"Pretrain/Learning Rate": 1.7365110435274419e-06, "Pretrain/Loss": 2.02748966217041, "Pretrain/Loss (Raw)": 1.9145208597183228, "Pretrain/Step": 8433, "Pretrain/Step Time": 8.519398955628276} +{"Pretrain/Learning Rate": 1.733403466613498e-06, "Pretrain/Loss": 2.0286319255828857, "Pretrain/Loss (Raw)": 2.103842258453369, "Pretrain/Step": 8434, "Pretrain/Step Time": 8.525947012007236} +{"Pretrain/Learning Rate": 1.7302985729131e-06, "Pretrain/Loss": 2.026588201522827, "Pretrain/Loss (Raw)": 1.917337417602539, "Pretrain/Step": 8435, "Pretrain/Step Time": 8.528824783861637} +{"Pretrain/Learning Rate": 1.7271963627843223e-06, "Pretrain/Loss": 2.0273094177246094, "Pretrain/Loss (Raw)": 2.1985957622528076, "Pretrain/Step": 8436, "Pretrain/Step Time": 8.522172452881932} +{"Pretrain/Learning Rate": 1.7240968365849208e-06, "Pretrain/Loss": 2.0282602310180664, "Pretrain/Loss (Raw)": 2.033916473388672, "Pretrain/Step": 8437, "Pretrain/Step Time": 8.511421423405409} +{"Pretrain/Learning Rate": 1.7209999946723564e-06, "Pretrain/Loss": 2.028777599334717, "Pretrain/Loss (Raw)": 1.9971849918365479, "Pretrain/Step": 8438, "Pretrain/Step Time": 8.514163214713335} +{"Pretrain/Learning Rate": 1.717905837403766e-06, "Pretrain/Loss": 2.029592990875244, "Pretrain/Loss (Raw)": 2.084718942642212, "Pretrain/Step": 8439, "Pretrain/Step Time": 8.525173822417855} +{"Pretrain/Learning Rate": 1.7148143651359833e-06, "Pretrain/Loss": 2.02880859375, "Pretrain/Loss (Raw)": 2.022709846496582, "Pretrain/Step": 8440, "Pretrain/Step Time": 8.527125412598252} +{"Pretrain/Learning Rate": 1.711725578225526e-06, "Pretrain/Loss": 2.0281620025634766, "Pretrain/Loss (Raw)": 2.108095169067383, "Pretrain/Step": 8441, "Pretrain/Step Time": 8.529012132436037} +{"Pretrain/Learning Rate": 1.708639477028623e-06, "Pretrain/Loss": 2.0279147624969482, "Pretrain/Loss (Raw)": 2.0683646202087402, "Pretrain/Step": 8442, "Pretrain/Step Time": 8.528749419376254} +{"Pretrain/Learning Rate": 1.705556061901159e-06, "Pretrain/Loss": 2.0287578105926514, "Pretrain/Loss (Raw)": 2.056431531906128, "Pretrain/Step": 8443, "Pretrain/Step Time": 8.531082794070244} +{"Pretrain/Learning Rate": 1.7024753331987442e-06, "Pretrain/Loss": 2.0237631797790527, "Pretrain/Loss (Raw)": 1.8073053359985352, "Pretrain/Step": 8444, "Pretrain/Step Time": 8.525944596156478} +{"Pretrain/Learning Rate": 1.699397291276647e-06, "Pretrain/Loss": 2.020906925201416, "Pretrain/Loss (Raw)": 1.9981168508529663, "Pretrain/Step": 8445, "Pretrain/Step Time": 8.525762064382434} +{"Pretrain/Learning Rate": 1.6963219364898613e-06, "Pretrain/Loss": 2.020003080368042, "Pretrain/Loss (Raw)": 1.979764699935913, "Pretrain/Step": 8446, "Pretrain/Step Time": 8.520765656605363} +{"Pretrain/Learning Rate": 1.6932492691930312e-06, "Pretrain/Loss": 2.018388509750366, "Pretrain/Loss (Raw)": 1.8456908464431763, "Pretrain/Step": 8447, "Pretrain/Step Time": 8.526859194040298} +{"Pretrain/Learning Rate": 1.6901792897405233e-06, "Pretrain/Loss": 2.015065908432007, "Pretrain/Loss (Raw)": 1.6978321075439453, "Pretrain/Step": 8448, "Pretrain/Step Time": 8.51808456517756} +{"Pretrain/Learning Rate": 1.6871119984863765e-06, "Pretrain/Loss": 2.0175442695617676, "Pretrain/Loss (Raw)": 1.996513843536377, "Pretrain/Step": 8449, "Pretrain/Step Time": 8.507544316351414} +{"Pretrain/Learning Rate": 1.6840473957843355e-06, "Pretrain/Loss": 2.020416259765625, "Pretrain/Loss (Raw)": 2.003417730331421, "Pretrain/Step": 8450, "Pretrain/Step Time": 8.520149303600192} +{"Pretrain/Learning Rate": 1.6809854819878096e-06, "Pretrain/Loss": 2.017735242843628, "Pretrain/Loss (Raw)": 1.6296440362930298, "Pretrain/Step": 8451, "Pretrain/Step Time": 8.523257993161678} +{"Pretrain/Learning Rate": 1.6779262574499243e-06, "Pretrain/Loss": 2.015688896179199, "Pretrain/Loss (Raw)": 1.9999552965164185, "Pretrain/Step": 8452, "Pretrain/Step Time": 8.52228214778006} +{"Pretrain/Learning Rate": 1.674869722523481e-06, "Pretrain/Loss": 2.018089771270752, "Pretrain/Loss (Raw)": 2.0740721225738525, "Pretrain/Step": 8453, "Pretrain/Step Time": 8.520627973601222} +{"Pretrain/Learning Rate": 1.6718158775609727e-06, "Pretrain/Loss": 2.0181987285614014, "Pretrain/Loss (Raw)": 2.096466541290283, "Pretrain/Step": 8454, "Pretrain/Step Time": 8.516635656356812} +{"Pretrain/Learning Rate": 1.6687647229145787e-06, "Pretrain/Loss": 2.018258810043335, "Pretrain/Loss (Raw)": 2.051771402359009, "Pretrain/Step": 8455, "Pretrain/Step Time": 8.517058998346329} +{"Pretrain/Learning Rate": 1.6657162589361814e-06, "Pretrain/Loss": 2.0172319412231445, "Pretrain/Loss (Raw)": 2.034529447555542, "Pretrain/Step": 8456, "Pretrain/Step Time": 8.519224870949984} +{"Pretrain/Learning Rate": 1.6626704859773413e-06, "Pretrain/Loss": 2.0177321434020996, "Pretrain/Loss (Raw)": 1.9689500331878662, "Pretrain/Step": 8457, "Pretrain/Step Time": 8.523740701377392} +{"Pretrain/Learning Rate": 1.6596274043893078e-06, "Pretrain/Loss": 2.0160927772521973, "Pretrain/Loss (Raw)": 1.8538835048675537, "Pretrain/Step": 8458, "Pretrain/Step Time": 8.523054022341967} +{"Pretrain/Learning Rate": 1.6565870145230228e-06, "Pretrain/Loss": 2.0156702995300293, "Pretrain/Loss (Raw)": 1.9489132165908813, "Pretrain/Step": 8459, "Pretrain/Step Time": 8.52086996100843} +{"Pretrain/Learning Rate": 1.653549316729125e-06, "Pretrain/Loss": 2.016294002532959, "Pretrain/Loss (Raw)": 1.9682962894439697, "Pretrain/Step": 8460, "Pretrain/Step Time": 8.511585908010602} +{"Pretrain/Learning Rate": 1.6505143113579314e-06, "Pretrain/Loss": 2.0171666145324707, "Pretrain/Loss (Raw)": 1.8746410608291626, "Pretrain/Step": 8461, "Pretrain/Step Time": 8.499733325093985} +{"Pretrain/Learning Rate": 1.6474819987594536e-06, "Pretrain/Loss": 2.017655849456787, "Pretrain/Loss (Raw)": 2.172156572341919, "Pretrain/Step": 8462, "Pretrain/Step Time": 8.507042169570923} +{"Pretrain/Learning Rate": 1.64445237928339e-06, "Pretrain/Loss": 2.0180959701538086, "Pretrain/Loss (Raw)": 1.9939631223678589, "Pretrain/Step": 8463, "Pretrain/Step Time": 8.507007509469986} +{"Pretrain/Learning Rate": 1.6414254532791357e-06, "Pretrain/Loss": 2.0168581008911133, "Pretrain/Loss (Raw)": 2.1139075756073, "Pretrain/Step": 8464, "Pretrain/Step Time": 8.501972740516067} +{"Pretrain/Learning Rate": 1.6384012210957672e-06, "Pretrain/Loss": 2.016681432723999, "Pretrain/Loss (Raw)": 2.0238285064697266, "Pretrain/Step": 8465, "Pretrain/Step Time": 8.504083290696144} +{"Pretrain/Learning Rate": 1.6353796830820529e-06, "Pretrain/Loss": 2.017868757247925, "Pretrain/Loss (Raw)": 2.1291751861572266, "Pretrain/Step": 8466, "Pretrain/Step Time": 8.501833636313677} +{"Pretrain/Learning Rate": 1.6323608395864498e-06, "Pretrain/Loss": 2.018923759460449, "Pretrain/Loss (Raw)": 1.9986697435379028, "Pretrain/Step": 8467, "Pretrain/Step Time": 8.495760193094611} +{"Pretrain/Learning Rate": 1.6293446909571075e-06, "Pretrain/Loss": 2.021044969558716, "Pretrain/Loss (Raw)": 2.289741039276123, "Pretrain/Step": 8468, "Pretrain/Step Time": 8.491762146353722} +{"Pretrain/Learning Rate": 1.6263312375418643e-06, "Pretrain/Loss": 2.0216431617736816, "Pretrain/Loss (Raw)": 2.1932930946350098, "Pretrain/Step": 8469, "Pretrain/Step Time": 8.499432273209095} +{"Pretrain/Learning Rate": 1.6233204796882368e-06, "Pretrain/Loss": 2.021003246307373, "Pretrain/Loss (Raw)": 1.9349195957183838, "Pretrain/Step": 8470, "Pretrain/Step Time": 8.499278699979186} +{"Pretrain/Learning Rate": 1.6203124177434497e-06, "Pretrain/Loss": 2.0196473598480225, "Pretrain/Loss (Raw)": 1.8574938774108887, "Pretrain/Step": 8471, "Pretrain/Step Time": 8.508608249947429} +{"Pretrain/Learning Rate": 1.6173070520544065e-06, "Pretrain/Loss": 2.0215373039245605, "Pretrain/Loss (Raw)": 2.089801073074341, "Pretrain/Step": 8472, "Pretrain/Step Time": 8.503517905250192} +{"Pretrain/Learning Rate": 1.6143043829676934e-06, "Pretrain/Loss": 2.0163321495056152, "Pretrain/Loss (Raw)": 1.6951329708099365, "Pretrain/Step": 8473, "Pretrain/Step Time": 8.49864037334919} +{"Pretrain/Learning Rate": 1.611304410829595e-06, "Pretrain/Loss": 2.0153908729553223, "Pretrain/Loss (Raw)": 1.9477958679199219, "Pretrain/Step": 8474, "Pretrain/Step Time": 8.501742705702782} +{"Pretrain/Learning Rate": 1.6083071359860868e-06, "Pretrain/Loss": 2.015566110610962, "Pretrain/Loss (Raw)": 2.1057686805725098, "Pretrain/Step": 8475, "Pretrain/Step Time": 8.504218423739076} +{"Pretrain/Learning Rate": 1.6053125587828233e-06, "Pretrain/Loss": 2.0132241249084473, "Pretrain/Loss (Raw)": 1.9981552362442017, "Pretrain/Step": 8476, "Pretrain/Step Time": 8.504936264827847} +{"Pretrain/Learning Rate": 1.6023206795651557e-06, "Pretrain/Loss": 2.0131983757019043, "Pretrain/Loss (Raw)": 1.9949535131454468, "Pretrain/Step": 8477, "Pretrain/Step Time": 8.506426198408008} +{"Pretrain/Learning Rate": 1.5993314986781166e-06, "Pretrain/Loss": 2.011967182159424, "Pretrain/Loss (Raw)": 2.0742127895355225, "Pretrain/Step": 8478, "Pretrain/Step Time": 8.504560248926282} +{"Pretrain/Learning Rate": 1.5963450164664385e-06, "Pretrain/Loss": 2.0107030868530273, "Pretrain/Loss (Raw)": 1.9390325546264648, "Pretrain/Step": 8479, "Pretrain/Step Time": 8.499191407114267} +{"Pretrain/Learning Rate": 1.5933612332745373e-06, "Pretrain/Loss": 2.010544776916504, "Pretrain/Loss (Raw)": 2.001081943511963, "Pretrain/Step": 8480, "Pretrain/Step Time": 8.501190207898617} +{"Pretrain/Learning Rate": 1.5903801494465131e-06, "Pretrain/Loss": 2.0126729011535645, "Pretrain/Loss (Raw)": 2.231983184814453, "Pretrain/Step": 8481, "Pretrain/Step Time": 8.504970965906978} +{"Pretrain/Learning Rate": 1.5874017653261574e-06, "Pretrain/Loss": 2.0133657455444336, "Pretrain/Loss (Raw)": 2.0259592533111572, "Pretrain/Step": 8482, "Pretrain/Step Time": 8.507846498861909} +{"Pretrain/Learning Rate": 1.5844260812569621e-06, "Pretrain/Loss": 2.0132620334625244, "Pretrain/Loss (Raw)": 1.866154432296753, "Pretrain/Step": 8483, "Pretrain/Step Time": 8.515114840120077} +{"Pretrain/Learning Rate": 1.5814530975820806e-06, "Pretrain/Loss": 2.0135796070098877, "Pretrain/Loss (Raw)": 2.0276896953582764, "Pretrain/Step": 8484, "Pretrain/Step Time": 8.510052431374788} +{"Pretrain/Learning Rate": 1.578482814644383e-06, "Pretrain/Loss": 2.0128426551818848, "Pretrain/Loss (Raw)": 1.8405120372772217, "Pretrain/Step": 8485, "Pretrain/Step Time": 8.505898592993617} +{"Pretrain/Learning Rate": 1.5755152327864093e-06, "Pretrain/Loss": 2.014444589614868, "Pretrain/Loss (Raw)": 2.1359100341796875, "Pretrain/Step": 8486, "Pretrain/Step Time": 8.502539563924074} +{"Pretrain/Learning Rate": 1.572550352350405e-06, "Pretrain/Loss": 2.014575958251953, "Pretrain/Loss (Raw)": 1.8988516330718994, "Pretrain/Step": 8487, "Pretrain/Step Time": 8.513901827856898} +{"Pretrain/Learning Rate": 1.5695881736782825e-06, "Pretrain/Loss": 2.014625310897827, "Pretrain/Loss (Raw)": 1.9395928382873535, "Pretrain/Step": 8488, "Pretrain/Step Time": 8.51147785410285} +{"Pretrain/Learning Rate": 1.5666286971116605e-06, "Pretrain/Loss": 2.0138566493988037, "Pretrain/Loss (Raw)": 2.0254323482513428, "Pretrain/Step": 8489, "Pretrain/Step Time": 8.509060023352504} +{"Pretrain/Learning Rate": 1.5636719229918385e-06, "Pretrain/Loss": 2.0113158226013184, "Pretrain/Loss (Raw)": 1.9835270643234253, "Pretrain/Step": 8490, "Pretrain/Step Time": 8.501989774405956} +{"Pretrain/Learning Rate": 1.5607178516598126e-06, "Pretrain/Loss": 2.011735439300537, "Pretrain/Loss (Raw)": 2.096069574356079, "Pretrain/Step": 8491, "Pretrain/Step Time": 8.504743246361613} +{"Pretrain/Learning Rate": 1.557766483456244e-06, "Pretrain/Loss": 2.016615152359009, "Pretrain/Loss (Raw)": 2.1659481525421143, "Pretrain/Step": 8492, "Pretrain/Step Time": 8.507159793749452} +{"Pretrain/Learning Rate": 1.5548178187215128e-06, "Pretrain/Loss": 2.017373561859131, "Pretrain/Loss (Raw)": 2.0793497562408447, "Pretrain/Step": 8493, "Pretrain/Step Time": 8.508478129282594} +{"Pretrain/Learning Rate": 1.5518718577956697e-06, "Pretrain/Loss": 2.0170040130615234, "Pretrain/Loss (Raw)": 1.9226163625717163, "Pretrain/Step": 8494, "Pretrain/Step Time": 8.523164769634604} +{"Pretrain/Learning Rate": 1.5489286010184539e-06, "Pretrain/Loss": 2.014737129211426, "Pretrain/Loss (Raw)": 2.0622987747192383, "Pretrain/Step": 8495, "Pretrain/Step Time": 8.515705686062574} +{"Pretrain/Learning Rate": 1.545988048729291e-06, "Pretrain/Loss": 2.0164132118225098, "Pretrain/Loss (Raw)": 2.160165309906006, "Pretrain/Step": 8496, "Pretrain/Step Time": 8.516154028475285} +{"Pretrain/Learning Rate": 1.5430502012673126e-06, "Pretrain/Loss": 2.018009901046753, "Pretrain/Loss (Raw)": 2.0546157360076904, "Pretrain/Step": 8497, "Pretrain/Step Time": 8.514488060027361} +{"Pretrain/Learning Rate": 1.5401150589713171e-06, "Pretrain/Loss": 2.0161330699920654, "Pretrain/Loss (Raw)": 1.8344453573226929, "Pretrain/Step": 8498, "Pretrain/Step Time": 8.520781066268682} +{"Pretrain/Learning Rate": 1.5371826221797975e-06, "Pretrain/Loss": 2.0167131423950195, "Pretrain/Loss (Raw)": 2.132819414138794, "Pretrain/Step": 8499, "Pretrain/Step Time": 8.517513671889901} +{"Pretrain/Learning Rate": 1.534252891230936e-06, "Pretrain/Loss": 2.0124173164367676, "Pretrain/Loss (Raw)": 1.821739673614502, "Pretrain/Step": 8500, "Pretrain/Step Time": 8.532003540545702} +{"Pretrain/Learning Rate": 1.5313258664626073e-06, "Pretrain/Loss": 2.0103111267089844, "Pretrain/Loss (Raw)": 1.9977433681488037, "Pretrain/Step": 8501, "Pretrain/Step Time": 8.529297782108188} +{"Pretrain/Learning Rate": 1.5284015482123714e-06, "Pretrain/Loss": 2.009434223175049, "Pretrain/Loss (Raw)": 1.8506439924240112, "Pretrain/Step": 8502, "Pretrain/Step Time": 8.526816979050636} +{"Pretrain/Learning Rate": 1.5254799368174672e-06, "Pretrain/Loss": 2.009575366973877, "Pretrain/Loss (Raw)": 2.1295154094696045, "Pretrain/Step": 8503, "Pretrain/Step Time": 8.530460439622402} +{"Pretrain/Learning Rate": 1.5225610326148304e-06, "Pretrain/Loss": 2.0086522102355957, "Pretrain/Loss (Raw)": 1.8143939971923828, "Pretrain/Step": 8504, "Pretrain/Step Time": 8.524780262261629} +{"Pretrain/Learning Rate": 1.5196448359410891e-06, "Pretrain/Loss": 2.0057101249694824, "Pretrain/Loss (Raw)": 1.7580348253250122, "Pretrain/Step": 8505, "Pretrain/Step Time": 8.529159950092435} +{"Pretrain/Learning Rate": 1.5167313471325468e-06, "Pretrain/Loss": 2.00630259513855, "Pretrain/Loss (Raw)": 2.131351947784424, "Pretrain/Step": 8506, "Pretrain/Step Time": 8.536317978054285} +{"Pretrain/Learning Rate": 1.513820566525201e-06, "Pretrain/Loss": 2.0065314769744873, "Pretrain/Loss (Raw)": 2.0038859844207764, "Pretrain/Step": 8507, "Pretrain/Step Time": 8.538318533450365} +{"Pretrain/Learning Rate": 1.510912494454736e-06, "Pretrain/Loss": 2.005981922149658, "Pretrain/Loss (Raw)": 2.0238025188446045, "Pretrain/Step": 8508, "Pretrain/Step Time": 8.533314317464828} +{"Pretrain/Learning Rate": 1.5080071312565308e-06, "Pretrain/Loss": 2.005491018295288, "Pretrain/Loss (Raw)": 1.7805631160736084, "Pretrain/Step": 8509, "Pretrain/Step Time": 8.527896573767066} +{"Pretrain/Learning Rate": 1.5051044772656397e-06, "Pretrain/Loss": 2.0068764686584473, "Pretrain/Loss (Raw)": 2.1572444438934326, "Pretrain/Step": 8510, "Pretrain/Step Time": 8.520318178460002} +{"Pretrain/Learning Rate": 1.5022045328168088e-06, "Pretrain/Loss": 2.00508975982666, "Pretrain/Loss (Raw)": 1.9301856756210327, "Pretrain/Step": 8511, "Pretrain/Step Time": 8.53014001250267} +{"Pretrain/Learning Rate": 1.4993072982444816e-06, "Pretrain/Loss": 2.0022640228271484, "Pretrain/Loss (Raw)": 1.7166227102279663, "Pretrain/Step": 8512, "Pretrain/Step Time": 8.532895902171731} +{"Pretrain/Learning Rate": 1.4964127738827744e-06, "Pretrain/Loss": 2.002713441848755, "Pretrain/Loss (Raw)": 2.073786973953247, "Pretrain/Step": 8513, "Pretrain/Step Time": 8.527998013421893} +{"Pretrain/Learning Rate": 1.4935209600654977e-06, "Pretrain/Loss": 2.0028865337371826, "Pretrain/Loss (Raw)": 2.010699987411499, "Pretrain/Step": 8514, "Pretrain/Step Time": 8.5265535954386} +{"Pretrain/Learning Rate": 1.4906318571261484e-06, "Pretrain/Loss": 2.004883289337158, "Pretrain/Loss (Raw)": 2.0859148502349854, "Pretrain/Step": 8515, "Pretrain/Step Time": 8.525749048218131} +{"Pretrain/Learning Rate": 1.4877454653979162e-06, "Pretrain/Loss": 2.002469062805176, "Pretrain/Loss (Raw)": 1.7059804201126099, "Pretrain/Step": 8516, "Pretrain/Step Time": 8.524444408714771} +{"Pretrain/Learning Rate": 1.4848617852136676e-06, "Pretrain/Loss": 2.002190113067627, "Pretrain/Loss (Raw)": 2.1273019313812256, "Pretrain/Step": 8517, "Pretrain/Step Time": 8.533135298639536} +{"Pretrain/Learning Rate": 1.4819808169059674e-06, "Pretrain/Loss": 2.0043582916259766, "Pretrain/Loss (Raw)": 1.930186152458191, "Pretrain/Step": 8518, "Pretrain/Step Time": 8.534392211586237} +{"Pretrain/Learning Rate": 1.4791025608070552e-06, "Pretrain/Loss": 2.002317428588867, "Pretrain/Loss (Raw)": 1.898267149925232, "Pretrain/Step": 8519, "Pretrain/Step Time": 8.53536549769342} +{"Pretrain/Learning Rate": 1.476227017248874e-06, "Pretrain/Loss": 2.004635810852051, "Pretrain/Loss (Raw)": 2.0409469604492188, "Pretrain/Step": 8520, "Pretrain/Step Time": 8.537576891481876} +{"Pretrain/Learning Rate": 1.4733541865630418e-06, "Pretrain/Loss": 2.003166675567627, "Pretrain/Loss (Raw)": 1.7712253332138062, "Pretrain/Step": 8521, "Pretrain/Step Time": 8.527725234627724} +{"Pretrain/Learning Rate": 1.4704840690808659e-06, "Pretrain/Loss": 2.0037546157836914, "Pretrain/Loss (Raw)": 1.7994294166564941, "Pretrain/Step": 8522, "Pretrain/Step Time": 8.519792977720499} +{"Pretrain/Learning Rate": 1.4676166651333367e-06, "Pretrain/Loss": 2.003818988800049, "Pretrain/Loss (Raw)": 1.996611475944519, "Pretrain/Step": 8523, "Pretrain/Step Time": 8.530145330354571} +{"Pretrain/Learning Rate": 1.4647519750511512e-06, "Pretrain/Loss": 2.002227544784546, "Pretrain/Loss (Raw)": 2.1081795692443848, "Pretrain/Step": 8524, "Pretrain/Step Time": 8.534497622400522} +{"Pretrain/Learning Rate": 1.461889999164659e-06, "Pretrain/Loss": 2.000980854034424, "Pretrain/Loss (Raw)": 2.116182565689087, "Pretrain/Step": 8525, "Pretrain/Step Time": 8.531166352331638} +{"Pretrain/Learning Rate": 1.4590307378039348e-06, "Pretrain/Loss": 2.0031306743621826, "Pretrain/Loss (Raw)": 2.096590995788574, "Pretrain/Step": 8526, "Pretrain/Step Time": 8.525218723341823} +{"Pretrain/Learning Rate": 1.4561741912987093e-06, "Pretrain/Loss": 2.004631280899048, "Pretrain/Loss (Raw)": 1.9572244882583618, "Pretrain/Step": 8527, "Pretrain/Step Time": 8.524821953848004} +{"Pretrain/Learning Rate": 1.4533203599784245e-06, "Pretrain/Loss": 2.003265619277954, "Pretrain/Loss (Raw)": 1.9547367095947266, "Pretrain/Step": 8528, "Pretrain/Step Time": 8.522365437820554} +{"Pretrain/Learning Rate": 1.4504692441721867e-06, "Pretrain/Loss": 2.0035696029663086, "Pretrain/Loss (Raw)": 2.0508646965026855, "Pretrain/Step": 8529, "Pretrain/Step Time": 8.528750630095601} +{"Pretrain/Learning Rate": 1.4476208442088052e-06, "Pretrain/Loss": 2.0030856132507324, "Pretrain/Loss (Raw)": 2.01777982711792, "Pretrain/Step": 8530, "Pretrain/Step Time": 8.531263086944818} +{"Pretrain/Learning Rate": 1.4447751604167697e-06, "Pretrain/Loss": 1.9989378452301025, "Pretrain/Loss (Raw)": 1.5592864751815796, "Pretrain/Step": 8531, "Pretrain/Step Time": 8.527946319431067} +{"Pretrain/Learning Rate": 1.4419321931242624e-06, "Pretrain/Loss": 1.9969398975372314, "Pretrain/Loss (Raw)": 1.7359309196472168, "Pretrain/Step": 8532, "Pretrain/Step Time": 8.524592824280262} +{"Pretrain/Learning Rate": 1.4390919426591404e-06, "Pretrain/Loss": 1.998207688331604, "Pretrain/Loss (Raw)": 2.012141704559326, "Pretrain/Step": 8533, "Pretrain/Step Time": 8.518797487020493} +{"Pretrain/Learning Rate": 1.4362544093489583e-06, "Pretrain/Loss": 1.9961423873901367, "Pretrain/Loss (Raw)": 1.7347255945205688, "Pretrain/Step": 8534, "Pretrain/Step Time": 8.520464014261961} +{"Pretrain/Learning Rate": 1.4334195935209572e-06, "Pretrain/Loss": 1.9933416843414307, "Pretrain/Loss (Raw)": 1.729302167892456, "Pretrain/Step": 8535, "Pretrain/Step Time": 8.522217076271772} +{"Pretrain/Learning Rate": 1.4305874955020559e-06, "Pretrain/Loss": 1.9950532913208008, "Pretrain/Loss (Raw)": 2.0684518814086914, "Pretrain/Step": 8536, "Pretrain/Step Time": 8.52437088638544} +{"Pretrain/Learning Rate": 1.427758115618863e-06, "Pretrain/Loss": 1.9923359155654907, "Pretrain/Loss (Raw)": 1.8225183486938477, "Pretrain/Step": 8537, "Pretrain/Step Time": 8.521841827780008} +{"Pretrain/Learning Rate": 1.4249314541976866e-06, "Pretrain/Loss": 1.992613673210144, "Pretrain/Loss (Raw)": 2.0455594062805176, "Pretrain/Step": 8538, "Pretrain/Step Time": 8.514927607029676} +{"Pretrain/Learning Rate": 1.422107511564502e-06, "Pretrain/Loss": 1.9925686120986938, "Pretrain/Loss (Raw)": 2.010528564453125, "Pretrain/Step": 8539, "Pretrain/Step Time": 8.510883584618568} +{"Pretrain/Learning Rate": 1.4192862880449825e-06, "Pretrain/Loss": 1.9904218912124634, "Pretrain/Loss (Raw)": 1.7434628009796143, "Pretrain/Step": 8540, "Pretrain/Step Time": 8.520318320021033} +{"Pretrain/Learning Rate": 1.4164677839644813e-06, "Pretrain/Loss": 1.9903149604797363, "Pretrain/Loss (Raw)": 2.06453537940979, "Pretrain/Step": 8541, "Pretrain/Step Time": 8.517609734088182} +{"Pretrain/Learning Rate": 1.4136519996480469e-06, "Pretrain/Loss": 1.9885607957839966, "Pretrain/Loss (Raw)": 1.803259253501892, "Pretrain/Step": 8542, "Pretrain/Step Time": 8.518024140968919} +{"Pretrain/Learning Rate": 1.4108389354204055e-06, "Pretrain/Loss": 1.9875147342681885, "Pretrain/Loss (Raw)": 1.9877688884735107, "Pretrain/Step": 8543, "Pretrain/Step Time": 8.517803315073252} +{"Pretrain/Learning Rate": 1.4080285916059754e-06, "Pretrain/Loss": 1.9871997833251953, "Pretrain/Loss (Raw)": 2.0048255920410156, "Pretrain/Step": 8544, "Pretrain/Step Time": 8.514154955744743} +{"Pretrain/Learning Rate": 1.405220968528853e-06, "Pretrain/Loss": 1.9885179996490479, "Pretrain/Loss (Raw)": 1.9541471004486084, "Pretrain/Step": 8545, "Pretrain/Step Time": 8.520420840010047} +{"Pretrain/Learning Rate": 1.402416066512835e-06, "Pretrain/Loss": 1.9857947826385498, "Pretrain/Loss (Raw)": 1.7466133832931519, "Pretrain/Step": 8546, "Pretrain/Step Time": 8.525296235457063} +{"Pretrain/Learning Rate": 1.3996138858813928e-06, "Pretrain/Loss": 1.9844915866851807, "Pretrain/Loss (Raw)": 1.891481876373291, "Pretrain/Step": 8547, "Pretrain/Step Time": 8.527040960267186} +{"Pretrain/Learning Rate": 1.396814426957685e-06, "Pretrain/Loss": 1.9817276000976562, "Pretrain/Loss (Raw)": 2.0038747787475586, "Pretrain/Step": 8548, "Pretrain/Step Time": 8.523641956970096} +{"Pretrain/Learning Rate": 1.394017690064553e-06, "Pretrain/Loss": 1.9836530685424805, "Pretrain/Loss (Raw)": 1.9761748313903809, "Pretrain/Step": 8549, "Pretrain/Step Time": 8.513563640415668} +{"Pretrain/Learning Rate": 1.3912236755245416e-06, "Pretrain/Loss": 1.982694387435913, "Pretrain/Loss (Raw)": 1.961533784866333, "Pretrain/Step": 8550, "Pretrain/Step Time": 8.508972607553005} +{"Pretrain/Learning Rate": 1.3884323836598655e-06, "Pretrain/Loss": 1.9837170839309692, "Pretrain/Loss (Raw)": 2.049314498901367, "Pretrain/Step": 8551, "Pretrain/Step Time": 8.516381880268455} +{"Pretrain/Learning Rate": 1.3856438147924229e-06, "Pretrain/Loss": 1.9810261726379395, "Pretrain/Loss (Raw)": 1.7611526250839233, "Pretrain/Step": 8552, "Pretrain/Step Time": 8.514568654820323} +{"Pretrain/Learning Rate": 1.3828579692438142e-06, "Pretrain/Loss": 1.982914686203003, "Pretrain/Loss (Raw)": 2.1920080184936523, "Pretrain/Step": 8553, "Pretrain/Step Time": 8.518044576048851} +{"Pretrain/Learning Rate": 1.3800748473353137e-06, "Pretrain/Loss": 1.9834007024765015, "Pretrain/Loss (Raw)": 2.0682008266448975, "Pretrain/Step": 8554, "Pretrain/Step Time": 8.518571922555566} +{"Pretrain/Learning Rate": 1.377294449387881e-06, "Pretrain/Loss": 1.9822100400924683, "Pretrain/Loss (Raw)": 2.0463876724243164, "Pretrain/Step": 8555, "Pretrain/Step Time": 8.513925759121776} +{"Pretrain/Learning Rate": 1.3745167757221622e-06, "Pretrain/Loss": 1.9832730293273926, "Pretrain/Loss (Raw)": 2.3496170043945312, "Pretrain/Step": 8556, "Pretrain/Step Time": 8.499117465689778} +{"Pretrain/Learning Rate": 1.3717418266585014e-06, "Pretrain/Loss": 1.9837391376495361, "Pretrain/Loss (Raw)": 2.074965715408325, "Pretrain/Step": 8557, "Pretrain/Step Time": 8.501964149996638} +{"Pretrain/Learning Rate": 1.3689696025169118e-06, "Pretrain/Loss": 1.9829981327056885, "Pretrain/Loss (Raw)": 2.0306179523468018, "Pretrain/Step": 8558, "Pretrain/Step Time": 8.510036040097475} +{"Pretrain/Learning Rate": 1.366200103617099e-06, "Pretrain/Loss": 1.985384464263916, "Pretrain/Loss (Raw)": 2.253955602645874, "Pretrain/Step": 8559, "Pretrain/Step Time": 8.512117464095354} +{"Pretrain/Learning Rate": 1.3634333302784546e-06, "Pretrain/Loss": 1.9832075834274292, "Pretrain/Loss (Raw)": 1.9380779266357422, "Pretrain/Step": 8560, "Pretrain/Step Time": 8.509312145411968} +{"Pretrain/Learning Rate": 1.3606692828200623e-06, "Pretrain/Loss": 1.9811797142028809, "Pretrain/Loss (Raw)": 1.6549731492996216, "Pretrain/Step": 8561, "Pretrain/Step Time": 8.506948944181204} +{"Pretrain/Learning Rate": 1.3579079615606781e-06, "Pretrain/Loss": 1.9807363748550415, "Pretrain/Loss (Raw)": 2.0470895767211914, "Pretrain/Step": 8562, "Pretrain/Step Time": 8.497377833351493} +{"Pretrain/Learning Rate": 1.355149366818756e-06, "Pretrain/Loss": 1.9813563823699951, "Pretrain/Loss (Raw)": 1.9966862201690674, "Pretrain/Step": 8563, "Pretrain/Step Time": 8.500127226114273} +{"Pretrain/Learning Rate": 1.3523934989124214e-06, "Pretrain/Loss": 1.9795658588409424, "Pretrain/Loss (Raw)": 1.969416618347168, "Pretrain/Step": 8564, "Pretrain/Step Time": 8.505691152065992} +{"Pretrain/Learning Rate": 1.3496403581595042e-06, "Pretrain/Loss": 1.9800268411636353, "Pretrain/Loss (Raw)": 2.092914342880249, "Pretrain/Step": 8565, "Pretrain/Step Time": 8.508410695940256} +{"Pretrain/Learning Rate": 1.3468899448775023e-06, "Pretrain/Loss": 1.9767327308654785, "Pretrain/Loss (Raw)": 1.5755470991134644, "Pretrain/Step": 8566, "Pretrain/Step Time": 8.506842508912086} +{"Pretrain/Learning Rate": 1.3441422593836128e-06, "Pretrain/Loss": 1.9766087532043457, "Pretrain/Loss (Raw)": 2.068856954574585, "Pretrain/Step": 8567, "Pretrain/Step Time": 8.495885781943798} +{"Pretrain/Learning Rate": 1.3413973019947013e-06, "Pretrain/Loss": 1.9761587381362915, "Pretrain/Loss (Raw)": 1.9650928974151611, "Pretrain/Step": 8568, "Pretrain/Step Time": 8.495281441137195} +{"Pretrain/Learning Rate": 1.3386550730273452e-06, "Pretrain/Loss": 1.9749743938446045, "Pretrain/Loss (Raw)": 1.9565215110778809, "Pretrain/Step": 8569, "Pretrain/Step Time": 8.491858392953873} +{"Pretrain/Learning Rate": 1.3359155727977745e-06, "Pretrain/Loss": 1.974971055984497, "Pretrain/Loss (Raw)": 2.06793212890625, "Pretrain/Step": 8570, "Pretrain/Step Time": 8.500146156176925} +{"Pretrain/Learning Rate": 1.3331788016219315e-06, "Pretrain/Loss": 1.9754977226257324, "Pretrain/Loss (Raw)": 2.123830556869507, "Pretrain/Step": 8571, "Pretrain/Step Time": 8.499320041388273} +{"Pretrain/Learning Rate": 1.3304447598154274e-06, "Pretrain/Loss": 1.9762883186340332, "Pretrain/Loss (Raw)": 1.908501386642456, "Pretrain/Step": 8572, "Pretrain/Step Time": 8.501174347475171} +{"Pretrain/Learning Rate": 1.3277134476935766e-06, "Pretrain/Loss": 1.9776631593704224, "Pretrain/Loss (Raw)": 2.1740927696228027, "Pretrain/Step": 8573, "Pretrain/Step Time": 8.493707163259387} +{"Pretrain/Learning Rate": 1.324984865571352e-06, "Pretrain/Loss": 1.976876139640808, "Pretrain/Loss (Raw)": 1.8790414333343506, "Pretrain/Step": 8574, "Pretrain/Step Time": 8.497389046475291} +{"Pretrain/Learning Rate": 1.3222590137634328e-06, "Pretrain/Loss": 1.977447509765625, "Pretrain/Loss (Raw)": 1.9188286066055298, "Pretrain/Step": 8575, "Pretrain/Step Time": 8.491523440927267} +{"Pretrain/Learning Rate": 1.319535892584181e-06, "Pretrain/Loss": 1.9794225692749023, "Pretrain/Loss (Raw)": 1.950614333152771, "Pretrain/Step": 8576, "Pretrain/Step Time": 8.500834388658404} +{"Pretrain/Learning Rate": 1.3168155023476348e-06, "Pretrain/Loss": 1.9799010753631592, "Pretrain/Loss (Raw)": 2.057781457901001, "Pretrain/Step": 8577, "Pretrain/Step Time": 8.508864637464285} +{"Pretrain/Learning Rate": 1.3140978433675206e-06, "Pretrain/Loss": 1.9782397747039795, "Pretrain/Loss (Raw)": 1.7907640933990479, "Pretrain/Step": 8578, "Pretrain/Step Time": 8.504290878772736} +{"Pretrain/Learning Rate": 1.3113829159572572e-06, "Pretrain/Loss": 1.9817092418670654, "Pretrain/Loss (Raw)": 2.0737316608428955, "Pretrain/Step": 8579, "Pretrain/Step Time": 8.516701832413673} +{"Pretrain/Learning Rate": 1.3086707204299414e-06, "Pretrain/Loss": 1.9818401336669922, "Pretrain/Loss (Raw)": 2.0167124271392822, "Pretrain/Step": 8580, "Pretrain/Step Time": 8.51939045637846} +{"Pretrain/Learning Rate": 1.3059612570983537e-06, "Pretrain/Loss": 1.9821290969848633, "Pretrain/Loss (Raw)": 2.111056089401245, "Pretrain/Step": 8581, "Pretrain/Step Time": 8.519528090953827} +{"Pretrain/Learning Rate": 1.3032545262749635e-06, "Pretrain/Loss": 1.9848449230194092, "Pretrain/Loss (Raw)": 2.44409441947937, "Pretrain/Step": 8582, "Pretrain/Step Time": 8.523970576003194} +{"Pretrain/Learning Rate": 1.3005505282719238e-06, "Pretrain/Loss": 1.9824726581573486, "Pretrain/Loss (Raw)": 1.7481176853179932, "Pretrain/Step": 8583, "Pretrain/Step Time": 8.527303459122777} +{"Pretrain/Learning Rate": 1.297849263401074e-06, "Pretrain/Loss": 1.9819929599761963, "Pretrain/Loss (Raw)": 1.9731252193450928, "Pretrain/Step": 8584, "Pretrain/Step Time": 8.52364875562489} +{"Pretrain/Learning Rate": 1.2951507319739375e-06, "Pretrain/Loss": 1.9823729991912842, "Pretrain/Loss (Raw)": 2.0176093578338623, "Pretrain/Step": 8585, "Pretrain/Step Time": 8.517719311639667} +{"Pretrain/Learning Rate": 1.2924549343017122e-06, "Pretrain/Loss": 1.9821810722351074, "Pretrain/Loss (Raw)": 1.8293157815933228, "Pretrain/Step": 8586, "Pretrain/Step Time": 8.51931249909103} +{"Pretrain/Learning Rate": 1.289761870695305e-06, "Pretrain/Loss": 1.982478380203247, "Pretrain/Loss (Raw)": 1.9869780540466309, "Pretrain/Step": 8587, "Pretrain/Step Time": 8.521233094856143} +{"Pretrain/Learning Rate": 1.2870715414652817e-06, "Pretrain/Loss": 1.9830825328826904, "Pretrain/Loss (Raw)": 2.045624256134033, "Pretrain/Step": 8588, "Pretrain/Step Time": 8.52035447396338} +{"Pretrain/Learning Rate": 1.2843839469219104e-06, "Pretrain/Loss": 1.985334873199463, "Pretrain/Loss (Raw)": 2.1629316806793213, "Pretrain/Step": 8589, "Pretrain/Step Time": 8.53089209087193} +{"Pretrain/Learning Rate": 1.2816990873751267e-06, "Pretrain/Loss": 1.9834308624267578, "Pretrain/Loss (Raw)": 1.928454041481018, "Pretrain/Step": 8590, "Pretrain/Step Time": 8.522612662985921} +{"Pretrain/Learning Rate": 1.2790169631345744e-06, "Pretrain/Loss": 1.981982707977295, "Pretrain/Loss (Raw)": 1.808586597442627, "Pretrain/Step": 8591, "Pretrain/Step Time": 8.52454199641943} +{"Pretrain/Learning Rate": 1.2763375745095645e-06, "Pretrain/Loss": 1.981353998184204, "Pretrain/Loss (Raw)": 2.0334436893463135, "Pretrain/Step": 8592, "Pretrain/Step Time": 8.523880697786808} +{"Pretrain/Learning Rate": 1.2736609218090888e-06, "Pretrain/Loss": 1.979197382926941, "Pretrain/Loss (Raw)": 1.7477757930755615, "Pretrain/Step": 8593, "Pretrain/Step Time": 8.522956749424338} +{"Pretrain/Learning Rate": 1.2709870053418421e-06, "Pretrain/Loss": 1.9804644584655762, "Pretrain/Loss (Raw)": 2.291355848312378, "Pretrain/Step": 8594, "Pretrain/Step Time": 8.526250364258885} +{"Pretrain/Learning Rate": 1.2683158254161887e-06, "Pretrain/Loss": 1.9801318645477295, "Pretrain/Loss (Raw)": 1.9561033248901367, "Pretrain/Step": 8595, "Pretrain/Step Time": 8.535703208297491} +{"Pretrain/Learning Rate": 1.2656473823401821e-06, "Pretrain/Loss": 1.976423740386963, "Pretrain/Loss (Raw)": 1.8151088953018188, "Pretrain/Step": 8596, "Pretrain/Step Time": 8.537123678252101} +{"Pretrain/Learning Rate": 1.2629816764215542e-06, "Pretrain/Loss": 1.9726316928863525, "Pretrain/Loss (Raw)": 1.7079085111618042, "Pretrain/Step": 8597, "Pretrain/Step Time": 8.529520275071263} +{"Pretrain/Learning Rate": 1.2603187079677392e-06, "Pretrain/Loss": 1.9725422859191895, "Pretrain/Loss (Raw)": 1.9234691858291626, "Pretrain/Step": 8598, "Pretrain/Step Time": 8.530792193487287} +{"Pretrain/Learning Rate": 1.2576584772858307e-06, "Pretrain/Loss": 1.9748649597167969, "Pretrain/Loss (Raw)": 2.154787302017212, "Pretrain/Step": 8599, "Pretrain/Step Time": 8.522901594638824} +{"Pretrain/Learning Rate": 1.2550009846826277e-06, "Pretrain/Loss": 1.974606990814209, "Pretrain/Loss (Raw)": 2.056797504425049, "Pretrain/Step": 8600, "Pretrain/Step Time": 8.52193439938128} +{"Pretrain/Learning Rate": 1.2523462304645961e-06, "Pretrain/Loss": 1.976264238357544, "Pretrain/Loss (Raw)": 1.9072515964508057, "Pretrain/Step": 8601, "Pretrain/Step Time": 8.52791658975184} +{"Pretrain/Learning Rate": 1.2496942149379048e-06, "Pretrain/Loss": 1.9762017726898193, "Pretrain/Loss (Raw)": 1.9397915601730347, "Pretrain/Step": 8602, "Pretrain/Step Time": 8.532861087471247} +{"Pretrain/Learning Rate": 1.2470449384083927e-06, "Pretrain/Loss": 1.9753131866455078, "Pretrain/Loss (Raw)": 1.992045283317566, "Pretrain/Step": 8603, "Pretrain/Step Time": 8.52726961672306} +{"Pretrain/Learning Rate": 1.2443984011815845e-06, "Pretrain/Loss": 1.9759777784347534, "Pretrain/Loss (Raw)": 2.0832149982452393, "Pretrain/Step": 8604, "Pretrain/Step Time": 8.528783306479454} +{"Pretrain/Learning Rate": 1.2417546035626864e-06, "Pretrain/Loss": 1.9749186038970947, "Pretrain/Loss (Raw)": 1.8593814373016357, "Pretrain/Step": 8605, "Pretrain/Step Time": 8.527807971462607} +{"Pretrain/Learning Rate": 1.2391135458566072e-06, "Pretrain/Loss": 1.9728734493255615, "Pretrain/Loss (Raw)": 1.8124345541000366, "Pretrain/Step": 8606, "Pretrain/Step Time": 8.531027741730213} +{"Pretrain/Learning Rate": 1.236475228367917e-06, "Pretrain/Loss": 1.9744408130645752, "Pretrain/Loss (Raw)": 2.1396474838256836, "Pretrain/Step": 8607, "Pretrain/Step Time": 8.536096394062042} +{"Pretrain/Learning Rate": 1.2338396514008839e-06, "Pretrain/Loss": 1.9753563404083252, "Pretrain/Loss (Raw)": 2.1182785034179688, "Pretrain/Step": 8608, "Pretrain/Step Time": 8.533447021618485} +{"Pretrain/Learning Rate": 1.2312068152594447e-06, "Pretrain/Loss": 1.9732377529144287, "Pretrain/Loss (Raw)": 1.9607913494110107, "Pretrain/Step": 8609, "Pretrain/Step Time": 8.52846247330308} +{"Pretrain/Learning Rate": 1.228576720247246e-06, "Pretrain/Loss": 1.9736684560775757, "Pretrain/Loss (Raw)": 2.0811002254486084, "Pretrain/Step": 8610, "Pretrain/Step Time": 8.522134866565466} +{"Pretrain/Learning Rate": 1.2259493666675891e-06, "Pretrain/Loss": 1.9736948013305664, "Pretrain/Loss (Raw)": 1.8695322275161743, "Pretrain/Step": 8611, "Pretrain/Step Time": 8.514356004074216} +{"Pretrain/Learning Rate": 1.2233247548234795e-06, "Pretrain/Loss": 1.9721119403839111, "Pretrain/Loss (Raw)": 1.8250668048858643, "Pretrain/Step": 8612, "Pretrain/Step Time": 8.523632641881704} +{"Pretrain/Learning Rate": 1.2207028850175967e-06, "Pretrain/Loss": 1.9730339050292969, "Pretrain/Loss (Raw)": 1.95853853225708, "Pretrain/Step": 8613, "Pretrain/Step Time": 8.531307635828853} +{"Pretrain/Learning Rate": 1.2180837575523158e-06, "Pretrain/Loss": 1.973158597946167, "Pretrain/Loss (Raw)": 2.1518642902374268, "Pretrain/Step": 8614, "Pretrain/Step Time": 8.528600126504898} +{"Pretrain/Learning Rate": 1.2154673727296728e-06, "Pretrain/Loss": 1.9731314182281494, "Pretrain/Loss (Raw)": 1.895369529724121, "Pretrain/Step": 8615, "Pretrain/Step Time": 8.518557192757726} +{"Pretrain/Learning Rate": 1.21285373085141e-06, "Pretrain/Loss": 1.973357081413269, "Pretrain/Loss (Raw)": 1.9684749841690063, "Pretrain/Step": 8616, "Pretrain/Step Time": 8.518939087167382} +{"Pretrain/Learning Rate": 1.2102428322189468e-06, "Pretrain/Loss": 1.972761869430542, "Pretrain/Loss (Raw)": 1.9492542743682861, "Pretrain/Step": 8617, "Pretrain/Step Time": 8.518480941653252} +{"Pretrain/Learning Rate": 1.207634677133379e-06, "Pretrain/Loss": 1.974853515625, "Pretrain/Loss (Raw)": 2.251253843307495, "Pretrain/Step": 8618, "Pretrain/Step Time": 8.525203879922628} +{"Pretrain/Learning Rate": 1.205029265895491e-06, "Pretrain/Loss": 1.9734787940979004, "Pretrain/Loss (Raw)": 1.9201014041900635, "Pretrain/Step": 8619, "Pretrain/Step Time": 8.528736976906657} +{"Pretrain/Learning Rate": 1.2024265988057588e-06, "Pretrain/Loss": 1.9712591171264648, "Pretrain/Loss (Raw)": 1.8818352222442627, "Pretrain/Step": 8620, "Pretrain/Step Time": 8.528560139238834} +{"Pretrain/Learning Rate": 1.1998266761643256e-06, "Pretrain/Loss": 1.9724398851394653, "Pretrain/Loss (Raw)": 2.230480909347534, "Pretrain/Step": 8621, "Pretrain/Step Time": 8.528505088761449} +{"Pretrain/Learning Rate": 1.1972294982710326e-06, "Pretrain/Loss": 1.971081256866455, "Pretrain/Loss (Raw)": 1.7487064599990845, "Pretrain/Step": 8622, "Pretrain/Step Time": 8.516537718474865} +{"Pretrain/Learning Rate": 1.1946350654253924e-06, "Pretrain/Loss": 1.9706213474273682, "Pretrain/Loss (Raw)": 2.0034537315368652, "Pretrain/Step": 8623, "Pretrain/Step Time": 8.512137459591031} +{"Pretrain/Learning Rate": 1.192043377926616e-06, "Pretrain/Loss": 1.9686412811279297, "Pretrain/Loss (Raw)": 1.906717300415039, "Pretrain/Step": 8624, "Pretrain/Step Time": 8.517500553280115} +{"Pretrain/Learning Rate": 1.189454436073581e-06, "Pretrain/Loss": 1.9681086540222168, "Pretrain/Loss (Raw)": 1.9864323139190674, "Pretrain/Step": 8625, "Pretrain/Step Time": 8.520956993103027} +{"Pretrain/Learning Rate": 1.1868682401648595e-06, "Pretrain/Loss": 1.9688563346862793, "Pretrain/Loss (Raw)": 1.9301358461380005, "Pretrain/Step": 8626, "Pretrain/Step Time": 8.517226047813892} +{"Pretrain/Learning Rate": 1.184284790498702e-06, "Pretrain/Loss": 1.9686758518218994, "Pretrain/Loss (Raw)": 2.1097218990325928, "Pretrain/Step": 8627, "Pretrain/Step Time": 8.519151609390974} +{"Pretrain/Learning Rate": 1.1817040873730506e-06, "Pretrain/Loss": 1.9685735702514648, "Pretrain/Loss (Raw)": 1.8086564540863037, "Pretrain/Step": 8628, "Pretrain/Step Time": 8.511852636933327} +{"Pretrain/Learning Rate": 1.1791261310855172e-06, "Pretrain/Loss": 1.9689117670059204, "Pretrain/Loss (Raw)": 2.041032314300537, "Pretrain/Step": 8629, "Pretrain/Step Time": 8.511858139187098} +{"Pretrain/Learning Rate": 1.1765509219334058e-06, "Pretrain/Loss": 1.9701170921325684, "Pretrain/Loss (Raw)": 2.0049171447753906, "Pretrain/Step": 8630, "Pretrain/Step Time": 8.512491062283516} +{"Pretrain/Learning Rate": 1.1739784602136983e-06, "Pretrain/Loss": 1.969887137413025, "Pretrain/Loss (Raw)": 2.1000850200653076, "Pretrain/Step": 8631, "Pretrain/Step Time": 8.516692079603672} +{"Pretrain/Learning Rate": 1.171408746223071e-06, "Pretrain/Loss": 1.9750754833221436, "Pretrain/Loss (Raw)": 2.478494882583618, "Pretrain/Step": 8632, "Pretrain/Step Time": 8.518640583381057} +{"Pretrain/Learning Rate": 1.1688417802578706e-06, "Pretrain/Loss": 1.9754447937011719, "Pretrain/Loss (Raw)": 1.8053139448165894, "Pretrain/Step": 8633, "Pretrain/Step Time": 8.51208127476275} +{"Pretrain/Learning Rate": 1.1662775626141293e-06, "Pretrain/Loss": 1.9771944284439087, "Pretrain/Loss (Raw)": 2.3553028106689453, "Pretrain/Step": 8634, "Pretrain/Step Time": 8.507450049743056} +{"Pretrain/Learning Rate": 1.1637160935875717e-06, "Pretrain/Loss": 1.9766021966934204, "Pretrain/Loss (Raw)": 1.9280881881713867, "Pretrain/Step": 8635, "Pretrain/Step Time": 8.510717356577516} +{"Pretrain/Learning Rate": 1.1611573734735925e-06, "Pretrain/Loss": 1.9756712913513184, "Pretrain/Loss (Raw)": 1.9046393632888794, "Pretrain/Step": 8636, "Pretrain/Step Time": 8.510724252089858} +{"Pretrain/Learning Rate": 1.1586014025672775e-06, "Pretrain/Loss": 1.9784855842590332, "Pretrain/Loss (Raw)": 2.140794277191162, "Pretrain/Step": 8637, "Pretrain/Step Time": 8.512937309220433} +{"Pretrain/Learning Rate": 1.1560481811633912e-06, "Pretrain/Loss": 1.9809794425964355, "Pretrain/Loss (Raw)": 2.4764673709869385, "Pretrain/Step": 8638, "Pretrain/Step Time": 8.51537954248488} +{"Pretrain/Learning Rate": 1.1534977095563892e-06, "Pretrain/Loss": 1.9811010360717773, "Pretrain/Loss (Raw)": 1.9457331895828247, "Pretrain/Step": 8639, "Pretrain/Step Time": 8.510896105319262} +{"Pretrain/Learning Rate": 1.1509499880403979e-06, "Pretrain/Loss": 1.98450767993927, "Pretrain/Loss (Raw)": 2.1526806354522705, "Pretrain/Step": 8640, "Pretrain/Step Time": 8.51151036657393} +{"Pretrain/Learning Rate": 1.1484050169092347e-06, "Pretrain/Loss": 1.9840426445007324, "Pretrain/Loss (Raw)": 2.014268398284912, "Pretrain/Step": 8641, "Pretrain/Step Time": 8.511504363268614} +{"Pretrain/Learning Rate": 1.1458627964563928e-06, "Pretrain/Loss": 1.9822642803192139, "Pretrain/Loss (Raw)": 1.7830744981765747, "Pretrain/Step": 8642, "Pretrain/Step Time": 8.51147104986012} +{"Pretrain/Learning Rate": 1.1433233269750627e-06, "Pretrain/Loss": 1.9806947708129883, "Pretrain/Loss (Raw)": 1.8850175142288208, "Pretrain/Step": 8643, "Pretrain/Step Time": 8.509941762313247} +{"Pretrain/Learning Rate": 1.1407866087581043e-06, "Pretrain/Loss": 1.98389732837677, "Pretrain/Loss (Raw)": 2.115896224975586, "Pretrain/Step": 8644, "Pretrain/Step Time": 8.512612231075764} +{"Pretrain/Learning Rate": 1.1382526420980588e-06, "Pretrain/Loss": 1.9785284996032715, "Pretrain/Loss (Raw)": 1.4400914907455444, "Pretrain/Step": 8645, "Pretrain/Step Time": 8.503802210092545} +{"Pretrain/Learning Rate": 1.135721427287159e-06, "Pretrain/Loss": 1.978471279144287, "Pretrain/Loss (Raw)": 1.9228694438934326, "Pretrain/Step": 8646, "Pretrain/Step Time": 8.501232521608472} +{"Pretrain/Learning Rate": 1.1331929646173162e-06, "Pretrain/Loss": 1.9793052673339844, "Pretrain/Loss (Raw)": 2.005009412765503, "Pretrain/Step": 8647, "Pretrain/Step Time": 8.509380275383592} +{"Pretrain/Learning Rate": 1.1306672543801273e-06, "Pretrain/Loss": 1.9781991243362427, "Pretrain/Loss (Raw)": 1.8993556499481201, "Pretrain/Step": 8648, "Pretrain/Step Time": 8.502977224066854} +{"Pretrain/Learning Rate": 1.1281442968668648e-06, "Pretrain/Loss": 1.9810574054718018, "Pretrain/Loss (Raw)": 2.1370890140533447, "Pretrain/Step": 8649, "Pretrain/Step Time": 8.505421621724963} +{"Pretrain/Learning Rate": 1.125624092368488e-06, "Pretrain/Loss": 1.9831563234329224, "Pretrain/Loss (Raw)": 2.068085193634033, "Pretrain/Step": 8650, "Pretrain/Step Time": 8.507583819329739} +{"Pretrain/Learning Rate": 1.1231066411756475e-06, "Pretrain/Loss": 1.9831368923187256, "Pretrain/Loss (Raw)": 1.9941459894180298, "Pretrain/Step": 8651, "Pretrain/Step Time": 8.495237048715353} +{"Pretrain/Learning Rate": 1.1205919435786554e-06, "Pretrain/Loss": 1.9828412532806396, "Pretrain/Loss (Raw)": 2.0703229904174805, "Pretrain/Step": 8652, "Pretrain/Step Time": 8.491176204755902} +{"Pretrain/Learning Rate": 1.1180799998675245e-06, "Pretrain/Loss": 1.9817347526550293, "Pretrain/Loss (Raw)": 1.9745484590530396, "Pretrain/Step": 8653, "Pretrain/Step Time": 8.497153714299202} +{"Pretrain/Learning Rate": 1.1155708103319395e-06, "Pretrain/Loss": 1.9807021617889404, "Pretrain/Loss (Raw)": 1.9644381999969482, "Pretrain/Step": 8654, "Pretrain/Step Time": 8.492327064275742} +{"Pretrain/Learning Rate": 1.1130643752612858e-06, "Pretrain/Loss": 1.9817214012145996, "Pretrain/Loss (Raw)": 2.0876576900482178, "Pretrain/Step": 8655, "Pretrain/Step Time": 8.50405479222536} +{"Pretrain/Learning Rate": 1.1105606949445984e-06, "Pretrain/Loss": 1.9811899662017822, "Pretrain/Loss (Raw)": 1.886722207069397, "Pretrain/Step": 8656, "Pretrain/Step Time": 8.511673238128424} +{"Pretrain/Learning Rate": 1.1080597696706247e-06, "Pretrain/Loss": 1.9816765785217285, "Pretrain/Loss (Raw)": 2.1131601333618164, "Pretrain/Step": 8657, "Pretrain/Step Time": 8.508706845343113} +{"Pretrain/Learning Rate": 1.1055615997277806e-06, "Pretrain/Loss": 1.9814503192901611, "Pretrain/Loss (Raw)": 1.9888166189193726, "Pretrain/Step": 8658, "Pretrain/Step Time": 8.506160845980048} +{"Pretrain/Learning Rate": 1.1030661854041695e-06, "Pretrain/Loss": 1.9858126640319824, "Pretrain/Loss (Raw)": 2.1176512241363525, "Pretrain/Step": 8659, "Pretrain/Step Time": 8.511028859764338} +{"Pretrain/Learning Rate": 1.1005735269875695e-06, "Pretrain/Loss": 1.9879168272018433, "Pretrain/Loss (Raw)": 2.0052735805511475, "Pretrain/Step": 8660, "Pretrain/Step Time": 8.514883851632476} +{"Pretrain/Learning Rate": 1.0980836247654501e-06, "Pretrain/Loss": 1.9882357120513916, "Pretrain/Loss (Raw)": 2.0529592037200928, "Pretrain/Step": 8661, "Pretrain/Step Time": 8.522187514230609} +{"Pretrain/Learning Rate": 1.0955964790249546e-06, "Pretrain/Loss": 1.9889345169067383, "Pretrain/Loss (Raw)": 1.8241841793060303, "Pretrain/Step": 8662, "Pretrain/Step Time": 8.514242066070437} +{"Pretrain/Learning Rate": 1.0931120900529169e-06, "Pretrain/Loss": 1.9900919198989868, "Pretrain/Loss (Raw)": 1.877445936203003, "Pretrain/Step": 8663, "Pretrain/Step Time": 8.512938199564815} +{"Pretrain/Learning Rate": 1.0906304581358411e-06, "Pretrain/Loss": 1.989609956741333, "Pretrain/Loss (Raw)": 2.006758213043213, "Pretrain/Step": 8664, "Pretrain/Step Time": 8.510424494743347} +{"Pretrain/Learning Rate": 1.0881515835599293e-06, "Pretrain/Loss": 1.9914767742156982, "Pretrain/Loss (Raw)": 2.061475992202759, "Pretrain/Step": 8665, "Pretrain/Step Time": 8.523088222369552} +{"Pretrain/Learning Rate": 1.0856754666110553e-06, "Pretrain/Loss": 1.9923902750015259, "Pretrain/Loss (Raw)": 2.162480592727661, "Pretrain/Step": 8666, "Pretrain/Step Time": 8.521965775638819} +{"Pretrain/Learning Rate": 1.0832021075747711e-06, "Pretrain/Loss": 1.9923102855682373, "Pretrain/Loss (Raw)": 2.0002989768981934, "Pretrain/Step": 8667, "Pretrain/Step Time": 8.522267172113061} +{"Pretrain/Learning Rate": 1.0807315067363184e-06, "Pretrain/Loss": 1.994668960571289, "Pretrain/Loss (Raw)": 2.045349597930908, "Pretrain/Step": 8668, "Pretrain/Step Time": 8.51361509412527} +{"Pretrain/Learning Rate": 1.0782636643806215e-06, "Pretrain/Loss": 1.9950580596923828, "Pretrain/Loss (Raw)": 2.1143622398376465, "Pretrain/Step": 8669, "Pretrain/Step Time": 8.51562070287764} +{"Pretrain/Learning Rate": 1.0757985807922838e-06, "Pretrain/Loss": 1.996985673904419, "Pretrain/Loss (Raw)": 2.0499961376190186, "Pretrain/Step": 8670, "Pretrain/Step Time": 8.512183628976345} +{"Pretrain/Learning Rate": 1.073336256255586e-06, "Pretrain/Loss": 1.9973558187484741, "Pretrain/Loss (Raw)": 2.0351388454437256, "Pretrain/Step": 8671, "Pretrain/Step Time": 8.518522994592786} +{"Pretrain/Learning Rate": 1.0708766910544954e-06, "Pretrain/Loss": 1.9971181154251099, "Pretrain/Loss (Raw)": 1.9743950366973877, "Pretrain/Step": 8672, "Pretrain/Step Time": 8.520162422209978} +{"Pretrain/Learning Rate": 1.0684198854726656e-06, "Pretrain/Loss": 1.9983294010162354, "Pretrain/Loss (Raw)": 2.1091854572296143, "Pretrain/Step": 8673, "Pretrain/Step Time": 8.514395646750927} +{"Pretrain/Learning Rate": 1.065965839793423e-06, "Pretrain/Loss": 2.001838207244873, "Pretrain/Loss (Raw)": 2.1957345008850098, "Pretrain/Step": 8674, "Pretrain/Step Time": 8.513170396909118} +{"Pretrain/Learning Rate": 1.0635145542997772e-06, "Pretrain/Loss": 2.0031731128692627, "Pretrain/Loss (Raw)": 2.0623555183410645, "Pretrain/Step": 8675, "Pretrain/Step Time": 8.51606746762991} +{"Pretrain/Learning Rate": 1.0610660292744296e-06, "Pretrain/Loss": 2.0031328201293945, "Pretrain/Loss (Raw)": 1.9987354278564453, "Pretrain/Step": 8676, "Pretrain/Step Time": 8.519463278353214} +{"Pretrain/Learning Rate": 1.0586202649997517e-06, "Pretrain/Loss": 2.0026912689208984, "Pretrain/Loss (Raw)": 1.9196689128875732, "Pretrain/Step": 8677, "Pretrain/Step Time": 8.523816542699933} +{"Pretrain/Learning Rate": 1.0561772617578014e-06, "Pretrain/Loss": 2.0029995441436768, "Pretrain/Loss (Raw)": 2.0009572505950928, "Pretrain/Step": 8678, "Pretrain/Step Time": 8.520468067377806} +{"Pretrain/Learning Rate": 1.0537370198303116e-06, "Pretrain/Loss": 2.0028090476989746, "Pretrain/Loss (Raw)": 2.0249385833740234, "Pretrain/Step": 8679, "Pretrain/Step Time": 8.515423394739628} +{"Pretrain/Learning Rate": 1.0512995394987096e-06, "Pretrain/Loss": 2.003981828689575, "Pretrain/Loss (Raw)": 1.9112823009490967, "Pretrain/Step": 8680, "Pretrain/Step Time": 8.5217670109123} +{"Pretrain/Learning Rate": 1.048864821044096e-06, "Pretrain/Loss": 2.0033369064331055, "Pretrain/Loss (Raw)": 2.109455108642578, "Pretrain/Step": 8681, "Pretrain/Step Time": 8.518375039100647} +{"Pretrain/Learning Rate": 1.0464328647472515e-06, "Pretrain/Loss": 2.003204345703125, "Pretrain/Loss (Raw)": 2.0512380599975586, "Pretrain/Step": 8682, "Pretrain/Step Time": 8.519917108118534} +{"Pretrain/Learning Rate": 1.0440036708886407e-06, "Pretrain/Loss": 2.0016534328460693, "Pretrain/Loss (Raw)": 1.8478575944900513, "Pretrain/Step": 8683, "Pretrain/Step Time": 8.527724649757147} +{"Pretrain/Learning Rate": 1.0415772397484119e-06, "Pretrain/Loss": 1.9992733001708984, "Pretrain/Loss (Raw)": 2.044966459274292, "Pretrain/Step": 8684, "Pretrain/Step Time": 8.527055872604251} +{"Pretrain/Learning Rate": 1.0391535716063938e-06, "Pretrain/Loss": 1.9996048212051392, "Pretrain/Loss (Raw)": 2.1173996925354004, "Pretrain/Step": 8685, "Pretrain/Step Time": 8.528596043586731} +{"Pretrain/Learning Rate": 1.0367326667420907e-06, "Pretrain/Loss": 2.0031890869140625, "Pretrain/Loss (Raw)": 2.4894232749938965, "Pretrain/Step": 8686, "Pretrain/Step Time": 8.525016963481903} +{"Pretrain/Learning Rate": 1.0343145254346931e-06, "Pretrain/Loss": 2.0013043880462646, "Pretrain/Loss (Raw)": 2.01269268989563, "Pretrain/Step": 8687, "Pretrain/Step Time": 8.522533485665917} +{"Pretrain/Learning Rate": 1.031899147963078e-06, "Pretrain/Loss": 2.000460147857666, "Pretrain/Loss (Raw)": 1.8299959897994995, "Pretrain/Step": 8688, "Pretrain/Step Time": 8.52497755549848} +{"Pretrain/Learning Rate": 1.0294865346057947e-06, "Pretrain/Loss": 2.0013413429260254, "Pretrain/Loss (Raw)": 1.767780065536499, "Pretrain/Step": 8689, "Pretrain/Step Time": 8.52475917711854} +{"Pretrain/Learning Rate": 1.0270766856410764e-06, "Pretrain/Loss": 1.9997551441192627, "Pretrain/Loss (Raw)": 1.8440604209899902, "Pretrain/Step": 8690, "Pretrain/Step Time": 8.528882578015327} +{"Pretrain/Learning Rate": 1.0246696013468338e-06, "Pretrain/Loss": 1.9972598552703857, "Pretrain/Loss (Raw)": 1.6772911548614502, "Pretrain/Step": 8691, "Pretrain/Step Time": 8.52648145146668} +{"Pretrain/Learning Rate": 1.0222652820006785e-06, "Pretrain/Loss": 1.9976297616958618, "Pretrain/Loss (Raw)": 2.0167553424835205, "Pretrain/Step": 8692, "Pretrain/Step Time": 8.52393065392971} +{"Pretrain/Learning Rate": 1.019863727879869e-06, "Pretrain/Loss": 1.9971530437469482, "Pretrain/Loss (Raw)": 2.031911849975586, "Pretrain/Step": 8693, "Pretrain/Step Time": 8.520948749035597} +{"Pretrain/Learning Rate": 1.0174649392613755e-06, "Pretrain/Loss": 2.0014615058898926, "Pretrain/Loss (Raw)": 2.127025604248047, "Pretrain/Step": 8694, "Pretrain/Step Time": 8.524317095056176} +{"Pretrain/Learning Rate": 1.0150689164218325e-06, "Pretrain/Loss": 1.99834144115448, "Pretrain/Loss (Raw)": 1.6694700717926025, "Pretrain/Step": 8695, "Pretrain/Step Time": 8.53636565618217} +{"Pretrain/Learning Rate": 1.0126756596375686e-06, "Pretrain/Loss": 1.998678207397461, "Pretrain/Loss (Raw)": 2.008204460144043, "Pretrain/Step": 8696, "Pretrain/Step Time": 8.533185806125402} +{"Pretrain/Learning Rate": 1.0102851691845716e-06, "Pretrain/Loss": 1.9985871315002441, "Pretrain/Loss (Raw)": 1.9448665380477905, "Pretrain/Step": 8697, "Pretrain/Step Time": 8.536226904019713} +{"Pretrain/Learning Rate": 1.0078974453385375e-06, "Pretrain/Loss": 1.9978306293487549, "Pretrain/Loss (Raw)": 1.9710973501205444, "Pretrain/Step": 8698, "Pretrain/Step Time": 8.529166089370847} +{"Pretrain/Learning Rate": 1.0055124883748213e-06, "Pretrain/Loss": 1.9967050552368164, "Pretrain/Loss (Raw)": 1.9797534942626953, "Pretrain/Step": 8699, "Pretrain/Step Time": 8.526880567893386} +{"Pretrain/Learning Rate": 1.0031302985684777e-06, "Pretrain/Loss": 1.9988198280334473, "Pretrain/Loss (Raw)": 2.1792097091674805, "Pretrain/Step": 8700, "Pretrain/Step Time": 8.521798286587} +{"Pretrain/Learning Rate": 1.0007508761942176e-06, "Pretrain/Loss": 1.9978492259979248, "Pretrain/Loss (Raw)": 2.0498621463775635, "Pretrain/Step": 8701, "Pretrain/Step Time": 8.527170099318027} +{"Pretrain/Learning Rate": 9.983742215264575e-07, "Pretrain/Loss": 1.9987685680389404, "Pretrain/Loss (Raw)": 1.9966964721679688, "Pretrain/Step": 8702, "Pretrain/Step Time": 8.531927205622196} +{"Pretrain/Learning Rate": 9.96000334839281e-07, "Pretrain/Loss": 1.999664545059204, "Pretrain/Loss (Raw)": 2.0335121154785156, "Pretrain/Step": 8703, "Pretrain/Step Time": 8.53416240774095} +{"Pretrain/Learning Rate": 9.93629216406458e-07, "Pretrain/Loss": 2.0014848709106445, "Pretrain/Loss (Raw)": 2.183624744415283, "Pretrain/Step": 8704, "Pretrain/Step Time": 8.529218705371022} +{"Pretrain/Learning Rate": 9.91260866501431e-07, "Pretrain/Loss": 2.000549554824829, "Pretrain/Loss (Raw)": 1.938052773475647, "Pretrain/Step": 8705, "Pretrain/Step Time": 8.520079899579287} +{"Pretrain/Learning Rate": 9.888952853973371e-07, "Pretrain/Loss": 2.003796100616455, "Pretrain/Loss (Raw)": 2.2063329219818115, "Pretrain/Step": 8706, "Pretrain/Step Time": 8.519159480929375} +{"Pretrain/Learning Rate": 9.86532473366983e-07, "Pretrain/Loss": 2.003917694091797, "Pretrain/Loss (Raw)": 2.08929443359375, "Pretrain/Step": 8707, "Pretrain/Step Time": 8.514734331518412} +{"Pretrain/Learning Rate": 9.841724306828587e-07, "Pretrain/Loss": 2.007347583770752, "Pretrain/Loss (Raw)": 2.45572566986084, "Pretrain/Step": 8708, "Pretrain/Step Time": 8.512620072811842} +{"Pretrain/Learning Rate": 9.818151576171358e-07, "Pretrain/Loss": 2.006681203842163, "Pretrain/Loss (Raw)": 2.02577543258667, "Pretrain/Step": 8709, "Pretrain/Step Time": 8.511027418076992} +{"Pretrain/Learning Rate": 9.794606544416662e-07, "Pretrain/Loss": 2.0027265548706055, "Pretrain/Loss (Raw)": 1.9379140138626099, "Pretrain/Step": 8710, "Pretrain/Step Time": 8.508150419220328} +{"Pretrain/Learning Rate": 9.771089214279827e-07, "Pretrain/Loss": 2.0056676864624023, "Pretrain/Loss (Raw)": 2.1245505809783936, "Pretrain/Step": 8711, "Pretrain/Step Time": 8.503669146448374} +{"Pretrain/Learning Rate": 9.74759958847299e-07, "Pretrain/Loss": 2.0048305988311768, "Pretrain/Loss (Raw)": 1.8659917116165161, "Pretrain/Step": 8712, "Pretrain/Step Time": 8.500445425510406} +{"Pretrain/Learning Rate": 9.724137669705036e-07, "Pretrain/Loss": 2.0062708854675293, "Pretrain/Loss (Raw)": 2.20196533203125, "Pretrain/Step": 8713, "Pretrain/Step Time": 8.515737289562821} +{"Pretrain/Learning Rate": 9.700703460681803e-07, "Pretrain/Loss": 2.0075724124908447, "Pretrain/Loss (Raw)": 1.995887279510498, "Pretrain/Step": 8714, "Pretrain/Step Time": 8.514425441622734} +{"Pretrain/Learning Rate": 9.677296964105742e-07, "Pretrain/Loss": 2.007509231567383, "Pretrain/Loss (Raw)": 1.9788981676101685, "Pretrain/Step": 8715, "Pretrain/Step Time": 8.51593093201518} +{"Pretrain/Learning Rate": 9.653918182676218e-07, "Pretrain/Loss": 2.006629705429077, "Pretrain/Loss (Raw)": 1.9330371618270874, "Pretrain/Step": 8716, "Pretrain/Step Time": 8.515035729855299} +{"Pretrain/Learning Rate": 9.630567119089412e-07, "Pretrain/Loss": 2.0061440467834473, "Pretrain/Loss (Raw)": 2.100804090499878, "Pretrain/Step": 8717, "Pretrain/Step Time": 8.504420634359121} +{"Pretrain/Learning Rate": 9.607243776038278e-07, "Pretrain/Loss": 2.007110595703125, "Pretrain/Loss (Raw)": 2.052159309387207, "Pretrain/Step": 8718, "Pretrain/Step Time": 8.511613411828876} +{"Pretrain/Learning Rate": 9.583948156212552e-07, "Pretrain/Loss": 2.0101728439331055, "Pretrain/Loss (Raw)": 2.2005398273468018, "Pretrain/Step": 8719, "Pretrain/Step Time": 8.509192129597068} +{"Pretrain/Learning Rate": 9.560680262298783e-07, "Pretrain/Loss": 2.0091915130615234, "Pretrain/Loss (Raw)": 1.9078456163406372, "Pretrain/Step": 8720, "Pretrain/Step Time": 8.518312318250537} +{"Pretrain/Learning Rate": 9.537440096980377e-07, "Pretrain/Loss": 2.0101873874664307, "Pretrain/Loss (Raw)": 1.8752562999725342, "Pretrain/Step": 8721, "Pretrain/Step Time": 8.518160350620747} +{"Pretrain/Learning Rate": 9.514227662937469e-07, "Pretrain/Loss": 2.0071983337402344, "Pretrain/Loss (Raw)": 1.9087584018707275, "Pretrain/Step": 8722, "Pretrain/Step Time": 8.515810955315828} +{"Pretrain/Learning Rate": 9.49104296284703e-07, "Pretrain/Loss": 2.007631540298462, "Pretrain/Loss (Raw)": 2.011542558670044, "Pretrain/Step": 8723, "Pretrain/Step Time": 8.510755674913526} +{"Pretrain/Learning Rate": 9.467885999382809e-07, "Pretrain/Loss": 2.01043701171875, "Pretrain/Loss (Raw)": 2.174187183380127, "Pretrain/Step": 8724, "Pretrain/Step Time": 8.514603115618229} +{"Pretrain/Learning Rate": 9.444756775215446e-07, "Pretrain/Loss": 2.0129966735839844, "Pretrain/Loss (Raw)": 2.035576343536377, "Pretrain/Step": 8725, "Pretrain/Step Time": 8.51851181127131} +{"Pretrain/Learning Rate": 9.421655293012227e-07, "Pretrain/Loss": 2.012739658355713, "Pretrain/Loss (Raw)": 1.890557885169983, "Pretrain/Step": 8726, "Pretrain/Step Time": 8.513924639672041} +{"Pretrain/Learning Rate": 9.398581555437408e-07, "Pretrain/Loss": 2.013662815093994, "Pretrain/Loss (Raw)": 2.272974729537964, "Pretrain/Step": 8727, "Pretrain/Step Time": 8.514545861631632} +{"Pretrain/Learning Rate": 9.375535565151861e-07, "Pretrain/Loss": 2.0132954120635986, "Pretrain/Loss (Raw)": 2.0097615718841553, "Pretrain/Step": 8728, "Pretrain/Step Time": 8.513393253087997} +{"Pretrain/Learning Rate": 9.352517324813431e-07, "Pretrain/Loss": 2.0145366191864014, "Pretrain/Loss (Raw)": 2.066133975982666, "Pretrain/Step": 8729, "Pretrain/Step Time": 8.508604440838099} +{"Pretrain/Learning Rate": 9.329526837076691e-07, "Pretrain/Loss": 2.0140976905822754, "Pretrain/Loss (Raw)": 1.883562445640564, "Pretrain/Step": 8730, "Pretrain/Step Time": 8.509339986369014} +{"Pretrain/Learning Rate": 9.306564104592963e-07, "Pretrain/Loss": 2.0133073329925537, "Pretrain/Loss (Raw)": 1.8909127712249756, "Pretrain/Step": 8731, "Pretrain/Step Time": 8.51558762602508} +{"Pretrain/Learning Rate": 9.283629130010463e-07, "Pretrain/Loss": 2.0113844871520996, "Pretrain/Loss (Raw)": 1.8370630741119385, "Pretrain/Step": 8732, "Pretrain/Step Time": 8.517536889761686} +{"Pretrain/Learning Rate": 9.260721915974158e-07, "Pretrain/Loss": 2.0119071006774902, "Pretrain/Loss (Raw)": 1.9263209104537964, "Pretrain/Step": 8733, "Pretrain/Step Time": 8.517904607579112} +{"Pretrain/Learning Rate": 9.237842465125768e-07, "Pretrain/Loss": 2.013370990753174, "Pretrain/Loss (Raw)": 1.9997789859771729, "Pretrain/Step": 8734, "Pretrain/Step Time": 8.514367016032338} +{"Pretrain/Learning Rate": 9.214990780103932e-07, "Pretrain/Loss": 2.0124049186706543, "Pretrain/Loss (Raw)": 2.015995979309082, "Pretrain/Step": 8735, "Pretrain/Step Time": 8.512605488300323} +{"Pretrain/Learning Rate": 9.192166863543933e-07, "Pretrain/Loss": 2.0142648220062256, "Pretrain/Loss (Raw)": 2.356361150741577, "Pretrain/Step": 8736, "Pretrain/Step Time": 8.50895831361413} +{"Pretrain/Learning Rate": 9.169370718078024e-07, "Pretrain/Loss": 2.0138864517211914, "Pretrain/Loss (Raw)": 1.9123835563659668, "Pretrain/Step": 8737, "Pretrain/Step Time": 8.516561422497034} +{"Pretrain/Learning Rate": 9.146602346335075e-07, "Pretrain/Loss": 2.012228488922119, "Pretrain/Loss (Raw)": 1.8688349723815918, "Pretrain/Step": 8738, "Pretrain/Step Time": 8.519825739786029} +{"Pretrain/Learning Rate": 9.123861750940904e-07, "Pretrain/Loss": 2.012436866760254, "Pretrain/Loss (Raw)": 1.8962273597717285, "Pretrain/Step": 8739, "Pretrain/Step Time": 8.52352087572217} +{"Pretrain/Learning Rate": 9.101148934518022e-07, "Pretrain/Loss": 2.0140984058380127, "Pretrain/Loss (Raw)": 2.0377376079559326, "Pretrain/Step": 8740, "Pretrain/Step Time": 8.513051288202405} +{"Pretrain/Learning Rate": 9.078463899685835e-07, "Pretrain/Loss": 2.0135645866394043, "Pretrain/Loss (Raw)": 1.8901946544647217, "Pretrain/Step": 8741, "Pretrain/Step Time": 8.506766917183995} +{"Pretrain/Learning Rate": 9.055806649060416e-07, "Pretrain/Loss": 2.0116114616394043, "Pretrain/Loss (Raw)": 1.9018698930740356, "Pretrain/Step": 8742, "Pretrain/Step Time": 8.511280875653028} +{"Pretrain/Learning Rate": 9.033177185254732e-07, "Pretrain/Loss": 2.015263080596924, "Pretrain/Loss (Raw)": 2.36279559135437, "Pretrain/Step": 8743, "Pretrain/Step Time": 8.520899906754494} +{"Pretrain/Learning Rate": 9.010575510878555e-07, "Pretrain/Loss": 2.016864776611328, "Pretrain/Loss (Raw)": 2.17348575592041, "Pretrain/Step": 8744, "Pretrain/Step Time": 8.523236256092787} +{"Pretrain/Learning Rate": 8.988001628538411e-07, "Pretrain/Loss": 2.0183818340301514, "Pretrain/Loss (Raw)": 2.143446207046509, "Pretrain/Step": 8745, "Pretrain/Step Time": 8.523446535691619} +{"Pretrain/Learning Rate": 8.965455540837553e-07, "Pretrain/Loss": 2.0179696083068848, "Pretrain/Loss (Raw)": 2.1984899044036865, "Pretrain/Step": 8746, "Pretrain/Step Time": 8.51544651761651} +{"Pretrain/Learning Rate": 8.942937250376176e-07, "Pretrain/Loss": 2.0178611278533936, "Pretrain/Loss (Raw)": 1.9062126874923706, "Pretrain/Step": 8747, "Pretrain/Step Time": 8.511037461459637} +{"Pretrain/Learning Rate": 8.920446759751177e-07, "Pretrain/Loss": 2.016911029815674, "Pretrain/Loss (Raw)": 1.760196566581726, "Pretrain/Step": 8748, "Pretrain/Step Time": 8.513280805200338} +{"Pretrain/Learning Rate": 8.897984071556259e-07, "Pretrain/Loss": 2.0125699043273926, "Pretrain/Loss (Raw)": 1.6748405694961548, "Pretrain/Step": 8749, "Pretrain/Step Time": 8.518251031637192} +{"Pretrain/Learning Rate": 8.875549188381904e-07, "Pretrain/Loss": 2.008040428161621, "Pretrain/Loss (Raw)": 1.168917179107666, "Pretrain/Step": 8750, "Pretrain/Step Time": 8.518963132053614} +{"Pretrain/Learning Rate": 8.85314211281546e-07, "Pretrain/Loss": 2.0079808235168457, "Pretrain/Loss (Raw)": 1.995842456817627, "Pretrain/Step": 8751, "Pretrain/Step Time": 8.525177329778671} +{"Pretrain/Learning Rate": 8.830762847440998e-07, "Pretrain/Loss": 2.009718418121338, "Pretrain/Loss (Raw)": 2.129148483276367, "Pretrain/Step": 8752, "Pretrain/Step Time": 8.517339687794447} +{"Pretrain/Learning Rate": 8.808411394839372e-07, "Pretrain/Loss": 2.009754180908203, "Pretrain/Loss (Raw)": 1.9909913539886475, "Pretrain/Step": 8753, "Pretrain/Step Time": 8.51386190019548} +{"Pretrain/Learning Rate": 8.786087757588269e-07, "Pretrain/Loss": 2.0092804431915283, "Pretrain/Loss (Raw)": 1.869486927986145, "Pretrain/Step": 8754, "Pretrain/Step Time": 8.517684517428279} +{"Pretrain/Learning Rate": 8.763791938262184e-07, "Pretrain/Loss": 2.008756637573242, "Pretrain/Loss (Raw)": 2.04266619682312, "Pretrain/Step": 8755, "Pretrain/Step Time": 8.528081668540835} +{"Pretrain/Learning Rate": 8.741523939432339e-07, "Pretrain/Loss": 2.0091042518615723, "Pretrain/Loss (Raw)": 1.853183388710022, "Pretrain/Step": 8756, "Pretrain/Step Time": 8.523653166368604} +{"Pretrain/Learning Rate": 8.719283763666792e-07, "Pretrain/Loss": 2.0087311267852783, "Pretrain/Loss (Raw)": 1.9932334423065186, "Pretrain/Step": 8757, "Pretrain/Step Time": 8.51788454130292} +{"Pretrain/Learning Rate": 8.697071413530433e-07, "Pretrain/Loss": 2.0055184364318848, "Pretrain/Loss (Raw)": 1.5937026739120483, "Pretrain/Step": 8758, "Pretrain/Step Time": 8.517110139131546} +{"Pretrain/Learning Rate": 8.674886891584827e-07, "Pretrain/Loss": 2.0057144165039062, "Pretrain/Loss (Raw)": 2.125175952911377, "Pretrain/Step": 8759, "Pretrain/Step Time": 8.510230535641313} +{"Pretrain/Learning Rate": 8.652730200388426e-07, "Pretrain/Loss": 1.9994759559631348, "Pretrain/Loss (Raw)": 1.6799852848052979, "Pretrain/Step": 8760, "Pretrain/Step Time": 8.516445668414235} +{"Pretrain/Learning Rate": 8.630601342496436e-07, "Pretrain/Loss": 2.0015344619750977, "Pretrain/Loss (Raw)": 2.068765640258789, "Pretrain/Step": 8761, "Pretrain/Step Time": 8.524546593427658} +{"Pretrain/Learning Rate": 8.608500320460899e-07, "Pretrain/Loss": 1.9972772598266602, "Pretrain/Loss (Raw)": 1.810411810874939, "Pretrain/Step": 8762, "Pretrain/Step Time": 8.5251091606915} +{"Pretrain/Learning Rate": 8.586427136830555e-07, "Pretrain/Loss": 1.9986406564712524, "Pretrain/Loss (Raw)": 2.102602481842041, "Pretrain/Step": 8763, "Pretrain/Step Time": 8.519718805328012} +{"Pretrain/Learning Rate": 8.564381794151033e-07, "Pretrain/Loss": 2.0004115104675293, "Pretrain/Loss (Raw)": 2.131322145462036, "Pretrain/Step": 8764, "Pretrain/Step Time": 8.51670690625906} +{"Pretrain/Learning Rate": 8.542364294964633e-07, "Pretrain/Loss": 1.9993340969085693, "Pretrain/Loss (Raw)": 2.0028510093688965, "Pretrain/Step": 8765, "Pretrain/Step Time": 8.518380742520094} +{"Pretrain/Learning Rate": 8.52037464181063e-07, "Pretrain/Loss": 1.9959330558776855, "Pretrain/Loss (Raw)": 2.0411581993103027, "Pretrain/Step": 8766, "Pretrain/Step Time": 8.515324339270592} +{"Pretrain/Learning Rate": 8.498412837224884e-07, "Pretrain/Loss": 1.995084524154663, "Pretrain/Loss (Raw)": 1.8370968103408813, "Pretrain/Step": 8767, "Pretrain/Step Time": 8.5171550065279} +{"Pretrain/Learning Rate": 8.476478883740175e-07, "Pretrain/Loss": 1.9972882270812988, "Pretrain/Loss (Raw)": 2.434783935546875, "Pretrain/Step": 8768, "Pretrain/Step Time": 8.520126825198531} +{"Pretrain/Learning Rate": 8.454572783885978e-07, "Pretrain/Loss": 1.9956865310668945, "Pretrain/Loss (Raw)": 1.8092317581176758, "Pretrain/Step": 8769, "Pretrain/Step Time": 8.51634168997407} +{"Pretrain/Learning Rate": 8.43269454018869e-07, "Pretrain/Loss": 1.9976788759231567, "Pretrain/Loss (Raw)": 2.0381054878234863, "Pretrain/Step": 8770, "Pretrain/Step Time": 8.51692909002304} +{"Pretrain/Learning Rate": 8.410844155171376e-07, "Pretrain/Loss": 1.9993382692337036, "Pretrain/Loss (Raw)": 2.0974061489105225, "Pretrain/Step": 8771, "Pretrain/Step Time": 8.519222795963287} +{"Pretrain/Learning Rate": 8.389021631353911e-07, "Pretrain/Loss": 1.9982175827026367, "Pretrain/Loss (Raw)": 1.97246515750885, "Pretrain/Step": 8772, "Pretrain/Step Time": 8.5196065697819} +{"Pretrain/Learning Rate": 8.367226971252945e-07, "Pretrain/Loss": 2.003758192062378, "Pretrain/Loss (Raw)": 2.1492714881896973, "Pretrain/Step": 8773, "Pretrain/Step Time": 8.525108622387052} +{"Pretrain/Learning Rate": 8.345460177381998e-07, "Pretrain/Loss": 2.0096402168273926, "Pretrain/Loss (Raw)": 2.6757590770721436, "Pretrain/Step": 8774, "Pretrain/Step Time": 8.52770483493805} +{"Pretrain/Learning Rate": 8.323721252251309e-07, "Pretrain/Loss": 2.009983777999878, "Pretrain/Loss (Raw)": 2.049006938934326, "Pretrain/Step": 8775, "Pretrain/Step Time": 8.52059075050056} +{"Pretrain/Learning Rate": 8.302010198367904e-07, "Pretrain/Loss": 2.009639263153076, "Pretrain/Loss (Raw)": 1.8552570343017578, "Pretrain/Step": 8776, "Pretrain/Step Time": 8.51954042352736} +{"Pretrain/Learning Rate": 8.280327018235556e-07, "Pretrain/Loss": 2.0071661472320557, "Pretrain/Loss (Raw)": 1.820513129234314, "Pretrain/Step": 8777, "Pretrain/Step Time": 8.51613213121891} +{"Pretrain/Learning Rate": 8.258671714354987e-07, "Pretrain/Loss": 2.006645441055298, "Pretrain/Loss (Raw)": 2.001444101333618, "Pretrain/Step": 8778, "Pretrain/Step Time": 8.518485829234123} +{"Pretrain/Learning Rate": 8.23704428922345e-07, "Pretrain/Loss": 2.0047965049743652, "Pretrain/Loss (Raw)": 1.7574927806854248, "Pretrain/Step": 8779, "Pretrain/Step Time": 8.525723662227392} +{"Pretrain/Learning Rate": 8.215444745335227e-07, "Pretrain/Loss": 2.002537727355957, "Pretrain/Loss (Raw)": 1.7811707258224487, "Pretrain/Step": 8780, "Pretrain/Step Time": 8.5280392896384} +{"Pretrain/Learning Rate": 8.193873085181214e-07, "Pretrain/Loss": 2.002978563308716, "Pretrain/Loss (Raw)": 2.030974864959717, "Pretrain/Step": 8781, "Pretrain/Step Time": 8.525188067927957} +{"Pretrain/Learning Rate": 8.172329311249255e-07, "Pretrain/Loss": 2.0010814666748047, "Pretrain/Loss (Raw)": 1.7216383218765259, "Pretrain/Step": 8782, "Pretrain/Step Time": 8.52532004378736} +{"Pretrain/Learning Rate": 8.150813426023751e-07, "Pretrain/Loss": 2.002356767654419, "Pretrain/Loss (Raw)": 2.250887155532837, "Pretrain/Step": 8783, "Pretrain/Step Time": 8.511056620627642} +{"Pretrain/Learning Rate": 8.129325431986079e-07, "Pretrain/Loss": 2.0030479431152344, "Pretrain/Loss (Raw)": 1.9751837253570557, "Pretrain/Step": 8784, "Pretrain/Step Time": 8.508391965180635} +{"Pretrain/Learning Rate": 8.107865331614339e-07, "Pretrain/Loss": 2.0012741088867188, "Pretrain/Loss (Raw)": 1.8861140012741089, "Pretrain/Step": 8785, "Pretrain/Step Time": 8.51170052587986} +{"Pretrain/Learning Rate": 8.086433127383413e-07, "Pretrain/Loss": 2.0022482872009277, "Pretrain/Loss (Raw)": 2.1135382652282715, "Pretrain/Step": 8786, "Pretrain/Step Time": 8.517325071617961} +{"Pretrain/Learning Rate": 8.065028821764909e-07, "Pretrain/Loss": 2.000232219696045, "Pretrain/Loss (Raw)": 1.8595539331436157, "Pretrain/Step": 8787, "Pretrain/Step Time": 8.518407233059406} +{"Pretrain/Learning Rate": 8.043652417227349e-07, "Pretrain/Loss": 1.9992403984069824, "Pretrain/Loss (Raw)": 1.8783458471298218, "Pretrain/Step": 8788, "Pretrain/Step Time": 8.512147642672062} +{"Pretrain/Learning Rate": 8.022303916235929e-07, "Pretrain/Loss": 1.9997174739837646, "Pretrain/Loss (Raw)": 2.1140058040618896, "Pretrain/Step": 8789, "Pretrain/Step Time": 8.508610574528575} +{"Pretrain/Learning Rate": 8.000983321252681e-07, "Pretrain/Loss": 2.000431776046753, "Pretrain/Loss (Raw)": 1.9156293869018555, "Pretrain/Step": 8790, "Pretrain/Step Time": 8.51077626645565} +{"Pretrain/Learning Rate": 7.979690634736304e-07, "Pretrain/Loss": 2.0017809867858887, "Pretrain/Loss (Raw)": 2.0501742362976074, "Pretrain/Step": 8791, "Pretrain/Step Time": 8.519612077623606} +{"Pretrain/Learning Rate": 7.958425859142498e-07, "Pretrain/Loss": 2.001551628112793, "Pretrain/Loss (Raw)": 1.9773457050323486, "Pretrain/Step": 8792, "Pretrain/Step Time": 8.524611221626401} +{"Pretrain/Learning Rate": 7.937188996923556e-07, "Pretrain/Loss": 2.0025222301483154, "Pretrain/Loss (Raw)": 2.185731887817383, "Pretrain/Step": 8793, "Pretrain/Step Time": 8.515205977484584} +{"Pretrain/Learning Rate": 7.915980050528599e-07, "Pretrain/Loss": 2.0015134811401367, "Pretrain/Loss (Raw)": 2.0333807468414307, "Pretrain/Step": 8794, "Pretrain/Step Time": 8.510707193985581} +{"Pretrain/Learning Rate": 7.894799022403532e-07, "Pretrain/Loss": 2.001826047897339, "Pretrain/Loss (Raw)": 2.040313243865967, "Pretrain/Step": 8795, "Pretrain/Step Time": 8.504414159804583} +{"Pretrain/Learning Rate": 7.873645914991123e-07, "Pretrain/Loss": 2.000999927520752, "Pretrain/Loss (Raw)": 1.9395581483840942, "Pretrain/Step": 8796, "Pretrain/Step Time": 8.5092095695436} +{"Pretrain/Learning Rate": 7.852520730730812e-07, "Pretrain/Loss": 2.000657558441162, "Pretrain/Loss (Raw)": 2.0705690383911133, "Pretrain/Step": 8797, "Pretrain/Step Time": 8.51396113075316} +{"Pretrain/Learning Rate": 7.831423472058785e-07, "Pretrain/Loss": 1.9999475479125977, "Pretrain/Loss (Raw)": 1.9591212272644043, "Pretrain/Step": 8798, "Pretrain/Step Time": 8.515372928231955} +{"Pretrain/Learning Rate": 7.810354141408211e-07, "Pretrain/Loss": 1.9994192123413086, "Pretrain/Loss (Raw)": 1.9675030708312988, "Pretrain/Step": 8799, "Pretrain/Step Time": 8.511577166616917} +{"Pretrain/Learning Rate": 7.789312741208809e-07, "Pretrain/Loss": 1.9986032247543335, "Pretrain/Loss (Raw)": 1.8699413537979126, "Pretrain/Step": 8800, "Pretrain/Step Time": 8.50745259411633} +{"Pretrain/Learning Rate": 7.768299273887198e-07, "Pretrain/Loss": 1.9988832473754883, "Pretrain/Loss (Raw)": 2.145026922225952, "Pretrain/Step": 8801, "Pretrain/Step Time": 8.510464707389474} +{"Pretrain/Learning Rate": 7.747313741866713e-07, "Pretrain/Loss": 1.9951940774917603, "Pretrain/Loss (Raw)": 1.7235335111618042, "Pretrain/Step": 8802, "Pretrain/Step Time": 8.510657967999578} +{"Pretrain/Learning Rate": 7.726356147567559e-07, "Pretrain/Loss": 1.995163083076477, "Pretrain/Loss (Raw)": 2.05838942527771, "Pretrain/Step": 8803, "Pretrain/Step Time": 8.510586511343718} +{"Pretrain/Learning Rate": 7.705426493406665e-07, "Pretrain/Loss": 1.9951426982879639, "Pretrain/Loss (Raw)": 1.996118187904358, "Pretrain/Step": 8804, "Pretrain/Step Time": 8.508563075214624} +{"Pretrain/Learning Rate": 7.684524781797708e-07, "Pretrain/Loss": 1.9974963665008545, "Pretrain/Loss (Raw)": 2.220942258834839, "Pretrain/Step": 8805, "Pretrain/Step Time": 8.505349777638912} +{"Pretrain/Learning Rate": 7.663651015151152e-07, "Pretrain/Loss": 1.9998939037322998, "Pretrain/Loss (Raw)": 2.3078625202178955, "Pretrain/Step": 8806, "Pretrain/Step Time": 8.50641711615026} +{"Pretrain/Learning Rate": 7.64280519587432e-07, "Pretrain/Loss": 1.9986196756362915, "Pretrain/Loss (Raw)": 1.8618265390396118, "Pretrain/Step": 8807, "Pretrain/Step Time": 8.512100525200367} +{"Pretrain/Learning Rate": 7.621987326371205e-07, "Pretrain/Loss": 2.0000967979431152, "Pretrain/Loss (Raw)": 2.100324869155884, "Pretrain/Step": 8808, "Pretrain/Step Time": 8.514105958864093} +{"Pretrain/Learning Rate": 7.601197409042665e-07, "Pretrain/Loss": 1.9990581274032593, "Pretrain/Loss (Raw)": 1.9765127897262573, "Pretrain/Step": 8809, "Pretrain/Step Time": 8.513441246002913} +{"Pretrain/Learning Rate": 7.5804354462862e-07, "Pretrain/Loss": 1.998988151550293, "Pretrain/Loss (Raw)": 2.042309284210205, "Pretrain/Step": 8810, "Pretrain/Step Time": 8.51400332711637} +{"Pretrain/Learning Rate": 7.55970144049628e-07, "Pretrain/Loss": 2.0000786781311035, "Pretrain/Loss (Raw)": 1.9874346256256104, "Pretrain/Step": 8811, "Pretrain/Step Time": 8.506522903218865} +{"Pretrain/Learning Rate": 7.538995394063996e-07, "Pretrain/Loss": 1.9997090101242065, "Pretrain/Loss (Raw)": 1.9976286888122559, "Pretrain/Step": 8812, "Pretrain/Step Time": 8.506819974631071} +{"Pretrain/Learning Rate": 7.518317309377298e-07, "Pretrain/Loss": 1.9978060722351074, "Pretrain/Loss (Raw)": 1.873834252357483, "Pretrain/Step": 8813, "Pretrain/Step Time": 8.505759987980127} +{"Pretrain/Learning Rate": 7.497667188820834e-07, "Pretrain/Loss": 1.9933996200561523, "Pretrain/Loss (Raw)": 1.9254051446914673, "Pretrain/Step": 8814, "Pretrain/Step Time": 8.507832136005163} +{"Pretrain/Learning Rate": 7.477045034776087e-07, "Pretrain/Loss": 1.9929680824279785, "Pretrain/Loss (Raw)": 1.9574618339538574, "Pretrain/Step": 8815, "Pretrain/Step Time": 8.51231841929257} +{"Pretrain/Learning Rate": 7.45645084962135e-07, "Pretrain/Loss": 1.9946707487106323, "Pretrain/Loss (Raw)": 2.0479166507720947, "Pretrain/Step": 8816, "Pretrain/Step Time": 8.5115247964859} +{"Pretrain/Learning Rate": 7.435884635731582e-07, "Pretrain/Loss": 1.9969964027404785, "Pretrain/Loss (Raw)": 2.065462112426758, "Pretrain/Step": 8817, "Pretrain/Step Time": 8.510780099779367} +{"Pretrain/Learning Rate": 7.415346395478584e-07, "Pretrain/Loss": 1.998891830444336, "Pretrain/Loss (Raw)": 2.0866880416870117, "Pretrain/Step": 8818, "Pretrain/Step Time": 8.505378391593695} +{"Pretrain/Learning Rate": 7.394836131230987e-07, "Pretrain/Loss": 1.9986157417297363, "Pretrain/Loss (Raw)": 1.6419501304626465, "Pretrain/Step": 8819, "Pretrain/Step Time": 8.507206721231341} +{"Pretrain/Learning Rate": 7.37435384535401e-07, "Pretrain/Loss": 2.000089168548584, "Pretrain/Loss (Raw)": 2.20534086227417, "Pretrain/Step": 8820, "Pretrain/Step Time": 8.512518625706434} +{"Pretrain/Learning Rate": 7.353899540209902e-07, "Pretrain/Loss": 1.999272108078003, "Pretrain/Loss (Raw)": 1.927335500717163, "Pretrain/Step": 8821, "Pretrain/Step Time": 8.517496479675174} +{"Pretrain/Learning Rate": 7.333473218157416e-07, "Pretrain/Loss": 1.9985864162445068, "Pretrain/Loss (Raw)": 2.039287567138672, "Pretrain/Step": 8822, "Pretrain/Step Time": 8.514313116669655} +{"Pretrain/Learning Rate": 7.313074881552362e-07, "Pretrain/Loss": 2.005599021911621, "Pretrain/Loss (Raw)": 2.5670831203460693, "Pretrain/Step": 8823, "Pretrain/Step Time": 8.503322262316942} +{"Pretrain/Learning Rate": 7.292704532747024e-07, "Pretrain/Loss": 2.0061850547790527, "Pretrain/Loss (Raw)": 2.0832021236419678, "Pretrain/Step": 8824, "Pretrain/Step Time": 8.503844326362014} +{"Pretrain/Learning Rate": 7.272362174090691e-07, "Pretrain/Loss": 2.005409002304077, "Pretrain/Loss (Raw)": 1.845525860786438, "Pretrain/Step": 8825, "Pretrain/Step Time": 8.510284408926964} +{"Pretrain/Learning Rate": 7.252047807929347e-07, "Pretrain/Loss": 2.005230188369751, "Pretrain/Loss (Raw)": 1.9482184648513794, "Pretrain/Step": 8826, "Pretrain/Step Time": 8.512077508494258} +{"Pretrain/Learning Rate": 7.2317614366057e-07, "Pretrain/Loss": 2.004948616027832, "Pretrain/Loss (Raw)": 1.943704605102539, "Pretrain/Step": 8827, "Pretrain/Step Time": 8.50989786349237} +{"Pretrain/Learning Rate": 7.211503062459268e-07, "Pretrain/Loss": 2.0021958351135254, "Pretrain/Loss (Raw)": 1.8268232345581055, "Pretrain/Step": 8828, "Pretrain/Step Time": 8.518888395279646} +{"Pretrain/Learning Rate": 7.191272687826378e-07, "Pretrain/Loss": 2.001476526260376, "Pretrain/Loss (Raw)": 1.9578144550323486, "Pretrain/Step": 8829, "Pretrain/Step Time": 8.513119058683515} +{"Pretrain/Learning Rate": 7.17107031504008e-07, "Pretrain/Loss": 2.000734329223633, "Pretrain/Loss (Raw)": 1.9017051458358765, "Pretrain/Step": 8830, "Pretrain/Step Time": 8.508381189778447} +{"Pretrain/Learning Rate": 7.150895946430203e-07, "Pretrain/Loss": 2.0005128383636475, "Pretrain/Loss (Raw)": 2.0051512718200684, "Pretrain/Step": 8831, "Pretrain/Step Time": 8.5065513048321} +{"Pretrain/Learning Rate": 7.130749584323304e-07, "Pretrain/Loss": 1.998966932296753, "Pretrain/Loss (Raw)": 1.9857532978057861, "Pretrain/Step": 8832, "Pretrain/Step Time": 8.51375731267035} +{"Pretrain/Learning Rate": 7.110631231042858e-07, "Pretrain/Loss": 1.9984409809112549, "Pretrain/Loss (Raw)": 1.8707265853881836, "Pretrain/Step": 8833, "Pretrain/Step Time": 8.51889955252409} +{"Pretrain/Learning Rate": 7.090540888908925e-07, "Pretrain/Loss": 1.9983229637145996, "Pretrain/Loss (Raw)": 2.191226005554199, "Pretrain/Step": 8834, "Pretrain/Step Time": 8.516228908672929} +{"Pretrain/Learning Rate": 7.070478560238458e-07, "Pretrain/Loss": 1.9974663257598877, "Pretrain/Loss (Raw)": 1.979638934135437, "Pretrain/Step": 8835, "Pretrain/Step Time": 8.50444171205163} +{"Pretrain/Learning Rate": 7.050444247345078e-07, "Pretrain/Loss": 1.9942994117736816, "Pretrain/Loss (Raw)": 2.0503780841827393, "Pretrain/Step": 8836, "Pretrain/Step Time": 8.50378223694861} +{"Pretrain/Learning Rate": 7.030437952539326e-07, "Pretrain/Loss": 1.9942327737808228, "Pretrain/Loss (Raw)": 2.017228603363037, "Pretrain/Step": 8837, "Pretrain/Step Time": 8.507643323391676} +{"Pretrain/Learning Rate": 7.010459678128384e-07, "Pretrain/Loss": 1.9923983812332153, "Pretrain/Loss (Raw)": 1.7031365633010864, "Pretrain/Step": 8838, "Pretrain/Step Time": 8.51678590849042} +{"Pretrain/Learning Rate": 6.990509426416186e-07, "Pretrain/Loss": 1.993497610092163, "Pretrain/Loss (Raw)": 2.265239715576172, "Pretrain/Step": 8839, "Pretrain/Step Time": 8.522239301353693} +{"Pretrain/Learning Rate": 6.970587199703588e-07, "Pretrain/Loss": 1.9950069189071655, "Pretrain/Loss (Raw)": 2.059180498123169, "Pretrain/Step": 8840, "Pretrain/Step Time": 8.521236447617412} +{"Pretrain/Learning Rate": 6.950693000288055e-07, "Pretrain/Loss": 1.99405837059021, "Pretrain/Loss (Raw)": 2.0805585384368896, "Pretrain/Step": 8841, "Pretrain/Step Time": 8.505734553560615} +{"Pretrain/Learning Rate": 6.930826830463922e-07, "Pretrain/Loss": 1.9940273761749268, "Pretrain/Loss (Raw)": 1.991916537284851, "Pretrain/Step": 8842, "Pretrain/Step Time": 8.505587568506598} +{"Pretrain/Learning Rate": 6.910988692522158e-07, "Pretrain/Loss": 1.9945597648620605, "Pretrain/Loss (Raw)": 2.047020435333252, "Pretrain/Step": 8843, "Pretrain/Step Time": 8.509806521236897} +{"Pretrain/Learning Rate": 6.891178588750686e-07, "Pretrain/Loss": 1.9943920373916626, "Pretrain/Loss (Raw)": 1.911591649055481, "Pretrain/Step": 8844, "Pretrain/Step Time": 8.516726793721318} +{"Pretrain/Learning Rate": 6.871396521434065e-07, "Pretrain/Loss": 1.9933243989944458, "Pretrain/Loss (Raw)": 1.964156985282898, "Pretrain/Step": 8845, "Pretrain/Step Time": 8.524409551173449} +{"Pretrain/Learning Rate": 6.851642492853666e-07, "Pretrain/Loss": 1.9924784898757935, "Pretrain/Loss (Raw)": 1.9438670873641968, "Pretrain/Step": 8846, "Pretrain/Step Time": 8.516843168064952} +{"Pretrain/Learning Rate": 6.831916505287555e-07, "Pretrain/Loss": 1.9901328086853027, "Pretrain/Loss (Raw)": 1.9002810716629028, "Pretrain/Step": 8847, "Pretrain/Step Time": 8.515483455732465} +{"Pretrain/Learning Rate": 6.812218561010719e-07, "Pretrain/Loss": 1.9915835857391357, "Pretrain/Loss (Raw)": 2.0935707092285156, "Pretrain/Step": 8848, "Pretrain/Step Time": 8.510771498084068} +{"Pretrain/Learning Rate": 6.792548662294785e-07, "Pretrain/Loss": 1.9934803247451782, "Pretrain/Loss (Raw)": 2.1180360317230225, "Pretrain/Step": 8849, "Pretrain/Step Time": 8.516738468781114} +{"Pretrain/Learning Rate": 6.772906811408159e-07, "Pretrain/Loss": 1.994403600692749, "Pretrain/Loss (Raw)": 2.0269253253936768, "Pretrain/Step": 8850, "Pretrain/Step Time": 8.516819661483169} +{"Pretrain/Learning Rate": 6.75329301061603e-07, "Pretrain/Loss": 1.9952433109283447, "Pretrain/Loss (Raw)": 2.119020462036133, "Pretrain/Step": 8851, "Pretrain/Step Time": 8.517521338537335} +{"Pretrain/Learning Rate": 6.733707262180394e-07, "Pretrain/Loss": 1.9929301738739014, "Pretrain/Loss (Raw)": 1.8781119585037231, "Pretrain/Step": 8852, "Pretrain/Step Time": 8.512729469686747} +{"Pretrain/Learning Rate": 6.714149568359945e-07, "Pretrain/Loss": 1.9938111305236816, "Pretrain/Loss (Raw)": 2.148348808288574, "Pretrain/Step": 8853, "Pretrain/Step Time": 8.511317119002342} +{"Pretrain/Learning Rate": 6.694619931410156e-07, "Pretrain/Loss": 1.9949861764907837, "Pretrain/Loss (Raw)": 2.040957450866699, "Pretrain/Step": 8854, "Pretrain/Step Time": 8.512061592191458} +{"Pretrain/Learning Rate": 6.675118353583254e-07, "Pretrain/Loss": 1.993285894393921, "Pretrain/Loss (Raw)": 2.055335760116577, "Pretrain/Step": 8855, "Pretrain/Step Time": 8.517806814983487} +{"Pretrain/Learning Rate": 6.655644837128328e-07, "Pretrain/Loss": 1.9935686588287354, "Pretrain/Loss (Raw)": 2.0459470748901367, "Pretrain/Step": 8856, "Pretrain/Step Time": 8.518217904493213} +{"Pretrain/Learning Rate": 6.636199384291137e-07, "Pretrain/Loss": 1.992551326751709, "Pretrain/Loss (Raw)": 1.9359149932861328, "Pretrain/Step": 8857, "Pretrain/Step Time": 8.517964920029044} +{"Pretrain/Learning Rate": 6.616781997314164e-07, "Pretrain/Loss": 1.995438575744629, "Pretrain/Loss (Raw)": 2.2531487941741943, "Pretrain/Step": 8858, "Pretrain/Step Time": 8.51167225651443} +{"Pretrain/Learning Rate": 6.597392678436731e-07, "Pretrain/Loss": 1.9966654777526855, "Pretrain/Loss (Raw)": 2.0479204654693604, "Pretrain/Step": 8859, "Pretrain/Step Time": 8.509512575343251} +{"Pretrain/Learning Rate": 6.578031429894993e-07, "Pretrain/Loss": 1.9973245859146118, "Pretrain/Loss (Raw)": 1.921455979347229, "Pretrain/Step": 8860, "Pretrain/Step Time": 8.506168156862259} +{"Pretrain/Learning Rate": 6.558698253921664e-07, "Pretrain/Loss": 1.9982163906097412, "Pretrain/Loss (Raw)": 2.040472984313965, "Pretrain/Step": 8861, "Pretrain/Step Time": 8.50974634476006} +{"Pretrain/Learning Rate": 6.539393152746404e-07, "Pretrain/Loss": 2.000243663787842, "Pretrain/Loss (Raw)": 2.2592790126800537, "Pretrain/Step": 8862, "Pretrain/Step Time": 8.510902816429734} +{"Pretrain/Learning Rate": 6.520116128595516e-07, "Pretrain/Loss": 2.0017805099487305, "Pretrain/Loss (Raw)": 2.212693929672241, "Pretrain/Step": 8863, "Pretrain/Step Time": 8.513779105618596} +{"Pretrain/Learning Rate": 6.500867183692195e-07, "Pretrain/Loss": 1.9981002807617188, "Pretrain/Loss (Raw)": 1.8853042125701904, "Pretrain/Step": 8864, "Pretrain/Step Time": 8.51398585177958} +{"Pretrain/Learning Rate": 6.481646320256246e-07, "Pretrain/Loss": 1.9984440803527832, "Pretrain/Loss (Raw)": 1.9563945531845093, "Pretrain/Step": 8865, "Pretrain/Step Time": 8.505277633666992} +{"Pretrain/Learning Rate": 6.462453540504343e-07, "Pretrain/Loss": 1.9962711334228516, "Pretrain/Loss (Raw)": 1.5906952619552612, "Pretrain/Step": 8866, "Pretrain/Step Time": 8.51027956046164} +{"Pretrain/Learning Rate": 6.443288846649881e-07, "Pretrain/Loss": 1.9979848861694336, "Pretrain/Loss (Raw)": 2.115584373474121, "Pretrain/Step": 8867, "Pretrain/Step Time": 8.507746819406748} +{"Pretrain/Learning Rate": 6.424152240903065e-07, "Pretrain/Loss": 1.9986884593963623, "Pretrain/Loss (Raw)": 2.1277902126312256, "Pretrain/Step": 8868, "Pretrain/Step Time": 8.512580469250679} +{"Pretrain/Learning Rate": 6.405043725470738e-07, "Pretrain/Loss": 2.001220464706421, "Pretrain/Loss (Raw)": 2.2142996788024902, "Pretrain/Step": 8869, "Pretrain/Step Time": 8.514998881146312} +{"Pretrain/Learning Rate": 6.385963302556641e-07, "Pretrain/Loss": 2.002955198287964, "Pretrain/Loss (Raw)": 2.123908042907715, "Pretrain/Step": 8870, "Pretrain/Step Time": 8.50930024124682} +{"Pretrain/Learning Rate": 6.366910974361206e-07, "Pretrain/Loss": 2.001039505004883, "Pretrain/Loss (Raw)": 2.1176087856292725, "Pretrain/Step": 8871, "Pretrain/Step Time": 8.500604724511504} +{"Pretrain/Learning Rate": 6.347886743081649e-07, "Pretrain/Loss": 1.9987560510635376, "Pretrain/Loss (Raw)": 1.8811732530593872, "Pretrain/Step": 8872, "Pretrain/Step Time": 8.49966018088162} +{"Pretrain/Learning Rate": 6.328890610911881e-07, "Pretrain/Loss": 1.99818754196167, "Pretrain/Loss (Raw)": 2.0706958770751953, "Pretrain/Step": 8873, "Pretrain/Step Time": 8.503854680806398} +{"Pretrain/Learning Rate": 6.309922580042676e-07, "Pretrain/Loss": 1.9976195096969604, "Pretrain/Loss (Raw)": 2.1257832050323486, "Pretrain/Step": 8874, "Pretrain/Step Time": 8.504556866362691} +{"Pretrain/Learning Rate": 6.290982652661509e-07, "Pretrain/Loss": 1.9964346885681152, "Pretrain/Loss (Raw)": 1.7545496225357056, "Pretrain/Step": 8875, "Pretrain/Step Time": 8.511836281046271} +{"Pretrain/Learning Rate": 6.272070830952631e-07, "Pretrain/Loss": 1.997361183166504, "Pretrain/Loss (Raw)": 1.878786325454712, "Pretrain/Step": 8876, "Pretrain/Step Time": 8.505874687805772} +{"Pretrain/Learning Rate": 6.253187117096992e-07, "Pretrain/Loss": 1.9994268417358398, "Pretrain/Loss (Raw)": 1.9392344951629639, "Pretrain/Step": 8877, "Pretrain/Step Time": 8.498489029705524} +{"Pretrain/Learning Rate": 6.234331513272435e-07, "Pretrain/Loss": 2.0055105686187744, "Pretrain/Loss (Raw)": 1.9476428031921387, "Pretrain/Step": 8878, "Pretrain/Step Time": 8.499754099175334} +{"Pretrain/Learning Rate": 6.215504021653412e-07, "Pretrain/Loss": 2.004784107208252, "Pretrain/Loss (Raw)": 1.9028574228286743, "Pretrain/Step": 8879, "Pretrain/Step Time": 8.504465812817216} +{"Pretrain/Learning Rate": 6.196704644411189e-07, "Pretrain/Loss": 2.0045371055603027, "Pretrain/Loss (Raw)": 2.097517967224121, "Pretrain/Step": 8880, "Pretrain/Step Time": 8.506482139229774} +{"Pretrain/Learning Rate": 6.177933383713835e-07, "Pretrain/Loss": 2.005723476409912, "Pretrain/Loss (Raw)": 2.1428513526916504, "Pretrain/Step": 8881, "Pretrain/Step Time": 8.513241594657302} +{"Pretrain/Learning Rate": 6.159190241726148e-07, "Pretrain/Loss": 2.003204345703125, "Pretrain/Loss (Raw)": 1.5470476150512695, "Pretrain/Step": 8882, "Pretrain/Step Time": 8.511787379160523} +{"Pretrain/Learning Rate": 6.140475220609676e-07, "Pretrain/Loss": 2.0006260871887207, "Pretrain/Loss (Raw)": 1.7126657962799072, "Pretrain/Step": 8883, "Pretrain/Step Time": 8.502330346032977} +{"Pretrain/Learning Rate": 6.121788322522637e-07, "Pretrain/Loss": 2.003876209259033, "Pretrain/Loss (Raw)": 2.269200325012207, "Pretrain/Step": 8884, "Pretrain/Step Time": 8.49905501678586} +{"Pretrain/Learning Rate": 6.103129549620223e-07, "Pretrain/Loss": 2.006831645965576, "Pretrain/Loss (Raw)": 2.371499538421631, "Pretrain/Step": 8885, "Pretrain/Step Time": 8.512813806533813} +{"Pretrain/Learning Rate": 6.084498904054187e-07, "Pretrain/Loss": 2.010830879211426, "Pretrain/Loss (Raw)": 2.1056346893310547, "Pretrain/Step": 8886, "Pretrain/Step Time": 8.51419711112976} +{"Pretrain/Learning Rate": 6.065896387973086e-07, "Pretrain/Loss": 2.00823974609375, "Pretrain/Loss (Raw)": 1.793509840965271, "Pretrain/Step": 8887, "Pretrain/Step Time": 8.513855943456292} +{"Pretrain/Learning Rate": 6.04732200352226e-07, "Pretrain/Loss": 2.0090601444244385, "Pretrain/Loss (Raw)": 1.7849695682525635, "Pretrain/Step": 8888, "Pretrain/Step Time": 8.507429160177708} +{"Pretrain/Learning Rate": 6.028775752843801e-07, "Pretrain/Loss": 2.008405923843384, "Pretrain/Loss (Raw)": 1.9850343465805054, "Pretrain/Step": 8889, "Pretrain/Step Time": 8.50479555875063} +{"Pretrain/Learning Rate": 6.010257638076583e-07, "Pretrain/Loss": 2.009509801864624, "Pretrain/Loss (Raw)": 1.9517067670822144, "Pretrain/Step": 8890, "Pretrain/Step Time": 8.501986606046557} +{"Pretrain/Learning Rate": 5.991767661356145e-07, "Pretrain/Loss": 2.008596181869507, "Pretrain/Loss (Raw)": 1.985662817955017, "Pretrain/Step": 8891, "Pretrain/Step Time": 8.512625580653548} +{"Pretrain/Learning Rate": 5.973305824814867e-07, "Pretrain/Loss": 2.0078835487365723, "Pretrain/Loss (Raw)": 2.040125608444214, "Pretrain/Step": 8892, "Pretrain/Step Time": 8.508222721517086} +{"Pretrain/Learning Rate": 5.954872130581851e-07, "Pretrain/Loss": 2.0076985359191895, "Pretrain/Loss (Raw)": 1.9791450500488281, "Pretrain/Step": 8893, "Pretrain/Step Time": 8.508120907470584} +{"Pretrain/Learning Rate": 5.936466580782979e-07, "Pretrain/Loss": 2.009056568145752, "Pretrain/Loss (Raw)": 2.2149908542633057, "Pretrain/Step": 8894, "Pretrain/Step Time": 8.511609761044383} +{"Pretrain/Learning Rate": 5.918089177540858e-07, "Pretrain/Loss": 2.009780168533325, "Pretrain/Loss (Raw)": 1.9297198057174683, "Pretrain/Step": 8895, "Pretrain/Step Time": 8.508298743516207} +{"Pretrain/Learning Rate": 5.899739922974795e-07, "Pretrain/Loss": 2.006624221801758, "Pretrain/Loss (Raw)": 2.0308032035827637, "Pretrain/Step": 8896, "Pretrain/Step Time": 8.50767682120204} +{"Pretrain/Learning Rate": 5.881418819200985e-07, "Pretrain/Loss": 2.008662700653076, "Pretrain/Loss (Raw)": 2.0701584815979004, "Pretrain/Step": 8897, "Pretrain/Step Time": 8.510734628885984} +{"Pretrain/Learning Rate": 5.863125868332292e-07, "Pretrain/Loss": 2.007981538772583, "Pretrain/Loss (Raw)": 1.950933575630188, "Pretrain/Step": 8898, "Pretrain/Step Time": 8.509593529626727} +{"Pretrain/Learning Rate": 5.844861072478336e-07, "Pretrain/Loss": 2.0046305656433105, "Pretrain/Loss (Raw)": 1.6684576272964478, "Pretrain/Step": 8899, "Pretrain/Step Time": 8.511193534359336} +{"Pretrain/Learning Rate": 5.826624433745486e-07, "Pretrain/Loss": 2.004990816116333, "Pretrain/Loss (Raw)": 2.0186028480529785, "Pretrain/Step": 8900, "Pretrain/Step Time": 8.50568725168705} +{"Pretrain/Learning Rate": 5.808415954236924e-07, "Pretrain/Loss": 2.003798484802246, "Pretrain/Loss (Raw)": 1.9966529607772827, "Pretrain/Step": 8901, "Pretrain/Step Time": 8.50430080294609} +{"Pretrain/Learning Rate": 5.790235636052438e-07, "Pretrain/Loss": 1.9990335702896118, "Pretrain/Loss (Raw)": 2.0658509731292725, "Pretrain/Step": 8902, "Pretrain/Step Time": 8.507174111902714} +{"Pretrain/Learning Rate": 5.772083481288771e-07, "Pretrain/Loss": 1.9973355531692505, "Pretrain/Loss (Raw)": 1.83164381980896, "Pretrain/Step": 8903, "Pretrain/Step Time": 8.507468743249774} +{"Pretrain/Learning Rate": 5.753959492039246e-07, "Pretrain/Loss": 1.9979796409606934, "Pretrain/Loss (Raw)": 1.937700867652893, "Pretrain/Step": 8904, "Pretrain/Step Time": 8.512949092313647} +{"Pretrain/Learning Rate": 5.73586367039411e-07, "Pretrain/Loss": 1.9982235431671143, "Pretrain/Loss (Raw)": 1.8517240285873413, "Pretrain/Step": 8905, "Pretrain/Step Time": 8.514539569616318} +{"Pretrain/Learning Rate": 5.717796018440108e-07, "Pretrain/Loss": 1.9988288879394531, "Pretrain/Loss (Raw)": 2.0789451599121094, "Pretrain/Step": 8906, "Pretrain/Step Time": 8.510353652760386} +{"Pretrain/Learning Rate": 5.69975653826102e-07, "Pretrain/Loss": 2.003880500793457, "Pretrain/Loss (Raw)": 2.4041075706481934, "Pretrain/Step": 8907, "Pretrain/Step Time": 8.506218142807484} +{"Pretrain/Learning Rate": 5.681745231937124e-07, "Pretrain/Loss": 2.003931999206543, "Pretrain/Loss (Raw)": 1.787735939025879, "Pretrain/Step": 8908, "Pretrain/Step Time": 8.506767390295863} +{"Pretrain/Learning Rate": 5.663762101545706e-07, "Pretrain/Loss": 2.005977153778076, "Pretrain/Loss (Raw)": 2.2927517890930176, "Pretrain/Step": 8909, "Pretrain/Step Time": 8.516248909756541} +{"Pretrain/Learning Rate": 5.645807149160548e-07, "Pretrain/Loss": 2.006211519241333, "Pretrain/Loss (Raw)": 1.7516528367996216, "Pretrain/Step": 8910, "Pretrain/Step Time": 8.516284687444568} +{"Pretrain/Learning Rate": 5.627880376852357e-07, "Pretrain/Loss": 2.0050299167633057, "Pretrain/Loss (Raw)": 2.0996475219726562, "Pretrain/Step": 8911, "Pretrain/Step Time": 8.520410154014826} +{"Pretrain/Learning Rate": 5.609981786688534e-07, "Pretrain/Loss": 2.0053677558898926, "Pretrain/Loss (Raw)": 2.0184097290039062, "Pretrain/Step": 8912, "Pretrain/Step Time": 8.514618022367358} +{"Pretrain/Learning Rate": 5.592111380733206e-07, "Pretrain/Loss": 2.0054430961608887, "Pretrain/Loss (Raw)": 1.8957637548446655, "Pretrain/Step": 8913, "Pretrain/Step Time": 8.508998969569802} +{"Pretrain/Learning Rate": 5.574269161047252e-07, "Pretrain/Loss": 2.0039803981781006, "Pretrain/Loss (Raw)": 1.926332950592041, "Pretrain/Step": 8914, "Pretrain/Step Time": 8.50770121999085} +{"Pretrain/Learning Rate": 5.556455129688387e-07, "Pretrain/Loss": 2.005234479904175, "Pretrain/Loss (Raw)": 2.020061731338501, "Pretrain/Step": 8915, "Pretrain/Step Time": 8.509085359051824} +{"Pretrain/Learning Rate": 5.538669288710968e-07, "Pretrain/Loss": 2.0079405307769775, "Pretrain/Loss (Raw)": 2.224722385406494, "Pretrain/Step": 8916, "Pretrain/Step Time": 8.516610819846392} +{"Pretrain/Learning Rate": 5.520911640166132e-07, "Pretrain/Loss": 2.008206605911255, "Pretrain/Loss (Raw)": 2.148061990737915, "Pretrain/Step": 8917, "Pretrain/Step Time": 8.516458993777633} +{"Pretrain/Learning Rate": 5.503182186101796e-07, "Pretrain/Loss": 2.0085644721984863, "Pretrain/Loss (Raw)": 1.9614384174346924, "Pretrain/Step": 8918, "Pretrain/Step Time": 8.511930156499147} +{"Pretrain/Learning Rate": 5.485480928562603e-07, "Pretrain/Loss": 2.007746934890747, "Pretrain/Loss (Raw)": 1.9455310106277466, "Pretrain/Step": 8919, "Pretrain/Step Time": 8.507198747247458} +{"Pretrain/Learning Rate": 5.467807869589919e-07, "Pretrain/Loss": 2.0087180137634277, "Pretrain/Loss (Raw)": 2.1016342639923096, "Pretrain/Step": 8920, "Pretrain/Step Time": 8.507329821586609} +{"Pretrain/Learning Rate": 5.45016301122192e-07, "Pretrain/Loss": 2.0088367462158203, "Pretrain/Loss (Raw)": 2.2009458541870117, "Pretrain/Step": 8921, "Pretrain/Step Time": 8.517523365095258} +{"Pretrain/Learning Rate": 5.432546355493479e-07, "Pretrain/Loss": 2.0090343952178955, "Pretrain/Loss (Raw)": 2.058673858642578, "Pretrain/Step": 8922, "Pretrain/Step Time": 8.519691344350576} +{"Pretrain/Learning Rate": 5.414957904436219e-07, "Pretrain/Loss": 2.009202003479004, "Pretrain/Loss (Raw)": 2.061776876449585, "Pretrain/Step": 8923, "Pretrain/Step Time": 8.524368913844228} +{"Pretrain/Learning Rate": 5.397397660078573e-07, "Pretrain/Loss": 2.0095715522766113, "Pretrain/Loss (Raw)": 1.9868526458740234, "Pretrain/Step": 8924, "Pretrain/Step Time": 8.518212143331766} +{"Pretrain/Learning Rate": 5.37986562444559e-07, "Pretrain/Loss": 2.0101113319396973, "Pretrain/Loss (Raw)": 2.139671802520752, "Pretrain/Step": 8925, "Pretrain/Step Time": 8.511776672676206} +{"Pretrain/Learning Rate": 5.362361799559207e-07, "Pretrain/Loss": 2.0104329586029053, "Pretrain/Loss (Raw)": 2.0002880096435547, "Pretrain/Step": 8926, "Pretrain/Step Time": 8.516046468168497} +{"Pretrain/Learning Rate": 5.344886187438031e-07, "Pretrain/Loss": 2.010928153991699, "Pretrain/Loss (Raw)": 2.0308682918548584, "Pretrain/Step": 8927, "Pretrain/Step Time": 8.522629709914327} +{"Pretrain/Learning Rate": 5.327438790097449e-07, "Pretrain/Loss": 2.012619733810425, "Pretrain/Loss (Raw)": 2.08647084236145, "Pretrain/Step": 8928, "Pretrain/Step Time": 8.524407101795077} +{"Pretrain/Learning Rate": 5.310019609549521e-07, "Pretrain/Loss": 2.01171875, "Pretrain/Loss (Raw)": 2.029731273651123, "Pretrain/Step": 8929, "Pretrain/Step Time": 8.519746067002416} +{"Pretrain/Learning Rate": 5.292628647803194e-07, "Pretrain/Loss": 2.014130115509033, "Pretrain/Loss (Raw)": 2.0321719646453857, "Pretrain/Step": 8930, "Pretrain/Step Time": 8.515692219138145} +{"Pretrain/Learning Rate": 5.27526590686403e-07, "Pretrain/Loss": 2.0141050815582275, "Pretrain/Loss (Raw)": 2.0551702976226807, "Pretrain/Step": 8931, "Pretrain/Step Time": 8.512360634282231} +{"Pretrain/Learning Rate": 5.257931388734344e-07, "Pretrain/Loss": 2.0136845111846924, "Pretrain/Loss (Raw)": 1.9422852993011475, "Pretrain/Step": 8932, "Pretrain/Step Time": 8.517966637387872} +{"Pretrain/Learning Rate": 5.240625095413287e-07, "Pretrain/Loss": 2.010925769805908, "Pretrain/Loss (Raw)": 1.867837905883789, "Pretrain/Step": 8933, "Pretrain/Step Time": 8.51518946327269} +{"Pretrain/Learning Rate": 5.223347028896708e-07, "Pretrain/Loss": 2.0089526176452637, "Pretrain/Loss (Raw)": 2.055280923843384, "Pretrain/Step": 8934, "Pretrain/Step Time": 8.51532094553113} +{"Pretrain/Learning Rate": 5.206097191177151e-07, "Pretrain/Loss": 2.0110127925872803, "Pretrain/Loss (Raw)": 2.1255366802215576, "Pretrain/Step": 8935, "Pretrain/Step Time": 8.510858241468668} +{"Pretrain/Learning Rate": 5.188875584243996e-07, "Pretrain/Loss": 2.009956121444702, "Pretrain/Loss (Raw)": 1.9650667905807495, "Pretrain/Step": 8936, "Pretrain/Step Time": 8.500802742317319} +{"Pretrain/Learning Rate": 5.171682210083268e-07, "Pretrain/Loss": 2.0111730098724365, "Pretrain/Loss (Raw)": 2.132284641265869, "Pretrain/Step": 8937, "Pretrain/Step Time": 8.507286839187145} +{"Pretrain/Learning Rate": 5.15451707067785e-07, "Pretrain/Loss": 2.010291814804077, "Pretrain/Loss (Raw)": 1.9294977188110352, "Pretrain/Step": 8938, "Pretrain/Step Time": 8.513168174773455} +{"Pretrain/Learning Rate": 5.137380168007244e-07, "Pretrain/Loss": 2.008136749267578, "Pretrain/Loss (Raw)": 1.7116169929504395, "Pretrain/Step": 8939, "Pretrain/Step Time": 8.513988008722663} +{"Pretrain/Learning Rate": 5.120271504047813e-07, "Pretrain/Loss": 2.0066092014312744, "Pretrain/Loss (Raw)": 1.8020719289779663, "Pretrain/Step": 8940, "Pretrain/Step Time": 8.51595457084477} +{"Pretrain/Learning Rate": 5.103191080772535e-07, "Pretrain/Loss": 2.005357265472412, "Pretrain/Loss (Raw)": 1.7135804891586304, "Pretrain/Step": 8941, "Pretrain/Step Time": 8.511959057301283} +{"Pretrain/Learning Rate": 5.086138900151333e-07, "Pretrain/Loss": 2.0053694248199463, "Pretrain/Loss (Raw)": 1.927000641822815, "Pretrain/Step": 8942, "Pretrain/Step Time": 8.509741999208927} +{"Pretrain/Learning Rate": 5.069114964150606e-07, "Pretrain/Loss": 2.0057849884033203, "Pretrain/Loss (Raw)": 2.0106279850006104, "Pretrain/Step": 8943, "Pretrain/Step Time": 8.509499678388238} +{"Pretrain/Learning Rate": 5.052119274733702e-07, "Pretrain/Loss": 2.0053539276123047, "Pretrain/Loss (Raw)": 1.9927326440811157, "Pretrain/Step": 8944, "Pretrain/Step Time": 8.517493944615126} +{"Pretrain/Learning Rate": 5.035151833860635e-07, "Pretrain/Loss": 2.004214286804199, "Pretrain/Loss (Raw)": 1.9196172952651978, "Pretrain/Step": 8945, "Pretrain/Step Time": 8.519780788570642} +{"Pretrain/Learning Rate": 5.018212643488202e-07, "Pretrain/Loss": 2.002927780151367, "Pretrain/Loss (Raw)": 1.9219970703125, "Pretrain/Step": 8946, "Pretrain/Step Time": 8.523450626060367} +{"Pretrain/Learning Rate": 5.001301705569838e-07, "Pretrain/Loss": 2.005310297012329, "Pretrain/Loss (Raw)": 1.9469099044799805, "Pretrain/Step": 8947, "Pretrain/Step Time": 8.519599681720138} +{"Pretrain/Learning Rate": 4.984419022055848e-07, "Pretrain/Loss": 2.003657817840576, "Pretrain/Loss (Raw)": 1.993828535079956, "Pretrain/Step": 8948, "Pretrain/Step Time": 8.512924615293741} +{"Pretrain/Learning Rate": 4.967564594893198e-07, "Pretrain/Loss": 2.0044894218444824, "Pretrain/Loss (Raw)": 2.0337941646575928, "Pretrain/Step": 8949, "Pretrain/Step Time": 8.51239774376154} +{"Pretrain/Learning Rate": 4.95073842602567e-07, "Pretrain/Loss": 2.0056276321411133, "Pretrain/Loss (Raw)": 2.1849677562713623, "Pretrain/Step": 8950, "Pretrain/Step Time": 8.51616733521223} +{"Pretrain/Learning Rate": 4.933940517393626e-07, "Pretrain/Loss": 2.002124547958374, "Pretrain/Loss (Raw)": 2.118685245513916, "Pretrain/Step": 8951, "Pretrain/Step Time": 8.519771460443735} +{"Pretrain/Learning Rate": 4.917170870934407e-07, "Pretrain/Loss": 2.001434803009033, "Pretrain/Loss (Raw)": 1.9949308633804321, "Pretrain/Step": 8952, "Pretrain/Step Time": 8.52250374481082} +{"Pretrain/Learning Rate": 4.900429488581909e-07, "Pretrain/Loss": 2.004578113555908, "Pretrain/Loss (Raw)": 2.2478387355804443, "Pretrain/Step": 8953, "Pretrain/Step Time": 8.517305823042989} +{"Pretrain/Learning Rate": 4.883716372266811e-07, "Pretrain/Loss": 2.0049920082092285, "Pretrain/Loss (Raw)": 2.0012009143829346, "Pretrain/Step": 8954, "Pretrain/Step Time": 8.512033462524414} +{"Pretrain/Learning Rate": 4.867031523916571e-07, "Pretrain/Loss": 2.005417823791504, "Pretrain/Loss (Raw)": 1.998240351676941, "Pretrain/Step": 8955, "Pretrain/Step Time": 8.517133720219135} +{"Pretrain/Learning Rate": 4.850374945455344e-07, "Pretrain/Loss": 2.006321907043457, "Pretrain/Loss (Raw)": 1.9425338506698608, "Pretrain/Step": 8956, "Pretrain/Step Time": 8.51894629187882} +{"Pretrain/Learning Rate": 4.833746638804093e-07, "Pretrain/Loss": 2.00651216506958, "Pretrain/Loss (Raw)": 1.9821710586547852, "Pretrain/Step": 8957, "Pretrain/Step Time": 8.516634797677398} +{"Pretrain/Learning Rate": 4.817146605880424e-07, "Pretrain/Loss": 2.0073204040527344, "Pretrain/Loss (Raw)": 2.0051465034484863, "Pretrain/Step": 8958, "Pretrain/Step Time": 8.518889965489507} +{"Pretrain/Learning Rate": 4.800574848598749e-07, "Pretrain/Loss": 2.007354259490967, "Pretrain/Loss (Raw)": 2.0094850063323975, "Pretrain/Step": 8959, "Pretrain/Step Time": 8.520294114947319} +{"Pretrain/Learning Rate": 4.784031368870206e-07, "Pretrain/Loss": 2.0077128410339355, "Pretrain/Loss (Raw)": 2.0316414833068848, "Pretrain/Step": 8960, "Pretrain/Step Time": 8.512987473979592} +{"Pretrain/Learning Rate": 4.7675161686026595e-07, "Pretrain/Loss": 2.0064661502838135, "Pretrain/Loss (Raw)": 1.7111682891845703, "Pretrain/Step": 8961, "Pretrain/Step Time": 8.514261107891798} +{"Pretrain/Learning Rate": 4.751029249700695e-07, "Pretrain/Loss": 2.0065808296203613, "Pretrain/Loss (Raw)": 2.205899715423584, "Pretrain/Step": 8962, "Pretrain/Step Time": 8.521094569936395} +{"Pretrain/Learning Rate": 4.734570614065709e-07, "Pretrain/Loss": 2.006467819213867, "Pretrain/Loss (Raw)": 1.9651906490325928, "Pretrain/Step": 8963, "Pretrain/Step Time": 8.521623525768518} +{"Pretrain/Learning Rate": 4.718140263595794e-07, "Pretrain/Loss": 2.005366802215576, "Pretrain/Loss (Raw)": 1.9094152450561523, "Pretrain/Step": 8964, "Pretrain/Step Time": 8.521981736645103} +{"Pretrain/Learning Rate": 4.701738200185712e-07, "Pretrain/Loss": 2.0069868564605713, "Pretrain/Loss (Raw)": 2.2246129512786865, "Pretrain/Step": 8965, "Pretrain/Step Time": 8.523420426994562} +{"Pretrain/Learning Rate": 4.6853644257270624e-07, "Pretrain/Loss": 2.0113704204559326, "Pretrain/Loss (Raw)": 2.2642416954040527, "Pretrain/Step": 8966, "Pretrain/Step Time": 8.513479037210345} +{"Pretrain/Learning Rate": 4.6690189421081943e-07, "Pretrain/Loss": 2.007939338684082, "Pretrain/Loss (Raw)": 1.8260430097579956, "Pretrain/Step": 8967, "Pretrain/Step Time": 8.508290128782392} +{"Pretrain/Learning Rate": 4.6527017512140723e-07, "Pretrain/Loss": 2.0062379837036133, "Pretrain/Loss (Raw)": 1.841400146484375, "Pretrain/Step": 8968, "Pretrain/Step Time": 8.518048264086246} +{"Pretrain/Learning Rate": 4.6364128549264976e-07, "Pretrain/Loss": 2.0095744132995605, "Pretrain/Loss (Raw)": 2.507625102996826, "Pretrain/Step": 8969, "Pretrain/Step Time": 8.518204595893621} +{"Pretrain/Learning Rate": 4.6201522551239664e-07, "Pretrain/Loss": 2.0092883110046387, "Pretrain/Loss (Raw)": 1.955299735069275, "Pretrain/Step": 8970, "Pretrain/Step Time": 8.519998624920845} +{"Pretrain/Learning Rate": 4.603919953681757e-07, "Pretrain/Loss": 2.0088043212890625, "Pretrain/Loss (Raw)": 1.9850804805755615, "Pretrain/Step": 8971, "Pretrain/Step Time": 8.515094965696335} +{"Pretrain/Learning Rate": 4.587715952471872e-07, "Pretrain/Loss": 2.0096335411071777, "Pretrain/Loss (Raw)": 2.0177159309387207, "Pretrain/Step": 8972, "Pretrain/Step Time": 8.507589189335704} +{"Pretrain/Learning Rate": 4.5715402533629826e-07, "Pretrain/Loss": 2.0085723400115967, "Pretrain/Loss (Raw)": 1.8283393383026123, "Pretrain/Step": 8973, "Pretrain/Step Time": 8.507479567080736} +{"Pretrain/Learning Rate": 4.5553928582205417e-07, "Pretrain/Loss": 2.0077171325683594, "Pretrain/Loss (Raw)": 1.8344110250473022, "Pretrain/Step": 8974, "Pretrain/Step Time": 8.513587461784482} +{"Pretrain/Learning Rate": 4.539273768906782e-07, "Pretrain/Loss": 2.008021831512451, "Pretrain/Loss (Raw)": 1.9392749071121216, "Pretrain/Step": 8975, "Pretrain/Step Time": 8.514075757935643} +{"Pretrain/Learning Rate": 4.523182987280633e-07, "Pretrain/Loss": 2.0079500675201416, "Pretrain/Loss (Raw)": 2.0843753814697266, "Pretrain/Step": 8976, "Pretrain/Step Time": 8.511347409337759} +{"Pretrain/Learning Rate": 4.507120515197749e-07, "Pretrain/Loss": 2.007768392562866, "Pretrain/Loss (Raw)": 2.0947957038879395, "Pretrain/Step": 8977, "Pretrain/Step Time": 8.505067985504866} +{"Pretrain/Learning Rate": 4.49108635451051e-07, "Pretrain/Loss": 2.0084047317504883, "Pretrain/Loss (Raw)": 2.1083528995513916, "Pretrain/Step": 8978, "Pretrain/Step Time": 8.508044810965657} +{"Pretrain/Learning Rate": 4.475080507068102e-07, "Pretrain/Loss": 2.006917953491211, "Pretrain/Loss (Raw)": 1.9287183284759521, "Pretrain/Step": 8979, "Pretrain/Step Time": 8.502911698073149} +{"Pretrain/Learning Rate": 4.4591029747163283e-07, "Pretrain/Loss": 2.0086960792541504, "Pretrain/Loss (Raw)": 2.105706214904785, "Pretrain/Step": 8980, "Pretrain/Step Time": 8.510600414127111} +{"Pretrain/Learning Rate": 4.443153759297852e-07, "Pretrain/Loss": 2.005216121673584, "Pretrain/Loss (Raw)": 1.7029337882995605, "Pretrain/Step": 8981, "Pretrain/Step Time": 8.513426054269075} +{"Pretrain/Learning Rate": 4.427232862651953e-07, "Pretrain/Loss": 2.0055556297302246, "Pretrain/Loss (Raw)": 2.0843961238861084, "Pretrain/Step": 8982, "Pretrain/Step Time": 8.510973237454891} +{"Pretrain/Learning Rate": 4.4113402866147734e-07, "Pretrain/Loss": 2.0065369606018066, "Pretrain/Loss (Raw)": 2.1809425354003906, "Pretrain/Step": 8983, "Pretrain/Step Time": 8.50568343885243} +{"Pretrain/Learning Rate": 4.395476033019069e-07, "Pretrain/Loss": 2.0051932334899902, "Pretrain/Loss (Raw)": 1.8739663362503052, "Pretrain/Step": 8984, "Pretrain/Step Time": 8.507425105199218} +{"Pretrain/Learning Rate": 4.3796401036944043e-07, "Pretrain/Loss": 2.0061464309692383, "Pretrain/Loss (Raw)": 2.0579304695129395, "Pretrain/Step": 8985, "Pretrain/Step Time": 8.520020674914122} +{"Pretrain/Learning Rate": 4.3638325004670135e-07, "Pretrain/Loss": 2.0051305294036865, "Pretrain/Loss (Raw)": 2.123101234436035, "Pretrain/Step": 8986, "Pretrain/Step Time": 8.516299396753311} +{"Pretrain/Learning Rate": 4.3480532251599647e-07, "Pretrain/Loss": 2.0042011737823486, "Pretrain/Loss (Raw)": 1.9289699792861938, "Pretrain/Step": 8987, "Pretrain/Step Time": 8.512505980208516} +{"Pretrain/Learning Rate": 4.3323022795929425e-07, "Pretrain/Loss": 2.004666328430176, "Pretrain/Loss (Raw)": 1.980993628501892, "Pretrain/Step": 8988, "Pretrain/Step Time": 8.512024765834212} +{"Pretrain/Learning Rate": 4.316579665582465e-07, "Pretrain/Loss": 2.004517078399658, "Pretrain/Loss (Raw)": 2.021385908126831, "Pretrain/Step": 8989, "Pretrain/Step Time": 8.506363475695252} +{"Pretrain/Learning Rate": 4.300885384941694e-07, "Pretrain/Loss": 2.002930164337158, "Pretrain/Loss (Raw)": 2.056114673614502, "Pretrain/Step": 8990, "Pretrain/Step Time": 8.505204198881984} +{"Pretrain/Learning Rate": 4.285219439480653e-07, "Pretrain/Loss": 1.999118447303772, "Pretrain/Loss (Raw)": 1.7248008251190186, "Pretrain/Step": 8991, "Pretrain/Step Time": 8.50467960909009} +{"Pretrain/Learning Rate": 4.2695818310058975e-07, "Pretrain/Loss": 1.999403715133667, "Pretrain/Loss (Raw)": 1.921848177909851, "Pretrain/Step": 8992, "Pretrain/Step Time": 8.509469296783209} +{"Pretrain/Learning Rate": 4.253972561320901e-07, "Pretrain/Loss": 2.0006754398345947, "Pretrain/Loss (Raw)": 2.1191651821136475, "Pretrain/Step": 8993, "Pretrain/Step Time": 8.516337199136615} +{"Pretrain/Learning Rate": 4.23839163222578e-07, "Pretrain/Loss": 2.000817060470581, "Pretrain/Loss (Raw)": 1.6088175773620605, "Pretrain/Step": 8994, "Pretrain/Step Time": 8.514166202396154} +{"Pretrain/Learning Rate": 4.222839045517402e-07, "Pretrain/Loss": 2.0000767707824707, "Pretrain/Loss (Raw)": 2.0208280086517334, "Pretrain/Step": 8995, "Pretrain/Step Time": 8.511538330465555} +{"Pretrain/Learning Rate": 4.2073148029893593e-07, "Pretrain/Loss": 1.999456524848938, "Pretrain/Loss (Raw)": 2.048393964767456, "Pretrain/Step": 8996, "Pretrain/Step Time": 8.510374339297414} +{"Pretrain/Learning Rate": 4.191818906431999e-07, "Pretrain/Loss": 1.997213363647461, "Pretrain/Loss (Raw)": 1.9271906614303589, "Pretrain/Step": 8997, "Pretrain/Step Time": 8.510108329355717} +{"Pretrain/Learning Rate": 4.176351357632363e-07, "Pretrain/Loss": 1.9953113794326782, "Pretrain/Loss (Raw)": 1.8804244995117188, "Pretrain/Step": 8998, "Pretrain/Step Time": 8.520182186737657} +{"Pretrain/Learning Rate": 4.160912158374247e-07, "Pretrain/Loss": 1.9950335025787354, "Pretrain/Loss (Raw)": 2.082052230834961, "Pretrain/Step": 8999, "Pretrain/Step Time": 8.51914950273931} +{"Pretrain/Learning Rate": 4.1455013104381714e-07, "Pretrain/Loss": 1.9959990978240967, "Pretrain/Loss (Raw)": 2.004765510559082, "Pretrain/Step": 9000, "Pretrain/Step Time": 8.523909902200103} +{"Pretrain/Learning Rate": 4.1301188156013803e-07, "Pretrain/Loss": 1.995492935180664, "Pretrain/Loss (Raw)": 2.0059235095977783, "Pretrain/Step": 9001, "Pretrain/Step Time": 8.516375517472625} +{"Pretrain/Learning Rate": 4.1147646756378997e-07, "Pretrain/Loss": 1.9926797151565552, "Pretrain/Loss (Raw)": 1.7656890153884888, "Pretrain/Step": 9002, "Pretrain/Step Time": 8.513687308877707} +{"Pretrain/Learning Rate": 4.099438892318369e-07, "Pretrain/Loss": 1.9924709796905518, "Pretrain/Loss (Raw)": 1.7278372049331665, "Pretrain/Step": 9003, "Pretrain/Step Time": 8.510799759998918} +{"Pretrain/Learning Rate": 4.084141467410263e-07, "Pretrain/Loss": 1.992380976676941, "Pretrain/Loss (Raw)": 1.8672455549240112, "Pretrain/Step": 9004, "Pretrain/Step Time": 8.517908124253154} +{"Pretrain/Learning Rate": 4.0688724026777814e-07, "Pretrain/Loss": 1.9921698570251465, "Pretrain/Loss (Raw)": 1.9122391939163208, "Pretrain/Step": 9005, "Pretrain/Step Time": 8.517023403197527} +{"Pretrain/Learning Rate": 4.0536316998817937e-07, "Pretrain/Loss": 1.9943583011627197, "Pretrain/Loss (Raw)": 2.2277345657348633, "Pretrain/Step": 9006, "Pretrain/Step Time": 8.517265053465962} +{"Pretrain/Learning Rate": 4.038419360779921e-07, "Pretrain/Loss": 1.993984580039978, "Pretrain/Loss (Raw)": 1.8550292253494263, "Pretrain/Step": 9007, "Pretrain/Step Time": 8.509578973054886} +{"Pretrain/Learning Rate": 4.023235387126567e-07, "Pretrain/Loss": 1.991950511932373, "Pretrain/Loss (Raw)": 1.8371537923812866, "Pretrain/Step": 9008, "Pretrain/Step Time": 8.507708245888352} +{"Pretrain/Learning Rate": 4.008079780672774e-07, "Pretrain/Loss": 1.9912151098251343, "Pretrain/Loss (Raw)": 2.0487308502197266, "Pretrain/Step": 9009, "Pretrain/Step Time": 8.51073806360364} +{"Pretrain/Learning Rate": 3.992952543166367e-07, "Pretrain/Loss": 1.9966408014297485, "Pretrain/Loss (Raw)": 2.24153208732605, "Pretrain/Step": 9010, "Pretrain/Step Time": 8.509911792352796} +{"Pretrain/Learning Rate": 3.977853676351867e-07, "Pretrain/Loss": 1.995683193206787, "Pretrain/Loss (Raw)": 1.5900943279266357, "Pretrain/Step": 9011, "Pretrain/Step Time": 8.511532187461853} +{"Pretrain/Learning Rate": 3.9627831819706305e-07, "Pretrain/Loss": 1.9939515590667725, "Pretrain/Loss (Raw)": 2.0475471019744873, "Pretrain/Step": 9012, "Pretrain/Step Time": 8.515662167221308} +{"Pretrain/Learning Rate": 3.947741061760574e-07, "Pretrain/Loss": 1.9925036430358887, "Pretrain/Loss (Raw)": 2.186180830001831, "Pretrain/Step": 9013, "Pretrain/Step Time": 8.500593898817897} +{"Pretrain/Learning Rate": 3.932727317456475e-07, "Pretrain/Loss": 1.9913020133972168, "Pretrain/Loss (Raw)": 1.951791524887085, "Pretrain/Step": 9014, "Pretrain/Step Time": 8.499187465757132} +{"Pretrain/Learning Rate": 3.9177419507897274e-07, "Pretrain/Loss": 1.993373155593872, "Pretrain/Loss (Raw)": 2.058638095855713, "Pretrain/Step": 9015, "Pretrain/Step Time": 8.503990560770035} +{"Pretrain/Learning Rate": 3.902784963488587e-07, "Pretrain/Loss": 1.9959542751312256, "Pretrain/Loss (Raw)": 2.115333080291748, "Pretrain/Step": 9016, "Pretrain/Step Time": 8.506086206063628} +{"Pretrain/Learning Rate": 3.887856357277925e-07, "Pretrain/Loss": 1.9973291158676147, "Pretrain/Loss (Raw)": 2.1610262393951416, "Pretrain/Step": 9017, "Pretrain/Step Time": 8.51412794366479} +{"Pretrain/Learning Rate": 3.872956133879391e-07, "Pretrain/Loss": 1.998967170715332, "Pretrain/Loss (Raw)": 2.161395311355591, "Pretrain/Step": 9018, "Pretrain/Step Time": 8.514918996021152} +{"Pretrain/Learning Rate": 3.858084295011333e-07, "Pretrain/Loss": 1.9994666576385498, "Pretrain/Loss (Raw)": 2.049588680267334, "Pretrain/Step": 9019, "Pretrain/Step Time": 8.505793100222945} +{"Pretrain/Learning Rate": 3.843240842388879e-07, "Pretrain/Loss": 1.998291015625, "Pretrain/Loss (Raw)": 1.8896276950836182, "Pretrain/Step": 9020, "Pretrain/Step Time": 8.506623588502407} +{"Pretrain/Learning Rate": 3.8284257777237984e-07, "Pretrain/Loss": 1.998272180557251, "Pretrain/Loss (Raw)": 1.9767472743988037, "Pretrain/Step": 9021, "Pretrain/Step Time": 8.508074821904302} +{"Pretrain/Learning Rate": 3.8136391027246696e-07, "Pretrain/Loss": 1.9976253509521484, "Pretrain/Loss (Raw)": 2.1322014331817627, "Pretrain/Step": 9022, "Pretrain/Step Time": 8.518115229904652} +{"Pretrain/Learning Rate": 3.7988808190967116e-07, "Pretrain/Loss": 1.9992300271987915, "Pretrain/Loss (Raw)": 2.1351115703582764, "Pretrain/Step": 9023, "Pretrain/Step Time": 8.521033439785242} +{"Pretrain/Learning Rate": 3.7841509285420076e-07, "Pretrain/Loss": 2.0049686431884766, "Pretrain/Loss (Raw)": 2.7653274536132812, "Pretrain/Step": 9024, "Pretrain/Step Time": 8.517462825402617} +{"Pretrain/Learning Rate": 3.769449432759198e-07, "Pretrain/Loss": 2.0025553703308105, "Pretrain/Loss (Raw)": 1.7612813711166382, "Pretrain/Step": 9025, "Pretrain/Step Time": 8.517631700262427} +{"Pretrain/Learning Rate": 3.7547763334437603e-07, "Pretrain/Loss": 2.0018796920776367, "Pretrain/Loss (Raw)": 1.864470362663269, "Pretrain/Step": 9026, "Pretrain/Step Time": 8.519362453371286} +{"Pretrain/Learning Rate": 3.740131632287841e-07, "Pretrain/Loss": 2.005148410797119, "Pretrain/Loss (Raw)": 2.0868113040924072, "Pretrain/Step": 9027, "Pretrain/Step Time": 8.522858848795295} +{"Pretrain/Learning Rate": 3.725515330980395e-07, "Pretrain/Loss": 2.0039823055267334, "Pretrain/Loss (Raw)": 1.869346261024475, "Pretrain/Step": 9028, "Pretrain/Step Time": 8.529697259888053} +{"Pretrain/Learning Rate": 3.71092743120699e-07, "Pretrain/Loss": 2.0045933723449707, "Pretrain/Loss (Raw)": 2.0748701095581055, "Pretrain/Step": 9029, "Pretrain/Step Time": 8.528696976602077} +{"Pretrain/Learning Rate": 3.6963679346499746e-07, "Pretrain/Loss": 2.0027663707733154, "Pretrain/Loss (Raw)": 1.8319884538650513, "Pretrain/Step": 9030, "Pretrain/Step Time": 8.522307612001896} +{"Pretrain/Learning Rate": 3.681836842988423e-07, "Pretrain/Loss": 2.0045015811920166, "Pretrain/Loss (Raw)": 2.0537643432617188, "Pretrain/Step": 9031, "Pretrain/Step Time": 8.519286202266812} +{"Pretrain/Learning Rate": 3.6673341578981614e-07, "Pretrain/Loss": 2.004434108734131, "Pretrain/Loss (Raw)": 1.9290709495544434, "Pretrain/Step": 9032, "Pretrain/Step Time": 8.5118179153651} +{"Pretrain/Learning Rate": 3.6528598810516567e-07, "Pretrain/Loss": 2.0051379203796387, "Pretrain/Loss (Raw)": 1.9417825937271118, "Pretrain/Step": 9033, "Pretrain/Step Time": 8.521294118836522} +{"Pretrain/Learning Rate": 3.6384140141181853e-07, "Pretrain/Loss": 2.004361152648926, "Pretrain/Loss (Raw)": 1.9795351028442383, "Pretrain/Step": 9034, "Pretrain/Step Time": 8.526454161852598} +{"Pretrain/Learning Rate": 3.6239965587637203e-07, "Pretrain/Loss": 2.0004255771636963, "Pretrain/Loss (Raw)": 1.9003571271896362, "Pretrain/Step": 9035, "Pretrain/Step Time": 8.529347514733672} +{"Pretrain/Learning Rate": 3.609607516650931e-07, "Pretrain/Loss": 2.001518726348877, "Pretrain/Loss (Raw)": 1.9276466369628906, "Pretrain/Step": 9036, "Pretrain/Step Time": 8.527725430205464} +{"Pretrain/Learning Rate": 3.5952468894392133e-07, "Pretrain/Loss": 1.9987666606903076, "Pretrain/Loss (Raw)": 1.9404903650283813, "Pretrain/Step": 9037, "Pretrain/Step Time": 8.515366610139608} +{"Pretrain/Learning Rate": 3.5809146787847415e-07, "Pretrain/Loss": 2.001821279525757, "Pretrain/Loss (Raw)": 2.1426639556884766, "Pretrain/Step": 9038, "Pretrain/Step Time": 8.51710033789277} +{"Pretrain/Learning Rate": 3.5666108863403327e-07, "Pretrain/Loss": 2.0010807514190674, "Pretrain/Loss (Raw)": 2.0048465728759766, "Pretrain/Step": 9039, "Pretrain/Step Time": 8.517698239535093} +{"Pretrain/Learning Rate": 3.552335513755611e-07, "Pretrain/Loss": 2.001166343688965, "Pretrain/Loss (Raw)": 2.0293474197387695, "Pretrain/Step": 9040, "Pretrain/Step Time": 8.52568811364472} +{"Pretrain/Learning Rate": 3.538088562676817e-07, "Pretrain/Loss": 2.0016932487487793, "Pretrain/Loss (Raw)": 1.963228464126587, "Pretrain/Step": 9041, "Pretrain/Step Time": 8.526378510519862} +{"Pretrain/Learning Rate": 3.523870034747051e-07, "Pretrain/Loss": 2.002419948577881, "Pretrain/Loss (Raw)": 2.019359827041626, "Pretrain/Step": 9042, "Pretrain/Step Time": 8.522120542824268} +{"Pretrain/Learning Rate": 3.50967993160603e-07, "Pretrain/Loss": 2.0029830932617188, "Pretrain/Loss (Raw)": 2.0921239852905273, "Pretrain/Step": 9043, "Pretrain/Step Time": 8.517919456586242} +{"Pretrain/Learning Rate": 3.4955182548901955e-07, "Pretrain/Loss": 2.0015907287597656, "Pretrain/Loss (Raw)": 2.0465011596679688, "Pretrain/Step": 9044, "Pretrain/Step Time": 8.513291290029883} +{"Pretrain/Learning Rate": 3.4813850062327956e-07, "Pretrain/Loss": 2.0001349449157715, "Pretrain/Loss (Raw)": 1.9617151021957397, "Pretrain/Step": 9045, "Pretrain/Step Time": 8.51940525881946} +{"Pretrain/Learning Rate": 3.467280187263694e-07, "Pretrain/Loss": 2.000621795654297, "Pretrain/Loss (Raw)": 2.0237538814544678, "Pretrain/Step": 9046, "Pretrain/Step Time": 8.527855321764946} +{"Pretrain/Learning Rate": 3.4532037996095334e-07, "Pretrain/Loss": 2.001514434814453, "Pretrain/Loss (Raw)": 2.0598154067993164, "Pretrain/Step": 9047, "Pretrain/Step Time": 8.52515054307878} +{"Pretrain/Learning Rate": 3.4391558448936825e-07, "Pretrain/Loss": 2.0020830631256104, "Pretrain/Loss (Raw)": 2.174412488937378, "Pretrain/Step": 9048, "Pretrain/Step Time": 8.522938026115298} +{"Pretrain/Learning Rate": 3.4251363247362054e-07, "Pretrain/Loss": 2.000640392303467, "Pretrain/Loss (Raw)": 2.016279935836792, "Pretrain/Step": 9049, "Pretrain/Step Time": 8.512274168431759} +{"Pretrain/Learning Rate": 3.4111452407539214e-07, "Pretrain/Loss": 2.000655174255371, "Pretrain/Loss (Raw)": 2.0605926513671875, "Pretrain/Step": 9050, "Pretrain/Step Time": 8.515634283423424} +{"Pretrain/Learning Rate": 3.397182594560344e-07, "Pretrain/Loss": 2.0018625259399414, "Pretrain/Loss (Raw)": 2.216294527053833, "Pretrain/Step": 9051, "Pretrain/Step Time": 8.512382727116346} +{"Pretrain/Learning Rate": 3.3832483877656584e-07, "Pretrain/Loss": 2.0011343955993652, "Pretrain/Loss (Raw)": 1.8936669826507568, "Pretrain/Step": 9052, "Pretrain/Step Time": 8.51640398800373} +{"Pretrain/Learning Rate": 3.369342621976884e-07, "Pretrain/Loss": 1.9994432926177979, "Pretrain/Loss (Raw)": 1.9231921434402466, "Pretrain/Step": 9053, "Pretrain/Step Time": 8.52119723521173} +{"Pretrain/Learning Rate": 3.355465298797711e-07, "Pretrain/Loss": 1.998491883277893, "Pretrain/Loss (Raw)": 1.8785170316696167, "Pretrain/Step": 9054, "Pretrain/Step Time": 8.515593944117427} +{"Pretrain/Learning Rate": 3.3416164198284694e-07, "Pretrain/Loss": 1.9972970485687256, "Pretrain/Loss (Raw)": 1.877915859222412, "Pretrain/Step": 9055, "Pretrain/Step Time": 8.506014944985509} +{"Pretrain/Learning Rate": 3.327795986666327e-07, "Pretrain/Loss": 1.9979382753372192, "Pretrain/Loss (Raw)": 2.1685609817504883, "Pretrain/Step": 9056, "Pretrain/Step Time": 8.508766306564212} +{"Pretrain/Learning Rate": 3.3140040009051186e-07, "Pretrain/Loss": 1.9979777336120605, "Pretrain/Loss (Raw)": 2.0347836017608643, "Pretrain/Step": 9057, "Pretrain/Step Time": 8.516288055106997} +{"Pretrain/Learning Rate": 3.300240464135379e-07, "Pretrain/Loss": 1.9987493753433228, "Pretrain/Loss (Raw)": 2.1309361457824707, "Pretrain/Step": 9058, "Pretrain/Step Time": 8.513743486255407} +{"Pretrain/Learning Rate": 3.286505377944393e-07, "Pretrain/Loss": 1.9983015060424805, "Pretrain/Loss (Raw)": 1.997847080230713, "Pretrain/Step": 9059, "Pretrain/Step Time": 8.515446873381734} +{"Pretrain/Learning Rate": 3.2727987439161724e-07, "Pretrain/Loss": 1.9986101388931274, "Pretrain/Loss (Raw)": 1.9817829132080078, "Pretrain/Step": 9060, "Pretrain/Step Time": 8.50687300041318} +{"Pretrain/Learning Rate": 3.2591205636313957e-07, "Pretrain/Loss": 1.9991209506988525, "Pretrain/Loss (Raw)": 1.9332176446914673, "Pretrain/Step": 9061, "Pretrain/Step Time": 8.511775694787502} +{"Pretrain/Learning Rate": 3.2454708386675525e-07, "Pretrain/Loss": 1.99806547164917, "Pretrain/Loss (Raw)": 1.9201877117156982, "Pretrain/Step": 9062, "Pretrain/Step Time": 8.516523994505405} +{"Pretrain/Learning Rate": 3.2318495705987437e-07, "Pretrain/Loss": 1.9978114366531372, "Pretrain/Loss (Raw)": 2.093017101287842, "Pretrain/Step": 9063, "Pretrain/Step Time": 8.520959047600627} +{"Pretrain/Learning Rate": 3.218256760995825e-07, "Pretrain/Loss": 1.9976475238800049, "Pretrain/Loss (Raw)": 1.9440830945968628, "Pretrain/Step": 9064, "Pretrain/Step Time": 8.52313275076449} +{"Pretrain/Learning Rate": 3.20469241142643e-07, "Pretrain/Loss": 1.9964261054992676, "Pretrain/Loss (Raw)": 1.9759384393692017, "Pretrain/Step": 9065, "Pretrain/Step Time": 8.519258445128798} +{"Pretrain/Learning Rate": 3.1911565234548633e-07, "Pretrain/Loss": 1.996852159500122, "Pretrain/Loss (Raw)": 1.9840567111968994, "Pretrain/Step": 9066, "Pretrain/Step Time": 8.51020066998899} +{"Pretrain/Learning Rate": 3.177649098642099e-07, "Pretrain/Loss": 1.9994075298309326, "Pretrain/Loss (Raw)": 2.038698196411133, "Pretrain/Step": 9067, "Pretrain/Step Time": 8.506583325564861} +{"Pretrain/Learning Rate": 3.1641701385459186e-07, "Pretrain/Loss": 2.001161575317383, "Pretrain/Loss (Raw)": 2.02658748626709, "Pretrain/Step": 9068, "Pretrain/Step Time": 8.509735766798258} +{"Pretrain/Learning Rate": 3.150719644720773e-07, "Pretrain/Loss": 2.004347085952759, "Pretrain/Loss (Raw)": 2.121330738067627, "Pretrain/Step": 9069, "Pretrain/Step Time": 8.513134999200702} +{"Pretrain/Learning Rate": 3.1372976187178105e-07, "Pretrain/Loss": 2.006376266479492, "Pretrain/Loss (Raw)": 2.1867103576660156, "Pretrain/Step": 9070, "Pretrain/Step Time": 8.516843823716044} +{"Pretrain/Learning Rate": 3.123904062084959e-07, "Pretrain/Loss": 2.0069756507873535, "Pretrain/Loss (Raw)": 2.0873613357543945, "Pretrain/Step": 9071, "Pretrain/Step Time": 8.511339040473104} +{"Pretrain/Learning Rate": 3.110538976366789e-07, "Pretrain/Loss": 2.006112575531006, "Pretrain/Loss (Raw)": 1.8822606801986694, "Pretrain/Step": 9072, "Pretrain/Step Time": 8.5039415769279} +{"Pretrain/Learning Rate": 3.0972023631046786e-07, "Pretrain/Loss": 2.0080606937408447, "Pretrain/Loss (Raw)": 2.1689772605895996, "Pretrain/Step": 9073, "Pretrain/Step Time": 8.502668373286724} +{"Pretrain/Learning Rate": 3.083894223836592e-07, "Pretrain/Loss": 2.010031223297119, "Pretrain/Loss (Raw)": 2.1742489337921143, "Pretrain/Step": 9074, "Pretrain/Step Time": 8.50581869110465} +{"Pretrain/Learning Rate": 3.070614560097357e-07, "Pretrain/Loss": 2.0107529163360596, "Pretrain/Loss (Raw)": 2.0392661094665527, "Pretrain/Step": 9075, "Pretrain/Step Time": 8.507989620789886} +{"Pretrain/Learning Rate": 3.0573633734184146e-07, "Pretrain/Loss": 2.009272336959839, "Pretrain/Loss (Raw)": 1.804297924041748, "Pretrain/Step": 9076, "Pretrain/Step Time": 8.511627811938524} +{"Pretrain/Learning Rate": 3.044140665327988e-07, "Pretrain/Loss": 2.0091638565063477, "Pretrain/Loss (Raw)": 2.0199263095855713, "Pretrain/Step": 9077, "Pretrain/Step Time": 8.512544635683298} +{"Pretrain/Learning Rate": 3.0309464373509125e-07, "Pretrain/Loss": 2.0089259147644043, "Pretrain/Loss (Raw)": 2.1545205116271973, "Pretrain/Step": 9078, "Pretrain/Step Time": 8.504339888691902} +{"Pretrain/Learning Rate": 3.017780691008859e-07, "Pretrain/Loss": 2.0085113048553467, "Pretrain/Loss (Raw)": 2.0656113624572754, "Pretrain/Step": 9079, "Pretrain/Step Time": 8.499671963974833} +{"Pretrain/Learning Rate": 3.00464342782017e-07, "Pretrain/Loss": 2.009108304977417, "Pretrain/Loss (Raw)": 2.0713348388671875, "Pretrain/Step": 9080, "Pretrain/Step Time": 8.509294161573052} +{"Pretrain/Learning Rate": 2.9915346492998817e-07, "Pretrain/Loss": 2.008812427520752, "Pretrain/Loss (Raw)": 2.2099549770355225, "Pretrain/Step": 9081, "Pretrain/Step Time": 8.507614951580763} +{"Pretrain/Learning Rate": 2.9784543569597314e-07, "Pretrain/Loss": 2.0090584754943848, "Pretrain/Loss (Raw)": 2.032702684402466, "Pretrain/Step": 9082, "Pretrain/Step Time": 8.511481393128633} +{"Pretrain/Learning Rate": 2.9654025523082607e-07, "Pretrain/Loss": 2.0097858905792236, "Pretrain/Loss (Raw)": 2.091360569000244, "Pretrain/Step": 9083, "Pretrain/Step Time": 8.50569219328463} +{"Pretrain/Learning Rate": 2.9523792368506275e-07, "Pretrain/Loss": 2.0084495544433594, "Pretrain/Loss (Raw)": 1.7714669704437256, "Pretrain/Step": 9084, "Pretrain/Step Time": 8.497241059318185} +{"Pretrain/Learning Rate": 2.9393844120887415e-07, "Pretrain/Loss": 2.0099079608917236, "Pretrain/Loss (Raw)": 2.168877124786377, "Pretrain/Step": 9085, "Pretrain/Step Time": 8.501546813175082} +{"Pretrain/Learning Rate": 2.926418079521237e-07, "Pretrain/Loss": 2.0093555450439453, "Pretrain/Loss (Raw)": 1.93441903591156, "Pretrain/Step": 9086, "Pretrain/Step Time": 8.503930043429136} +{"Pretrain/Learning Rate": 2.913480240643446e-07, "Pretrain/Loss": 2.0116236209869385, "Pretrain/Loss (Raw)": 2.2997961044311523, "Pretrain/Step": 9087, "Pretrain/Step Time": 8.506310187280178} +{"Pretrain/Learning Rate": 2.900570896947424e-07, "Pretrain/Loss": 2.010477066040039, "Pretrain/Loss (Raw)": 1.8848663568496704, "Pretrain/Step": 9088, "Pretrain/Step Time": 8.501256808638573} +{"Pretrain/Learning Rate": 2.8876900499219263e-07, "Pretrain/Loss": 2.0125186443328857, "Pretrain/Loss (Raw)": 1.9725227355957031, "Pretrain/Step": 9089, "Pretrain/Step Time": 8.501961782574654} +{"Pretrain/Learning Rate": 2.8748377010524574e-07, "Pretrain/Loss": 2.0111072063446045, "Pretrain/Loss (Raw)": 2.0252368450164795, "Pretrain/Step": 9090, "Pretrain/Step Time": 8.492795500904322} +{"Pretrain/Learning Rate": 2.8620138518211934e-07, "Pretrain/Loss": 2.0099663734436035, "Pretrain/Loss (Raw)": 1.8191674947738647, "Pretrain/Step": 9091, "Pretrain/Step Time": 8.49981133081019} +{"Pretrain/Learning Rate": 2.849218503707035e-07, "Pretrain/Loss": 2.0117104053497314, "Pretrain/Loss (Raw)": 2.132617712020874, "Pretrain/Step": 9092, "Pretrain/Step Time": 8.50066502019763} +{"Pretrain/Learning Rate": 2.836451658185607e-07, "Pretrain/Loss": 2.0096068382263184, "Pretrain/Loss (Raw)": 1.9553695917129517, "Pretrain/Step": 9093, "Pretrain/Step Time": 8.501201277598739} +{"Pretrain/Learning Rate": 2.82371331672926e-07, "Pretrain/Loss": 2.0085511207580566, "Pretrain/Loss (Raw)": 2.1291074752807617, "Pretrain/Step": 9094, "Pretrain/Step Time": 8.505555449053645} +{"Pretrain/Learning Rate": 2.8110034808070396e-07, "Pretrain/Loss": 2.012087821960449, "Pretrain/Loss (Raw)": 2.2787628173828125, "Pretrain/Step": 9095, "Pretrain/Step Time": 8.503180606290698} +{"Pretrain/Learning Rate": 2.7983221518846634e-07, "Pretrain/Loss": 2.0133779048919678, "Pretrain/Loss (Raw)": 2.006511926651001, "Pretrain/Step": 9096, "Pretrain/Step Time": 8.489826275035739} +{"Pretrain/Learning Rate": 2.7856693314246287e-07, "Pretrain/Loss": 2.008786201477051, "Pretrain/Loss (Raw)": 1.9198743104934692, "Pretrain/Step": 9097, "Pretrain/Step Time": 8.491219921037555} +{"Pretrain/Learning Rate": 2.773045020886156e-07, "Pretrain/Loss": 2.0095200538635254, "Pretrain/Loss (Raw)": 2.0492355823516846, "Pretrain/Step": 9098, "Pretrain/Step Time": 8.494988773018122} +{"Pretrain/Learning Rate": 2.760449221725081e-07, "Pretrain/Loss": 2.007788896560669, "Pretrain/Loss (Raw)": 1.7634944915771484, "Pretrain/Step": 9099, "Pretrain/Step Time": 8.502126140519977} +{"Pretrain/Learning Rate": 2.74788193539402e-07, "Pretrain/Loss": 2.007725715637207, "Pretrain/Loss (Raw)": 2.0096213817596436, "Pretrain/Step": 9100, "Pretrain/Step Time": 8.509219421073794} +{"Pretrain/Learning Rate": 2.7353431633423134e-07, "Pretrain/Loss": 2.0085136890411377, "Pretrain/Loss (Raw)": 1.929228663444519, "Pretrain/Step": 9101, "Pretrain/Step Time": 8.50755426287651} +{"Pretrain/Learning Rate": 2.722832907015971e-07, "Pretrain/Loss": 2.0099735260009766, "Pretrain/Loss (Raw)": 2.0212767124176025, "Pretrain/Step": 9102, "Pretrain/Step Time": 8.501441922038794} +{"Pretrain/Learning Rate": 2.710351167857783e-07, "Pretrain/Loss": 2.008991241455078, "Pretrain/Loss (Raw)": 1.813539981842041, "Pretrain/Step": 9103, "Pretrain/Step Time": 8.499633030965924} +{"Pretrain/Learning Rate": 2.6978979473071264e-07, "Pretrain/Loss": 2.0090510845184326, "Pretrain/Loss (Raw)": 2.0920279026031494, "Pretrain/Step": 9104, "Pretrain/Step Time": 8.508030770346522} +{"Pretrain/Learning Rate": 2.6854732468002133e-07, "Pretrain/Loss": 2.0091052055358887, "Pretrain/Loss (Raw)": 2.1017022132873535, "Pretrain/Step": 9105, "Pretrain/Step Time": 8.514874901622534} +{"Pretrain/Learning Rate": 2.6730770677699245e-07, "Pretrain/Loss": 2.0097179412841797, "Pretrain/Loss (Raw)": 2.18680739402771, "Pretrain/Step": 9106, "Pretrain/Step Time": 8.512982986867428} +{"Pretrain/Learning Rate": 2.6607094116458123e-07, "Pretrain/Loss": 2.013066291809082, "Pretrain/Loss (Raw)": 2.3573126792907715, "Pretrain/Step": 9107, "Pretrain/Step Time": 8.519555523991585} +{"Pretrain/Learning Rate": 2.6483702798542066e-07, "Pretrain/Loss": 2.013410806655884, "Pretrain/Loss (Raw)": 2.1497936248779297, "Pretrain/Step": 9108, "Pretrain/Step Time": 8.512327615171671} +{"Pretrain/Learning Rate": 2.636059673818081e-07, "Pretrain/Loss": 2.015364170074463, "Pretrain/Loss (Raw)": 1.9529591798782349, "Pretrain/Step": 9109, "Pretrain/Step Time": 8.50858674198389} +{"Pretrain/Learning Rate": 2.623777594957216e-07, "Pretrain/Loss": 2.0144705772399902, "Pretrain/Loss (Raw)": 1.970026969909668, "Pretrain/Step": 9110, "Pretrain/Step Time": 8.51256793178618} +{"Pretrain/Learning Rate": 2.6115240446879517e-07, "Pretrain/Loss": 2.0129566192626953, "Pretrain/Loss (Raw)": 1.9871301651000977, "Pretrain/Step": 9111, "Pretrain/Step Time": 8.52081155218184} +{"Pretrain/Learning Rate": 2.599299024423491e-07, "Pretrain/Loss": 2.0152487754821777, "Pretrain/Loss (Raw)": 2.167398452758789, "Pretrain/Step": 9112, "Pretrain/Step Time": 8.522985408082604} +{"Pretrain/Learning Rate": 2.587102535573621e-07, "Pretrain/Loss": 2.0135693550109863, "Pretrain/Loss (Raw)": 1.8429666757583618, "Pretrain/Step": 9113, "Pretrain/Step Time": 8.511750966310501} +{"Pretrain/Learning Rate": 2.5749345795449687e-07, "Pretrain/Loss": 2.0104613304138184, "Pretrain/Loss (Raw)": 1.7252428531646729, "Pretrain/Step": 9114, "Pretrain/Step Time": 8.511982029303908} +{"Pretrain/Learning Rate": 2.562795157740744e-07, "Pretrain/Loss": 2.0109617710113525, "Pretrain/Loss (Raw)": 1.9930375814437866, "Pretrain/Step": 9115, "Pretrain/Step Time": 8.510511199012399} +{"Pretrain/Learning Rate": 2.5506842715609656e-07, "Pretrain/Loss": 2.0110325813293457, "Pretrain/Loss (Raw)": 1.9900400638580322, "Pretrain/Step": 9116, "Pretrain/Step Time": 8.520356148481369} +{"Pretrain/Learning Rate": 2.5386019224022673e-07, "Pretrain/Loss": 2.0103821754455566, "Pretrain/Loss (Raw)": 1.9381358623504639, "Pretrain/Step": 9117, "Pretrain/Step Time": 8.527192739769816} +{"Pretrain/Learning Rate": 2.526548111658117e-07, "Pretrain/Loss": 2.0099024772644043, "Pretrain/Loss (Raw)": 1.9947099685668945, "Pretrain/Step": 9118, "Pretrain/Step Time": 8.533615726977587} +{"Pretrain/Learning Rate": 2.514522840718542e-07, "Pretrain/Loss": 2.011381149291992, "Pretrain/Loss (Raw)": 1.9140864610671997, "Pretrain/Step": 9119, "Pretrain/Step Time": 8.535010375082493} +{"Pretrain/Learning Rate": 2.502526110970377e-07, "Pretrain/Loss": 2.010622978210449, "Pretrain/Loss (Raw)": 1.8248041868209839, "Pretrain/Step": 9120, "Pretrain/Step Time": 8.529336662963033} +{"Pretrain/Learning Rate": 2.490557923797154e-07, "Pretrain/Loss": 2.011826515197754, "Pretrain/Loss (Raw)": 2.273205041885376, "Pretrain/Step": 9121, "Pretrain/Step Time": 8.520518070086837} +{"Pretrain/Learning Rate": 2.478618280579104e-07, "Pretrain/Loss": 2.014565944671631, "Pretrain/Loss (Raw)": 1.9594883918762207, "Pretrain/Step": 9122, "Pretrain/Step Time": 8.524138920009136} +{"Pretrain/Learning Rate": 2.466707182693151e-07, "Pretrain/Loss": 2.013917922973633, "Pretrain/Loss (Raw)": 1.937868595123291, "Pretrain/Step": 9123, "Pretrain/Step Time": 8.534920293837786} +{"Pretrain/Learning Rate": 2.45482463151292e-07, "Pretrain/Loss": 2.013190984725952, "Pretrain/Loss (Raw)": 1.9553558826446533, "Pretrain/Step": 9124, "Pretrain/Step Time": 8.531339548528194} +{"Pretrain/Learning Rate": 2.442970628408814e-07, "Pretrain/Loss": 2.0124082565307617, "Pretrain/Loss (Raw)": 1.8269766569137573, "Pretrain/Step": 9125, "Pretrain/Step Time": 8.529941868036985} +{"Pretrain/Learning Rate": 2.4311451747478233e-07, "Pretrain/Loss": 2.0109810829162598, "Pretrain/Loss (Raw)": 1.6977654695510864, "Pretrain/Step": 9126, "Pretrain/Step Time": 8.525450920686126} +{"Pretrain/Learning Rate": 2.4193482718937733e-07, "Pretrain/Loss": 2.0101547241210938, "Pretrain/Loss (Raw)": 1.9762850999832153, "Pretrain/Step": 9127, "Pretrain/Step Time": 8.523566687479615} +{"Pretrain/Learning Rate": 2.4075799212071317e-07, "Pretrain/Loss": 2.009265899658203, "Pretrain/Loss (Raw)": 1.8909850120544434, "Pretrain/Step": 9128, "Pretrain/Step Time": 8.526450393721461} +{"Pretrain/Learning Rate": 2.395840124045062e-07, "Pretrain/Loss": 2.0084426403045654, "Pretrain/Loss (Raw)": 1.9005526304244995, "Pretrain/Step": 9129, "Pretrain/Step Time": 8.526348600164056} +{"Pretrain/Learning Rate": 2.384128881761455e-07, "Pretrain/Loss": 2.0087122917175293, "Pretrain/Loss (Raw)": 1.8002071380615234, "Pretrain/Step": 9130, "Pretrain/Step Time": 8.535943321883678} +{"Pretrain/Learning Rate": 2.3724461957068956e-07, "Pretrain/Loss": 2.0122222900390625, "Pretrain/Loss (Raw)": 2.177133083343506, "Pretrain/Step": 9131, "Pretrain/Step Time": 8.52999697253108} +{"Pretrain/Learning Rate": 2.360792067228723e-07, "Pretrain/Loss": 2.012552261352539, "Pretrain/Loss (Raw)": 1.9094324111938477, "Pretrain/Step": 9132, "Pretrain/Step Time": 8.52453581430018} +{"Pretrain/Learning Rate": 2.349166497670918e-07, "Pretrain/Loss": 2.0132241249084473, "Pretrain/Loss (Raw)": 1.998242735862732, "Pretrain/Step": 9133, "Pretrain/Step Time": 8.52644164673984} +{"Pretrain/Learning Rate": 2.337569488374186e-07, "Pretrain/Loss": 2.012160539627075, "Pretrain/Loss (Raw)": 2.0916028022766113, "Pretrain/Step": 9134, "Pretrain/Step Time": 8.522837158292532} +{"Pretrain/Learning Rate": 2.3260010406759846e-07, "Pretrain/Loss": 2.0134787559509277, "Pretrain/Loss (Raw)": 2.023794651031494, "Pretrain/Step": 9135, "Pretrain/Step Time": 8.528713095933199} +{"Pretrain/Learning Rate": 2.3144611559104134e-07, "Pretrain/Loss": 2.01405668258667, "Pretrain/Loss (Raw)": 1.9111117124557495, "Pretrain/Step": 9136, "Pretrain/Step Time": 8.53952556848526} +{"Pretrain/Learning Rate": 2.3029498354083245e-07, "Pretrain/Loss": 2.0134878158569336, "Pretrain/Loss (Raw)": 1.975899338722229, "Pretrain/Step": 9137, "Pretrain/Step Time": 8.529378719627857} +{"Pretrain/Learning Rate": 2.2914670804972394e-07, "Pretrain/Loss": 2.0108425617218018, "Pretrain/Loss (Raw)": 1.902956247329712, "Pretrain/Step": 9138, "Pretrain/Step Time": 8.526417953893542} +{"Pretrain/Learning Rate": 2.2800128925014042e-07, "Pretrain/Loss": 2.01440691947937, "Pretrain/Loss (Raw)": 2.046337604522705, "Pretrain/Step": 9139, "Pretrain/Step Time": 8.527458239346743} +{"Pretrain/Learning Rate": 2.26858727274179e-07, "Pretrain/Loss": 2.013751983642578, "Pretrain/Loss (Raw)": 1.9636930227279663, "Pretrain/Step": 9140, "Pretrain/Step Time": 8.533027831465006} +{"Pretrain/Learning Rate": 2.2571902225360374e-07, "Pretrain/Loss": 2.01328444480896, "Pretrain/Loss (Raw)": 2.126356363296509, "Pretrain/Step": 9141, "Pretrain/Step Time": 8.537131214514375} +{"Pretrain/Learning Rate": 2.2458217431984842e-07, "Pretrain/Loss": 2.014951229095459, "Pretrain/Loss (Raw)": 2.1651246547698975, "Pretrain/Step": 9142, "Pretrain/Step Time": 8.53414049372077} +{"Pretrain/Learning Rate": 2.2344818360402476e-07, "Pretrain/Loss": 2.014894723892212, "Pretrain/Loss (Raw)": 2.0514090061187744, "Pretrain/Step": 9143, "Pretrain/Step Time": 8.528973652049899} +{"Pretrain/Learning Rate": 2.2231705023690875e-07, "Pretrain/Loss": 2.0144107341766357, "Pretrain/Loss (Raw)": 2.0533950328826904, "Pretrain/Step": 9144, "Pretrain/Step Time": 8.528010273352265} +{"Pretrain/Learning Rate": 2.2118877434894325e-07, "Pretrain/Loss": 2.0129566192626953, "Pretrain/Loss (Raw)": 1.9748839139938354, "Pretrain/Step": 9145, "Pretrain/Step Time": 8.526487166061997} +{"Pretrain/Learning Rate": 2.2006335607025196e-07, "Pretrain/Loss": 2.011545181274414, "Pretrain/Loss (Raw)": 1.9807323217391968, "Pretrain/Step": 9146, "Pretrain/Step Time": 8.533348117023706} +{"Pretrain/Learning Rate": 2.1894079553062276e-07, "Pretrain/Loss": 2.0110721588134766, "Pretrain/Loss (Raw)": 1.9890377521514893, "Pretrain/Step": 9147, "Pretrain/Step Time": 8.530658656731248} +{"Pretrain/Learning Rate": 2.1782109285951034e-07, "Pretrain/Loss": 2.0091352462768555, "Pretrain/Loss (Raw)": 1.6416987180709839, "Pretrain/Step": 9148, "Pretrain/Step Time": 8.53116911649704} +{"Pretrain/Learning Rate": 2.167042481860504e-07, "Pretrain/Loss": 2.009531259536743, "Pretrain/Loss (Raw)": 2.027454376220703, "Pretrain/Step": 9149, "Pretrain/Step Time": 8.52733762934804} +{"Pretrain/Learning Rate": 2.1559026163903427e-07, "Pretrain/Loss": 2.009305238723755, "Pretrain/Loss (Raw)": 2.1032602787017822, "Pretrain/Step": 9150, "Pretrain/Step Time": 8.514934975653887} +{"Pretrain/Learning Rate": 2.1447913334694258e-07, "Pretrain/Loss": 2.0067625045776367, "Pretrain/Loss (Raw)": 1.8096548318862915, "Pretrain/Step": 9151, "Pretrain/Step Time": 8.513340801000595} +{"Pretrain/Learning Rate": 2.1337086343790613e-07, "Pretrain/Loss": 2.001108407974243, "Pretrain/Loss (Raw)": 2.0416104793548584, "Pretrain/Step": 9152, "Pretrain/Step Time": 8.516486063599586} +{"Pretrain/Learning Rate": 2.1226545203974212e-07, "Pretrain/Loss": 2.003199338912964, "Pretrain/Loss (Raw)": 2.0288991928100586, "Pretrain/Step": 9153, "Pretrain/Step Time": 8.513544069603086} +{"Pretrain/Learning Rate": 2.1116289927992917e-07, "Pretrain/Loss": 2.004178524017334, "Pretrain/Loss (Raw)": 1.9898262023925781, "Pretrain/Step": 9154, "Pretrain/Step Time": 8.513434506952763} +{"Pretrain/Learning Rate": 2.1006320528562107e-07, "Pretrain/Loss": 2.002969980239868, "Pretrain/Loss (Raw)": 1.9321203231811523, "Pretrain/Step": 9155, "Pretrain/Step Time": 8.50950925052166} +{"Pretrain/Learning Rate": 2.0896637018363863e-07, "Pretrain/Loss": 2.0045242309570312, "Pretrain/Loss (Raw)": 2.0682883262634277, "Pretrain/Step": 9156, "Pretrain/Step Time": 8.505365457385778} +{"Pretrain/Learning Rate": 2.0787239410047232e-07, "Pretrain/Loss": 2.0044281482696533, "Pretrain/Loss (Raw)": 2.062556505203247, "Pretrain/Step": 9157, "Pretrain/Step Time": 8.512586513534188} +{"Pretrain/Learning Rate": 2.0678127716228236e-07, "Pretrain/Loss": 2.006295919418335, "Pretrain/Loss (Raw)": 2.0710620880126953, "Pretrain/Step": 9158, "Pretrain/Step Time": 8.510516088455915} +{"Pretrain/Learning Rate": 2.056930194949097e-07, "Pretrain/Loss": 2.0048580169677734, "Pretrain/Loss (Raw)": 1.8697164058685303, "Pretrain/Step": 9159, "Pretrain/Step Time": 8.513177221640944} +{"Pretrain/Learning Rate": 2.0460762122385125e-07, "Pretrain/Loss": 2.004957914352417, "Pretrain/Loss (Raw)": 1.941866159439087, "Pretrain/Step": 9160, "Pretrain/Step Time": 8.518202234059572} +{"Pretrain/Learning Rate": 2.035250824742818e-07, "Pretrain/Loss": 2.007925510406494, "Pretrain/Loss (Raw)": 2.321606397628784, "Pretrain/Step": 9161, "Pretrain/Step Time": 8.503775333985686} +{"Pretrain/Learning Rate": 2.02445403371046e-07, "Pretrain/Loss": 2.009338617324829, "Pretrain/Loss (Raw)": 2.1604316234588623, "Pretrain/Step": 9162, "Pretrain/Step Time": 8.500280141830444} +{"Pretrain/Learning Rate": 2.0136858403865534e-07, "Pretrain/Loss": 2.010279417037964, "Pretrain/Loss (Raw)": 2.0207815170288086, "Pretrain/Step": 9163, "Pretrain/Step Time": 8.505084589123726} +{"Pretrain/Learning Rate": 2.00294624601291e-07, "Pretrain/Loss": 2.01041841506958, "Pretrain/Loss (Raw)": 1.9454375505447388, "Pretrain/Step": 9164, "Pretrain/Step Time": 8.501057559624314} +{"Pretrain/Learning Rate": 1.9922352518281505e-07, "Pretrain/Loss": 2.0103919506073, "Pretrain/Loss (Raw)": 1.937094807624817, "Pretrain/Step": 9165, "Pretrain/Step Time": 8.502914490178227} +{"Pretrain/Learning Rate": 1.9815528590674537e-07, "Pretrain/Loss": 2.0077829360961914, "Pretrain/Loss (Raw)": 1.8087249994277954, "Pretrain/Step": 9166, "Pretrain/Step Time": 8.511240972205997} +{"Pretrain/Learning Rate": 1.9708990689627783e-07, "Pretrain/Loss": 2.007582187652588, "Pretrain/Loss (Raw)": 1.979148030281067, "Pretrain/Step": 9167, "Pretrain/Step Time": 8.505569344386458} +{"Pretrain/Learning Rate": 1.9602738827427802e-07, "Pretrain/Loss": 2.007260322570801, "Pretrain/Loss (Raw)": 1.9881610870361328, "Pretrain/Step": 9168, "Pretrain/Step Time": 8.502275090664625} +{"Pretrain/Learning Rate": 1.9496773016327852e-07, "Pretrain/Loss": 2.0073909759521484, "Pretrain/Loss (Raw)": 1.9799379110336304, "Pretrain/Step": 9169, "Pretrain/Step Time": 8.508454507216811} +{"Pretrain/Learning Rate": 1.9391093268548988e-07, "Pretrain/Loss": 2.007106304168701, "Pretrain/Loss (Raw)": 1.9829227924346924, "Pretrain/Step": 9170, "Pretrain/Step Time": 8.512382632121444} +{"Pretrain/Learning Rate": 1.9285699596277852e-07, "Pretrain/Loss": 2.006348133087158, "Pretrain/Loss (Raw)": 1.9950993061065674, "Pretrain/Step": 9171, "Pretrain/Step Time": 8.510325331240892} +{"Pretrain/Learning Rate": 1.918059201166944e-07, "Pretrain/Loss": 2.0064210891723633, "Pretrain/Loss (Raw)": 2.05584454536438, "Pretrain/Step": 9172, "Pretrain/Step Time": 8.508283911272883} +{"Pretrain/Learning Rate": 1.9075770526845172e-07, "Pretrain/Loss": 2.0066568851470947, "Pretrain/Loss (Raw)": 1.9918551445007324, "Pretrain/Step": 9173, "Pretrain/Step Time": 8.501835705712438} +{"Pretrain/Learning Rate": 1.8971235153893708e-07, "Pretrain/Loss": 2.007319927215576, "Pretrain/Loss (Raw)": 2.1086292266845703, "Pretrain/Step": 9174, "Pretrain/Step Time": 8.497163686901331} +{"Pretrain/Learning Rate": 1.8866985904870127e-07, "Pretrain/Loss": 2.0079641342163086, "Pretrain/Loss (Raw)": 2.1422665119171143, "Pretrain/Step": 9175, "Pretrain/Step Time": 8.502440709620714} +{"Pretrain/Learning Rate": 1.8763022791797314e-07, "Pretrain/Loss": 2.0075440406799316, "Pretrain/Loss (Raw)": 2.120656728744507, "Pretrain/Step": 9176, "Pretrain/Step Time": 8.503504928201437} +{"Pretrain/Learning Rate": 1.8659345826664844e-07, "Pretrain/Loss": 2.005232810974121, "Pretrain/Loss (Raw)": 1.7204501628875732, "Pretrain/Step": 9177, "Pretrain/Step Time": 8.5043835490942} +{"Pretrain/Learning Rate": 1.8555955021428984e-07, "Pretrain/Loss": 2.0041627883911133, "Pretrain/Loss (Raw)": 1.9236366748809814, "Pretrain/Step": 9178, "Pretrain/Step Time": 8.50117831863463} +{"Pretrain/Learning Rate": 1.8452850388013255e-07, "Pretrain/Loss": 2.0020573139190674, "Pretrain/Loss (Raw)": 1.9467815160751343, "Pretrain/Step": 9179, "Pretrain/Step Time": 8.498913342133164} +{"Pretrain/Learning Rate": 1.8350031938308144e-07, "Pretrain/Loss": 2.002162456512451, "Pretrain/Loss (Raw)": 1.9071136713027954, "Pretrain/Step": 9180, "Pretrain/Step Time": 8.495614159852266} +{"Pretrain/Learning Rate": 1.8247499684171666e-07, "Pretrain/Loss": 2.00118350982666, "Pretrain/Loss (Raw)": 1.797910451889038, "Pretrain/Step": 9181, "Pretrain/Step Time": 8.499498570337892} +{"Pretrain/Learning Rate": 1.8145253637427695e-07, "Pretrain/Loss": 2.002077102661133, "Pretrain/Loss (Raw)": 1.9928913116455078, "Pretrain/Step": 9182, "Pretrain/Step Time": 8.505779454484582} +{"Pretrain/Learning Rate": 1.8043293809867635e-07, "Pretrain/Loss": 2.003575563430786, "Pretrain/Loss (Raw)": 2.0697224140167236, "Pretrain/Step": 9183, "Pretrain/Step Time": 8.510504342615604} +{"Pretrain/Learning Rate": 1.7941620213250688e-07, "Pretrain/Loss": 2.001779556274414, "Pretrain/Loss (Raw)": 1.93865168094635, "Pretrain/Step": 9184, "Pretrain/Step Time": 8.509958317503333} +{"Pretrain/Learning Rate": 1.7840232859301919e-07, "Pretrain/Loss": 2.001793622970581, "Pretrain/Loss (Raw)": 2.0365922451019287, "Pretrain/Step": 9185, "Pretrain/Step Time": 8.501451946794987} +{"Pretrain/Learning Rate": 1.7739131759713924e-07, "Pretrain/Loss": 1.9990054368972778, "Pretrain/Loss (Raw)": 1.7740566730499268, "Pretrain/Step": 9186, "Pretrain/Step Time": 8.498242175206542} +{"Pretrain/Learning Rate": 1.7638316926145702e-07, "Pretrain/Loss": 1.9980944395065308, "Pretrain/Loss (Raw)": 1.8812400102615356, "Pretrain/Step": 9187, "Pretrain/Step Time": 8.50348661839962} +{"Pretrain/Learning Rate": 1.7537788370224351e-07, "Pretrain/Loss": 1.9986557960510254, "Pretrain/Loss (Raw)": 2.0536255836486816, "Pretrain/Step": 9188, "Pretrain/Step Time": 8.506935521960258} +{"Pretrain/Learning Rate": 1.7437546103542814e-07, "Pretrain/Loss": 1.9999219179153442, "Pretrain/Loss (Raw)": 2.0952723026275635, "Pretrain/Step": 9189, "Pretrain/Step Time": 8.512481763958931} +{"Pretrain/Learning Rate": 1.7337590137661842e-07, "Pretrain/Loss": 2.000537633895874, "Pretrain/Loss (Raw)": 1.999009132385254, "Pretrain/Step": 9190, "Pretrain/Step Time": 8.510375497862697} +{"Pretrain/Learning Rate": 1.7237920484108327e-07, "Pretrain/Loss": 1.999436616897583, "Pretrain/Loss (Raw)": 1.952073574066162, "Pretrain/Step": 9191, "Pretrain/Step Time": 8.503148877993226} +{"Pretrain/Learning Rate": 1.7138537154377243e-07, "Pretrain/Loss": 1.9986387491226196, "Pretrain/Loss (Raw)": 1.8419663906097412, "Pretrain/Step": 9192, "Pretrain/Step Time": 8.500601820647717} +{"Pretrain/Learning Rate": 1.70394401599297e-07, "Pretrain/Loss": 2.0007119178771973, "Pretrain/Loss (Raw)": 2.2413034439086914, "Pretrain/Step": 9193, "Pretrain/Step Time": 8.50340593419969} +{"Pretrain/Learning Rate": 1.6940629512194052e-07, "Pretrain/Loss": 2.001734972000122, "Pretrain/Loss (Raw)": 2.115020513534546, "Pretrain/Step": 9194, "Pretrain/Step Time": 8.505279127508402} +{"Pretrain/Learning Rate": 1.6842105222565352e-07, "Pretrain/Loss": 2.0037832260131836, "Pretrain/Loss (Raw)": 2.3008551597595215, "Pretrain/Step": 9195, "Pretrain/Step Time": 8.514627518132329} +{"Pretrain/Learning Rate": 1.6743867302406458e-07, "Pretrain/Loss": 2.004300594329834, "Pretrain/Loss (Raw)": 2.092822551727295, "Pretrain/Step": 9196, "Pretrain/Step Time": 8.521772179752588} +{"Pretrain/Learning Rate": 1.6645915763045804e-07, "Pretrain/Loss": 2.002793788909912, "Pretrain/Loss (Raw)": 1.9284700155258179, "Pretrain/Step": 9197, "Pretrain/Step Time": 8.517409896478057} +{"Pretrain/Learning Rate": 1.654825061578047e-07, "Pretrain/Loss": 2.000652313232422, "Pretrain/Loss (Raw)": 1.9125721454620361, "Pretrain/Step": 9198, "Pretrain/Step Time": 8.506320506334305} +{"Pretrain/Learning Rate": 1.6450871871873108e-07, "Pretrain/Loss": 1.9979790449142456, "Pretrain/Loss (Raw)": 1.745200753211975, "Pretrain/Step": 9199, "Pretrain/Step Time": 8.511078575626016} +{"Pretrain/Learning Rate": 1.6353779542554182e-07, "Pretrain/Loss": 1.9983015060424805, "Pretrain/Loss (Raw)": 1.9235243797302246, "Pretrain/Step": 9200, "Pretrain/Step Time": 8.516672493889928} +{"Pretrain/Learning Rate": 1.6256973639020569e-07, "Pretrain/Loss": 1.9975444078445435, "Pretrain/Loss (Raw)": 2.0720717906951904, "Pretrain/Step": 9201, "Pretrain/Step Time": 8.524273987859488} +{"Pretrain/Learning Rate": 1.6160454172436667e-07, "Pretrain/Loss": 1.9983404874801636, "Pretrain/Loss (Raw)": 2.2761635780334473, "Pretrain/Step": 9202, "Pretrain/Step Time": 8.527051471173763} +{"Pretrain/Learning Rate": 1.60642211539333e-07, "Pretrain/Loss": 1.9981898069381714, "Pretrain/Loss (Raw)": 2.0199708938598633, "Pretrain/Step": 9203, "Pretrain/Step Time": 8.522773291915655} +{"Pretrain/Learning Rate": 1.5968274594608812e-07, "Pretrain/Loss": 2.0002918243408203, "Pretrain/Loss (Raw)": 2.0733494758605957, "Pretrain/Step": 9204, "Pretrain/Step Time": 8.521721709519625} +{"Pretrain/Learning Rate": 1.587261450552796e-07, "Pretrain/Loss": 1.999670386314392, "Pretrain/Loss (Raw)": 1.9403786659240723, "Pretrain/Step": 9205, "Pretrain/Step Time": 8.51870191656053} +{"Pretrain/Learning Rate": 1.5777240897722757e-07, "Pretrain/Loss": 1.997771978378296, "Pretrain/Loss (Raw)": 1.9115313291549683, "Pretrain/Step": 9206, "Pretrain/Step Time": 8.528765331953764} +{"Pretrain/Learning Rate": 1.5682153782192177e-07, "Pretrain/Loss": 1.9986364841461182, "Pretrain/Loss (Raw)": 2.1762545108795166, "Pretrain/Step": 9207, "Pretrain/Step Time": 8.528337074443698} +{"Pretrain/Learning Rate": 1.5587353169902175e-07, "Pretrain/Loss": 1.999229907989502, "Pretrain/Loss (Raw)": 2.1473066806793213, "Pretrain/Step": 9208, "Pretrain/Step Time": 8.526982724666595} +{"Pretrain/Learning Rate": 1.5492839071785392e-07, "Pretrain/Loss": 1.999969720840454, "Pretrain/Loss (Raw)": 2.3046443462371826, "Pretrain/Step": 9209, "Pretrain/Step Time": 8.52660639770329} +{"Pretrain/Learning Rate": 1.5398611498742e-07, "Pretrain/Loss": 1.9997122287750244, "Pretrain/Loss (Raw)": 1.9997535943984985, "Pretrain/Step": 9210, "Pretrain/Step Time": 8.522446766495705} +{"Pretrain/Learning Rate": 1.5304670461638582e-07, "Pretrain/Loss": 1.9982446432113647, "Pretrain/Loss (Raw)": 1.9034960269927979, "Pretrain/Step": 9211, "Pretrain/Step Time": 8.526500262320042} +{"Pretrain/Learning Rate": 1.521101597130842e-07, "Pretrain/Loss": 2.001397132873535, "Pretrain/Loss (Raw)": 2.1750080585479736, "Pretrain/Step": 9212, "Pretrain/Step Time": 8.533009907230735} +{"Pretrain/Learning Rate": 1.5117648038553144e-07, "Pretrain/Loss": 1.9994592666625977, "Pretrain/Loss (Raw)": 1.9208109378814697, "Pretrain/Step": 9213, "Pretrain/Step Time": 8.53702574595809} +{"Pretrain/Learning Rate": 1.502456667413943e-07, "Pretrain/Loss": 2.0001556873321533, "Pretrain/Loss (Raw)": 2.023554801940918, "Pretrain/Step": 9214, "Pretrain/Step Time": 8.53183712810278} +{"Pretrain/Learning Rate": 1.493177188880257e-07, "Pretrain/Loss": 1.996649980545044, "Pretrain/Loss (Raw)": 1.851074457168579, "Pretrain/Step": 9215, "Pretrain/Step Time": 8.529330033808947} +{"Pretrain/Learning Rate": 1.4839263693243732e-07, "Pretrain/Loss": 1.9977869987487793, "Pretrain/Loss (Raw)": 2.0304155349731445, "Pretrain/Step": 9216, "Pretrain/Step Time": 8.53064845316112} +{"Pretrain/Learning Rate": 1.4747042098131326e-07, "Pretrain/Loss": 1.9965507984161377, "Pretrain/Loss (Raw)": 1.8142786026000977, "Pretrain/Step": 9217, "Pretrain/Step Time": 8.529403183609247} +{"Pretrain/Learning Rate": 1.4655107114101007e-07, "Pretrain/Loss": 1.9949021339416504, "Pretrain/Loss (Raw)": 1.814218282699585, "Pretrain/Step": 9218, "Pretrain/Step Time": 8.535053415223956} +{"Pretrain/Learning Rate": 1.4563458751755132e-07, "Pretrain/Loss": 1.996793508529663, "Pretrain/Loss (Raw)": 2.0612549781799316, "Pretrain/Step": 9219, "Pretrain/Step Time": 8.531644532456994} +{"Pretrain/Learning Rate": 1.4472097021662745e-07, "Pretrain/Loss": 1.9961549043655396, "Pretrain/Loss (Raw)": 2.050879716873169, "Pretrain/Step": 9220, "Pretrain/Step Time": 8.53453310765326} +{"Pretrain/Learning Rate": 1.4381021934360417e-07, "Pretrain/Loss": 1.9969282150268555, "Pretrain/Loss (Raw)": 2.0543384552001953, "Pretrain/Step": 9221, "Pretrain/Step Time": 8.528646109625697} +{"Pretrain/Learning Rate": 1.4290233500351414e-07, "Pretrain/Loss": 1.9950350522994995, "Pretrain/Loss (Raw)": 1.8867937326431274, "Pretrain/Step": 9222, "Pretrain/Step Time": 8.52503770031035} +{"Pretrain/Learning Rate": 1.4199731730105693e-07, "Pretrain/Loss": 1.9925565719604492, "Pretrain/Loss (Raw)": 1.9615163803100586, "Pretrain/Step": 9223, "Pretrain/Step Time": 8.534328866750002} +{"Pretrain/Learning Rate": 1.4109516634060182e-07, "Pretrain/Loss": 1.9947422742843628, "Pretrain/Loss (Raw)": 2.2862870693206787, "Pretrain/Step": 9224, "Pretrain/Step Time": 8.536630112677813} +{"Pretrain/Learning Rate": 1.401958822261934e-07, "Pretrain/Loss": 1.9945919513702393, "Pretrain/Loss (Raw)": 1.900629997253418, "Pretrain/Step": 9225, "Pretrain/Step Time": 8.536972245201468} +{"Pretrain/Learning Rate": 1.3929946506153758e-07, "Pretrain/Loss": 1.9939696788787842, "Pretrain/Loss (Raw)": 1.969594955444336, "Pretrain/Step": 9226, "Pretrain/Step Time": 8.53254609555006} +{"Pretrain/Learning Rate": 1.3840591495001554e-07, "Pretrain/Loss": 1.9976575374603271, "Pretrain/Loss (Raw)": 2.235513687133789, "Pretrain/Step": 9227, "Pretrain/Step Time": 8.526640258729458} +{"Pretrain/Learning Rate": 1.375152319946754e-07, "Pretrain/Loss": 1.9968984127044678, "Pretrain/Loss (Raw)": 1.9124799966812134, "Pretrain/Step": 9228, "Pretrain/Step Time": 8.517179576680064} +{"Pretrain/Learning Rate": 1.3662741629823506e-07, "Pretrain/Loss": 1.9971495866775513, "Pretrain/Loss (Raw)": 1.9613703489303589, "Pretrain/Step": 9229, "Pretrain/Step Time": 8.520751973614097} +{"Pretrain/Learning Rate": 1.357424679630792e-07, "Pretrain/Loss": 1.9957234859466553, "Pretrain/Loss (Raw)": 1.838729739189148, "Pretrain/Step": 9230, "Pretrain/Step Time": 8.525954615324736} +{"Pretrain/Learning Rate": 1.348603870912679e-07, "Pretrain/Loss": 1.9976098537445068, "Pretrain/Loss (Raw)": 2.055004119873047, "Pretrain/Step": 9231, "Pretrain/Step Time": 8.533145790919662} +{"Pretrain/Learning Rate": 1.3398117378452534e-07, "Pretrain/Loss": 1.996229887008667, "Pretrain/Loss (Raw)": 1.9153884649276733, "Pretrain/Step": 9232, "Pretrain/Step Time": 8.527937773615122} +{"Pretrain/Learning Rate": 1.331048281442454e-07, "Pretrain/Loss": 1.9971822500228882, "Pretrain/Loss (Raw)": 2.223604202270508, "Pretrain/Step": 9233, "Pretrain/Step Time": 8.52237788029015} +{"Pretrain/Learning Rate": 1.322313502714917e-07, "Pretrain/Loss": 1.9970371723175049, "Pretrain/Loss (Raw)": 2.1682231426239014, "Pretrain/Step": 9234, "Pretrain/Step Time": 8.521240359172225} +{"Pretrain/Learning Rate": 1.3136074026700307e-07, "Pretrain/Loss": 1.992643117904663, "Pretrain/Loss (Raw)": 1.7948899269104004, "Pretrain/Step": 9235, "Pretrain/Step Time": 8.521346652880311} +{"Pretrain/Learning Rate": 1.30492998231177e-07, "Pretrain/Loss": 1.991258144378662, "Pretrain/Loss (Raw)": 1.9725148677825928, "Pretrain/Step": 9236, "Pretrain/Step Time": 8.523871371522546} +{"Pretrain/Learning Rate": 1.296281242640862e-07, "Pretrain/Loss": 1.99141263961792, "Pretrain/Loss (Raw)": 1.972732424736023, "Pretrain/Step": 9237, "Pretrain/Step Time": 8.521841088309884} +{"Pretrain/Learning Rate": 1.2876611846547593e-07, "Pretrain/Loss": 1.9911298751831055, "Pretrain/Loss (Raw)": 1.9338364601135254, "Pretrain/Step": 9238, "Pretrain/Step Time": 8.522106627002358} +{"Pretrain/Learning Rate": 1.2790698093474995e-07, "Pretrain/Loss": 1.9913859367370605, "Pretrain/Loss (Raw)": 2.0199031829833984, "Pretrain/Step": 9239, "Pretrain/Step Time": 8.513647293671966} +{"Pretrain/Learning Rate": 1.270507117709957e-07, "Pretrain/Loss": 1.9902080297470093, "Pretrain/Loss (Raw)": 2.016619920730591, "Pretrain/Step": 9240, "Pretrain/Step Time": 8.51217620074749} +{"Pretrain/Learning Rate": 1.2619731107295917e-07, "Pretrain/Loss": 1.9909560680389404, "Pretrain/Loss (Raw)": 1.938727617263794, "Pretrain/Step": 9241, "Pretrain/Step Time": 8.521460259333253} +{"Pretrain/Learning Rate": 1.2534677893905334e-07, "Pretrain/Loss": 1.9933507442474365, "Pretrain/Loss (Raw)": 2.0317423343658447, "Pretrain/Step": 9242, "Pretrain/Step Time": 8.522442223504186} +{"Pretrain/Learning Rate": 1.244991154673747e-07, "Pretrain/Loss": 1.994222640991211, "Pretrain/Loss (Raw)": 2.104642152786255, "Pretrain/Step": 9243, "Pretrain/Step Time": 8.52388103120029} +{"Pretrain/Learning Rate": 1.2365432075567007e-07, "Pretrain/Loss": 1.9944638013839722, "Pretrain/Loss (Raw)": 2.0209250450134277, "Pretrain/Step": 9244, "Pretrain/Step Time": 8.51409511640668} +{"Pretrain/Learning Rate": 1.228123949013754e-07, "Pretrain/Loss": 1.9957019090652466, "Pretrain/Loss (Raw)": 2.0966081619262695, "Pretrain/Step": 9245, "Pretrain/Step Time": 8.509100090712309} +{"Pretrain/Learning Rate": 1.2197333800157973e-07, "Pretrain/Loss": 1.992877721786499, "Pretrain/Loss (Raw)": 1.6332145929336548, "Pretrain/Step": 9246, "Pretrain/Step Time": 8.506502151489258} +{"Pretrain/Learning Rate": 1.2113715015304728e-07, "Pretrain/Loss": 1.9933782815933228, "Pretrain/Loss (Raw)": 1.978157877922058, "Pretrain/Step": 9247, "Pretrain/Step Time": 8.510286936536431} +{"Pretrain/Learning Rate": 1.2030383145221203e-07, "Pretrain/Loss": 1.9965239763259888, "Pretrain/Loss (Raw)": 2.2274460792541504, "Pretrain/Step": 9248, "Pretrain/Step Time": 8.51104318909347} +{"Pretrain/Learning Rate": 1.1947338199517489e-07, "Pretrain/Loss": 1.9946409463882446, "Pretrain/Loss (Raw)": 2.032191514968872, "Pretrain/Step": 9249, "Pretrain/Step Time": 8.511830979958177} +{"Pretrain/Learning Rate": 1.1864580187770647e-07, "Pretrain/Loss": 1.9951684474945068, "Pretrain/Loss (Raw)": 2.0269956588745117, "Pretrain/Step": 9250, "Pretrain/Step Time": 8.50543038547039} +{"Pretrain/Learning Rate": 1.1782109119524986e-07, "Pretrain/Loss": 1.996478796005249, "Pretrain/Loss (Raw)": 2.1055994033813477, "Pretrain/Step": 9251, "Pretrain/Step Time": 8.495829235762358} +{"Pretrain/Learning Rate": 1.169992500429179e-07, "Pretrain/Loss": 1.9973227977752686, "Pretrain/Loss (Raw)": 2.063394784927368, "Pretrain/Step": 9252, "Pretrain/Step Time": 8.5004220623523} +{"Pretrain/Learning Rate": 1.1618027851548197e-07, "Pretrain/Loss": 1.998999834060669, "Pretrain/Loss (Raw)": 2.0416371822357178, "Pretrain/Step": 9253, "Pretrain/Step Time": 8.502071462571621} +{"Pretrain/Learning Rate": 1.1536417670739152e-07, "Pretrain/Loss": 2.003026008605957, "Pretrain/Loss (Raw)": 2.213108539581299, "Pretrain/Step": 9254, "Pretrain/Step Time": 8.499758142977953} +{"Pretrain/Learning Rate": 1.1455094471276573e-07, "Pretrain/Loss": 2.000593662261963, "Pretrain/Loss (Raw)": 1.664921522140503, "Pretrain/Step": 9255, "Pretrain/Step Time": 8.503924304619431} +{"Pretrain/Learning Rate": 1.1374058262539067e-07, "Pretrain/Loss": 2.0031421184539795, "Pretrain/Loss (Raw)": 2.2172110080718994, "Pretrain/Step": 9256, "Pretrain/Step Time": 8.495109824463725} +{"Pretrain/Learning Rate": 1.1293309053871659e-07, "Pretrain/Loss": 2.0037131309509277, "Pretrain/Loss (Raw)": 1.9736597537994385, "Pretrain/Step": 9257, "Pretrain/Step Time": 8.49681973643601} +{"Pretrain/Learning Rate": 1.1212846854587177e-07, "Pretrain/Loss": 2.005585193634033, "Pretrain/Loss (Raw)": 2.039825677871704, "Pretrain/Step": 9258, "Pretrain/Step Time": 8.498364768922329} +{"Pretrain/Learning Rate": 1.113267167396459e-07, "Pretrain/Loss": 2.004943370819092, "Pretrain/Loss (Raw)": 2.094975471496582, "Pretrain/Step": 9259, "Pretrain/Step Time": 8.499804800376296} +{"Pretrain/Learning Rate": 1.1052783521250387e-07, "Pretrain/Loss": 2.006147623062134, "Pretrain/Loss (Raw)": 2.063568353652954, "Pretrain/Step": 9260, "Pretrain/Step Time": 8.498178772628307} +{"Pretrain/Learning Rate": 1.0973182405657479e-07, "Pretrain/Loss": 2.005497932434082, "Pretrain/Loss (Raw)": 1.9150612354278564, "Pretrain/Step": 9261, "Pretrain/Step Time": 8.497256828472018} +{"Pretrain/Learning Rate": 1.089386833636602e-07, "Pretrain/Loss": 2.0052990913391113, "Pretrain/Loss (Raw)": 2.0661537647247314, "Pretrain/Step": 9262, "Pretrain/Step Time": 8.49835110642016} +{"Pretrain/Learning Rate": 1.0814841322522585e-07, "Pretrain/Loss": 2.0062999725341797, "Pretrain/Loss (Raw)": 2.151930093765259, "Pretrain/Step": 9263, "Pretrain/Step Time": 8.49577846750617} +{"Pretrain/Learning Rate": 1.0736101373240992e-07, "Pretrain/Loss": 2.005394458770752, "Pretrain/Loss (Raw)": 1.7952051162719727, "Pretrain/Step": 9264, "Pretrain/Step Time": 8.493264654651284} +{"Pretrain/Learning Rate": 1.0657648497601757e-07, "Pretrain/Loss": 2.0055999755859375, "Pretrain/Loss (Raw)": 2.002203941345215, "Pretrain/Step": 9265, "Pretrain/Step Time": 8.494558801874518} +{"Pretrain/Learning Rate": 1.0579482704653199e-07, "Pretrain/Loss": 2.006964683532715, "Pretrain/Loss (Raw)": 2.0776479244232178, "Pretrain/Step": 9266, "Pretrain/Step Time": 8.50196086615324} +{"Pretrain/Learning Rate": 1.0501604003408938e-07, "Pretrain/Loss": 2.007880687713623, "Pretrain/Loss (Raw)": 2.1635875701904297, "Pretrain/Step": 9267, "Pretrain/Step Time": 8.505106221884489} +{"Pretrain/Learning Rate": 1.042401240285068e-07, "Pretrain/Loss": 2.0093419551849365, "Pretrain/Loss (Raw)": 2.15071177482605, "Pretrain/Step": 9268, "Pretrain/Step Time": 8.497258814051747} +{"Pretrain/Learning Rate": 1.0346707911926268e-07, "Pretrain/Loss": 2.0084805488586426, "Pretrain/Loss (Raw)": 2.0160884857177734, "Pretrain/Step": 9269, "Pretrain/Step Time": 8.496992696076632} +{"Pretrain/Learning Rate": 1.0269690539551625e-07, "Pretrain/Loss": 2.0061135292053223, "Pretrain/Loss (Raw)": 1.8621635437011719, "Pretrain/Step": 9270, "Pretrain/Step Time": 8.50037538073957} +{"Pretrain/Learning Rate": 1.0192960294607978e-07, "Pretrain/Loss": 2.0073885917663574, "Pretrain/Loss (Raw)": 2.2146379947662354, "Pretrain/Step": 9271, "Pretrain/Step Time": 8.511599676683545} +{"Pretrain/Learning Rate": 1.011651718594464e-07, "Pretrain/Loss": 2.0071613788604736, "Pretrain/Loss (Raw)": 2.024294853210449, "Pretrain/Step": 9272, "Pretrain/Step Time": 8.514785636216402} +{"Pretrain/Learning Rate": 1.0040361222377059e-07, "Pretrain/Loss": 2.007232189178467, "Pretrain/Loss (Raw)": 1.9839533567428589, "Pretrain/Step": 9273, "Pretrain/Step Time": 8.50559307448566} +{"Pretrain/Learning Rate": 9.964492412688209e-08, "Pretrain/Loss": 2.0086991786956787, "Pretrain/Loss (Raw)": 2.168510675430298, "Pretrain/Step": 9274, "Pretrain/Step Time": 8.500535951927304} +{"Pretrain/Learning Rate": 9.88891076562748e-08, "Pretrain/Loss": 2.009079694747925, "Pretrain/Loss (Raw)": 2.037726879119873, "Pretrain/Step": 9275, "Pretrain/Step Time": 8.501587072387338} +{"Pretrain/Learning Rate": 9.813616289911509e-08, "Pretrain/Loss": 2.0126190185546875, "Pretrain/Loss (Raw)": 2.0947201251983643, "Pretrain/Step": 9276, "Pretrain/Step Time": 8.510220712050796} +{"Pretrain/Learning Rate": 9.738608994223352e-08, "Pretrain/Loss": 2.013906478881836, "Pretrain/Loss (Raw)": 2.192256212234497, "Pretrain/Step": 9277, "Pretrain/Step Time": 8.512343602254987} +{"Pretrain/Learning Rate": 9.663888887213313e-08, "Pretrain/Loss": 2.012031078338623, "Pretrain/Loss (Raw)": 1.8632142543792725, "Pretrain/Step": 9278, "Pretrain/Step Time": 8.516346113756299} +{"Pretrain/Learning Rate": 9.589455977498385e-08, "Pretrain/Loss": 2.0133631229400635, "Pretrain/Loss (Raw)": 1.9801689386367798, "Pretrain/Step": 9279, "Pretrain/Step Time": 8.51374065876007} +{"Pretrain/Learning Rate": 9.515310273662814e-08, "Pretrain/Loss": 2.013174533843994, "Pretrain/Loss (Raw)": 2.0174522399902344, "Pretrain/Step": 9280, "Pretrain/Step Time": 8.507985793054104} +{"Pretrain/Learning Rate": 9.441451784256706e-08, "Pretrain/Loss": 2.0130810737609863, "Pretrain/Loss (Raw)": 2.0169475078582764, "Pretrain/Step": 9281, "Pretrain/Step Time": 8.50831663236022} +{"Pretrain/Learning Rate": 9.3678805177988e-08, "Pretrain/Loss": 2.013190746307373, "Pretrain/Loss (Raw)": 2.0038490295410156, "Pretrain/Step": 9282, "Pretrain/Step Time": 8.504714671522379} +{"Pretrain/Learning Rate": 9.294596482772866e-08, "Pretrain/Loss": 2.0151848793029785, "Pretrain/Loss (Raw)": 2.187396764755249, "Pretrain/Step": 9283, "Pretrain/Step Time": 8.51112188026309} +{"Pretrain/Learning Rate": 9.221599687630755e-08, "Pretrain/Loss": 2.0125420093536377, "Pretrain/Loss (Raw)": 1.7299911975860596, "Pretrain/Step": 9284, "Pretrain/Step Time": 8.514025654643774} +{"Pretrain/Learning Rate": 9.148890140790733e-08, "Pretrain/Loss": 2.0128231048583984, "Pretrain/Loss (Raw)": 2.098529815673828, "Pretrain/Step": 9285, "Pretrain/Step Time": 8.514935621991754} +{"Pretrain/Learning Rate": 9.076467850638037e-08, "Pretrain/Loss": 2.011115550994873, "Pretrain/Loss (Raw)": 1.8524706363677979, "Pretrain/Step": 9286, "Pretrain/Step Time": 8.515058651566505} +{"Pretrain/Learning Rate": 9.004332825524597e-08, "Pretrain/Loss": 2.0126028060913086, "Pretrain/Loss (Raw)": 2.060117483139038, "Pretrain/Step": 9287, "Pretrain/Step Time": 8.513420458883047} +{"Pretrain/Learning Rate": 8.932485073769592e-08, "Pretrain/Loss": 2.013193130493164, "Pretrain/Loss (Raw)": 2.017427921295166, "Pretrain/Step": 9288, "Pretrain/Step Time": 8.514300430193543} +{"Pretrain/Learning Rate": 8.860924603658338e-08, "Pretrain/Loss": 2.0079355239868164, "Pretrain/Loss (Raw)": 1.6486366987228394, "Pretrain/Step": 9289, "Pretrain/Step Time": 8.520900083705783} +{"Pretrain/Learning Rate": 8.789651423444234e-08, "Pretrain/Loss": 2.0072150230407715, "Pretrain/Loss (Raw)": 2.068192481994629, "Pretrain/Step": 9290, "Pretrain/Step Time": 8.526828160509467} +{"Pretrain/Learning Rate": 8.718665541346261e-08, "Pretrain/Loss": 2.008643865585327, "Pretrain/Loss (Raw)": 2.2036800384521484, "Pretrain/Step": 9291, "Pretrain/Step Time": 8.520500591024756} +{"Pretrain/Learning Rate": 8.647966965551202e-08, "Pretrain/Loss": 2.011009693145752, "Pretrain/Loss (Raw)": 2.248262882232666, "Pretrain/Step": 9292, "Pretrain/Step Time": 8.52046375349164} +{"Pretrain/Learning Rate": 8.577555704212259e-08, "Pretrain/Loss": 2.011977195739746, "Pretrain/Loss (Raw)": 2.0609211921691895, "Pretrain/Step": 9293, "Pretrain/Step Time": 8.521452074870467} +{"Pretrain/Learning Rate": 8.507431765449603e-08, "Pretrain/Loss": 2.013737916946411, "Pretrain/Loss (Raw)": 2.034107208251953, "Pretrain/Step": 9294, "Pretrain/Step Time": 8.51682461425662} +{"Pretrain/Learning Rate": 8.437595157350098e-08, "Pretrain/Loss": 2.014246702194214, "Pretrain/Loss (Raw)": 2.044290542602539, "Pretrain/Step": 9295, "Pretrain/Step Time": 8.526068367064} +{"Pretrain/Learning Rate": 8.368045887967858e-08, "Pretrain/Loss": 2.0141685009002686, "Pretrain/Loss (Raw)": 1.9781500101089478, "Pretrain/Step": 9296, "Pretrain/Step Time": 8.529804753139615} +{"Pretrain/Learning Rate": 8.298783965323409e-08, "Pretrain/Loss": 2.0132243633270264, "Pretrain/Loss (Raw)": 1.8590821027755737, "Pretrain/Step": 9297, "Pretrain/Step Time": 8.524755004793406} +{"Pretrain/Learning Rate": 8.22980939740453e-08, "Pretrain/Loss": 2.0146737098693848, "Pretrain/Loss (Raw)": 2.1684372425079346, "Pretrain/Step": 9298, "Pretrain/Step Time": 8.521040480583906} +{"Pretrain/Learning Rate": 8.161122192165693e-08, "Pretrain/Loss": 2.0136923789978027, "Pretrain/Loss (Raw)": 1.8694703578948975, "Pretrain/Step": 9299, "Pretrain/Step Time": 8.521604292094707} +{"Pretrain/Learning Rate": 8.092722357528059e-08, "Pretrain/Loss": 2.014120578765869, "Pretrain/Loss (Raw)": 2.1106884479522705, "Pretrain/Step": 9300, "Pretrain/Step Time": 8.523910865187645} +{"Pretrain/Learning Rate": 8.024609901380042e-08, "Pretrain/Loss": 2.0140161514282227, "Pretrain/Loss (Raw)": 1.978472352027893, "Pretrain/Step": 9301, "Pretrain/Step Time": 8.529794121161103} +{"Pretrain/Learning Rate": 7.956784831576469e-08, "Pretrain/Loss": 2.0132908821105957, "Pretrain/Loss (Raw)": 2.0157806873321533, "Pretrain/Step": 9302, "Pretrain/Step Time": 8.527578558772802} +{"Pretrain/Learning Rate": 7.889247155939417e-08, "Pretrain/Loss": 2.011791706085205, "Pretrain/Loss (Raw)": 1.950363039970398, "Pretrain/Step": 9303, "Pretrain/Step Time": 8.521544460207224} +{"Pretrain/Learning Rate": 7.821996882257654e-08, "Pretrain/Loss": 2.010800838470459, "Pretrain/Loss (Raw)": 1.993860125541687, "Pretrain/Step": 9304, "Pretrain/Step Time": 8.51846482232213} +{"Pretrain/Learning Rate": 7.755034018286644e-08, "Pretrain/Loss": 2.0136754512786865, "Pretrain/Loss (Raw)": 2.088388681411743, "Pretrain/Step": 9305, "Pretrain/Step Time": 8.515536326915026} +{"Pretrain/Learning Rate": 7.688358571748821e-08, "Pretrain/Loss": 2.014514684677124, "Pretrain/Loss (Raw)": 2.031038284301758, "Pretrain/Step": 9306, "Pretrain/Step Time": 8.518849169835448} +{"Pretrain/Learning Rate": 7.621970550333868e-08, "Pretrain/Loss": 2.016083240509033, "Pretrain/Loss (Raw)": 2.147556781768799, "Pretrain/Step": 9307, "Pretrain/Step Time": 8.518926609307528} +{"Pretrain/Learning Rate": 7.555869961697881e-08, "Pretrain/Loss": 2.0177290439605713, "Pretrain/Loss (Raw)": 2.1177892684936523, "Pretrain/Step": 9308, "Pretrain/Step Time": 8.532449843361974} +{"Pretrain/Learning Rate": 7.490056813463375e-08, "Pretrain/Loss": 2.017416477203369, "Pretrain/Loss (Raw)": 1.7579045295715332, "Pretrain/Step": 9309, "Pretrain/Step Time": 8.526461113244295} +{"Pretrain/Learning Rate": 7.424531113220945e-08, "Pretrain/Loss": 2.01784610748291, "Pretrain/Loss (Raw)": 2.0478858947753906, "Pretrain/Step": 9310, "Pretrain/Step Time": 8.520075976848602} +{"Pretrain/Learning Rate": 7.359292868526769e-08, "Pretrain/Loss": 2.0180201530456543, "Pretrain/Loss (Raw)": 2.091989040374756, "Pretrain/Step": 9311, "Pretrain/Step Time": 8.517313504591584} +{"Pretrain/Learning Rate": 7.294342086904827e-08, "Pretrain/Loss": 2.018073081970215, "Pretrain/Loss (Raw)": 1.9454635381698608, "Pretrain/Step": 9312, "Pretrain/Step Time": 8.520721811801195} +{"Pretrain/Learning Rate": 7.229678775845238e-08, "Pretrain/Loss": 2.0173091888427734, "Pretrain/Loss (Raw)": 1.9388023614883423, "Pretrain/Step": 9313, "Pretrain/Step Time": 8.526385929435492} +{"Pretrain/Learning Rate": 7.165302942805374e-08, "Pretrain/Loss": 2.0186312198638916, "Pretrain/Loss (Raw)": 1.9432653188705444, "Pretrain/Step": 9314, "Pretrain/Step Time": 8.532509990036488} +{"Pretrain/Learning Rate": 7.101214595209571e-08, "Pretrain/Loss": 2.0208020210266113, "Pretrain/Loss (Raw)": 2.1590940952301025, "Pretrain/Step": 9315, "Pretrain/Step Time": 8.526508796960115} +{"Pretrain/Learning Rate": 7.037413740448306e-08, "Pretrain/Loss": 2.020643949508667, "Pretrain/Loss (Raw)": 2.03340744972229, "Pretrain/Step": 9316, "Pretrain/Step Time": 8.528774345293641} +{"Pretrain/Learning Rate": 6.973900385880138e-08, "Pretrain/Loss": 2.021456241607666, "Pretrain/Loss (Raw)": 2.1992428302764893, "Pretrain/Step": 9317, "Pretrain/Step Time": 8.518674023449421} +{"Pretrain/Learning Rate": 6.910674538828931e-08, "Pretrain/Loss": 2.021066188812256, "Pretrain/Loss (Raw)": 1.9490938186645508, "Pretrain/Step": 9318, "Pretrain/Step Time": 8.524344274774194} +{"Pretrain/Learning Rate": 6.847736206586908e-08, "Pretrain/Loss": 2.021177291870117, "Pretrain/Loss (Raw)": 1.9662648439407349, "Pretrain/Step": 9319, "Pretrain/Step Time": 8.528603345155716} +{"Pretrain/Learning Rate": 6.785085396411872e-08, "Pretrain/Loss": 2.020963430404663, "Pretrain/Loss (Raw)": 1.814620852470398, "Pretrain/Step": 9320, "Pretrain/Step Time": 8.532300988212228} +{"Pretrain/Learning Rate": 6.722722115529156e-08, "Pretrain/Loss": 2.020948886871338, "Pretrain/Loss (Raw)": 2.2394468784332275, "Pretrain/Step": 9321, "Pretrain/Step Time": 8.529650321230292} +{"Pretrain/Learning Rate": 6.660646371130785e-08, "Pretrain/Loss": 2.019778251647949, "Pretrain/Loss (Raw)": 1.9651747941970825, "Pretrain/Step": 9322, "Pretrain/Step Time": 8.52935891225934} +{"Pretrain/Learning Rate": 6.598858170375755e-08, "Pretrain/Loss": 2.0177178382873535, "Pretrain/Loss (Raw)": 2.0371222496032715, "Pretrain/Step": 9323, "Pretrain/Step Time": 8.526621891185641} +{"Pretrain/Learning Rate": 6.537357520389753e-08, "Pretrain/Loss": 2.017223358154297, "Pretrain/Loss (Raw)": 2.0295228958129883, "Pretrain/Step": 9324, "Pretrain/Step Time": 8.525536743924022} +{"Pretrain/Learning Rate": 6.476144428265163e-08, "Pretrain/Loss": 2.01788592338562, "Pretrain/Loss (Raw)": 2.0132734775543213, "Pretrain/Step": 9325, "Pretrain/Step Time": 8.526283929124475} +{"Pretrain/Learning Rate": 6.415218901061614e-08, "Pretrain/Loss": 2.0193655490875244, "Pretrain/Loss (Raw)": 2.1019625663757324, "Pretrain/Step": 9326, "Pretrain/Step Time": 8.53130622394383} +{"Pretrain/Learning Rate": 6.354580945805156e-08, "Pretrain/Loss": 2.0198440551757812, "Pretrain/Loss (Raw)": 1.8064628839492798, "Pretrain/Step": 9327, "Pretrain/Step Time": 8.52835769020021} +{"Pretrain/Learning Rate": 6.294230569488802e-08, "Pretrain/Loss": 2.023077964782715, "Pretrain/Loss (Raw)": 2.337441921234131, "Pretrain/Step": 9328, "Pretrain/Step Time": 8.520596044138074} +{"Pretrain/Learning Rate": 6.234167779072542e-08, "Pretrain/Loss": 2.020958423614502, "Pretrain/Loss (Raw)": 1.8007750511169434, "Pretrain/Step": 9329, "Pretrain/Step Time": 8.520803149789572} +{"Pretrain/Learning Rate": 6.174392581483057e-08, "Pretrain/Loss": 2.019273042678833, "Pretrain/Loss (Raw)": 2.06044864654541, "Pretrain/Step": 9330, "Pretrain/Step Time": 8.51733535528183} +{"Pretrain/Learning Rate": 6.114904983613722e-08, "Pretrain/Loss": 2.019453525543213, "Pretrain/Loss (Raw)": 2.043062686920166, "Pretrain/Step": 9331, "Pretrain/Step Time": 8.519484713673592} +{"Pretrain/Learning Rate": 6.055704992325162e-08, "Pretrain/Loss": 2.0166900157928467, "Pretrain/Loss (Raw)": 1.719617247581482, "Pretrain/Step": 9332, "Pretrain/Step Time": 8.51828240416944} +{"Pretrain/Learning Rate": 5.99679261444469e-08, "Pretrain/Loss": 2.018599033355713, "Pretrain/Loss (Raw)": 2.1847293376922607, "Pretrain/Step": 9333, "Pretrain/Step Time": 8.518375985324383} +{"Pretrain/Learning Rate": 5.938167856766319e-08, "Pretrain/Loss": 2.0194334983825684, "Pretrain/Loss (Raw)": 2.0183768272399902, "Pretrain/Step": 9334, "Pretrain/Step Time": 8.512471558526158} +{"Pretrain/Learning Rate": 5.87983072605075e-08, "Pretrain/Loss": 2.017871141433716, "Pretrain/Loss (Raw)": 1.9762341976165771, "Pretrain/Step": 9335, "Pretrain/Step Time": 8.521708454936743} +{"Pretrain/Learning Rate": 5.821781229025658e-08, "Pretrain/Loss": 2.018510341644287, "Pretrain/Loss (Raw)": 2.2291481494903564, "Pretrain/Step": 9336, "Pretrain/Step Time": 8.513588095083833} +{"Pretrain/Learning Rate": 5.764019372385687e-08, "Pretrain/Loss": 2.0166115760803223, "Pretrain/Loss (Raw)": 2.061595916748047, "Pretrain/Step": 9337, "Pretrain/Step Time": 8.515139674767852} +{"Pretrain/Learning Rate": 5.706545162792454e-08, "Pretrain/Loss": 2.0164201259613037, "Pretrain/Loss (Raw)": 1.9752455949783325, "Pretrain/Step": 9338, "Pretrain/Step Time": 8.514628659933805} +{"Pretrain/Learning Rate": 5.649358606873989e-08, "Pretrain/Loss": 2.0170769691467285, "Pretrain/Loss (Raw)": 1.9875898361206055, "Pretrain/Step": 9339, "Pretrain/Step Time": 8.508592678233981} +{"Pretrain/Learning Rate": 5.5924597112250176e-08, "Pretrain/Loss": 2.016953468322754, "Pretrain/Loss (Raw)": 2.1591780185699463, "Pretrain/Step": 9340, "Pretrain/Step Time": 8.50254842825234} +{"Pretrain/Learning Rate": 5.5358484824077905e-08, "Pretrain/Loss": 2.018596649169922, "Pretrain/Loss (Raw)": 2.131140947341919, "Pretrain/Step": 9341, "Pretrain/Step Time": 8.498984517529607} +{"Pretrain/Learning Rate": 5.479524926950696e-08, "Pretrain/Loss": 2.0192432403564453, "Pretrain/Loss (Raw)": 2.1063218116760254, "Pretrain/Step": 9342, "Pretrain/Step Time": 8.511319803074002} +{"Pretrain/Learning Rate": 5.4234890513490954e-08, "Pretrain/Loss": 2.020585060119629, "Pretrain/Loss (Raw)": 2.0227906703948975, "Pretrain/Step": 9343, "Pretrain/Step Time": 8.508028157055378} +{"Pretrain/Learning Rate": 5.367740862065873e-08, "Pretrain/Loss": 2.02079176902771, "Pretrain/Loss (Raw)": 2.0569007396698, "Pretrain/Step": 9344, "Pretrain/Step Time": 8.513237120583653} +{"Pretrain/Learning Rate": 5.3122803655300533e-08, "Pretrain/Loss": 2.0218429565429688, "Pretrain/Loss (Raw)": 1.948850393295288, "Pretrain/Step": 9345, "Pretrain/Step Time": 8.509198965504766} +{"Pretrain/Learning Rate": 5.257107568137076e-08, "Pretrain/Loss": 2.0230696201324463, "Pretrain/Loss (Raw)": 1.971218466758728, "Pretrain/Step": 9346, "Pretrain/Step Time": 8.502537118270993} +{"Pretrain/Learning Rate": 5.2022224762501845e-08, "Pretrain/Loss": 2.0228211879730225, "Pretrain/Loss (Raw)": 2.0294623374938965, "Pretrain/Step": 9347, "Pretrain/Step Time": 8.503421550616622} +{"Pretrain/Learning Rate": 5.147625096199038e-08, "Pretrain/Loss": 2.0209150314331055, "Pretrain/Loss (Raw)": 1.8068897724151611, "Pretrain/Step": 9348, "Pretrain/Step Time": 8.505066337063909} +{"Pretrain/Learning Rate": 5.0933154342797105e-08, "Pretrain/Loss": 2.0210914611816406, "Pretrain/Loss (Raw)": 2.0769155025482178, "Pretrain/Step": 9349, "Pretrain/Step Time": 8.505670243874192} +{"Pretrain/Learning Rate": 5.039293496755526e-08, "Pretrain/Loss": 2.0208544731140137, "Pretrain/Loss (Raw)": 1.8564633131027222, "Pretrain/Step": 9350, "Pretrain/Step Time": 8.50753453746438} +{"Pretrain/Learning Rate": 4.9855592898567784e-08, "Pretrain/Loss": 2.02116322517395, "Pretrain/Loss (Raw)": 2.0010337829589844, "Pretrain/Step": 9351, "Pretrain/Step Time": 8.499621517956257} +{"Pretrain/Learning Rate": 4.9321128197804543e-08, "Pretrain/Loss": 2.0190792083740234, "Pretrain/Loss (Raw)": 2.019545078277588, "Pretrain/Step": 9352, "Pretrain/Step Time": 8.497955221682787} +{"Pretrain/Learning Rate": 4.8789540926896806e-08, "Pretrain/Loss": 2.018266201019287, "Pretrain/Loss (Raw)": 1.7965364456176758, "Pretrain/Step": 9353, "Pretrain/Step Time": 8.508410722017288} +{"Pretrain/Learning Rate": 4.826083114715385e-08, "Pretrain/Loss": 2.0192389488220215, "Pretrain/Loss (Raw)": 2.094132900238037, "Pretrain/Step": 9354, "Pretrain/Step Time": 8.51260543987155} +{"Pretrain/Learning Rate": 4.7734998919549135e-08, "Pretrain/Loss": 2.017184019088745, "Pretrain/Loss (Raw)": 1.972467303276062, "Pretrain/Step": 9355, "Pretrain/Step Time": 8.513560896739364} +{"Pretrain/Learning Rate": 4.7212044304723035e-08, "Pretrain/Loss": 2.01790714263916, "Pretrain/Loss (Raw)": 2.005037546157837, "Pretrain/Step": 9356, "Pretrain/Step Time": 8.518060259521008} +{"Pretrain/Learning Rate": 4.6691967362985645e-08, "Pretrain/Loss": 2.018907070159912, "Pretrain/Loss (Raw)": 2.0893609523773193, "Pretrain/Step": 9357, "Pretrain/Step Time": 8.511578707024455} +{"Pretrain/Learning Rate": 4.6174768154316764e-08, "Pretrain/Loss": 2.0231966972351074, "Pretrain/Loss (Raw)": 2.387817144393921, "Pretrain/Step": 9358, "Pretrain/Step Time": 8.504553582519293} +{"Pretrain/Learning Rate": 4.566044673835479e-08, "Pretrain/Loss": 2.021998882293701, "Pretrain/Loss (Raw)": 1.9016505479812622, "Pretrain/Step": 9359, "Pretrain/Step Time": 8.506164904683828} +{"Pretrain/Learning Rate": 4.514900317442172e-08, "Pretrain/Loss": 2.0217795372009277, "Pretrain/Loss (Raw)": 1.8873203992843628, "Pretrain/Step": 9360, "Pretrain/Step Time": 8.50799865834415} +{"Pretrain/Learning Rate": 4.464043752149816e-08, "Pretrain/Loss": 2.0188114643096924, "Pretrain/Loss (Raw)": 1.8437013626098633, "Pretrain/Step": 9361, "Pretrain/Step Time": 8.509258901700377} +{"Pretrain/Learning Rate": 4.413474983823163e-08, "Pretrain/Loss": 2.0179600715637207, "Pretrain/Loss (Raw)": 2.059246301651001, "Pretrain/Step": 9362, "Pretrain/Step Time": 8.50828343257308} +{"Pretrain/Learning Rate": 4.363194018293937e-08, "Pretrain/Loss": 2.019656181335449, "Pretrain/Loss (Raw)": 2.012012243270874, "Pretrain/Step": 9363, "Pretrain/Step Time": 8.50340492092073} +{"Pretrain/Learning Rate": 4.313200861361388e-08, "Pretrain/Loss": 2.0202503204345703, "Pretrain/Loss (Raw)": 2.0485501289367676, "Pretrain/Step": 9364, "Pretrain/Step Time": 8.498842945322394} +{"Pretrain/Learning Rate": 4.2634955187900727e-08, "Pretrain/Loss": 2.0206234455108643, "Pretrain/Loss (Raw)": 2.0204918384552, "Pretrain/Step": 9365, "Pretrain/Step Time": 8.505299214273691} +{"Pretrain/Learning Rate": 4.2140779963131815e-08, "Pretrain/Loss": 2.0214526653289795, "Pretrain/Loss (Raw)": 2.039982795715332, "Pretrain/Step": 9366, "Pretrain/Step Time": 8.507109733298421} +{"Pretrain/Learning Rate": 4.164948299629212e-08, "Pretrain/Loss": 2.021362066268921, "Pretrain/Loss (Raw)": 2.0082902908325195, "Pretrain/Step": 9367, "Pretrain/Step Time": 8.507692461833358} +{"Pretrain/Learning Rate": 4.1161064344041875e-08, "Pretrain/Loss": 2.021289348602295, "Pretrain/Loss (Raw)": 2.007328748703003, "Pretrain/Step": 9368, "Pretrain/Step Time": 8.512083809822798} +{"Pretrain/Learning Rate": 4.0675524062708245e-08, "Pretrain/Loss": 2.022888660430908, "Pretrain/Loss (Raw)": 2.1434333324432373, "Pretrain/Step": 9369, "Pretrain/Step Time": 8.501699943095446} +{"Pretrain/Learning Rate": 4.019286220828255e-08, "Pretrain/Loss": 2.022780179977417, "Pretrain/Loss (Raw)": 2.017848014831543, "Pretrain/Step": 9370, "Pretrain/Step Time": 8.501100845634937} +{"Pretrain/Learning Rate": 3.971307883643416e-08, "Pretrain/Loss": 2.0233731269836426, "Pretrain/Loss (Raw)": 2.180562734603882, "Pretrain/Step": 9371, "Pretrain/Step Time": 8.504854433238506} +{"Pretrain/Learning Rate": 3.923617400248825e-08, "Pretrain/Loss": 2.0213804244995117, "Pretrain/Loss (Raw)": 1.7658554315567017, "Pretrain/Step": 9372, "Pretrain/Step Time": 8.516633873805404} +{"Pretrain/Learning Rate": 3.876214776144527e-08, "Pretrain/Loss": 2.020211935043335, "Pretrain/Loss (Raw)": 1.9470133781433105, "Pretrain/Step": 9373, "Pretrain/Step Time": 8.517633143812418} +{"Pretrain/Learning Rate": 3.8291000167972604e-08, "Pretrain/Loss": 2.022944688796997, "Pretrain/Loss (Raw)": 1.9830365180969238, "Pretrain/Step": 9374, "Pretrain/Step Time": 8.51733773201704} +{"Pretrain/Learning Rate": 3.782273127640734e-08, "Pretrain/Loss": 2.022430658340454, "Pretrain/Loss (Raw)": 1.9123386144638062, "Pretrain/Step": 9375, "Pretrain/Step Time": 8.505467677488923} +{"Pretrain/Learning Rate": 3.735734114074796e-08, "Pretrain/Loss": 2.0193796157836914, "Pretrain/Loss (Raw)": 1.8369152545928955, "Pretrain/Step": 9376, "Pretrain/Step Time": 8.507187593728304} +{"Pretrain/Learning Rate": 3.6894829814668185e-08, "Pretrain/Loss": 2.0199601650238037, "Pretrain/Loss (Raw)": 2.106509208679199, "Pretrain/Step": 9377, "Pretrain/Step Time": 8.514775009825826} +{"Pretrain/Learning Rate": 3.643519735150869e-08, "Pretrain/Loss": 2.018388271331787, "Pretrain/Loss (Raw)": 1.8257927894592285, "Pretrain/Step": 9378, "Pretrain/Step Time": 8.516888676211238} +{"Pretrain/Learning Rate": 3.5978443804274286e-08, "Pretrain/Loss": 2.017834186553955, "Pretrain/Loss (Raw)": 2.0346972942352295, "Pretrain/Step": 9379, "Pretrain/Step Time": 8.517134597525} +{"Pretrain/Learning Rate": 3.552456922563674e-08, "Pretrain/Loss": 2.018963575363159, "Pretrain/Loss (Raw)": 2.207939863204956, "Pretrain/Step": 9380, "Pretrain/Step Time": 8.5178651958704} +{"Pretrain/Learning Rate": 3.5073573667945836e-08, "Pretrain/Loss": 2.019688844680786, "Pretrain/Loss (Raw)": 2.134472608566284, "Pretrain/Step": 9381, "Pretrain/Step Time": 8.511966206133366} +{"Pretrain/Learning Rate": 3.46254571832072e-08, "Pretrain/Loss": 2.018982410430908, "Pretrain/Loss (Raw)": 2.122659683227539, "Pretrain/Step": 9382, "Pretrain/Step Time": 8.511736733838916} +{"Pretrain/Learning Rate": 3.418021982310171e-08, "Pretrain/Loss": 2.020836353302002, "Pretrain/Loss (Raw)": 1.9022538661956787, "Pretrain/Step": 9383, "Pretrain/Step Time": 8.513019615784287} +{"Pretrain/Learning Rate": 3.3737861638977184e-08, "Pretrain/Loss": 2.0191917419433594, "Pretrain/Loss (Raw)": 2.0067121982574463, "Pretrain/Step": 9384, "Pretrain/Step Time": 8.523170582950115} +{"Pretrain/Learning Rate": 3.3298382681845595e-08, "Pretrain/Loss": 2.019594192504883, "Pretrain/Loss (Raw)": 2.025181770324707, "Pretrain/Step": 9385, "Pretrain/Step Time": 8.522691080346704} +{"Pretrain/Learning Rate": 3.28617830023914e-08, "Pretrain/Loss": 2.0197641849517822, "Pretrain/Loss (Raw)": 2.0615463256835938, "Pretrain/Step": 9386, "Pretrain/Step Time": 8.517360035330057} +{"Pretrain/Learning Rate": 3.242806265096876e-08, "Pretrain/Loss": 2.022519111633301, "Pretrain/Loss (Raw)": 2.447605848312378, "Pretrain/Step": 9387, "Pretrain/Step Time": 8.516040252521634} +{"Pretrain/Learning Rate": 3.199722167759045e-08, "Pretrain/Loss": 2.022599697113037, "Pretrain/Loss (Raw)": 2.073890209197998, "Pretrain/Step": 9388, "Pretrain/Step Time": 8.515932224690914} +{"Pretrain/Learning Rate": 3.15692601319445e-08, "Pretrain/Loss": 2.026789426803589, "Pretrain/Loss (Raw)": 2.4513344764709473, "Pretrain/Step": 9389, "Pretrain/Step Time": 8.522678153589368} +{"Pretrain/Learning Rate": 3.114417806338865e-08, "Pretrain/Loss": 2.026036500930786, "Pretrain/Loss (Raw)": 1.9698001146316528, "Pretrain/Step": 9390, "Pretrain/Step Time": 8.528653033077717} +{"Pretrain/Learning Rate": 3.072197552094203e-08, "Pretrain/Loss": 2.024857521057129, "Pretrain/Loss (Raw)": 2.0010106563568115, "Pretrain/Step": 9391, "Pretrain/Step Time": 8.529406676068902} +{"Pretrain/Learning Rate": 3.0302652553296226e-08, "Pretrain/Loss": 2.027057409286499, "Pretrain/Loss (Raw)": 2.0767979621887207, "Pretrain/Step": 9392, "Pretrain/Step Time": 8.525774689391255} +{"Pretrain/Learning Rate": 2.98862092088098e-08, "Pretrain/Loss": 2.0278000831604004, "Pretrain/Loss (Raw)": 2.0972585678100586, "Pretrain/Step": 9393, "Pretrain/Step Time": 8.526641506701708} +{"Pretrain/Learning Rate": 2.947264553551099e-08, "Pretrain/Loss": 2.02902889251709, "Pretrain/Loss (Raw)": 2.234924793243408, "Pretrain/Step": 9394, "Pretrain/Step Time": 8.51848248578608} +{"Pretrain/Learning Rate": 2.9061961581089424e-08, "Pretrain/Loss": 2.0265750885009766, "Pretrain/Loss (Raw)": 1.8495310544967651, "Pretrain/Step": 9395, "Pretrain/Step Time": 8.51192968338728} +{"Pretrain/Learning Rate": 2.8654157392909997e-08, "Pretrain/Loss": 2.0257604122161865, "Pretrain/Loss (Raw)": 2.0464282035827637, "Pretrain/Step": 9396, "Pretrain/Step Time": 8.522886842489243} +{"Pretrain/Learning Rate": 2.824923301800175e-08, "Pretrain/Loss": 2.0271620750427246, "Pretrain/Loss (Raw)": 2.1954991817474365, "Pretrain/Step": 9397, "Pretrain/Step Time": 8.52474144473672} +{"Pretrain/Learning Rate": 2.7847188503063447e-08, "Pretrain/Loss": 2.029921054840088, "Pretrain/Loss (Raw)": 2.2152936458587646, "Pretrain/Step": 9398, "Pretrain/Step Time": 8.523991161957383} +{"Pretrain/Learning Rate": 2.7448023894457997e-08, "Pretrain/Loss": 2.02662992477417, "Pretrain/Loss (Raw)": 1.793409824371338, "Pretrain/Step": 9399, "Pretrain/Step Time": 8.513139521703124} +{"Pretrain/Learning Rate": 2.7051739238223572e-08, "Pretrain/Loss": 2.025999069213867, "Pretrain/Loss (Raw)": 1.943522572517395, "Pretrain/Step": 9400, "Pretrain/Step Time": 8.509830286726356} +{"Pretrain/Learning Rate": 2.6658334580056954e-08, "Pretrain/Loss": 2.02708101272583, "Pretrain/Loss (Raw)": 2.122417449951172, "Pretrain/Step": 9401, "Pretrain/Step Time": 8.51405968517065} +{"Pretrain/Learning Rate": 2.626780996533018e-08, "Pretrain/Loss": 2.024807929992676, "Pretrain/Loss (Raw)": 1.877575159072876, "Pretrain/Step": 9402, "Pretrain/Step Time": 8.52119878679514} +{"Pretrain/Learning Rate": 2.588016543907945e-08, "Pretrain/Loss": 2.0274925231933594, "Pretrain/Loss (Raw)": 2.3813655376434326, "Pretrain/Step": 9403, "Pretrain/Step Time": 8.523817848414183} +{"Pretrain/Learning Rate": 2.549540104601067e-08, "Pretrain/Loss": 2.0275068283081055, "Pretrain/Loss (Raw)": 2.096548318862915, "Pretrain/Step": 9404, "Pretrain/Step Time": 8.51598896831274} +{"Pretrain/Learning Rate": 2.5113516830493898e-08, "Pretrain/Loss": 2.02713680267334, "Pretrain/Loss (Raw)": 2.144880771636963, "Pretrain/Step": 9405, "Pretrain/Step Time": 8.515227658674121} +{"Pretrain/Learning Rate": 2.4734512836574465e-08, "Pretrain/Loss": 2.0268282890319824, "Pretrain/Loss (Raw)": 1.8237156867980957, "Pretrain/Step": 9406, "Pretrain/Step Time": 8.508805051445961} +{"Pretrain/Learning Rate": 2.4358389107956292e-08, "Pretrain/Loss": 2.027550220489502, "Pretrain/Loss (Raw)": 2.0725698471069336, "Pretrain/Step": 9407, "Pretrain/Step Time": 8.512698808684945} +{"Pretrain/Learning Rate": 2.3985145688018575e-08, "Pretrain/Loss": 2.0281765460968018, "Pretrain/Loss (Raw)": 2.097644090652466, "Pretrain/Step": 9408, "Pretrain/Step Time": 8.51893749088049} +{"Pretrain/Learning Rate": 2.361478261980743e-08, "Pretrain/Loss": 2.0254368782043457, "Pretrain/Loss (Raw)": 1.6662847995758057, "Pretrain/Step": 9409, "Pretrain/Step Time": 8.521487155929208} +{"Pretrain/Learning Rate": 2.324729994602759e-08, "Pretrain/Loss": 2.0248639583587646, "Pretrain/Loss (Raw)": 1.9304817914962769, "Pretrain/Step": 9410, "Pretrain/Step Time": 8.52354221045971} +{"Pretrain/Learning Rate": 2.288269770906737e-08, "Pretrain/Loss": 2.0232110023498535, "Pretrain/Loss (Raw)": 1.9758508205413818, "Pretrain/Step": 9411, "Pretrain/Step Time": 8.52060736157} +{"Pretrain/Learning Rate": 2.2520975950968137e-08, "Pretrain/Loss": 2.0257375240325928, "Pretrain/Loss (Raw)": 2.053366184234619, "Pretrain/Step": 9412, "Pretrain/Step Time": 8.518178835511208} +{"Pretrain/Learning Rate": 2.2162134713446524e-08, "Pretrain/Loss": 2.0272929668426514, "Pretrain/Loss (Raw)": 2.2976274490356445, "Pretrain/Step": 9413, "Pretrain/Step Time": 8.512089245021343} +{"Pretrain/Learning Rate": 2.1806174037888872e-08, "Pretrain/Loss": 2.027313709259033, "Pretrain/Loss (Raw)": 1.8551242351531982, "Pretrain/Step": 9414, "Pretrain/Step Time": 8.512960746884346} +{"Pretrain/Learning Rate": 2.1453093965342896e-08, "Pretrain/Loss": 2.0282323360443115, "Pretrain/Loss (Raw)": 2.177713632583618, "Pretrain/Step": 9415, "Pretrain/Step Time": 8.515901425853372} +{"Pretrain/Learning Rate": 2.110289453653158e-08, "Pretrain/Loss": 2.0286624431610107, "Pretrain/Loss (Raw)": 2.072479724884033, "Pretrain/Step": 9416, "Pretrain/Step Time": 8.51585909537971} +{"Pretrain/Learning Rate": 2.0755575791836513e-08, "Pretrain/Loss": 2.030521869659424, "Pretrain/Loss (Raw)": 1.8866437673568726, "Pretrain/Step": 9417, "Pretrain/Step Time": 8.513500912114978} +{"Pretrain/Learning Rate": 2.041113777131731e-08, "Pretrain/Loss": 2.0296478271484375, "Pretrain/Loss (Raw)": 1.9563229084014893, "Pretrain/Step": 9418, "Pretrain/Step Time": 8.507482746616006} +{"Pretrain/Learning Rate": 2.0069580514689435e-08, "Pretrain/Loss": 2.0277438163757324, "Pretrain/Loss (Raw)": 1.959943413734436, "Pretrain/Step": 9419, "Pretrain/Step Time": 8.515433963388205} +{"Pretrain/Learning Rate": 1.9730904061349143e-08, "Pretrain/Loss": 2.0256526470184326, "Pretrain/Loss (Raw)": 1.9806164503097534, "Pretrain/Step": 9420, "Pretrain/Step Time": 8.51535152643919} +{"Pretrain/Learning Rate": 1.939510845035131e-08, "Pretrain/Loss": 2.0249431133270264, "Pretrain/Loss (Raw)": 1.970080018043518, "Pretrain/Step": 9421, "Pretrain/Step Time": 8.512204820290208} +{"Pretrain/Learning Rate": 1.9062193720423284e-08, "Pretrain/Loss": 2.0262179374694824, "Pretrain/Loss (Raw)": 2.1973178386688232, "Pretrain/Step": 9422, "Pretrain/Step Time": 8.50857750698924} +{"Pretrain/Learning Rate": 1.8732159909956583e-08, "Pretrain/Loss": 2.02500581741333, "Pretrain/Loss (Raw)": 1.8891252279281616, "Pretrain/Step": 9423, "Pretrain/Step Time": 8.502370163798332} +{"Pretrain/Learning Rate": 1.8405007057012425e-08, "Pretrain/Loss": 2.023292303085327, "Pretrain/Loss (Raw)": 1.7588127851486206, "Pretrain/Step": 9424, "Pretrain/Step Time": 8.497861301526427} +{"Pretrain/Learning Rate": 1.8080735199318966e-08, "Pretrain/Loss": 2.019818067550659, "Pretrain/Loss (Raw)": 1.4143726825714111, "Pretrain/Step": 9425, "Pretrain/Step Time": 8.500654505565763} +{"Pretrain/Learning Rate": 1.775934437427684e-08, "Pretrain/Loss": 2.0195655822753906, "Pretrain/Loss (Raw)": 2.136098861694336, "Pretrain/Step": 9426, "Pretrain/Step Time": 8.503219028934836} +{"Pretrain/Learning Rate": 1.7440834618945302e-08, "Pretrain/Loss": 2.0201640129089355, "Pretrain/Loss (Raw)": 1.9461129903793335, "Pretrain/Step": 9427, "Pretrain/Step Time": 8.504774453118443} +{"Pretrain/Learning Rate": 1.7125205970058843e-08, "Pretrain/Loss": 2.0198705196380615, "Pretrain/Loss (Raw)": 2.0730957984924316, "Pretrain/Step": 9428, "Pretrain/Step Time": 8.504452008754015} +{"Pretrain/Learning Rate": 1.681245846401336e-08, "Pretrain/Loss": 2.0222008228302, "Pretrain/Loss (Raw)": 2.2767465114593506, "Pretrain/Step": 9429, "Pretrain/Step Time": 8.494740346446633} +{"Pretrain/Learning Rate": 1.650259213688554e-08, "Pretrain/Loss": 2.021989345550537, "Pretrain/Loss (Raw)": 1.9887185096740723, "Pretrain/Step": 9430, "Pretrain/Step Time": 8.50039297901094} +{"Pretrain/Learning Rate": 1.6195607024399593e-08, "Pretrain/Loss": 2.0227510929107666, "Pretrain/Loss (Raw)": 2.0478665828704834, "Pretrain/Step": 9431, "Pretrain/Step Time": 8.50610913708806} +{"Pretrain/Learning Rate": 1.5891503161968857e-08, "Pretrain/Loss": 2.022134304046631, "Pretrain/Loss (Raw)": 1.9149143695831299, "Pretrain/Step": 9432, "Pretrain/Step Time": 8.507353816181421} +{"Pretrain/Learning Rate": 1.559028058465417e-08, "Pretrain/Loss": 2.0219383239746094, "Pretrain/Loss (Raw)": 2.0632989406585693, "Pretrain/Step": 9433, "Pretrain/Step Time": 8.510731808841228} +{"Pretrain/Learning Rate": 1.5291939327202742e-08, "Pretrain/Loss": 2.0228419303894043, "Pretrain/Loss (Raw)": 2.1467032432556152, "Pretrain/Step": 9434, "Pretrain/Step Time": 8.50756311789155} +{"Pretrain/Learning Rate": 1.499647942401483e-08, "Pretrain/Loss": 2.0224196910858154, "Pretrain/Loss (Raw)": 2.0935184955596924, "Pretrain/Step": 9435, "Pretrain/Step Time": 8.507647663354874} +{"Pretrain/Learning Rate": 1.4703900909165957e-08, "Pretrain/Loss": 2.021634578704834, "Pretrain/Loss (Raw)": 2.0172853469848633, "Pretrain/Step": 9436, "Pretrain/Step Time": 8.503976644948125} +{"Pretrain/Learning Rate": 1.4414203816398574e-08, "Pretrain/Loss": 2.0249381065368652, "Pretrain/Loss (Raw)": 2.18076753616333, "Pretrain/Step": 9437, "Pretrain/Step Time": 8.508968368172646} +{"Pretrain/Learning Rate": 1.4127388179119294e-08, "Pretrain/Loss": 2.022148370742798, "Pretrain/Loss (Raw)": 1.6907912492752075, "Pretrain/Step": 9438, "Pretrain/Step Time": 8.511007875204086} +{"Pretrain/Learning Rate": 1.3843454030409986e-08, "Pretrain/Loss": 2.020545721054077, "Pretrain/Loss (Raw)": 1.8868621587753296, "Pretrain/Step": 9439, "Pretrain/Step Time": 8.510629231110215} +{"Pretrain/Learning Rate": 1.3562401403008352e-08, "Pretrain/Loss": 2.020601511001587, "Pretrain/Loss (Raw)": 1.952608346939087, "Pretrain/Step": 9440, "Pretrain/Step Time": 8.504997318610549} +{"Pretrain/Learning Rate": 1.3284230329332902e-08, "Pretrain/Loss": 2.0215370655059814, "Pretrain/Loss (Raw)": 2.058547258377075, "Pretrain/Step": 9441, "Pretrain/Step Time": 8.498155813664198} +{"Pretrain/Learning Rate": 1.3008940841460759e-08, "Pretrain/Loss": 2.021646022796631, "Pretrain/Loss (Raw)": 1.9571869373321533, "Pretrain/Step": 9442, "Pretrain/Step Time": 8.49884931370616} +{"Pretrain/Learning Rate": 1.2736532971141523e-08, "Pretrain/Loss": 2.019627094268799, "Pretrain/Loss (Raw)": 1.900691270828247, "Pretrain/Step": 9443, "Pretrain/Step Time": 8.504173761233687} +{"Pretrain/Learning Rate": 1.2467006749788956e-08, "Pretrain/Loss": 2.019078254699707, "Pretrain/Loss (Raw)": 1.963161826133728, "Pretrain/Step": 9444, "Pretrain/Step Time": 8.51024573855102} +{"Pretrain/Learning Rate": 1.2200362208483751e-08, "Pretrain/Loss": 2.017551898956299, "Pretrain/Loss (Raw)": 2.0038414001464844, "Pretrain/Step": 9445, "Pretrain/Step Time": 8.512781051918864} +{"Pretrain/Learning Rate": 1.1936599377981861e-08, "Pretrain/Loss": 2.0186400413513184, "Pretrain/Loss (Raw)": 2.0884013175964355, "Pretrain/Step": 9446, "Pretrain/Step Time": 8.504220925271511} +{"Pretrain/Learning Rate": 1.1675718288697845e-08, "Pretrain/Loss": 2.019191026687622, "Pretrain/Loss (Raw)": 2.036783218383789, "Pretrain/Step": 9447, "Pretrain/Step Time": 8.499890459701419} +{"Pretrain/Learning Rate": 1.1417718970718749e-08, "Pretrain/Loss": 2.0211181640625, "Pretrain/Loss (Raw)": 2.061304807662964, "Pretrain/Step": 9448, "Pretrain/Step Time": 8.50156337581575} +{"Pretrain/Learning Rate": 1.1162601453798549e-08, "Pretrain/Loss": 2.0219669342041016, "Pretrain/Loss (Raw)": 2.3480818271636963, "Pretrain/Step": 9449, "Pretrain/Step Time": 8.514229597523808} +{"Pretrain/Learning Rate": 1.0910365767358155e-08, "Pretrain/Loss": 2.0218958854675293, "Pretrain/Loss (Raw)": 1.9560672044754028, "Pretrain/Step": 9450, "Pretrain/Step Time": 8.51628734357655} +{"Pretrain/Learning Rate": 1.0661011940488186e-08, "Pretrain/Loss": 2.022505283355713, "Pretrain/Loss (Raw)": 2.115137815475464, "Pretrain/Step": 9451, "Pretrain/Step Time": 8.511915123090148} +{"Pretrain/Learning Rate": 1.0414540001943418e-08, "Pretrain/Loss": 2.0218706130981445, "Pretrain/Loss (Raw)": 1.948293685913086, "Pretrain/Step": 9452, "Pretrain/Step Time": 8.50106742605567} +{"Pretrain/Learning Rate": 1.017094998014556e-08, "Pretrain/Loss": 2.0225167274475098, "Pretrain/Loss (Raw)": 2.0959632396698, "Pretrain/Step": 9453, "Pretrain/Step Time": 8.500891199335456} +{"Pretrain/Learning Rate": 9.93024190319436e-09, "Pretrain/Loss": 2.024967670440674, "Pretrain/Loss (Raw)": 2.41568922996521, "Pretrain/Step": 9454, "Pretrain/Step Time": 8.504388390108943} +{"Pretrain/Learning Rate": 9.692415798842614e-09, "Pretrain/Loss": 2.027353048324585, "Pretrain/Loss (Raw)": 2.111799716949463, "Pretrain/Step": 9455, "Pretrain/Step Time": 8.508166089653969} +{"Pretrain/Learning Rate": 9.457471694518383e-09, "Pretrain/Loss": 2.025573968887329, "Pretrain/Loss (Raw)": 2.109713554382324, "Pretrain/Step": 9456, "Pretrain/Step Time": 8.512294117361307} +{"Pretrain/Learning Rate": 9.225409617319436e-09, "Pretrain/Loss": 2.027024269104004, "Pretrain/Loss (Raw)": 1.9864399433135986, "Pretrain/Step": 9457, "Pretrain/Step Time": 8.506330640986562} +{"Pretrain/Learning Rate": 8.996229594007699e-09, "Pretrain/Loss": 2.0264086723327637, "Pretrain/Loss (Raw)": 1.9816445112228394, "Pretrain/Step": 9458, "Pretrain/Step Time": 8.505929274484515} +{"Pretrain/Learning Rate": 8.769931651009255e-09, "Pretrain/Loss": 2.0282506942749023, "Pretrain/Loss (Raw)": 2.278832197189331, "Pretrain/Step": 9459, "Pretrain/Step Time": 8.50285973586142} +{"Pretrain/Learning Rate": 8.546515814425449e-09, "Pretrain/Loss": 2.030566453933716, "Pretrain/Loss (Raw)": 2.016009569168091, "Pretrain/Step": 9460, "Pretrain/Step Time": 8.50818882510066} +{"Pretrain/Learning Rate": 8.325982110024554e-09, "Pretrain/Loss": 2.027489185333252, "Pretrain/Loss (Raw)": 1.7908222675323486, "Pretrain/Step": 9461, "Pretrain/Step Time": 8.506281390786171} +{"Pretrain/Learning Rate": 8.108330563233458e-09, "Pretrain/Loss": 2.0256195068359375, "Pretrain/Loss (Raw)": 1.7790806293487549, "Pretrain/Step": 9462, "Pretrain/Step Time": 8.509550660848618} +{"Pretrain/Learning Rate": 7.893561199154297e-09, "Pretrain/Loss": 2.027554512023926, "Pretrain/Loss (Raw)": 2.2239344120025635, "Pretrain/Step": 9463, "Pretrain/Step Time": 8.505150785669684} +{"Pretrain/Learning Rate": 7.681674042558928e-09, "Pretrain/Loss": 2.0268616676330566, "Pretrain/Loss (Raw)": 2.140439987182617, "Pretrain/Step": 9464, "Pretrain/Step Time": 8.502066668123007} +{"Pretrain/Learning Rate": 7.472669117877807e-09, "Pretrain/Loss": 2.026395797729492, "Pretrain/Loss (Raw)": 2.002002477645874, "Pretrain/Step": 9465, "Pretrain/Step Time": 8.498090332373977} +{"Pretrain/Learning Rate": 7.266546449219424e-09, "Pretrain/Loss": 2.027894973754883, "Pretrain/Loss (Raw)": 2.1670989990234375, "Pretrain/Step": 9466, "Pretrain/Step Time": 8.504707617685199} +{"Pretrain/Learning Rate": 7.0633060603508825e-09, "Pretrain/Loss": 2.024651050567627, "Pretrain/Loss (Raw)": 1.5723720788955688, "Pretrain/Step": 9467, "Pretrain/Step Time": 8.512997686862946} +{"Pretrain/Learning Rate": 6.862947974711764e-09, "Pretrain/Loss": 2.0232162475585938, "Pretrain/Loss (Raw)": 1.9755314588546753, "Pretrain/Step": 9468, "Pretrain/Step Time": 8.514853604137897} +{"Pretrain/Learning Rate": 6.665472215411361e-09, "Pretrain/Loss": 2.022672653198242, "Pretrain/Loss (Raw)": 2.0615577697753906, "Pretrain/Step": 9469, "Pretrain/Step Time": 8.518580866977572} +{"Pretrain/Learning Rate": 6.470878805220348e-09, "Pretrain/Loss": 2.022035837173462, "Pretrain/Loss (Raw)": 2.024824857711792, "Pretrain/Step": 9470, "Pretrain/Step Time": 8.505642216652632} +{"Pretrain/Learning Rate": 6.279167766579108e-09, "Pretrain/Loss": 2.0206425189971924, "Pretrain/Loss (Raw)": 1.8444370031356812, "Pretrain/Step": 9471, "Pretrain/Step Time": 8.507755413651466} +{"Pretrain/Learning Rate": 6.090339121600508e-09, "Pretrain/Loss": 2.019392967224121, "Pretrain/Loss (Raw)": 1.8969430923461914, "Pretrain/Step": 9472, "Pretrain/Step Time": 8.50942426174879} +{"Pretrain/Learning Rate": 5.904392892058796e-09, "Pretrain/Loss": 2.017957925796509, "Pretrain/Loss (Raw)": 1.7651801109313965, "Pretrain/Step": 9473, "Pretrain/Step Time": 8.513218596577644} +{"Pretrain/Learning Rate": 5.721329099400707e-09, "Pretrain/Loss": 2.0167126655578613, "Pretrain/Loss (Raw)": 1.81183922290802, "Pretrain/Step": 9474, "Pretrain/Step Time": 8.518320364877582} +{"Pretrain/Learning Rate": 5.54114776473158e-09, "Pretrain/Loss": 2.015681266784668, "Pretrain/Loss (Raw)": 1.8974109888076782, "Pretrain/Step": 9475, "Pretrain/Step Time": 8.515188651159406} +{"Pretrain/Learning Rate": 5.363848908837565e-09, "Pretrain/Loss": 2.018061399459839, "Pretrain/Loss (Raw)": 2.1115596294403076, "Pretrain/Step": 9476, "Pretrain/Step Time": 8.509298572316766} +{"Pretrain/Learning Rate": 5.1894325521634205e-09, "Pretrain/Loss": 2.01775860786438, "Pretrain/Loss (Raw)": 2.038141965866089, "Pretrain/Step": 9477, "Pretrain/Step Time": 8.51073936931789} +{"Pretrain/Learning Rate": 5.01789871482361e-09, "Pretrain/Loss": 2.0187582969665527, "Pretrain/Loss (Raw)": 1.9844311475753784, "Pretrain/Step": 9478, "Pretrain/Step Time": 8.517178475856781} +{"Pretrain/Learning Rate": 4.849247416599534e-09, "Pretrain/Loss": 2.0182688236236572, "Pretrain/Loss (Raw)": 1.9384011030197144, "Pretrain/Step": 9479, "Pretrain/Step Time": 8.519569030031562} +{"Pretrain/Learning Rate": 4.683478676939523e-09, "Pretrain/Loss": 2.0191352367401123, "Pretrain/Loss (Raw)": 2.130423069000244, "Pretrain/Step": 9480, "Pretrain/Step Time": 8.524449924007058} +{"Pretrain/Learning Rate": 4.520592514964395e-09, "Pretrain/Loss": 2.0219287872314453, "Pretrain/Loss (Raw)": 2.1541171073913574, "Pretrain/Step": 9481, "Pretrain/Step Time": 8.516057038679719} +{"Pretrain/Learning Rate": 4.360588949456345e-09, "Pretrain/Loss": 2.0217480659484863, "Pretrain/Loss (Raw)": 2.0710203647613525, "Pretrain/Step": 9482, "Pretrain/Step Time": 8.511683873832226} +{"Pretrain/Learning Rate": 4.203467998867283e-09, "Pretrain/Loss": 2.022648811340332, "Pretrain/Loss (Raw)": 2.0877416133880615, "Pretrain/Step": 9483, "Pretrain/Step Time": 8.511013578623533} +{"Pretrain/Learning Rate": 4.049229681321598e-09, "Pretrain/Loss": 2.0199782848358154, "Pretrain/Loss (Raw)": 1.663196325302124, "Pretrain/Step": 9484, "Pretrain/Step Time": 8.515134247019887} +{"Pretrain/Learning Rate": 3.897874014599512e-09, "Pretrain/Loss": 2.0192174911499023, "Pretrain/Loss (Raw)": 1.9919732809066772, "Pretrain/Step": 9485, "Pretrain/Step Time": 8.518866017460823} +{"Pretrain/Learning Rate": 3.749401016162058e-09, "Pretrain/Loss": 2.015138626098633, "Pretrain/Loss (Raw)": 1.8657665252685547, "Pretrain/Step": 9486, "Pretrain/Step Time": 8.52369231544435} +{"Pretrain/Learning Rate": 3.603810703131649e-09, "Pretrain/Loss": 2.0142736434936523, "Pretrain/Loss (Raw)": 1.7909414768218994, "Pretrain/Step": 9487, "Pretrain/Step Time": 8.519997872412205} +{"Pretrain/Learning Rate": 3.4611030922948595e-09, "Pretrain/Loss": 2.0157036781311035, "Pretrain/Loss (Raw)": 2.0703325271606445, "Pretrain/Step": 9488, "Pretrain/Step Time": 8.515389297157526} +{"Pretrain/Learning Rate": 3.3212782001107444e-09, "Pretrain/Loss": 2.01798152923584, "Pretrain/Loss (Raw)": 2.1352827548980713, "Pretrain/Step": 9489, "Pretrain/Step Time": 8.512596333399415} +{"Pretrain/Learning Rate": 3.1843360427052937e-09, "Pretrain/Loss": 2.015773296356201, "Pretrain/Loss (Raw)": 1.776570200920105, "Pretrain/Step": 9490, "Pretrain/Step Time": 8.517110323533416} +{"Pretrain/Learning Rate": 3.0502766358714297e-09, "Pretrain/Loss": 2.015188694000244, "Pretrain/Loss (Raw)": 1.9371904134750366, "Pretrain/Step": 9491, "Pretrain/Step Time": 8.52081598341465} +{"Pretrain/Learning Rate": 2.919099995069008e-09, "Pretrain/Loss": 2.014554023742676, "Pretrain/Loss (Raw)": 1.9673041105270386, "Pretrain/Step": 9492, "Pretrain/Step Time": 8.523004474118352} +{"Pretrain/Learning Rate": 2.790806135427593e-09, "Pretrain/Loss": 2.013885021209717, "Pretrain/Loss (Raw)": 1.9348806142807007, "Pretrain/Step": 9493, "Pretrain/Step Time": 8.517993098124862} +{"Pretrain/Learning Rate": 2.665395071740906e-09, "Pretrain/Loss": 2.0140857696533203, "Pretrain/Loss (Raw)": 2.065680980682373, "Pretrain/Step": 9494, "Pretrain/Step Time": 8.51412315480411} +{"Pretrain/Learning Rate": 2.5428668184696024e-09, "Pretrain/Loss": 2.0136964321136475, "Pretrain/Loss (Raw)": 1.9584466218948364, "Pretrain/Step": 9495, "Pretrain/Step Time": 8.51769134402275} +{"Pretrain/Learning Rate": 2.423221389749597e-09, "Pretrain/Loss": 2.0132484436035156, "Pretrain/Loss (Raw)": 1.9499930143356323, "Pretrain/Step": 9496, "Pretrain/Step Time": 8.49259253963828} +{"Pretrain/Learning Rate": 2.306458799372635e-09, "Pretrain/Loss": 2.0110459327697754, "Pretrain/Loss (Raw)": 1.8614938259124756, "Pretrain/Step": 9497, "Pretrain/Step Time": 8.534778298810124} +{"Pretrain/Learning Rate": 2.192579060811273e-09, "Pretrain/Loss": 2.0093657970428467, "Pretrain/Loss (Raw)": 1.8027899265289307, "Pretrain/Step": 9498, "Pretrain/Step Time": 8.549241187050939} +{"Pretrain/Learning Rate": 2.081582187193898e-09, "Pretrain/Loss": 2.007500410079956, "Pretrain/Loss (Raw)": 1.9418128728866577, "Pretrain/Step": 9499, "Pretrain/Step Time": 8.56787907332182} +{"Pretrain/Learning Rate": 1.9734681913213815e-09, "Pretrain/Loss": 2.0104432106018066, "Pretrain/Loss (Raw)": 2.142514944076538, "Pretrain/Step": 9500, "Pretrain/Step Time": 8.58072722516954} +{"Pretrain/Learning Rate": 1.868237085664304e-09, "Pretrain/Loss": 2.0105762481689453, "Pretrain/Loss (Raw)": 1.9640330076217651, "Pretrain/Step": 9501, "Pretrain/Step Time": 8.597722712904215} +{"Pretrain/Learning Rate": 1.7658888823574027e-09, "Pretrain/Loss": 2.0092782974243164, "Pretrain/Loss (Raw)": 1.8169195652008057, "Pretrain/Step": 9502, "Pretrain/Step Time": 8.59415271691978} +{"Pretrain/Learning Rate": 1.6664235932051243e-09, "Pretrain/Loss": 2.0088772773742676, "Pretrain/Loss (Raw)": 1.8610185384750366, "Pretrain/Step": 9503, "Pretrain/Step Time": 8.609003212302923} +{"Pretrain/Learning Rate": 1.5698412296760723e-09, "Pretrain/Loss": 2.0070173740386963, "Pretrain/Loss (Raw)": 1.5988281965255737, "Pretrain/Step": 9504, "Pretrain/Step Time": 8.61235236003995} +{"Pretrain/Learning Rate": 1.4761418029085593e-09, "Pretrain/Loss": 2.005296230316162, "Pretrain/Loss (Raw)": 1.8862121105194092, "Pretrain/Step": 9505, "Pretrain/Step Time": 8.613751009106636} +{"Pretrain/Learning Rate": 1.3853253237078311e-09, "Pretrain/Loss": 2.005601406097412, "Pretrain/Loss (Raw)": 1.8648321628570557, "Pretrain/Step": 9506, "Pretrain/Step Time": 8.616529004648328} +{"Pretrain/Learning Rate": 1.2973918025516174e-09, "Pretrain/Loss": 2.0058820247650146, "Pretrain/Loss (Raw)": 2.070645332336426, "Pretrain/Step": 9507, "Pretrain/Step Time": 8.623450146988034} +{"Pretrain/Learning Rate": 1.2123412495762544e-09, "Pretrain/Loss": 2.002681255340576, "Pretrain/Loss (Raw)": 1.7982114553451538, "Pretrain/Step": 9508, "Pretrain/Step Time": 8.626435017213225} +{"Pretrain/Learning Rate": 1.1301736745905623e-09, "Pretrain/Loss": 2.002265214920044, "Pretrain/Loss (Raw)": 2.081252098083496, "Pretrain/Step": 9509, "Pretrain/Step Time": 8.635512884706259} +{"Pretrain/Learning Rate": 1.050889087075846e-09, "Pretrain/Loss": 1.9994328022003174, "Pretrain/Loss (Raw)": 1.7601104974746704, "Pretrain/Step": 9510, "Pretrain/Step Time": 8.645500214770436} +{"Pretrain/Learning Rate": 9.744874961664652e-10, "Pretrain/Loss": 1.9998369216918945, "Pretrain/Loss (Raw)": 1.9539827108383179, "Pretrain/Step": 9511, "Pretrain/Step Time": 8.654623001813889} +{"Pretrain/Learning Rate": 9.00968910683142e-10, "Pretrain/Loss": 1.9992371797561646, "Pretrain/Loss (Raw)": 1.9299429655075073, "Pretrain/Step": 9512, "Pretrain/Step Time": 8.646740514785051} +{"Pretrain/Learning Rate": 8.303333390968782e-10, "Pretrain/Loss": 2.0006442070007324, "Pretrain/Loss (Raw)": 2.2052907943725586, "Pretrain/Step": 9513, "Pretrain/Step Time": 8.655108857899904} +{"Pretrain/Learning Rate": 7.625807895567106e-10, "Pretrain/Loss": 1.9996578693389893, "Pretrain/Loss (Raw)": 1.9352630376815796, "Pretrain/Step": 9514, "Pretrain/Step Time": 8.656973892822862} +{"Pretrain/Learning Rate": 6.977112698758337e-10, "Pretrain/Loss": 1.9954462051391602, "Pretrain/Loss (Raw)": 1.9085358381271362, "Pretrain/Step": 9515, "Pretrain/Step Time": 8.662486610934138} +{"Pretrain/Learning Rate": 6.357247875371508e-10, "Pretrain/Loss": 1.9942667484283447, "Pretrain/Loss (Raw)": 1.9229034185409546, "Pretrain/Step": 9516, "Pretrain/Step Time": 8.664410138502717} +{"Pretrain/Learning Rate": 5.766213496877226e-10, "Pretrain/Loss": 1.9909851551055908, "Pretrain/Loss (Raw)": 2.0312957763671875, "Pretrain/Step": 9517, "Pretrain/Step Time": 8.66966411843896} +{"Pretrain/Learning Rate": 5.20400963141543e-10, "Pretrain/Loss": 1.9951748847961426, "Pretrain/Loss (Raw)": 2.5060763359069824, "Pretrain/Step": 9518, "Pretrain/Step Time": 8.667812934145331} +{"Pretrain/Learning Rate": 4.670636343850899e-10, "Pretrain/Loss": 1.995223045349121, "Pretrain/Loss (Raw)": 2.007194757461548, "Pretrain/Step": 9519, "Pretrain/Step Time": 8.666570076718926} +{"Pretrain/Learning Rate": 4.1660936956899874e-10, "Pretrain/Loss": 1.9944720268249512, "Pretrain/Loss (Raw)": 1.9806578159332275, "Pretrain/Step": 9520, "Pretrain/Step Time": 8.6679666955024} +{"Pretrain/Learning Rate": 3.6903817451083846e-10, "Pretrain/Loss": 1.9932349920272827, "Pretrain/Loss (Raw)": 1.9389305114746094, "Pretrain/Step": 9521, "Pretrain/Step Time": 8.668243393301964} +{"Pretrain/Learning Rate": 3.2435005469788615e-10, "Pretrain/Loss": 1.990896463394165, "Pretrain/Loss (Raw)": 1.9355813264846802, "Pretrain/Step": 9522, "Pretrain/Step Time": 8.673982249572873} +{"Pretrain/Learning Rate": 2.825450152815767e-10, "Pretrain/Loss": 1.9930825233459473, "Pretrain/Loss (Raw)": 2.1293349266052246, "Pretrain/Step": 9523, "Pretrain/Step Time": 8.674326116219163} +{"Pretrain/Learning Rate": 2.436230610858292e-10, "Pretrain/Loss": 1.9925482273101807, "Pretrain/Loss (Raw)": 1.9780396223068237, "Pretrain/Step": 9524, "Pretrain/Step Time": 8.672260366380215} +{"Pretrain/Learning Rate": 2.075841965987202e-10, "Pretrain/Loss": 1.9919195175170898, "Pretrain/Loss (Raw)": 2.1150381565093994, "Pretrain/Step": 9525, "Pretrain/Step Time": 8.669910723343492} +{"Pretrain/Learning Rate": 1.7442842597525933e-10, "Pretrain/Loss": 1.9899418354034424, "Pretrain/Loss (Raw)": 1.9621491432189941, "Pretrain/Step": 9526, "Pretrain/Step Time": 8.671987805515528} +{"Pretrain/Learning Rate": 1.4415575304016494e-10, "Pretrain/Loss": 1.990346908569336, "Pretrain/Loss (Raw)": 1.845258355140686, "Pretrain/Step": 9527, "Pretrain/Step Time": 8.674062311649323} +{"Pretrain/Learning Rate": 1.1676618128231288e-10, "Pretrain/Loss": 1.990339994430542, "Pretrain/Loss (Raw)": 1.9426417350769043, "Pretrain/Step": 9528, "Pretrain/Step Time": 8.674731213599443} +{"Pretrain/Learning Rate": 9.225971386583876e-11, "Pretrain/Loss": 1.9884283542633057, "Pretrain/Loss (Raw)": 1.8777258396148682, "Pretrain/Step": 9529, "Pretrain/Step Time": 8.679123342037201} +{"Pretrain/Learning Rate": 7.063635361070908e-11, "Pretrain/Loss": 1.9912853240966797, "Pretrain/Loss (Raw)": 2.243269681930542, "Pretrain/Step": 9530, "Pretrain/Step Time": 8.678964903578162} +{"Pretrain/Learning Rate": 5.189610301492564e-11, "Pretrain/Loss": 1.9871561527252197, "Pretrain/Loss (Raw)": 1.852819561958313, "Pretrain/Step": 9531, "Pretrain/Step Time": 8.674995735287666} +{"Pretrain/Learning Rate": 3.6038964235096675e-11, "Pretrain/Loss": 1.9852023124694824, "Pretrain/Loss (Raw)": 1.8464653491973877, "Pretrain/Step": 9532, "Pretrain/Step Time": 8.679487196728587} +{"Pretrain/Learning Rate": 2.3064939105865713e-11, "Pretrain/Loss": 1.9843990802764893, "Pretrain/Loss (Raw)": 2.042065143585205, "Pretrain/Step": 9533, "Pretrain/Step Time": 8.67974596656859} +{"Pretrain/Learning Rate": 1.2974029120482733e-11, "Pretrain/Loss": 1.9861526489257812, "Pretrain/Loss (Raw)": 2.0481815338134766, "Pretrain/Step": 9534, "Pretrain/Step Time": 8.680915985256433} +{"Pretrain/Learning Rate": 5.766235441906353e-12, "Pretrain/Loss": 1.9866864681243896, "Pretrain/Loss (Raw)": 2.1408867835998535, "Pretrain/Step": 9535, "Pretrain/Step Time": 8.680221619084477} +{"Pretrain/Learning Rate": 1.4415589028038411e-12, "Pretrain/Loss": 1.9846482276916504, "Pretrain/Loss (Raw)": 1.8367557525634766, "Pretrain/Step": 9536, "Pretrain/Step Time": 8.676912937313318} +{"Pretrain/Learning Rate": 0.0, "Pretrain/Loss": 1.9878218173980713, "Pretrain/Loss (Raw)": 2.072506904602051, "Pretrain/Step": 9537, "Pretrain/Step Time": 8.674655383452773} +{"Pretrain/Learning Rate": 1.7482517482517484e-07, "Pretrain/Loss": 3.0495123863220215, "Pretrain/Loss (Raw)": 3.0495123863220215, "Pretrain/Step": 1, "Pretrain/Step Time": 12.95364499092102} +{"Pretrain/Learning Rate": 3.496503496503497e-07, "Pretrain/Loss": 2.9827027320861816, "Pretrain/Loss (Raw)": 2.915893077850342, "Pretrain/Step": 2, "Pretrain/Step Time": 11.256503224372864} +{"Pretrain/Learning Rate": 5.244755244755246e-07, "Pretrain/Loss": 3.1030280590057373, "Pretrain/Loss (Raw)": 3.3436782360076904, "Pretrain/Step": 3, "Pretrain/Step Time": 10.109412908554077} +{"Pretrain/Learning Rate": 6.993006993006994e-07, "Pretrain/Loss": 3.207709789276123, "Pretrain/Loss (Raw)": 3.5217559337615967, "Pretrain/Step": 4, "Pretrain/Step Time": 9.613609433174133} +{"Pretrain/Learning Rate": 8.741258741258743e-07, "Pretrain/Loss": 3.203373670578003, "Pretrain/Loss (Raw)": 3.186028003692627, "Pretrain/Step": 5, "Pretrain/Step Time": 9.272698593139648} +{"Pretrain/Learning Rate": 1.0489510489510491e-06, "Pretrain/Loss": 3.241487503051758, "Pretrain/Loss (Raw)": 3.4320576190948486, "Pretrain/Step": 6, "Pretrain/Step Time": 9.046957810719809} +{"Pretrain/Learning Rate": 1.2237762237762238e-06, "Pretrain/Loss": 3.2111220359802246, "Pretrain/Loss (Raw)": 3.02892804145813, "Pretrain/Step": 7, "Pretrain/Step Time": 8.861811740057808} +{"Pretrain/Learning Rate": 1.3986013986013987e-06, "Pretrain/Loss": 3.1283464431762695, "Pretrain/Loss (Raw)": 2.548917293548584, "Pretrain/Step": 8, "Pretrain/Step Time": 8.720082551240921} +{"Pretrain/Learning Rate": 1.5734265734265736e-06, "Pretrain/Loss": 3.1433961391448975, "Pretrain/Loss (Raw)": 3.2637929916381836, "Pretrain/Step": 9, "Pretrain/Step Time": 8.632478210661146} +{"Pretrain/Learning Rate": 1.7482517482517485e-06, "Pretrain/Loss": 3.1318252086639404, "Pretrain/Loss (Raw)": 3.027689218521118, "Pretrain/Step": 10, "Pretrain/Step Time": 8.555041122436524} +{"Pretrain/Learning Rate": 1.9230769230769234e-06, "Pretrain/Loss": 3.098925828933716, "Pretrain/Loss (Raw)": 2.769932746887207, "Pretrain/Step": 11, "Pretrain/Step Time": 8.478097330440175} +{"Pretrain/Learning Rate": 2.0979020979020983e-06, "Pretrain/Loss": 3.088667392730713, "Pretrain/Loss (Raw)": 2.975820779800415, "Pretrain/Step": 12, "Pretrain/Step Time": 8.42659193277359} +{"Pretrain/Learning Rate": 2.2727272727272728e-06, "Pretrain/Loss": 3.0302000045776367, "Pretrain/Loss (Raw)": 2.328589677810669, "Pretrain/Step": 13, "Pretrain/Step Time": 8.391198139924269} +{"Pretrain/Learning Rate": 2.4475524475524477e-06, "Pretrain/Loss": 2.9967503547668457, "Pretrain/Loss (Raw)": 2.5619049072265625, "Pretrain/Step": 14, "Pretrain/Step Time": 8.406827160290309} +{"Pretrain/Learning Rate": 2.6223776223776225e-06, "Pretrain/Loss": 2.969207763671875, "Pretrain/Loss (Raw)": 2.5836100578308105, "Pretrain/Step": 15, "Pretrain/Step Time": 8.425098657608032} +{"Pretrain/Learning Rate": 2.7972027972027974e-06, "Pretrain/Loss": 2.9329142570495605, "Pretrain/Loss (Raw)": 2.388516664505005, "Pretrain/Step": 16, "Pretrain/Step Time": 8.384565308690071} +{"Pretrain/Learning Rate": 2.9720279720279723e-06, "Pretrain/Loss": 2.888662338256836, "Pretrain/Loss (Raw)": 2.180631637573242, "Pretrain/Step": 17, "Pretrain/Step Time": 8.35958200342515} +{"Pretrain/Learning Rate": 3.1468531468531472e-06, "Pretrain/Loss": 2.8819453716278076, "Pretrain/Loss (Raw)": 2.7677550315856934, "Pretrain/Step": 18, "Pretrain/Step Time": 8.345016890101963} +{"Pretrain/Learning Rate": 3.3216783216783217e-06, "Pretrain/Loss": 2.846991539001465, "Pretrain/Loss (Raw)": 2.2178232669830322, "Pretrain/Step": 19, "Pretrain/Step Time": 8.315270310954043} +{"Pretrain/Learning Rate": 3.496503496503497e-06, "Pretrain/Loss": 2.823315382003784, "Pretrain/Loss (Raw)": 2.3734700679779053, "Pretrain/Step": 20, "Pretrain/Step Time": 8.294747030735016} +{"Pretrain/Learning Rate": 3.6713286713286715e-06, "Pretrain/Loss": 2.794271230697632, "Pretrain/Loss (Raw)": 2.213388204574585, "Pretrain/Step": 21, "Pretrain/Step Time": 8.282232557024274} +{"Pretrain/Learning Rate": 3.846153846153847e-06, "Pretrain/Loss": 2.7738592624664307, "Pretrain/Loss (Raw)": 2.3452086448669434, "Pretrain/Step": 22, "Pretrain/Step Time": 8.266032489863308} +{"Pretrain/Learning Rate": 4.020979020979021e-06, "Pretrain/Loss": 2.7702629566192627, "Pretrain/Loss (Raw)": 2.6911468505859375, "Pretrain/Step": 23, "Pretrain/Step Time": 8.252823321715645} +{"Pretrain/Learning Rate": 4.195804195804197e-06, "Pretrain/Loss": 2.7511863708496094, "Pretrain/Loss (Raw)": 2.3124217987060547, "Pretrain/Step": 24, "Pretrain/Step Time": 8.227953453858694} +{"Pretrain/Learning Rate": 4.370629370629371e-06, "Pretrain/Loss": 2.7299716472625732, "Pretrain/Loss (Raw)": 2.220818281173706, "Pretrain/Step": 25, "Pretrain/Step Time": 8.211393098831177} +{"Pretrain/Learning Rate": 4.5454545454545455e-06, "Pretrain/Loss": 2.711491107940674, "Pretrain/Loss (Raw)": 2.249467611312866, "Pretrain/Step": 26, "Pretrain/Step Time": 8.212409973144531} +{"Pretrain/Learning Rate": 4.72027972027972e-06, "Pretrain/Loss": 2.701399087905884, "Pretrain/Loss (Raw)": 2.4390153884887695, "Pretrain/Step": 27, "Pretrain/Step Time": 8.198912240840771} +{"Pretrain/Learning Rate": 4.895104895104895e-06, "Pretrain/Loss": 2.6861188411712646, "Pretrain/Loss (Raw)": 2.2735514640808105, "Pretrain/Step": 28, "Pretrain/Step Time": 8.1867282305445} +{"Pretrain/Learning Rate": 5.06993006993007e-06, "Pretrain/Loss": 2.6718533039093018, "Pretrain/Loss (Raw)": 2.272421360015869, "Pretrain/Step": 29, "Pretrain/Step Time": 8.173745771934247} +{"Pretrain/Learning Rate": 5.244755244755245e-06, "Pretrain/Loss": 2.6573100090026855, "Pretrain/Loss (Raw)": 2.235553026199341, "Pretrain/Step": 30, "Pretrain/Step Time": 8.179933778444926} +{"Pretrain/Learning Rate": 5.419580419580419e-06, "Pretrain/Loss": 2.657907485961914, "Pretrain/Loss (Raw)": 2.675832986831665, "Pretrain/Step": 31, "Pretrain/Step Time": 8.188615283658427} +{"Pretrain/Learning Rate": 5.594405594405595e-06, "Pretrain/Loss": 2.648205280303955, "Pretrain/Loss (Raw)": 2.3474345207214355, "Pretrain/Step": 32, "Pretrain/Step Time": 8.18689800798893} +{"Pretrain/Learning Rate": 5.76923076923077e-06, "Pretrain/Loss": 2.641181707382202, "Pretrain/Loss (Raw)": 2.416422128677368, "Pretrain/Step": 33, "Pretrain/Step Time": 8.177838065407492} +{"Pretrain/Learning Rate": 5.944055944055945e-06, "Pretrain/Loss": 2.6231555938720703, "Pretrain/Loss (Raw)": 2.0282974243164062, "Pretrain/Step": 34, "Pretrain/Step Time": 8.181915858212639} +{"Pretrain/Learning Rate": 6.1188811188811196e-06, "Pretrain/Loss": 2.616266965866089, "Pretrain/Loss (Raw)": 2.382053852081299, "Pretrain/Step": 35, "Pretrain/Step Time": 8.167327008928572} +{"Pretrain/Learning Rate": 6.2937062937062944e-06, "Pretrain/Loss": 2.6046032905578613, "Pretrain/Loss (Raw)": 2.1963701248168945, "Pretrain/Step": 36, "Pretrain/Step Time": 8.155498815907372} +{"Pretrain/Learning Rate": 6.468531468531469e-06, "Pretrain/Loss": 2.5956408977508545, "Pretrain/Loss (Raw)": 2.2729952335357666, "Pretrain/Step": 37, "Pretrain/Step Time": 8.145924278207728} +{"Pretrain/Learning Rate": 6.643356643356643e-06, "Pretrain/Loss": 2.586148500442505, "Pretrain/Loss (Raw)": 2.234935998916626, "Pretrain/Step": 38, "Pretrain/Step Time": 8.136525593305889} +{"Pretrain/Learning Rate": 6.818181818181818e-06, "Pretrain/Loss": 2.5752832889556885, "Pretrain/Loss (Raw)": 2.1624011993408203, "Pretrain/Step": 39, "Pretrain/Step Time": 8.129853285275972} +{"Pretrain/Learning Rate": 6.993006993006994e-06, "Pretrain/Loss": 2.568223714828491, "Pretrain/Loss (Raw)": 2.292895555496216, "Pretrain/Step": 40, "Pretrain/Step Time": 8.127576833963394} +{"Pretrain/Learning Rate": 7.167832167832168e-06, "Pretrain/Loss": 2.5649728775024414, "Pretrain/Loss (Raw)": 2.434943675994873, "Pretrain/Step": 41, "Pretrain/Step Time": 8.123970834220328} +{"Pretrain/Learning Rate": 7.342657342657343e-06, "Pretrain/Loss": 2.5565686225891113, "Pretrain/Loss (Raw)": 2.211989164352417, "Pretrain/Step": 42, "Pretrain/Step Time": 8.120601790291923} +{"Pretrain/Learning Rate": 7.517482517482517e-06, "Pretrain/Loss": 2.5485880374908447, "Pretrain/Loss (Raw)": 2.213407278060913, "Pretrain/Step": 43, "Pretrain/Step Time": 8.110226498093716} +{"Pretrain/Learning Rate": 7.692307692307694e-06, "Pretrain/Loss": 2.5404999256134033, "Pretrain/Loss (Raw)": 2.1927013397216797, "Pretrain/Step": 44, "Pretrain/Step Time": 8.107680521228097} +{"Pretrain/Learning Rate": 7.867132867132867e-06, "Pretrain/Loss": 2.5362770557403564, "Pretrain/Loss (Raw)": 2.350478172302246, "Pretrain/Step": 45, "Pretrain/Step Time": 8.106655025482178} +{"Pretrain/Learning Rate": 8.041958041958042e-06, "Pretrain/Loss": 2.5390772819519043, "Pretrain/Loss (Raw)": 2.665093421936035, "Pretrain/Step": 46, "Pretrain/Step Time": 8.10864525774251} +{"Pretrain/Learning Rate": 8.216783216783217e-06, "Pretrain/Loss": 2.5341286659240723, "Pretrain/Loss (Raw)": 2.3064942359924316, "Pretrain/Step": 47, "Pretrain/Step Time": 8.109380782918727} +{"Pretrain/Learning Rate": 8.391608391608393e-06, "Pretrain/Loss": 2.5308945178985596, "Pretrain/Loss (Raw)": 2.3788795471191406, "Pretrain/Step": 48, "Pretrain/Step Time": 8.114090497295061} +{"Pretrain/Learning Rate": 8.566433566433566e-06, "Pretrain/Loss": 2.522404193878174, "Pretrain/Loss (Raw)": 2.114877700805664, "Pretrain/Step": 49, "Pretrain/Step Time": 8.10920033162954} +{"Pretrain/Learning Rate": 8.741258741258741e-06, "Pretrain/Loss": 2.517392635345459, "Pretrain/Loss (Raw)": 2.271815776824951, "Pretrain/Step": 50, "Pretrain/Step Time": 8.106694588661194} +{"Pretrain/Learning Rate": 8.916083916083918e-06, "Pretrain/Loss": 2.5130951404571533, "Pretrain/Loss (Raw)": 2.298212766647339, "Pretrain/Step": 51, "Pretrain/Step Time": 8.09984483905867} +{"Pretrain/Learning Rate": 9.090909090909091e-06, "Pretrain/Loss": 2.5037827491760254, "Pretrain/Loss (Raw)": 2.028864860534668, "Pretrain/Step": 52, "Pretrain/Step Time": 8.102723557215471} +{"Pretrain/Learning Rate": 9.265734265734266e-06, "Pretrain/Loss": 2.4997031688690186, "Pretrain/Loss (Raw)": 2.287564516067505, "Pretrain/Step": 53, "Pretrain/Step Time": 8.103386959939632} +{"Pretrain/Learning Rate": 9.44055944055944e-06, "Pretrain/Loss": 2.4949822425842285, "Pretrain/Loss (Raw)": 2.244765520095825, "Pretrain/Step": 54, "Pretrain/Step Time": 8.097543760582253} +{"Pretrain/Learning Rate": 9.615384615384616e-06, "Pretrain/Loss": 2.4900801181793213, "Pretrain/Loss (Raw)": 2.2253663539886475, "Pretrain/Step": 55, "Pretrain/Step Time": 8.098534349961714} +{"Pretrain/Learning Rate": 9.79020979020979e-06, "Pretrain/Loss": 2.4852044582366943, "Pretrain/Loss (Raw)": 2.2170538902282715, "Pretrain/Step": 56, "Pretrain/Step Time": 8.099283052342278} +{"Pretrain/Learning Rate": 9.965034965034966e-06, "Pretrain/Loss": 2.4806907176971436, "Pretrain/Loss (Raw)": 2.227916955947876, "Pretrain/Step": 57, "Pretrain/Step Time": 8.092095705500821} +{"Pretrain/Learning Rate": 1.013986013986014e-05, "Pretrain/Loss": 2.478064775466919, "Pretrain/Loss (Raw)": 2.3283889293670654, "Pretrain/Step": 58, "Pretrain/Step Time": 8.089124067076321} +{"Pretrain/Learning Rate": 1.0314685314685315e-05, "Pretrain/Loss": 2.4733023643493652, "Pretrain/Loss (Raw)": 2.1970648765563965, "Pretrain/Step": 59, "Pretrain/Step Time": 8.085424879849967} +{"Pretrain/Learning Rate": 1.048951048951049e-05, "Pretrain/Loss": 2.4719316959381104, "Pretrain/Loss (Raw)": 2.3910701274871826, "Pretrain/Step": 60, "Pretrain/Step Time": 8.080916663010916} +{"Pretrain/Learning Rate": 1.0664335664335665e-05, "Pretrain/Loss": 2.4680845737457275, "Pretrain/Loss (Raw)": 2.237271308898926, "Pretrain/Step": 61, "Pretrain/Step Time": 8.07870925059084} +{"Pretrain/Learning Rate": 1.0839160839160838e-05, "Pretrain/Loss": 2.4640707969665527, "Pretrain/Loss (Raw)": 2.21923828125, "Pretrain/Step": 62, "Pretrain/Step Time": 8.081415603237767} +{"Pretrain/Learning Rate": 1.1013986013986015e-05, "Pretrain/Loss": 2.4586760997772217, "Pretrain/Loss (Raw)": 2.124189853668213, "Pretrain/Step": 63, "Pretrain/Step Time": 8.090558332110207} +{"Pretrain/Learning Rate": 1.118881118881119e-05, "Pretrain/Loss": 2.4588589668273926, "Pretrain/Loss (Raw)": 2.470388174057007, "Pretrain/Step": 64, "Pretrain/Step Time": 8.088200014084578} +{"Pretrain/Learning Rate": 1.1363636363636365e-05, "Pretrain/Loss": 2.457263946533203, "Pretrain/Loss (Raw)": 2.3551721572875977, "Pretrain/Step": 65, "Pretrain/Step Time": 8.08295419399555} +{"Pretrain/Learning Rate": 1.153846153846154e-05, "Pretrain/Loss": 2.4531843662261963, "Pretrain/Loss (Raw)": 2.187994956970215, "Pretrain/Step": 66, "Pretrain/Step Time": 8.082413055680014} +{"Pretrain/Learning Rate": 1.1713286713286714e-05, "Pretrain/Loss": 2.4494998455047607, "Pretrain/Loss (Raw)": 2.2063276767730713, "Pretrain/Step": 67, "Pretrain/Step Time": 8.077263042108337} +{"Pretrain/Learning Rate": 1.188811188811189e-05, "Pretrain/Loss": 2.447176218032837, "Pretrain/Loss (Raw)": 2.291505813598633, "Pretrain/Step": 68, "Pretrain/Step Time": 8.075340649660896} +{"Pretrain/Learning Rate": 1.2062937062937063e-05, "Pretrain/Loss": 2.4406774044036865, "Pretrain/Loss (Raw)": 1.998766303062439, "Pretrain/Step": 69, "Pretrain/Step Time": 8.06760623489601} +{"Pretrain/Learning Rate": 1.2237762237762239e-05, "Pretrain/Loss": 2.436922311782837, "Pretrain/Loss (Raw)": 2.177811861038208, "Pretrain/Step": 70, "Pretrain/Step Time": 8.066276805741447} +{"Pretrain/Learning Rate": 1.2412587412587414e-05, "Pretrain/Loss": 2.4349710941314697, "Pretrain/Loss (Raw)": 2.298388719558716, "Pretrain/Step": 71, "Pretrain/Step Time": 8.062278321091558} +{"Pretrain/Learning Rate": 1.2587412587412589e-05, "Pretrain/Loss": 2.4336676597595215, "Pretrain/Loss (Raw)": 2.3411295413970947, "Pretrain/Step": 72, "Pretrain/Step Time": 8.063158882988823} +{"Pretrain/Learning Rate": 1.2762237762237764e-05, "Pretrain/Loss": 2.4300825595855713, "Pretrain/Loss (Raw)": 2.1719443798065186, "Pretrain/Step": 73, "Pretrain/Step Time": 8.090220030039957} +{"Pretrain/Learning Rate": 1.2937062937062939e-05, "Pretrain/Loss": 2.4276516437530518, "Pretrain/Loss (Raw)": 2.25018572807312, "Pretrain/Step": 74, "Pretrain/Step Time": 8.14458906328356} +{"Pretrain/Learning Rate": 1.3111888111888112e-05, "Pretrain/Loss": 2.4263689517974854, "Pretrain/Loss (Raw)": 2.331463098526001, "Pretrain/Step": 75, "Pretrain/Step Time": 8.143670101165771} +{"Pretrain/Learning Rate": 1.3286713286713287e-05, "Pretrain/Loss": 2.425102710723877, "Pretrain/Loss (Raw)": 2.3301339149475098, "Pretrain/Step": 76, "Pretrain/Step Time": 8.151883994278155} +{"Pretrain/Learning Rate": 1.3461538461538462e-05, "Pretrain/Loss": 2.4251906871795654, "Pretrain/Loss (Raw)": 2.4318881034851074, "Pretrain/Step": 77, "Pretrain/Step Time": 8.146087606231887} +{"Pretrain/Learning Rate": 1.3636363636363637e-05, "Pretrain/Loss": 2.4250097274780273, "Pretrain/Loss (Raw)": 2.4110636711120605, "Pretrain/Step": 78, "Pretrain/Step Time": 8.155634858669378} +{"Pretrain/Learning Rate": 1.381118881118881e-05, "Pretrain/Loss": 2.422966718673706, "Pretrain/Loss (Raw)": 2.263603687286377, "Pretrain/Step": 79, "Pretrain/Step Time": 8.1621636740769} +{"Pretrain/Learning Rate": 1.3986013986013988e-05, "Pretrain/Loss": 2.419226884841919, "Pretrain/Loss (Raw)": 2.1237900257110596, "Pretrain/Step": 80, "Pretrain/Step Time": 8.174949333071709} +{"Pretrain/Learning Rate": 1.4160839160839163e-05, "Pretrain/Loss": 2.416654348373413, "Pretrain/Loss (Raw)": 2.21085262298584, "Pretrain/Step": 81, "Pretrain/Step Time": 8.17424511320797} +{"Pretrain/Learning Rate": 1.4335664335664336e-05, "Pretrain/Loss": 2.4149882793426514, "Pretrain/Loss (Raw)": 2.2800354957580566, "Pretrain/Step": 82, "Pretrain/Step Time": 8.166493537949354} +{"Pretrain/Learning Rate": 1.4510489510489511e-05, "Pretrain/Loss": 2.413377046585083, "Pretrain/Loss (Raw)": 2.281263828277588, "Pretrain/Step": 83, "Pretrain/Step Time": 8.181560321026538} +{"Pretrain/Learning Rate": 1.4685314685314686e-05, "Pretrain/Loss": 2.413121223449707, "Pretrain/Loss (Raw)": 2.391871452331543, "Pretrain/Step": 84, "Pretrain/Step Time": 8.190456123579116} +{"Pretrain/Learning Rate": 1.486013986013986e-05, "Pretrain/Loss": 2.410900831222534, "Pretrain/Loss (Raw)": 2.2243874073028564, "Pretrain/Step": 85, "Pretrain/Step Time": 8.188753829282874} +{"Pretrain/Learning Rate": 1.5034965034965034e-05, "Pretrain/Loss": 2.4088382720947266, "Pretrain/Loss (Raw)": 2.2335429191589355, "Pretrain/Step": 86, "Pretrain/Step Time": 8.188869972561681} +{"Pretrain/Learning Rate": 1.5209790209790212e-05, "Pretrain/Loss": 2.4078545570373535, "Pretrain/Loss (Raw)": 2.3232429027557373, "Pretrain/Step": 87, "Pretrain/Step Time": 8.191096516861313} +{"Pretrain/Learning Rate": 1.5384615384615387e-05, "Pretrain/Loss": 2.4056084156036377, "Pretrain/Loss (Raw)": 2.2102043628692627, "Pretrain/Step": 88, "Pretrain/Step Time": 8.200869275764985} +{"Pretrain/Learning Rate": 1.555944055944056e-05, "Pretrain/Loss": 2.404261350631714, "Pretrain/Loss (Raw)": 2.2857139110565186, "Pretrain/Step": 89, "Pretrain/Step Time": 8.19408868939689} +{"Pretrain/Learning Rate": 1.5734265734265734e-05, "Pretrain/Loss": 2.4005730152130127, "Pretrain/Loss (Raw)": 2.0722973346710205, "Pretrain/Step": 90, "Pretrain/Step Time": 8.195319414138794} +{"Pretrain/Learning Rate": 1.590909090909091e-05, "Pretrain/Loss": 2.3984215259552, "Pretrain/Loss (Raw)": 2.204787492752075, "Pretrain/Step": 91, "Pretrain/Step Time": 8.197691257183369} +{"Pretrain/Learning Rate": 1.6083916083916083e-05, "Pretrain/Loss": 2.3970351219177246, "Pretrain/Loss (Raw)": 2.270864486694336, "Pretrain/Step": 92, "Pretrain/Step Time": 8.199981277403625} +{"Pretrain/Learning Rate": 1.625874125874126e-05, "Pretrain/Loss": 2.3958916664123535, "Pretrain/Loss (Raw)": 2.290719509124756, "Pretrain/Step": 93, "Pretrain/Step Time": 8.204529144430673} +{"Pretrain/Learning Rate": 1.6433566433566433e-05, "Pretrain/Loss": 2.3963944911956787, "Pretrain/Loss (Raw)": 2.443157196044922, "Pretrain/Step": 94, "Pretrain/Step Time": 8.207605468465927} +{"Pretrain/Learning Rate": 1.660839160839161e-05, "Pretrain/Loss": 2.394934892654419, "Pretrain/Loss (Raw)": 2.2576987743377686, "Pretrain/Step": 95, "Pretrain/Step Time": 8.216533982126336} +{"Pretrain/Learning Rate": 1.6783216783216786e-05, "Pretrain/Loss": 2.394338607788086, "Pretrain/Loss (Raw)": 2.3377153873443604, "Pretrain/Step": 96, "Pretrain/Step Time": 8.216026430328688} +{"Pretrain/Learning Rate": 1.695804195804196e-05, "Pretrain/Loss": 2.3960063457489014, "Pretrain/Loss (Raw)": 2.5561115741729736, "Pretrain/Step": 97, "Pretrain/Step Time": 8.229896766623272} +{"Pretrain/Learning Rate": 1.7132867132867133e-05, "Pretrain/Loss": 2.3933677673339844, "Pretrain/Loss (Raw)": 2.137436628341675, "Pretrain/Step": 98, "Pretrain/Step Time": 8.22409439086914} +{"Pretrain/Learning Rate": 1.730769230769231e-05, "Pretrain/Loss": 2.3943426609039307, "Pretrain/Loss (Raw)": 2.4898617267608643, "Pretrain/Step": 99, "Pretrain/Step Time": 8.220659715960725} +{"Pretrain/Learning Rate": 1.7482517482517483e-05, "Pretrain/Loss": 2.3929412364959717, "Pretrain/Loss (Raw)": 2.254199266433716, "Pretrain/Step": 100, "Pretrain/Step Time": 8.229546775817871} +{"Pretrain/Learning Rate": 1.7657342657342656e-05, "Pretrain/Loss": 2.395582675933838, "Pretrain/Loss (Raw)": 2.659755229949951, "Pretrain/Step": 101, "Pretrain/Step Time": 8.232579587709786} +{"Pretrain/Learning Rate": 1.7832167832167836e-05, "Pretrain/Loss": 2.394829034805298, "Pretrain/Loss (Raw)": 2.3186938762664795, "Pretrain/Step": 102, "Pretrain/Step Time": 8.230790867524988} +{"Pretrain/Learning Rate": 1.800699300699301e-05, "Pretrain/Loss": 2.39668345451355, "Pretrain/Loss (Raw)": 2.585829973220825, "Pretrain/Step": 103, "Pretrain/Step Time": 8.23125232076182} +{"Pretrain/Learning Rate": 1.8181818181818182e-05, "Pretrain/Loss": 2.3953487873077393, "Pretrain/Loss (Raw)": 2.257889986038208, "Pretrain/Step": 104, "Pretrain/Step Time": 8.226687231889137} +{"Pretrain/Learning Rate": 1.835664335664336e-05, "Pretrain/Loss": 2.3934073448181152, "Pretrain/Loss (Raw)": 2.1914916038513184, "Pretrain/Step": 105, "Pretrain/Step Time": 8.2336322534652} +{"Pretrain/Learning Rate": 1.8531468531468532e-05, "Pretrain/Loss": 2.3927597999572754, "Pretrain/Loss (Raw)": 2.324756383895874, "Pretrain/Step": 106, "Pretrain/Step Time": 8.231686691068253} +{"Pretrain/Learning Rate": 1.8706293706293705e-05, "Pretrain/Loss": 2.3901898860931396, "Pretrain/Loss (Raw)": 2.1177926063537598, "Pretrain/Step": 107, "Pretrain/Step Time": 8.237442916798814} +{"Pretrain/Learning Rate": 1.888111888111888e-05, "Pretrain/Loss": 2.3878750801086426, "Pretrain/Loss (Raw)": 2.140181541442871, "Pretrain/Step": 108, "Pretrain/Step Time": 8.23645798586033} +{"Pretrain/Learning Rate": 1.9055944055944055e-05, "Pretrain/Loss": 2.3884716033935547, "Pretrain/Loss (Raw)": 2.4529125690460205, "Pretrain/Step": 109, "Pretrain/Step Time": 8.238742266226252} +{"Pretrain/Learning Rate": 1.923076923076923e-05, "Pretrain/Loss": 2.386969804763794, "Pretrain/Loss (Raw)": 2.223256826400757, "Pretrain/Step": 110, "Pretrain/Step Time": 8.247758988900618} +{"Pretrain/Learning Rate": 1.9405594405594408e-05, "Pretrain/Loss": 2.3857734203338623, "Pretrain/Loss (Raw)": 2.2541725635528564, "Pretrain/Step": 111, "Pretrain/Step Time": 8.257806825208235} +{"Pretrain/Learning Rate": 1.958041958041958e-05, "Pretrain/Loss": 2.3825576305389404, "Pretrain/Loss (Raw)": 2.0255746841430664, "Pretrain/Step": 112, "Pretrain/Step Time": 8.262254333921842} +{"Pretrain/Learning Rate": 1.9755244755244758e-05, "Pretrain/Loss": 2.3783137798309326, "Pretrain/Loss (Raw)": 1.9030065536499023, "Pretrain/Step": 113, "Pretrain/Step Time": 8.261745165934604} +{"Pretrain/Learning Rate": 1.993006993006993e-05, "Pretrain/Loss": 2.377488374710083, "Pretrain/Loss (Raw)": 2.2842252254486084, "Pretrain/Step": 114, "Pretrain/Step Time": 8.266236317785163} +{"Pretrain/Learning Rate": 2.0104895104895104e-05, "Pretrain/Loss": 2.3748066425323486, "Pretrain/Loss (Raw)": 2.0691354274749756, "Pretrain/Step": 115, "Pretrain/Step Time": 8.26406195682028} +{"Pretrain/Learning Rate": 2.027972027972028e-05, "Pretrain/Loss": 2.373103141784668, "Pretrain/Loss (Raw)": 2.1771645545959473, "Pretrain/Step": 116, "Pretrain/Step Time": 8.260246774245953} +{"Pretrain/Learning Rate": 2.0454545454545457e-05, "Pretrain/Loss": 2.37287974357605, "Pretrain/Loss (Raw)": 2.346968650817871, "Pretrain/Step": 117, "Pretrain/Step Time": 8.266307661675999} +{"Pretrain/Learning Rate": 2.062937062937063e-05, "Pretrain/Loss": 2.371520757675171, "Pretrain/Loss (Raw)": 2.212519645690918, "Pretrain/Step": 118, "Pretrain/Step Time": 8.261952899270138} +{"Pretrain/Learning Rate": 2.0804195804195807e-05, "Pretrain/Loss": 2.3704562187194824, "Pretrain/Loss (Raw)": 2.2448439598083496, "Pretrain/Step": 119, "Pretrain/Step Time": 8.263871088749221} +{"Pretrain/Learning Rate": 2.097902097902098e-05, "Pretrain/Loss": 2.3688557147979736, "Pretrain/Loss (Raw)": 2.1783649921417236, "Pretrain/Step": 120, "Pretrain/Step Time": 8.262267180283864} +{"Pretrain/Learning Rate": 2.1153846153846154e-05, "Pretrain/Loss": 2.369748115539551, "Pretrain/Loss (Raw)": 2.476874589920044, "Pretrain/Step": 121, "Pretrain/Step Time": 8.261339725541674} +{"Pretrain/Learning Rate": 2.132867132867133e-05, "Pretrain/Loss": 2.3710103034973145, "Pretrain/Loss (Raw)": 2.523744821548462, "Pretrain/Step": 122, "Pretrain/Step Time": 8.268577988030481} +{"Pretrain/Learning Rate": 2.1503496503496503e-05, "Pretrain/Loss": 2.36911940574646, "Pretrain/Loss (Raw)": 2.138425350189209, "Pretrain/Step": 123, "Pretrain/Step Time": 8.269474198178548} +{"Pretrain/Learning Rate": 2.1678321678321677e-05, "Pretrain/Loss": 2.367438554763794, "Pretrain/Loss (Raw)": 2.1607000827789307, "Pretrain/Step": 124, "Pretrain/Step Time": 8.270373171375644} +{"Pretrain/Learning Rate": 2.1853146853146857e-05, "Pretrain/Loss": 2.3675918579101562, "Pretrain/Loss (Raw)": 2.386563777923584, "Pretrain/Step": 125, "Pretrain/Step Time": 8.27046037864685} +{"Pretrain/Learning Rate": 2.202797202797203e-05, "Pretrain/Loss": 2.3693723678588867, "Pretrain/Loss (Raw)": 2.5919442176818848, "Pretrain/Step": 126, "Pretrain/Step Time": 8.272573881679111} +{"Pretrain/Learning Rate": 2.2202797202797203e-05, "Pretrain/Loss": 2.369392156600952, "Pretrain/Loss (Raw)": 2.371899127960205, "Pretrain/Step": 127, "Pretrain/Step Time": 8.2851809929675} +{"Pretrain/Learning Rate": 1.7482517482517484e-07, "Pretrain/Loss": 3.562274217605591, "Pretrain/Loss (Raw)": 3.562274217605591, "Pretrain/Step": 1, "Pretrain/Step Time": 13.99735140800476} +{"Pretrain/Learning Rate": 3.496503496503497e-07, "Pretrain/Loss": 3.299203634262085, "Pretrain/Loss (Raw)": 3.036133050918579, "Pretrain/Step": 2, "Pretrain/Step Time": 11.052282452583313} +{"Pretrain/Learning Rate": 5.244755244755246e-07, "Pretrain/Loss": 3.4999380111694336, "Pretrain/Loss (Raw)": 3.901407241821289, "Pretrain/Step": 3, "Pretrain/Step Time": 10.088669220606485} +{"Pretrain/Learning Rate": 6.993006993006994e-07, "Pretrain/Loss": 3.6056981086730957, "Pretrain/Loss (Raw)": 3.922978401184082, "Pretrain/Step": 4, "Pretrain/Step Time": 9.639900624752045} +{"Pretrain/Learning Rate": 8.741258741258743e-07, "Pretrain/Loss": 3.585742950439453, "Pretrain/Loss (Raw)": 3.5059220790863037, "Pretrain/Step": 5, "Pretrain/Step Time": 9.394181871414185} +{"Pretrain/Learning Rate": 1.0489510489510491e-06, "Pretrain/Loss": 3.584527015686035, "Pretrain/Loss (Raw)": 3.578447103500366, "Pretrain/Step": 6, "Pretrain/Step Time": 9.19188149770101} +{"Pretrain/Learning Rate": 1.2237762237762238e-06, "Pretrain/Loss": 3.6064271926879883, "Pretrain/Loss (Raw)": 3.7378275394439697, "Pretrain/Step": 7, "Pretrain/Step Time": 9.012816054480416} +{"Pretrain/Learning Rate": 1.3986013986013987e-06, "Pretrain/Loss": 3.5500614643096924, "Pretrain/Loss (Raw)": 3.1555025577545166, "Pretrain/Step": 8, "Pretrain/Step Time": 8.877939224243164} +{"Pretrain/Learning Rate": 1.5734265734265736e-06, "Pretrain/Loss": 3.4727940559387207, "Pretrain/Loss (Raw)": 2.8546550273895264, "Pretrain/Step": 9, "Pretrain/Step Time": 8.78874569469028} +{"Pretrain/Learning Rate": 1.7482517482517485e-06, "Pretrain/Loss": 3.4388656616210938, "Pretrain/Loss (Raw)": 3.133510112762451, "Pretrain/Step": 10, "Pretrain/Step Time": 8.769214391708374} +{"Pretrain/Learning Rate": 1.9230769230769234e-06, "Pretrain/Loss": 3.3765640258789062, "Pretrain/Loss (Raw)": 2.7535488605499268, "Pretrain/Step": 11, "Pretrain/Step Time": 8.68964923511852} +{"Pretrain/Learning Rate": 2.0979020979020983e-06, "Pretrain/Loss": 3.3013577461242676, "Pretrain/Loss (Raw)": 2.4740843772888184, "Pretrain/Step": 12, "Pretrain/Step Time": 8.645751257737478} +{"Pretrain/Learning Rate": 2.2727272727272728e-06, "Pretrain/Loss": 3.2794344425201416, "Pretrain/Loss (Raw)": 3.016355037689209, "Pretrain/Step": 13, "Pretrain/Step Time": 8.615777162405161} +{"Pretrain/Learning Rate": 2.4475524475524477e-06, "Pretrain/Loss": 3.2191262245178223, "Pretrain/Loss (Raw)": 2.4351210594177246, "Pretrain/Step": 14, "Pretrain/Step Time": 8.635348013469152} +{"Pretrain/Learning Rate": 2.6223776223776225e-06, "Pretrain/Loss": 3.196312189102173, "Pretrain/Loss (Raw)": 2.876913070678711, "Pretrain/Step": 15, "Pretrain/Step Time": 8.596060657501221} +{"Pretrain/Learning Rate": 2.7972027972027974e-06, "Pretrain/Loss": 3.2113184928894043, "Pretrain/Loss (Raw)": 3.436417818069458, "Pretrain/Step": 16, "Pretrain/Step Time": 8.612409070134163} +{"Pretrain/Learning Rate": 2.9720279720279723e-06, "Pretrain/Loss": 3.2269184589385986, "Pretrain/Loss (Raw)": 3.476515054702759, "Pretrain/Step": 17, "Pretrain/Step Time": 8.599604901145486} +{"Pretrain/Learning Rate": 3.1468531468531472e-06, "Pretrain/Loss": 3.2021002769470215, "Pretrain/Loss (Raw)": 2.780191421508789, "Pretrain/Step": 18, "Pretrain/Step Time": 8.58194210794237} +{"Pretrain/Learning Rate": 3.3216783216783217e-06, "Pretrain/Loss": 3.170070171356201, "Pretrain/Loss (Raw)": 2.5935256481170654, "Pretrain/Step": 19, "Pretrain/Step Time": 8.55590948305632} +{"Pretrain/Learning Rate": 3.496503496503497e-06, "Pretrain/Loss": 3.148106336593628, "Pretrain/Loss (Raw)": 2.73079776763916, "Pretrain/Step": 20, "Pretrain/Step Time": 8.541694498062133} +{"Pretrain/Learning Rate": 3.6713286713286715e-06, "Pretrain/Loss": 3.1372783184051514, "Pretrain/Loss (Raw)": 2.9207170009613037, "Pretrain/Step": 21, "Pretrain/Step Time": 8.534763370241437} +{"Pretrain/Learning Rate": 3.846153846153847e-06, "Pretrain/Loss": 3.132403612136841, "Pretrain/Loss (Raw)": 3.030038356781006, "Pretrain/Step": 22, "Pretrain/Step Time": 8.522457231174815} +{"Pretrain/Learning Rate": 4.020979020979021e-06, "Pretrain/Loss": 3.099351644515991, "Pretrain/Loss (Raw)": 2.372203826904297, "Pretrain/Step": 23, "Pretrain/Step Time": 8.496771656948587} +{"Pretrain/Learning Rate": 4.195804195804197e-06, "Pretrain/Loss": 3.0760552883148193, "Pretrain/Loss (Raw)": 2.540241003036499, "Pretrain/Step": 24, "Pretrain/Step Time": 8.48410772283872} +{"Pretrain/Learning Rate": 4.370629370629371e-06, "Pretrain/Loss": 3.059316396713257, "Pretrain/Loss (Raw)": 2.657588243484497, "Pretrain/Step": 25, "Pretrain/Step Time": 8.465393762588501} +{"Pretrain/Learning Rate": 4.5454545454545455e-06, "Pretrain/Loss": 3.0376980304718018, "Pretrain/Loss (Raw)": 2.497237205505371, "Pretrain/Step": 26, "Pretrain/Step Time": 8.452011942863464} +{"Pretrain/Learning Rate": 4.72027972027972e-06, "Pretrain/Loss": 3.019085645675659, "Pretrain/Loss (Raw)": 2.5351603031158447, "Pretrain/Step": 27, "Pretrain/Step Time": 8.436817540062798} +{"Pretrain/Learning Rate": 4.895104895104895e-06, "Pretrain/Loss": 3.000476121902466, "Pretrain/Loss (Raw)": 2.498020887374878, "Pretrain/Step": 28, "Pretrain/Step Time": 8.440472705023629} +{"Pretrain/Learning Rate": 5.06993006993007e-06, "Pretrain/Loss": 2.9843339920043945, "Pretrain/Loss (Raw)": 2.5323526859283447, "Pretrain/Step": 29, "Pretrain/Step Time": 8.44158255642858} +{"Pretrain/Learning Rate": 5.244755244755245e-06, "Pretrain/Loss": 2.969662666320801, "Pretrain/Loss (Raw)": 2.544189929962158, "Pretrain/Step": 30, "Pretrain/Step Time": 8.437940001487732} +{"Pretrain/Learning Rate": 5.419580419580419e-06, "Pretrain/Loss": 2.9585914611816406, "Pretrain/Loss (Raw)": 2.626465320587158, "Pretrain/Step": 31, "Pretrain/Step Time": 8.44464308984818} +{"Pretrain/Learning Rate": 5.594405594405595e-06, "Pretrain/Loss": 2.9541563987731934, "Pretrain/Loss (Raw)": 2.8166632652282715, "Pretrain/Step": 32, "Pretrain/Step Time": 8.44028939306736} +{"Pretrain/Learning Rate": 5.76923076923077e-06, "Pretrain/Loss": 2.9372379779815674, "Pretrain/Loss (Raw)": 2.3958399295806885, "Pretrain/Step": 33, "Pretrain/Step Time": 8.433101466207793} +{"Pretrain/Learning Rate": 5.944055944055945e-06, "Pretrain/Loss": 2.9272749423980713, "Pretrain/Loss (Raw)": 2.5985023975372314, "Pretrain/Step": 34, "Pretrain/Step Time": 8.423369092099806} +{"Pretrain/Learning Rate": 6.1188811188811196e-06, "Pretrain/Loss": 2.9244985580444336, "Pretrain/Loss (Raw)": 2.8301007747650146, "Pretrain/Step": 35, "Pretrain/Step Time": 8.419386509486607} +{"Pretrain/Learning Rate": 6.2937062937062944e-06, "Pretrain/Loss": 2.909491777420044, "Pretrain/Loss (Raw)": 2.384243965148926, "Pretrain/Step": 36, "Pretrain/Step Time": 8.411708931128183} +{"Pretrain/Learning Rate": 6.468531468531469e-06, "Pretrain/Loss": 2.894151210784912, "Pretrain/Loss (Raw)": 2.3419017791748047, "Pretrain/Step": 37, "Pretrain/Step Time": 8.401721619270944} +{"Pretrain/Learning Rate": 6.643356643356643e-06, "Pretrain/Loss": 2.8813648223876953, "Pretrain/Loss (Raw)": 2.4082629680633545, "Pretrain/Step": 38, "Pretrain/Step Time": 8.397233555191441} +{"Pretrain/Learning Rate": 6.818181818181818e-06, "Pretrain/Loss": 2.864041566848755, "Pretrain/Loss (Raw)": 2.2057642936706543, "Pretrain/Step": 39, "Pretrain/Step Time": 8.384334429716452} +{"Pretrain/Learning Rate": 6.993006993006994e-06, "Pretrain/Loss": 2.854763984680176, "Pretrain/Loss (Raw)": 2.4929332733154297, "Pretrain/Step": 40, "Pretrain/Step Time": 8.385484278202057} +{"Pretrain/Learning Rate": 7.167832167832168e-06, "Pretrain/Loss": 2.8473010063171387, "Pretrain/Loss (Raw)": 2.5487823486328125, "Pretrain/Step": 41, "Pretrain/Step Time": 8.376442868535111} +{"Pretrain/Learning Rate": 7.342657342657343e-06, "Pretrain/Loss": 2.8318753242492676, "Pretrain/Loss (Raw)": 2.199418067932129, "Pretrain/Step": 42, "Pretrain/Step Time": 8.371178712163653} +{"Pretrain/Learning Rate": 7.517482517482517e-06, "Pretrain/Loss": 2.827258825302124, "Pretrain/Loss (Raw)": 2.6333675384521484, "Pretrain/Step": 43, "Pretrain/Step Time": 8.36840074561363} +{"Pretrain/Learning Rate": 7.692307692307694e-06, "Pretrain/Loss": 2.8145668506622314, "Pretrain/Loss (Raw)": 2.2688069343566895, "Pretrain/Step": 44, "Pretrain/Step Time": 8.367356918074869} +{"Pretrain/Learning Rate": 7.867132867132867e-06, "Pretrain/Loss": 2.8029887676239014, "Pretrain/Loss (Raw)": 2.29356050491333, "Pretrain/Step": 45, "Pretrain/Step Time": 8.375877311494616} +{"Pretrain/Learning Rate": 8.041958041958042e-06, "Pretrain/Loss": 2.7903342247009277, "Pretrain/Loss (Raw)": 2.220872163772583, "Pretrain/Step": 46, "Pretrain/Step Time": 8.370129994724108} +{"Pretrain/Learning Rate": 8.216783216783217e-06, "Pretrain/Loss": 2.7822036743164062, "Pretrain/Loss (Raw)": 2.408203363418579, "Pretrain/Step": 47, "Pretrain/Step Time": 8.374383616954722} +{"Pretrain/Learning Rate": 8.391608391608393e-06, "Pretrain/Loss": 2.775571823120117, "Pretrain/Loss (Raw)": 2.463870048522949, "Pretrain/Step": 48, "Pretrain/Step Time": 8.376844296852747} +{"Pretrain/Learning Rate": 8.566433566433566e-06, "Pretrain/Loss": 2.7643232345581055, "Pretrain/Loss (Raw)": 2.2244045734405518, "Pretrain/Step": 49, "Pretrain/Step Time": 8.374402075397725} +{"Pretrain/Learning Rate": 8.741258741258741e-06, "Pretrain/Loss": 2.758248805999756, "Pretrain/Loss (Raw)": 2.4605934619903564, "Pretrain/Step": 50, "Pretrain/Step Time": 8.36819281578064} +{"Pretrain/Learning Rate": 8.916083916083918e-06, "Pretrain/Loss": 2.7564404010772705, "Pretrain/Loss (Raw)": 2.6660330295562744, "Pretrain/Step": 51, "Pretrain/Step Time": 8.364192691503787} +{"Pretrain/Learning Rate": 9.090909090909091e-06, "Pretrain/Loss": 2.7450976371765137, "Pretrain/Loss (Raw)": 2.1666011810302734, "Pretrain/Step": 52, "Pretrain/Step Time": 8.36280697125655} +{"Pretrain/Learning Rate": 9.265734265734266e-06, "Pretrain/Loss": 2.7438366413116455, "Pretrain/Loss (Raw)": 2.678274393081665, "Pretrain/Step": 53, "Pretrain/Step Time": 8.359670004754696} +{"Pretrain/Learning Rate": 9.44055944055944e-06, "Pretrain/Loss": 2.7360591888427734, "Pretrain/Loss (Raw)": 2.3238394260406494, "Pretrain/Step": 54, "Pretrain/Step Time": 8.35351437109488} +{"Pretrain/Learning Rate": 9.615384615384616e-06, "Pretrain/Loss": 2.7295920848846436, "Pretrain/Loss (Raw)": 2.3803701400756836, "Pretrain/Step": 55, "Pretrain/Step Time": 8.347602636163884} +{"Pretrain/Learning Rate": 9.79020979020979e-06, "Pretrain/Loss": 2.726033926010132, "Pretrain/Loss (Raw)": 2.530346393585205, "Pretrain/Step": 56, "Pretrain/Step Time": 8.345070953880038} +{"Pretrain/Learning Rate": 9.965034965034966e-06, "Pretrain/Loss": 2.723172664642334, "Pretrain/Loss (Raw)": 2.5629353523254395, "Pretrain/Step": 57, "Pretrain/Step Time": 8.342266601428651} +{"Pretrain/Learning Rate": 1.013986013986014e-05, "Pretrain/Loss": 2.7142505645751953, "Pretrain/Loss (Raw)": 2.2056846618652344, "Pretrain/Step": 58, "Pretrain/Step Time": 8.336169830684003} +{"Pretrain/Learning Rate": 1.0314685314685315e-05, "Pretrain/Loss": 2.7086071968078613, "Pretrain/Loss (Raw)": 2.3812975883483887, "Pretrain/Step": 59, "Pretrain/Step Time": 8.336073455163987} +{"Pretrain/Learning Rate": 1.048951048951049e-05, "Pretrain/Loss": 2.700220823287964, "Pretrain/Loss (Raw)": 2.2054283618927, "Pretrain/Step": 60, "Pretrain/Step Time": 8.33865076303482} +{"Pretrain/Learning Rate": 1.0664335664335665e-05, "Pretrain/Loss": 2.693171977996826, "Pretrain/Loss (Raw)": 2.2702434062957764, "Pretrain/Step": 61, "Pretrain/Step Time": 8.348055139916841} +{"Pretrain/Learning Rate": 1.0839160839160838e-05, "Pretrain/Loss": 2.691002130508423, "Pretrain/Loss (Raw)": 2.55863618850708, "Pretrain/Step": 62, "Pretrain/Step Time": 8.349907455905791} +{"Pretrain/Learning Rate": 1.1013986013986015e-05, "Pretrain/Loss": 2.6833503246307373, "Pretrain/Loss (Raw)": 2.208921194076538, "Pretrain/Step": 63, "Pretrain/Step Time": 8.357237270900182} +{"Pretrain/Learning Rate": 1.118881118881119e-05, "Pretrain/Loss": 2.6795878410339355, "Pretrain/Loss (Raw)": 2.4425642490386963, "Pretrain/Step": 64, "Pretrain/Step Time": 8.360592406243086} +{"Pretrain/Learning Rate": 1.1363636363636365e-05, "Pretrain/Loss": 2.6702723503112793, "Pretrain/Loss (Raw)": 2.074089288711548, "Pretrain/Step": 65, "Pretrain/Step Time": 8.35780230302077} +{"Pretrain/Learning Rate": 1.153846153846154e-05, "Pretrain/Loss": 2.6670167446136475, "Pretrain/Loss (Raw)": 2.4553921222686768, "Pretrain/Step": 66, "Pretrain/Step Time": 8.352084412719265} +{"Pretrain/Learning Rate": 1.1713286713286714e-05, "Pretrain/Loss": 2.6614229679107666, "Pretrain/Loss (Raw)": 2.29225492477417, "Pretrain/Step": 67, "Pretrain/Step Time": 8.353806050855722} +{"Pretrain/Learning Rate": 1.188811188811189e-05, "Pretrain/Loss": 2.651110887527466, "Pretrain/Loss (Raw)": 1.960188865661621, "Pretrain/Step": 68, "Pretrain/Step Time": 8.351895300781026} +{"Pretrain/Learning Rate": 1.2062937062937063e-05, "Pretrain/Loss": 2.650249481201172, "Pretrain/Loss (Raw)": 2.591676950454712, "Pretrain/Step": 69, "Pretrain/Step Time": 8.34722880349643} +{"Pretrain/Learning Rate": 1.2237762237762239e-05, "Pretrain/Loss": 2.6444644927978516, "Pretrain/Loss (Raw)": 2.245303153991699, "Pretrain/Step": 70, "Pretrain/Step Time": 8.348762134143284} +{"Pretrain/Learning Rate": 1.2412587412587414e-05, "Pretrain/Loss": 2.6421897411346436, "Pretrain/Loss (Raw)": 2.4829561710357666, "Pretrain/Step": 71, "Pretrain/Step Time": 8.346476726129021} +{"Pretrain/Learning Rate": 1.2587412587412589e-05, "Pretrain/Loss": 2.6465225219726562, "Pretrain/Loss (Raw)": 2.95414137840271, "Pretrain/Step": 72, "Pretrain/Step Time": 8.340669357114368} +{"Pretrain/Learning Rate": 1.2762237762237764e-05, "Pretrain/Loss": 2.6412065029144287, "Pretrain/Loss (Raw)": 2.2584493160247803, "Pretrain/Step": 73, "Pretrain/Step Time": 8.372110170860813} +{"Pretrain/Learning Rate": 1.2937062937062939e-05, "Pretrain/Loss": 2.6376218795776367, "Pretrain/Loss (Raw)": 2.3759653568267822, "Pretrain/Step": 74, "Pretrain/Step Time": 8.371818484486761} +{"Pretrain/Learning Rate": 1.3111888111888112e-05, "Pretrain/Loss": 2.6349971294403076, "Pretrain/Loss (Raw)": 2.44075870513916, "Pretrain/Step": 75, "Pretrain/Step Time": 8.385175663630168} +{"Pretrain/Learning Rate": 1.3286713286713287e-05, "Pretrain/Loss": 2.633842945098877, "Pretrain/Loss (Raw)": 2.5472664833068848, "Pretrain/Step": 76, "Pretrain/Step Time": 8.380649196474176} +{"Pretrain/Learning Rate": 1.3461538461538462e-05, "Pretrain/Loss": 2.6306207180023193, "Pretrain/Loss (Raw)": 2.3857429027557373, "Pretrain/Step": 77, "Pretrain/Step Time": 8.389872101994303} +{"Pretrain/Learning Rate": 1.3636363636363637e-05, "Pretrain/Loss": 2.626788377761841, "Pretrain/Loss (Raw)": 2.331691265106201, "Pretrain/Step": 78, "Pretrain/Step Time": 8.400082829671028} +{"Pretrain/Learning Rate": 1.381118881118881e-05, "Pretrain/Loss": 2.624159097671509, "Pretrain/Loss (Raw)": 2.4190640449523926, "Pretrain/Step": 79, "Pretrain/Step Time": 8.401616105550453} +{"Pretrain/Learning Rate": 1.3986013986013988e-05, "Pretrain/Loss": 2.6196212768554688, "Pretrain/Loss (Raw)": 2.261138439178467, "Pretrain/Step": 80, "Pretrain/Step Time": 8.399123841524125} +{"Pretrain/Learning Rate": 1.4160839160839163e-05, "Pretrain/Loss": 2.620600938796997, "Pretrain/Loss (Raw)": 2.698974609375, "Pretrain/Step": 81, "Pretrain/Step Time": 8.39829084313946} +{"Pretrain/Learning Rate": 1.4335664335664336e-05, "Pretrain/Loss": 2.6173222064971924, "Pretrain/Loss (Raw)": 2.3517606258392334, "Pretrain/Step": 82, "Pretrain/Step Time": 8.401716886497125} +{"Pretrain/Learning Rate": 1.4510489510489511e-05, "Pretrain/Loss": 2.6148698329925537, "Pretrain/Loss (Raw)": 2.413787603378296, "Pretrain/Step": 83, "Pretrain/Step Time": 8.401126074503702} +{"Pretrain/Learning Rate": 1.4685314685314686e-05, "Pretrain/Loss": 2.6105542182922363, "Pretrain/Loss (Raw)": 2.2523293495178223, "Pretrain/Step": 84, "Pretrain/Step Time": 8.396802192642575} +{"Pretrain/Learning Rate": 1.486013986013986e-05, "Pretrain/Loss": 2.607983112335205, "Pretrain/Loss (Raw)": 2.392022132873535, "Pretrain/Step": 85, "Pretrain/Step Time": 8.412514321944293} +{"Pretrain/Learning Rate": 1.5034965034965034e-05, "Pretrain/Loss": 2.6031482219696045, "Pretrain/Loss (Raw)": 2.1921937465667725, "Pretrain/Step": 86, "Pretrain/Step Time": 8.418413786000984} +{"Pretrain/Learning Rate": 1.5209790209790212e-05, "Pretrain/Loss": 2.6020286083221436, "Pretrain/Loss (Raw)": 2.5057315826416016, "Pretrain/Step": 87, "Pretrain/Step Time": 8.415077883621741} +{"Pretrain/Learning Rate": 1.5384615384615387e-05, "Pretrain/Loss": 2.6007816791534424, "Pretrain/Loss (Raw)": 2.492276668548584, "Pretrain/Step": 88, "Pretrain/Step Time": 8.408523952419108} +{"Pretrain/Learning Rate": 1.555944055944056e-05, "Pretrain/Loss": 2.5942132472991943, "Pretrain/Loss (Raw)": 2.0162172317504883, "Pretrain/Step": 89, "Pretrain/Step Time": 8.409335198027364} +{"Pretrain/Learning Rate": 1.5734265734265734e-05, "Pretrain/Loss": 2.5917439460754395, "Pretrain/Loss (Raw)": 2.371962547302246, "Pretrain/Step": 90, "Pretrain/Step Time": 8.416246072451274} +{"Pretrain/Learning Rate": 1.590909090909091e-05, "Pretrain/Loss": 2.587873935699463, "Pretrain/Loss (Raw)": 2.239569902420044, "Pretrain/Step": 91, "Pretrain/Step Time": 8.42672115105849} +{"Pretrain/Learning Rate": 1.6083916083916083e-05, "Pretrain/Loss": 2.5812478065490723, "Pretrain/Loss (Raw)": 1.978268027305603, "Pretrain/Step": 92, "Pretrain/Step Time": 8.427311907643857} +{"Pretrain/Learning Rate": 1.625874125874126e-05, "Pretrain/Loss": 2.5776712894439697, "Pretrain/Loss (Raw)": 2.248626708984375, "Pretrain/Step": 93, "Pretrain/Step Time": 8.429885056711012} +{"Pretrain/Learning Rate": 1.6433566433566433e-05, "Pretrain/Loss": 2.5717930793762207, "Pretrain/Loss (Raw)": 2.0251383781433105, "Pretrain/Step": 94, "Pretrain/Step Time": 8.435379317466248} +{"Pretrain/Learning Rate": 1.660839160839161e-05, "Pretrain/Loss": 2.5690128803253174, "Pretrain/Loss (Raw)": 2.3076581954956055, "Pretrain/Step": 95, "Pretrain/Step Time": 8.444995578966642} +{"Pretrain/Learning Rate": 1.6783216783216786e-05, "Pretrain/Loss": 2.5691890716552734, "Pretrain/Loss (Raw)": 2.5859248638153076, "Pretrain/Step": 96, "Pretrain/Step Time": 8.451627602179846} +{"Pretrain/Learning Rate": 1.695804195804196e-05, "Pretrain/Loss": 2.565610885620117, "Pretrain/Loss (Raw)": 2.2221267223358154, "Pretrain/Step": 97, "Pretrain/Step Time": 8.449728882189879} +{"Pretrain/Learning Rate": 1.7132867132867133e-05, "Pretrain/Loss": 2.5634453296661377, "Pretrain/Loss (Raw)": 2.3533899784088135, "Pretrain/Step": 98, "Pretrain/Step Time": 8.445476371414808} +{"Pretrain/Learning Rate": 1.730769230769231e-05, "Pretrain/Loss": 2.558346748352051, "Pretrain/Loss (Raw)": 2.0586965084075928, "Pretrain/Step": 99, "Pretrain/Step Time": 8.4408202147243} +{"Pretrain/Learning Rate": 1.7482517482517483e-05, "Pretrain/Loss": 2.5555262565612793, "Pretrain/Loss (Raw)": 2.276301860809326, "Pretrain/Step": 100, "Pretrain/Step Time": 8.445891575813294} +{"Pretrain/Learning Rate": 1.7657342657342656e-05, "Pretrain/Loss": 2.551508903503418, "Pretrain/Loss (Raw)": 2.149735689163208, "Pretrain/Step": 101, "Pretrain/Step Time": 8.44758111415523} +{"Pretrain/Learning Rate": 1.7832167832167836e-05, "Pretrain/Loss": 2.5468530654907227, "Pretrain/Loss (Raw)": 2.0765886306762695, "Pretrain/Step": 102, "Pretrain/Step Time": 8.443726836466322} +{"Pretrain/Learning Rate": 1.800699300699301e-05, "Pretrain/Loss": 2.550485849380493, "Pretrain/Loss (Raw)": 2.921077251434326, "Pretrain/Step": 103, "Pretrain/Step Time": 8.439545851309322} +{"Pretrain/Learning Rate": 1.8181818181818182e-05, "Pretrain/Loss": 2.549769639968872, "Pretrain/Loss (Raw)": 2.4759700298309326, "Pretrain/Step": 104, "Pretrain/Step Time": 8.438203476942503} +{"Pretrain/Learning Rate": 1.835664335664336e-05, "Pretrain/Loss": 2.5473673343658447, "Pretrain/Loss (Raw)": 2.297555923461914, "Pretrain/Step": 105, "Pretrain/Step Time": 8.439006337665376} +{"Pretrain/Learning Rate": 1.8531468531468532e-05, "Pretrain/Loss": 2.545413017272949, "Pretrain/Loss (Raw)": 2.340219736099243, "Pretrain/Step": 106, "Pretrain/Step Time": 8.441450096526236} +{"Pretrain/Learning Rate": 1.8706293706293705e-05, "Pretrain/Loss": 2.5443480014801025, "Pretrain/Loss (Raw)": 2.431440830230713, "Pretrain/Step": 107, "Pretrain/Step Time": 8.442309613539793} +{"Pretrain/Learning Rate": 1.888111888111888e-05, "Pretrain/Loss": 2.5467495918273926, "Pretrain/Loss (Raw)": 2.803701639175415, "Pretrain/Step": 108, "Pretrain/Step Time": 8.440726982222664} +{"Pretrain/Learning Rate": 1.9055944055944055e-05, "Pretrain/Loss": 2.5447609424591064, "Pretrain/Loss (Raw)": 2.330031156539917, "Pretrain/Step": 109, "Pretrain/Step Time": 8.441677769389722} +{"Pretrain/Learning Rate": 1.923076923076923e-05, "Pretrain/Loss": 2.543491840362549, "Pretrain/Loss (Raw)": 2.40517258644104, "Pretrain/Step": 110, "Pretrain/Step Time": 8.456480431556702} +{"Pretrain/Learning Rate": 1.9405594405594408e-05, "Pretrain/Loss": 2.540290355682373, "Pretrain/Loss (Raw)": 2.188096761703491, "Pretrain/Step": 111, "Pretrain/Step Time": 8.463696619411847} +{"Pretrain/Learning Rate": 1.958041958041958e-05, "Pretrain/Loss": 2.538539171218872, "Pretrain/Loss (Raw)": 2.3441414833068848, "Pretrain/Step": 112, "Pretrain/Step Time": 8.463495597243309} +{"Pretrain/Learning Rate": 1.9755244755244758e-05, "Pretrain/Loss": 2.5374398231506348, "Pretrain/Loss (Raw)": 2.4143402576446533, "Pretrain/Step": 113, "Pretrain/Step Time": 8.463281530194578} +{"Pretrain/Learning Rate": 1.993006993006993e-05, "Pretrain/Loss": 2.5353734493255615, "Pretrain/Loss (Raw)": 2.3018546104431152, "Pretrain/Step": 114, "Pretrain/Step Time": 8.46460093113414} +{"Pretrain/Learning Rate": 2.0104895104895104e-05, "Pretrain/Loss": 2.5343973636627197, "Pretrain/Loss (Raw)": 2.4231579303741455, "Pretrain/Step": 115, "Pretrain/Step Time": 8.463758356674857} +{"Pretrain/Learning Rate": 2.027972027972028e-05, "Pretrain/Loss": 2.5347344875335693, "Pretrain/Loss (Raw)": 2.5734856128692627, "Pretrain/Step": 116, "Pretrain/Step Time": 8.465513352690072} +{"Pretrain/Learning Rate": 2.0454545454545457e-05, "Pretrain/Loss": 2.5336077213287354, "Pretrain/Loss (Raw)": 2.402883768081665, "Pretrain/Step": 117, "Pretrain/Step Time": 8.462570718210987} +{"Pretrain/Learning Rate": 2.062937062937063e-05, "Pretrain/Loss": 2.5312771797180176, "Pretrain/Loss (Raw)": 2.2586159706115723, "Pretrain/Step": 118, "Pretrain/Step Time": 8.463447669805106} +{"Pretrain/Learning Rate": 2.0804195804195807e-05, "Pretrain/Loss": 2.53169584274292, "Pretrain/Loss (Raw)": 2.5810554027557373, "Pretrain/Step": 119, "Pretrain/Step Time": 8.461596935737033} +{"Pretrain/Learning Rate": 2.097902097902098e-05, "Pretrain/Loss": 2.529954433441162, "Pretrain/Loss (Raw)": 2.3227462768554688, "Pretrain/Step": 120, "Pretrain/Step Time": 8.469661527872086} +{"Pretrain/Learning Rate": 2.1153846153846154e-05, "Pretrain/Loss": 2.527409315109253, "Pretrain/Loss (Raw)": 2.2220375537872314, "Pretrain/Step": 121, "Pretrain/Step Time": 8.469436765702303} +{"Pretrain/Learning Rate": 2.132867132867133e-05, "Pretrain/Loss": 2.525055408477783, "Pretrain/Loss (Raw)": 2.2402148246765137, "Pretrain/Step": 122, "Pretrain/Step Time": 8.468354535884545} +{"Pretrain/Learning Rate": 2.1503496503496503e-05, "Pretrain/Loss": 2.522986888885498, "Pretrain/Loss (Raw)": 2.270618438720703, "Pretrain/Step": 123, "Pretrain/Step Time": 8.467855974910705} +{"Pretrain/Learning Rate": 2.1678321678321677e-05, "Pretrain/Loss": 2.521040916442871, "Pretrain/Loss (Raw)": 2.2816896438598633, "Pretrain/Step": 124, "Pretrain/Step Time": 8.468997997622337} +{"Pretrain/Learning Rate": 2.1853146853146857e-05, "Pretrain/Loss": 2.52107834815979, "Pretrain/Loss (Raw)": 2.5256919860839844, "Pretrain/Step": 125, "Pretrain/Step Time": 8.473838184356689} +{"Pretrain/Learning Rate": 2.202797202797203e-05, "Pretrain/Loss": 2.518820285797119, "Pretrain/Loss (Raw)": 2.2365639209747314, "Pretrain/Step": 126, "Pretrain/Step Time": 8.478003859519958} +{"Pretrain/Learning Rate": 2.2202797202797203e-05, "Pretrain/Loss": 2.5213661193847656, "Pretrain/Loss (Raw)": 2.8421568870544434, "Pretrain/Step": 127, "Pretrain/Step Time": 8.478900943215438} +{"Pretrain/Learning Rate": 2.237762237762238e-05, "Pretrain/Loss": 2.520214080810547, "Pretrain/Loss (Raw)": 2.3739407062530518, "Pretrain/Step": 128, "Pretrain/Step Time": 8.476380409672856} +{"Pretrain/Learning Rate": 2.2552447552447553e-05, "Pretrain/Loss": 2.510519027709961, "Pretrain/Loss (Raw)": 2.3212740421295166, "Pretrain/Step": 129, "Pretrain/Step Time": 8.44098785892129} +{"Pretrain/Learning Rate": 2.272727272727273e-05, "Pretrain/Loss": 2.503278970718384, "Pretrain/Loss (Raw)": 2.109412670135498, "Pretrain/Step": 130, "Pretrain/Step Time": 8.45093467272818} +{"Pretrain/Learning Rate": 2.2902097902097902e-05, "Pretrain/Loss": 2.488887310028076, "Pretrain/Loss (Raw)": 2.0592570304870605, "Pretrain/Step": 131, "Pretrain/Step Time": 8.449145779013634} +{"Pretrain/Learning Rate": 2.307692307692308e-05, "Pretrain/Loss": 2.475728988647461, "Pretrain/Loss (Raw)": 2.2387375831604004, "Pretrain/Step": 132, "Pretrain/Step Time": 8.447318345308304} +{"Pretrain/Learning Rate": 2.3251748251748252e-05, "Pretrain/Loss": 2.466336488723755, "Pretrain/Loss (Raw)": 2.3036746978759766, "Pretrain/Step": 133, "Pretrain/Step Time": 8.446086460724473} +{"Pretrain/Learning Rate": 2.342657342657343e-05, "Pretrain/Loss": 2.4545912742614746, "Pretrain/Loss (Raw)": 2.0750532150268555, "Pretrain/Step": 134, "Pretrain/Step Time": 8.447480723261833} +{"Pretrain/Learning Rate": 2.3601398601398602e-05, "Pretrain/Loss": 2.4432735443115234, "Pretrain/Loss (Raw)": 2.289156913757324, "Pretrain/Step": 135, "Pretrain/Step Time": 8.456461170688272} +{"Pretrain/Learning Rate": 2.377622377622378e-05, "Pretrain/Loss": 2.436614513397217, "Pretrain/Loss (Raw)": 2.3031771183013916, "Pretrain/Step": 136, "Pretrain/Step Time": 8.4725779928267} +{"Pretrain/Learning Rate": 2.3951048951048952e-05, "Pretrain/Loss": 2.4313879013061523, "Pretrain/Loss (Raw)": 2.185640811920166, "Pretrain/Step": 137, "Pretrain/Step Time": 8.477147908881307} +{"Pretrain/Learning Rate": 2.4125874125874125e-05, "Pretrain/Loss": 2.4256227016448975, "Pretrain/Loss (Raw)": 2.395552396774292, "Pretrain/Step": 138, "Pretrain/Step Time": 8.472508002072573} +{"Pretrain/Learning Rate": 2.43006993006993e-05, "Pretrain/Loss": 2.422116994857788, "Pretrain/Loss (Raw)": 2.3048110008239746, "Pretrain/Step": 139, "Pretrain/Step Time": 8.478048667311668} +{"Pretrain/Learning Rate": 2.4475524475524478e-05, "Pretrain/Loss": 2.420815944671631, "Pretrain/Loss (Raw)": 2.3075637817382812, "Pretrain/Step": 140, "Pretrain/Step Time": 8.486791705712676} +{"Pretrain/Learning Rate": 2.465034965034965e-05, "Pretrain/Loss": 2.4155282974243164, "Pretrain/Loss (Raw)": 2.3395376205444336, "Pretrain/Step": 141, "Pretrain/Step Time": 8.488778986036777} +{"Pretrain/Learning Rate": 2.4825174825174828e-05, "Pretrain/Loss": 2.416886806488037, "Pretrain/Loss (Raw)": 2.608989953994751, "Pretrain/Step": 142, "Pretrain/Step Time": 8.485686171799898} +{"Pretrain/Learning Rate": 2.5e-05, "Pretrain/Loss": 2.410844564437866, "Pretrain/Loss (Raw)": 2.1035139560699463, "Pretrain/Step": 143, "Pretrain/Step Time": 8.489275408908725} +{"Pretrain/Learning Rate": 2.5174825174825178e-05, "Pretrain/Loss": 2.4009838104248047, "Pretrain/Loss (Raw)": 2.1742491722106934, "Pretrain/Step": 144, "Pretrain/Step Time": 8.481769379228354} +{"Pretrain/Learning Rate": 2.534965034965035e-05, "Pretrain/Loss": 2.3908889293670654, "Pretrain/Loss (Raw)": 2.184385299682617, "Pretrain/Step": 145, "Pretrain/Step Time": 8.482280308380723} +{"Pretrain/Learning Rate": 2.5524475524475528e-05, "Pretrain/Loss": 2.3860435485839844, "Pretrain/Loss (Raw)": 2.1599409580230713, "Pretrain/Step": 146, "Pretrain/Step Time": 8.482902435585856} +{"Pretrain/Learning Rate": 2.5699300699300697e-05, "Pretrain/Loss": 2.386948347091675, "Pretrain/Loss (Raw)": 2.709364175796509, "Pretrain/Step": 147, "Pretrain/Step Time": 8.482136484235525} +{"Pretrain/Learning Rate": 2.5874125874125877e-05, "Pretrain/Loss": 2.384159803390503, "Pretrain/Loss (Raw)": 2.373849630355835, "Pretrain/Step": 148, "Pretrain/Step Time": 8.491495793685317} +{"Pretrain/Learning Rate": 2.6048951048951047e-05, "Pretrain/Loss": 2.379976749420166, "Pretrain/Loss (Raw)": 2.3852972984313965, "Pretrain/Step": 149, "Pretrain/Step Time": 8.497238840907812} +{"Pretrain/Learning Rate": 2.6223776223776224e-05, "Pretrain/Loss": 2.37355375289917, "Pretrain/Loss (Raw)": 2.2078802585601807, "Pretrain/Step": 150, "Pretrain/Step Time": 8.49774064309895} +{"Pretrain/Learning Rate": 2.6398601398601404e-05, "Pretrain/Loss": 2.3737597465515137, "Pretrain/Loss (Raw)": 2.398582935333252, "Pretrain/Step": 151, "Pretrain/Step Time": 8.501256806775928} +{"Pretrain/Learning Rate": 2.6573426573426574e-05, "Pretrain/Loss": 2.3713021278381348, "Pretrain/Loss (Raw)": 2.2256617546081543, "Pretrain/Step": 152, "Pretrain/Step Time": 8.504616379737854} +{"Pretrain/Learning Rate": 2.674825174825175e-05, "Pretrain/Loss": 2.3695406913757324, "Pretrain/Loss (Raw)": 2.4321186542510986, "Pretrain/Step": 153, "Pretrain/Step Time": 8.51406759954989} +{"Pretrain/Learning Rate": 2.6923076923076923e-05, "Pretrain/Loss": 2.368645191192627, "Pretrain/Loss (Raw)": 2.382627010345459, "Pretrain/Step": 154, "Pretrain/Step Time": 8.517089476808906} +{"Pretrain/Learning Rate": 2.70979020979021e-05, "Pretrain/Loss": 2.36728572845459, "Pretrain/Loss (Raw)": 2.361135959625244, "Pretrain/Step": 155, "Pretrain/Step Time": 8.519144263118505} +{"Pretrain/Learning Rate": 2.7272727272727273e-05, "Pretrain/Loss": 2.36604642868042, "Pretrain/Loss (Raw)": 2.339407444000244, "Pretrain/Step": 156, "Pretrain/Step Time": 8.52180252596736} +{"Pretrain/Learning Rate": 2.744755244755245e-05, "Pretrain/Loss": 2.3631675243377686, "Pretrain/Loss (Raw)": 2.163849353790283, "Pretrain/Step": 157, "Pretrain/Step Time": 8.520045479759574} +{"Pretrain/Learning Rate": 2.762237762237762e-05, "Pretrain/Loss": 2.360623836517334, "Pretrain/Loss (Raw)": 2.2186014652252197, "Pretrain/Step": 158, "Pretrain/Step Time": 8.521438024938107} +{"Pretrain/Learning Rate": 2.77972027972028e-05, "Pretrain/Loss": 2.3573498725891113, "Pretrain/Loss (Raw)": 2.2073988914489746, "Pretrain/Step": 159, "Pretrain/Step Time": 8.525004146620631} +{"Pretrain/Learning Rate": 2.7972027972027976e-05, "Pretrain/Loss": 2.352506637573242, "Pretrain/Loss (Raw)": 2.196732759475708, "Pretrain/Step": 160, "Pretrain/Step Time": 8.523937441408634} +{"Pretrain/Learning Rate": 2.8146853146853146e-05, "Pretrain/Loss": 2.3508236408233643, "Pretrain/Loss (Raw)": 2.1804189682006836, "Pretrain/Step": 161, "Pretrain/Step Time": 8.528883896768093} +{"Pretrain/Learning Rate": 2.8321678321678326e-05, "Pretrain/Loss": 2.3508872985839844, "Pretrain/Loss (Raw)": 2.6066503524780273, "Pretrain/Step": 162, "Pretrain/Step Time": 8.530992338433862} +{"Pretrain/Learning Rate": 2.8496503496503496e-05, "Pretrain/Loss": 2.3461694717407227, "Pretrain/Loss (Raw)": 2.2261993885040283, "Pretrain/Step": 163, "Pretrain/Step Time": 8.529027067124844} +{"Pretrain/Learning Rate": 2.8671328671328672e-05, "Pretrain/Loss": 2.3467442989349365, "Pretrain/Loss (Raw)": 2.4578158855438232, "Pretrain/Step": 164, "Pretrain/Step Time": 8.528017224743962} +{"Pretrain/Learning Rate": 2.8846153846153845e-05, "Pretrain/Loss": 2.346999168395996, "Pretrain/Loss (Raw)": 2.3745296001434326, "Pretrain/Step": 165, "Pretrain/Step Time": 8.528485782444477} +{"Pretrain/Learning Rate": 2.9020979020979022e-05, "Pretrain/Loss": 2.3468527793884277, "Pretrain/Loss (Raw)": 2.3895230293273926, "Pretrain/Step": 166, "Pretrain/Step Time": 8.528557296842337} +{"Pretrain/Learning Rate": 2.91958041958042e-05, "Pretrain/Loss": 2.346081018447876, "Pretrain/Loss (Raw)": 2.1069746017456055, "Pretrain/Step": 167, "Pretrain/Step Time": 8.535865306854248} +{"Pretrain/Learning Rate": 2.9370629370629372e-05, "Pretrain/Loss": 2.3464198112487793, "Pretrain/Loss (Raw)": 2.5362868309020996, "Pretrain/Step": 168, "Pretrain/Step Time": 8.539478845894337} +{"Pretrain/Learning Rate": 2.954545454545455e-05, "Pretrain/Loss": 2.344083309173584, "Pretrain/Loss (Raw)": 2.2497525215148926, "Pretrain/Step": 169, "Pretrain/Step Time": 8.540625046938658} +{"Pretrain/Learning Rate": 2.972027972027972e-05, "Pretrain/Loss": 2.343738079071045, "Pretrain/Loss (Raw)": 2.1552460193634033, "Pretrain/Step": 170, "Pretrain/Step Time": 8.542855225503445} +{"Pretrain/Learning Rate": 2.9895104895104898e-05, "Pretrain/Loss": 2.3398666381835938, "Pretrain/Loss (Raw)": 2.1378021240234375, "Pretrain/Step": 171, "Pretrain/Step Time": 8.543031165376306} +{"Pretrain/Learning Rate": 3.0069930069930068e-05, "Pretrain/Loss": 2.3401060104370117, "Pretrain/Loss (Raw)": 2.299453020095825, "Pretrain/Step": 172, "Pretrain/Step Time": 8.54370454698801} +{"Pretrain/Learning Rate": 3.0244755244755245e-05, "Pretrain/Loss": 2.3404250144958496, "Pretrain/Loss (Raw)": 2.334352493286133, "Pretrain/Step": 173, "Pretrain/Step Time": 8.545545967295766} +{"Pretrain/Learning Rate": 3.0419580419580425e-05, "Pretrain/Loss": 2.3406009674072266, "Pretrain/Loss (Raw)": 2.243414878845215, "Pretrain/Step": 174, "Pretrain/Step Time": 8.546356996521354} +{"Pretrain/Learning Rate": 3.0594405594405594e-05, "Pretrain/Loss": 2.3398680686950684, "Pretrain/Loss (Raw)": 2.3143839836120605, "Pretrain/Step": 175, "Pretrain/Step Time": 8.549843024462461} +{"Pretrain/Learning Rate": 3.0769230769230774e-05, "Pretrain/Loss": 2.336683988571167, "Pretrain/Loss (Raw)": 2.056325674057007, "Pretrain/Step": 176, "Pretrain/Step Time": 8.54839088767767} +{"Pretrain/Learning Rate": 3.094405594405594e-05, "Pretrain/Loss": 2.3382937908172607, "Pretrain/Loss (Raw)": 2.430447578430176, "Pretrain/Step": 177, "Pretrain/Step Time": 8.547132719308138} +{"Pretrain/Learning Rate": 3.111888111888112e-05, "Pretrain/Loss": 2.3379857540130615, "Pretrain/Loss (Raw)": 2.4211654663085938, "Pretrain/Step": 178, "Pretrain/Step Time": 8.54971069842577} +{"Pretrain/Learning Rate": 3.1293706293706294e-05, "Pretrain/Loss": 2.3352324962615967, "Pretrain/Loss (Raw)": 2.313612461090088, "Pretrain/Step": 179, "Pretrain/Step Time": 8.565327890217304} +{"Pretrain/Learning Rate": 3.146853146853147e-05, "Pretrain/Loss": 2.3388402462005615, "Pretrain/Loss (Raw)": 2.628382444381714, "Pretrain/Step": 180, "Pretrain/Step Time": 8.563991501927376} +{"Pretrain/Learning Rate": 3.164335664335665e-05, "Pretrain/Loss": 2.335988759994507, "Pretrain/Loss (Raw)": 2.3132917881011963, "Pretrain/Step": 181, "Pretrain/Step Time": 8.56278002075851} +{"Pretrain/Learning Rate": 3.181818181818182e-05, "Pretrain/Loss": 2.3350396156311035, "Pretrain/Loss (Raw)": 2.2023606300354004, "Pretrain/Step": 182, "Pretrain/Step Time": 8.564974594861269} +{"Pretrain/Learning Rate": 3.1993006993006994e-05, "Pretrain/Loss": 2.33479380607605, "Pretrain/Loss (Raw)": 2.348916530609131, "Pretrain/Step": 183, "Pretrain/Step Time": 8.566769022494555} +{"Pretrain/Learning Rate": 3.216783216783217e-05, "Pretrain/Loss": 2.330756902694702, "Pretrain/Loss (Raw)": 2.0136027336120605, "Pretrain/Step": 184, "Pretrain/Step Time": 8.56687731295824} +{"Pretrain/Learning Rate": 3.234265734265735e-05, "Pretrain/Loss": 2.3272206783294678, "Pretrain/Loss (Raw)": 2.1103031635284424, "Pretrain/Step": 185, "Pretrain/Step Time": 8.5667987447232} +{"Pretrain/Learning Rate": 3.251748251748252e-05, "Pretrain/Loss": 2.3262739181518555, "Pretrain/Loss (Raw)": 2.0845284461975098, "Pretrain/Step": 186, "Pretrain/Step Time": 8.577164044603705} +{"Pretrain/Learning Rate": 3.269230769230769e-05, "Pretrain/Loss": 2.3250675201416016, "Pretrain/Loss (Raw)": 2.226851463317871, "Pretrain/Step": 187, "Pretrain/Step Time": 8.578711152076721} +{"Pretrain/Learning Rate": 3.2867132867132866e-05, "Pretrain/Loss": 2.323208808898926, "Pretrain/Loss (Raw)": 1.9675184488296509, "Pretrain/Step": 188, "Pretrain/Step Time": 8.578045865520835} +{"Pretrain/Learning Rate": 3.3041958041958046e-05, "Pretrain/Loss": 2.3247740268707275, "Pretrain/Loss (Raw)": 2.470593214035034, "Pretrain/Step": 189, "Pretrain/Step Time": 8.572980251163244} +{"Pretrain/Learning Rate": 3.321678321678322e-05, "Pretrain/Loss": 2.323269844055176, "Pretrain/Loss (Raw)": 2.366067409515381, "Pretrain/Step": 190, "Pretrain/Step Time": 8.57251838222146} +{"Pretrain/Learning Rate": 3.339160839160839e-05, "Pretrain/Loss": 2.32527232170105, "Pretrain/Loss (Raw)": 2.4652562141418457, "Pretrain/Step": 191, "Pretrain/Step Time": 8.567347921431065} +{"Pretrain/Learning Rate": 3.356643356643357e-05, "Pretrain/Loss": 2.3262763023376465, "Pretrain/Loss (Raw)": 2.5710670948028564, "Pretrain/Step": 192, "Pretrain/Step Time": 8.569357242435217} +{"Pretrain/Learning Rate": 3.374125874125874e-05, "Pretrain/Loss": 2.3282954692840576, "Pretrain/Loss (Raw)": 2.332561492919922, "Pretrain/Step": 193, "Pretrain/Step Time": 8.572343852370977} +{"Pretrain/Learning Rate": 3.391608391608392e-05, "Pretrain/Loss": 2.325486898422241, "Pretrain/Loss (Raw)": 2.0958969593048096, "Pretrain/Step": 194, "Pretrain/Step Time": 8.578433614224195} +{"Pretrain/Learning Rate": 3.409090909090909e-05, "Pretrain/Loss": 2.325381278991699, "Pretrain/Loss (Raw)": 2.278731346130371, "Pretrain/Step": 195, "Pretrain/Step Time": 8.576753234490752} +{"Pretrain/Learning Rate": 3.4265734265734265e-05, "Pretrain/Loss": 2.32731556892395, "Pretrain/Loss (Raw)": 2.2077646255493164, "Pretrain/Step": 196, "Pretrain/Step Time": 8.579420380294323} +{"Pretrain/Learning Rate": 3.4440559440559445e-05, "Pretrain/Loss": 2.3241734504699707, "Pretrain/Loss (Raw)": 2.1894750595092773, "Pretrain/Step": 197, "Pretrain/Step Time": 8.578018935397267} +{"Pretrain/Learning Rate": 3.461538461538462e-05, "Pretrain/Loss": 2.325373649597168, "Pretrain/Loss (Raw)": 2.3989615440368652, "Pretrain/Step": 198, "Pretrain/Step Time": 8.582137916237116} +{"Pretrain/Learning Rate": 3.479020979020979e-05, "Pretrain/Loss": 2.3243160247802734, "Pretrain/Loss (Raw)": 2.3475723266601562, "Pretrain/Step": 199, "Pretrain/Step Time": 8.579547991976142} +{"Pretrain/Learning Rate": 3.4965034965034965e-05, "Pretrain/Loss": 2.3187992572784424, "Pretrain/Loss (Raw)": 2.24798846244812, "Pretrain/Step": 200, "Pretrain/Step Time": 8.582465661689639} +{"Pretrain/Learning Rate": 3.5139860139860145e-05, "Pretrain/Loss": 2.3204574584960938, "Pretrain/Loss (Raw)": 2.470688819885254, "Pretrain/Step": 201, "Pretrain/Step Time": 8.572267603129148} +{"Pretrain/Learning Rate": 3.531468531468531e-05, "Pretrain/Loss": 2.3210113048553467, "Pretrain/Loss (Raw)": 2.446866273880005, "Pretrain/Step": 202, "Pretrain/Step Time": 8.572615845128894} +{"Pretrain/Learning Rate": 3.548951048951049e-05, "Pretrain/Loss": 2.318929672241211, "Pretrain/Loss (Raw)": 2.174304485321045, "Pretrain/Step": 203, "Pretrain/Step Time": 8.562882160767913} +{"Pretrain/Learning Rate": 3.566433566433567e-05, "Pretrain/Loss": 2.3158209323883057, "Pretrain/Loss (Raw)": 2.149355173110962, "Pretrain/Step": 204, "Pretrain/Step Time": 8.567431826144457} +{"Pretrain/Learning Rate": 3.583916083916084e-05, "Pretrain/Loss": 2.3134403228759766, "Pretrain/Loss (Raw)": 2.0810301303863525, "Pretrain/Step": 205, "Pretrain/Step Time": 8.563813945278525} +{"Pretrain/Learning Rate": 3.601398601398602e-05, "Pretrain/Loss": 2.3137683868408203, "Pretrain/Loss (Raw)": 2.373666763305664, "Pretrain/Step": 206, "Pretrain/Step Time": 8.559164173901081} +{"Pretrain/Learning Rate": 3.618881118881119e-05, "Pretrain/Loss": 2.3123483657836914, "Pretrain/Loss (Raw)": 2.237300395965576, "Pretrain/Step": 207, "Pretrain/Step Time": 8.558405073359609} +{"Pretrain/Learning Rate": 3.6363636363636364e-05, "Pretrain/Loss": 2.3102777004241943, "Pretrain/Loss (Raw)": 1.9961013793945312, "Pretrain/Step": 208, "Pretrain/Step Time": 8.558845272287726} +{"Pretrain/Learning Rate": 3.653846153846154e-05, "Pretrain/Loss": 2.3078320026397705, "Pretrain/Loss (Raw)": 2.385946273803711, "Pretrain/Step": 209, "Pretrain/Step Time": 8.561581179499626} +{"Pretrain/Learning Rate": 3.671328671328672e-05, "Pretrain/Loss": 2.3070311546325684, "Pretrain/Loss (Raw)": 2.2492589950561523, "Pretrain/Step": 210, "Pretrain/Step Time": 8.556924477219582} +{"Pretrain/Learning Rate": 3.688811188811189e-05, "Pretrain/Loss": 2.3064513206481934, "Pretrain/Loss (Raw)": 2.3395349979400635, "Pretrain/Step": 211, "Pretrain/Step Time": 8.556057183071971} +{"Pretrain/Learning Rate": 3.7062937062937064e-05, "Pretrain/Loss": 2.3059046268463135, "Pretrain/Loss (Raw)": 2.182371139526367, "Pretrain/Step": 212, "Pretrain/Step Time": 8.561674850061536} +{"Pretrain/Learning Rate": 3.7237762237762244e-05, "Pretrain/Loss": 2.3046376705169678, "Pretrain/Loss (Raw)": 2.2298529148101807, "Pretrain/Step": 213, "Pretrain/Step Time": 8.557509206235409} +{"Pretrain/Learning Rate": 3.741258741258741e-05, "Pretrain/Loss": 2.3053314685821533, "Pretrain/Loss (Raw)": 2.2810072898864746, "Pretrain/Step": 214, "Pretrain/Step Time": 8.560179714113474} +{"Pretrain/Learning Rate": 3.758741258741259e-05, "Pretrain/Loss": 2.302476406097412, "Pretrain/Loss (Raw)": 2.1402642726898193, "Pretrain/Step": 215, "Pretrain/Step Time": 8.560033436864614} +{"Pretrain/Learning Rate": 3.776223776223776e-05, "Pretrain/Loss": 2.3010635375976562, "Pretrain/Loss (Raw)": 2.3114261627197266, "Pretrain/Step": 216, "Pretrain/Step Time": 8.567938972264528} +{"Pretrain/Learning Rate": 3.7937062937062936e-05, "Pretrain/Loss": 2.3040528297424316, "Pretrain/Loss (Raw)": 2.3988380432128906, "Pretrain/Step": 217, "Pretrain/Step Time": 8.572119884192944} +{"Pretrain/Learning Rate": 3.811188811188811e-05, "Pretrain/Loss": 2.304750680923462, "Pretrain/Loss (Raw)": 2.4613144397735596, "Pretrain/Step": 218, "Pretrain/Step Time": 8.567241836339235} +{"Pretrain/Learning Rate": 3.828671328671329e-05, "Pretrain/Loss": 2.30684757232666, "Pretrain/Loss (Raw)": 2.507966995239258, "Pretrain/Step": 219, "Pretrain/Step Time": 8.567891417071223} +{"Pretrain/Learning Rate": 3.846153846153846e-05, "Pretrain/Loss": 2.308389902114868, "Pretrain/Loss (Raw)": 2.175682544708252, "Pretrain/Step": 220, "Pretrain/Step Time": 8.56679635308683} +{"Pretrain/Learning Rate": 3.8636363636363636e-05, "Pretrain/Loss": 2.3061537742614746, "Pretrain/Loss (Raw)": 1.9624085426330566, "Pretrain/Step": 221, "Pretrain/Step Time": 8.562916403636336} +{"Pretrain/Learning Rate": 3.8811188811188816e-05, "Pretrain/Loss": 2.307417631149292, "Pretrain/Loss (Raw)": 2.186922550201416, "Pretrain/Step": 222, "Pretrain/Step Time": 8.561185812577605} +{"Pretrain/Learning Rate": 3.898601398601399e-05, "Pretrain/Loss": 2.3045005798339844, "Pretrain/Loss (Raw)": 1.9342604875564575, "Pretrain/Step": 223, "Pretrain/Step Time": 8.550763925537467} +{"Pretrain/Learning Rate": 3.916083916083916e-05, "Pretrain/Loss": 2.3032164573669434, "Pretrain/Loss (Raw)": 2.4215731620788574, "Pretrain/Step": 224, "Pretrain/Step Time": 8.552627375349402} +{"Pretrain/Learning Rate": 3.9335664335664336e-05, "Pretrain/Loss": 2.3046860694885254, "Pretrain/Loss (Raw)": 2.4102306365966797, "Pretrain/Step": 225, "Pretrain/Step Time": 8.554310977458954} +{"Pretrain/Learning Rate": 3.9510489510489516e-05, "Pretrain/Loss": 2.302593231201172, "Pretrain/Loss (Raw)": 2.085494041442871, "Pretrain/Step": 226, "Pretrain/Step Time": 8.5590233001858} +{"Pretrain/Learning Rate": 3.968531468531469e-05, "Pretrain/Loss": 2.303495407104492, "Pretrain/Loss (Raw)": 2.174171209335327, "Pretrain/Step": 227, "Pretrain/Step Time": 8.564704466611147} +{"Pretrain/Learning Rate": 3.986013986013986e-05, "Pretrain/Loss": 2.303788900375366, "Pretrain/Loss (Raw)": 2.3138952255249023, "Pretrain/Step": 228, "Pretrain/Step Time": 8.558910705149174} +{"Pretrain/Learning Rate": 4.0034965034965035e-05, "Pretrain/Loss": 2.304044485092163, "Pretrain/Loss (Raw)": 2.1824424266815186, "Pretrain/Step": 229, "Pretrain/Step Time": 8.55865933187306} +{"Pretrain/Learning Rate": 4.020979020979021e-05, "Pretrain/Loss": 2.30666446685791, "Pretrain/Loss (Raw)": 2.41195011138916, "Pretrain/Step": 230, "Pretrain/Step Time": 8.566791554912925} +{"Pretrain/Learning Rate": 4.038461538461539e-05, "Pretrain/Loss": 2.302959442138672, "Pretrain/Loss (Raw)": 2.4468300342559814, "Pretrain/Step": 231, "Pretrain/Step Time": 8.569778226315975} +{"Pretrain/Learning Rate": 4.055944055944056e-05, "Pretrain/Loss": 2.3009583950042725, "Pretrain/Loss (Raw)": 2.219834089279175, "Pretrain/Step": 232, "Pretrain/Step Time": 8.57127371430397} +{"Pretrain/Learning Rate": 4.0734265734265735e-05, "Pretrain/Loss": 2.300640344619751, "Pretrain/Loss (Raw)": 2.2568156719207764, "Pretrain/Step": 233, "Pretrain/Step Time": 8.572024747729301} +{"Pretrain/Learning Rate": 4.0909090909090915e-05, "Pretrain/Loss": 2.299684762954712, "Pretrain/Loss (Raw)": 2.21793794631958, "Pretrain/Step": 234, "Pretrain/Step Time": 8.571927709504962} +{"Pretrain/Learning Rate": 4.108391608391609e-05, "Pretrain/Loss": 2.2960143089294434, "Pretrain/Loss (Raw)": 1.9616069793701172, "Pretrain/Step": 235, "Pretrain/Step Time": 8.569900330156088} +{"Pretrain/Learning Rate": 4.125874125874126e-05, "Pretrain/Loss": 2.2911787033081055, "Pretrain/Loss (Raw)": 2.1847498416900635, "Pretrain/Step": 236, "Pretrain/Step Time": 8.57659506984055} +{"Pretrain/Learning Rate": 4.1433566433566434e-05, "Pretrain/Loss": 2.2906274795532227, "Pretrain/Loss (Raw)": 2.2594940662384033, "Pretrain/Step": 237, "Pretrain/Step Time": 8.579178273677826} +{"Pretrain/Learning Rate": 4.1608391608391614e-05, "Pretrain/Loss": 2.2903921604156494, "Pretrain/Loss (Raw)": 2.3750438690185547, "Pretrain/Step": 238, "Pretrain/Step Time": 8.566019836813211} +{"Pretrain/Learning Rate": 4.178321678321678e-05, "Pretrain/Loss": 2.2904767990112305, "Pretrain/Loss (Raw)": 2.1989026069641113, "Pretrain/Step": 239, "Pretrain/Step Time": 8.559922149404883} +{"Pretrain/Learning Rate": 4.195804195804196e-05, "Pretrain/Loss": 2.2884960174560547, "Pretrain/Loss (Raw)": 2.090630054473877, "Pretrain/Step": 240, "Pretrain/Step Time": 8.558143174275756} +{"Pretrain/Learning Rate": 4.213286713286714e-05, "Pretrain/Loss": 2.285933256149292, "Pretrain/Loss (Raw)": 2.086271286010742, "Pretrain/Step": 241, "Pretrain/Step Time": 8.560709169134498} +{"Pretrain/Learning Rate": 4.230769230769231e-05, "Pretrain/Loss": 2.2852635383605957, "Pretrain/Loss (Raw)": 2.216165781021118, "Pretrain/Step": 242, "Pretrain/Step Time": 8.55796917527914} +{"Pretrain/Learning Rate": 4.248251748251749e-05, "Pretrain/Loss": 2.2846555709838867, "Pretrain/Loss (Raw)": 2.3453240394592285, "Pretrain/Step": 243, "Pretrain/Step Time": 8.560853281989694} +{"Pretrain/Learning Rate": 4.265734265734266e-05, "Pretrain/Loss": 2.2817018032073975, "Pretrain/Loss (Raw)": 2.1954288482666016, "Pretrain/Step": 244, "Pretrain/Step Time": 8.55859050527215} +{"Pretrain/Learning Rate": 4.2832167832167833e-05, "Pretrain/Loss": 2.278427839279175, "Pretrain/Loss (Raw)": 1.9837901592254639, "Pretrain/Step": 245, "Pretrain/Step Time": 8.559984907507896} +{"Pretrain/Learning Rate": 4.300699300699301e-05, "Pretrain/Loss": 2.277984142303467, "Pretrain/Loss (Raw)": 2.2018423080444336, "Pretrain/Step": 246, "Pretrain/Step Time": 8.561704386025667} +{"Pretrain/Learning Rate": 4.318181818181819e-05, "Pretrain/Loss": 2.276228427886963, "Pretrain/Loss (Raw)": 2.3563060760498047, "Pretrain/Step": 247, "Pretrain/Step Time": 8.564581139013171} +{"Pretrain/Learning Rate": 4.335664335664335e-05, "Pretrain/Loss": 2.2764201164245605, "Pretrain/Loss (Raw)": 2.3473072052001953, "Pretrain/Step": 248, "Pretrain/Step Time": 8.555817106738687} +{"Pretrain/Learning Rate": 4.353146853146853e-05, "Pretrain/Loss": 2.2753515243530273, "Pretrain/Loss (Raw)": 2.085205316543579, "Pretrain/Step": 249, "Pretrain/Step Time": 8.558505052700639} +{"Pretrain/Learning Rate": 4.370629370629371e-05, "Pretrain/Loss": 2.275343894958496, "Pretrain/Loss (Raw)": 2.2392683029174805, "Pretrain/Step": 250, "Pretrain/Step Time": 8.560414968058467} +{"Pretrain/Learning Rate": 4.388111888111888e-05, "Pretrain/Loss": 2.2748045921325684, "Pretrain/Loss (Raw)": 2.201561450958252, "Pretrain/Step": 251, "Pretrain/Step Time": 8.560322945937514} +{"Pretrain/Learning Rate": 4.405594405594406e-05, "Pretrain/Loss": 2.272977590560913, "Pretrain/Loss (Raw)": 2.0478672981262207, "Pretrain/Step": 252, "Pretrain/Step Time": 8.559457946568727} +{"Pretrain/Learning Rate": 4.423076923076923e-05, "Pretrain/Loss": 2.2713963985443115, "Pretrain/Loss (Raw)": 2.3232831954956055, "Pretrain/Step": 253, "Pretrain/Step Time": 8.55556315369904} +{"Pretrain/Learning Rate": 4.4405594405594406e-05, "Pretrain/Loss": 2.2713065147399902, "Pretrain/Loss (Raw)": 2.2250571250915527, "Pretrain/Step": 254, "Pretrain/Step Time": 8.547492461279035} +{"Pretrain/Learning Rate": 4.458041958041958e-05, "Pretrain/Loss": 2.2673964500427246, "Pretrain/Loss (Raw)": 2.3416569232940674, "Pretrain/Step": 255, "Pretrain/Step Time": 8.550456890836358} +{"Pretrain/Learning Rate": 4.475524475524476e-05, "Pretrain/Loss": 2.2662954330444336, "Pretrain/Loss (Raw)": 2.2330355644226074, "Pretrain/Step": 256, "Pretrain/Step Time": 8.551400046795607} +{"Pretrain/Learning Rate": 4.493006993006993e-05, "Pretrain/Loss": 2.265739917755127, "Pretrain/Loss (Raw)": 2.2501511573791504, "Pretrain/Step": 257, "Pretrain/Step Time": 8.543022755533457} +{"Pretrain/Learning Rate": 4.5104895104895105e-05, "Pretrain/Loss": 2.2670857906341553, "Pretrain/Loss (Raw)": 2.281707763671875, "Pretrain/Step": 258, "Pretrain/Step Time": 8.5341232791543} +{"Pretrain/Learning Rate": 4.5279720279720285e-05, "Pretrain/Loss": 2.2682251930236816, "Pretrain/Loss (Raw)": 2.2050843238830566, "Pretrain/Step": 259, "Pretrain/Step Time": 8.542185045778751} +{"Pretrain/Learning Rate": 4.545454545454546e-05, "Pretrain/Loss": 2.2680413722991943, "Pretrain/Loss (Raw)": 2.215217351913452, "Pretrain/Step": 260, "Pretrain/Step Time": 8.545711427927017} +{"Pretrain/Learning Rate": 4.562937062937063e-05, "Pretrain/Loss": 2.266737937927246, "Pretrain/Loss (Raw)": 2.136826276779175, "Pretrain/Step": 261, "Pretrain/Step Time": 8.551129972562194} +{"Pretrain/Learning Rate": 4.5804195804195805e-05, "Pretrain/Loss": 2.2681896686553955, "Pretrain/Loss (Raw)": 2.260891914367676, "Pretrain/Step": 262, "Pretrain/Step Time": 8.549978153780103} +{"Pretrain/Learning Rate": 4.597902097902098e-05, "Pretrain/Loss": 2.2690248489379883, "Pretrain/Loss (Raw)": 2.3960254192352295, "Pretrain/Step": 263, "Pretrain/Step Time": 8.543274512514472} +{"Pretrain/Learning Rate": 4.615384615384616e-05, "Pretrain/Loss": 2.2703051567077637, "Pretrain/Loss (Raw)": 2.467074394226074, "Pretrain/Step": 264, "Pretrain/Step Time": 8.528572035953403} +{"Pretrain/Learning Rate": 4.632867132867133e-05, "Pretrain/Loss": 2.2707808017730713, "Pretrain/Loss (Raw)": 2.246518611907959, "Pretrain/Step": 265, "Pretrain/Step Time": 8.534966515377164} +{"Pretrain/Learning Rate": 4.6503496503496505e-05, "Pretrain/Loss": 2.269244432449341, "Pretrain/Loss (Raw)": 2.1989083290100098, "Pretrain/Step": 266, "Pretrain/Step Time": 8.53534128703177} +{"Pretrain/Learning Rate": 4.667832167832168e-05, "Pretrain/Loss": 2.26839542388916, "Pretrain/Loss (Raw)": 2.1961264610290527, "Pretrain/Step": 267, "Pretrain/Step Time": 8.540683034807444} +{"Pretrain/Learning Rate": 4.685314685314686e-05, "Pretrain/Loss": 2.269223213195801, "Pretrain/Loss (Raw)": 2.413536787033081, "Pretrain/Step": 268, "Pretrain/Step Time": 8.535276150330901} +{"Pretrain/Learning Rate": 4.702797202797203e-05, "Pretrain/Loss": 2.2687928676605225, "Pretrain/Loss (Raw)": 2.2844319343566895, "Pretrain/Step": 269, "Pretrain/Step Time": 8.533084582537413} +{"Pretrain/Learning Rate": 4.7202797202797204e-05, "Pretrain/Loss": 2.2648744583129883, "Pretrain/Loss (Raw)": 2.1074509620666504, "Pretrain/Step": 270, "Pretrain/Step Time": 8.53297458589077} +{"Pretrain/Learning Rate": 4.7377622377622384e-05, "Pretrain/Loss": 2.264462947845459, "Pretrain/Loss (Raw)": 2.0508041381835938, "Pretrain/Step": 271, "Pretrain/Step Time": 8.531545644626021} +{"Pretrain/Learning Rate": 4.755244755244756e-05, "Pretrain/Loss": 2.2636282444000244, "Pretrain/Loss (Raw)": 2.0674426555633545, "Pretrain/Step": 272, "Pretrain/Step Time": 8.5379340890795} +{"Pretrain/Learning Rate": 4.772727272727273e-05, "Pretrain/Loss": 2.2653262615203857, "Pretrain/Loss (Raw)": 2.4017248153686523, "Pretrain/Step": 273, "Pretrain/Step Time": 8.536465022712946} +{"Pretrain/Learning Rate": 4.7902097902097904e-05, "Pretrain/Loss": 2.2660629749298096, "Pretrain/Loss (Raw)": 2.254244327545166, "Pretrain/Step": 274, "Pretrain/Step Time": 8.536257984116673} +{"Pretrain/Learning Rate": 4.8076923076923084e-05, "Pretrain/Loss": 2.263357162475586, "Pretrain/Loss (Raw)": 2.363027334213257, "Pretrain/Step": 275, "Pretrain/Step Time": 8.540007628500462} +{"Pretrain/Learning Rate": 4.825174825174825e-05, "Pretrain/Loss": 2.263521432876587, "Pretrain/Loss (Raw)": 2.3948748111724854, "Pretrain/Step": 276, "Pretrain/Step Time": 8.52886238694191} +{"Pretrain/Learning Rate": 4.842657342657343e-05, "Pretrain/Loss": 2.263927936553955, "Pretrain/Loss (Raw)": 2.4373342990875244, "Pretrain/Step": 277, "Pretrain/Step Time": 8.522733483463526} +{"Pretrain/Learning Rate": 4.86013986013986e-05, "Pretrain/Loss": 2.263761520385742, "Pretrain/Loss (Raw)": 2.1865618228912354, "Pretrain/Step": 278, "Pretrain/Step Time": 8.531259326264262} +{"Pretrain/Learning Rate": 4.8776223776223776e-05, "Pretrain/Loss": 2.2625088691711426, "Pretrain/Loss (Raw)": 2.2382330894470215, "Pretrain/Step": 279, "Pretrain/Step Time": 8.52888641320169} +{"Pretrain/Learning Rate": 4.8951048951048956e-05, "Pretrain/Loss": 2.263352394104004, "Pretrain/Loss (Raw)": 2.3336336612701416, "Pretrain/Step": 280, "Pretrain/Step Time": 8.528933735564351} +{"Pretrain/Learning Rate": 4.912587412587413e-05, "Pretrain/Loss": 2.260204792022705, "Pretrain/Loss (Raw)": 2.0292274951934814, "Pretrain/Step": 281, "Pretrain/Step Time": 8.519627682864666} +{"Pretrain/Learning Rate": 4.93006993006993e-05, "Pretrain/Loss": 2.2594799995422363, "Pretrain/Loss (Raw)": 2.2898759841918945, "Pretrain/Step": 282, "Pretrain/Step Time": 8.526543628424406} +{"Pretrain/Learning Rate": 4.9475524475524476e-05, "Pretrain/Loss": 2.260188102722168, "Pretrain/Loss (Raw)": 2.4517738819122314, "Pretrain/Step": 283, "Pretrain/Step Time": 8.525486160069704} +{"Pretrain/Learning Rate": 4.9650349650349656e-05, "Pretrain/Loss": 2.258932590484619, "Pretrain/Loss (Raw)": 2.1786911487579346, "Pretrain/Step": 284, "Pretrain/Step Time": 8.528441226109862} +{"Pretrain/Learning Rate": 4.982517482517482e-05, "Pretrain/Loss": 2.2593977451324463, "Pretrain/Loss (Raw)": 2.2233777046203613, "Pretrain/Step": 285, "Pretrain/Step Time": 8.53290668874979} +{"Pretrain/Learning Rate": 5e-05, "Pretrain/Loss": 2.2584471702575684, "Pretrain/Loss (Raw)": 2.096931219100952, "Pretrain/Step": 286, "Pretrain/Step Time": 8.531822195276618} +{"Pretrain/Learning Rate": 4.9999998558441094e-05, "Pretrain/Loss": 2.2591261863708496, "Pretrain/Loss (Raw)": 2.2942962646484375, "Pretrain/Step": 287, "Pretrain/Step Time": 8.526497155427933} +{"Pretrain/Learning Rate": 4.999999423376456e-05, "Pretrain/Loss": 2.2599191665649414, "Pretrain/Loss (Raw)": 2.298232316970825, "Pretrain/Step": 288, "Pretrain/Step Time": 8.52672242000699} +{"Pretrain/Learning Rate": 4.9999987025970884e-05, "Pretrain/Loss": 2.2601613998413086, "Pretrain/Loss (Raw)": 2.2114336490631104, "Pretrain/Step": 289, "Pretrain/Step Time": 8.528088917955756} +{"Pretrain/Learning Rate": 4.99999769350609e-05, "Pretrain/Loss": 2.2580692768096924, "Pretrain/Loss (Raw)": 2.3388659954071045, "Pretrain/Step": 290, "Pretrain/Step Time": 8.527325440198183} +{"Pretrain/Learning Rate": 4.999996396103577e-05, "Pretrain/Loss": 2.259061813354492, "Pretrain/Loss (Raw)": 2.353269577026367, "Pretrain/Step": 291, "Pretrain/Step Time": 8.532321756705642} +{"Pretrain/Learning Rate": 4.999994810389699e-05, "Pretrain/Loss": 2.257032871246338, "Pretrain/Loss (Raw)": 2.1981139183044434, "Pretrain/Step": 292, "Pretrain/Step Time": 8.532300774008036} +{"Pretrain/Learning Rate": 4.999992936364639e-05, "Pretrain/Loss": 2.255007266998291, "Pretrain/Loss (Raw)": 2.115231990814209, "Pretrain/Step": 293, "Pretrain/Step Time": 8.53607896156609} +{"Pretrain/Learning Rate": 4.9999907740286136e-05, "Pretrain/Loss": 2.2520811557769775, "Pretrain/Loss (Raw)": 2.0149757862091064, "Pretrain/Step": 294, "Pretrain/Step Time": 8.541833272203803} +{"Pretrain/Learning Rate": 4.9999883233818724e-05, "Pretrain/Loss": 2.252767562866211, "Pretrain/Loss (Raw)": 2.1948347091674805, "Pretrain/Step": 295, "Pretrain/Step Time": 8.541067946702242} +{"Pretrain/Learning Rate": 4.999985584424696e-05, "Pretrain/Loss": 2.2501425743103027, "Pretrain/Loss (Raw)": 2.200282573699951, "Pretrain/Step": 296, "Pretrain/Step Time": 8.535798154771328} +{"Pretrain/Learning Rate": 4.999982557157403e-05, "Pretrain/Loss": 2.2504987716674805, "Pretrain/Loss (Raw)": 2.295383930206299, "Pretrain/Step": 297, "Pretrain/Step Time": 8.545931039378047} +{"Pretrain/Learning Rate": 4.9999792415803405e-05, "Pretrain/Loss": 2.2514142990112305, "Pretrain/Loss (Raw)": 2.2724132537841797, "Pretrain/Step": 298, "Pretrain/Step Time": 8.542602553963661} +{"Pretrain/Learning Rate": 4.999975637693892e-05, "Pretrain/Loss": 2.2517600059509277, "Pretrain/Loss (Raw)": 2.1820380687713623, "Pretrain/Step": 299, "Pretrain/Step Time": 8.543590031564236} +{"Pretrain/Learning Rate": 4.999971745498472e-05, "Pretrain/Loss": 2.2523231506347656, "Pretrain/Loss (Raw)": 2.371523141860962, "Pretrain/Step": 300, "Pretrain/Step Time": 8.546526746824384} +{"Pretrain/Learning Rate": 4.999967564994531e-05, "Pretrain/Loss": 2.252157688140869, "Pretrain/Loss (Raw)": 2.313185214996338, "Pretrain/Step": 301, "Pretrain/Step Time": 8.541861735284328} +{"Pretrain/Learning Rate": 4.999963096182549e-05, "Pretrain/Loss": 2.2518718242645264, "Pretrain/Loss (Raw)": 2.2068493366241455, "Pretrain/Step": 302, "Pretrain/Step Time": 8.54733007773757} +{"Pretrain/Learning Rate": 4.9999583390630435e-05, "Pretrain/Loss": 2.251504898071289, "Pretrain/Loss (Raw)": 2.2673819065093994, "Pretrain/Step": 303, "Pretrain/Step Time": 8.539976114407182} +{"Pretrain/Learning Rate": 4.999953293636562e-05, "Pretrain/Loss": 2.253840208053589, "Pretrain/Loss (Raw)": 2.355252265930176, "Pretrain/Step": 304, "Pretrain/Step Time": 8.539953913539648} +{"Pretrain/Learning Rate": 4.9999479599036856e-05, "Pretrain/Loss": 2.252232074737549, "Pretrain/Loss (Raw)": 2.2246079444885254, "Pretrain/Step": 305, "Pretrain/Step Time": 8.54298740811646} +{"Pretrain/Learning Rate": 4.9999423378650315e-05, "Pretrain/Loss": 2.2498011589050293, "Pretrain/Loss (Raw)": 2.110013961791992, "Pretrain/Step": 306, "Pretrain/Step Time": 8.541050581261516} +{"Pretrain/Learning Rate": 4.9999364275212466e-05, "Pretrain/Loss": 2.2477529048919678, "Pretrain/Loss (Raw)": 2.0514333248138428, "Pretrain/Step": 307, "Pretrain/Step Time": 8.525559931993484} +{"Pretrain/Learning Rate": 4.9999302288730126e-05, "Pretrain/Loss": 2.24869704246521, "Pretrain/Loss (Raw)": 2.7492332458496094, "Pretrain/Step": 308, "Pretrain/Step Time": 8.53807396069169} +{"Pretrain/Learning Rate": 4.9999237419210445e-05, "Pretrain/Loss": 2.2471604347229004, "Pretrain/Loss (Raw)": 2.116626501083374, "Pretrain/Step": 309, "Pretrain/Step Time": 8.538556564599276} +{"Pretrain/Learning Rate": 4.99991696666609e-05, "Pretrain/Loss": 2.2461836338043213, "Pretrain/Loss (Raw)": 2.0773253440856934, "Pretrain/Step": 310, "Pretrain/Step Time": 8.543318074196577} +{"Pretrain/Learning Rate": 4.999909903108932e-05, "Pretrain/Loss": 2.2474069595336914, "Pretrain/Loss (Raw)": 2.5055177211761475, "Pretrain/Step": 311, "Pretrain/Step Time": 8.546384355053306} +{"Pretrain/Learning Rate": 4.999902551250384e-05, "Pretrain/Loss": 2.247645139694214, "Pretrain/Loss (Raw)": 2.044055461883545, "Pretrain/Step": 312, "Pretrain/Step Time": 8.549929480999708} +{"Pretrain/Learning Rate": 4.999894911091293e-05, "Pretrain/Loss": 2.2470412254333496, "Pretrain/Loss (Raw)": 2.033013343811035, "Pretrain/Step": 313, "Pretrain/Step Time": 8.547799974679947} +{"Pretrain/Learning Rate": 4.999886982632541e-05, "Pretrain/Loss": 2.2488675117492676, "Pretrain/Loss (Raw)": 2.318325996398926, "Pretrain/Step": 314, "Pretrain/Step Time": 8.550514809787273} +{"Pretrain/Learning Rate": 4.999878765875042e-05, "Pretrain/Loss": 2.24751615524292, "Pretrain/Loss (Raw)": 2.0538337230682373, "Pretrain/Step": 315, "Pretrain/Step Time": 8.552051519975066} +{"Pretrain/Learning Rate": 4.999870260819745e-05, "Pretrain/Loss": 2.2493796348571777, "Pretrain/Loss (Raw)": 2.2060697078704834, "Pretrain/Step": 316, "Pretrain/Step Time": 8.55569508485496} +{"Pretrain/Learning Rate": 4.999861467467629e-05, "Pretrain/Loss": 2.2487480640411377, "Pretrain/Loss (Raw)": 2.3897314071655273, "Pretrain/Step": 317, "Pretrain/Step Time": 8.552758926525712} +{"Pretrain/Learning Rate": 4.9998523858197094e-05, "Pretrain/Loss": 2.2477316856384277, "Pretrain/Loss (Raw)": 2.2359986305236816, "Pretrain/Step": 318, "Pretrain/Step Time": 8.553632326424122} +{"Pretrain/Learning Rate": 4.999843015877032e-05, "Pretrain/Loss": 2.2449512481689453, "Pretrain/Loss (Raw)": 2.1093366146087646, "Pretrain/Step": 319, "Pretrain/Step Time": 8.55339627340436} +{"Pretrain/Learning Rate": 4.99983335764068e-05, "Pretrain/Loss": 2.242185592651367, "Pretrain/Loss (Raw)": 2.2170681953430176, "Pretrain/Step": 320, "Pretrain/Step Time": 8.558636842295527} +{"Pretrain/Learning Rate": 4.999823411111765e-05, "Pretrain/Loss": 2.240473508834839, "Pretrain/Loss (Raw)": 2.1134018898010254, "Pretrain/Step": 321, "Pretrain/Step Time": 8.556787144392729} +{"Pretrain/Learning Rate": 4.999813176291433e-05, "Pretrain/Loss": 2.2420151233673096, "Pretrain/Loss (Raw)": 2.2932305335998535, "Pretrain/Step": 322, "Pretrain/Step Time": 8.554501090198755} +{"Pretrain/Learning Rate": 4.999802653180868e-05, "Pretrain/Loss": 2.240936756134033, "Pretrain/Loss (Raw)": 2.140692710876465, "Pretrain/Step": 323, "Pretrain/Step Time": 8.556128963828087} +{"Pretrain/Learning Rate": 4.9997918417812805e-05, "Pretrain/Loss": 2.2397470474243164, "Pretrain/Loss (Raw)": 2.055464029312134, "Pretrain/Step": 324, "Pretrain/Step Time": 8.55300355143845} +{"Pretrain/Learning Rate": 4.999780742093919e-05, "Pretrain/Loss": 2.239051103591919, "Pretrain/Loss (Raw)": 2.1004221439361572, "Pretrain/Step": 325, "Pretrain/Step Time": 8.558224206790328} +{"Pretrain/Learning Rate": 4.999769354120063e-05, "Pretrain/Loss": 2.238616943359375, "Pretrain/Loss (Raw)": 2.343418598175049, "Pretrain/Step": 326, "Pretrain/Step Time": 8.56170872040093} +{"Pretrain/Learning Rate": 4.9997576778610254e-05, "Pretrain/Loss": 2.2380242347717285, "Pretrain/Loss (Raw)": 2.2716915607452393, "Pretrain/Step": 327, "Pretrain/Step Time": 8.562897587195039} +{"Pretrain/Learning Rate": 4.999745713318154e-05, "Pretrain/Loss": 2.2376129627227783, "Pretrain/Loss (Raw)": 2.195340633392334, "Pretrain/Step": 328, "Pretrain/Step Time": 8.56467286683619} +{"Pretrain/Learning Rate": 4.999733460492826e-05, "Pretrain/Loss": 2.234522581100464, "Pretrain/Loss (Raw)": 2.0751147270202637, "Pretrain/Step": 329, "Pretrain/Step Time": 8.556751511991024} +{"Pretrain/Learning Rate": 4.999720919386457e-05, "Pretrain/Loss": 2.230733633041382, "Pretrain/Loss (Raw)": 1.9618968963623047, "Pretrain/Step": 330, "Pretrain/Step Time": 8.55568160302937} +{"Pretrain/Learning Rate": 4.999708090000493e-05, "Pretrain/Loss": 2.230825424194336, "Pretrain/Loss (Raw)": 2.1860318183898926, "Pretrain/Step": 331, "Pretrain/Step Time": 8.561422543600202} +{"Pretrain/Learning Rate": 4.999694972336413e-05, "Pretrain/Loss": 2.2338995933532715, "Pretrain/Loss (Raw)": 2.5428380966186523, "Pretrain/Step": 332, "Pretrain/Step Time": 8.568744672462344} +{"Pretrain/Learning Rate": 4.9996815663957296e-05, "Pretrain/Loss": 2.2353904247283936, "Pretrain/Loss (Raw)": 2.271876096725464, "Pretrain/Step": 333, "Pretrain/Step Time": 8.566245323047042} +{"Pretrain/Learning Rate": 4.9996678721799893e-05, "Pretrain/Loss": 2.2333335876464844, "Pretrain/Loss (Raw)": 2.110403537750244, "Pretrain/Step": 334, "Pretrain/Step Time": 8.566187780350447} +{"Pretrain/Learning Rate": 4.999653889690771e-05, "Pretrain/Loss": 2.232489585876465, "Pretrain/Loss (Raw)": 2.1292691230773926, "Pretrain/Step": 335, "Pretrain/Step Time": 8.562761941924691} +{"Pretrain/Learning Rate": 4.9996396189296865e-05, "Pretrain/Loss": 2.234957218170166, "Pretrain/Loss (Raw)": 2.311918020248413, "Pretrain/Step": 336, "Pretrain/Step Time": 8.565986504778266} +{"Pretrain/Learning Rate": 4.999625059898384e-05, "Pretrain/Loss": 2.233598470687866, "Pretrain/Loss (Raw)": 2.2120630741119385, "Pretrain/Step": 337, "Pretrain/Step Time": 8.561370654031634} +{"Pretrain/Learning Rate": 4.99961021259854e-05, "Pretrain/Loss": 2.2398228645324707, "Pretrain/Loss (Raw)": 3.0459818840026855, "Pretrain/Step": 338, "Pretrain/Step Time": 8.573914490640163} +{"Pretrain/Learning Rate": 4.999595077031868e-05, "Pretrain/Loss": 2.2374825477600098, "Pretrain/Loss (Raw)": 2.0399889945983887, "Pretrain/Step": 339, "Pretrain/Step Time": 8.574189217761159} +{"Pretrain/Learning Rate": 4.9995796532001136e-05, "Pretrain/Loss": 2.237032413482666, "Pretrain/Loss (Raw)": 2.124713897705078, "Pretrain/Step": 340, "Pretrain/Step Time": 8.57248598150909} +{"Pretrain/Learning Rate": 4.999563941105054e-05, "Pretrain/Loss": 2.2366323471069336, "Pretrain/Loss (Raw)": 2.1786694526672363, "Pretrain/Step": 341, "Pretrain/Step Time": 8.566579163074493} +{"Pretrain/Learning Rate": 4.9995479407485035e-05, "Pretrain/Loss": 2.236144542694092, "Pretrain/Loss (Raw)": 2.218569755554199, "Pretrain/Step": 342, "Pretrain/Step Time": 8.557650806382298} +{"Pretrain/Learning Rate": 4.9995316521323066e-05, "Pretrain/Loss": 2.235430955886841, "Pretrain/Loss (Raw)": 2.048910140991211, "Pretrain/Step": 343, "Pretrain/Step Time": 8.560360634699464} +{"Pretrain/Learning Rate": 4.99951507525834e-05, "Pretrain/Loss": 2.2346887588500977, "Pretrain/Loss (Raw)": 2.2164220809936523, "Pretrain/Step": 344, "Pretrain/Step Time": 8.567634241655469} +{"Pretrain/Learning Rate": 4.999498210128518e-05, "Pretrain/Loss": 2.2337653636932373, "Pretrain/Loss (Raw)": 2.2806475162506104, "Pretrain/Step": 345, "Pretrain/Step Time": 8.560707392171025} +{"Pretrain/Learning Rate": 4.9994810567447834e-05, "Pretrain/Loss": 2.233358383178711, "Pretrain/Loss (Raw)": 2.4092206954956055, "Pretrain/Step": 346, "Pretrain/Step Time": 8.561539398506284} +{"Pretrain/Learning Rate": 4.9994636151091165e-05, "Pretrain/Loss": 2.2302639484405518, "Pretrain/Loss (Raw)": 2.111881732940674, "Pretrain/Step": 347, "Pretrain/Step Time": 8.554091185331345} +{"Pretrain/Learning Rate": 4.999445885223527e-05, "Pretrain/Loss": 2.2304415702819824, "Pretrain/Loss (Raw)": 2.198395252227783, "Pretrain/Step": 348, "Pretrain/Step Time": 8.55684701539576} +{"Pretrain/Learning Rate": 4.99942786709006e-05, "Pretrain/Loss": 2.2324604988098145, "Pretrain/Loss (Raw)": 2.2208542823791504, "Pretrain/Step": 349, "Pretrain/Step Time": 8.56241936609149} +{"Pretrain/Learning Rate": 4.999409560710794e-05, "Pretrain/Loss": 2.2326102256774902, "Pretrain/Loss (Raw)": 2.206094980239868, "Pretrain/Step": 350, "Pretrain/Step Time": 8.557837530970573} +{"Pretrain/Learning Rate": 4.99939096608784e-05, "Pretrain/Loss": 2.2340641021728516, "Pretrain/Loss (Raw)": 2.1203553676605225, "Pretrain/Step": 351, "Pretrain/Step Time": 8.564628463238478} +{"Pretrain/Learning Rate": 4.999372083223343e-05, "Pretrain/Loss": 2.230431079864502, "Pretrain/Loss (Raw)": 1.9565194845199585, "Pretrain/Step": 352, "Pretrain/Step Time": 8.55194060690701} +{"Pretrain/Learning Rate": 4.999352912119478e-05, "Pretrain/Loss": 2.2290756702423096, "Pretrain/Loss (Raw)": 2.2367594242095947, "Pretrain/Step": 353, "Pretrain/Step Time": 8.54957851022482} +{"Pretrain/Learning Rate": 4.999333452778459e-05, "Pretrain/Loss": 2.2293930053710938, "Pretrain/Loss (Raw)": 2.1261112689971924, "Pretrain/Step": 354, "Pretrain/Step Time": 8.550121396780014} +{"Pretrain/Learning Rate": 4.999313705202529e-05, "Pretrain/Loss": 2.2309913635253906, "Pretrain/Loss (Raw)": 2.378774642944336, "Pretrain/Step": 355, "Pretrain/Step Time": 8.548043433576822} +{"Pretrain/Learning Rate": 4.999293669393965e-05, "Pretrain/Loss": 2.230644941329956, "Pretrain/Loss (Raw)": 2.2695415019989014, "Pretrain/Step": 356, "Pretrain/Step Time": 8.554402569308877} +{"Pretrain/Learning Rate": 4.999273345355078e-05, "Pretrain/Loss": 2.2303109169006348, "Pretrain/Loss (Raw)": 2.1397085189819336, "Pretrain/Step": 357, "Pretrain/Step Time": 8.551253436133265} +{"Pretrain/Learning Rate": 4.9992527330882125e-05, "Pretrain/Loss": 2.2301459312438965, "Pretrain/Loss (Raw)": 2.39078950881958, "Pretrain/Step": 358, "Pretrain/Step Time": 8.547278724610806} +{"Pretrain/Learning Rate": 4.999231832595744e-05, "Pretrain/Loss": 2.2271206378936768, "Pretrain/Loss (Raw)": 2.0595881938934326, "Pretrain/Step": 359, "Pretrain/Step Time": 8.545666463673115} +{"Pretrain/Learning Rate": 4.9992106438800846e-05, "Pretrain/Loss": 2.226593494415283, "Pretrain/Loss (Raw)": 2.152404308319092, "Pretrain/Step": 360, "Pretrain/Step Time": 8.545250179246068} +{"Pretrain/Learning Rate": 4.999189166943677e-05, "Pretrain/Loss": 2.2247426509857178, "Pretrain/Loss (Raw)": 2.019867181777954, "Pretrain/Step": 361, "Pretrain/Step Time": 8.546429315581918} +{"Pretrain/Learning Rate": 4.999167401788998e-05, "Pretrain/Loss": 2.225490093231201, "Pretrain/Loss (Raw)": 2.313626766204834, "Pretrain/Step": 362, "Pretrain/Step Time": 8.548825412988663} +{"Pretrain/Learning Rate": 4.9991453484185577e-05, "Pretrain/Loss": 2.227395534515381, "Pretrain/Loss (Raw)": 2.205496311187744, "Pretrain/Step": 363, "Pretrain/Step Time": 8.549343736842275} +{"Pretrain/Learning Rate": 4.999123006834899e-05, "Pretrain/Loss": 2.2287707328796387, "Pretrain/Loss (Raw)": 2.3607583045959473, "Pretrain/Step": 364, "Pretrain/Step Time": 8.544557478278875} +{"Pretrain/Learning Rate": 4.9991003770405994e-05, "Pretrain/Loss": 2.227684736251831, "Pretrain/Loss (Raw)": 2.120493173599243, "Pretrain/Step": 365, "Pretrain/Step Time": 8.537981737405062} +{"Pretrain/Learning Rate": 4.999077459038268e-05, "Pretrain/Loss": 2.223604679107666, "Pretrain/Loss (Raw)": 1.8528355360031128, "Pretrain/Step": 366, "Pretrain/Step Time": 8.536167992278934} +{"Pretrain/Learning Rate": 4.9990542528305484e-05, "Pretrain/Loss": 2.224252462387085, "Pretrain/Loss (Raw)": 2.281790256500244, "Pretrain/Step": 367, "Pretrain/Step Time": 8.536097526550293} +{"Pretrain/Learning Rate": 4.999030758420116e-05, "Pretrain/Loss": 2.227750062942505, "Pretrain/Loss (Raw)": 2.538315773010254, "Pretrain/Step": 368, "Pretrain/Step Time": 8.544609447941184} +{"Pretrain/Learning Rate": 4.999006975809681e-05, "Pretrain/Loss": 2.228814125061035, "Pretrain/Loss (Raw)": 2.222456693649292, "Pretrain/Step": 369, "Pretrain/Step Time": 8.53895447589457} +{"Pretrain/Learning Rate": 4.998982905001986e-05, "Pretrain/Loss": 2.2270708084106445, "Pretrain/Loss (Raw)": 1.993064045906067, "Pretrain/Step": 370, "Pretrain/Step Time": 8.5410309843719} +{"Pretrain/Learning Rate": 4.998958545999806e-05, "Pretrain/Loss": 2.228653907775879, "Pretrain/Loss (Raw)": 2.547933578491211, "Pretrain/Step": 371, "Pretrain/Step Time": 8.53874371573329} +{"Pretrain/Learning Rate": 4.998933898805951e-05, "Pretrain/Loss": 2.2290263175964355, "Pretrain/Loss (Raw)": 2.243101119995117, "Pretrain/Step": 372, "Pretrain/Step Time": 8.534807598218322} +{"Pretrain/Learning Rate": 4.9989089634232645e-05, "Pretrain/Loss": 2.2294888496398926, "Pretrain/Loss (Raw)": 2.0430195331573486, "Pretrain/Step": 373, "Pretrain/Step Time": 8.53666515648365} +{"Pretrain/Learning Rate": 4.9988837398546206e-05, "Pretrain/Loss": 2.2289013862609863, "Pretrain/Loss (Raw)": 2.1266088485717773, "Pretrain/Step": 374, "Pretrain/Step Time": 8.538690902292728} +{"Pretrain/Learning Rate": 4.9988582281029284e-05, "Pretrain/Loss": 2.2291626930236816, "Pretrain/Loss (Raw)": 2.389761209487915, "Pretrain/Step": 375, "Pretrain/Step Time": 8.535453835502267} +{"Pretrain/Learning Rate": 4.998832428171131e-05, "Pretrain/Loss": 2.228353977203369, "Pretrain/Loss (Raw)": 2.243800163269043, "Pretrain/Step": 376, "Pretrain/Step Time": 8.544775674119592} +{"Pretrain/Learning Rate": 4.998806340062202e-05, "Pretrain/Loss": 2.2294740676879883, "Pretrain/Loss (Raw)": 2.2285895347595215, "Pretrain/Step": 377, "Pretrain/Step Time": 8.539819775149226} +{"Pretrain/Learning Rate": 4.998779963779152e-05, "Pretrain/Loss": 2.229448080062866, "Pretrain/Loss (Raw)": 2.2359485626220703, "Pretrain/Step": 378, "Pretrain/Step Time": 8.541376322507858} +{"Pretrain/Learning Rate": 4.998753299325021e-05, "Pretrain/Loss": 2.2310330867767334, "Pretrain/Loss (Raw)": 2.4044134616851807, "Pretrain/Step": 379, "Pretrain/Step Time": 8.539100533351302} +{"Pretrain/Learning Rate": 4.998726346702886e-05, "Pretrain/Loss": 2.2317891120910645, "Pretrain/Loss (Raw)": 2.1446433067321777, "Pretrain/Step": 380, "Pretrain/Step Time": 8.54877888225019} +{"Pretrain/Learning Rate": 4.998699105915854e-05, "Pretrain/Loss": 2.2310612201690674, "Pretrain/Loss (Raw)": 2.2301015853881836, "Pretrain/Step": 381, "Pretrain/Step Time": 8.545713232830167} +{"Pretrain/Learning Rate": 4.9986715769670665e-05, "Pretrain/Loss": 2.2298521995544434, "Pretrain/Loss (Raw)": 2.0702946186065674, "Pretrain/Step": 382, "Pretrain/Step Time": 8.553358163684607} +{"Pretrain/Learning Rate": 4.998643759859699e-05, "Pretrain/Loss": 2.230344295501709, "Pretrain/Loss (Raw)": 2.4046757221221924, "Pretrain/Step": 383, "Pretrain/Step Time": 8.548942785710096} +{"Pretrain/Learning Rate": 4.998615654596959e-05, "Pretrain/Loss": 2.2292263507843018, "Pretrain/Loss (Raw)": 2.089916706085205, "Pretrain/Step": 384, "Pretrain/Step Time": 8.547954836860299} +{"Pretrain/Learning Rate": 4.9985872611820885e-05, "Pretrain/Loss": 2.22823429107666, "Pretrain/Loss (Raw)": 2.1231741905212402, "Pretrain/Step": 385, "Pretrain/Step Time": 8.544136215001345} +{"Pretrain/Learning Rate": 4.9985585796183605e-05, "Pretrain/Loss": 2.2285947799682617, "Pretrain/Loss (Raw)": 2.327840805053711, "Pretrain/Step": 386, "Pretrain/Step Time": 8.543805534020066} +{"Pretrain/Learning Rate": 4.998529609909084e-05, "Pretrain/Loss": 2.226270914077759, "Pretrain/Loss (Raw)": 1.9076368808746338, "Pretrain/Step": 387, "Pretrain/Step Time": 8.545487772673368} +{"Pretrain/Learning Rate": 4.998500352057599e-05, "Pretrain/Loss": 2.225100040435791, "Pretrain/Loss (Raw)": 2.0653488636016846, "Pretrain/Step": 388, "Pretrain/Step Time": 8.545168709009886} +{"Pretrain/Learning Rate": 4.9984708060672805e-05, "Pretrain/Loss": 2.2229316234588623, "Pretrain/Loss (Raw)": 1.85927414894104, "Pretrain/Step": 389, "Pretrain/Step Time": 8.54016362503171} +{"Pretrain/Learning Rate": 4.9984409719415345e-05, "Pretrain/Loss": 2.2222697734832764, "Pretrain/Loss (Raw)": 2.1761717796325684, "Pretrain/Step": 390, "Pretrain/Step Time": 8.540449602529407} +{"Pretrain/Learning Rate": 4.9984108496838034e-05, "Pretrain/Loss": 2.221200942993164, "Pretrain/Loss (Raw)": 2.2592034339904785, "Pretrain/Step": 391, "Pretrain/Step Time": 8.54279044084251} +{"Pretrain/Learning Rate": 4.99838043929756e-05, "Pretrain/Loss": 2.2193386554718018, "Pretrain/Loss (Raw)": 2.2287161350250244, "Pretrain/Step": 392, "Pretrain/Step Time": 8.5465041808784} +{"Pretrain/Learning Rate": 4.9983497407863114e-05, "Pretrain/Loss": 2.2185802459716797, "Pretrain/Loss (Raw)": 2.1494507789611816, "Pretrain/Step": 393, "Pretrain/Step Time": 8.536932315677404} +{"Pretrain/Learning Rate": 4.9983187541535984e-05, "Pretrain/Loss": 2.2196431159973145, "Pretrain/Loss (Raw)": 2.334942102432251, "Pretrain/Step": 394, "Pretrain/Step Time": 8.542938135564327} +{"Pretrain/Learning Rate": 4.998287479402994e-05, "Pretrain/Loss": 2.2197437286376953, "Pretrain/Loss (Raw)": 2.208984375, "Pretrain/Step": 395, "Pretrain/Step Time": 8.53758493065834} +{"Pretrain/Learning Rate": 4.998255916538106e-05, "Pretrain/Loss": 2.217949867248535, "Pretrain/Loss (Raw)": 2.183950185775757, "Pretrain/Step": 396, "Pretrain/Step Time": 8.540282240137458} +{"Pretrain/Learning Rate": 4.998224065562572e-05, "Pretrain/Loss": 2.216510772705078, "Pretrain/Loss (Raw)": 2.1002094745635986, "Pretrain/Step": 397, "Pretrain/Step Time": 8.53824325837195} +{"Pretrain/Learning Rate": 4.998191926480068e-05, "Pretrain/Loss": 2.2174651622772217, "Pretrain/Loss (Raw)": 2.2296249866485596, "Pretrain/Step": 398, "Pretrain/Step Time": 8.54255260899663} +{"Pretrain/Learning Rate": 4.998159499294299e-05, "Pretrain/Loss": 2.218189239501953, "Pretrain/Loss (Raw)": 2.1434929370880127, "Pretrain/Step": 399, "Pretrain/Step Time": 8.542343996465206} +{"Pretrain/Learning Rate": 4.998126784009005e-05, "Pretrain/Loss": 2.2205464839935303, "Pretrain/Loss (Raw)": 2.369158983230591, "Pretrain/Step": 400, "Pretrain/Step Time": 8.542504943907261} +{"Pretrain/Learning Rate": 4.998093780627958e-05, "Pretrain/Loss": 2.218136787414551, "Pretrain/Loss (Raw)": 2.0933165550231934, "Pretrain/Step": 401, "Pretrain/Step Time": 8.545726073905826} +{"Pretrain/Learning Rate": 4.9980604891549656e-05, "Pretrain/Loss": 2.217090606689453, "Pretrain/Loss (Raw)": 2.120326042175293, "Pretrain/Step": 402, "Pretrain/Step Time": 8.545932959765196} +{"Pretrain/Learning Rate": 4.998026909593865e-05, "Pretrain/Loss": 2.214629650115967, "Pretrain/Loss (Raw)": 2.0479815006256104, "Pretrain/Step": 403, "Pretrain/Step Time": 8.543044475838542} +{"Pretrain/Learning Rate": 4.997993041948531e-05, "Pretrain/Loss": 2.213388681411743, "Pretrain/Loss (Raw)": 2.2360575199127197, "Pretrain/Step": 404, "Pretrain/Step Time": 8.544076608493924} +{"Pretrain/Learning Rate": 4.997958886222869e-05, "Pretrain/Loss": 2.212402820587158, "Pretrain/Loss (Raw)": 2.3111374378204346, "Pretrain/Step": 405, "Pretrain/Step Time": 8.554145440459251} +{"Pretrain/Learning Rate": 4.9979244424208165e-05, "Pretrain/Loss": 2.2137815952301025, "Pretrain/Loss (Raw)": 2.363053321838379, "Pretrain/Step": 406, "Pretrain/Step Time": 8.543367544189095} +{"Pretrain/Learning Rate": 4.997889710546347e-05, "Pretrain/Loss": 2.2139840126037598, "Pretrain/Loss (Raw)": 2.2641568183898926, "Pretrain/Step": 407, "Pretrain/Step Time": 8.551571695134044} +{"Pretrain/Learning Rate": 4.9978546906034655e-05, "Pretrain/Loss": 2.2135226726531982, "Pretrain/Loss (Raw)": 2.2745702266693115, "Pretrain/Step": 408, "Pretrain/Step Time": 8.550537083297968} +{"Pretrain/Learning Rate": 4.997819382596212e-05, "Pretrain/Loss": 2.2146859169006348, "Pretrain/Loss (Raw)": 2.178135871887207, "Pretrain/Step": 409, "Pretrain/Step Time": 8.553065437823534} +{"Pretrain/Learning Rate": 4.997783786528656e-05, "Pretrain/Loss": 2.2142205238342285, "Pretrain/Loss (Raw)": 2.2302756309509277, "Pretrain/Step": 410, "Pretrain/Step Time": 8.54107029736042} +{"Pretrain/Learning Rate": 4.997747902404904e-05, "Pretrain/Loss": 2.21350359916687, "Pretrain/Loss (Raw)": 2.360018491744995, "Pretrain/Step": 411, "Pretrain/Step Time": 8.553609754890203} +{"Pretrain/Learning Rate": 4.997711730229094e-05, "Pretrain/Loss": 2.213027238845825, "Pretrain/Loss (Raw)": 2.117713689804077, "Pretrain/Step": 412, "Pretrain/Step Time": 8.543071806430817} +{"Pretrain/Learning Rate": 4.9976752700053975e-05, "Pretrain/Loss": 2.213857650756836, "Pretrain/Loss (Raw)": 2.329683780670166, "Pretrain/Step": 413, "Pretrain/Step Time": 8.54158940911293} +{"Pretrain/Learning Rate": 4.9976385217380195e-05, "Pretrain/Loss": 2.215904712677002, "Pretrain/Loss (Raw)": 2.358962059020996, "Pretrain/Step": 414, "Pretrain/Step Time": 8.540699711069465} +{"Pretrain/Learning Rate": 4.997601485431198e-05, "Pretrain/Loss": 2.215423822402954, "Pretrain/Loss (Raw)": 2.2327280044555664, "Pretrain/Step": 415, "Pretrain/Step Time": 8.541577845811844} +{"Pretrain/Learning Rate": 4.997564161089204e-05, "Pretrain/Loss": 2.216182231903076, "Pretrain/Loss (Raw)": 2.3952813148498535, "Pretrain/Step": 416, "Pretrain/Step Time": 8.541081476956606} +{"Pretrain/Learning Rate": 4.9975265487163424e-05, "Pretrain/Loss": 2.2161364555358887, "Pretrain/Loss (Raw)": 2.205573320388794, "Pretrain/Step": 417, "Pretrain/Step Time": 8.540987199172378} +{"Pretrain/Learning Rate": 4.997488648316951e-05, "Pretrain/Loss": 2.215567111968994, "Pretrain/Loss (Raw)": 2.2660436630249023, "Pretrain/Step": 418, "Pretrain/Step Time": 8.54146914742887} +{"Pretrain/Learning Rate": 4.997450459895399e-05, "Pretrain/Loss": 2.215066432952881, "Pretrain/Loss (Raw)": 2.2891743183135986, "Pretrain/Step": 419, "Pretrain/Step Time": 8.541121562942863} +{"Pretrain/Learning Rate": 4.997411983456092e-05, "Pretrain/Loss": 2.21626353263855, "Pretrain/Loss (Raw)": 2.3513245582580566, "Pretrain/Step": 420, "Pretrain/Step Time": 8.544763630256057} +{"Pretrain/Learning Rate": 4.9973732190034674e-05, "Pretrain/Loss": 2.216765880584717, "Pretrain/Loss (Raw)": 2.179542064666748, "Pretrain/Step": 421, "Pretrain/Step Time": 8.541802575811744} +{"Pretrain/Learning Rate": 4.9973341665419946e-05, "Pretrain/Loss": 2.2191200256347656, "Pretrain/Loss (Raw)": 2.316321849822998, "Pretrain/Step": 422, "Pretrain/Step Time": 8.538866881281137} +{"Pretrain/Learning Rate": 4.997294826076178e-05, "Pretrain/Loss": 2.2183680534362793, "Pretrain/Loss (Raw)": 2.098567485809326, "Pretrain/Step": 423, "Pretrain/Step Time": 8.544915206730366} +{"Pretrain/Learning Rate": 4.9972551976105545e-05, "Pretrain/Loss": 2.2180638313293457, "Pretrain/Loss (Raw)": 2.161343812942505, "Pretrain/Step": 424, "Pretrain/Step Time": 8.54729837179184} +{"Pretrain/Learning Rate": 4.9972152811496945e-05, "Pretrain/Loss": 2.2177038192749023, "Pretrain/Loss (Raw)": 2.249271869659424, "Pretrain/Step": 425, "Pretrain/Step Time": 8.536045646294951} +{"Pretrain/Learning Rate": 4.9971750766982e-05, "Pretrain/Loss": 2.2182252407073975, "Pretrain/Loss (Raw)": 2.3391783237457275, "Pretrain/Step": 426, "Pretrain/Step Time": 8.542565720155835} +{"Pretrain/Learning Rate": 4.9971345842607095e-05, "Pretrain/Loss": 2.2184500694274902, "Pretrain/Loss (Raw)": 2.210794687271118, "Pretrain/Step": 427, "Pretrain/Step Time": 8.544722653925419} +{"Pretrain/Learning Rate": 4.997093803841891e-05, "Pretrain/Loss": 2.2179083824157715, "Pretrain/Loss (Raw)": 2.3021984100341797, "Pretrain/Step": 428, "Pretrain/Step Time": 8.542021475732327} +{"Pretrain/Learning Rate": 4.997052735446449e-05, "Pretrain/Loss": 2.2169811725616455, "Pretrain/Loss (Raw)": 2.194498062133789, "Pretrain/Step": 429, "Pretrain/Step Time": 8.55440748296678} +{"Pretrain/Learning Rate": 4.997011379079119e-05, "Pretrain/Loss": 2.2188522815704346, "Pretrain/Loss (Raw)": 2.446370840072632, "Pretrain/Step": 430, "Pretrain/Step Time": 8.548924898728728} +{"Pretrain/Learning Rate": 4.996969734744671e-05, "Pretrain/Loss": 2.21781063079834, "Pretrain/Loss (Raw)": 2.134056806564331, "Pretrain/Step": 431, "Pretrain/Step Time": 8.551651472225785} +{"Pretrain/Learning Rate": 4.996927802447906e-05, "Pretrain/Loss": 2.215853691101074, "Pretrain/Loss (Raw)": 2.104719638824463, "Pretrain/Step": 432, "Pretrain/Step Time": 8.55356946773827} +{"Pretrain/Learning Rate": 4.9968855821936613e-05, "Pretrain/Loss": 2.2163684368133545, "Pretrain/Loss (Raw)": 2.2905218601226807, "Pretrain/Step": 433, "Pretrain/Step Time": 8.551740014925599} +{"Pretrain/Learning Rate": 4.9968430739868056e-05, "Pretrain/Loss": 2.2173056602478027, "Pretrain/Loss (Raw)": 2.2300074100494385, "Pretrain/Step": 434, "Pretrain/Step Time": 8.552548807114363} +{"Pretrain/Learning Rate": 4.9968002778322406e-05, "Pretrain/Loss": 2.2188618183135986, "Pretrain/Loss (Raw)": 2.2505993843078613, "Pretrain/Step": 435, "Pretrain/Step Time": 8.562952116131783} +{"Pretrain/Learning Rate": 4.9967571937349034e-05, "Pretrain/Loss": 2.214682102203369, "Pretrain/Loss (Raw)": 2.2142112255096436, "Pretrain/Step": 436, "Pretrain/Step Time": 8.549723893404007} +{"Pretrain/Learning Rate": 4.996713821699761e-05, "Pretrain/Loss": 2.2163033485412598, "Pretrain/Loss (Raw)": 2.324176788330078, "Pretrain/Step": 437, "Pretrain/Step Time": 8.550075206905603} +{"Pretrain/Learning Rate": 4.9966701617318154e-05, "Pretrain/Loss": 2.217022180557251, "Pretrain/Loss (Raw)": 2.1693241596221924, "Pretrain/Step": 438, "Pretrain/Step Time": 8.546831611543894} +{"Pretrain/Learning Rate": 4.996626213836103e-05, "Pretrain/Loss": 2.2142786979675293, "Pretrain/Loss (Raw)": 2.1543469429016113, "Pretrain/Step": 439, "Pretrain/Step Time": 8.547152981162071} +{"Pretrain/Learning Rate": 4.99658197801769e-05, "Pretrain/Loss": 2.217635154724121, "Pretrain/Loss (Raw)": 2.4737064838409424, "Pretrain/Step": 440, "Pretrain/Step Time": 8.54357223585248} +{"Pretrain/Learning Rate": 4.99653745428168e-05, "Pretrain/Loss": 2.2175211906433105, "Pretrain/Loss (Raw)": 2.0184226036071777, "Pretrain/Step": 441, "Pretrain/Step Time": 8.553565254434943} +{"Pretrain/Learning Rate": 4.9964926426332056e-05, "Pretrain/Loss": 2.2167482376098633, "Pretrain/Loss (Raw)": 2.219377279281616, "Pretrain/Step": 442, "Pretrain/Step Time": 8.54523752629757} +{"Pretrain/Learning Rate": 4.9964475430774364e-05, "Pretrain/Loss": 2.2181553840637207, "Pretrain/Loss (Raw)": 2.2339401245117188, "Pretrain/Step": 443, "Pretrain/Step Time": 8.541650552302599} +{"Pretrain/Learning Rate": 4.996402155619573e-05, "Pretrain/Loss": 2.2188820838928223, "Pretrain/Loss (Raw)": 2.299093723297119, "Pretrain/Step": 444, "Pretrain/Step Time": 8.54092426598072} +{"Pretrain/Learning Rate": 4.9963564802648494e-05, "Pretrain/Loss": 2.217665433883667, "Pretrain/Loss (Raw)": 2.234008312225342, "Pretrain/Step": 445, "Pretrain/Step Time": 8.542962681502104} +{"Pretrain/Learning Rate": 4.9963105170185334e-05, "Pretrain/Loss": 2.2175631523132324, "Pretrain/Loss (Raw)": 2.2229018211364746, "Pretrain/Step": 446, "Pretrain/Step Time": 8.541346793994308} +{"Pretrain/Learning Rate": 4.9962642658859255e-05, "Pretrain/Loss": 2.2191238403320312, "Pretrain/Loss (Raw)": 2.3091180324554443, "Pretrain/Step": 447, "Pretrain/Step Time": 8.539147393777966} +{"Pretrain/Learning Rate": 4.99621772687236e-05, "Pretrain/Loss": 2.219487190246582, "Pretrain/Loss (Raw)": 2.2635393142700195, "Pretrain/Step": 448, "Pretrain/Step Time": 8.535898799076676} +{"Pretrain/Learning Rate": 4.996170899983203e-05, "Pretrain/Loss": 2.22027850151062, "Pretrain/Loss (Raw)": 2.2147130966186523, "Pretrain/Step": 449, "Pretrain/Step Time": 8.535175928846002} +{"Pretrain/Learning Rate": 4.9961237852238554e-05, "Pretrain/Loss": 2.2191686630249023, "Pretrain/Loss (Raw)": 2.1511895656585693, "Pretrain/Step": 450, "Pretrain/Step Time": 8.534992896020412} +{"Pretrain/Learning Rate": 4.996076382599752e-05, "Pretrain/Loss": 2.2206032276153564, "Pretrain/Loss (Raw)": 2.324294328689575, "Pretrain/Step": 451, "Pretrain/Step Time": 8.534670695662498} +{"Pretrain/Learning Rate": 4.996028692116357e-05, "Pretrain/Loss": 2.2214272022247314, "Pretrain/Loss (Raw)": 2.1609411239624023, "Pretrain/Step": 452, "Pretrain/Step Time": 8.535346433520317} +{"Pretrain/Learning Rate": 4.995980713779172e-05, "Pretrain/Loss": 2.2216527462005615, "Pretrain/Loss (Raw)": 2.129305601119995, "Pretrain/Step": 453, "Pretrain/Step Time": 8.538836907595396} +{"Pretrain/Learning Rate": 4.9959324475937297e-05, "Pretrain/Loss": 2.219520092010498, "Pretrain/Loss (Raw)": 2.070403575897217, "Pretrain/Step": 454, "Pretrain/Step Time": 8.530550604686141} +{"Pretrain/Learning Rate": 4.995883893565596e-05, "Pretrain/Loss": 2.2173209190368652, "Pretrain/Loss (Raw)": 1.9902056455612183, "Pretrain/Step": 455, "Pretrain/Step Time": 8.537947772070765} +{"Pretrain/Learning Rate": 4.995835051700371e-05, "Pretrain/Loss": 2.218029499053955, "Pretrain/Loss (Raw)": 2.286041736602783, "Pretrain/Step": 456, "Pretrain/Step Time": 8.53652336448431} +{"Pretrain/Learning Rate": 4.995785922003687e-05, "Pretrain/Loss": 2.218989610671997, "Pretrain/Loss (Raw)": 2.1980197429656982, "Pretrain/Step": 457, "Pretrain/Step Time": 8.537048321217299} +{"Pretrain/Learning Rate": 4.9957365044812097e-05, "Pretrain/Loss": 2.221590042114258, "Pretrain/Loss (Raw)": 2.294766426086426, "Pretrain/Step": 458, "Pretrain/Step Time": 8.539856085553765} +{"Pretrain/Learning Rate": 4.995686799138639e-05, "Pretrain/Loss": 2.2211499214172363, "Pretrain/Loss (Raw)": 2.129689931869507, "Pretrain/Step": 459, "Pretrain/Step Time": 8.535320408642292} +{"Pretrain/Learning Rate": 4.995636805981706e-05, "Pretrain/Loss": 2.217452049255371, "Pretrain/Loss (Raw)": 2.0694944858551025, "Pretrain/Step": 460, "Pretrain/Step Time": 8.529415123164654} +{"Pretrain/Learning Rate": 4.9955865250161774e-05, "Pretrain/Loss": 2.21763277053833, "Pretrain/Loss (Raw)": 2.295013904571533, "Pretrain/Step": 461, "Pretrain/Step Time": 8.528083926066756} +{"Pretrain/Learning Rate": 4.9955359562478504e-05, "Pretrain/Loss": 2.2181336879730225, "Pretrain/Loss (Raw)": 2.174532651901245, "Pretrain/Step": 462, "Pretrain/Step Time": 8.527868684381247} +{"Pretrain/Learning Rate": 4.995485099682558e-05, "Pretrain/Loss": 2.2192132472991943, "Pretrain/Loss (Raw)": 2.267444372177124, "Pretrain/Step": 463, "Pretrain/Step Time": 8.528886480256915} +{"Pretrain/Learning Rate": 4.995433955326165e-05, "Pretrain/Loss": 2.218733787536621, "Pretrain/Loss (Raw)": 2.2505555152893066, "Pretrain/Step": 464, "Pretrain/Step Time": 8.531027076765895} +{"Pretrain/Learning Rate": 4.995382523184569e-05, "Pretrain/Loss": 2.2169759273529053, "Pretrain/Loss (Raw)": 1.987028956413269, "Pretrain/Step": 465, "Pretrain/Step Time": 8.531738832592964} +{"Pretrain/Learning Rate": 4.9953308032637016e-05, "Pretrain/Loss": 2.2087035179138184, "Pretrain/Loss (Raw)": 1.9871599674224854, "Pretrain/Step": 466, "Pretrain/Step Time": 8.52506573498249} +{"Pretrain/Learning Rate": 4.995278795569528e-05, "Pretrain/Loss": 2.20688533782959, "Pretrain/Loss (Raw)": 1.8072174787521362, "Pretrain/Step": 467, "Pretrain/Step Time": 8.525964949280024} +{"Pretrain/Learning Rate": 4.995226500108046e-05, "Pretrain/Loss": 2.206460475921631, "Pretrain/Loss (Raw)": 2.0703437328338623, "Pretrain/Step": 468, "Pretrain/Step Time": 8.521345505490899} +{"Pretrain/Learning Rate": 4.995173916885285e-05, "Pretrain/Loss": 2.206496477127075, "Pretrain/Loss (Raw)": 2.1832995414733887, "Pretrain/Step": 469, "Pretrain/Step Time": 8.522034127265215} +{"Pretrain/Learning Rate": 4.9951210459073105e-05, "Pretrain/Loss": 2.2064502239227295, "Pretrain/Loss (Raw)": 2.2126269340515137, "Pretrain/Step": 470, "Pretrain/Step Time": 8.5232925247401} +{"Pretrain/Learning Rate": 4.99506788718022e-05, "Pretrain/Loss": 2.208474636077881, "Pretrain/Loss (Raw)": 2.308046579360962, "Pretrain/Step": 471, "Pretrain/Step Time": 8.530737360939384} +{"Pretrain/Learning Rate": 4.995014440710144e-05, "Pretrain/Loss": 2.209437847137451, "Pretrain/Loss (Raw)": 2.3396737575531006, "Pretrain/Step": 472, "Pretrain/Step Time": 8.519672844558954} +{"Pretrain/Learning Rate": 4.9949607065032445e-05, "Pretrain/Loss": 2.209897041320801, "Pretrain/Loss (Raw)": 2.3394463062286377, "Pretrain/Step": 473, "Pretrain/Step Time": 8.520976545289159} +{"Pretrain/Learning Rate": 4.99490668456572e-05, "Pretrain/Loss": 2.208176612854004, "Pretrain/Loss (Raw)": 2.18900990486145, "Pretrain/Step": 474, "Pretrain/Step Time": 8.52015220746398} +{"Pretrain/Learning Rate": 4.994852374903801e-05, "Pretrain/Loss": 2.2095937728881836, "Pretrain/Loss (Raw)": 2.29325008392334, "Pretrain/Step": 475, "Pretrain/Step Time": 8.52206864207983} +{"Pretrain/Learning Rate": 4.99479777752375e-05, "Pretrain/Loss": 2.2100977897644043, "Pretrain/Loss (Raw)": 2.2629222869873047, "Pretrain/Step": 476, "Pretrain/Step Time": 8.525242311879992} +{"Pretrain/Learning Rate": 4.994742892431863e-05, "Pretrain/Loss": 2.2083513736724854, "Pretrain/Loss (Raw)": 1.9973390102386475, "Pretrain/Step": 477, "Pretrain/Step Time": 8.517892064526677} +{"Pretrain/Learning Rate": 4.99468771963447e-05, "Pretrain/Loss": 2.2063326835632324, "Pretrain/Loss (Raw)": 1.9477171897888184, "Pretrain/Step": 478, "Pretrain/Step Time": 8.524868765845895} +{"Pretrain/Learning Rate": 4.994632259137935e-05, "Pretrain/Loss": 2.206341028213501, "Pretrain/Loss (Raw)": 2.1213996410369873, "Pretrain/Step": 479, "Pretrain/Step Time": 8.518276445567608} +{"Pretrain/Learning Rate": 4.9945765109486506e-05, "Pretrain/Loss": 2.2078588008880615, "Pretrain/Loss (Raw)": 2.150789260864258, "Pretrain/Step": 480, "Pretrain/Step Time": 8.524613356217742} +{"Pretrain/Learning Rate": 4.99452047507305e-05, "Pretrain/Loss": 2.2072558403015137, "Pretrain/Loss (Raw)": 2.159580945968628, "Pretrain/Step": 481, "Pretrain/Step Time": 8.525082005187869} +{"Pretrain/Learning Rate": 4.994464151517593e-05, "Pretrain/Loss": 2.2079648971557617, "Pretrain/Loss (Raw)": 2.2168877124786377, "Pretrain/Step": 482, "Pretrain/Step Time": 8.52106112614274} +{"Pretrain/Learning Rate": 4.994407540288775e-05, "Pretrain/Loss": 2.2067394256591797, "Pretrain/Loss (Raw)": 2.221895694732666, "Pretrain/Step": 483, "Pretrain/Step Time": 8.52721494436264} +{"Pretrain/Learning Rate": 4.994350641393126e-05, "Pretrain/Loss": 2.2063159942626953, "Pretrain/Loss (Raw)": 2.2153635025024414, "Pretrain/Step": 484, "Pretrain/Step Time": 8.521557081490755} +{"Pretrain/Learning Rate": 4.9942934548372077e-05, "Pretrain/Loss": 2.2080588340759277, "Pretrain/Loss (Raw)": 2.3627936840057373, "Pretrain/Step": 485, "Pretrain/Step Time": 8.520851923152804} +{"Pretrain/Learning Rate": 4.994235980627614e-05, "Pretrain/Loss": 2.2066807746887207, "Pretrain/Loss (Raw)": 2.2143921852111816, "Pretrain/Step": 486, "Pretrain/Step Time": 8.523613721132278} +{"Pretrain/Learning Rate": 4.9941782187709746e-05, "Pretrain/Loss": 2.2092623710632324, "Pretrain/Loss (Raw)": 2.39001202583313, "Pretrain/Step": 487, "Pretrain/Step Time": 8.52443435229361} +{"Pretrain/Learning Rate": 4.994120169273949e-05, "Pretrain/Loss": 2.211229085922241, "Pretrain/Loss (Raw)": 2.4041361808776855, "Pretrain/Step": 488, "Pretrain/Step Time": 8.525583244860172} +{"Pretrain/Learning Rate": 4.9940618321432344e-05, "Pretrain/Loss": 2.211960792541504, "Pretrain/Loss (Raw)": 2.1135756969451904, "Pretrain/Step": 489, "Pretrain/Step Time": 8.524725636467338} +{"Pretrain/Learning Rate": 4.994003207385556e-05, "Pretrain/Loss": 2.210439682006836, "Pretrain/Loss (Raw)": 2.118868350982666, "Pretrain/Step": 490, "Pretrain/Step Time": 8.522180380299687} +{"Pretrain/Learning Rate": 4.9939442950076755e-05, "Pretrain/Loss": 2.2116708755493164, "Pretrain/Loss (Raw)": 2.3630964756011963, "Pretrain/Step": 491, "Pretrain/Step Time": 8.52113083191216} +{"Pretrain/Learning Rate": 4.9938850950163864e-05, "Pretrain/Loss": 2.210972547531128, "Pretrain/Loss (Raw)": 2.271390914916992, "Pretrain/Step": 492, "Pretrain/Step Time": 8.519584504887462} +{"Pretrain/Learning Rate": 4.9938256074185174e-05, "Pretrain/Loss": 2.2106456756591797, "Pretrain/Loss (Raw)": 2.0786752700805664, "Pretrain/Step": 493, "Pretrain/Step Time": 8.521538104861975} +{"Pretrain/Learning Rate": 4.993765832220928e-05, "Pretrain/Loss": 2.215421199798584, "Pretrain/Loss (Raw)": 2.4640963077545166, "Pretrain/Step": 494, "Pretrain/Step Time": 8.521574409678578} +{"Pretrain/Learning Rate": 4.993705769430511e-05, "Pretrain/Loss": 2.2146363258361816, "Pretrain/Loss (Raw)": 2.181300401687622, "Pretrain/Step": 495, "Pretrain/Step Time": 8.52310680784285} +{"Pretrain/Learning Rate": 4.9936454190541945e-05, "Pretrain/Loss": 2.2150070667266846, "Pretrain/Loss (Raw)": 2.5857818126678467, "Pretrain/Step": 496, "Pretrain/Step Time": 8.517679832875729} +{"Pretrain/Learning Rate": 4.993584781098939e-05, "Pretrain/Loss": 2.2167797088623047, "Pretrain/Loss (Raw)": 2.449340343475342, "Pretrain/Step": 497, "Pretrain/Step Time": 8.524482410401106} +{"Pretrain/Learning Rate": 4.993523855571735e-05, "Pretrain/Loss": 2.218625783920288, "Pretrain/Loss (Raw)": 2.229382038116455, "Pretrain/Step": 498, "Pretrain/Step Time": 8.521096240729094} +{"Pretrain/Learning Rate": 4.99346264247961e-05, "Pretrain/Loss": 2.2155704498291016, "Pretrain/Loss (Raw)": 2.1568408012390137, "Pretrain/Step": 499, "Pretrain/Step Time": 8.517515305429697} +{"Pretrain/Learning Rate": 4.993401141829625e-05, "Pretrain/Loss": 2.2141661643981934, "Pretrain/Loss (Raw)": 2.0633440017700195, "Pretrain/Step": 500, "Pretrain/Step Time": 8.522229189053178} +{"Pretrain/Learning Rate": 4.99333935362887e-05, "Pretrain/Loss": 2.2150614261627197, "Pretrain/Loss (Raw)": 2.1576359272003174, "Pretrain/Step": 501, "Pretrain/Step Time": 8.520509315654635} +{"Pretrain/Learning Rate": 4.993277277884471e-05, "Pretrain/Loss": 2.2143406867980957, "Pretrain/Loss (Raw)": 2.0343263149261475, "Pretrain/Step": 502, "Pretrain/Step Time": 8.529302027076483} +{"Pretrain/Learning Rate": 4.993214914603588e-05, "Pretrain/Loss": 2.212543487548828, "Pretrain/Loss (Raw)": 2.159712314605713, "Pretrain/Step": 503, "Pretrain/Step Time": 8.536673178896308} +{"Pretrain/Learning Rate": 4.993152263793414e-05, "Pretrain/Loss": 2.2110977172851562, "Pretrain/Loss (Raw)": 2.058743953704834, "Pretrain/Step": 504, "Pretrain/Step Time": 8.531448068097234} +{"Pretrain/Learning Rate": 4.993089325461171e-05, "Pretrain/Loss": 2.211998462677002, "Pretrain/Loss (Raw)": 2.3438892364501953, "Pretrain/Step": 505, "Pretrain/Step Time": 8.532582476735115} +{"Pretrain/Learning Rate": 4.99302609961412e-05, "Pretrain/Loss": 2.210512638092041, "Pretrain/Loss (Raw)": 2.04575252532959, "Pretrain/Step": 506, "Pretrain/Step Time": 8.524387277662754} +{"Pretrain/Learning Rate": 4.9929625862595516e-05, "Pretrain/Loss": 2.2087669372558594, "Pretrain/Loss (Raw)": 2.1809937953948975, "Pretrain/Step": 507, "Pretrain/Step Time": 8.535802016034722} +{"Pretrain/Learning Rate": 4.9928987854047905e-05, "Pretrain/Loss": 2.208527088165283, "Pretrain/Loss (Raw)": 2.1139419078826904, "Pretrain/Step": 508, "Pretrain/Step Time": 8.525659941136837} +{"Pretrain/Learning Rate": 4.992834697057195e-05, "Pretrain/Loss": 2.2085771560668945, "Pretrain/Loss (Raw)": 2.2365148067474365, "Pretrain/Step": 509, "Pretrain/Step Time": 8.528461676090956} +{"Pretrain/Learning Rate": 4.992770321224155e-05, "Pretrain/Loss": 2.2092602252960205, "Pretrain/Loss (Raw)": 2.1577165126800537, "Pretrain/Step": 510, "Pretrain/Step Time": 8.528959540650249} +{"Pretrain/Learning Rate": 4.992705657913095e-05, "Pretrain/Loss": 2.2079262733459473, "Pretrain/Loss (Raw)": 2.233935832977295, "Pretrain/Step": 511, "Pretrain/Step Time": 8.52750494889915} +{"Pretrain/Learning Rate": 4.9926407071314736e-05, "Pretrain/Loss": 2.2098867893218994, "Pretrain/Loss (Raw)": 2.340866804122925, "Pretrain/Step": 512, "Pretrain/Step Time": 8.527309628203511} +{"Pretrain/Learning Rate": 4.9925754688867796e-05, "Pretrain/Loss": 2.2116198539733887, "Pretrain/Loss (Raw)": 2.344973087310791, "Pretrain/Step": 513, "Pretrain/Step Time": 8.538243548944592} +{"Pretrain/Learning Rate": 4.992509943186537e-05, "Pretrain/Loss": 2.2119996547698975, "Pretrain/Loss (Raw)": 2.376478672027588, "Pretrain/Step": 514, "Pretrain/Step Time": 8.53844521008432} +{"Pretrain/Learning Rate": 4.992444130038302e-05, "Pretrain/Loss": 2.2136597633361816, "Pretrain/Loss (Raw)": 2.120129108428955, "Pretrain/Step": 515, "Pretrain/Step Time": 8.53420321457088} +{"Pretrain/Learning Rate": 4.992378029449666e-05, "Pretrain/Loss": 2.2146944999694824, "Pretrain/Loss (Raw)": 2.197798013687134, "Pretrain/Step": 516, "Pretrain/Step Time": 8.533737305551767} +{"Pretrain/Learning Rate": 4.9923116414282514e-05, "Pretrain/Loss": 2.2170841693878174, "Pretrain/Loss (Raw)": 2.1651675701141357, "Pretrain/Step": 517, "Pretrain/Step Time": 8.531735729426146} +{"Pretrain/Learning Rate": 4.992244965981714e-05, "Pretrain/Loss": 2.216845989227295, "Pretrain/Loss (Raw)": 2.145685911178589, "Pretrain/Step": 518, "Pretrain/Step Time": 8.534455742686987} +{"Pretrain/Learning Rate": 4.9921780031177425e-05, "Pretrain/Loss": 2.215930461883545, "Pretrain/Loss (Raw)": 2.1420035362243652, "Pretrain/Step": 519, "Pretrain/Step Time": 8.540940828621387} +{"Pretrain/Learning Rate": 4.992110752844061e-05, "Pretrain/Loss": 2.216568946838379, "Pretrain/Loss (Raw)": 2.3104407787323, "Pretrain/Step": 520, "Pretrain/Step Time": 8.53923417814076} +{"Pretrain/Learning Rate": 4.992043215168424e-05, "Pretrain/Loss": 2.217207908630371, "Pretrain/Loss (Raw)": 2.2312209606170654, "Pretrain/Step": 521, "Pretrain/Step Time": 8.544816000387073} +{"Pretrain/Learning Rate": 4.99197539009862e-05, "Pretrain/Loss": 2.2175326347351074, "Pretrain/Loss (Raw)": 2.3765416145324707, "Pretrain/Step": 522, "Pretrain/Step Time": 8.54253431968391} +{"Pretrain/Learning Rate": 4.9919072776424726e-05, "Pretrain/Loss": 2.2160511016845703, "Pretrain/Loss (Raw)": 2.0193305015563965, "Pretrain/Step": 523, "Pretrain/Step Time": 8.540565295144916} +{"Pretrain/Learning Rate": 4.9918388778078347e-05, "Pretrain/Loss": 2.2155838012695312, "Pretrain/Loss (Raw)": 2.1241462230682373, "Pretrain/Step": 524, "Pretrain/Step Time": 8.537034878507257} +{"Pretrain/Learning Rate": 4.991770190602596e-05, "Pretrain/Loss": 2.215768814086914, "Pretrain/Loss (Raw)": 2.123904228210449, "Pretrain/Step": 525, "Pretrain/Step Time": 8.544653501361609} +{"Pretrain/Learning Rate": 4.991701216034677e-05, "Pretrain/Loss": 2.2132768630981445, "Pretrain/Loss (Raw)": 1.910622477531433, "Pretrain/Step": 526, "Pretrain/Step Time": 8.536180660128593} +{"Pretrain/Learning Rate": 4.9916319541120324e-05, "Pretrain/Loss": 2.213980197906494, "Pretrain/Loss (Raw)": 2.233546733856201, "Pretrain/Step": 527, "Pretrain/Step Time": 8.535373028367758} +{"Pretrain/Learning Rate": 4.99156240484265e-05, "Pretrain/Loss": 2.21213960647583, "Pretrain/Loss (Raw)": 2.1335277557373047, "Pretrain/Step": 528, "Pretrain/Step Time": 8.533282415941358} +{"Pretrain/Learning Rate": 4.9914925682345504e-05, "Pretrain/Loss": 2.2124528884887695, "Pretrain/Loss (Raw)": 2.133439064025879, "Pretrain/Step": 529, "Pretrain/Step Time": 8.533510053530335} +{"Pretrain/Learning Rate": 4.991422444295788e-05, "Pretrain/Loss": 2.213465690612793, "Pretrain/Loss (Raw)": 2.249932050704956, "Pretrain/Step": 530, "Pretrain/Step Time": 8.531379932537675} +{"Pretrain/Learning Rate": 4.9913520330344486e-05, "Pretrain/Loss": 2.2153353691101074, "Pretrain/Loss (Raw)": 2.2873318195343018, "Pretrain/Step": 531, "Pretrain/Step Time": 8.54009347781539} +{"Pretrain/Learning Rate": 4.991281334458654e-05, "Pretrain/Loss": 2.2169981002807617, "Pretrain/Loss (Raw)": 2.4488840103149414, "Pretrain/Step": 532, "Pretrain/Step Time": 8.543418638408184} +{"Pretrain/Learning Rate": 4.991210348576556e-05, "Pretrain/Loss": 2.2172765731811523, "Pretrain/Loss (Raw)": 2.3468029499053955, "Pretrain/Step": 533, "Pretrain/Step Time": 8.533464454114437} +{"Pretrain/Learning Rate": 4.991139075396342e-05, "Pretrain/Loss": 2.216506004333496, "Pretrain/Loss (Raw)": 2.264394521713257, "Pretrain/Step": 534, "Pretrain/Step Time": 8.537468826398253} +{"Pretrain/Learning Rate": 4.991067514926231e-05, "Pretrain/Loss": 2.2142651081085205, "Pretrain/Loss (Raw)": 1.9773210287094116, "Pretrain/Step": 535, "Pretrain/Step Time": 8.530530957505107} +{"Pretrain/Learning Rate": 4.990995667174476e-05, "Pretrain/Loss": 2.215157985687256, "Pretrain/Loss (Raw)": 2.388864517211914, "Pretrain/Step": 536, "Pretrain/Step Time": 8.531472876667976} +{"Pretrain/Learning Rate": 4.990923532149362e-05, "Pretrain/Loss": 2.216066360473633, "Pretrain/Loss (Raw)": 2.2943806648254395, "Pretrain/Step": 537, "Pretrain/Step Time": 8.537580106407404} +{"Pretrain/Learning Rate": 4.990851109859209e-05, "Pretrain/Loss": 2.215139389038086, "Pretrain/Loss (Raw)": 2.1116511821746826, "Pretrain/Step": 538, "Pretrain/Step Time": 8.544503906741738} +{"Pretrain/Learning Rate": 4.9907784003123695e-05, "Pretrain/Loss": 2.215163230895996, "Pretrain/Loss (Raw)": 2.3630568981170654, "Pretrain/Step": 539, "Pretrain/Step Time": 8.533916860818863} +{"Pretrain/Learning Rate": 4.9907054035172273e-05, "Pretrain/Loss": 2.2160091400146484, "Pretrain/Loss (Raw)": 2.225996732711792, "Pretrain/Step": 540, "Pretrain/Step Time": 8.535197295248508} +{"Pretrain/Learning Rate": 4.9906321194822014e-05, "Pretrain/Loss": 2.2136967182159424, "Pretrain/Loss (Raw)": 2.0336976051330566, "Pretrain/Step": 541, "Pretrain/Step Time": 8.532678691670299} +{"Pretrain/Learning Rate": 4.9905585482157436e-05, "Pretrain/Loss": 2.2131564617156982, "Pretrain/Loss (Raw)": 2.2898013591766357, "Pretrain/Step": 542, "Pretrain/Step Time": 8.543655099347234} +{"Pretrain/Learning Rate": 4.990484689726338e-05, "Pretrain/Loss": 2.2143588066101074, "Pretrain/Loss (Raw)": 2.3866209983825684, "Pretrain/Step": 543, "Pretrain/Step Time": 8.54301598481834} +{"Pretrain/Learning Rate": 4.990410544022502e-05, "Pretrain/Loss": 2.2131552696228027, "Pretrain/Loss (Raw)": 2.241224527359009, "Pretrain/Step": 544, "Pretrain/Step Time": 8.544156566262245} +{"Pretrain/Learning Rate": 4.9903361111127864e-05, "Pretrain/Loss": 2.2152843475341797, "Pretrain/Loss (Raw)": 2.4780995845794678, "Pretrain/Step": 545, "Pretrain/Step Time": 8.539232648909092} +{"Pretrain/Learning Rate": 4.990261391005777e-05, "Pretrain/Loss": 2.215736150741577, "Pretrain/Loss (Raw)": 2.323878288269043, "Pretrain/Step": 546, "Pretrain/Step Time": 8.539590746164322} +{"Pretrain/Learning Rate": 4.9901863837100886e-05, "Pretrain/Loss": 2.2147889137268066, "Pretrain/Loss (Raw)": 2.1679277420043945, "Pretrain/Step": 547, "Pretrain/Step Time": 8.539609860628843} +{"Pretrain/Learning Rate": 4.9901110892343724e-05, "Pretrain/Loss": 2.2143759727478027, "Pretrain/Loss (Raw)": 2.298469066619873, "Pretrain/Step": 548, "Pretrain/Step Time": 8.535662401467562} +{"Pretrain/Learning Rate": 4.9900355075873116e-05, "Pretrain/Loss": 2.214522361755371, "Pretrain/Loss (Raw)": 2.1982903480529785, "Pretrain/Step": 549, "Pretrain/Step Time": 8.542766243219376} +{"Pretrain/Learning Rate": 4.989959638777623e-05, "Pretrain/Loss": 2.2141923904418945, "Pretrain/Loss (Raw)": 2.274085521697998, "Pretrain/Step": 550, "Pretrain/Step Time": 8.541336154565215} +{"Pretrain/Learning Rate": 4.989883482814056e-05, "Pretrain/Loss": 2.2144579887390137, "Pretrain/Loss (Raw)": 2.1325700283050537, "Pretrain/Step": 551, "Pretrain/Step Time": 8.531096069142222} +{"Pretrain/Learning Rate": 4.989807039705392e-05, "Pretrain/Loss": 2.2160415649414062, "Pretrain/Loss (Raw)": 2.364058017730713, "Pretrain/Step": 552, "Pretrain/Step Time": 8.53283242508769} +{"Pretrain/Learning Rate": 4.989730309460449e-05, "Pretrain/Loss": 2.216165542602539, "Pretrain/Loss (Raw)": 2.265105724334717, "Pretrain/Step": 553, "Pretrain/Step Time": 8.535154968500137} +{"Pretrain/Learning Rate": 4.989653292088074e-05, "Pretrain/Loss": 2.2150707244873047, "Pretrain/Loss (Raw)": 2.199031352996826, "Pretrain/Step": 554, "Pretrain/Step Time": 8.537024231627584} +{"Pretrain/Learning Rate": 4.9895759875971495e-05, "Pretrain/Loss": 2.2139248847961426, "Pretrain/Loss (Raw)": 2.0641400814056396, "Pretrain/Step": 555, "Pretrain/Step Time": 8.532072685658932} +{"Pretrain/Learning Rate": 4.9894983959965915e-05, "Pretrain/Loss": 2.2154862880706787, "Pretrain/Loss (Raw)": 2.502047061920166, "Pretrain/Step": 556, "Pretrain/Step Time": 8.533873220905662} +{"Pretrain/Learning Rate": 4.989420517295347e-05, "Pretrain/Loss": 2.2152509689331055, "Pretrain/Loss (Raw)": 2.164407253265381, "Pretrain/Step": 557, "Pretrain/Step Time": 8.517890777438879} +{"Pretrain/Learning Rate": 4.9893423515023986e-05, "Pretrain/Loss": 2.217043161392212, "Pretrain/Loss (Raw)": 2.6757497787475586, "Pretrain/Step": 558, "Pretrain/Step Time": 8.523160520941019} +{"Pretrain/Learning Rate": 4.9892638986267594e-05, "Pretrain/Loss": 2.2170348167419434, "Pretrain/Loss (Raw)": 2.1329963207244873, "Pretrain/Step": 559, "Pretrain/Step Time": 8.519581787288189} +{"Pretrain/Learning Rate": 4.989185158677478e-05, "Pretrain/Loss": 2.21762752532959, "Pretrain/Loss (Raw)": 2.1806094646453857, "Pretrain/Step": 560, "Pretrain/Step Time": 8.52682340145111} +{"Pretrain/Learning Rate": 4.9891061316636346e-05, "Pretrain/Loss": 2.214205265045166, "Pretrain/Loss (Raw)": 1.8524242639541626, "Pretrain/Step": 561, "Pretrain/Step Time": 8.52816403657198} +{"Pretrain/Learning Rate": 4.9890268175943425e-05, "Pretrain/Loss": 2.2130563259124756, "Pretrain/Loss (Raw)": 2.082963466644287, "Pretrain/Step": 562, "Pretrain/Step Time": 8.529756478965282} +{"Pretrain/Learning Rate": 4.9889472164787496e-05, "Pretrain/Loss": 2.212317705154419, "Pretrain/Loss (Raw)": 2.1560778617858887, "Pretrain/Step": 563, "Pretrain/Step Time": 8.524774603545666} +{"Pretrain/Learning Rate": 4.9888673283260355e-05, "Pretrain/Loss": 2.212646484375, "Pretrain/Loss (Raw)": 2.2562806606292725, "Pretrain/Step": 564, "Pretrain/Step Time": 8.526738008484244} +{"Pretrain/Learning Rate": 4.9887871531454134e-05, "Pretrain/Loss": 2.211209297180176, "Pretrain/Loss (Raw)": 2.140207529067993, "Pretrain/Step": 565, "Pretrain/Step Time": 8.533665239810944} +{"Pretrain/Learning Rate": 4.988706690946129e-05, "Pretrain/Loss": 2.2112560272216797, "Pretrain/Loss (Raw)": 2.1753127574920654, "Pretrain/Step": 566, "Pretrain/Step Time": 8.529130881652236} +{"Pretrain/Learning Rate": 4.9886259417374616e-05, "Pretrain/Loss": 2.2113726139068604, "Pretrain/Loss (Raw)": 2.169264554977417, "Pretrain/Step": 567, "Pretrain/Step Time": 8.527201876044273} +{"Pretrain/Learning Rate": 4.988544905528724e-05, "Pretrain/Loss": 2.208611488342285, "Pretrain/Loss (Raw)": 2.12030291557312, "Pretrain/Step": 568, "Pretrain/Step Time": 8.531948249787092} +{"Pretrain/Learning Rate": 4.9884635823292615e-05, "Pretrain/Loss": 2.21237850189209, "Pretrain/Loss (Raw)": 2.5005908012390137, "Pretrain/Step": 569, "Pretrain/Step Time": 8.523320201784372} +{"Pretrain/Learning Rate": 4.988381972148452e-05, "Pretrain/Loss": 2.212965488433838, "Pretrain/Loss (Raw)": 2.294522285461426, "Pretrain/Step": 570, "Pretrain/Step Time": 8.522581273689866} +{"Pretrain/Learning Rate": 4.9883000749957086e-05, "Pretrain/Loss": 2.2116951942443848, "Pretrain/Loss (Raw)": 2.0713162422180176, "Pretrain/Step": 571, "Pretrain/Step Time": 8.528320418670774} +{"Pretrain/Learning Rate": 4.988217890880475e-05, "Pretrain/Loss": 2.2112269401550293, "Pretrain/Loss (Raw)": 2.2391715049743652, "Pretrain/Step": 572, "Pretrain/Step Time": 8.522574728354812} +{"Pretrain/Learning Rate": 4.98813541981223e-05, "Pretrain/Loss": 2.2114248275756836, "Pretrain/Loss (Raw)": 2.2593436241149902, "Pretrain/Step": 573, "Pretrain/Step Time": 8.528314244002104} +{"Pretrain/Learning Rate": 4.988052661800483e-05, "Pretrain/Loss": 2.210129737854004, "Pretrain/Loss (Raw)": 2.0571141242980957, "Pretrain/Step": 574, "Pretrain/Step Time": 8.526981100440025} +{"Pretrain/Learning Rate": 4.98796961685478e-05, "Pretrain/Loss": 2.210019111633301, "Pretrain/Loss (Raw)": 2.294992208480835, "Pretrain/Step": 575, "Pretrain/Step Time": 8.529387641698122} +{"Pretrain/Learning Rate": 4.987886284984695e-05, "Pretrain/Loss": 2.209383487701416, "Pretrain/Loss (Raw)": 2.182163715362549, "Pretrain/Step": 576, "Pretrain/Step Time": 8.522482391446829} +{"Pretrain/Learning Rate": 4.987802666199842e-05, "Pretrain/Loss": 2.209120273590088, "Pretrain/Loss (Raw)": 2.181020736694336, "Pretrain/Step": 577, "Pretrain/Step Time": 8.525866162031889} +{"Pretrain/Learning Rate": 4.987718760509863e-05, "Pretrain/Loss": 2.2119197845458984, "Pretrain/Loss (Raw)": 2.5095343589782715, "Pretrain/Step": 578, "Pretrain/Step Time": 8.527792915701866} +{"Pretrain/Learning Rate": 4.987634567924433e-05, "Pretrain/Loss": 2.210783004760742, "Pretrain/Loss (Raw)": 2.178800344467163, "Pretrain/Step": 579, "Pretrain/Step Time": 8.526011964306235} +{"Pretrain/Learning Rate": 4.9875500884532634e-05, "Pretrain/Loss": 2.2104108333587646, "Pretrain/Loss (Raw)": 2.113266944885254, "Pretrain/Step": 580, "Pretrain/Step Time": 8.53309022076428} +{"Pretrain/Learning Rate": 4.987465322106095e-05, "Pretrain/Loss": 2.210676670074463, "Pretrain/Loss (Raw)": 2.163329601287842, "Pretrain/Step": 581, "Pretrain/Step Time": 8.528075775131583} +{"Pretrain/Learning Rate": 4.987380268892705e-05, "Pretrain/Loss": 2.211268424987793, "Pretrain/Loss (Raw)": 2.146162271499634, "Pretrain/Step": 582, "Pretrain/Step Time": 8.528158588334918} +{"Pretrain/Learning Rate": 4.987294928822901e-05, "Pretrain/Loss": 2.212496757507324, "Pretrain/Loss (Raw)": 2.1474225521087646, "Pretrain/Step": 583, "Pretrain/Step Time": 8.524248393252492} +{"Pretrain/Learning Rate": 4.9872093019065255e-05, "Pretrain/Loss": 2.2111432552337646, "Pretrain/Loss (Raw)": 2.112787961959839, "Pretrain/Step": 584, "Pretrain/Step Time": 8.531015563756227} +{"Pretrain/Learning Rate": 4.987123388153453e-05, "Pretrain/Loss": 2.212982654571533, "Pretrain/Loss (Raw)": 2.4334702491760254, "Pretrain/Step": 585, "Pretrain/Step Time": 8.531577518209815} +{"Pretrain/Learning Rate": 4.9870371875735916e-05, "Pretrain/Loss": 2.212027072906494, "Pretrain/Loss (Raw)": 2.1724631786346436, "Pretrain/Step": 586, "Pretrain/Step Time": 8.532319584861398} +{"Pretrain/Learning Rate": 4.986950700176882e-05, "Pretrain/Loss": 2.212820529937744, "Pretrain/Loss (Raw)": 2.2312514781951904, "Pretrain/Step": 587, "Pretrain/Step Time": 8.532813677564263} +{"Pretrain/Learning Rate": 4.9868639259732996e-05, "Pretrain/Loss": 2.2153701782226562, "Pretrain/Loss (Raw)": 2.395845413208008, "Pretrain/Step": 588, "Pretrain/Step Time": 8.529958130791783} +{"Pretrain/Learning Rate": 4.986776864972851e-05, "Pretrain/Loss": 2.213696002960205, "Pretrain/Loss (Raw)": 2.0807273387908936, "Pretrain/Step": 589, "Pretrain/Step Time": 8.53154563345015} +{"Pretrain/Learning Rate": 4.9866895171855756e-05, "Pretrain/Loss": 2.21382999420166, "Pretrain/Loss (Raw)": 2.191679000854492, "Pretrain/Step": 590, "Pretrain/Step Time": 8.527896312996745} +{"Pretrain/Learning Rate": 4.9866018826215475e-05, "Pretrain/Loss": 2.2142317295074463, "Pretrain/Loss (Raw)": 2.3188488483428955, "Pretrain/Step": 591, "Pretrain/Step Time": 8.536591513082385} +{"Pretrain/Learning Rate": 4.9865139612908736e-05, "Pretrain/Loss": 2.213604688644409, "Pretrain/Loss (Raw)": 2.170288562774658, "Pretrain/Step": 592, "Pretrain/Step Time": 8.531147431582212} +{"Pretrain/Learning Rate": 4.9864257532036924e-05, "Pretrain/Loss": 2.216137647628784, "Pretrain/Loss (Raw)": 2.3112709522247314, "Pretrain/Step": 593, "Pretrain/Step Time": 8.536747064441442} +{"Pretrain/Learning Rate": 4.9863372583701765e-05, "Pretrain/Loss": 2.219167947769165, "Pretrain/Loss (Raw)": 2.375037908554077, "Pretrain/Step": 594, "Pretrain/Step Time": 8.53516117669642} +{"Pretrain/Learning Rate": 4.9862484768005324e-05, "Pretrain/Loss": 2.221970558166504, "Pretrain/Loss (Raw)": 2.165937900543213, "Pretrain/Step": 595, "Pretrain/Step Time": 8.535072715952992} +{"Pretrain/Learning Rate": 4.986159408504999e-05, "Pretrain/Loss": 2.2231013774871826, "Pretrain/Loss (Raw)": 2.215083122253418, "Pretrain/Step": 596, "Pretrain/Step Time": 8.534744415432215} +{"Pretrain/Learning Rate": 4.986070053493846e-05, "Pretrain/Loss": 2.223289966583252, "Pretrain/Loss (Raw)": 2.2074742317199707, "Pretrain/Step": 597, "Pretrain/Step Time": 8.543624587357044} +{"Pretrain/Learning Rate": 4.985980411777381e-05, "Pretrain/Loss": 2.2228167057037354, "Pretrain/Loss (Raw)": 2.1520349979400635, "Pretrain/Step": 598, "Pretrain/Step Time": 8.54247311130166} +{"Pretrain/Learning Rate": 4.9858904833659404e-05, "Pretrain/Loss": 2.221669912338257, "Pretrain/Loss (Raw)": 2.161252737045288, "Pretrain/Step": 599, "Pretrain/Step Time": 8.537228500470519} +{"Pretrain/Learning Rate": 4.985800268269895e-05, "Pretrain/Loss": 2.2224433422088623, "Pretrain/Loss (Raw)": 2.438663959503174, "Pretrain/Step": 600, "Pretrain/Step Time": 8.543282618746161} +{"Pretrain/Learning Rate": 4.9857097664996486e-05, "Pretrain/Loss": 2.2210206985473633, "Pretrain/Loss (Raw)": 2.1573486328125, "Pretrain/Step": 601, "Pretrain/Step Time": 8.544228591024876} +{"Pretrain/Learning Rate": 4.98561897806564e-05, "Pretrain/Loss": 2.220841407775879, "Pretrain/Loss (Raw)": 2.1660664081573486, "Pretrain/Step": 602, "Pretrain/Step Time": 8.544387485831976} +{"Pretrain/Learning Rate": 4.985527902978337e-05, "Pretrain/Loss": 2.2209620475769043, "Pretrain/Loss (Raw)": 2.3086981773376465, "Pretrain/Step": 603, "Pretrain/Step Time": 8.550788134336472} +{"Pretrain/Learning Rate": 4.985436541248245e-05, "Pretrain/Loss": 2.22092866897583, "Pretrain/Loss (Raw)": 2.258629560470581, "Pretrain/Step": 604, "Pretrain/Step Time": 8.539976319298148} +{"Pretrain/Learning Rate": 4.985344892885899e-05, "Pretrain/Loss": 2.222684383392334, "Pretrain/Loss (Raw)": 2.2220852375030518, "Pretrain/Step": 605, "Pretrain/Step Time": 8.545565823093057} +{"Pretrain/Learning Rate": 4.985252957901869e-05, "Pretrain/Loss": 2.2241339683532715, "Pretrain/Loss (Raw)": 2.1332714557647705, "Pretrain/Step": 606, "Pretrain/Step Time": 8.541562864556909} +{"Pretrain/Learning Rate": 4.985160736306756e-05, "Pretrain/Loss": 2.2242274284362793, "Pretrain/Loss (Raw)": 2.133345603942871, "Pretrain/Step": 607, "Pretrain/Step Time": 8.545843115076423} +{"Pretrain/Learning Rate": 4.985068228111198e-05, "Pretrain/Loss": 2.2240703105926514, "Pretrain/Loss (Raw)": 2.1306796073913574, "Pretrain/Step": 608, "Pretrain/Step Time": 8.544682266190648} +{"Pretrain/Learning Rate": 4.984975433325861e-05, "Pretrain/Loss": 2.226146936416626, "Pretrain/Loss (Raw)": 2.425384283065796, "Pretrain/Step": 609, "Pretrain/Step Time": 8.557913156226277} +{"Pretrain/Learning Rate": 4.9848823519614475e-05, "Pretrain/Loss": 2.2250304222106934, "Pretrain/Loss (Raw)": 2.074000358581543, "Pretrain/Step": 610, "Pretrain/Step Time": 8.557016192004085} +{"Pretrain/Learning Rate": 4.9847889840286924e-05, "Pretrain/Loss": 2.22409725189209, "Pretrain/Loss (Raw)": 2.1024343967437744, "Pretrain/Step": 611, "Pretrain/Step Time": 8.55239905975759} +{"Pretrain/Learning Rate": 4.984695329538362e-05, "Pretrain/Loss": 2.2243757247924805, "Pretrain/Loss (Raw)": 2.251002311706543, "Pretrain/Step": 612, "Pretrain/Step Time": 8.552002618089318} +{"Pretrain/Learning Rate": 4.984601388501258e-05, "Pretrain/Loss": 2.2231106758117676, "Pretrain/Loss (Raw)": 2.2008724212646484, "Pretrain/Step": 613, "Pretrain/Step Time": 8.553935680538416} +{"Pretrain/Learning Rate": 4.9845071609282145e-05, "Pretrain/Loss": 2.2222137451171875, "Pretrain/Loss (Raw)": 2.09960675239563, "Pretrain/Step": 614, "Pretrain/Step Time": 8.547704249620438} +{"Pretrain/Learning Rate": 4.984412646830098e-05, "Pretrain/Loss": 2.2212142944335938, "Pretrain/Loss (Raw)": 2.262061834335327, "Pretrain/Step": 615, "Pretrain/Step Time": 8.555148812010884} +{"Pretrain/Learning Rate": 4.9843178462178084e-05, "Pretrain/Loss": 2.21766996383667, "Pretrain/Loss (Raw)": 1.950466513633728, "Pretrain/Step": 616, "Pretrain/Step Time": 8.554768953472376} +{"Pretrain/Learning Rate": 4.984222759102277e-05, "Pretrain/Loss": 2.2204620838165283, "Pretrain/Loss (Raw)": 2.4709603786468506, "Pretrain/Step": 617, "Pretrain/Step Time": 8.558255018666387} +{"Pretrain/Learning Rate": 4.984127385494472e-05, "Pretrain/Loss": 2.2214202880859375, "Pretrain/Loss (Raw)": 2.2415270805358887, "Pretrain/Step": 618, "Pretrain/Step Time": 8.551238434389234} +{"Pretrain/Learning Rate": 4.984031725405392e-05, "Pretrain/Loss": 2.2209768295288086, "Pretrain/Loss (Raw)": 2.30633282661438, "Pretrain/Step": 619, "Pretrain/Step Time": 8.555288627743721} +{"Pretrain/Learning Rate": 4.983935778846067e-05, "Pretrain/Loss": 2.2216217517852783, "Pretrain/Loss (Raw)": 2.353926420211792, "Pretrain/Step": 620, "Pretrain/Step Time": 8.558036800473928} +{"Pretrain/Learning Rate": 4.9838395458275636e-05, "Pretrain/Loss": 2.2232794761657715, "Pretrain/Loss (Raw)": 2.2908554077148438, "Pretrain/Step": 621, "Pretrain/Step Time": 8.560140885412693} +{"Pretrain/Learning Rate": 4.98374302636098e-05, "Pretrain/Loss": 2.221034049987793, "Pretrain/Loss (Raw)": 2.1767189502716064, "Pretrain/Step": 622, "Pretrain/Step Time": 8.56212285719812} +{"Pretrain/Learning Rate": 4.983646220457446e-05, "Pretrain/Loss": 2.222132921218872, "Pretrain/Loss (Raw)": 2.3219542503356934, "Pretrain/Step": 623, "Pretrain/Step Time": 8.563046673312783} +{"Pretrain/Learning Rate": 4.9835491281281274e-05, "Pretrain/Loss": 2.219604969024658, "Pretrain/Loss (Raw)": 2.2622039318084717, "Pretrain/Step": 624, "Pretrain/Step Time": 8.561220478266478} +{"Pretrain/Learning Rate": 4.9834517493842196e-05, "Pretrain/Loss": 2.2163922786712646, "Pretrain/Loss (Raw)": 2.038084030151367, "Pretrain/Step": 625, "Pretrain/Step Time": 8.557963088154793} +{"Pretrain/Learning Rate": 4.983354084236954e-05, "Pretrain/Loss": 2.2149810791015625, "Pretrain/Loss (Raw)": 2.0487687587738037, "Pretrain/Step": 626, "Pretrain/Step Time": 8.559114994481206} +{"Pretrain/Learning Rate": 4.983256132697594e-05, "Pretrain/Loss": 2.2150402069091797, "Pretrain/Loss (Raw)": 2.164397954940796, "Pretrain/Step": 627, "Pretrain/Step Time": 8.567602081224322} +{"Pretrain/Learning Rate": 4.983157894777435e-05, "Pretrain/Loss": 2.2167258262634277, "Pretrain/Loss (Raw)": 2.279130697250366, "Pretrain/Step": 628, "Pretrain/Step Time": 8.564881779253483} +{"Pretrain/Learning Rate": 4.983059370487806e-05, "Pretrain/Loss": 2.2161049842834473, "Pretrain/Loss (Raw)": 2.0781304836273193, "Pretrain/Step": 629, "Pretrain/Step Time": 8.56290645711124} +{"Pretrain/Learning Rate": 4.9829605598400705e-05, "Pretrain/Loss": 2.2184081077575684, "Pretrain/Loss (Raw)": 2.329155683517456, "Pretrain/Step": 630, "Pretrain/Step Time": 8.551133094355464} +{"Pretrain/Learning Rate": 4.982861462845623e-05, "Pretrain/Loss": 2.219759464263916, "Pretrain/Loss (Raw)": 2.3326704502105713, "Pretrain/Step": 631, "Pretrain/Step Time": 8.547242011874914} +{"Pretrain/Learning Rate": 4.982762079515892e-05, "Pretrain/Loss": 2.220036745071411, "Pretrain/Loss (Raw)": 2.094233989715576, "Pretrain/Step": 632, "Pretrain/Step Time": 8.547223512083292} +{"Pretrain/Learning Rate": 4.982662409862339e-05, "Pretrain/Loss": 2.219038963317871, "Pretrain/Loss (Raw)": 2.2161707878112793, "Pretrain/Step": 633, "Pretrain/Step Time": 8.553177049383521} +{"Pretrain/Learning Rate": 4.9825624538964576e-05, "Pretrain/Loss": 2.221315860748291, "Pretrain/Loss (Raw)": 2.33718204498291, "Pretrain/Step": 634, "Pretrain/Step Time": 8.555400701239705} +{"Pretrain/Learning Rate": 4.982462211629776e-05, "Pretrain/Loss": 2.2207093238830566, "Pretrain/Loss (Raw)": 2.1033682823181152, "Pretrain/Step": 635, "Pretrain/Step Time": 8.549003025516868} +{"Pretrain/Learning Rate": 4.9823616830738546e-05, "Pretrain/Loss": 2.2217955589294434, "Pretrain/Loss (Raw)": 2.2529642581939697, "Pretrain/Step": 636, "Pretrain/Step Time": 8.549404492601752} +{"Pretrain/Learning Rate": 4.9822608682402866e-05, "Pretrain/Loss": 2.221543312072754, "Pretrain/Loss (Raw)": 2.2042534351348877, "Pretrain/Step": 637, "Pretrain/Step Time": 8.550692679360509} +{"Pretrain/Learning Rate": 4.9821597671406984e-05, "Pretrain/Loss": 2.2210440635681152, "Pretrain/Loss (Raw)": 2.093787908554077, "Pretrain/Step": 638, "Pretrain/Step Time": 8.543073270469904} +{"Pretrain/Learning Rate": 4.982058379786749e-05, "Pretrain/Loss": 2.221621513366699, "Pretrain/Loss (Raw)": 2.3078725337982178, "Pretrain/Step": 639, "Pretrain/Step Time": 8.550253760069609} +{"Pretrain/Learning Rate": 4.9819567061901327e-05, "Pretrain/Loss": 2.2199759483337402, "Pretrain/Loss (Raw)": 2.1302382946014404, "Pretrain/Step": 640, "Pretrain/Step Time": 8.5545922704041} +{"Pretrain/Learning Rate": 4.981854746362573e-05, "Pretrain/Loss": 2.2204060554504395, "Pretrain/Loss (Raw)": 2.400017261505127, "Pretrain/Step": 641, "Pretrain/Step Time": 8.548395665362477} +{"Pretrain/Learning Rate": 4.981752500315829e-05, "Pretrain/Loss": 2.218492031097412, "Pretrain/Loss (Raw)": 2.1314914226531982, "Pretrain/Step": 642, "Pretrain/Step Time": 8.547506183385849} +{"Pretrain/Learning Rate": 4.981649968061692e-05, "Pretrain/Loss": 2.2242431640625, "Pretrain/Loss (Raw)": 2.856278896331787, "Pretrain/Step": 643, "Pretrain/Step Time": 8.544631144031882} +{"Pretrain/Learning Rate": 4.981547149611987e-05, "Pretrain/Loss": 2.222254753112793, "Pretrain/Loss (Raw)": 1.943253517150879, "Pretrain/Step": 644, "Pretrain/Step Time": 8.54270906932652} +{"Pretrain/Learning Rate": 4.9814440449785715e-05, "Pretrain/Loss": 2.2221341133117676, "Pretrain/Loss (Raw)": 2.1497762203216553, "Pretrain/Step": 645, "Pretrain/Step Time": 8.54839712753892} +{"Pretrain/Learning Rate": 4.9813406541733355e-05, "Pretrain/Loss": 2.2268588542938232, "Pretrain/Loss (Raw)": 2.750427007675171, "Pretrain/Step": 646, "Pretrain/Step Time": 8.54781354777515} +{"Pretrain/Learning Rate": 4.981236977208203e-05, "Pretrain/Loss": 2.2276196479797363, "Pretrain/Loss (Raw)": 2.23935604095459, "Pretrain/Step": 647, "Pretrain/Step Time": 8.539162877947092} +{"Pretrain/Learning Rate": 4.98113301409513e-05, "Pretrain/Loss": 2.226794481277466, "Pretrain/Loss (Raw)": 2.2048404216766357, "Pretrain/Step": 648, "Pretrain/Step Time": 8.541018756106496} +{"Pretrain/Learning Rate": 4.981028764846106e-05, "Pretrain/Loss": 2.2273638248443604, "Pretrain/Loss (Raw)": 2.304100751876831, "Pretrain/Step": 649, "Pretrain/Step Time": 8.53758774138987} +{"Pretrain/Learning Rate": 4.980924229473155e-05, "Pretrain/Loss": 2.2252135276794434, "Pretrain/Loss (Raw)": 2.101310968399048, "Pretrain/Step": 650, "Pretrain/Step Time": 8.53733766451478} +{"Pretrain/Learning Rate": 4.980819407988331e-05, "Pretrain/Loss": 2.2257862091064453, "Pretrain/Loss (Raw)": 2.0926127433776855, "Pretrain/Step": 651, "Pretrain/Step Time": 8.534115424379706} +{"Pretrain/Learning Rate": 4.980714300403723e-05, "Pretrain/Loss": 2.2275452613830566, "Pretrain/Loss (Raw)": 2.3492910861968994, "Pretrain/Step": 652, "Pretrain/Step Time": 8.536764344200492} +{"Pretrain/Learning Rate": 4.9806089067314515e-05, "Pretrain/Loss": 2.2273073196411133, "Pretrain/Loss (Raw)": 2.093501567840576, "Pretrain/Step": 653, "Pretrain/Step Time": 8.531626159325242} +{"Pretrain/Learning Rate": 4.980503226983673e-05, "Pretrain/Loss": 2.2293102741241455, "Pretrain/Loss (Raw)": 2.1669578552246094, "Pretrain/Step": 654, "Pretrain/Step Time": 8.53454278409481} +{"Pretrain/Learning Rate": 4.980397261172573e-05, "Pretrain/Loss": 2.228299379348755, "Pretrain/Loss (Raw)": 2.104174852371216, "Pretrain/Step": 655, "Pretrain/Step Time": 8.538061937317252} +{"Pretrain/Learning Rate": 4.9802910093103725e-05, "Pretrain/Loss": 2.22873592376709, "Pretrain/Loss (Raw)": 2.189387559890747, "Pretrain/Step": 656, "Pretrain/Step Time": 8.535089695826173} +{"Pretrain/Learning Rate": 4.980184471409326e-05, "Pretrain/Loss": 2.2286555767059326, "Pretrain/Loss (Raw)": 2.1231625080108643, "Pretrain/Step": 657, "Pretrain/Step Time": 8.541845258325338} +{"Pretrain/Learning Rate": 4.980077647481719e-05, "Pretrain/Loss": 2.2300963401794434, "Pretrain/Loss (Raw)": 2.4343421459198, "Pretrain/Step": 658, "Pretrain/Step Time": 8.543080933392048} +{"Pretrain/Learning Rate": 4.979970537539871e-05, "Pretrain/Loss": 2.229835271835327, "Pretrain/Loss (Raw)": 2.253913164138794, "Pretrain/Step": 659, "Pretrain/Step Time": 8.531719284132123} +{"Pretrain/Learning Rate": 4.979863141596135e-05, "Pretrain/Loss": 2.2288949489593506, "Pretrain/Loss (Raw)": 2.328517198562622, "Pretrain/Step": 660, "Pretrain/Step Time": 8.533037446439266} +{"Pretrain/Learning Rate": 4.979755459662896e-05, "Pretrain/Loss": 2.2290542125701904, "Pretrain/Loss (Raw)": 2.3672125339508057, "Pretrain/Step": 661, "Pretrain/Step Time": 8.534550508484244} +{"Pretrain/Learning Rate": 4.979647491752572e-05, "Pretrain/Loss": 2.227121591567993, "Pretrain/Loss (Raw)": 2.0170109272003174, "Pretrain/Step": 662, "Pretrain/Step Time": 8.53557350113988} +{"Pretrain/Learning Rate": 4.979539237877615e-05, "Pretrain/Loss": 2.2284884452819824, "Pretrain/Loss (Raw)": 2.1522879600524902, "Pretrain/Step": 663, "Pretrain/Step Time": 8.5348115041852} +{"Pretrain/Learning Rate": 4.979430698050509e-05, "Pretrain/Loss": 2.228005886077881, "Pretrain/Loss (Raw)": 2.3271095752716064, "Pretrain/Step": 664, "Pretrain/Step Time": 8.53914999589324} +{"Pretrain/Learning Rate": 4.979321872283772e-05, "Pretrain/Loss": 2.228196620941162, "Pretrain/Loss (Raw)": 2.3187625408172607, "Pretrain/Step": 665, "Pretrain/Step Time": 8.534460302442312} +{"Pretrain/Learning Rate": 4.979212760589953e-05, "Pretrain/Loss": 2.2291359901428223, "Pretrain/Loss (Raw)": 2.231904983520508, "Pretrain/Step": 666, "Pretrain/Step Time": 8.531230622902513} +{"Pretrain/Learning Rate": 4.9791033629816364e-05, "Pretrain/Loss": 2.227492332458496, "Pretrain/Loss (Raw)": 2.15263295173645, "Pretrain/Step": 667, "Pretrain/Step Time": 8.52963718213141} +{"Pretrain/Learning Rate": 4.978993679471438e-05, "Pretrain/Loss": 2.2262916564941406, "Pretrain/Loss (Raw)": 2.0723414421081543, "Pretrain/Step": 668, "Pretrain/Step Time": 8.530107505619526} +{"Pretrain/Learning Rate": 4.978883710072008e-05, "Pretrain/Loss": 2.226349353790283, "Pretrain/Loss (Raw)": 2.041074752807617, "Pretrain/Step": 669, "Pretrain/Step Time": 8.538535438477993} +{"Pretrain/Learning Rate": 4.978773454796026e-05, "Pretrain/Loss": 2.225933790206909, "Pretrain/Loss (Raw)": 2.236618995666504, "Pretrain/Step": 670, "Pretrain/Step Time": 8.525557238608599} +{"Pretrain/Learning Rate": 4.9786629136562095e-05, "Pretrain/Loss": 2.2239363193511963, "Pretrain/Loss (Raw)": 2.130955457687378, "Pretrain/Step": 671, "Pretrain/Step Time": 8.524854121729732} +{"Pretrain/Learning Rate": 4.978552086665306e-05, "Pretrain/Loss": 2.224642276763916, "Pretrain/Loss (Raw)": 2.3315865993499756, "Pretrain/Step": 672, "Pretrain/Step Time": 8.5268296264112} +{"Pretrain/Learning Rate": 4.9784409738360973e-05, "Pretrain/Loss": 2.2227935791015625, "Pretrain/Loss (Raw)": 2.2414679527282715, "Pretrain/Step": 673, "Pretrain/Step Time": 8.523607347160578} +{"Pretrain/Learning Rate": 4.978329575181395e-05, "Pretrain/Loss": 2.2216479778289795, "Pretrain/Loss (Raw)": 2.1772191524505615, "Pretrain/Step": 674, "Pretrain/Step Time": 8.520382398739457} +{"Pretrain/Learning Rate": 4.978217890714049e-05, "Pretrain/Loss": 2.2242398262023926, "Pretrain/Loss (Raw)": 2.499671459197998, "Pretrain/Step": 675, "Pretrain/Step Time": 8.526525946334004} +{"Pretrain/Learning Rate": 4.978105920446938e-05, "Pretrain/Loss": 2.222165584564209, "Pretrain/Loss (Raw)": 2.0329582691192627, "Pretrain/Step": 676, "Pretrain/Step Time": 8.53414792381227} +{"Pretrain/Learning Rate": 4.977993664392975e-05, "Pretrain/Loss": 2.220808267593384, "Pretrain/Loss (Raw)": 2.024588108062744, "Pretrain/Step": 677, "Pretrain/Step Time": 8.530181150883436} +{"Pretrain/Learning Rate": 4.9778811225651056e-05, "Pretrain/Loss": 2.2194674015045166, "Pretrain/Loss (Raw)": 2.102449893951416, "Pretrain/Step": 678, "Pretrain/Step Time": 8.532620809972286} +{"Pretrain/Learning Rate": 4.9777682949763096e-05, "Pretrain/Loss": 2.2214088439941406, "Pretrain/Loss (Raw)": 2.381089210510254, "Pretrain/Step": 679, "Pretrain/Step Time": 8.531092919409275} +{"Pretrain/Learning Rate": 4.9776551816395975e-05, "Pretrain/Loss": 2.219444513320923, "Pretrain/Loss (Raw)": 2.1126179695129395, "Pretrain/Step": 680, "Pretrain/Step Time": 8.530757939442992} +{"Pretrain/Learning Rate": 4.977541782568015e-05, "Pretrain/Loss": 2.2175774574279785, "Pretrain/Loss (Raw)": 2.0261077880859375, "Pretrain/Step": 681, "Pretrain/Step Time": 8.529357086867094} +{"Pretrain/Learning Rate": 4.97742809777464e-05, "Pretrain/Loss": 2.2178964614868164, "Pretrain/Loss (Raw)": 2.2398619651794434, "Pretrain/Step": 682, "Pretrain/Step Time": 8.528385106474161} +{"Pretrain/Learning Rate": 4.9773141272725824e-05, "Pretrain/Loss": 2.218266725540161, "Pretrain/Loss (Raw)": 2.1115357875823975, "Pretrain/Step": 683, "Pretrain/Step Time": 8.535404974594712} +{"Pretrain/Learning Rate": 4.9771998710749864e-05, "Pretrain/Loss": 2.2154526710510254, "Pretrain/Loss (Raw)": 2.14182448387146, "Pretrain/Step": 684, "Pretrain/Step Time": 8.534513799473643} +{"Pretrain/Learning Rate": 4.977085329195028e-05, "Pretrain/Loss": 2.2152023315429688, "Pretrain/Loss (Raw)": 2.132382869720459, "Pretrain/Step": 685, "Pretrain/Step Time": 8.53748913668096} +{"Pretrain/Learning Rate": 4.9769705016459164e-05, "Pretrain/Loss": 2.211421251296997, "Pretrain/Loss (Raw)": 2.1917834281921387, "Pretrain/Step": 686, "Pretrain/Step Time": 8.533370401710272} +{"Pretrain/Learning Rate": 4.976855388440896e-05, "Pretrain/Loss": 2.212324380874634, "Pretrain/Loss (Raw)": 2.248603105545044, "Pretrain/Step": 687, "Pretrain/Step Time": 8.532370930537581} +{"Pretrain/Learning Rate": 4.97673998959324e-05, "Pretrain/Loss": 2.2114992141723633, "Pretrain/Loss (Raw)": 2.0749781131744385, "Pretrain/Step": 688, "Pretrain/Step Time": 8.533748459070921} +{"Pretrain/Learning Rate": 4.976624305116259e-05, "Pretrain/Loss": 2.2137207984924316, "Pretrain/Loss (Raw)": 2.13680100440979, "Pretrain/Step": 689, "Pretrain/Step Time": 8.536122441291809} +{"Pretrain/Learning Rate": 4.9765083350232913e-05, "Pretrain/Loss": 2.2154736518859863, "Pretrain/Loss (Raw)": 2.3073062896728516, "Pretrain/Step": 690, "Pretrain/Step Time": 8.534798355773091} +{"Pretrain/Learning Rate": 4.976392079327713e-05, "Pretrain/Loss": 2.2156906127929688, "Pretrain/Loss (Raw)": 2.1838538646698, "Pretrain/Step": 691, "Pretrain/Step Time": 8.533089702948928} +{"Pretrain/Learning Rate": 4.976275538042932e-05, "Pretrain/Loss": 2.2147514820098877, "Pretrain/Loss (Raw)": 2.1360716819763184, "Pretrain/Step": 692, "Pretrain/Step Time": 8.531079363077879} +{"Pretrain/Learning Rate": 4.976158711182386e-05, "Pretrain/Loss": 2.2148571014404297, "Pretrain/Loss (Raw)": 2.15372371673584, "Pretrain/Step": 693, "Pretrain/Step Time": 8.527712410315871} +{"Pretrain/Learning Rate": 4.9760415987595496e-05, "Pretrain/Loss": 2.217568874359131, "Pretrain/Loss (Raw)": 2.522444009780884, "Pretrain/Step": 694, "Pretrain/Step Time": 8.540865886956453} +{"Pretrain/Learning Rate": 4.9759242007879295e-05, "Pretrain/Loss": 2.21734619140625, "Pretrain/Loss (Raw)": 2.1407394409179688, "Pretrain/Step": 695, "Pretrain/Step Time": 8.540673790499568} +{"Pretrain/Learning Rate": 4.975806517281062e-05, "Pretrain/Loss": 2.2184948921203613, "Pretrain/Loss (Raw)": 2.267329454421997, "Pretrain/Step": 696, "Pretrain/Step Time": 8.53535789810121} +{"Pretrain/Learning Rate": 4.975688548252522e-05, "Pretrain/Loss": 2.2146494388580322, "Pretrain/Loss (Raw)": 2.0083978176116943, "Pretrain/Step": 697, "Pretrain/Step Time": 8.54091326892376} +{"Pretrain/Learning Rate": 4.9755702937159124e-05, "Pretrain/Loss": 2.2150678634643555, "Pretrain/Loss (Raw)": 2.348041534423828, "Pretrain/Step": 698, "Pretrain/Step Time": 8.537123501300812} +{"Pretrain/Learning Rate": 4.975451753684871e-05, "Pretrain/Loss": 2.215437650680542, "Pretrain/Loss (Raw)": 2.11867356300354, "Pretrain/Step": 699, "Pretrain/Step Time": 8.537213295698166} +{"Pretrain/Learning Rate": 4.975332928173069e-05, "Pretrain/Loss": 2.216029644012451, "Pretrain/Loss (Raw)": 2.3149404525756836, "Pretrain/Step": 700, "Pretrain/Step Time": 8.540237430483103} +{"Pretrain/Learning Rate": 4.975213817194209e-05, "Pretrain/Loss": 2.214703321456909, "Pretrain/Loss (Raw)": 2.089590549468994, "Pretrain/Step": 701, "Pretrain/Step Time": 8.539773389697075} +{"Pretrain/Learning Rate": 4.975094420762029e-05, "Pretrain/Loss": 2.2155280113220215, "Pretrain/Loss (Raw)": 2.1626803874969482, "Pretrain/Step": 702, "Pretrain/Step Time": 8.539227308705449} +{"Pretrain/Learning Rate": 4.9749747388902964e-05, "Pretrain/Loss": 2.214479923248291, "Pretrain/Loss (Raw)": 2.160856008529663, "Pretrain/Step": 703, "Pretrain/Step Time": 8.541752010583878} +{"Pretrain/Learning Rate": 4.974854771592815e-05, "Pretrain/Loss": 2.214853525161743, "Pretrain/Loss (Raw)": 2.2299506664276123, "Pretrain/Step": 704, "Pretrain/Step Time": 8.542995046824217} +{"Pretrain/Learning Rate": 4.974734518883419e-05, "Pretrain/Loss": 2.2125935554504395, "Pretrain/Loss (Raw)": 1.891736626625061, "Pretrain/Step": 705, "Pretrain/Step Time": 8.537194905802608} +{"Pretrain/Learning Rate": 4.974613980775977e-05, "Pretrain/Loss": 2.210731029510498, "Pretrain/Loss (Raw)": 2.2711563110351562, "Pretrain/Step": 706, "Pretrain/Step Time": 8.539024125784636} +{"Pretrain/Learning Rate": 4.974493157284391e-05, "Pretrain/Loss": 2.2107491493225098, "Pretrain/Loss (Raw)": 2.181119918823242, "Pretrain/Step": 707, "Pretrain/Step Time": 8.543693371117115} +{"Pretrain/Learning Rate": 4.974372048422593e-05, "Pretrain/Loss": 2.211252212524414, "Pretrain/Loss (Raw)": 2.1776363849639893, "Pretrain/Step": 708, "Pretrain/Step Time": 8.539920080453157} +{"Pretrain/Learning Rate": 4.974250654204551e-05, "Pretrain/Loss": 2.211756706237793, "Pretrain/Loss (Raw)": 2.22788405418396, "Pretrain/Step": 709, "Pretrain/Step Time": 8.540726751089096} +{"Pretrain/Learning Rate": 4.974128974644264e-05, "Pretrain/Loss": 2.2107951641082764, "Pretrain/Loss (Raw)": 2.0231142044067383, "Pretrain/Step": 710, "Pretrain/Step Time": 8.544388946145773} +{"Pretrain/Learning Rate": 4.9740070097557656e-05, "Pretrain/Loss": 2.2103118896484375, "Pretrain/Loss (Raw)": 2.085571050643921, "Pretrain/Step": 711, "Pretrain/Step Time": 8.541986487805843} +{"Pretrain/Learning Rate": 4.973884759553121e-05, "Pretrain/Loss": 2.2100348472595215, "Pretrain/Loss (Raw)": 2.077329158782959, "Pretrain/Step": 712, "Pretrain/Step Time": 8.541446331888437} +{"Pretrain/Learning Rate": 4.973762224050428e-05, "Pretrain/Loss": 2.208970785140991, "Pretrain/Loss (Raw)": 2.297267198562622, "Pretrain/Step": 713, "Pretrain/Step Time": 8.539760878309608} +{"Pretrain/Learning Rate": 4.973639403261819e-05, "Pretrain/Loss": 2.209437847137451, "Pretrain/Loss (Raw)": 2.2322335243225098, "Pretrain/Step": 714, "Pretrain/Step Time": 8.538433331996202} +{"Pretrain/Learning Rate": 4.9735162972014584e-05, "Pretrain/Loss": 2.209742546081543, "Pretrain/Loss (Raw)": 2.2702693939208984, "Pretrain/Step": 715, "Pretrain/Step Time": 8.537769073620439} +{"Pretrain/Learning Rate": 4.9733929058835425e-05, "Pretrain/Loss": 2.2077584266662598, "Pretrain/Loss (Raw)": 2.141869306564331, "Pretrain/Step": 716, "Pretrain/Step Time": 8.535282788798213} +{"Pretrain/Learning Rate": 4.973269229322301e-05, "Pretrain/Loss": 2.209177255630493, "Pretrain/Loss (Raw)": 2.2623350620269775, "Pretrain/Step": 717, "Pretrain/Step Time": 8.534965429455042} +{"Pretrain/Learning Rate": 4.973145267531998e-05, "Pretrain/Loss": 2.209500312805176, "Pretrain/Loss (Raw)": 2.2330477237701416, "Pretrain/Step": 718, "Pretrain/Step Time": 8.539529643952847} +{"Pretrain/Learning Rate": 4.973021020526929e-05, "Pretrain/Loss": 2.2087817192077637, "Pretrain/Loss (Raw)": 2.2268636226654053, "Pretrain/Step": 719, "Pretrain/Step Time": 8.541961511597037} +{"Pretrain/Learning Rate": 4.972896488321422e-05, "Pretrain/Loss": 2.207859516143799, "Pretrain/Loss (Raw)": 2.052236557006836, "Pretrain/Step": 720, "Pretrain/Step Time": 8.539918154478073} +{"Pretrain/Learning Rate": 4.97277167092984e-05, "Pretrain/Loss": 2.204831838607788, "Pretrain/Loss (Raw)": 1.923721432685852, "Pretrain/Step": 721, "Pretrain/Step Time": 8.535665119066834} +{"Pretrain/Learning Rate": 4.972646568366577e-05, "Pretrain/Loss": 2.2027196884155273, "Pretrain/Loss (Raw)": 2.1046695709228516, "Pretrain/Step": 722, "Pretrain/Step Time": 8.534412954002619} +{"Pretrain/Learning Rate": 4.9725211806460604e-05, "Pretrain/Loss": 2.202650547027588, "Pretrain/Loss (Raw)": 2.157092809677124, "Pretrain/Step": 723, "Pretrain/Step Time": 8.542239848524332} +{"Pretrain/Learning Rate": 4.97239550778275e-05, "Pretrain/Loss": 2.2019829750061035, "Pretrain/Loss (Raw)": 2.129645347595215, "Pretrain/Step": 724, "Pretrain/Step Time": 8.543319894000888} +{"Pretrain/Learning Rate": 4.972269549791139e-05, "Pretrain/Loss": 2.2006962299346924, "Pretrain/Loss (Raw)": 2.0427587032318115, "Pretrain/Step": 725, "Pretrain/Step Time": 8.535704469308257} +{"Pretrain/Learning Rate": 4.9721433066857535e-05, "Pretrain/Loss": 2.2010560035705566, "Pretrain/Loss (Raw)": 2.1980929374694824, "Pretrain/Step": 726, "Pretrain/Step Time": 8.544958088546991} +{"Pretrain/Learning Rate": 4.9720167784811535e-05, "Pretrain/Loss": 2.1978588104248047, "Pretrain/Loss (Raw)": 1.7520394325256348, "Pretrain/Step": 727, "Pretrain/Step Time": 8.539472494274378} +{"Pretrain/Learning Rate": 4.97188996519193e-05, "Pretrain/Loss": 2.195526361465454, "Pretrain/Loss (Raw)": 2.1401100158691406, "Pretrain/Step": 728, "Pretrain/Step Time": 8.534676425158978} +{"Pretrain/Learning Rate": 4.971762866832708e-05, "Pretrain/Loss": 2.1945223808288574, "Pretrain/Loss (Raw)": 2.028805732727051, "Pretrain/Step": 729, "Pretrain/Step Time": 8.542544400319457} +{"Pretrain/Learning Rate": 4.971635483418144e-05, "Pretrain/Loss": 2.195023536682129, "Pretrain/Loss (Raw)": 2.2302048206329346, "Pretrain/Step": 730, "Pretrain/Step Time": 8.54525020904839} +{"Pretrain/Learning Rate": 4.97150781496293e-05, "Pretrain/Loss": 2.1946310997009277, "Pretrain/Loss (Raw)": 2.258476495742798, "Pretrain/Step": 731, "Pretrain/Step Time": 8.538469271734357} +{"Pretrain/Learning Rate": 4.971379861481789e-05, "Pretrain/Loss": 2.19439959526062, "Pretrain/Loss (Raw)": 2.229008197784424, "Pretrain/Step": 732, "Pretrain/Step Time": 8.547094719484448} +{"Pretrain/Learning Rate": 4.9712516229894756e-05, "Pretrain/Loss": 2.1926984786987305, "Pretrain/Loss (Raw)": 2.0043537616729736, "Pretrain/Step": 733, "Pretrain/Step Time": 8.543034363538027} +{"Pretrain/Learning Rate": 4.971123099500781e-05, "Pretrain/Loss": 2.192340850830078, "Pretrain/Loss (Raw)": 2.087470293045044, "Pretrain/Step": 734, "Pretrain/Step Time": 8.54146004281938} +{"Pretrain/Learning Rate": 4.970994291030526e-05, "Pretrain/Loss": 2.19264554977417, "Pretrain/Loss (Raw)": 2.172382354736328, "Pretrain/Step": 735, "Pretrain/Step Time": 8.543322198092937} +{"Pretrain/Learning Rate": 4.970865197593566e-05, "Pretrain/Loss": 2.192396879196167, "Pretrain/Loss (Raw)": 2.0988118648529053, "Pretrain/Step": 736, "Pretrain/Step Time": 8.544505313038826} +{"Pretrain/Learning Rate": 4.9707358192047885e-05, "Pretrain/Loss": 2.1912221908569336, "Pretrain/Loss (Raw)": 2.2750439643859863, "Pretrain/Step": 737, "Pretrain/Step Time": 8.532516609877348} +{"Pretrain/Learning Rate": 4.970606155879113e-05, "Pretrain/Loss": 2.1926450729370117, "Pretrain/Loss (Raw)": 2.25614595413208, "Pretrain/Step": 738, "Pretrain/Step Time": 8.533239474520087} +{"Pretrain/Learning Rate": 4.970476207631494e-05, "Pretrain/Loss": 2.1926512718200684, "Pretrain/Loss (Raw)": 2.1032230854034424, "Pretrain/Step": 739, "Pretrain/Step Time": 8.533425517380238} +{"Pretrain/Learning Rate": 4.970345974476918e-05, "Pretrain/Loss": 2.192387104034424, "Pretrain/Loss (Raw)": 2.2171666622161865, "Pretrain/Step": 740, "Pretrain/Step Time": 8.533346056938171} +{"Pretrain/Learning Rate": 4.970215456430403e-05, "Pretrain/Loss": 2.191746950149536, "Pretrain/Loss (Raw)": 2.1189446449279785, "Pretrain/Step": 741, "Pretrain/Step Time": 8.53972116485238} +{"Pretrain/Learning Rate": 4.970084653507001e-05, "Pretrain/Loss": 2.191868782043457, "Pretrain/Loss (Raw)": 2.1151721477508545, "Pretrain/Step": 742, "Pretrain/Step Time": 8.544494550675154} +{"Pretrain/Learning Rate": 4.969953565721799e-05, "Pretrain/Loss": 2.192164182662964, "Pretrain/Loss (Raw)": 2.2999017238616943, "Pretrain/Step": 743, "Pretrain/Step Time": 8.536610724404454} +{"Pretrain/Learning Rate": 4.969822193089911e-05, "Pretrain/Loss": 2.1941428184509277, "Pretrain/Loss (Raw)": 2.203749179840088, "Pretrain/Step": 744, "Pretrain/Step Time": 8.533610109239817} +{"Pretrain/Learning Rate": 4.969690535626491e-05, "Pretrain/Loss": 2.1918230056762695, "Pretrain/Loss (Raw)": 2.1740167140960693, "Pretrain/Step": 745, "Pretrain/Step Time": 8.528996301814914} +{"Pretrain/Learning Rate": 4.96955859334672e-05, "Pretrain/Loss": 2.191969633102417, "Pretrain/Loss (Raw)": 2.2602803707122803, "Pretrain/Step": 746, "Pretrain/Step Time": 8.54053458943963} +{"Pretrain/Learning Rate": 4.9694263662658156e-05, "Pretrain/Loss": 2.192476749420166, "Pretrain/Loss (Raw)": 2.3712568283081055, "Pretrain/Step": 747, "Pretrain/Step Time": 8.53505408577621} +{"Pretrain/Learning Rate": 4.9692938543990265e-05, "Pretrain/Loss": 2.192612409591675, "Pretrain/Loss (Raw)": 2.3712854385375977, "Pretrain/Step": 748, "Pretrain/Step Time": 8.5350935831666} +{"Pretrain/Learning Rate": 4.969161057761634e-05, "Pretrain/Loss": 2.1908504962921143, "Pretrain/Loss (Raw)": 2.065335988998413, "Pretrain/Step": 749, "Pretrain/Step Time": 8.532831508666277} +{"Pretrain/Learning Rate": 4.969027976368954e-05, "Pretrain/Loss": 2.1913368701934814, "Pretrain/Loss (Raw)": 2.23895525932312, "Pretrain/Step": 750, "Pretrain/Step Time": 8.532628307119012} +{"Pretrain/Learning Rate": 4.968894610236332e-05, "Pretrain/Loss": 2.1888349056243896, "Pretrain/Loss (Raw)": 2.0017125606536865, "Pretrain/Step": 751, "Pretrain/Step Time": 8.531695444136858} +{"Pretrain/Learning Rate": 4.968760959379151e-05, "Pretrain/Loss": 2.1878671646118164, "Pretrain/Loss (Raw)": 2.138338327407837, "Pretrain/Step": 752, "Pretrain/Step Time": 8.528227668255568} +{"Pretrain/Learning Rate": 4.968627023812822e-05, "Pretrain/Loss": 2.1884331703186035, "Pretrain/Loss (Raw)": 2.1105051040649414, "Pretrain/Step": 753, "Pretrain/Step Time": 8.53251695819199} +{"Pretrain/Learning Rate": 4.968492803552793e-05, "Pretrain/Loss": 2.1899280548095703, "Pretrain/Loss (Raw)": 2.240138053894043, "Pretrain/Step": 754, "Pretrain/Step Time": 8.532426526769996} +{"Pretrain/Learning Rate": 4.968358298614541e-05, "Pretrain/Loss": 2.189382791519165, "Pretrain/Loss (Raw)": 2.094590425491333, "Pretrain/Step": 755, "Pretrain/Step Time": 8.527105396613479} +{"Pretrain/Learning Rate": 4.968223509013579e-05, "Pretrain/Loss": 2.188293933868408, "Pretrain/Loss (Raw)": 2.1397883892059326, "Pretrain/Step": 756, "Pretrain/Step Time": 8.526755606755614} +{"Pretrain/Learning Rate": 4.968088434765452e-05, "Pretrain/Loss": 2.1909921169281006, "Pretrain/Loss (Raw)": 2.4234743118286133, "Pretrain/Step": 757, "Pretrain/Step Time": 8.530622301623225} +{"Pretrain/Learning Rate": 4.967953075885736e-05, "Pretrain/Loss": 2.1890106201171875, "Pretrain/Loss (Raw)": 2.0755460262298584, "Pretrain/Step": 758, "Pretrain/Step Time": 8.532122576609254} +{"Pretrain/Learning Rate": 4.9678174323900415e-05, "Pretrain/Loss": 2.1877684593200684, "Pretrain/Loss (Raw)": 2.173651695251465, "Pretrain/Step": 759, "Pretrain/Step Time": 8.534396966919303} +{"Pretrain/Learning Rate": 4.9676815042940125e-05, "Pretrain/Loss": 2.1869630813598633, "Pretrain/Loss (Raw)": 1.991127371788025, "Pretrain/Step": 760, "Pretrain/Step Time": 8.528897078707814} +{"Pretrain/Learning Rate": 4.967545291613325e-05, "Pretrain/Loss": 2.1872479915618896, "Pretrain/Loss (Raw)": 2.252653121948242, "Pretrain/Step": 761, "Pretrain/Step Time": 8.532133653759956} +{"Pretrain/Learning Rate": 4.967408794363686e-05, "Pretrain/Loss": 2.186737060546875, "Pretrain/Loss (Raw)": 2.271782398223877, "Pretrain/Step": 762, "Pretrain/Step Time": 8.536204004660249} +{"Pretrain/Learning Rate": 4.9672720125608384e-05, "Pretrain/Loss": 2.1864757537841797, "Pretrain/Loss (Raw)": 2.0699405670166016, "Pretrain/Step": 763, "Pretrain/Step Time": 8.5329823885113} +{"Pretrain/Learning Rate": 4.9671349462205565e-05, "Pretrain/Loss": 2.187972068786621, "Pretrain/Loss (Raw)": 2.4444737434387207, "Pretrain/Step": 764, "Pretrain/Step Time": 8.536937179043889} +{"Pretrain/Learning Rate": 4.966997595358647e-05, "Pretrain/Loss": 2.187378406524658, "Pretrain/Loss (Raw)": 2.1282589435577393, "Pretrain/Step": 765, "Pretrain/Step Time": 8.53960233926773} +{"Pretrain/Learning Rate": 4.966859959990949e-05, "Pretrain/Loss": 2.1896748542785645, "Pretrain/Loss (Raw)": 2.387740135192871, "Pretrain/Step": 766, "Pretrain/Step Time": 8.538392094895244} +{"Pretrain/Learning Rate": 4.966722040133337e-05, "Pretrain/Loss": 2.188896894454956, "Pretrain/Loss (Raw)": 2.2082958221435547, "Pretrain/Step": 767, "Pretrain/Step Time": 8.534883523359895} +{"Pretrain/Learning Rate": 4.9665838358017156e-05, "Pretrain/Loss": 2.1877999305725098, "Pretrain/Loss (Raw)": 1.9898172616958618, "Pretrain/Step": 768, "Pretrain/Step Time": 8.52896930463612} +{"Pretrain/Learning Rate": 4.966445347012023e-05, "Pretrain/Loss": 2.1851181983947754, "Pretrain/Loss (Raw)": 2.0567569732666016, "Pretrain/Step": 769, "Pretrain/Step Time": 8.529267616569996} +{"Pretrain/Learning Rate": 4.9663065737802316e-05, "Pretrain/Loss": 2.1852033138275146, "Pretrain/Loss (Raw)": 2.1423966884613037, "Pretrain/Step": 770, "Pretrain/Step Time": 8.535893114283681} +{"Pretrain/Learning Rate": 4.9661675161223435e-05, "Pretrain/Loss": 2.1799678802490234, "Pretrain/Loss (Raw)": 2.1861255168914795, "Pretrain/Step": 771, "Pretrain/Step Time": 8.541437793523073} +{"Pretrain/Learning Rate": 4.966028174054397e-05, "Pretrain/Loss": 2.1795530319213867, "Pretrain/Loss (Raw)": 1.8901633024215698, "Pretrain/Step": 772, "Pretrain/Step Time": 8.542226951569319} +{"Pretrain/Learning Rate": 4.965888547592461e-05, "Pretrain/Loss": 2.179201364517212, "Pretrain/Loss (Raw)": 2.1047606468200684, "Pretrain/Step": 773, "Pretrain/Step Time": 8.54111636057496} +{"Pretrain/Learning Rate": 4.965748636752638e-05, "Pretrain/Loss": 2.1761913299560547, "Pretrain/Loss (Raw)": 2.365159511566162, "Pretrain/Step": 774, "Pretrain/Step Time": 8.540777254849672} +{"Pretrain/Learning Rate": 4.965608441551063e-05, "Pretrain/Loss": 2.175997734069824, "Pretrain/Loss (Raw)": 2.214543342590332, "Pretrain/Step": 775, "Pretrain/Step Time": 8.539437418803573} +{"Pretrain/Learning Rate": 4.965467962003905e-05, "Pretrain/Loss": 2.174729824066162, "Pretrain/Loss (Raw)": 2.0425612926483154, "Pretrain/Step": 776, "Pretrain/Step Time": 8.535313567146659} +{"Pretrain/Learning Rate": 4.965327198127363e-05, "Pretrain/Loss": 2.1736340522766113, "Pretrain/Loss (Raw)": 2.163841485977173, "Pretrain/Step": 777, "Pretrain/Step Time": 8.537526628002524} +{"Pretrain/Learning Rate": 4.965186149937672e-05, "Pretrain/Loss": 2.1740479469299316, "Pretrain/Loss (Raw)": 2.1543056964874268, "Pretrain/Step": 778, "Pretrain/Step Time": 8.535701790824533} +{"Pretrain/Learning Rate": 4.9650448174510986e-05, "Pretrain/Loss": 2.175231695175171, "Pretrain/Loss (Raw)": 2.2441182136535645, "Pretrain/Step": 779, "Pretrain/Step Time": 8.543476022779942} +{"Pretrain/Learning Rate": 4.9649032006839404e-05, "Pretrain/Loss": 2.1742663383483887, "Pretrain/Loss (Raw)": 2.2257511615753174, "Pretrain/Step": 780, "Pretrain/Step Time": 8.54210633970797} +{"Pretrain/Learning Rate": 4.964761299652529e-05, "Pretrain/Loss": 2.175168991088867, "Pretrain/Loss (Raw)": 2.209012746810913, "Pretrain/Step": 781, "Pretrain/Step Time": 8.542213965207338} +{"Pretrain/Learning Rate": 4.9646191143732324e-05, "Pretrain/Loss": 2.1755194664001465, "Pretrain/Loss (Raw)": 2.2118043899536133, "Pretrain/Step": 782, "Pretrain/Step Time": 8.540257286280394} +{"Pretrain/Learning Rate": 4.9644766448624444e-05, "Pretrain/Loss": 2.1758480072021484, "Pretrain/Loss (Raw)": 2.146256446838379, "Pretrain/Step": 783, "Pretrain/Step Time": 8.544513268396258} +{"Pretrain/Learning Rate": 4.9643338911365964e-05, "Pretrain/Loss": 2.1757001876831055, "Pretrain/Loss (Raw)": 2.170477867126465, "Pretrain/Step": 784, "Pretrain/Step Time": 8.546967135742307} +{"Pretrain/Learning Rate": 4.9641908532121525e-05, "Pretrain/Loss": 2.17692494392395, "Pretrain/Loss (Raw)": 2.279911756515503, "Pretrain/Step": 785, "Pretrain/Step Time": 8.537164220586419} +{"Pretrain/Learning Rate": 4.964047531105608e-05, "Pretrain/Loss": 2.174910068511963, "Pretrain/Loss (Raw)": 2.1764302253723145, "Pretrain/Step": 786, "Pretrain/Step Time": 8.537906609475613} +{"Pretrain/Learning Rate": 4.963903924833491e-05, "Pretrain/Loss": 2.1773955821990967, "Pretrain/Loss (Raw)": 2.5720696449279785, "Pretrain/Step": 787, "Pretrain/Step Time": 8.54044483974576} +{"Pretrain/Learning Rate": 4.963760034412363e-05, "Pretrain/Loss": 2.176450729370117, "Pretrain/Loss (Raw)": 2.2075719833374023, "Pretrain/Step": 788, "Pretrain/Step Time": 8.541463863104582} +{"Pretrain/Learning Rate": 4.9636158598588185e-05, "Pretrain/Loss": 2.1736397743225098, "Pretrain/Loss (Raw)": 2.007413625717163, "Pretrain/Step": 789, "Pretrain/Step Time": 8.54195793159306} +{"Pretrain/Learning Rate": 4.9634714011894836e-05, "Pretrain/Loss": 2.1754987239837646, "Pretrain/Loss (Raw)": 2.2549431324005127, "Pretrain/Step": 790, "Pretrain/Step Time": 8.539181334897876} +{"Pretrain/Learning Rate": 4.963326658421019e-05, "Pretrain/Loss": 2.1758413314819336, "Pretrain/Loss (Raw)": 2.196160316467285, "Pretrain/Step": 791, "Pretrain/Step Time": 8.544058192521334} +{"Pretrain/Learning Rate": 4.9631816315701165e-05, "Pretrain/Loss": 2.1760716438293457, "Pretrain/Loss (Raw)": 2.3565754890441895, "Pretrain/Step": 792, "Pretrain/Step Time": 8.536215994507074} +{"Pretrain/Learning Rate": 4.9630363206535e-05, "Pretrain/Loss": 2.1761341094970703, "Pretrain/Loss (Raw)": 2.326763153076172, "Pretrain/Step": 793, "Pretrain/Step Time": 8.535103503614664} +{"Pretrain/Learning Rate": 4.962890725687931e-05, "Pretrain/Loss": 2.17535138130188, "Pretrain/Loss (Raw)": 2.131720781326294, "Pretrain/Step": 794, "Pretrain/Step Time": 8.5384426638484} +{"Pretrain/Learning Rate": 4.962744846690196e-05, "Pretrain/Loss": 2.1771864891052246, "Pretrain/Loss (Raw)": 2.3875365257263184, "Pretrain/Step": 795, "Pretrain/Step Time": 8.544989868998528} +{"Pretrain/Learning Rate": 4.962598683677122e-05, "Pretrain/Loss": 2.1772305965423584, "Pretrain/Loss (Raw)": 2.077995777130127, "Pretrain/Step": 796, "Pretrain/Step Time": 8.548833150416613} +{"Pretrain/Learning Rate": 4.9624522366655625e-05, "Pretrain/Loss": 2.1807079315185547, "Pretrain/Loss (Raw)": 2.486149549484253, "Pretrain/Step": 797, "Pretrain/Step Time": 8.55041634477675} +{"Pretrain/Learning Rate": 4.962305505672408e-05, "Pretrain/Loss": 2.1794252395629883, "Pretrain/Loss (Raw)": 2.0724480152130127, "Pretrain/Step": 798, "Pretrain/Step Time": 8.550403932109475} +{"Pretrain/Learning Rate": 4.96215849071458e-05, "Pretrain/Loss": 2.179474115371704, "Pretrain/Loss (Raw)": 2.137192487716675, "Pretrain/Step": 799, "Pretrain/Step Time": 8.549673397094011} +{"Pretrain/Learning Rate": 4.962011191809033e-05, "Pretrain/Loss": 2.178414821624756, "Pretrain/Loss (Raw)": 2.195986747741699, "Pretrain/Step": 800, "Pretrain/Step Time": 8.551903143525124} +{"Pretrain/Learning Rate": 4.961863608972753e-05, "Pretrain/Loss": 2.1775197982788086, "Pretrain/Loss (Raw)": 2.126924991607666, "Pretrain/Step": 801, "Pretrain/Step Time": 8.556053765118122} +{"Pretrain/Learning Rate": 4.961715742222762e-05, "Pretrain/Loss": 2.1786208152770996, "Pretrain/Loss (Raw)": 2.3181209564208984, "Pretrain/Step": 802, "Pretrain/Step Time": 8.569736434146762} +{"Pretrain/Learning Rate": 4.961567591576112e-05, "Pretrain/Loss": 2.176396369934082, "Pretrain/Loss (Raw)": 2.2149641513824463, "Pretrain/Step": 803, "Pretrain/Step Time": 8.559930950403214} +{"Pretrain/Learning Rate": 4.961419157049887e-05, "Pretrain/Loss": 2.1769936084747314, "Pretrain/Loss (Raw)": 2.1094167232513428, "Pretrain/Step": 804, "Pretrain/Step Time": 8.554481711238623} +{"Pretrain/Learning Rate": 4.9612704386612066e-05, "Pretrain/Loss": 2.1789357662200928, "Pretrain/Loss (Raw)": 2.273183584213257, "Pretrain/Step": 805, "Pretrain/Step Time": 8.551153944805264} +{"Pretrain/Learning Rate": 4.9611214364272206e-05, "Pretrain/Loss": 2.179816484451294, "Pretrain/Loss (Raw)": 2.2151753902435303, "Pretrain/Step": 806, "Pretrain/Step Time": 8.548989966511726} +{"Pretrain/Learning Rate": 4.960972150365114e-05, "Pretrain/Loss": 2.1771798133850098, "Pretrain/Loss (Raw)": 2.0436148643493652, "Pretrain/Step": 807, "Pretrain/Step Time": 8.556240556761622} +{"Pretrain/Learning Rate": 4.960822580492103e-05, "Pretrain/Loss": 2.177816390991211, "Pretrain/Loss (Raw)": 2.19409441947937, "Pretrain/Step": 808, "Pretrain/Step Time": 8.56299197115004} +{"Pretrain/Learning Rate": 4.960672726825436e-05, "Pretrain/Loss": 2.1778783798217773, "Pretrain/Loss (Raw)": 2.0340158939361572, "Pretrain/Step": 809, "Pretrain/Step Time": 8.561514241620898} +{"Pretrain/Learning Rate": 4.960522589382395e-05, "Pretrain/Loss": 2.1780972480773926, "Pretrain/Loss (Raw)": 2.2679123878479004, "Pretrain/Step": 810, "Pretrain/Step Time": 8.558421464636922} +{"Pretrain/Learning Rate": 4.960372168180294e-05, "Pretrain/Loss": 2.179779529571533, "Pretrain/Loss (Raw)": 2.326840877532959, "Pretrain/Step": 811, "Pretrain/Step Time": 8.552220987156034} +{"Pretrain/Learning Rate": 4.9602214632364816e-05, "Pretrain/Loss": 2.1789984703063965, "Pretrain/Loss (Raw)": 2.041853904724121, "Pretrain/Step": 812, "Pretrain/Step Time": 8.551604291424155} +{"Pretrain/Learning Rate": 4.9600704745683367e-05, "Pretrain/Loss": 2.1782727241516113, "Pretrain/Loss (Raw)": 2.0394833087921143, "Pretrain/Step": 813, "Pretrain/Step Time": 8.556747499853373} +{"Pretrain/Learning Rate": 4.959919202193273e-05, "Pretrain/Loss": 2.1769280433654785, "Pretrain/Loss (Raw)": 2.0196869373321533, "Pretrain/Step": 814, "Pretrain/Step Time": 8.55843292362988} +{"Pretrain/Learning Rate": 4.959767646128735e-05, "Pretrain/Loss": 2.175675868988037, "Pretrain/Loss (Raw)": 2.0883235931396484, "Pretrain/Step": 815, "Pretrain/Step Time": 8.562106540426612} +{"Pretrain/Learning Rate": 4.959615806392201e-05, "Pretrain/Loss": 2.176514148712158, "Pretrain/Loss (Raw)": 2.182281494140625, "Pretrain/Step": 816, "Pretrain/Step Time": 8.553312310948968} +{"Pretrain/Learning Rate": 4.959463683001182e-05, "Pretrain/Loss": 2.177903175354004, "Pretrain/Loss (Raw)": 2.3145761489868164, "Pretrain/Step": 817, "Pretrain/Step Time": 8.547865010797977} +{"Pretrain/Learning Rate": 4.959311275973223e-05, "Pretrain/Loss": 2.1768269538879395, "Pretrain/Loss (Raw)": 2.169543743133545, "Pretrain/Step": 818, "Pretrain/Step Time": 8.54961870610714} +{"Pretrain/Learning Rate": 4.959158585325898e-05, "Pretrain/Loss": 2.178475856781006, "Pretrain/Loss (Raw)": 2.394925117492676, "Pretrain/Step": 819, "Pretrain/Step Time": 8.547009503468871} +{"Pretrain/Learning Rate": 4.959005611076817e-05, "Pretrain/Loss": 2.179187536239624, "Pretrain/Loss (Raw)": 2.2271885871887207, "Pretrain/Step": 820, "Pretrain/Step Time": 8.555691616609693} +{"Pretrain/Learning Rate": 4.9588523532436214e-05, "Pretrain/Loss": 2.1794252395629883, "Pretrain/Loss (Raw)": 2.184124231338501, "Pretrain/Step": 821, "Pretrain/Step Time": 8.556085022166371} +{"Pretrain/Learning Rate": 4.9586988118439863e-05, "Pretrain/Loss": 2.1774802207946777, "Pretrain/Loss (Raw)": 2.273489475250244, "Pretrain/Step": 822, "Pretrain/Step Time": 8.545106099918485} +{"Pretrain/Learning Rate": 4.958544986895619e-05, "Pretrain/Loss": 2.1792407035827637, "Pretrain/Loss (Raw)": 2.366084098815918, "Pretrain/Step": 823, "Pretrain/Step Time": 8.544141467660666} +{"Pretrain/Learning Rate": 4.958390878416258e-05, "Pretrain/Loss": 2.1795220375061035, "Pretrain/Loss (Raw)": 2.3033523559570312, "Pretrain/Step": 824, "Pretrain/Step Time": 8.546142175793648} +{"Pretrain/Learning Rate": 4.9582364864236765e-05, "Pretrain/Loss": 2.1817641258239746, "Pretrain/Loss (Raw)": 2.295341730117798, "Pretrain/Step": 825, "Pretrain/Step Time": 8.541163053363562} +{"Pretrain/Learning Rate": 4.95808181093568e-05, "Pretrain/Loss": 2.1798934936523438, "Pretrain/Loss (Raw)": 2.1086056232452393, "Pretrain/Step": 826, "Pretrain/Step Time": 8.547428356483579} +{"Pretrain/Learning Rate": 4.9579268519701063e-05, "Pretrain/Loss": 2.18043851852417, "Pretrain/Loss (Raw)": 2.188448905944824, "Pretrain/Step": 827, "Pretrain/Step Time": 8.54409451968968} +{"Pretrain/Learning Rate": 4.957771609544826e-05, "Pretrain/Loss": 2.180093288421631, "Pretrain/Loss (Raw)": 2.2707626819610596, "Pretrain/Step": 828, "Pretrain/Step Time": 8.540892072021961} +{"Pretrain/Learning Rate": 4.957616083677742e-05, "Pretrain/Loss": 2.180237293243408, "Pretrain/Loss (Raw)": 2.108020305633545, "Pretrain/Step": 829, "Pretrain/Step Time": 8.540816839784384} +{"Pretrain/Learning Rate": 4.9574602743867916e-05, "Pretrain/Loss": 2.178494453430176, "Pretrain/Loss (Raw)": 1.9395921230316162, "Pretrain/Step": 830, "Pretrain/Step Time": 8.542102290317416} +{"Pretrain/Learning Rate": 4.957304181689941e-05, "Pretrain/Loss": 2.178899049758911, "Pretrain/Loss (Raw)": 2.212669610977173, "Pretrain/Step": 831, "Pretrain/Step Time": 8.538615200668573} +{"Pretrain/Learning Rate": 4.957147805605194e-05, "Pretrain/Loss": 2.1787405014038086, "Pretrain/Loss (Raw)": 2.2096407413482666, "Pretrain/Step": 832, "Pretrain/Step Time": 8.547853633761406} +{"Pretrain/Learning Rate": 4.956991146150583e-05, "Pretrain/Loss": 2.1827688217163086, "Pretrain/Loss (Raw)": 2.4073641300201416, "Pretrain/Step": 833, "Pretrain/Step Time": 8.549724221229553} +{"Pretrain/Learning Rate": 4.9568342033441755e-05, "Pretrain/Loss": 2.1816036701202393, "Pretrain/Loss (Raw)": 2.1220037937164307, "Pretrain/Step": 834, "Pretrain/Step Time": 8.546894090250134} +{"Pretrain/Learning Rate": 4.956676977204071e-05, "Pretrain/Loss": 2.182762861251831, "Pretrain/Loss (Raw)": 2.329505681991577, "Pretrain/Step": 835, "Pretrain/Step Time": 8.543114995583892} +{"Pretrain/Learning Rate": 4.9565194677484e-05, "Pretrain/Loss": 2.181671619415283, "Pretrain/Loss (Raw)": 2.0379745960235596, "Pretrain/Step": 836, "Pretrain/Step Time": 8.539805181324482} +{"Pretrain/Learning Rate": 4.95636167499533e-05, "Pretrain/Loss": 2.1792047023773193, "Pretrain/Loss (Raw)": 1.9120997190475464, "Pretrain/Step": 837, "Pretrain/Step Time": 8.542306140065193} +{"Pretrain/Learning Rate": 4.9562035989630564e-05, "Pretrain/Loss": 2.1826088428497314, "Pretrain/Loss (Raw)": 2.458841323852539, "Pretrain/Step": 838, "Pretrain/Step Time": 8.548691913485527} +{"Pretrain/Learning Rate": 4.95604523966981e-05, "Pretrain/Loss": 2.1811904907226562, "Pretrain/Loss (Raw)": 1.904059648513794, "Pretrain/Step": 839, "Pretrain/Step Time": 8.54925812408328} +{"Pretrain/Learning Rate": 4.9558865971338524e-05, "Pretrain/Loss": 2.18343448638916, "Pretrain/Loss (Raw)": 2.364516019821167, "Pretrain/Step": 840, "Pretrain/Step Time": 8.541014451533556} +{"Pretrain/Learning Rate": 4.9557276713734805e-05, "Pretrain/Loss": 2.1831812858581543, "Pretrain/Loss (Raw)": 2.2648472785949707, "Pretrain/Step": 841, "Pretrain/Step Time": 8.54146721959114} +{"Pretrain/Learning Rate": 4.955568462407022e-05, "Pretrain/Loss": 2.1840004920959473, "Pretrain/Loss (Raw)": 2.3370954990386963, "Pretrain/Step": 842, "Pretrain/Step Time": 8.53899516351521} +{"Pretrain/Learning Rate": 4.955408970252837e-05, "Pretrain/Loss": 2.183262348175049, "Pretrain/Loss (Raw)": 2.175804853439331, "Pretrain/Step": 843, "Pretrain/Step Time": 8.539431046694517} +{"Pretrain/Learning Rate": 4.955249194929319e-05, "Pretrain/Loss": 2.183382034301758, "Pretrain/Loss (Raw)": 2.1572043895721436, "Pretrain/Step": 844, "Pretrain/Step Time": 8.550663040950894} +{"Pretrain/Learning Rate": 4.955089136454895e-05, "Pretrain/Loss": 2.1832823753356934, "Pretrain/Loss (Raw)": 2.2495510578155518, "Pretrain/Step": 845, "Pretrain/Step Time": 8.552456134930253} +{"Pretrain/Learning Rate": 4.954928794848023e-05, "Pretrain/Loss": 2.1831483840942383, "Pretrain/Loss (Raw)": 2.215921401977539, "Pretrain/Step": 846, "Pretrain/Step Time": 8.549377864226699} +{"Pretrain/Learning Rate": 4.954768170127194e-05, "Pretrain/Loss": 2.1835145950317383, "Pretrain/Loss (Raw)": 2.2737460136413574, "Pretrain/Step": 847, "Pretrain/Step Time": 8.540660850703716} +{"Pretrain/Learning Rate": 4.9546072623109325e-05, "Pretrain/Loss": 2.184311866760254, "Pretrain/Loss (Raw)": 2.154261827468872, "Pretrain/Step": 848, "Pretrain/Step Time": 8.549642572179437} +{"Pretrain/Learning Rate": 4.954446071417795e-05, "Pretrain/Loss": 2.1860036849975586, "Pretrain/Loss (Raw)": 2.140289545059204, "Pretrain/Step": 849, "Pretrain/Step Time": 8.546288648620248} +{"Pretrain/Learning Rate": 4.954284597466371e-05, "Pretrain/Loss": 2.187145471572876, "Pretrain/Loss (Raw)": 2.250800609588623, "Pretrain/Step": 850, "Pretrain/Step Time": 8.555628223344684} +{"Pretrain/Learning Rate": 4.954122840475281e-05, "Pretrain/Loss": 2.1880650520324707, "Pretrain/Loss (Raw)": 2.274787425994873, "Pretrain/Step": 851, "Pretrain/Step Time": 8.546873476356268} +{"Pretrain/Learning Rate": 4.9539608004631825e-05, "Pretrain/Loss": 2.1883068084716797, "Pretrain/Loss (Raw)": 2.1606240272521973, "Pretrain/Step": 852, "Pretrain/Step Time": 8.5504892449826} +{"Pretrain/Learning Rate": 4.9537984774487606e-05, "Pretrain/Loss": 2.1890077590942383, "Pretrain/Loss (Raw)": 2.132451295852661, "Pretrain/Step": 853, "Pretrain/Step Time": 8.54791227541864} +{"Pretrain/Learning Rate": 4.953635871450736e-05, "Pretrain/Loss": 2.1888952255249023, "Pretrain/Loss (Raw)": 2.183715343475342, "Pretrain/Step": 854, "Pretrain/Step Time": 8.54106355085969} +{"Pretrain/Learning Rate": 4.95347298248786e-05, "Pretrain/Loss": 2.191863536834717, "Pretrain/Loss (Raw)": 2.1319706439971924, "Pretrain/Step": 855, "Pretrain/Step Time": 8.545452993363142} +{"Pretrain/Learning Rate": 4.953309810578918e-05, "Pretrain/Loss": 2.192080020904541, "Pretrain/Loss (Raw)": 2.167804479598999, "Pretrain/Step": 856, "Pretrain/Step Time": 8.551102513447404} +{"Pretrain/Learning Rate": 4.953146355742729e-05, "Pretrain/Loss": 2.192601203918457, "Pretrain/Loss (Raw)": 2.0955333709716797, "Pretrain/Step": 857, "Pretrain/Step Time": 8.54223221167922} +{"Pretrain/Learning Rate": 4.952982617998143e-05, "Pretrain/Loss": 2.191586494445801, "Pretrain/Loss (Raw)": 2.1002888679504395, "Pretrain/Step": 858, "Pretrain/Step Time": 8.53844909928739} +{"Pretrain/Learning Rate": 4.952818597364043e-05, "Pretrain/Loss": 2.1904172897338867, "Pretrain/Loss (Raw)": 2.1088297367095947, "Pretrain/Step": 859, "Pretrain/Step Time": 8.541098296642303} +{"Pretrain/Learning Rate": 4.952654293859344e-05, "Pretrain/Loss": 2.1897547245025635, "Pretrain/Loss (Raw)": 2.1442253589630127, "Pretrain/Step": 860, "Pretrain/Step Time": 8.535000752657652} +{"Pretrain/Learning Rate": 4.952489707502993e-05, "Pretrain/Loss": 2.1903674602508545, "Pretrain/Loss (Raw)": 2.0827722549438477, "Pretrain/Step": 861, "Pretrain/Step Time": 8.538159357383847} +{"Pretrain/Learning Rate": 4.952324838313974e-05, "Pretrain/Loss": 2.190845012664795, "Pretrain/Loss (Raw)": 2.148585319519043, "Pretrain/Step": 862, "Pretrain/Step Time": 8.539803177118301} +{"Pretrain/Learning Rate": 4.9521596863112986e-05, "Pretrain/Loss": 2.190159320831299, "Pretrain/Loss (Raw)": 2.084611177444458, "Pretrain/Step": 863, "Pretrain/Step Time": 8.535382077097893} +{"Pretrain/Learning Rate": 4.951994251514013e-05, "Pretrain/Loss": 2.189937114715576, "Pretrain/Loss (Raw)": 2.0703978538513184, "Pretrain/Step": 864, "Pretrain/Step Time": 8.53891335427761} +{"Pretrain/Learning Rate": 4.9518285339411966e-05, "Pretrain/Loss": 2.1896681785583496, "Pretrain/Loss (Raw)": 2.240619659423828, "Pretrain/Step": 865, "Pretrain/Step Time": 8.535281537100673} +{"Pretrain/Learning Rate": 4.9516625336119595e-05, "Pretrain/Loss": 2.189182758331299, "Pretrain/Loss (Raw)": 2.1940042972564697, "Pretrain/Step": 866, "Pretrain/Step Time": 8.540589543059468} +{"Pretrain/Learning Rate": 4.951496250545446e-05, "Pretrain/Loss": 2.1894798278808594, "Pretrain/Loss (Raw)": 2.1412386894226074, "Pretrain/Step": 867, "Pretrain/Step Time": 8.537645071744919} +{"Pretrain/Learning Rate": 4.951329684760835e-05, "Pretrain/Loss": 2.188309669494629, "Pretrain/Loss (Raw)": 2.0674121379852295, "Pretrain/Step": 868, "Pretrain/Step Time": 8.549421096220613} +{"Pretrain/Learning Rate": 4.951162836277332e-05, "Pretrain/Loss": 2.1877782344818115, "Pretrain/Loss (Raw)": 2.050899028778076, "Pretrain/Step": 869, "Pretrain/Step Time": 8.541020918637514} +{"Pretrain/Learning Rate": 4.950995705114182e-05, "Pretrain/Loss": 2.188505172729492, "Pretrain/Loss (Raw)": 2.2082035541534424, "Pretrain/Step": 870, "Pretrain/Step Time": 8.547258792445064} +{"Pretrain/Learning Rate": 4.950828291290656e-05, "Pretrain/Loss": 2.1881279945373535, "Pretrain/Loss (Raw)": 2.2516562938690186, "Pretrain/Step": 871, "Pretrain/Step Time": 8.54924950003624} +{"Pretrain/Learning Rate": 4.950660594826064e-05, "Pretrain/Loss": 2.1889028549194336, "Pretrain/Loss (Raw)": 2.3029117584228516, "Pretrain/Step": 872, "Pretrain/Step Time": 8.55142462067306} +{"Pretrain/Learning Rate": 4.9504926157397436e-05, "Pretrain/Loss": 2.1901350021362305, "Pretrain/Loss (Raw)": 2.3317372798919678, "Pretrain/Step": 873, "Pretrain/Step Time": 8.549744268879294} +{"Pretrain/Learning Rate": 4.950324354051068e-05, "Pretrain/Loss": 2.192375659942627, "Pretrain/Loss (Raw)": 2.5470800399780273, "Pretrain/Step": 874, "Pretrain/Step Time": 8.547828139737248} +{"Pretrain/Learning Rate": 4.950155809779442e-05, "Pretrain/Loss": 2.1906180381774902, "Pretrain/Loss (Raw)": 2.14628529548645, "Pretrain/Step": 875, "Pretrain/Step Time": 8.556862452998757} +{"Pretrain/Learning Rate": 4.9499869829443026e-05, "Pretrain/Loss": 2.1900360584259033, "Pretrain/Loss (Raw)": 2.2967920303344727, "Pretrain/Step": 876, "Pretrain/Step Time": 8.552056711167097} +{"Pretrain/Learning Rate": 4.9498178735651184e-05, "Pretrain/Loss": 2.1890225410461426, "Pretrain/Loss (Raw)": 1.9356207847595215, "Pretrain/Step": 877, "Pretrain/Step Time": 8.553398912772536} +{"Pretrain/Learning Rate": 4.949648481661394e-05, "Pretrain/Loss": 2.1872239112854004, "Pretrain/Loss (Raw)": 2.0087027549743652, "Pretrain/Step": 878, "Pretrain/Step Time": 8.551720667630434} +{"Pretrain/Learning Rate": 4.949478807252663e-05, "Pretrain/Loss": 2.1876626014709473, "Pretrain/Loss (Raw)": 2.057866096496582, "Pretrain/Step": 879, "Pretrain/Step Time": 8.547963486984372} +{"Pretrain/Learning Rate": 4.949308850358494e-05, "Pretrain/Loss": 2.1886801719665527, "Pretrain/Loss (Raw)": 2.268608331680298, "Pretrain/Step": 880, "Pretrain/Step Time": 8.556201566010714} +{"Pretrain/Learning Rate": 4.949138610998487e-05, "Pretrain/Loss": 2.1890883445739746, "Pretrain/Loss (Raw)": 2.1627187728881836, "Pretrain/Step": 881, "Pretrain/Step Time": 8.551106749102473} +{"Pretrain/Learning Rate": 4.9489680891922746e-05, "Pretrain/Loss": 2.188817024230957, "Pretrain/Loss (Raw)": 2.205435276031494, "Pretrain/Step": 882, "Pretrain/Step Time": 8.555800130590796} +{"Pretrain/Learning Rate": 4.948797284959522e-05, "Pretrain/Loss": 2.1910300254821777, "Pretrain/Loss (Raw)": 2.3778462409973145, "Pretrain/Step": 883, "Pretrain/Step Time": 8.553209982812405} +{"Pretrain/Learning Rate": 4.948626198319928e-05, "Pretrain/Loss": 2.1912193298339844, "Pretrain/Loss (Raw)": 2.1640491485595703, "Pretrain/Step": 884, "Pretrain/Step Time": 8.555146336555481} +{"Pretrain/Learning Rate": 4.948454829293222e-05, "Pretrain/Loss": 2.1907572746276855, "Pretrain/Loss (Raw)": 2.364302635192871, "Pretrain/Step": 885, "Pretrain/Step Time": 8.553848864510655} +{"Pretrain/Learning Rate": 4.9482831778991676e-05, "Pretrain/Loss": 2.1894137859344482, "Pretrain/Loss (Raw)": 1.9035738706588745, "Pretrain/Step": 886, "Pretrain/Step Time": 8.558785321190953} +{"Pretrain/Learning Rate": 4.9481112441575605e-05, "Pretrain/Loss": 2.188805103302002, "Pretrain/Loss (Raw)": 2.0957729816436768, "Pretrain/Step": 887, "Pretrain/Step Time": 8.550519470125437} +{"Pretrain/Learning Rate": 4.947939028088229e-05, "Pretrain/Loss": 2.19026780128479, "Pretrain/Loss (Raw)": 2.178330659866333, "Pretrain/Step": 888, "Pretrain/Step Time": 8.557995410636067} +{"Pretrain/Learning Rate": 4.947766529711033e-05, "Pretrain/Loss": 2.1898484230041504, "Pretrain/Loss (Raw)": 2.198998212814331, "Pretrain/Step": 889, "Pretrain/Step Time": 8.549572175368667} +{"Pretrain/Learning Rate": 4.947593749045867e-05, "Pretrain/Loss": 2.186856746673584, "Pretrain/Loss (Raw)": 1.888825535774231, "Pretrain/Step": 890, "Pretrain/Step Time": 8.547656815499067} +{"Pretrain/Learning Rate": 4.947420686112657e-05, "Pretrain/Loss": 2.186051368713379, "Pretrain/Loss (Raw)": 1.966840147972107, "Pretrain/Step": 891, "Pretrain/Step Time": 8.548288594931364} +{"Pretrain/Learning Rate": 4.9472473409313605e-05, "Pretrain/Loss": 2.1828064918518066, "Pretrain/Loss (Raw)": 2.029127359390259, "Pretrain/Step": 892, "Pretrain/Step Time": 8.54836267605424} +{"Pretrain/Learning Rate": 4.947073713521968e-05, "Pretrain/Loss": 2.1827807426452637, "Pretrain/Loss (Raw)": 2.1249423027038574, "Pretrain/Step": 893, "Pretrain/Step Time": 8.541785400360823} +{"Pretrain/Learning Rate": 4.9468998039045046e-05, "Pretrain/Loss": 2.1809959411621094, "Pretrain/Loss (Raw)": 2.15929913520813, "Pretrain/Step": 894, "Pretrain/Step Time": 8.551460659131408} +{"Pretrain/Learning Rate": 4.946725612099026e-05, "Pretrain/Loss": 2.1816654205322266, "Pretrain/Loss (Raw)": 2.2940003871917725, "Pretrain/Step": 895, "Pretrain/Step Time": 8.550365462899208} +{"Pretrain/Learning Rate": 4.9465511381256204e-05, "Pretrain/Loss": 2.184781074523926, "Pretrain/Loss (Raw)": 2.388648271560669, "Pretrain/Step": 896, "Pretrain/Step Time": 8.555579157546163} +{"Pretrain/Learning Rate": 4.946376382004408e-05, "Pretrain/Loss": 2.185535430908203, "Pretrain/Loss (Raw)": 2.153273344039917, "Pretrain/Step": 897, "Pretrain/Step Time": 8.55360572040081} +{"Pretrain/Learning Rate": 4.9462013437555446e-05, "Pretrain/Loss": 2.1852898597717285, "Pretrain/Loss (Raw)": 2.1109800338745117, "Pretrain/Step": 898, "Pretrain/Step Time": 8.557120006531477} +{"Pretrain/Learning Rate": 4.946026023399215e-05, "Pretrain/Loss": 2.1834030151367188, "Pretrain/Loss (Raw)": 1.9446125030517578, "Pretrain/Step": 899, "Pretrain/Step Time": 8.549323946237564} +{"Pretrain/Learning Rate": 4.9458504209556377e-05, "Pretrain/Loss": 2.185628890991211, "Pretrain/Loss (Raw)": 2.1750667095184326, "Pretrain/Step": 900, "Pretrain/Step Time": 8.55291154421866} +{"Pretrain/Learning Rate": 4.945674536445065e-05, "Pretrain/Loss": 2.187343120574951, "Pretrain/Loss (Raw)": 2.3241939544677734, "Pretrain/Step": 901, "Pretrain/Step Time": 8.550692347809672} +{"Pretrain/Learning Rate": 4.945498369887781e-05, "Pretrain/Loss": 2.1856510639190674, "Pretrain/Loss (Raw)": 2.1485841274261475, "Pretrain/Step": 902, "Pretrain/Step Time": 8.549639951437712} +{"Pretrain/Learning Rate": 4.945321921304101e-05, "Pretrain/Loss": 2.1842455863952637, "Pretrain/Loss (Raw)": 2.034640312194824, "Pretrain/Step": 903, "Pretrain/Step Time": 8.554367324337363} +{"Pretrain/Learning Rate": 4.945145190714374e-05, "Pretrain/Loss": 2.1865763664245605, "Pretrain/Loss (Raw)": 2.340911388397217, "Pretrain/Step": 904, "Pretrain/Step Time": 8.562904199585319} +{"Pretrain/Learning Rate": 4.944968178138982e-05, "Pretrain/Loss": 2.1862144470214844, "Pretrain/Loss (Raw)": 2.1175107955932617, "Pretrain/Step": 905, "Pretrain/Step Time": 8.557984713464975} +{"Pretrain/Learning Rate": 4.944790883598339e-05, "Pretrain/Loss": 2.1893463134765625, "Pretrain/Loss (Raw)": 2.555161237716675, "Pretrain/Step": 906, "Pretrain/Step Time": 8.558167271316051} +{"Pretrain/Learning Rate": 4.9446133071128905e-05, "Pretrain/Loss": 2.1883111000061035, "Pretrain/Loss (Raw)": 2.1116104125976562, "Pretrain/Step": 907, "Pretrain/Step Time": 8.55393104068935} +{"Pretrain/Learning Rate": 4.944435448703116e-05, "Pretrain/Loss": 2.187833070755005, "Pretrain/Loss (Raw)": 2.1645655632019043, "Pretrain/Step": 908, "Pretrain/Step Time": 8.548908734694123} +{"Pretrain/Learning Rate": 4.944257308389528e-05, "Pretrain/Loss": 2.1870293617248535, "Pretrain/Loss (Raw)": 2.1061177253723145, "Pretrain/Step": 909, "Pretrain/Step Time": 8.549267198890448} +{"Pretrain/Learning Rate": 4.944078886192668e-05, "Pretrain/Loss": 2.186121702194214, "Pretrain/Loss (Raw)": 2.095656394958496, "Pretrain/Step": 910, "Pretrain/Step Time": 8.55924029648304} +{"Pretrain/Learning Rate": 4.943900182133116e-05, "Pretrain/Loss": 2.184929847717285, "Pretrain/Loss (Raw)": 1.993719220161438, "Pretrain/Step": 911, "Pretrain/Step Time": 8.553857803344727} +{"Pretrain/Learning Rate": 4.943721196231477e-05, "Pretrain/Loss": 2.184250831604004, "Pretrain/Loss (Raw)": 2.0835492610931396, "Pretrain/Step": 912, "Pretrain/Step Time": 8.550299683585763} +{"Pretrain/Learning Rate": 4.943541928508395e-05, "Pretrain/Loss": 2.184234619140625, "Pretrain/Loss (Raw)": 2.2778382301330566, "Pretrain/Step": 913, "Pretrain/Step Time": 8.550350533798337} +{"Pretrain/Learning Rate": 4.9433623789845426e-05, "Pretrain/Loss": 2.185223340988159, "Pretrain/Loss (Raw)": 2.302978277206421, "Pretrain/Step": 914, "Pretrain/Step Time": 8.549215035513043} +{"Pretrain/Learning Rate": 4.943182547680629e-05, "Pretrain/Loss": 2.1819868087768555, "Pretrain/Loss (Raw)": 2.1578140258789062, "Pretrain/Step": 915, "Pretrain/Step Time": 8.552282312884927} +{"Pretrain/Learning Rate": 4.94300243461739e-05, "Pretrain/Loss": 2.182166814804077, "Pretrain/Loss (Raw)": 2.2306036949157715, "Pretrain/Step": 916, "Pretrain/Step Time": 8.553956566378474} +{"Pretrain/Learning Rate": 4.9428220398155986e-05, "Pretrain/Loss": 2.1860125064849854, "Pretrain/Loss (Raw)": 2.4996395111083984, "Pretrain/Step": 917, "Pretrain/Step Time": 8.554539188742638} +{"Pretrain/Learning Rate": 4.94264136329606e-05, "Pretrain/Loss": 2.186908006668091, "Pretrain/Loss (Raw)": 2.3695878982543945, "Pretrain/Step": 918, "Pretrain/Step Time": 8.552592189982533} +{"Pretrain/Learning Rate": 4.942460405079608e-05, "Pretrain/Loss": 2.186408042907715, "Pretrain/Loss (Raw)": 2.132127285003662, "Pretrain/Step": 919, "Pretrain/Step Time": 8.550609432160854} +{"Pretrain/Learning Rate": 4.942279165187113e-05, "Pretrain/Loss": 2.185349941253662, "Pretrain/Loss (Raw)": 2.221158981323242, "Pretrain/Step": 920, "Pretrain/Step Time": 8.554318564012647} +{"Pretrain/Learning Rate": 4.9420976436394764e-05, "Pretrain/Loss": 2.184607982635498, "Pretrain/Loss (Raw)": 2.231790065765381, "Pretrain/Step": 921, "Pretrain/Step Time": 8.553306819871068} +{"Pretrain/Learning Rate": 4.941915840457632e-05, "Pretrain/Loss": 2.1832962036132812, "Pretrain/Loss (Raw)": 1.9638041257858276, "Pretrain/Step": 922, "Pretrain/Step Time": 8.55586052685976} +{"Pretrain/Learning Rate": 4.941733755662545e-05, "Pretrain/Loss": 2.1806130409240723, "Pretrain/Loss (Raw)": 2.0441088676452637, "Pretrain/Step": 923, "Pretrain/Step Time": 8.548354236409068} +{"Pretrain/Learning Rate": 4.941551389275217e-05, "Pretrain/Loss": 2.1814956665039062, "Pretrain/Loss (Raw)": 2.190967321395874, "Pretrain/Step": 924, "Pretrain/Step Time": 8.549621112644672} +{"Pretrain/Learning Rate": 4.9413687413166777e-05, "Pretrain/Loss": 2.1806468963623047, "Pretrain/Loss (Raw)": 2.3775241374969482, "Pretrain/Step": 925, "Pretrain/Step Time": 8.539276167750359} +{"Pretrain/Learning Rate": 4.94118581180799e-05, "Pretrain/Loss": 2.180960178375244, "Pretrain/Loss (Raw)": 2.112550735473633, "Pretrain/Step": 926, "Pretrain/Step Time": 8.543413994833827} +{"Pretrain/Learning Rate": 4.9410026007702525e-05, "Pretrain/Loss": 2.1816606521606445, "Pretrain/Loss (Raw)": 2.2268426418304443, "Pretrain/Step": 927, "Pretrain/Step Time": 8.542320620268583} +{"Pretrain/Learning Rate": 4.940819108224592e-05, "Pretrain/Loss": 2.181365966796875, "Pretrain/Loss (Raw)": 2.158264636993408, "Pretrain/Step": 928, "Pretrain/Step Time": 8.545003978535533} +{"Pretrain/Learning Rate": 4.940635334192171e-05, "Pretrain/Loss": 2.182239055633545, "Pretrain/Loss (Raw)": 2.238670587539673, "Pretrain/Step": 929, "Pretrain/Step Time": 8.543610155582428} +{"Pretrain/Learning Rate": 4.940451278694181e-05, "Pretrain/Loss": 2.183623790740967, "Pretrain/Loss (Raw)": 2.495379686355591, "Pretrain/Step": 930, "Pretrain/Step Time": 8.537071796134114} +{"Pretrain/Learning Rate": 4.9402669417518514e-05, "Pretrain/Loss": 2.1835665702819824, "Pretrain/Loss (Raw)": 2.2076382637023926, "Pretrain/Step": 931, "Pretrain/Step Time": 8.538154797628522} +{"Pretrain/Learning Rate": 4.940082323386439e-05, "Pretrain/Loss": 2.1862030029296875, "Pretrain/Loss (Raw)": 2.446882724761963, "Pretrain/Step": 932, "Pretrain/Step Time": 8.540082329884171} +{"Pretrain/Learning Rate": 4.939897423619234e-05, "Pretrain/Loss": 2.18422794342041, "Pretrain/Loss (Raw)": 2.0203821659088135, "Pretrain/Step": 933, "Pretrain/Step Time": 8.542006824165583} +{"Pretrain/Learning Rate": 4.9397122424715624e-05, "Pretrain/Loss": 2.1852128505706787, "Pretrain/Loss (Raw)": 2.3412368297576904, "Pretrain/Step": 934, "Pretrain/Step Time": 8.547169208526611} +{"Pretrain/Learning Rate": 4.939526779964778e-05, "Pretrain/Loss": 2.185832977294922, "Pretrain/Loss (Raw)": 2.1230101585388184, "Pretrain/Step": 935, "Pretrain/Step Time": 8.539753194898367} +{"Pretrain/Learning Rate": 4.9393410361202694e-05, "Pretrain/Loss": 2.185272216796875, "Pretrain/Loss (Raw)": 2.122284173965454, "Pretrain/Step": 936, "Pretrain/Step Time": 8.531580014154315} +{"Pretrain/Learning Rate": 4.9391550109594584e-05, "Pretrain/Loss": 2.187983989715576, "Pretrain/Loss (Raw)": 2.3811419010162354, "Pretrain/Step": 937, "Pretrain/Step Time": 8.53766737319529} +{"Pretrain/Learning Rate": 4.938968704503798e-05, "Pretrain/Loss": 2.1866044998168945, "Pretrain/Loss (Raw)": 2.0913007259368896, "Pretrain/Step": 938, "Pretrain/Step Time": 8.534819664433599} +{"Pretrain/Learning Rate": 4.938782116774774e-05, "Pretrain/Loss": 2.1853508949279785, "Pretrain/Loss (Raw)": 2.1663970947265625, "Pretrain/Step": 939, "Pretrain/Step Time": 8.535064017400146} +{"Pretrain/Learning Rate": 4.938595247793903e-05, "Pretrain/Loss": 2.1855642795562744, "Pretrain/Loss (Raw)": 2.0691685676574707, "Pretrain/Step": 940, "Pretrain/Step Time": 8.532326152548194} +{"Pretrain/Learning Rate": 4.938408097582738e-05, "Pretrain/Loss": 2.186976432800293, "Pretrain/Loss (Raw)": 2.2202417850494385, "Pretrain/Step": 941, "Pretrain/Step Time": 8.534617561846972} +{"Pretrain/Learning Rate": 4.9382206661628615e-05, "Pretrain/Loss": 2.1874096393585205, "Pretrain/Loss (Raw)": 2.075147867202759, "Pretrain/Step": 942, "Pretrain/Step Time": 8.531919453293085} +{"Pretrain/Learning Rate": 4.9380329535558887e-05, "Pretrain/Loss": 2.1886672973632812, "Pretrain/Loss (Raw)": 2.2493090629577637, "Pretrain/Step": 943, "Pretrain/Step Time": 8.534109111875296} +{"Pretrain/Learning Rate": 4.9378449597834664e-05, "Pretrain/Loss": 2.188197374343872, "Pretrain/Loss (Raw)": 2.122119903564453, "Pretrain/Step": 944, "Pretrain/Step Time": 8.532302170991898} +{"Pretrain/Learning Rate": 4.937656684867276e-05, "Pretrain/Loss": 2.1871604919433594, "Pretrain/Loss (Raw)": 2.1818535327911377, "Pretrain/Step": 945, "Pretrain/Step Time": 8.535253329202533} +{"Pretrain/Learning Rate": 4.93746812882903e-05, "Pretrain/Loss": 2.186602830886841, "Pretrain/Loss (Raw)": 2.098160982131958, "Pretrain/Step": 946, "Pretrain/Step Time": 8.53260607086122} +{"Pretrain/Learning Rate": 4.937279291690474e-05, "Pretrain/Loss": 2.183973550796509, "Pretrain/Loss (Raw)": 2.058380126953125, "Pretrain/Step": 947, "Pretrain/Step Time": 8.54481802508235} +{"Pretrain/Learning Rate": 4.9370901734733856e-05, "Pretrain/Loss": 2.183173179626465, "Pretrain/Loss (Raw)": 2.1247482299804688, "Pretrain/Step": 948, "Pretrain/Step Time": 8.535986095666885} +{"Pretrain/Learning Rate": 4.936900774199573e-05, "Pretrain/Loss": 2.1820335388183594, "Pretrain/Loss (Raw)": 2.0382163524627686, "Pretrain/Step": 949, "Pretrain/Step Time": 8.538822770118713} +{"Pretrain/Learning Rate": 4.936711093890881e-05, "Pretrain/Loss": 2.181445598602295, "Pretrain/Loss (Raw)": 2.1982734203338623, "Pretrain/Step": 950, "Pretrain/Step Time": 8.542117776349187} +{"Pretrain/Learning Rate": 4.936521132569184e-05, "Pretrain/Loss": 2.182182550430298, "Pretrain/Loss (Raw)": 2.4603917598724365, "Pretrain/Step": 951, "Pretrain/Step Time": 8.545986965298653} +{"Pretrain/Learning Rate": 4.936330890256388e-05, "Pretrain/Loss": 2.1801979541778564, "Pretrain/Loss (Raw)": 2.049349784851074, "Pretrain/Step": 952, "Pretrain/Step Time": 8.54698577709496} +{"Pretrain/Learning Rate": 4.9361403669744336e-05, "Pretrain/Loss": 2.178488254547119, "Pretrain/Loss (Raw)": 2.0764617919921875, "Pretrain/Step": 953, "Pretrain/Step Time": 8.553734203800559} +{"Pretrain/Learning Rate": 4.935949562745293e-05, "Pretrain/Loss": 2.1784348487854004, "Pretrain/Loss (Raw)": 2.1017866134643555, "Pretrain/Step": 954, "Pretrain/Step Time": 8.547751892358065} +{"Pretrain/Learning Rate": 4.93575847759097e-05, "Pretrain/Loss": 2.177964210510254, "Pretrain/Loss (Raw)": 2.1282155513763428, "Pretrain/Step": 955, "Pretrain/Step Time": 8.546179134398699} +{"Pretrain/Learning Rate": 4.9355671115335015e-05, "Pretrain/Loss": 2.1767609119415283, "Pretrain/Loss (Raw)": 2.1167287826538086, "Pretrain/Step": 956, "Pretrain/Step Time": 8.550175393000245} +{"Pretrain/Learning Rate": 4.935375464594957e-05, "Pretrain/Loss": 2.1766796112060547, "Pretrain/Loss (Raw)": 2.0976197719573975, "Pretrain/Step": 957, "Pretrain/Step Time": 8.547389570623636} +{"Pretrain/Learning Rate": 4.9351835367974375e-05, "Pretrain/Loss": 2.1798207759857178, "Pretrain/Loss (Raw)": 2.3416526317596436, "Pretrain/Step": 958, "Pretrain/Step Time": 8.54457014799118} +{"Pretrain/Learning Rate": 4.9349913281630786e-05, "Pretrain/Loss": 2.1794018745422363, "Pretrain/Loss (Raw)": 2.1590359210968018, "Pretrain/Step": 959, "Pretrain/Step Time": 8.55550872348249} +{"Pretrain/Learning Rate": 4.934798838714045e-05, "Pretrain/Loss": 2.17732572555542, "Pretrain/Loss (Raw)": 1.9439146518707275, "Pretrain/Step": 960, "Pretrain/Step Time": 8.545649230480194} +{"Pretrain/Learning Rate": 4.9346060684725364e-05, "Pretrain/Loss": 2.1754159927368164, "Pretrain/Loss (Raw)": 2.162891387939453, "Pretrain/Step": 961, "Pretrain/Step Time": 8.548767983913422} +{"Pretrain/Learning Rate": 4.934413017460784e-05, "Pretrain/Loss": 2.1746277809143066, "Pretrain/Loss (Raw)": 2.021136999130249, "Pretrain/Step": 962, "Pretrain/Step Time": 8.548720557242632} +{"Pretrain/Learning Rate": 4.93421968570105e-05, "Pretrain/Loss": 2.174020767211914, "Pretrain/Loss (Raw)": 2.251798391342163, "Pretrain/Step": 963, "Pretrain/Step Time": 8.549318622797728} +{"Pretrain/Learning Rate": 4.934026073215633e-05, "Pretrain/Loss": 2.175182342529297, "Pretrain/Loss (Raw)": 2.1866607666015625, "Pretrain/Step": 964, "Pretrain/Step Time": 8.551281973719597} +{"Pretrain/Learning Rate": 4.933832180026858e-05, "Pretrain/Loss": 2.1776957511901855, "Pretrain/Loss (Raw)": 2.2338218688964844, "Pretrain/Step": 965, "Pretrain/Step Time": 8.555418990552425} +{"Pretrain/Learning Rate": 4.933638006157089e-05, "Pretrain/Loss": 2.1747539043426514, "Pretrain/Loss (Raw)": 2.082298755645752, "Pretrain/Step": 966, "Pretrain/Step Time": 8.546635517850518} +{"Pretrain/Learning Rate": 4.933443551628717e-05, "Pretrain/Loss": 2.1769471168518066, "Pretrain/Loss (Raw)": 2.1847527027130127, "Pretrain/Step": 967, "Pretrain/Step Time": 8.551614921540022} +{"Pretrain/Learning Rate": 4.933248816464168e-05, "Pretrain/Loss": 2.176983594894409, "Pretrain/Loss (Raw)": 2.369218349456787, "Pretrain/Step": 968, "Pretrain/Step Time": 8.555147795006633} +{"Pretrain/Learning Rate": 4.933053800685899e-05, "Pretrain/Loss": 2.1761133670806885, "Pretrain/Loss (Raw)": 2.1534337997436523, "Pretrain/Step": 969, "Pretrain/Step Time": 8.554927786812186} +{"Pretrain/Learning Rate": 4.932858504316401e-05, "Pretrain/Loss": 2.1763651371002197, "Pretrain/Loss (Raw)": 2.3693480491638184, "Pretrain/Step": 970, "Pretrain/Step Time": 8.555811326950788} +{"Pretrain/Learning Rate": 4.932662927378196e-05, "Pretrain/Loss": 2.174984931945801, "Pretrain/Loss (Raw)": 1.999162197113037, "Pretrain/Step": 971, "Pretrain/Step Time": 8.559217737987638} +{"Pretrain/Learning Rate": 4.93246706989384e-05, "Pretrain/Loss": 2.175189256668091, "Pretrain/Loss (Raw)": 2.1833317279815674, "Pretrain/Step": 972, "Pretrain/Step Time": 8.548595143482089} +{"Pretrain/Learning Rate": 4.932270931885918e-05, "Pretrain/Loss": 2.1745197772979736, "Pretrain/Loss (Raw)": 2.163853168487549, "Pretrain/Step": 973, "Pretrain/Step Time": 8.552473731338978} +{"Pretrain/Learning Rate": 4.9320745133770524e-05, "Pretrain/Loss": 2.173409938812256, "Pretrain/Loss (Raw)": 2.073838233947754, "Pretrain/Step": 974, "Pretrain/Step Time": 8.555380133911967} +{"Pretrain/Learning Rate": 4.931877814389893e-05, "Pretrain/Loss": 2.173408269882202, "Pretrain/Loss (Raw)": 2.2735464572906494, "Pretrain/Step": 975, "Pretrain/Step Time": 8.553493980318308} +{"Pretrain/Learning Rate": 4.931680834947124e-05, "Pretrain/Loss": 2.1734962463378906, "Pretrain/Loss (Raw)": 2.165546417236328, "Pretrain/Step": 976, "Pretrain/Step Time": 8.544411703944206} +{"Pretrain/Learning Rate": 4.9314835750714635e-05, "Pretrain/Loss": 2.1727547645568848, "Pretrain/Loss (Raw)": 2.045389175415039, "Pretrain/Step": 977, "Pretrain/Step Time": 8.550998624414206} +{"Pretrain/Learning Rate": 4.9312860347856595e-05, "Pretrain/Loss": 2.173269033432007, "Pretrain/Loss (Raw)": 2.316608428955078, "Pretrain/Step": 978, "Pretrain/Step Time": 8.542410019785166} +{"Pretrain/Learning Rate": 4.931088214112494e-05, "Pretrain/Loss": 2.1721978187561035, "Pretrain/Loss (Raw)": 2.1376869678497314, "Pretrain/Step": 979, "Pretrain/Step Time": 8.547985767945647} +{"Pretrain/Learning Rate": 4.930890113074779e-05, "Pretrain/Loss": 2.171290874481201, "Pretrain/Loss (Raw)": 2.044506549835205, "Pretrain/Step": 980, "Pretrain/Step Time": 8.547412730753422} +{"Pretrain/Learning Rate": 4.930691731695362e-05, "Pretrain/Loss": 2.170358419418335, "Pretrain/Loss (Raw)": 2.0131123065948486, "Pretrain/Step": 981, "Pretrain/Step Time": 8.550355948507786} +{"Pretrain/Learning Rate": 4.9304930699971194e-05, "Pretrain/Loss": 2.1699466705322266, "Pretrain/Loss (Raw)": 2.1309924125671387, "Pretrain/Step": 982, "Pretrain/Step Time": 8.550000250339508} +{"Pretrain/Learning Rate": 4.9302941280029645e-05, "Pretrain/Loss": 2.172370433807373, "Pretrain/Loss (Raw)": 2.442213296890259, "Pretrain/Step": 983, "Pretrain/Step Time": 8.55257560685277} +{"Pretrain/Learning Rate": 4.930094905735838e-05, "Pretrain/Loss": 2.1736414432525635, "Pretrain/Loss (Raw)": 2.3304998874664307, "Pretrain/Step": 984, "Pretrain/Step Time": 8.543528493493795} +{"Pretrain/Learning Rate": 4.929895403218717e-05, "Pretrain/Loss": 2.172990322113037, "Pretrain/Loss (Raw)": 2.012179136276245, "Pretrain/Step": 985, "Pretrain/Step Time": 8.546622859314084} +{"Pretrain/Learning Rate": 4.929695620474607e-05, "Pretrain/Loss": 2.174128532409668, "Pretrain/Loss (Raw)": 2.246022939682007, "Pretrain/Step": 986, "Pretrain/Step Time": 8.545524811372161} +{"Pretrain/Learning Rate": 4.9294955575265494e-05, "Pretrain/Loss": 2.1742448806762695, "Pretrain/Loss (Raw)": 2.123715400695801, "Pretrain/Step": 987, "Pretrain/Step Time": 8.54109868220985} +{"Pretrain/Learning Rate": 4.929295214397616e-05, "Pretrain/Loss": 2.1786370277404785, "Pretrain/Loss (Raw)": 2.706397771835327, "Pretrain/Step": 988, "Pretrain/Step Time": 8.542137315496802} +{"Pretrain/Learning Rate": 4.929094591110911e-05, "Pretrain/Loss": 2.180304765701294, "Pretrain/Loss (Raw)": 2.2962422370910645, "Pretrain/Step": 989, "Pretrain/Step Time": 8.548787949606776} +{"Pretrain/Learning Rate": 4.928893687689572e-05, "Pretrain/Loss": 2.1825218200683594, "Pretrain/Loss (Raw)": 2.432396411895752, "Pretrain/Step": 990, "Pretrain/Step Time": 8.545377343893051} +{"Pretrain/Learning Rate": 4.928692504156767e-05, "Pretrain/Loss": 2.1830034255981445, "Pretrain/Loss (Raw)": 2.146244525909424, "Pretrain/Step": 991, "Pretrain/Step Time": 8.54503539018333} +{"Pretrain/Learning Rate": 4.928491040535699e-05, "Pretrain/Loss": 2.182344436645508, "Pretrain/Loss (Raw)": 1.9860353469848633, "Pretrain/Step": 992, "Pretrain/Step Time": 8.540383273735642} +{"Pretrain/Learning Rate": 4.9282892968495995e-05, "Pretrain/Loss": 2.1804449558258057, "Pretrain/Loss (Raw)": 1.9974981546401978, "Pretrain/Step": 993, "Pretrain/Step Time": 8.54701916128397} +{"Pretrain/Learning Rate": 4.928087273121737e-05, "Pretrain/Loss": 2.1802730560302734, "Pretrain/Loss (Raw)": 2.1720223426818848, "Pretrain/Step": 994, "Pretrain/Step Time": 8.54408859089017} +{"Pretrain/Learning Rate": 4.9278849693754076e-05, "Pretrain/Loss": 2.17966365814209, "Pretrain/Loss (Raw)": 2.063218355178833, "Pretrain/Step": 995, "Pretrain/Step Time": 8.552422422915697} +{"Pretrain/Learning Rate": 4.927682385633944e-05, "Pretrain/Loss": 2.1802639961242676, "Pretrain/Loss (Raw)": 2.144249200820923, "Pretrain/Step": 996, "Pretrain/Step Time": 8.546944392845035} +{"Pretrain/Learning Rate": 4.927479521920707e-05, "Pretrain/Loss": 2.182236671447754, "Pretrain/Loss (Raw)": 2.3034071922302246, "Pretrain/Step": 997, "Pretrain/Step Time": 8.54928183928132} +{"Pretrain/Learning Rate": 4.927276378259094e-05, "Pretrain/Loss": 2.1810808181762695, "Pretrain/Loss (Raw)": 2.0602610111236572, "Pretrain/Step": 998, "Pretrain/Step Time": 8.540395565330982} +{"Pretrain/Learning Rate": 4.9270729546725305e-05, "Pretrain/Loss": 2.179986000061035, "Pretrain/Loss (Raw)": 2.111482858657837, "Pretrain/Step": 999, "Pretrain/Step Time": 8.540817247703671} +{"Pretrain/Learning Rate": 4.9268692511844774e-05, "Pretrain/Loss": 2.178102731704712, "Pretrain/Loss (Raw)": 2.0618693828582764, "Pretrain/Step": 1000, "Pretrain/Step Time": 8.539761817082763} +{"Pretrain/Learning Rate": 4.926665267818426e-05, "Pretrain/Loss": 2.1770222187042236, "Pretrain/Loss (Raw)": 2.193430185317993, "Pretrain/Step": 1001, "Pretrain/Step Time": 8.54771013557911} +{"Pretrain/Learning Rate": 4.926461004597901e-05, "Pretrain/Loss": 2.1752586364746094, "Pretrain/Loss (Raw)": 2.321343183517456, "Pretrain/Step": 1002, "Pretrain/Step Time": 8.539357101544738} +{"Pretrain/Learning Rate": 4.92625646154646e-05, "Pretrain/Loss": 2.173933982849121, "Pretrain/Loss (Raw)": 1.9767242670059204, "Pretrain/Step": 1003, "Pretrain/Step Time": 8.534361777827144} +{"Pretrain/Learning Rate": 4.926051638687691e-05, "Pretrain/Loss": 2.172409772872925, "Pretrain/Loss (Raw)": 2.101684093475342, "Pretrain/Step": 1004, "Pretrain/Step Time": 8.535463584586978} +{"Pretrain/Learning Rate": 4.925846536045215e-05, "Pretrain/Loss": 2.1738479137420654, "Pretrain/Loss (Raw)": 2.119725227355957, "Pretrain/Step": 1005, "Pretrain/Step Time": 8.533821422606707} +{"Pretrain/Learning Rate": 4.925641153642684e-05, "Pretrain/Loss": 2.1749584674835205, "Pretrain/Loss (Raw)": 2.1508443355560303, "Pretrain/Step": 1006, "Pretrain/Step Time": 8.533415377140045} +{"Pretrain/Learning Rate": 4.925435491503787e-05, "Pretrain/Loss": 2.175288200378418, "Pretrain/Loss (Raw)": 2.1000771522521973, "Pretrain/Step": 1007, "Pretrain/Step Time": 8.543037317693233} +{"Pretrain/Learning Rate": 4.9252295496522395e-05, "Pretrain/Loss": 2.1732187271118164, "Pretrain/Loss (Raw)": 2.0036978721618652, "Pretrain/Step": 1008, "Pretrain/Step Time": 8.539464982226491} +{"Pretrain/Learning Rate": 4.925023328111792e-05, "Pretrain/Loss": 2.1714136600494385, "Pretrain/Loss (Raw)": 1.9316707849502563, "Pretrain/Step": 1009, "Pretrain/Step Time": 8.537714794278145} +{"Pretrain/Learning Rate": 4.924816826906227e-05, "Pretrain/Loss": 2.1703786849975586, "Pretrain/Loss (Raw)": 2.0729739665985107, "Pretrain/Step": 1010, "Pretrain/Step Time": 8.536523437127471} +{"Pretrain/Learning Rate": 4.92461004605936e-05, "Pretrain/Loss": 2.169252395629883, "Pretrain/Loss (Raw)": 2.2337048053741455, "Pretrain/Step": 1011, "Pretrain/Step Time": 8.537280529737473} +{"Pretrain/Learning Rate": 4.924402985595037e-05, "Pretrain/Loss": 2.168541431427002, "Pretrain/Loss (Raw)": 2.0730173587799072, "Pretrain/Step": 1012, "Pretrain/Step Time": 8.538066433742642} +{"Pretrain/Learning Rate": 4.924195645537138e-05, "Pretrain/Loss": 2.1661343574523926, "Pretrain/Loss (Raw)": 2.0562031269073486, "Pretrain/Step": 1013, "Pretrain/Step Time": 8.542782317847013} +{"Pretrain/Learning Rate": 4.923988025909574e-05, "Pretrain/Loss": 2.169780731201172, "Pretrain/Loss (Raw)": 2.370326519012451, "Pretrain/Step": 1014, "Pretrain/Step Time": 8.54141179844737} +{"Pretrain/Learning Rate": 4.923780126736288e-05, "Pretrain/Loss": 2.1701502799987793, "Pretrain/Loss (Raw)": 2.1430726051330566, "Pretrain/Step": 1015, "Pretrain/Step Time": 8.544556714594364} +{"Pretrain/Learning Rate": 4.923571948041257e-05, "Pretrain/Loss": 2.1688520908355713, "Pretrain/Loss (Raw)": 2.0121469497680664, "Pretrain/Step": 1016, "Pretrain/Step Time": 8.540232967585325} +{"Pretrain/Learning Rate": 4.923363489848489e-05, "Pretrain/Loss": 2.1680965423583984, "Pretrain/Loss (Raw)": 2.1023056507110596, "Pretrain/Step": 1017, "Pretrain/Step Time": 8.538240319117904} +{"Pretrain/Learning Rate": 4.923154752182023e-05, "Pretrain/Loss": 2.170440912246704, "Pretrain/Loss (Raw)": 2.188904285430908, "Pretrain/Step": 1018, "Pretrain/Step Time": 8.540174575522542} +{"Pretrain/Learning Rate": 4.922945735065934e-05, "Pretrain/Loss": 2.172027587890625, "Pretrain/Loss (Raw)": 2.1699283123016357, "Pretrain/Step": 1019, "Pretrain/Step Time": 8.540471624583006} +{"Pretrain/Learning Rate": 4.9227364385243246e-05, "Pretrain/Loss": 2.172882080078125, "Pretrain/Loss (Raw)": 2.1385037899017334, "Pretrain/Step": 1020, "Pretrain/Step Time": 8.533746829256415} +{"Pretrain/Learning Rate": 4.922526862581333e-05, "Pretrain/Loss": 2.172901153564453, "Pretrain/Loss (Raw)": 2.1273915767669678, "Pretrain/Step": 1021, "Pretrain/Step Time": 8.535602392628789} +{"Pretrain/Learning Rate": 4.922317007261129e-05, "Pretrain/Loss": 2.1748366355895996, "Pretrain/Loss (Raw)": 2.4069998264312744, "Pretrain/Step": 1022, "Pretrain/Step Time": 8.533903738483787} +{"Pretrain/Learning Rate": 4.922106872587913e-05, "Pretrain/Loss": 2.1744861602783203, "Pretrain/Loss (Raw)": 2.2491421699523926, "Pretrain/Step": 1023, "Pretrain/Step Time": 8.533000318333507} +{"Pretrain/Learning Rate": 4.921896458585919e-05, "Pretrain/Loss": 2.171165943145752, "Pretrain/Loss (Raw)": 1.9636712074279785, "Pretrain/Step": 1024, "Pretrain/Step Time": 8.528793774545193} +{"Pretrain/Learning Rate": 4.9216857652794125e-05, "Pretrain/Loss": 2.170165777206421, "Pretrain/Loss (Raw)": 2.025243043899536, "Pretrain/Step": 1025, "Pretrain/Step Time": 8.537626933306456} +{"Pretrain/Learning Rate": 4.921474792692692e-05, "Pretrain/Loss": 2.1704370975494385, "Pretrain/Loss (Raw)": 2.1457486152648926, "Pretrain/Step": 1026, "Pretrain/Step Time": 8.529001938179135} +{"Pretrain/Learning Rate": 4.921263540850089e-05, "Pretrain/Loss": 2.1716623306274414, "Pretrain/Loss (Raw)": 2.1014552116394043, "Pretrain/Step": 1027, "Pretrain/Step Time": 8.533981654793024} +{"Pretrain/Learning Rate": 4.921052009775965e-05, "Pretrain/Loss": 2.173259973526001, "Pretrain/Loss (Raw)": 2.379520893096924, "Pretrain/Step": 1028, "Pretrain/Step Time": 8.530666019767523} +{"Pretrain/Learning Rate": 4.9208401994947144e-05, "Pretrain/Loss": 2.1716623306274414, "Pretrain/Loss (Raw)": 2.1197006702423096, "Pretrain/Step": 1029, "Pretrain/Step Time": 8.536069177091122} +{"Pretrain/Learning Rate": 4.920628110030765e-05, "Pretrain/Loss": 2.1710095405578613, "Pretrain/Loss (Raw)": 2.065025568008423, "Pretrain/Step": 1030, "Pretrain/Step Time": 8.536725966259837} +{"Pretrain/Learning Rate": 4.920415741408575e-05, "Pretrain/Loss": 2.173139810562134, "Pretrain/Loss (Raw)": 2.3073222637176514, "Pretrain/Step": 1031, "Pretrain/Step Time": 8.539766697213054} +{"Pretrain/Learning Rate": 4.920203093652637e-05, "Pretrain/Loss": 2.171464204788208, "Pretrain/Loss (Raw)": 2.126426935195923, "Pretrain/Step": 1032, "Pretrain/Step Time": 8.533072870224714} +{"Pretrain/Learning Rate": 4.919990166787474e-05, "Pretrain/Loss": 2.1723403930664062, "Pretrain/Loss (Raw)": 2.2296597957611084, "Pretrain/Step": 1033, "Pretrain/Step Time": 8.537120517343283} +{"Pretrain/Learning Rate": 4.919776960837641e-05, "Pretrain/Loss": 2.169769287109375, "Pretrain/Loss (Raw)": 2.2260568141937256, "Pretrain/Step": 1034, "Pretrain/Step Time": 8.535177506506443} +{"Pretrain/Learning Rate": 4.9195634758277264e-05, "Pretrain/Loss": 2.169396162033081, "Pretrain/Loss (Raw)": 2.063850164413452, "Pretrain/Step": 1035, "Pretrain/Step Time": 8.535297999158502} +{"Pretrain/Learning Rate": 4.919349711782351e-05, "Pretrain/Loss": 2.1689133644104004, "Pretrain/Loss (Raw)": 2.1027488708496094, "Pretrain/Step": 1036, "Pretrain/Step Time": 8.538302643224597} +{"Pretrain/Learning Rate": 4.919135668726167e-05, "Pretrain/Loss": 2.169032335281372, "Pretrain/Loss (Raw)": 2.1213653087615967, "Pretrain/Step": 1037, "Pretrain/Step Time": 8.543805997818708} +{"Pretrain/Learning Rate": 4.9189213466838565e-05, "Pretrain/Loss": 2.168309450149536, "Pretrain/Loss (Raw)": 2.0031254291534424, "Pretrain/Step": 1038, "Pretrain/Step Time": 8.53402735479176} +{"Pretrain/Learning Rate": 4.91870674568014e-05, "Pretrain/Loss": 2.1705331802368164, "Pretrain/Loss (Raw)": 2.2783422470092773, "Pretrain/Step": 1039, "Pretrain/Step Time": 8.539516992866993} +{"Pretrain/Learning Rate": 4.9184918657397625e-05, "Pretrain/Loss": 2.1708502769470215, "Pretrain/Loss (Raw)": 2.124164581298828, "Pretrain/Step": 1040, "Pretrain/Step Time": 8.542735382914543} +{"Pretrain/Learning Rate": 4.918276706887508e-05, "Pretrain/Loss": 2.1692488193511963, "Pretrain/Loss (Raw)": 2.0728421211242676, "Pretrain/Step": 1041, "Pretrain/Step Time": 8.543370192870498} +{"Pretrain/Learning Rate": 4.918061269148187e-05, "Pretrain/Loss": 2.1695685386657715, "Pretrain/Loss (Raw)": 2.3438992500305176, "Pretrain/Step": 1042, "Pretrain/Step Time": 8.548201594501734} +{"Pretrain/Learning Rate": 4.9178455525466484e-05, "Pretrain/Loss": 2.1701409816741943, "Pretrain/Loss (Raw)": 2.231095790863037, "Pretrain/Step": 1043, "Pretrain/Step Time": 8.548681776970625} +{"Pretrain/Learning Rate": 4.9176295571077655e-05, "Pretrain/Loss": 2.171046257019043, "Pretrain/Loss (Raw)": 2.3464925289154053, "Pretrain/Step": 1044, "Pretrain/Step Time": 8.544867157936096} +{"Pretrain/Learning Rate": 4.917413282856451e-05, "Pretrain/Loss": 2.169656276702881, "Pretrain/Loss (Raw)": 2.3217313289642334, "Pretrain/Step": 1045, "Pretrain/Step Time": 8.547232549637556} +{"Pretrain/Learning Rate": 4.917196729817645e-05, "Pretrain/Loss": 2.167510986328125, "Pretrain/Loss (Raw)": 2.094940662384033, "Pretrain/Step": 1046, "Pretrain/Step Time": 8.547840652987361} +{"Pretrain/Learning Rate": 4.9169798980163215e-05, "Pretrain/Loss": 2.165679454803467, "Pretrain/Loss (Raw)": 1.8977022171020508, "Pretrain/Step": 1047, "Pretrain/Step Time": 8.547120975330472} +{"Pretrain/Learning Rate": 4.916762787477487e-05, "Pretrain/Loss": 2.16387677192688, "Pretrain/Loss (Raw)": 1.9904370307922363, "Pretrain/Step": 1048, "Pretrain/Step Time": 8.543705388903618} +{"Pretrain/Learning Rate": 4.91654539822618e-05, "Pretrain/Loss": 2.161731719970703, "Pretrain/Loss (Raw)": 1.9572094678878784, "Pretrain/Step": 1049, "Pretrain/Step Time": 8.551967101171613} +{"Pretrain/Learning Rate": 4.916327730287471e-05, "Pretrain/Loss": 2.1618523597717285, "Pretrain/Loss (Raw)": 1.9792455434799194, "Pretrain/Step": 1050, "Pretrain/Step Time": 8.545543611049652} +{"Pretrain/Learning Rate": 4.916109783686461e-05, "Pretrain/Loss": 2.1610491275787354, "Pretrain/Loss (Raw)": 1.941298007965088, "Pretrain/Step": 1051, "Pretrain/Step Time": 8.54747087135911} +{"Pretrain/Learning Rate": 4.915891558448287e-05, "Pretrain/Loss": 2.16094970703125, "Pretrain/Loss (Raw)": 2.1782591342926025, "Pretrain/Step": 1052, "Pretrain/Step Time": 8.542457977309823} +{"Pretrain/Learning Rate": 4.915673054598113e-05, "Pretrain/Loss": 2.1596851348876953, "Pretrain/Loss (Raw)": 2.215655565261841, "Pretrain/Step": 1053, "Pretrain/Step Time": 8.545869624242187} +{"Pretrain/Learning Rate": 4.91545427216114e-05, "Pretrain/Loss": 2.160857677459717, "Pretrain/Loss (Raw)": 2.26263165473938, "Pretrain/Step": 1054, "Pretrain/Step Time": 8.548240644857287} +{"Pretrain/Learning Rate": 4.915235211162599e-05, "Pretrain/Loss": 2.1615374088287354, "Pretrain/Loss (Raw)": 2.3138439655303955, "Pretrain/Step": 1055, "Pretrain/Step Time": 8.552303133532405} +{"Pretrain/Learning Rate": 4.9150158716277516e-05, "Pretrain/Loss": 2.160297393798828, "Pretrain/Loss (Raw)": 1.9995388984680176, "Pretrain/Step": 1056, "Pretrain/Step Time": 8.543153902515769} +{"Pretrain/Learning Rate": 4.9147962535818935e-05, "Pretrain/Loss": 2.1603918075561523, "Pretrain/Loss (Raw)": 2.250760793685913, "Pretrain/Step": 1057, "Pretrain/Step Time": 8.546136312186718} +{"Pretrain/Learning Rate": 4.9145763570503536e-05, "Pretrain/Loss": 2.1572012901306152, "Pretrain/Loss (Raw)": 2.086988925933838, "Pretrain/Step": 1058, "Pretrain/Step Time": 8.545724334195256} +{"Pretrain/Learning Rate": 4.914356182058491e-05, "Pretrain/Loss": 2.1568307876586914, "Pretrain/Loss (Raw)": 2.1601977348327637, "Pretrain/Step": 1059, "Pretrain/Step Time": 8.547010991722345} +{"Pretrain/Learning Rate": 4.914135728631695e-05, "Pretrain/Loss": 2.154845714569092, "Pretrain/Loss (Raw)": 2.1928367614746094, "Pretrain/Step": 1060, "Pretrain/Step Time": 8.544131023809314} +{"Pretrain/Learning Rate": 4.913914996795391e-05, "Pretrain/Loss": 2.155128240585327, "Pretrain/Loss (Raw)": 2.0565237998962402, "Pretrain/Step": 1061, "Pretrain/Step Time": 8.550700446590781} +{"Pretrain/Learning Rate": 4.9136939865750357e-05, "Pretrain/Loss": 2.157397985458374, "Pretrain/Loss (Raw)": 2.631747245788574, "Pretrain/Step": 1062, "Pretrain/Step Time": 8.543907897546887} +{"Pretrain/Learning Rate": 4.913472697996116e-05, "Pretrain/Loss": 2.1577439308166504, "Pretrain/Loss (Raw)": 2.167278289794922, "Pretrain/Step": 1063, "Pretrain/Step Time": 8.546631649136543} +{"Pretrain/Learning Rate": 4.913251131084152e-05, "Pretrain/Loss": 2.1592280864715576, "Pretrain/Loss (Raw)": 2.3122940063476562, "Pretrain/Step": 1064, "Pretrain/Step Time": 8.5475417021662} +{"Pretrain/Learning Rate": 4.9130292858646966e-05, "Pretrain/Loss": 2.157221794128418, "Pretrain/Loss (Raw)": 2.1243526935577393, "Pretrain/Step": 1065, "Pretrain/Step Time": 8.543653910979629} +{"Pretrain/Learning Rate": 4.912807162363332e-05, "Pretrain/Loss": 2.1568379402160645, "Pretrain/Loss (Raw)": 2.0421347618103027, "Pretrain/Step": 1066, "Pretrain/Step Time": 8.54596734046936} +{"Pretrain/Learning Rate": 4.912584760605677e-05, "Pretrain/Loss": 2.1571316719055176, "Pretrain/Loss (Raw)": 2.2039763927459717, "Pretrain/Step": 1067, "Pretrain/Step Time": 8.545763233676553} +{"Pretrain/Learning Rate": 4.9123620806173785e-05, "Pretrain/Loss": 2.1580495834350586, "Pretrain/Loss (Raw)": 2.186713457107544, "Pretrain/Step": 1068, "Pretrain/Step Time": 8.555166658014059} +{"Pretrain/Learning Rate": 4.9121391224241174e-05, "Pretrain/Loss": 2.157184600830078, "Pretrain/Loss (Raw)": 2.1095058917999268, "Pretrain/Step": 1069, "Pretrain/Step Time": 8.549911241978407} +{"Pretrain/Learning Rate": 4.9119158860516066e-05, "Pretrain/Loss": 2.156175136566162, "Pretrain/Loss (Raw)": 1.945932149887085, "Pretrain/Step": 1070, "Pretrain/Step Time": 8.55292198434472} +{"Pretrain/Learning Rate": 4.9116923715255905e-05, "Pretrain/Loss": 2.154758930206299, "Pretrain/Loss (Raw)": 2.068007230758667, "Pretrain/Step": 1071, "Pretrain/Step Time": 8.549965843558311} +{"Pretrain/Learning Rate": 4.9114685788718454e-05, "Pretrain/Loss": 2.1552023887634277, "Pretrain/Loss (Raw)": 2.1789190769195557, "Pretrain/Step": 1072, "Pretrain/Step Time": 8.55160117894411} +{"Pretrain/Learning Rate": 4.9112445081161813e-05, "Pretrain/Loss": 2.1536474227905273, "Pretrain/Loss (Raw)": 1.9828020334243774, "Pretrain/Step": 1073, "Pretrain/Step Time": 8.554653346538544} +{"Pretrain/Learning Rate": 4.9110201592844376e-05, "Pretrain/Loss": 2.1522414684295654, "Pretrain/Loss (Raw)": 1.9181838035583496, "Pretrain/Step": 1074, "Pretrain/Step Time": 8.561695965006948} +{"Pretrain/Learning Rate": 4.910795532402489e-05, "Pretrain/Loss": 2.1526708602905273, "Pretrain/Loss (Raw)": 2.113358736038208, "Pretrain/Step": 1075, "Pretrain/Step Time": 8.549598686397076} +{"Pretrain/Learning Rate": 4.910570627496239e-05, "Pretrain/Loss": 2.152520179748535, "Pretrain/Loss (Raw)": 2.105471134185791, "Pretrain/Step": 1076, "Pretrain/Step Time": 8.555066917091608} +{"Pretrain/Learning Rate": 4.9103454445916256e-05, "Pretrain/Loss": 2.154582977294922, "Pretrain/Loss (Raw)": 2.3022260665893555, "Pretrain/Step": 1077, "Pretrain/Step Time": 8.553057663142681} +{"Pretrain/Learning Rate": 4.910119983714616e-05, "Pretrain/Loss": 2.154677629470825, "Pretrain/Loss (Raw)": 2.210402011871338, "Pretrain/Step": 1078, "Pretrain/Step Time": 8.551864724606276} +{"Pretrain/Learning Rate": 4.909894244891214e-05, "Pretrain/Loss": 2.153684139251709, "Pretrain/Loss (Raw)": 2.3332064151763916, "Pretrain/Step": 1079, "Pretrain/Step Time": 8.551536072045565} +{"Pretrain/Learning Rate": 4.909668228147453e-05, "Pretrain/Loss": 2.1548197269439697, "Pretrain/Loss (Raw)": 2.1947340965270996, "Pretrain/Step": 1080, "Pretrain/Step Time": 8.548219477757812} +{"Pretrain/Learning Rate": 4.9094419335093966e-05, "Pretrain/Loss": 2.1527814865112305, "Pretrain/Loss (Raw)": 1.8155663013458252, "Pretrain/Step": 1081, "Pretrain/Step Time": 8.548046784475446} +{"Pretrain/Learning Rate": 4.909215361003142e-05, "Pretrain/Loss": 2.1535301208496094, "Pretrain/Loss (Raw)": 2.1975901126861572, "Pretrain/Step": 1082, "Pretrain/Step Time": 8.549281138926744} +{"Pretrain/Learning Rate": 4.90898851065482e-05, "Pretrain/Loss": 2.153748035430908, "Pretrain/Loss (Raw)": 2.1560909748077393, "Pretrain/Step": 1083, "Pretrain/Step Time": 8.54536747559905} +{"Pretrain/Learning Rate": 4.908761382490591e-05, "Pretrain/Loss": 2.1537957191467285, "Pretrain/Loss (Raw)": 2.122866630554199, "Pretrain/Step": 1084, "Pretrain/Step Time": 8.541487885639071} +{"Pretrain/Learning Rate": 4.908533976536649e-05, "Pretrain/Loss": 2.153846263885498, "Pretrain/Loss (Raw)": 2.1040823459625244, "Pretrain/Step": 1085, "Pretrain/Step Time": 8.54147456586361} +{"Pretrain/Learning Rate": 4.90830629281922e-05, "Pretrain/Loss": 2.151123285293579, "Pretrain/Loss (Raw)": 1.9931174516677856, "Pretrain/Step": 1086, "Pretrain/Step Time": 8.558949055150151} +{"Pretrain/Learning Rate": 4.908078331364561e-05, "Pretrain/Loss": 2.151559352874756, "Pretrain/Loss (Raw)": 2.2148213386535645, "Pretrain/Step": 1087, "Pretrain/Step Time": 8.556375933811069} +{"Pretrain/Learning Rate": 4.907850092198961e-05, "Pretrain/Loss": 2.1536405086517334, "Pretrain/Loss (Raw)": 2.210343837738037, "Pretrain/Step": 1088, "Pretrain/Step Time": 8.55878034234047} +{"Pretrain/Learning Rate": 4.9076215753487425e-05, "Pretrain/Loss": 2.154829740524292, "Pretrain/Loss (Raw)": 2.315110683441162, "Pretrain/Step": 1089, "Pretrain/Step Time": 8.558442026376724} +{"Pretrain/Learning Rate": 4.9073927808402585e-05, "Pretrain/Loss": 2.1561014652252197, "Pretrain/Loss (Raw)": 2.1838979721069336, "Pretrain/Step": 1090, "Pretrain/Step Time": 8.559855926781893} +{"Pretrain/Learning Rate": 4.907163708699896e-05, "Pretrain/Loss": 2.1553714275360107, "Pretrain/Loss (Raw)": 2.158358097076416, "Pretrain/Step": 1091, "Pretrain/Step Time": 8.563175363466144} +{"Pretrain/Learning Rate": 4.9069343589540704e-05, "Pretrain/Loss": 2.1546154022216797, "Pretrain/Loss (Raw)": 2.0898852348327637, "Pretrain/Step": 1092, "Pretrain/Step Time": 8.560339469462633} +{"Pretrain/Learning Rate": 4.906704731629233e-05, "Pretrain/Loss": 2.1534528732299805, "Pretrain/Loss (Raw)": 2.085026979446411, "Pretrain/Step": 1093, "Pretrain/Step Time": 8.552674299106002} +{"Pretrain/Learning Rate": 4.9064748267518656e-05, "Pretrain/Loss": 2.155855178833008, "Pretrain/Loss (Raw)": 2.389793872833252, "Pretrain/Step": 1094, "Pretrain/Step Time": 8.553222542628646} +{"Pretrain/Learning Rate": 4.9062446443484813e-05, "Pretrain/Loss": 2.1556763648986816, "Pretrain/Loss (Raw)": 2.1618785858154297, "Pretrain/Step": 1095, "Pretrain/Step Time": 8.546473402529955} +{"Pretrain/Learning Rate": 4.9060141844456267e-05, "Pretrain/Loss": 2.154170274734497, "Pretrain/Loss (Raw)": 2.176426887512207, "Pretrain/Step": 1096, "Pretrain/Step Time": 8.545466037467122} +{"Pretrain/Learning Rate": 4.905783447069878e-05, "Pretrain/Loss": 2.15394926071167, "Pretrain/Loss (Raw)": 2.1251637935638428, "Pretrain/Step": 1097, "Pretrain/Step Time": 8.551643276587129} +{"Pretrain/Learning Rate": 4.905552432247846e-05, "Pretrain/Loss": 2.1516964435577393, "Pretrain/Loss (Raw)": 2.080954074859619, "Pretrain/Step": 1098, "Pretrain/Step Time": 8.547407848760486} +{"Pretrain/Learning Rate": 4.905321140006172e-05, "Pretrain/Loss": 2.1530323028564453, "Pretrain/Loss (Raw)": 2.170161247253418, "Pretrain/Step": 1099, "Pretrain/Step Time": 8.548520289361477} +{"Pretrain/Learning Rate": 4.90508957037153e-05, "Pretrain/Loss": 2.153262138366699, "Pretrain/Loss (Raw)": 2.2127692699432373, "Pretrain/Step": 1100, "Pretrain/Step Time": 8.551106298342347} +{"Pretrain/Learning Rate": 4.9048577233706264e-05, "Pretrain/Loss": 2.152031421661377, "Pretrain/Loss (Raw)": 2.0063188076019287, "Pretrain/Step": 1101, "Pretrain/Step Time": 8.543619150295854} +{"Pretrain/Learning Rate": 4.9046255990301965e-05, "Pretrain/Loss": 2.157637596130371, "Pretrain/Loss (Raw)": 2.7914373874664307, "Pretrain/Step": 1102, "Pretrain/Step Time": 8.54207006469369} +{"Pretrain/Learning Rate": 4.904393197377012e-05, "Pretrain/Loss": 2.1552181243896484, "Pretrain/Loss (Raw)": 1.9638293981552124, "Pretrain/Step": 1103, "Pretrain/Step Time": 8.543366065248847} +{"Pretrain/Learning Rate": 4.9041605184378746e-05, "Pretrain/Loss": 2.1540229320526123, "Pretrain/Loss (Raw)": 2.0125818252563477, "Pretrain/Step": 1104, "Pretrain/Step Time": 8.552855843678117} +{"Pretrain/Learning Rate": 4.903927562239617e-05, "Pretrain/Loss": 2.154405355453491, "Pretrain/Loss (Raw)": 2.0943260192871094, "Pretrain/Step": 1105, "Pretrain/Step Time": 8.550131898373365} +{"Pretrain/Learning Rate": 4.9036943288091066e-05, "Pretrain/Loss": 2.1526925563812256, "Pretrain/Loss (Raw)": 2.09735107421875, "Pretrain/Step": 1106, "Pretrain/Step Time": 8.549715897068381} +{"Pretrain/Learning Rate": 4.903460818173238e-05, "Pretrain/Loss": 2.1548280715942383, "Pretrain/Loss (Raw)": 2.4110190868377686, "Pretrain/Step": 1107, "Pretrain/Step Time": 8.545929251238704} +{"Pretrain/Learning Rate": 4.9032270303589435e-05, "Pretrain/Loss": 2.1554784774780273, "Pretrain/Loss (Raw)": 2.1277694702148438, "Pretrain/Step": 1108, "Pretrain/Step Time": 8.546446723863482} +{"Pretrain/Learning Rate": 4.9029929653931826e-05, "Pretrain/Loss": 2.157712936401367, "Pretrain/Loss (Raw)": 2.2991292476654053, "Pretrain/Step": 1109, "Pretrain/Step Time": 8.542388122528791} +{"Pretrain/Learning Rate": 4.90275862330295e-05, "Pretrain/Loss": 2.161904811859131, "Pretrain/Loss (Raw)": 2.6675944328308105, "Pretrain/Step": 1110, "Pretrain/Step Time": 8.553846454247832} +{"Pretrain/Learning Rate": 4.902524004115271e-05, "Pretrain/Loss": 2.1600329875946045, "Pretrain/Loss (Raw)": 2.202589273452759, "Pretrain/Step": 1111, "Pretrain/Step Time": 8.548022164031863} +{"Pretrain/Learning Rate": 4.902289107857202e-05, "Pretrain/Loss": 2.1573855876922607, "Pretrain/Loss (Raw)": 1.9916242361068726, "Pretrain/Step": 1112, "Pretrain/Step Time": 8.550788732245564} +{"Pretrain/Learning Rate": 4.9020539345558335e-05, "Pretrain/Loss": 2.157003879547119, "Pretrain/Loss (Raw)": 1.9633461236953735, "Pretrain/Step": 1113, "Pretrain/Step Time": 8.548360675573349} +{"Pretrain/Learning Rate": 4.9018184842382866e-05, "Pretrain/Loss": 2.1563377380371094, "Pretrain/Loss (Raw)": 2.160750150680542, "Pretrain/Step": 1114, "Pretrain/Step Time": 8.549965757876635} +{"Pretrain/Learning Rate": 4.901582756931715e-05, "Pretrain/Loss": 2.1568331718444824, "Pretrain/Loss (Raw)": 2.1870992183685303, "Pretrain/Step": 1115, "Pretrain/Step Time": 8.549308074638247} +{"Pretrain/Learning Rate": 4.901346752663302e-05, "Pretrain/Loss": 2.153686046600342, "Pretrain/Loss (Raw)": 2.303597927093506, "Pretrain/Step": 1116, "Pretrain/Step Time": 8.557419385761023} +{"Pretrain/Learning Rate": 4.9011104714602666e-05, "Pretrain/Loss": 2.1528992652893066, "Pretrain/Loss (Raw)": 2.1955349445343018, "Pretrain/Step": 1117, "Pretrain/Step Time": 8.54475667141378} +{"Pretrain/Learning Rate": 4.900873913349857e-05, "Pretrain/Loss": 2.1519346237182617, "Pretrain/Loss (Raw)": 2.3089356422424316, "Pretrain/Step": 1118, "Pretrain/Step Time": 8.552963603287935} +{"Pretrain/Learning Rate": 4.9006370783593544e-05, "Pretrain/Loss": 2.153522491455078, "Pretrain/Loss (Raw)": 2.3494856357574463, "Pretrain/Step": 1119, "Pretrain/Step Time": 8.550613718107343} +{"Pretrain/Learning Rate": 4.900399966516073e-05, "Pretrain/Loss": 2.154033660888672, "Pretrain/Loss (Raw)": 2.051450252532959, "Pretrain/Step": 1120, "Pretrain/Step Time": 8.550871334969997} +{"Pretrain/Learning Rate": 4.900162577847355e-05, "Pretrain/Loss": 2.1564278602600098, "Pretrain/Loss (Raw)": 2.303955316543579, "Pretrain/Step": 1121, "Pretrain/Step Time": 8.54829921759665} +{"Pretrain/Learning Rate": 4.899924912380579e-05, "Pretrain/Loss": 2.1558961868286133, "Pretrain/Loss (Raw)": 2.1039509773254395, "Pretrain/Step": 1122, "Pretrain/Step Time": 8.556673793122172} +{"Pretrain/Learning Rate": 4.899686970143153e-05, "Pretrain/Loss": 2.157315731048584, "Pretrain/Loss (Raw)": 2.2449374198913574, "Pretrain/Step": 1123, "Pretrain/Step Time": 8.547708425670862} +{"Pretrain/Learning Rate": 4.8994487511625184e-05, "Pretrain/Loss": 2.157615900039673, "Pretrain/Loss (Raw)": 2.182655096054077, "Pretrain/Step": 1124, "Pretrain/Step Time": 8.54412786476314} +{"Pretrain/Learning Rate": 4.899210255466147e-05, "Pretrain/Loss": 2.1554503440856934, "Pretrain/Loss (Raw)": 2.026212215423584, "Pretrain/Step": 1125, "Pretrain/Step Time": 8.544052036479115} +{"Pretrain/Learning Rate": 4.898971483081543e-05, "Pretrain/Loss": 2.1560187339782715, "Pretrain/Loss (Raw)": 2.133044481277466, "Pretrain/Step": 1126, "Pretrain/Step Time": 8.548521347343922} +{"Pretrain/Learning Rate": 4.898732434036244e-05, "Pretrain/Loss": 2.157280683517456, "Pretrain/Loss (Raw)": 2.272998094558716, "Pretrain/Step": 1127, "Pretrain/Step Time": 8.548028495162725} +{"Pretrain/Learning Rate": 4.898493108357817e-05, "Pretrain/Loss": 2.1564719676971436, "Pretrain/Loss (Raw)": 1.9583522081375122, "Pretrain/Step": 1128, "Pretrain/Step Time": 8.552274810150266} +{"Pretrain/Learning Rate": 4.898253506073863e-05, "Pretrain/Loss": 2.1545462608337402, "Pretrain/Loss (Raw)": 1.946955919265747, "Pretrain/Step": 1129, "Pretrain/Step Time": 8.546040739864111} +{"Pretrain/Learning Rate": 4.8980136272120136e-05, "Pretrain/Loss": 2.1535744667053223, "Pretrain/Loss (Raw)": 2.1969611644744873, "Pretrain/Step": 1130, "Pretrain/Step Time": 8.552301652729511} +{"Pretrain/Learning Rate": 4.8977734717999326e-05, "Pretrain/Loss": 2.1539783477783203, "Pretrain/Loss (Raw)": 2.0283865928649902, "Pretrain/Step": 1131, "Pretrain/Step Time": 8.551015404984355} +{"Pretrain/Learning Rate": 4.8975330398653164e-05, "Pretrain/Loss": 2.1545095443725586, "Pretrain/Loss (Raw)": 2.1696865558624268, "Pretrain/Step": 1132, "Pretrain/Step Time": 8.555051075294614} +{"Pretrain/Learning Rate": 4.8972923314358934e-05, "Pretrain/Loss": 2.1547303199768066, "Pretrain/Loss (Raw)": 2.1479930877685547, "Pretrain/Step": 1133, "Pretrain/Step Time": 8.553726205602288} +{"Pretrain/Learning Rate": 4.8970513465394206e-05, "Pretrain/Loss": 2.1561498641967773, "Pretrain/Loss (Raw)": 2.332533597946167, "Pretrain/Step": 1134, "Pretrain/Step Time": 8.568971134722233} +{"Pretrain/Learning Rate": 4.896810085203692e-05, "Pretrain/Loss": 2.155398368835449, "Pretrain/Loss (Raw)": 2.0038793087005615, "Pretrain/Step": 1135, "Pretrain/Step Time": 8.55855698697269} +{"Pretrain/Learning Rate": 4.896568547456531e-05, "Pretrain/Loss": 2.1567845344543457, "Pretrain/Loss (Raw)": 2.18113374710083, "Pretrain/Step": 1136, "Pretrain/Step Time": 8.559769647195935} +{"Pretrain/Learning Rate": 4.896326733325791e-05, "Pretrain/Loss": 2.159747838973999, "Pretrain/Loss (Raw)": 2.31097149848938, "Pretrain/Step": 1137, "Pretrain/Step Time": 8.559603145346045} +{"Pretrain/Learning Rate": 4.8960846428393615e-05, "Pretrain/Loss": 2.166391134262085, "Pretrain/Loss (Raw)": 2.9233222007751465, "Pretrain/Step": 1138, "Pretrain/Step Time": 8.557239493355155} +{"Pretrain/Learning Rate": 4.8958422760251585e-05, "Pretrain/Loss": 2.16685152053833, "Pretrain/Loss (Raw)": 2.2926273345947266, "Pretrain/Step": 1139, "Pretrain/Step Time": 8.559005161747336} +{"Pretrain/Learning Rate": 4.8955996329111364e-05, "Pretrain/Loss": 2.1663601398468018, "Pretrain/Loss (Raw)": 2.010127067565918, "Pretrain/Step": 1140, "Pretrain/Step Time": 8.566688645631075} +{"Pretrain/Learning Rate": 4.895356713525275e-05, "Pretrain/Loss": 2.1670517921447754, "Pretrain/Loss (Raw)": 2.1447525024414062, "Pretrain/Step": 1141, "Pretrain/Step Time": 8.564462203532457} +{"Pretrain/Learning Rate": 4.895113517895591e-05, "Pretrain/Loss": 2.165817975997925, "Pretrain/Loss (Raw)": 2.2123985290527344, "Pretrain/Step": 1142, "Pretrain/Step Time": 8.560038255527616} +{"Pretrain/Learning Rate": 4.8948700460501294e-05, "Pretrain/Loss": 2.1663246154785156, "Pretrain/Loss (Raw)": 2.207906484603882, "Pretrain/Step": 1143, "Pretrain/Step Time": 8.561680799350142} +{"Pretrain/Learning Rate": 4.8946262980169686e-05, "Pretrain/Loss": 2.1668546199798584, "Pretrain/Loss (Raw)": 2.0799877643585205, "Pretrain/Step": 1144, "Pretrain/Step Time": 8.56016792356968} +{"Pretrain/Learning Rate": 4.894382273824221e-05, "Pretrain/Loss": 2.1677541732788086, "Pretrain/Loss (Raw)": 2.217442274093628, "Pretrain/Step": 1145, "Pretrain/Step Time": 8.563816107809544} +{"Pretrain/Learning Rate": 4.894137973500025e-05, "Pretrain/Loss": 2.167914390563965, "Pretrain/Loss (Raw)": 2.2094295024871826, "Pretrain/Step": 1146, "Pretrain/Step Time": 8.565536636859179} +{"Pretrain/Learning Rate": 4.893893397072558e-05, "Pretrain/Loss": 2.1687798500061035, "Pretrain/Loss (Raw)": 2.280684232711792, "Pretrain/Step": 1147, "Pretrain/Step Time": 8.562216775491834} +{"Pretrain/Learning Rate": 4.893648544570022e-05, "Pretrain/Loss": 2.166684150695801, "Pretrain/Loss (Raw)": 1.8702805042266846, "Pretrain/Step": 1148, "Pretrain/Step Time": 8.56328572705388} +{"Pretrain/Learning Rate": 4.893403416020658e-05, "Pretrain/Loss": 2.166095733642578, "Pretrain/Loss (Raw)": 2.0520551204681396, "Pretrain/Step": 1149, "Pretrain/Step Time": 8.562114998698235} +{"Pretrain/Learning Rate": 4.893158011452734e-05, "Pretrain/Loss": 2.165344715118408, "Pretrain/Loss (Raw)": 2.3108572959899902, "Pretrain/Step": 1150, "Pretrain/Step Time": 8.553743578493595} +{"Pretrain/Learning Rate": 4.8929123308945505e-05, "Pretrain/Loss": 2.163789987564087, "Pretrain/Loss (Raw)": 2.050144910812378, "Pretrain/Step": 1151, "Pretrain/Step Time": 8.555172743275762} +{"Pretrain/Learning Rate": 4.8926663743744414e-05, "Pretrain/Loss": 2.1670563220977783, "Pretrain/Loss (Raw)": 2.3817756175994873, "Pretrain/Step": 1152, "Pretrain/Step Time": 8.563361158594489} +{"Pretrain/Learning Rate": 4.892420141920772e-05, "Pretrain/Loss": 2.1692848205566406, "Pretrain/Loss (Raw)": 2.3104729652404785, "Pretrain/Step": 1153, "Pretrain/Step Time": 8.557240605354309} +{"Pretrain/Learning Rate": 4.8921736335619385e-05, "Pretrain/Loss": 2.169990301132202, "Pretrain/Loss (Raw)": 2.236060619354248, "Pretrain/Step": 1154, "Pretrain/Step Time": 8.55711623467505} +{"Pretrain/Learning Rate": 4.8919268493263684e-05, "Pretrain/Loss": 2.169727087020874, "Pretrain/Loss (Raw)": 2.0677757263183594, "Pretrain/Step": 1155, "Pretrain/Step Time": 8.554826978594065} +{"Pretrain/Learning Rate": 4.891679789242524e-05, "Pretrain/Loss": 2.167249917984009, "Pretrain/Loss (Raw)": 2.0624382495880127, "Pretrain/Step": 1156, "Pretrain/Step Time": 8.554885258898139} +{"Pretrain/Learning Rate": 4.891432453338895e-05, "Pretrain/Loss": 2.167771339416504, "Pretrain/Loss (Raw)": 2.186472177505493, "Pretrain/Step": 1157, "Pretrain/Step Time": 8.551754361018538} +{"Pretrain/Learning Rate": 4.8911848416440075e-05, "Pretrain/Loss": 2.1692826747894287, "Pretrain/Loss (Raw)": 2.258460283279419, "Pretrain/Step": 1158, "Pretrain/Step Time": 8.552826657891273} +{"Pretrain/Learning Rate": 4.890936954186416e-05, "Pretrain/Loss": 2.168839693069458, "Pretrain/Loss (Raw)": 2.2506189346313477, "Pretrain/Step": 1159, "Pretrain/Step Time": 8.557549562305212} +{"Pretrain/Learning Rate": 4.890688790994709e-05, "Pretrain/Loss": 2.168330669403076, "Pretrain/Loss (Raw)": 2.061271905899048, "Pretrain/Step": 1160, "Pretrain/Step Time": 8.556613355875015} +{"Pretrain/Learning Rate": 4.890440352097505e-05, "Pretrain/Loss": 2.166626453399658, "Pretrain/Loss (Raw)": 2.0114972591400146, "Pretrain/Step": 1161, "Pretrain/Step Time": 8.55415217205882} +{"Pretrain/Learning Rate": 4.8901916375234556e-05, "Pretrain/Loss": 2.1651086807250977, "Pretrain/Loss (Raw)": 2.031789541244507, "Pretrain/Step": 1162, "Pretrain/Step Time": 8.55751721188426} +{"Pretrain/Learning Rate": 4.889942647301243e-05, "Pretrain/Loss": 2.1677334308624268, "Pretrain/Loss (Raw)": 2.3998215198516846, "Pretrain/Step": 1163, "Pretrain/Step Time": 8.556090904399753} +{"Pretrain/Learning Rate": 4.8896933814595834e-05, "Pretrain/Loss": 2.17025089263916, "Pretrain/Loss (Raw)": 2.4250240325927734, "Pretrain/Step": 1164, "Pretrain/Step Time": 8.553951313719153} +{"Pretrain/Learning Rate": 4.8894438400272224e-05, "Pretrain/Loss": 2.170267343521118, "Pretrain/Loss (Raw)": 2.123432159423828, "Pretrain/Step": 1165, "Pretrain/Step Time": 8.554424431174994} +{"Pretrain/Learning Rate": 4.889194023032938e-05, "Pretrain/Loss": 2.171909809112549, "Pretrain/Loss (Raw)": 2.2133541107177734, "Pretrain/Step": 1166, "Pretrain/Step Time": 8.556142488494515} +{"Pretrain/Learning Rate": 4.8889439305055406e-05, "Pretrain/Loss": 2.170896291732788, "Pretrain/Loss (Raw)": 2.148622751235962, "Pretrain/Step": 1167, "Pretrain/Step Time": 8.550667146220803} +{"Pretrain/Learning Rate": 4.8886935624738715e-05, "Pretrain/Loss": 2.1710891723632812, "Pretrain/Loss (Raw)": 2.148874521255493, "Pretrain/Step": 1168, "Pretrain/Step Time": 8.551551965996623} +{"Pretrain/Learning Rate": 4.888442918966806e-05, "Pretrain/Loss": 2.170994281768799, "Pretrain/Loss (Raw)": 2.0606772899627686, "Pretrain/Step": 1169, "Pretrain/Step Time": 8.550654916092753} +{"Pretrain/Learning Rate": 4.888192000013248e-05, "Pretrain/Loss": 2.1694631576538086, "Pretrain/Loss (Raw)": 2.147899866104126, "Pretrain/Step": 1170, "Pretrain/Step Time": 8.549825556576252} +{"Pretrain/Learning Rate": 4.887940805642135e-05, "Pretrain/Loss": 2.1677794456481934, "Pretrain/Loss (Raw)": 2.01558518409729, "Pretrain/Step": 1171, "Pretrain/Step Time": 8.547800241038203} +{"Pretrain/Learning Rate": 4.887689335882436e-05, "Pretrain/Loss": 2.166818857192993, "Pretrain/Loss (Raw)": 2.2235453128814697, "Pretrain/Step": 1172, "Pretrain/Step Time": 8.551571663469076} +{"Pretrain/Learning Rate": 4.8874375907631506e-05, "Pretrain/Loss": 2.16495943069458, "Pretrain/Loss (Raw)": 2.0837409496307373, "Pretrain/Step": 1173, "Pretrain/Step Time": 8.546982960775495} +{"Pretrain/Learning Rate": 4.887185570313314e-05, "Pretrain/Loss": 2.1655290126800537, "Pretrain/Loss (Raw)": 2.167834520339966, "Pretrain/Step": 1174, "Pretrain/Step Time": 8.547265727072954} +{"Pretrain/Learning Rate": 4.886933274561988e-05, "Pretrain/Loss": 2.1683809757232666, "Pretrain/Loss (Raw)": 2.262751579284668, "Pretrain/Step": 1175, "Pretrain/Step Time": 8.547494925558567} +{"Pretrain/Learning Rate": 4.886680703538269e-05, "Pretrain/Loss": 2.168888568878174, "Pretrain/Loss (Raw)": 2.0554325580596924, "Pretrain/Step": 1176, "Pretrain/Step Time": 8.554440064355731} +{"Pretrain/Learning Rate": 4.886427857271284e-05, "Pretrain/Loss": 2.1711525917053223, "Pretrain/Loss (Raw)": 2.246957302093506, "Pretrain/Step": 1177, "Pretrain/Step Time": 8.545424479991198} +{"Pretrain/Learning Rate": 4.886174735790194e-05, "Pretrain/Loss": 2.1720900535583496, "Pretrain/Loss (Raw)": 2.09926176071167, "Pretrain/Step": 1178, "Pretrain/Step Time": 8.54843752272427} +{"Pretrain/Learning Rate": 4.88592133912419e-05, "Pretrain/Loss": 2.17366099357605, "Pretrain/Loss (Raw)": 2.1423728466033936, "Pretrain/Step": 1179, "Pretrain/Step Time": 8.55113903991878} +{"Pretrain/Learning Rate": 4.885667667302494e-05, "Pretrain/Loss": 2.171908378601074, "Pretrain/Loss (Raw)": 1.9539294242858887, "Pretrain/Step": 1180, "Pretrain/Step Time": 8.555193094536662} +{"Pretrain/Learning Rate": 4.88541372035436e-05, "Pretrain/Loss": 2.1686148643493652, "Pretrain/Loss (Raw)": 1.794104814529419, "Pretrain/Step": 1181, "Pretrain/Step Time": 8.553942145779729} +{"Pretrain/Learning Rate": 4.885159498309077e-05, "Pretrain/Loss": 2.167473316192627, "Pretrain/Loss (Raw)": 2.116503953933716, "Pretrain/Step": 1182, "Pretrain/Step Time": 8.550818014889956} +{"Pretrain/Learning Rate": 4.884905001195961e-05, "Pretrain/Loss": 2.165618658065796, "Pretrain/Loss (Raw)": 2.0764429569244385, "Pretrain/Step": 1183, "Pretrain/Step Time": 8.551466094329953} +{"Pretrain/Learning Rate": 4.884650229044361e-05, "Pretrain/Loss": 2.1669862270355225, "Pretrain/Loss (Raw)": 2.17460036277771, "Pretrain/Step": 1184, "Pretrain/Step Time": 8.556865524500608} +{"Pretrain/Learning Rate": 4.884395181883661e-05, "Pretrain/Loss": 2.1657485961914062, "Pretrain/Loss (Raw)": 2.092317581176758, "Pretrain/Step": 1185, "Pretrain/Step Time": 8.55565225891769} +{"Pretrain/Learning Rate": 4.8841398597432725e-05, "Pretrain/Loss": 2.1660027503967285, "Pretrain/Loss (Raw)": 2.1195383071899414, "Pretrain/Step": 1186, "Pretrain/Step Time": 8.549949346110225} +{"Pretrain/Learning Rate": 4.883884262652641e-05, "Pretrain/Loss": 2.1658620834350586, "Pretrain/Loss (Raw)": 2.1421854496002197, "Pretrain/Step": 1187, "Pretrain/Step Time": 8.5514792855829} +{"Pretrain/Learning Rate": 4.883628390641243e-05, "Pretrain/Loss": 2.165112018585205, "Pretrain/Loss (Raw)": 2.0968434810638428, "Pretrain/Step": 1188, "Pretrain/Step Time": 8.552536759525537} +{"Pretrain/Learning Rate": 4.883372243738588e-05, "Pretrain/Loss": 2.1670331954956055, "Pretrain/Loss (Raw)": 2.3024206161499023, "Pretrain/Step": 1189, "Pretrain/Step Time": 8.551403727382421} +{"Pretrain/Learning Rate": 4.883115821974213e-05, "Pretrain/Loss": 2.163832664489746, "Pretrain/Loss (Raw)": 2.222074508666992, "Pretrain/Step": 1190, "Pretrain/Step Time": 8.554558949545026} +{"Pretrain/Learning Rate": 4.8828591253776937e-05, "Pretrain/Loss": 2.161637783050537, "Pretrain/Loss (Raw)": 1.8863390684127808, "Pretrain/Step": 1191, "Pretrain/Step Time": 8.552410809323192} +{"Pretrain/Learning Rate": 4.88260215397863e-05, "Pretrain/Loss": 2.159717559814453, "Pretrain/Loss (Raw)": 2.066521644592285, "Pretrain/Step": 1192, "Pretrain/Step Time": 8.552421793341637} +{"Pretrain/Learning Rate": 4.882344907806659e-05, "Pretrain/Loss": 2.1592793464660645, "Pretrain/Loss (Raw)": 2.06825590133667, "Pretrain/Step": 1193, "Pretrain/Step Time": 8.556602383032441} +{"Pretrain/Learning Rate": 4.882087386891448e-05, "Pretrain/Loss": 2.1598219871520996, "Pretrain/Loss (Raw)": 2.111567735671997, "Pretrain/Step": 1194, "Pretrain/Step Time": 8.556829994544387} +{"Pretrain/Learning Rate": 4.8818295912626955e-05, "Pretrain/Loss": 2.159228801727295, "Pretrain/Loss (Raw)": 2.128044605255127, "Pretrain/Step": 1195, "Pretrain/Step Time": 8.562659678980708} +{"Pretrain/Learning Rate": 4.88157152095013e-05, "Pretrain/Loss": 2.158479928970337, "Pretrain/Loss (Raw)": 2.0908641815185547, "Pretrain/Step": 1196, "Pretrain/Step Time": 8.55779454484582} +{"Pretrain/Learning Rate": 4.881313175983515e-05, "Pretrain/Loss": 2.1598708629608154, "Pretrain/Loss (Raw)": 2.28756046295166, "Pretrain/Step": 1197, "Pretrain/Step Time": 8.56032838858664} +{"Pretrain/Learning Rate": 4.881054556392642e-05, "Pretrain/Loss": 2.1623101234436035, "Pretrain/Loss (Raw)": 2.2581589221954346, "Pretrain/Step": 1198, "Pretrain/Step Time": 8.557162966579199} +{"Pretrain/Learning Rate": 4.8807956622073394e-05, "Pretrain/Loss": 2.164229154586792, "Pretrain/Loss (Raw)": 2.313633918762207, "Pretrain/Step": 1199, "Pretrain/Step Time": 8.561654508113861} +{"Pretrain/Learning Rate": 4.880536493457461e-05, "Pretrain/Loss": 2.163414239883423, "Pretrain/Loss (Raw)": 2.0746207237243652, "Pretrain/Step": 1200, "Pretrain/Step Time": 8.56070727109909} +{"Pretrain/Learning Rate": 4.880277050172897e-05, "Pretrain/Loss": 2.166156053543091, "Pretrain/Loss (Raw)": 2.333747386932373, "Pretrain/Step": 1201, "Pretrain/Step Time": 8.56160562299192} +{"Pretrain/Learning Rate": 4.880017332383567e-05, "Pretrain/Loss": 2.168874979019165, "Pretrain/Loss (Raw)": 2.2662007808685303, "Pretrain/Step": 1202, "Pretrain/Step Time": 8.55459300428629} +{"Pretrain/Learning Rate": 4.879757340119425e-05, "Pretrain/Loss": 2.169546604156494, "Pretrain/Loss (Raw)": 2.1993486881256104, "Pretrain/Step": 1203, "Pretrain/Step Time": 8.55444043315947} +{"Pretrain/Learning Rate": 4.879497073410451e-05, "Pretrain/Loss": 2.1689157485961914, "Pretrain/Loss (Raw)": 2.0246846675872803, "Pretrain/Step": 1204, "Pretrain/Step Time": 8.549608079716563} +{"Pretrain/Learning Rate": 4.8792365322866626e-05, "Pretrain/Loss": 2.167886734008789, "Pretrain/Loss (Raw)": 2.1705493927001953, "Pretrain/Step": 1205, "Pretrain/Step Time": 8.550754627212882} +{"Pretrain/Learning Rate": 4.878975716778106e-05, "Pretrain/Loss": 2.1683168411254883, "Pretrain/Loss (Raw)": 2.265435218811035, "Pretrain/Step": 1206, "Pretrain/Step Time": 8.550896445289254} +{"Pretrain/Learning Rate": 4.878714626914859e-05, "Pretrain/Loss": 2.16731595993042, "Pretrain/Loss (Raw)": 2.205101490020752, "Pretrain/Step": 1207, "Pretrain/Step Time": 8.555021420121193} +{"Pretrain/Learning Rate": 4.878453262727033e-05, "Pretrain/Loss": 2.164821147918701, "Pretrain/Loss (Raw)": 1.8754160404205322, "Pretrain/Step": 1208, "Pretrain/Step Time": 8.557738462463021} +{"Pretrain/Learning Rate": 4.878191624244769e-05, "Pretrain/Loss": 2.169255495071411, "Pretrain/Loss (Raw)": 2.3831324577331543, "Pretrain/Step": 1209, "Pretrain/Step Time": 8.55685125477612} +{"Pretrain/Learning Rate": 4.8779297114982406e-05, "Pretrain/Loss": 2.168626070022583, "Pretrain/Loss (Raw)": 2.1170237064361572, "Pretrain/Step": 1210, "Pretrain/Step Time": 8.556005366146564} +{"Pretrain/Learning Rate": 4.877667524517652e-05, "Pretrain/Loss": 2.168595790863037, "Pretrain/Loss (Raw)": 2.1522271633148193, "Pretrain/Step": 1211, "Pretrain/Step Time": 8.560608226805925} +{"Pretrain/Learning Rate": 4.877405063333241e-05, "Pretrain/Loss": 2.1697475910186768, "Pretrain/Loss (Raw)": 2.270298719406128, "Pretrain/Step": 1212, "Pretrain/Step Time": 8.561106275767088} +{"Pretrain/Learning Rate": 4.877142327975276e-05, "Pretrain/Loss": 2.171980381011963, "Pretrain/Loss (Raw)": 2.389847755432129, "Pretrain/Step": 1213, "Pretrain/Step Time": 8.562878850847483} +{"Pretrain/Learning Rate": 4.8768793184740556e-05, "Pretrain/Loss": 2.1736979484558105, "Pretrain/Loss (Raw)": 2.2129967212677, "Pretrain/Step": 1214, "Pretrain/Step Time": 8.548314219340682} +{"Pretrain/Learning Rate": 4.8766160348599125e-05, "Pretrain/Loss": 2.1736836433410645, "Pretrain/Loss (Raw)": 2.2129604816436768, "Pretrain/Step": 1215, "Pretrain/Step Time": 8.545626755803823} +{"Pretrain/Learning Rate": 4.876352477163209e-05, "Pretrain/Loss": 2.17291522026062, "Pretrain/Loss (Raw)": 2.112025022506714, "Pretrain/Step": 1216, "Pretrain/Step Time": 8.54225880280137} +{"Pretrain/Learning Rate": 4.8760886454143394e-05, "Pretrain/Loss": 2.173064947128296, "Pretrain/Loss (Raw)": 2.3342623710632324, "Pretrain/Step": 1217, "Pretrain/Step Time": 8.541567964479327} +{"Pretrain/Learning Rate": 4.875824539643731e-05, "Pretrain/Loss": 2.171931743621826, "Pretrain/Loss (Raw)": 2.03884220123291, "Pretrain/Step": 1218, "Pretrain/Step Time": 8.538730664178729} +{"Pretrain/Learning Rate": 4.8755601598818427e-05, "Pretrain/Loss": 2.171525478363037, "Pretrain/Loss (Raw)": 2.106353282928467, "Pretrain/Step": 1219, "Pretrain/Step Time": 8.540401903912425} +{"Pretrain/Learning Rate": 4.875295506159161e-05, "Pretrain/Loss": 2.1720123291015625, "Pretrain/Loss (Raw)": 2.152195692062378, "Pretrain/Step": 1220, "Pretrain/Step Time": 8.544418646022677} +{"Pretrain/Learning Rate": 4.87503057850621e-05, "Pretrain/Loss": 2.1716227531433105, "Pretrain/Loss (Raw)": 2.0351903438568115, "Pretrain/Step": 1221, "Pretrain/Step Time": 8.551525184884667} +{"Pretrain/Learning Rate": 4.874765376953541e-05, "Pretrain/Loss": 2.17012357711792, "Pretrain/Loss (Raw)": 2.1978919506073, "Pretrain/Step": 1222, "Pretrain/Step Time": 8.547713795676827} +{"Pretrain/Learning Rate": 4.874499901531737e-05, "Pretrain/Loss": 2.169142484664917, "Pretrain/Loss (Raw)": 2.036280393600464, "Pretrain/Step": 1223, "Pretrain/Step Time": 8.552421763539314} +{"Pretrain/Learning Rate": 4.874234152271418e-05, "Pretrain/Loss": 2.169046401977539, "Pretrain/Loss (Raw)": 2.1641438007354736, "Pretrain/Step": 1224, "Pretrain/Step Time": 8.550513796508312} +{"Pretrain/Learning Rate": 4.8739681292032266e-05, "Pretrain/Loss": 2.1695523262023926, "Pretrain/Loss (Raw)": 2.1898927688598633, "Pretrain/Step": 1225, "Pretrain/Step Time": 8.55036193691194} +{"Pretrain/Learning Rate": 4.8737018323578445e-05, "Pretrain/Loss": 2.169499158859253, "Pretrain/Loss (Raw)": 2.0741615295410156, "Pretrain/Step": 1226, "Pretrain/Step Time": 8.551548358052969} +{"Pretrain/Learning Rate": 4.873435261765982e-05, "Pretrain/Loss": 2.1694536209106445, "Pretrain/Loss (Raw)": 2.1643424034118652, "Pretrain/Step": 1227, "Pretrain/Step Time": 8.551318805664778} +{"Pretrain/Learning Rate": 4.873168417458381e-05, "Pretrain/Loss": 2.170377016067505, "Pretrain/Loss (Raw)": 2.33097243309021, "Pretrain/Step": 1228, "Pretrain/Step Time": 8.545183414593339} +{"Pretrain/Learning Rate": 4.8729012994658166e-05, "Pretrain/Loss": 2.1716086864471436, "Pretrain/Loss (Raw)": 2.163947343826294, "Pretrain/Step": 1229, "Pretrain/Step Time": 8.550151756033301} +{"Pretrain/Learning Rate": 4.8726339078190914e-05, "Pretrain/Loss": 2.1656246185302734, "Pretrain/Loss (Raw)": 2.0254898071289062, "Pretrain/Step": 1230, "Pretrain/Step Time": 8.549442352727056} +{"Pretrain/Learning Rate": 4.872366242549044e-05, "Pretrain/Loss": 2.1680126190185547, "Pretrain/Loss (Raw)": 2.2694878578186035, "Pretrain/Step": 1231, "Pretrain/Step Time": 8.558368416503072} +{"Pretrain/Learning Rate": 4.872098303686543e-05, "Pretrain/Loss": 2.1689302921295166, "Pretrain/Loss (Raw)": 2.1300530433654785, "Pretrain/Step": 1232, "Pretrain/Step Time": 8.54994136467576} +{"Pretrain/Learning Rate": 4.871830091262488e-05, "Pretrain/Loss": 2.16969633102417, "Pretrain/Loss (Raw)": 2.1923863887786865, "Pretrain/Step": 1233, "Pretrain/Step Time": 8.553294107317924} +{"Pretrain/Learning Rate": 4.8715616053078095e-05, "Pretrain/Loss": 2.169313907623291, "Pretrain/Loss (Raw)": 2.048388957977295, "Pretrain/Step": 1234, "Pretrain/Step Time": 8.55357794649899} +{"Pretrain/Learning Rate": 4.871292845853472e-05, "Pretrain/Loss": 2.170640230178833, "Pretrain/Loss (Raw)": 2.5807931423187256, "Pretrain/Step": 1235, "Pretrain/Step Time": 8.554499687626958} +{"Pretrain/Learning Rate": 4.87102381293047e-05, "Pretrain/Loss": 2.1698756217956543, "Pretrain/Loss (Raw)": 2.0298912525177, "Pretrain/Step": 1236, "Pretrain/Step Time": 8.551234144717455} +{"Pretrain/Learning Rate": 4.870754506569829e-05, "Pretrain/Loss": 2.1687064170837402, "Pretrain/Loss (Raw)": 2.1494834423065186, "Pretrain/Step": 1237, "Pretrain/Step Time": 8.557811722159386} +{"Pretrain/Learning Rate": 4.870484926802606e-05, "Pretrain/Loss": 2.16375732421875, "Pretrain/Loss (Raw)": 2.034132719039917, "Pretrain/Step": 1238, "Pretrain/Step Time": 8.545930137857795} +{"Pretrain/Learning Rate": 4.8702150736598925e-05, "Pretrain/Loss": 2.161710500717163, "Pretrain/Loss (Raw)": 1.940559983253479, "Pretrain/Step": 1239, "Pretrain/Step Time": 8.552841803058982} +{"Pretrain/Learning Rate": 4.8699449471728075e-05, "Pretrain/Loss": 2.1629490852355957, "Pretrain/Loss (Raw)": 2.150165557861328, "Pretrain/Step": 1240, "Pretrain/Step Time": 8.548599736765027} +{"Pretrain/Learning Rate": 4.869674547372504e-05, "Pretrain/Loss": 2.165808916091919, "Pretrain/Loss (Raw)": 2.3294074535369873, "Pretrain/Step": 1241, "Pretrain/Step Time": 8.551159484311938} +{"Pretrain/Learning Rate": 4.8694038742901646e-05, "Pretrain/Loss": 2.1669089794158936, "Pretrain/Loss (Raw)": 2.3015451431274414, "Pretrain/Step": 1242, "Pretrain/Step Time": 8.55106645822525} +{"Pretrain/Learning Rate": 4.869132927957007e-05, "Pretrain/Loss": 2.1654927730560303, "Pretrain/Loss (Raw)": 2.005842685699463, "Pretrain/Step": 1243, "Pretrain/Step Time": 8.557389026507735} +{"Pretrain/Learning Rate": 4.868861708404275e-05, "Pretrain/Loss": 2.1642770767211914, "Pretrain/Loss (Raw)": 2.1479692459106445, "Pretrain/Step": 1244, "Pretrain/Step Time": 8.550327334553003} +{"Pretrain/Learning Rate": 4.868590215663248e-05, "Pretrain/Loss": 2.165249824523926, "Pretrain/Loss (Raw)": 2.3200478553771973, "Pretrain/Step": 1245, "Pretrain/Step Time": 8.557288285344839} +{"Pretrain/Learning Rate": 4.8683184497652366e-05, "Pretrain/Loss": 2.1630334854125977, "Pretrain/Loss (Raw)": 2.025292158126831, "Pretrain/Step": 1246, "Pretrain/Step Time": 8.552343729883432} +{"Pretrain/Learning Rate": 4.868046410741582e-05, "Pretrain/Loss": 2.161055088043213, "Pretrain/Loss (Raw)": 2.09621524810791, "Pretrain/Step": 1247, "Pretrain/Step Time": 8.554726099595428} +{"Pretrain/Learning Rate": 4.867774098623657e-05, "Pretrain/Loss": 2.1620030403137207, "Pretrain/Loss (Raw)": 2.1727635860443115, "Pretrain/Step": 1248, "Pretrain/Step Time": 8.55308268405497} +{"Pretrain/Learning Rate": 4.8675015134428654e-05, "Pretrain/Loss": 2.160247325897217, "Pretrain/Loss (Raw)": 2.079259157180786, "Pretrain/Step": 1249, "Pretrain/Step Time": 8.558268187567592} +{"Pretrain/Learning Rate": 4.867228655230643e-05, "Pretrain/Loss": 2.1621532440185547, "Pretrain/Loss (Raw)": 2.3479039669036865, "Pretrain/Step": 1250, "Pretrain/Step Time": 8.549300080165267} +{"Pretrain/Learning Rate": 4.866955524018457e-05, "Pretrain/Loss": 2.161360740661621, "Pretrain/Loss (Raw)": 2.143522262573242, "Pretrain/Step": 1251, "Pretrain/Step Time": 8.55273170210421} +{"Pretrain/Learning Rate": 4.866682119837807e-05, "Pretrain/Loss": 2.161504030227661, "Pretrain/Loss (Raw)": 2.2009670734405518, "Pretrain/Step": 1252, "Pretrain/Step Time": 8.550626652315259} +{"Pretrain/Learning Rate": 4.866408442720223e-05, "Pretrain/Loss": 2.1634364128112793, "Pretrain/Loss (Raw)": 2.2735700607299805, "Pretrain/Step": 1253, "Pretrain/Step Time": 8.552896494045854} +{"Pretrain/Learning Rate": 4.8661344926972666e-05, "Pretrain/Loss": 2.164644718170166, "Pretrain/Loss (Raw)": 2.2876765727996826, "Pretrain/Step": 1254, "Pretrain/Step Time": 8.547084409743547} +{"Pretrain/Learning Rate": 4.8658602698005294e-05, "Pretrain/Loss": 2.1626436710357666, "Pretrain/Loss (Raw)": 2.0168848037719727, "Pretrain/Step": 1255, "Pretrain/Step Time": 8.54980044811964} +{"Pretrain/Learning Rate": 4.8655857740616395e-05, "Pretrain/Loss": 2.162985324859619, "Pretrain/Loss (Raw)": 2.002096652984619, "Pretrain/Step": 1256, "Pretrain/Step Time": 8.547935925424099} +{"Pretrain/Learning Rate": 4.8653110055122496e-05, "Pretrain/Loss": 2.1645097732543945, "Pretrain/Loss (Raw)": 2.1420793533325195, "Pretrain/Step": 1257, "Pretrain/Step Time": 8.548724690452218} +{"Pretrain/Learning Rate": 4.8650359641840495e-05, "Pretrain/Loss": 2.165872097015381, "Pretrain/Loss (Raw)": 2.3713321685791016, "Pretrain/Step": 1258, "Pretrain/Step Time": 8.546019025146961} +{"Pretrain/Learning Rate": 4.864760650108758e-05, "Pretrain/Loss": 2.1651978492736816, "Pretrain/Loss (Raw)": 1.9420784711837769, "Pretrain/Step": 1259, "Pretrain/Step Time": 8.546409908682108} +{"Pretrain/Learning Rate": 4.864485063318125e-05, "Pretrain/Loss": 2.1644697189331055, "Pretrain/Loss (Raw)": 2.076470375061035, "Pretrain/Step": 1260, "Pretrain/Step Time": 8.541535129770637} +{"Pretrain/Learning Rate": 4.864209203843932e-05, "Pretrain/Loss": 2.164973735809326, "Pretrain/Loss (Raw)": 2.212509870529175, "Pretrain/Step": 1261, "Pretrain/Step Time": 8.54880596511066} +{"Pretrain/Learning Rate": 4.8639330717179946e-05, "Pretrain/Loss": 2.164527416229248, "Pretrain/Loss (Raw)": 2.275419235229492, "Pretrain/Step": 1262, "Pretrain/Step Time": 8.53452935628593} +{"Pretrain/Learning Rate": 4.863656666972154e-05, "Pretrain/Loss": 2.164119243621826, "Pretrain/Loss (Raw)": 1.9516198635101318, "Pretrain/Step": 1263, "Pretrain/Step Time": 8.541463790461421} +{"Pretrain/Learning Rate": 4.86337998963829e-05, "Pretrain/Loss": 2.164856433868408, "Pretrain/Loss (Raw)": 2.275482654571533, "Pretrain/Step": 1264, "Pretrain/Step Time": 8.537715775892138} +{"Pretrain/Learning Rate": 4.863103039748309e-05, "Pretrain/Loss": 2.1642532348632812, "Pretrain/Loss (Raw)": 2.233783483505249, "Pretrain/Step": 1265, "Pretrain/Step Time": 8.537819927558303} +{"Pretrain/Learning Rate": 4.86282581733415e-05, "Pretrain/Loss": 2.156853437423706, "Pretrain/Loss (Raw)": 1.9761505126953125, "Pretrain/Step": 1266, "Pretrain/Step Time": 8.53617007099092} +{"Pretrain/Learning Rate": 4.8625483224277835e-05, "Pretrain/Loss": 2.1563806533813477, "Pretrain/Loss (Raw)": 2.232144832611084, "Pretrain/Step": 1267, "Pretrain/Step Time": 8.535018764436245} +{"Pretrain/Learning Rate": 4.8622705550612126e-05, "Pretrain/Loss": 2.157736301422119, "Pretrain/Loss (Raw)": 2.183603048324585, "Pretrain/Step": 1268, "Pretrain/Step Time": 8.5407729819417} +{"Pretrain/Learning Rate": 4.861992515266469e-05, "Pretrain/Loss": 2.1583986282348633, "Pretrain/Loss (Raw)": 2.229536294937134, "Pretrain/Step": 1269, "Pretrain/Step Time": 8.538164535537362} +{"Pretrain/Learning Rate": 4.8617142030756194e-05, "Pretrain/Loss": 2.1579666137695312, "Pretrain/Loss (Raw)": 2.1570968627929688, "Pretrain/Step": 1270, "Pretrain/Step Time": 8.535553641617298} +{"Pretrain/Learning Rate": 4.8614356185207575e-05, "Pretrain/Loss": 2.1568048000335693, "Pretrain/Loss (Raw)": 2.0592122077941895, "Pretrain/Step": 1271, "Pretrain/Step Time": 8.535734811797738} +{"Pretrain/Learning Rate": 4.861156761634014e-05, "Pretrain/Loss": 2.1576037406921387, "Pretrain/Loss (Raw)": 2.1822617053985596, "Pretrain/Step": 1272, "Pretrain/Step Time": 8.534260045737028} +{"Pretrain/Learning Rate": 4.860877632447546e-05, "Pretrain/Loss": 2.1572816371917725, "Pretrain/Loss (Raw)": 2.176198959350586, "Pretrain/Step": 1273, "Pretrain/Step Time": 8.531416045501828} +{"Pretrain/Learning Rate": 4.8605982309935446e-05, "Pretrain/Loss": 2.1562232971191406, "Pretrain/Loss (Raw)": 2.0739879608154297, "Pretrain/Step": 1274, "Pretrain/Step Time": 8.540328323841095} +{"Pretrain/Learning Rate": 4.860318557304232e-05, "Pretrain/Loss": 2.15446138381958, "Pretrain/Loss (Raw)": 2.055149555206299, "Pretrain/Step": 1275, "Pretrain/Step Time": 8.540811048820615} +{"Pretrain/Learning Rate": 4.860038611411861e-05, "Pretrain/Loss": 2.1565184593200684, "Pretrain/Loss (Raw)": 2.1335835456848145, "Pretrain/Step": 1276, "Pretrain/Step Time": 8.54030123539269} +{"Pretrain/Learning Rate": 4.8597583933487165e-05, "Pretrain/Loss": 2.157533884048462, "Pretrain/Loss (Raw)": 2.1819963455200195, "Pretrain/Step": 1277, "Pretrain/Step Time": 8.540276557207108} +{"Pretrain/Learning Rate": 4.859477903147115e-05, "Pretrain/Loss": 2.15908145904541, "Pretrain/Loss (Raw)": 2.508942127227783, "Pretrain/Step": 1278, "Pretrain/Step Time": 8.543336238712072} +{"Pretrain/Learning Rate": 4.8591971408394034e-05, "Pretrain/Loss": 2.159254789352417, "Pretrain/Loss (Raw)": 2.072350025177002, "Pretrain/Step": 1279, "Pretrain/Step Time": 8.54780201241374} +{"Pretrain/Learning Rate": 4.85891610645796e-05, "Pretrain/Loss": 2.158388137817383, "Pretrain/Loss (Raw)": 2.2708489894866943, "Pretrain/Step": 1280, "Pretrain/Step Time": 8.545300301164389} +{"Pretrain/Learning Rate": 4.8586348000351956e-05, "Pretrain/Loss": 2.156528949737549, "Pretrain/Loss (Raw)": 2.072495222091675, "Pretrain/Step": 1281, "Pretrain/Step Time": 8.540112983435392} +{"Pretrain/Learning Rate": 4.8583532216035524e-05, "Pretrain/Loss": 2.1559815406799316, "Pretrain/Loss (Raw)": 2.166019916534424, "Pretrain/Step": 1282, "Pretrain/Step Time": 8.54451259598136} +{"Pretrain/Learning Rate": 4.858071371195502e-05, "Pretrain/Loss": 2.1548264026641846, "Pretrain/Loss (Raw)": 1.9199020862579346, "Pretrain/Step": 1283, "Pretrain/Step Time": 8.546191714704037} +{"Pretrain/Learning Rate": 4.8577892488435504e-05, "Pretrain/Loss": 2.1551356315612793, "Pretrain/Loss (Raw)": 2.101996421813965, "Pretrain/Step": 1284, "Pretrain/Step Time": 8.54592490941286} +{"Pretrain/Learning Rate": 4.8575068545802316e-05, "Pretrain/Loss": 2.154592275619507, "Pretrain/Loss (Raw)": 2.116928815841675, "Pretrain/Step": 1285, "Pretrain/Step Time": 8.545403884723783} +{"Pretrain/Learning Rate": 4.8572241884381145e-05, "Pretrain/Loss": 2.1538853645324707, "Pretrain/Loss (Raw)": 2.167964220046997, "Pretrain/Step": 1286, "Pretrain/Step Time": 8.552897848188877} +{"Pretrain/Learning Rate": 4.856941250449795e-05, "Pretrain/Loss": 2.152029514312744, "Pretrain/Loss (Raw)": 2.013096570968628, "Pretrain/Step": 1287, "Pretrain/Step Time": 8.539620205760002} +{"Pretrain/Learning Rate": 4.8566580406479045e-05, "Pretrain/Loss": 2.152038335800171, "Pretrain/Loss (Raw)": 2.0624029636383057, "Pretrain/Step": 1288, "Pretrain/Step Time": 8.541672108694911} +{"Pretrain/Learning Rate": 4.856374559065104e-05, "Pretrain/Loss": 2.152127265930176, "Pretrain/Loss (Raw)": 2.022887945175171, "Pretrain/Step": 1289, "Pretrain/Step Time": 8.5409288816154} +{"Pretrain/Learning Rate": 4.856090805734086e-05, "Pretrain/Loss": 2.151993989944458, "Pretrain/Loss (Raw)": 2.0147273540496826, "Pretrain/Step": 1290, "Pretrain/Step Time": 8.539936853572726} +{"Pretrain/Learning Rate": 4.855806780687574e-05, "Pretrain/Loss": 2.1499085426330566, "Pretrain/Loss (Raw)": 2.1328694820404053, "Pretrain/Step": 1291, "Pretrain/Step Time": 8.540094375610352} +{"Pretrain/Learning Rate": 4.8555224839583236e-05, "Pretrain/Loss": 2.1490988731384277, "Pretrain/Loss (Raw)": 2.3213977813720703, "Pretrain/Step": 1292, "Pretrain/Step Time": 8.552310211583972} +{"Pretrain/Learning Rate": 4.8552379155791194e-05, "Pretrain/Loss": 2.1474761962890625, "Pretrain/Loss (Raw)": 1.9157084226608276, "Pretrain/Step": 1293, "Pretrain/Step Time": 8.543891243636608} +{"Pretrain/Learning Rate": 4.854953075582782e-05, "Pretrain/Loss": 2.144928216934204, "Pretrain/Loss (Raw)": 1.8872112035751343, "Pretrain/Step": 1294, "Pretrain/Step Time": 8.54836743324995} +{"Pretrain/Learning Rate": 4.854667964002158e-05, "Pretrain/Loss": 2.143747329711914, "Pretrain/Loss (Raw)": 1.9974720478057861, "Pretrain/Step": 1295, "Pretrain/Step Time": 8.547930434346199} +{"Pretrain/Learning Rate": 4.8543825808701294e-05, "Pretrain/Loss": 2.142148494720459, "Pretrain/Loss (Raw)": 1.9442254304885864, "Pretrain/Step": 1296, "Pretrain/Step Time": 8.544770825654268} +{"Pretrain/Learning Rate": 4.854096926219607e-05, "Pretrain/Loss": 2.1436452865600586, "Pretrain/Loss (Raw)": 2.252253532409668, "Pretrain/Step": 1297, "Pretrain/Step Time": 8.545787872746587} +{"Pretrain/Learning Rate": 4.853811000083535e-05, "Pretrain/Loss": 2.142545700073242, "Pretrain/Loss (Raw)": 2.007190704345703, "Pretrain/Step": 1298, "Pretrain/Step Time": 8.554538879543543} +{"Pretrain/Learning Rate": 4.8535248024948854e-05, "Pretrain/Loss": 2.143904209136963, "Pretrain/Loss (Raw)": 2.189448118209839, "Pretrain/Step": 1299, "Pretrain/Step Time": 8.551159186288714} +{"Pretrain/Learning Rate": 4.853238333486666e-05, "Pretrain/Loss": 2.1434543132781982, "Pretrain/Loss (Raw)": 2.16595196723938, "Pretrain/Step": 1300, "Pretrain/Step Time": 8.544982019811869} +{"Pretrain/Learning Rate": 4.852951593091914e-05, "Pretrain/Loss": 2.143899917602539, "Pretrain/Loss (Raw)": 2.1408212184906006, "Pretrain/Step": 1301, "Pretrain/Step Time": 8.54493785649538} +{"Pretrain/Learning Rate": 4.852664581343696e-05, "Pretrain/Loss": 2.1430811882019043, "Pretrain/Loss (Raw)": 2.063007354736328, "Pretrain/Step": 1302, "Pretrain/Step Time": 8.544382331892848} +{"Pretrain/Learning Rate": 4.852377298275113e-05, "Pretrain/Loss": 2.1438310146331787, "Pretrain/Loss (Raw)": 2.3587534427642822, "Pretrain/Step": 1303, "Pretrain/Step Time": 8.54488087631762} +{"Pretrain/Learning Rate": 4.852089743919295e-05, "Pretrain/Loss": 2.1445581912994385, "Pretrain/Loss (Raw)": 2.148484706878662, "Pretrain/Step": 1304, "Pretrain/Step Time": 8.546680077910423} +{"Pretrain/Learning Rate": 4.851801918309403e-05, "Pretrain/Loss": 2.1452205181121826, "Pretrain/Loss (Raw)": 2.3317339420318604, "Pretrain/Step": 1305, "Pretrain/Step Time": 8.54616180434823} +{"Pretrain/Learning Rate": 4.8515138214786335e-05, "Pretrain/Loss": 2.148101329803467, "Pretrain/Loss (Raw)": 2.468022108078003, "Pretrain/Step": 1306, "Pretrain/Step Time": 8.543361313641071} +{"Pretrain/Learning Rate": 4.851225453460209e-05, "Pretrain/Loss": 2.148029327392578, "Pretrain/Loss (Raw)": 2.133157253265381, "Pretrain/Step": 1307, "Pretrain/Step Time": 8.542226387187839} +{"Pretrain/Learning Rate": 4.850936814287386e-05, "Pretrain/Loss": 2.1495485305786133, "Pretrain/Loss (Raw)": 2.1483919620513916, "Pretrain/Step": 1308, "Pretrain/Step Time": 8.539142481982708} +{"Pretrain/Learning Rate": 4.85064790399345e-05, "Pretrain/Loss": 2.154649257659912, "Pretrain/Loss (Raw)": 2.4469857215881348, "Pretrain/Step": 1309, "Pretrain/Step Time": 8.53587312437594} +{"Pretrain/Learning Rate": 4.850358722611723e-05, "Pretrain/Loss": 2.153095245361328, "Pretrain/Loss (Raw)": 1.9175901412963867, "Pretrain/Step": 1310, "Pretrain/Step Time": 8.54816448315978} +{"Pretrain/Learning Rate": 4.850069270175552e-05, "Pretrain/Loss": 2.155332088470459, "Pretrain/Loss (Raw)": 2.362760543823242, "Pretrain/Step": 1311, "Pretrain/Step Time": 8.542354512959719} +{"Pretrain/Learning Rate": 4.849779546718319e-05, "Pretrain/Loss": 2.1546528339385986, "Pretrain/Loss (Raw)": 2.087636709213257, "Pretrain/Step": 1312, "Pretrain/Step Time": 8.538080919533968} +{"Pretrain/Learning Rate": 4.8494895522734364e-05, "Pretrain/Loss": 2.1551856994628906, "Pretrain/Loss (Raw)": 2.160531520843506, "Pretrain/Step": 1313, "Pretrain/Step Time": 8.535999557003379} +{"Pretrain/Learning Rate": 4.849199286874347e-05, "Pretrain/Loss": 2.15358829498291, "Pretrain/Loss (Raw)": 1.9150627851486206, "Pretrain/Step": 1314, "Pretrain/Step Time": 8.538591066375375} +{"Pretrain/Learning Rate": 4.8489087505545266e-05, "Pretrain/Loss": 2.153872489929199, "Pretrain/Loss (Raw)": 2.1785781383514404, "Pretrain/Step": 1315, "Pretrain/Step Time": 8.535318914800882} +{"Pretrain/Learning Rate": 4.84861794334748e-05, "Pretrain/Loss": 2.1558308601379395, "Pretrain/Loss (Raw)": 2.347515821456909, "Pretrain/Step": 1316, "Pretrain/Step Time": 8.5486921351403} +{"Pretrain/Learning Rate": 4.848326865286746e-05, "Pretrain/Loss": 2.155026912689209, "Pretrain/Loss (Raw)": 2.199517250061035, "Pretrain/Step": 1317, "Pretrain/Step Time": 8.53963096626103} +{"Pretrain/Learning Rate": 4.848035516405892e-05, "Pretrain/Loss": 2.154841423034668, "Pretrain/Loss (Raw)": 2.1983256340026855, "Pretrain/Step": 1318, "Pretrain/Step Time": 8.542100863531232} +{"Pretrain/Learning Rate": 4.847743896738517e-05, "Pretrain/Loss": 2.1584224700927734, "Pretrain/Loss (Raw)": 2.344750165939331, "Pretrain/Step": 1319, "Pretrain/Step Time": 8.544192090630531} +{"Pretrain/Learning Rate": 4.847452006318254e-05, "Pretrain/Loss": 2.15917706489563, "Pretrain/Loss (Raw)": 2.163060426712036, "Pretrain/Step": 1320, "Pretrain/Step Time": 8.541367087513208} +{"Pretrain/Learning Rate": 4.8471598451787635e-05, "Pretrain/Loss": 2.1594619750976562, "Pretrain/Loss (Raw)": 2.1047120094299316, "Pretrain/Step": 1321, "Pretrain/Step Time": 8.536958580836654} +{"Pretrain/Learning Rate": 4.8468674133537395e-05, "Pretrain/Loss": 2.1594791412353516, "Pretrain/Loss (Raw)": 2.113783836364746, "Pretrain/Step": 1322, "Pretrain/Step Time": 8.543154910206795} +{"Pretrain/Learning Rate": 4.846574710876907e-05, "Pretrain/Loss": 2.1593427658081055, "Pretrain/Loss (Raw)": 2.1106173992156982, "Pretrain/Step": 1323, "Pretrain/Step Time": 8.537040865048766} +{"Pretrain/Learning Rate": 4.846281737782021e-05, "Pretrain/Loss": 2.160412311553955, "Pretrain/Loss (Raw)": 2.227741003036499, "Pretrain/Step": 1324, "Pretrain/Step Time": 8.53859587945044} +{"Pretrain/Learning Rate": 4.845988494102869e-05, "Pretrain/Loss": 2.1585049629211426, "Pretrain/Loss (Raw)": 2.0434107780456543, "Pretrain/Step": 1325, "Pretrain/Step Time": 8.534020591527224} +{"Pretrain/Learning Rate": 4.845694979873269e-05, "Pretrain/Loss": 2.1575050354003906, "Pretrain/Loss (Raw)": 2.1301636695861816, "Pretrain/Step": 1326, "Pretrain/Step Time": 8.540377730503678} +{"Pretrain/Learning Rate": 4.845401195127071e-05, "Pretrain/Loss": 2.154229164123535, "Pretrain/Loss (Raw)": 1.8943575620651245, "Pretrain/Step": 1327, "Pretrain/Step Time": 8.537054246291518} +{"Pretrain/Learning Rate": 4.845107139898155e-05, "Pretrain/Loss": 2.1542201042175293, "Pretrain/Loss (Raw)": 2.0734405517578125, "Pretrain/Step": 1328, "Pretrain/Step Time": 8.5417659021914} +{"Pretrain/Learning Rate": 4.8448128142204334e-05, "Pretrain/Loss": 2.152756690979004, "Pretrain/Loss (Raw)": 2.146444320678711, "Pretrain/Step": 1329, "Pretrain/Step Time": 8.53898211568594} +{"Pretrain/Learning Rate": 4.8445182181278494e-05, "Pretrain/Loss": 2.152454376220703, "Pretrain/Loss (Raw)": 2.227494716644287, "Pretrain/Step": 1330, "Pretrain/Step Time": 8.543608518317342} +{"Pretrain/Learning Rate": 4.8442233516543756e-05, "Pretrain/Loss": 2.1503713130950928, "Pretrain/Loss (Raw)": 1.9327086210250854, "Pretrain/Step": 1331, "Pretrain/Step Time": 8.544373616576195} +{"Pretrain/Learning Rate": 4.8439282148340195e-05, "Pretrain/Loss": 2.1509437561035156, "Pretrain/Loss (Raw)": 2.097963571548462, "Pretrain/Step": 1332, "Pretrain/Step Time": 8.546279264613986} +{"Pretrain/Learning Rate": 4.843632807700816e-05, "Pretrain/Loss": 2.1515421867370605, "Pretrain/Loss (Raw)": 2.2471516132354736, "Pretrain/Step": 1333, "Pretrain/Step Time": 8.542342631146312} +{"Pretrain/Learning Rate": 4.843337130288834e-05, "Pretrain/Loss": 2.1491689682006836, "Pretrain/Loss (Raw)": 1.9616848230361938, "Pretrain/Step": 1334, "Pretrain/Step Time": 8.548215543851256} +{"Pretrain/Learning Rate": 4.843041182632172e-05, "Pretrain/Loss": 2.1471824645996094, "Pretrain/Loss (Raw)": 1.9507920742034912, "Pretrain/Step": 1335, "Pretrain/Step Time": 8.539716081693769} +{"Pretrain/Learning Rate": 4.84274496476496e-05, "Pretrain/Loss": 2.1506149768829346, "Pretrain/Loss (Raw)": 2.3147947788238525, "Pretrain/Step": 1336, "Pretrain/Step Time": 8.540079670026898} +{"Pretrain/Learning Rate": 4.84244847672136e-05, "Pretrain/Loss": 2.1479735374450684, "Pretrain/Loss (Raw)": 2.0450284481048584, "Pretrain/Step": 1337, "Pretrain/Step Time": 8.53458041511476} +{"Pretrain/Learning Rate": 4.842151718535563e-05, "Pretrain/Loss": 2.1486804485321045, "Pretrain/Loss (Raw)": 2.2074859142303467, "Pretrain/Step": 1338, "Pretrain/Step Time": 8.540933191776276} +{"Pretrain/Learning Rate": 4.841854690241793e-05, "Pretrain/Loss": 2.1481683254241943, "Pretrain/Loss (Raw)": 2.0866928100585938, "Pretrain/Step": 1339, "Pretrain/Step Time": 8.537727957591414} +{"Pretrain/Learning Rate": 4.841557391874304e-05, "Pretrain/Loss": 2.147569179534912, "Pretrain/Loss (Raw)": 2.1936051845550537, "Pretrain/Step": 1340, "Pretrain/Step Time": 8.549816073849797} +{"Pretrain/Learning Rate": 4.8412598234673845e-05, "Pretrain/Loss": 2.146404266357422, "Pretrain/Loss (Raw)": 2.240750312805176, "Pretrain/Step": 1341, "Pretrain/Step Time": 8.547701966017485} +{"Pretrain/Learning Rate": 4.840961985055349e-05, "Pretrain/Loss": 2.1462931632995605, "Pretrain/Loss (Raw)": 2.1987671852111816, "Pretrain/Step": 1342, "Pretrain/Step Time": 8.553183145821095} +{"Pretrain/Learning Rate": 4.8406638766725464e-05, "Pretrain/Loss": 2.145504951477051, "Pretrain/Loss (Raw)": 2.1120645999908447, "Pretrain/Step": 1343, "Pretrain/Step Time": 8.546060632914305} +{"Pretrain/Learning Rate": 4.840365498353357e-05, "Pretrain/Loss": 2.1469814777374268, "Pretrain/Loss (Raw)": 2.301015853881836, "Pretrain/Step": 1344, "Pretrain/Step Time": 8.549106417223811} +{"Pretrain/Learning Rate": 4.840066850132189e-05, "Pretrain/Loss": 2.1451187133789062, "Pretrain/Loss (Raw)": 2.0958309173583984, "Pretrain/Step": 1345, "Pretrain/Step Time": 8.550175849348307} +{"Pretrain/Learning Rate": 4.839767932043485e-05, "Pretrain/Loss": 2.144636869430542, "Pretrain/Loss (Raw)": 1.9771623611450195, "Pretrain/Step": 1346, "Pretrain/Step Time": 8.556719964370131} +{"Pretrain/Learning Rate": 4.839468744121718e-05, "Pretrain/Loss": 2.146571159362793, "Pretrain/Loss (Raw)": 2.353945016860962, "Pretrain/Step": 1347, "Pretrain/Step Time": 8.550614869222045} +{"Pretrain/Learning Rate": 4.8391692864013916e-05, "Pretrain/Loss": 2.147939682006836, "Pretrain/Loss (Raw)": 2.3273937702178955, "Pretrain/Step": 1348, "Pretrain/Step Time": 8.550611533224583} +{"Pretrain/Learning Rate": 4.838869558917041e-05, "Pretrain/Loss": 2.149603843688965, "Pretrain/Loss (Raw)": 2.248196601867676, "Pretrain/Step": 1349, "Pretrain/Step Time": 8.543747898191214} +{"Pretrain/Learning Rate": 4.838569561703231e-05, "Pretrain/Loss": 2.148831605911255, "Pretrain/Loss (Raw)": 2.0990328788757324, "Pretrain/Step": 1350, "Pretrain/Step Time": 8.54694022424519} +{"Pretrain/Learning Rate": 4.83826929479456e-05, "Pretrain/Loss": 2.1514482498168945, "Pretrain/Loss (Raw)": 2.371217727661133, "Pretrain/Step": 1351, "Pretrain/Step Time": 8.548281850293279} +{"Pretrain/Learning Rate": 4.837968758225655e-05, "Pretrain/Loss": 2.1509006023406982, "Pretrain/Loss (Raw)": 2.094041347503662, "Pretrain/Step": 1352, "Pretrain/Step Time": 8.554756412282586} +{"Pretrain/Learning Rate": 4.837667952031176e-05, "Pretrain/Loss": 2.1514155864715576, "Pretrain/Loss (Raw)": 2.2557973861694336, "Pretrain/Step": 1353, "Pretrain/Step Time": 8.552175298333168} +{"Pretrain/Learning Rate": 4.8373668762458144e-05, "Pretrain/Loss": 2.154663562774658, "Pretrain/Loss (Raw)": 2.4899044036865234, "Pretrain/Step": 1354, "Pretrain/Step Time": 8.553965957835317} +{"Pretrain/Learning Rate": 4.8370655309042896e-05, "Pretrain/Loss": 2.155203342437744, "Pretrain/Loss (Raw)": 2.233419179916382, "Pretrain/Step": 1355, "Pretrain/Step Time": 8.546977372840047} +{"Pretrain/Learning Rate": 4.8367639160413553e-05, "Pretrain/Loss": 2.1517765522003174, "Pretrain/Loss (Raw)": 1.8923685550689697, "Pretrain/Step": 1356, "Pretrain/Step Time": 8.554873708635569} +{"Pretrain/Learning Rate": 4.8364620316917956e-05, "Pretrain/Loss": 2.1509456634521484, "Pretrain/Loss (Raw)": 2.057579755783081, "Pretrain/Step": 1357, "Pretrain/Step Time": 8.554800601676106} +{"Pretrain/Learning Rate": 4.836159877890424e-05, "Pretrain/Loss": 2.1512885093688965, "Pretrain/Loss (Raw)": 2.0693905353546143, "Pretrain/Step": 1358, "Pretrain/Step Time": 8.559198375791311} +{"Pretrain/Learning Rate": 4.835857454672087e-05, "Pretrain/Loss": 2.150665760040283, "Pretrain/Loss (Raw)": 2.1897900104522705, "Pretrain/Step": 1359, "Pretrain/Step Time": 8.553573684766889} +{"Pretrain/Learning Rate": 4.835554762071661e-05, "Pretrain/Loss": 2.150789737701416, "Pretrain/Loss (Raw)": 2.1459102630615234, "Pretrain/Step": 1360, "Pretrain/Step Time": 8.556006027385592} +{"Pretrain/Learning Rate": 4.8352518001240555e-05, "Pretrain/Loss": 2.1505448818206787, "Pretrain/Loss (Raw)": 2.161031723022461, "Pretrain/Step": 1361, "Pretrain/Step Time": 8.552242014557123} +{"Pretrain/Learning Rate": 4.834948568864207e-05, "Pretrain/Loss": 2.1503546237945557, "Pretrain/Loss (Raw)": 2.0240590572357178, "Pretrain/Step": 1362, "Pretrain/Step Time": 8.55435023829341} +{"Pretrain/Learning Rate": 4.8346450683270875e-05, "Pretrain/Loss": 2.148165464401245, "Pretrain/Loss (Raw)": 2.3005714416503906, "Pretrain/Step": 1363, "Pretrain/Step Time": 8.550666350871325} +{"Pretrain/Learning Rate": 4.8343412985476974e-05, "Pretrain/Loss": 2.149714469909668, "Pretrain/Loss (Raw)": 2.228147029876709, "Pretrain/Step": 1364, "Pretrain/Step Time": 8.563269319012761} +{"Pretrain/Learning Rate": 4.83403725956107e-05, "Pretrain/Loss": 2.146993637084961, "Pretrain/Loss (Raw)": 1.801226019859314, "Pretrain/Step": 1365, "Pretrain/Step Time": 8.558341911062598} +{"Pretrain/Learning Rate": 4.8337329514022664e-05, "Pretrain/Loss": 2.14748477935791, "Pretrain/Loss (Raw)": 2.097007989883423, "Pretrain/Step": 1366, "Pretrain/Step Time": 8.557482710108161} +{"Pretrain/Learning Rate": 4.833428374106382e-05, "Pretrain/Loss": 2.1495401859283447, "Pretrain/Loss (Raw)": 2.203655242919922, "Pretrain/Step": 1367, "Pretrain/Step Time": 8.556361110880971} +{"Pretrain/Learning Rate": 4.833123527708542e-05, "Pretrain/Loss": 2.1507351398468018, "Pretrain/Loss (Raw)": 2.3031044006347656, "Pretrain/Step": 1368, "Pretrain/Step Time": 8.55987778864801} +{"Pretrain/Learning Rate": 4.832818412243904e-05, "Pretrain/Loss": 2.1501340866088867, "Pretrain/Loss (Raw)": 2.2524428367614746, "Pretrain/Step": 1369, "Pretrain/Step Time": 8.558934262022376} +{"Pretrain/Learning Rate": 4.8325130277476526e-05, "Pretrain/Loss": 2.150702953338623, "Pretrain/Loss (Raw)": 2.374394178390503, "Pretrain/Step": 1370, "Pretrain/Step Time": 8.560237739235163} +{"Pretrain/Learning Rate": 4.832207374255008e-05, "Pretrain/Loss": 2.1535420417785645, "Pretrain/Loss (Raw)": 2.3692362308502197, "Pretrain/Step": 1371, "Pretrain/Step Time": 8.553442334756255} +{"Pretrain/Learning Rate": 4.8319014518012195e-05, "Pretrain/Loss": 2.1540470123291016, "Pretrain/Loss (Raw)": 2.2126057147979736, "Pretrain/Step": 1372, "Pretrain/Step Time": 8.555959427729249} +{"Pretrain/Learning Rate": 4.831595260421567e-05, "Pretrain/Loss": 2.1510121822357178, "Pretrain/Loss (Raw)": 1.9315845966339111, "Pretrain/Step": 1373, "Pretrain/Step Time": 8.553294450044632} +{"Pretrain/Learning Rate": 4.8312888001513624e-05, "Pretrain/Loss": 2.1517157554626465, "Pretrain/Loss (Raw)": 2.1153693199157715, "Pretrain/Step": 1374, "Pretrain/Step Time": 8.552283246070147} +{"Pretrain/Learning Rate": 4.830982071025948e-05, "Pretrain/Loss": 2.154238224029541, "Pretrain/Loss (Raw)": 2.4190914630889893, "Pretrain/Step": 1375, "Pretrain/Step Time": 8.55640752799809} +{"Pretrain/Learning Rate": 4.830675073080697e-05, "Pretrain/Loss": 2.154911994934082, "Pretrain/Loss (Raw)": 2.259009599685669, "Pretrain/Step": 1376, "Pretrain/Step Time": 8.56210071220994} +{"Pretrain/Learning Rate": 4.830367806351015e-05, "Pretrain/Loss": 2.1534783840179443, "Pretrain/Loss (Raw)": 1.895749807357788, "Pretrain/Step": 1377, "Pretrain/Step Time": 8.556160803884268} +{"Pretrain/Learning Rate": 4.830060270872335e-05, "Pretrain/Loss": 2.15440034866333, "Pretrain/Loss (Raw)": 2.4659321308135986, "Pretrain/Step": 1378, "Pretrain/Step Time": 8.557949839159846} +{"Pretrain/Learning Rate": 4.8297524666801265e-05, "Pretrain/Loss": 2.156895875930786, "Pretrain/Loss (Raw)": 2.4629335403442383, "Pretrain/Step": 1379, "Pretrain/Step Time": 8.553433928638697} +{"Pretrain/Learning Rate": 4.829444393809884e-05, "Pretrain/Loss": 2.1569833755493164, "Pretrain/Loss (Raw)": 2.212185859680176, "Pretrain/Step": 1380, "Pretrain/Step Time": 8.555883053690195} +{"Pretrain/Learning Rate": 4.829136052297138e-05, "Pretrain/Loss": 2.1557326316833496, "Pretrain/Loss (Raw)": 2.1134450435638428, "Pretrain/Step": 1381, "Pretrain/Step Time": 8.550611080601811} +{"Pretrain/Learning Rate": 4.828827442177447e-05, "Pretrain/Loss": 2.1553831100463867, "Pretrain/Loss (Raw)": 2.2429423332214355, "Pretrain/Step": 1382, "Pretrain/Step Time": 8.556821689009666} +{"Pretrain/Learning Rate": 4.8285185634864024e-05, "Pretrain/Loss": 2.1556551456451416, "Pretrain/Loss (Raw)": 2.0517008304595947, "Pretrain/Step": 1383, "Pretrain/Step Time": 8.552826967090368} +{"Pretrain/Learning Rate": 4.8282094162596235e-05, "Pretrain/Loss": 2.156346559524536, "Pretrain/Loss (Raw)": 2.0905957221984863, "Pretrain/Step": 1384, "Pretrain/Step Time": 8.557076847180724} +{"Pretrain/Learning Rate": 4.8279000005327644e-05, "Pretrain/Loss": 2.1570000648498535, "Pretrain/Loss (Raw)": 2.225715160369873, "Pretrain/Step": 1385, "Pretrain/Step Time": 8.553633140400052} +{"Pretrain/Learning Rate": 4.827590316341508e-05, "Pretrain/Loss": 2.1538846492767334, "Pretrain/Loss (Raw)": 1.972589373588562, "Pretrain/Step": 1386, "Pretrain/Step Time": 8.556118372827768} +{"Pretrain/Learning Rate": 4.827280363721568e-05, "Pretrain/Loss": 2.155277729034424, "Pretrain/Loss (Raw)": 2.120404005050659, "Pretrain/Step": 1387, "Pretrain/Step Time": 8.555059559643269} +{"Pretrain/Learning Rate": 4.82697014270869e-05, "Pretrain/Loss": 2.1555685997009277, "Pretrain/Loss (Raw)": 2.1136860847473145, "Pretrain/Step": 1388, "Pretrain/Step Time": 8.564932690933347} +{"Pretrain/Learning Rate": 4.8266596533386505e-05, "Pretrain/Loss": 2.15555477142334, "Pretrain/Loss (Raw)": 2.210712432861328, "Pretrain/Step": 1389, "Pretrain/Step Time": 8.558821249753237} +{"Pretrain/Learning Rate": 4.8263488956472555e-05, "Pretrain/Loss": 2.1537487506866455, "Pretrain/Loss (Raw)": 2.0442700386047363, "Pretrain/Step": 1390, "Pretrain/Step Time": 8.558205641806126} +{"Pretrain/Learning Rate": 4.826037869670345e-05, "Pretrain/Loss": 2.155672788619995, "Pretrain/Loss (Raw)": 2.1978862285614014, "Pretrain/Step": 1391, "Pretrain/Step Time": 8.552817828953266} +{"Pretrain/Learning Rate": 4.8257265754437854e-05, "Pretrain/Loss": 2.154038906097412, "Pretrain/Loss (Raw)": 2.0663626194000244, "Pretrain/Step": 1392, "Pretrain/Step Time": 8.555746797472239} +{"Pretrain/Learning Rate": 4.825415013003478e-05, "Pretrain/Loss": 2.1514463424682617, "Pretrain/Loss (Raw)": 1.9019279479980469, "Pretrain/Step": 1393, "Pretrain/Step Time": 8.554937092587352} +{"Pretrain/Learning Rate": 4.8251031823853546e-05, "Pretrain/Loss": 2.1548385620117188, "Pretrain/Loss (Raw)": 2.410351276397705, "Pretrain/Step": 1394, "Pretrain/Step Time": 8.566294869408011} +{"Pretrain/Learning Rate": 4.824791083625375e-05, "Pretrain/Loss": 2.153623580932617, "Pretrain/Loss (Raw)": 2.076622247695923, "Pretrain/Step": 1395, "Pretrain/Step Time": 8.566602105274796} +{"Pretrain/Learning Rate": 4.8244787167595335e-05, "Pretrain/Loss": 2.151937484741211, "Pretrain/Loss (Raw)": 1.967801809310913, "Pretrain/Step": 1396, "Pretrain/Step Time": 8.551613351330161} +{"Pretrain/Learning Rate": 4.824166081823853e-05, "Pretrain/Loss": 2.1497726440429688, "Pretrain/Loss (Raw)": 1.9524232149124146, "Pretrain/Step": 1397, "Pretrain/Step Time": 8.549186512827873} +{"Pretrain/Learning Rate": 4.823853178854387e-05, "Pretrain/Loss": 2.1517269611358643, "Pretrain/Loss (Raw)": 2.4072744846343994, "Pretrain/Step": 1398, "Pretrain/Step Time": 8.549999624490738} +{"Pretrain/Learning Rate": 4.8235400078872234e-05, "Pretrain/Loss": 2.149825096130371, "Pretrain/Loss (Raw)": 1.815737247467041, "Pretrain/Step": 1399, "Pretrain/Step Time": 8.551034718751907} +{"Pretrain/Learning Rate": 4.823226568958477e-05, "Pretrain/Loss": 2.150543212890625, "Pretrain/Loss (Raw)": 2.2741804122924805, "Pretrain/Step": 1400, "Pretrain/Step Time": 8.559728505089879} +{"Pretrain/Learning Rate": 4.822912862104295e-05, "Pretrain/Loss": 2.149649143218994, "Pretrain/Loss (Raw)": 2.061783790588379, "Pretrain/Step": 1401, "Pretrain/Step Time": 8.557894108816981} +{"Pretrain/Learning Rate": 4.8225988873608554e-05, "Pretrain/Loss": 2.1492180824279785, "Pretrain/Loss (Raw)": 2.0187878608703613, "Pretrain/Step": 1402, "Pretrain/Step Time": 8.549382386729121} +{"Pretrain/Learning Rate": 4.8222846447643686e-05, "Pretrain/Loss": 2.150595188140869, "Pretrain/Loss (Raw)": 2.2314064502716064, "Pretrain/Step": 1403, "Pretrain/Step Time": 8.548296390101314} +{"Pretrain/Learning Rate": 4.8219701343510727e-05, "Pretrain/Loss": 2.1518912315368652, "Pretrain/Loss (Raw)": 2.2995030879974365, "Pretrain/Step": 1404, "Pretrain/Step Time": 8.549350952729583} +{"Pretrain/Learning Rate": 4.8216553561572395e-05, "Pretrain/Loss": 2.1517281532287598, "Pretrain/Loss (Raw)": 2.161119222640991, "Pretrain/Step": 1405, "Pretrain/Step Time": 8.55006187967956} +{"Pretrain/Learning Rate": 4.821340310219171e-05, "Pretrain/Loss": 2.148800849914551, "Pretrain/Loss (Raw)": 2.1342647075653076, "Pretrain/Step": 1406, "Pretrain/Step Time": 8.553215485066175} +{"Pretrain/Learning Rate": 4.8210249965732e-05, "Pretrain/Loss": 2.1486265659332275, "Pretrain/Loss (Raw)": 2.050013780593872, "Pretrain/Step": 1407, "Pretrain/Step Time": 8.544402562081814} +{"Pretrain/Learning Rate": 4.8207094152556886e-05, "Pretrain/Loss": 2.146681070327759, "Pretrain/Loss (Raw)": 2.021862030029297, "Pretrain/Step": 1408, "Pretrain/Step Time": 8.545841371640563} +{"Pretrain/Learning Rate": 4.820393566303032e-05, "Pretrain/Loss": 2.1461427211761475, "Pretrain/Loss (Raw)": 2.0035674571990967, "Pretrain/Step": 1409, "Pretrain/Step Time": 8.550335336476564} +{"Pretrain/Learning Rate": 4.8200774497516555e-05, "Pretrain/Loss": 2.1458168029785156, "Pretrain/Loss (Raw)": 2.1243174076080322, "Pretrain/Step": 1410, "Pretrain/Step Time": 8.547386813908815} +{"Pretrain/Learning Rate": 4.8197610656380144e-05, "Pretrain/Loss": 2.1475670337677, "Pretrain/Loss (Raw)": 2.1439132690429688, "Pretrain/Step": 1411, "Pretrain/Step Time": 8.544086718931794} +{"Pretrain/Learning Rate": 4.8194444139985965e-05, "Pretrain/Loss": 2.148055076599121, "Pretrain/Loss (Raw)": 2.1644701957702637, "Pretrain/Step": 1412, "Pretrain/Step Time": 8.545038737356663} +{"Pretrain/Learning Rate": 4.81912749486992e-05, "Pretrain/Loss": 2.148630142211914, "Pretrain/Loss (Raw)": 2.190507411956787, "Pretrain/Step": 1413, "Pretrain/Step Time": 8.553219502791762} +{"Pretrain/Learning Rate": 4.818810308288531e-05, "Pretrain/Loss": 2.149003267288208, "Pretrain/Loss (Raw)": 2.215754270553589, "Pretrain/Step": 1414, "Pretrain/Step Time": 8.54264971241355} +{"Pretrain/Learning Rate": 4.818492854291012e-05, "Pretrain/Loss": 2.153529644012451, "Pretrain/Loss (Raw)": 2.592461347579956, "Pretrain/Step": 1415, "Pretrain/Step Time": 8.545522103086114} +{"Pretrain/Learning Rate": 4.818175132913971e-05, "Pretrain/Loss": 2.1529247760772705, "Pretrain/Loss (Raw)": 1.984977126121521, "Pretrain/Step": 1416, "Pretrain/Step Time": 8.546212997287512} +{"Pretrain/Learning Rate": 4.817857144194051e-05, "Pretrain/Loss": 2.1537084579467773, "Pretrain/Loss (Raw)": 2.1232104301452637, "Pretrain/Step": 1417, "Pretrain/Step Time": 8.543313944712281} +{"Pretrain/Learning Rate": 4.817538888167923e-05, "Pretrain/Loss": 2.1594600677490234, "Pretrain/Loss (Raw)": 2.7509562969207764, "Pretrain/Step": 1418, "Pretrain/Step Time": 8.548888335004449} +{"Pretrain/Learning Rate": 4.817220364872289e-05, "Pretrain/Loss": 2.1580309867858887, "Pretrain/Loss (Raw)": 1.9499222040176392, "Pretrain/Step": 1419, "Pretrain/Step Time": 8.5549840554595} +{"Pretrain/Learning Rate": 4.816901574343884e-05, "Pretrain/Loss": 2.158369541168213, "Pretrain/Loss (Raw)": 2.3647303581237793, "Pretrain/Step": 1420, "Pretrain/Step Time": 8.546741742640734} +{"Pretrain/Learning Rate": 4.816582516619471e-05, "Pretrain/Loss": 2.160158634185791, "Pretrain/Loss (Raw)": 2.144733428955078, "Pretrain/Step": 1421, "Pretrain/Step Time": 8.548533299937844} +{"Pretrain/Learning Rate": 4.816263191735847e-05, "Pretrain/Loss": 2.1622982025146484, "Pretrain/Loss (Raw)": 2.16107177734375, "Pretrain/Step": 1422, "Pretrain/Step Time": 8.542140940204263} +{"Pretrain/Learning Rate": 4.8159435997298375e-05, "Pretrain/Loss": 2.162684917449951, "Pretrain/Loss (Raw)": 2.0469675064086914, "Pretrain/Step": 1423, "Pretrain/Step Time": 8.541401222348213} +{"Pretrain/Learning Rate": 4.8156237406382975e-05, "Pretrain/Loss": 2.1653151512145996, "Pretrain/Loss (Raw)": 2.280902147293091, "Pretrain/Step": 1424, "Pretrain/Step Time": 8.548338148742914} +{"Pretrain/Learning Rate": 4.815303614498118e-05, "Pretrain/Loss": 2.1648993492126465, "Pretrain/Loss (Raw)": 2.199007511138916, "Pretrain/Step": 1425, "Pretrain/Step Time": 8.556595349684358} +{"Pretrain/Learning Rate": 4.814983221346214e-05, "Pretrain/Loss": 2.1655497550964355, "Pretrain/Loss (Raw)": 2.0904369354248047, "Pretrain/Step": 1426, "Pretrain/Step Time": 8.54429891705513} +{"Pretrain/Learning Rate": 4.814662561219537e-05, "Pretrain/Loss": 2.166780948638916, "Pretrain/Loss (Raw)": 2.3470771312713623, "Pretrain/Step": 1427, "Pretrain/Step Time": 8.549364782869816} +{"Pretrain/Learning Rate": 4.814341634155066e-05, "Pretrain/Loss": 2.169538974761963, "Pretrain/Loss (Raw)": 2.5189599990844727, "Pretrain/Step": 1428, "Pretrain/Step Time": 8.547384282574058} +{"Pretrain/Learning Rate": 4.8140204401898134e-05, "Pretrain/Loss": 2.171144962310791, "Pretrain/Loss (Raw)": 2.346405029296875, "Pretrain/Step": 1429, "Pretrain/Step Time": 8.546455962583423} +{"Pretrain/Learning Rate": 4.813698979360819e-05, "Pretrain/Loss": 2.172809362411499, "Pretrain/Loss (Raw)": 2.2760255336761475, "Pretrain/Step": 1430, "Pretrain/Step Time": 8.552815990522504} +{"Pretrain/Learning Rate": 4.813377251705156e-05, "Pretrain/Loss": 2.1691668033599854, "Pretrain/Loss (Raw)": 1.8925223350524902, "Pretrain/Step": 1431, "Pretrain/Step Time": 8.548555323854089} +{"Pretrain/Learning Rate": 4.8130552572599265e-05, "Pretrain/Loss": 2.1684162616729736, "Pretrain/Loss (Raw)": 2.0524046421051025, "Pretrain/Step": 1432, "Pretrain/Step Time": 8.546241600066423} +{"Pretrain/Learning Rate": 4.8127329960622656e-05, "Pretrain/Loss": 2.1665735244750977, "Pretrain/Loss (Raw)": 2.0958898067474365, "Pretrain/Step": 1433, "Pretrain/Step Time": 8.552560150623322} +{"Pretrain/Learning Rate": 4.8124104681493375e-05, "Pretrain/Loss": 2.1642539501190186, "Pretrain/Loss (Raw)": 2.171093702316284, "Pretrain/Step": 1434, "Pretrain/Step Time": 8.553766125813127} +{"Pretrain/Learning Rate": 4.8120876735583384e-05, "Pretrain/Loss": 2.162787914276123, "Pretrain/Loss (Raw)": 1.9455204010009766, "Pretrain/Step": 1435, "Pretrain/Step Time": 8.55057067424059} +{"Pretrain/Learning Rate": 4.811764612326493e-05, "Pretrain/Loss": 2.162364959716797, "Pretrain/Loss (Raw)": 2.094212770462036, "Pretrain/Step": 1436, "Pretrain/Step Time": 8.555776929482818} +{"Pretrain/Learning Rate": 4.8114412844910595e-05, "Pretrain/Loss": 2.159158229827881, "Pretrain/Loss (Raw)": 2.036555528640747, "Pretrain/Step": 1437, "Pretrain/Step Time": 8.555651389062405} +{"Pretrain/Learning Rate": 4.8111176900893254e-05, "Pretrain/Loss": 2.1605405807495117, "Pretrain/Loss (Raw)": 2.0945382118225098, "Pretrain/Step": 1438, "Pretrain/Step Time": 8.54984594322741} +{"Pretrain/Learning Rate": 4.810793829158609e-05, "Pretrain/Loss": 2.158252239227295, "Pretrain/Loss (Raw)": 2.069826126098633, "Pretrain/Step": 1439, "Pretrain/Step Time": 8.553726790472865} +{"Pretrain/Learning Rate": 4.8104697017362595e-05, "Pretrain/Loss": 2.1561460494995117, "Pretrain/Loss (Raw)": 1.8180822134017944, "Pretrain/Step": 1440, "Pretrain/Step Time": 8.554240813478827} +{"Pretrain/Learning Rate": 4.8101453078596565e-05, "Pretrain/Loss": 2.1571898460388184, "Pretrain/Loss (Raw)": 2.294142484664917, "Pretrain/Step": 1441, "Pretrain/Step Time": 8.554652910679579} +{"Pretrain/Learning Rate": 4.809820647566211e-05, "Pretrain/Loss": 2.1618590354919434, "Pretrain/Loss (Raw)": 2.5126829147338867, "Pretrain/Step": 1442, "Pretrain/Step Time": 8.55654819495976} +{"Pretrain/Learning Rate": 4.8094957208933635e-05, "Pretrain/Loss": 2.1641783714294434, "Pretrain/Loss (Raw)": 2.475446939468384, "Pretrain/Step": 1443, "Pretrain/Step Time": 8.554707575589418} +{"Pretrain/Learning Rate": 4.809170527878587e-05, "Pretrain/Loss": 2.1638660430908203, "Pretrain/Loss (Raw)": 2.3075366020202637, "Pretrain/Step": 1444, "Pretrain/Step Time": 8.548993106931448} +{"Pretrain/Learning Rate": 4.808845068559384e-05, "Pretrain/Loss": 2.163125514984131, "Pretrain/Loss (Raw)": 2.104745626449585, "Pretrain/Step": 1445, "Pretrain/Step Time": 8.55559473671019} +{"Pretrain/Learning Rate": 4.808519342973289e-05, "Pretrain/Loss": 2.1620845794677734, "Pretrain/Loss (Raw)": 2.0650696754455566, "Pretrain/Step": 1446, "Pretrain/Step Time": 8.550876297056675} +{"Pretrain/Learning Rate": 4.808193351157865e-05, "Pretrain/Loss": 2.161386013031006, "Pretrain/Loss (Raw)": 2.2553751468658447, "Pretrain/Step": 1447, "Pretrain/Step Time": 8.553134156391025} +{"Pretrain/Learning Rate": 4.8078670931507064e-05, "Pretrain/Loss": 2.1602783203125, "Pretrain/Loss (Raw)": 2.0212554931640625, "Pretrain/Step": 1448, "Pretrain/Step Time": 8.553598571568727} +{"Pretrain/Learning Rate": 4.80754056898944e-05, "Pretrain/Loss": 2.1605725288391113, "Pretrain/Loss (Raw)": 2.14237380027771, "Pretrain/Step": 1449, "Pretrain/Step Time": 8.552390929311514} +{"Pretrain/Learning Rate": 4.807213778711722e-05, "Pretrain/Loss": 2.159761428833008, "Pretrain/Loss (Raw)": 2.0099618434906006, "Pretrain/Step": 1450, "Pretrain/Step Time": 8.553139552474022} +{"Pretrain/Learning Rate": 4.8068867223552384e-05, "Pretrain/Loss": 2.1611876487731934, "Pretrain/Loss (Raw)": 2.2931759357452393, "Pretrain/Step": 1451, "Pretrain/Step Time": 8.557129269465804} +{"Pretrain/Learning Rate": 4.8065593999577086e-05, "Pretrain/Loss": 2.159416675567627, "Pretrain/Loss (Raw)": 2.001028060913086, "Pretrain/Step": 1452, "Pretrain/Step Time": 8.556574914604425} +{"Pretrain/Learning Rate": 4.806231811556879e-05, "Pretrain/Loss": 2.159689426422119, "Pretrain/Loss (Raw)": 2.078329086303711, "Pretrain/Step": 1453, "Pretrain/Step Time": 8.555780006572604} +{"Pretrain/Learning Rate": 4.80590395719053e-05, "Pretrain/Loss": 2.158787727355957, "Pretrain/Loss (Raw)": 2.0147461891174316, "Pretrain/Step": 1454, "Pretrain/Step Time": 8.554866343736649} +{"Pretrain/Learning Rate": 4.805575836896471e-05, "Pretrain/Loss": 2.1616716384887695, "Pretrain/Loss (Raw)": 2.2635276317596436, "Pretrain/Step": 1455, "Pretrain/Step Time": 8.557919524610043} +{"Pretrain/Learning Rate": 4.805247450712542e-05, "Pretrain/Loss": 2.160961151123047, "Pretrain/Loss (Raw)": 1.9824872016906738, "Pretrain/Step": 1456, "Pretrain/Step Time": 8.558079844340682} +{"Pretrain/Learning Rate": 4.804918798676614e-05, "Pretrain/Loss": 2.160388946533203, "Pretrain/Loss (Raw)": 2.0731985569000244, "Pretrain/Step": 1457, "Pretrain/Step Time": 8.558866765350103} +{"Pretrain/Learning Rate": 4.804589880826589e-05, "Pretrain/Loss": 2.1587119102478027, "Pretrain/Loss (Raw)": 2.012852668762207, "Pretrain/Step": 1458, "Pretrain/Step Time": 8.558971209451556} +{"Pretrain/Learning Rate": 4.8042606972004e-05, "Pretrain/Loss": 2.160229444503784, "Pretrain/Loss (Raw)": 2.126923084259033, "Pretrain/Step": 1459, "Pretrain/Step Time": 8.558746661990881} +{"Pretrain/Learning Rate": 4.803931247836009e-05, "Pretrain/Loss": 2.160444736480713, "Pretrain/Loss (Raw)": 2.125544548034668, "Pretrain/Step": 1460, "Pretrain/Step Time": 8.556860949844122} +{"Pretrain/Learning Rate": 4.80360153277141e-05, "Pretrain/Loss": 2.1596763134002686, "Pretrain/Loss (Raw)": 2.1487905979156494, "Pretrain/Step": 1461, "Pretrain/Step Time": 8.56279563345015} +{"Pretrain/Learning Rate": 4.8032715520446275e-05, "Pretrain/Loss": 2.159510612487793, "Pretrain/Loss (Raw)": 1.9404364824295044, "Pretrain/Step": 1462, "Pretrain/Step Time": 8.558694722130895} +{"Pretrain/Learning Rate": 4.802941305693716e-05, "Pretrain/Loss": 2.1616008281707764, "Pretrain/Loss (Raw)": 2.2183656692504883, "Pretrain/Step": 1463, "Pretrain/Step Time": 8.564093731343746} +{"Pretrain/Learning Rate": 4.802610793756761e-05, "Pretrain/Loss": 2.159731864929199, "Pretrain/Loss (Raw)": 2.075568199157715, "Pretrain/Step": 1464, "Pretrain/Step Time": 8.561948474496603} +{"Pretrain/Learning Rate": 4.8022800162718794e-05, "Pretrain/Loss": 2.1606037616729736, "Pretrain/Loss (Raw)": 2.1566226482391357, "Pretrain/Step": 1465, "Pretrain/Step Time": 8.562690444290638} +{"Pretrain/Learning Rate": 4.801948973277218e-05, "Pretrain/Loss": 2.1598849296569824, "Pretrain/Loss (Raw)": 2.115467071533203, "Pretrain/Step": 1466, "Pretrain/Step Time": 8.557030888274312} +{"Pretrain/Learning Rate": 4.8016176648109534e-05, "Pretrain/Loss": 2.1600117683410645, "Pretrain/Loss (Raw)": 2.102954387664795, "Pretrain/Step": 1467, "Pretrain/Step Time": 8.564851699396968} +{"Pretrain/Learning Rate": 4.801286090911295e-05, "Pretrain/Loss": 2.160083293914795, "Pretrain/Loss (Raw)": 2.2027587890625, "Pretrain/Step": 1468, "Pretrain/Step Time": 8.554432988166809} +{"Pretrain/Learning Rate": 4.80095425161648e-05, "Pretrain/Loss": 2.1599292755126953, "Pretrain/Loss (Raw)": 2.2209978103637695, "Pretrain/Step": 1469, "Pretrain/Step Time": 8.555510384961963} +{"Pretrain/Learning Rate": 4.800622146964777e-05, "Pretrain/Loss": 2.158853054046631, "Pretrain/Loss (Raw)": 2.0610156059265137, "Pretrain/Step": 1470, "Pretrain/Step Time": 8.55386102385819} +{"Pretrain/Learning Rate": 4.8002897769944885e-05, "Pretrain/Loss": 2.1597347259521484, "Pretrain/Loss (Raw)": 2.2249507904052734, "Pretrain/Step": 1471, "Pretrain/Step Time": 8.559433218091726} +{"Pretrain/Learning Rate": 4.799957141743944e-05, "Pretrain/Loss": 2.159529209136963, "Pretrain/Loss (Raw)": 2.27471923828125, "Pretrain/Step": 1472, "Pretrain/Step Time": 8.563658971339464} +{"Pretrain/Learning Rate": 4.799624241251502e-05, "Pretrain/Loss": 2.1593103408813477, "Pretrain/Loss (Raw)": 2.06779408454895, "Pretrain/Step": 1473, "Pretrain/Step Time": 8.564510265365243} +{"Pretrain/Learning Rate": 4.7992910755555584e-05, "Pretrain/Loss": 2.1596713066101074, "Pretrain/Loss (Raw)": 2.023355722427368, "Pretrain/Step": 1474, "Pretrain/Step Time": 8.558379452675581} +{"Pretrain/Learning Rate": 4.798957644694533e-05, "Pretrain/Loss": 2.1564700603485107, "Pretrain/Loss (Raw)": 1.9441930055618286, "Pretrain/Step": 1475, "Pretrain/Step Time": 8.560511508956552} +{"Pretrain/Learning Rate": 4.7986239487068785e-05, "Pretrain/Loss": 2.154524326324463, "Pretrain/Loss (Raw)": 2.078338384628296, "Pretrain/Step": 1476, "Pretrain/Step Time": 8.556994521990418} +{"Pretrain/Learning Rate": 4.798289987631079e-05, "Pretrain/Loss": 2.1534743309020996, "Pretrain/Loss (Raw)": 2.1138253211975098, "Pretrain/Step": 1477, "Pretrain/Step Time": 8.553723717108369} +{"Pretrain/Learning Rate": 4.797955761505648e-05, "Pretrain/Loss": 2.154085636138916, "Pretrain/Loss (Raw)": 2.177239418029785, "Pretrain/Step": 1478, "Pretrain/Step Time": 8.5582679733634} +{"Pretrain/Learning Rate": 4.7976212703691306e-05, "Pretrain/Loss": 2.153508424758911, "Pretrain/Loss (Raw)": 2.2973573207855225, "Pretrain/Step": 1479, "Pretrain/Step Time": 8.559822315350175} +{"Pretrain/Learning Rate": 4.797286514260101e-05, "Pretrain/Loss": 2.153524398803711, "Pretrain/Loss (Raw)": 2.0960683822631836, "Pretrain/Step": 1480, "Pretrain/Step Time": 8.554072853177786} +{"Pretrain/Learning Rate": 4.7969514932171665e-05, "Pretrain/Loss": 2.1524100303649902, "Pretrain/Loss (Raw)": 2.113175868988037, "Pretrain/Step": 1481, "Pretrain/Step Time": 8.551916850730777} +{"Pretrain/Learning Rate": 4.796616207278961e-05, "Pretrain/Loss": 2.1499669551849365, "Pretrain/Loss (Raw)": 2.177198886871338, "Pretrain/Step": 1482, "Pretrain/Step Time": 8.55269069969654} +{"Pretrain/Learning Rate": 4.796280656484153e-05, "Pretrain/Loss": 2.149203300476074, "Pretrain/Loss (Raw)": 2.1356780529022217, "Pretrain/Step": 1483, "Pretrain/Step Time": 8.55669086612761} +{"Pretrain/Learning Rate": 4.795944840871439e-05, "Pretrain/Loss": 2.150852680206299, "Pretrain/Loss (Raw)": 2.1034579277038574, "Pretrain/Step": 1484, "Pretrain/Step Time": 8.55277700535953} +{"Pretrain/Learning Rate": 4.7956087604795474e-05, "Pretrain/Loss": 2.151930332183838, "Pretrain/Loss (Raw)": 2.1955366134643555, "Pretrain/Step": 1485, "Pretrain/Step Time": 8.553054179996252} +{"Pretrain/Learning Rate": 4.7952724153472366e-05, "Pretrain/Loss": 2.1534996032714844, "Pretrain/Loss (Raw)": 2.270246744155884, "Pretrain/Step": 1486, "Pretrain/Step Time": 8.552684593945742} +{"Pretrain/Learning Rate": 4.7949358055132945e-05, "Pretrain/Loss": 2.152317523956299, "Pretrain/Loss (Raw)": 2.0384953022003174, "Pretrain/Step": 1487, "Pretrain/Step Time": 8.550189374014735} +{"Pretrain/Learning Rate": 4.7945989310165415e-05, "Pretrain/Loss": 2.1521482467651367, "Pretrain/Loss (Raw)": 2.1242306232452393, "Pretrain/Step": 1488, "Pretrain/Step Time": 8.547164868563414} +{"Pretrain/Learning Rate": 4.794261791895828e-05, "Pretrain/Loss": 2.152118444442749, "Pretrain/Loss (Raw)": 2.1572279930114746, "Pretrain/Step": 1489, "Pretrain/Step Time": 8.549513455480337} +{"Pretrain/Learning Rate": 4.793924388190033e-05, "Pretrain/Loss": 2.152108669281006, "Pretrain/Loss (Raw)": 2.022796869277954, "Pretrain/Step": 1490, "Pretrain/Step Time": 8.547217661514878} +{"Pretrain/Learning Rate": 4.793586719938068e-05, "Pretrain/Loss": 2.1519007682800293, "Pretrain/Loss (Raw)": 2.2739627361297607, "Pretrain/Step": 1491, "Pretrain/Step Time": 8.551185730844736} +{"Pretrain/Learning Rate": 4.7932487871788746e-05, "Pretrain/Loss": 2.150839328765869, "Pretrain/Loss (Raw)": 2.092273712158203, "Pretrain/Step": 1492, "Pretrain/Step Time": 8.539990156888962} +{"Pretrain/Learning Rate": 4.792910589951426e-05, "Pretrain/Loss": 2.1534876823425293, "Pretrain/Loss (Raw)": 2.1402297019958496, "Pretrain/Step": 1493, "Pretrain/Step Time": 8.54222683608532} +{"Pretrain/Learning Rate": 4.792572128294722e-05, "Pretrain/Loss": 2.1536333560943604, "Pretrain/Loss (Raw)": 2.1156327724456787, "Pretrain/Step": 1494, "Pretrain/Step Time": 8.541237242519855} +{"Pretrain/Learning Rate": 4.792233402247799e-05, "Pretrain/Loss": 2.15297794342041, "Pretrain/Loss (Raw)": 2.1197803020477295, "Pretrain/Step": 1495, "Pretrain/Step Time": 8.541011590510607} +{"Pretrain/Learning Rate": 4.791894411849718e-05, "Pretrain/Loss": 2.1520049571990967, "Pretrain/Loss (Raw)": 2.1785624027252197, "Pretrain/Step": 1496, "Pretrain/Step Time": 8.540115723386407} +{"Pretrain/Learning Rate": 4.7915551571395726e-05, "Pretrain/Loss": 2.1514265537261963, "Pretrain/Loss (Raw)": 2.1784157752990723, "Pretrain/Step": 1497, "Pretrain/Step Time": 8.536718862131238} +{"Pretrain/Learning Rate": 4.79121563815649e-05, "Pretrain/Loss": 2.150646209716797, "Pretrain/Loss (Raw)": 2.274501085281372, "Pretrain/Step": 1498, "Pretrain/Step Time": 8.539435248821974} +{"Pretrain/Learning Rate": 4.790875854939622e-05, "Pretrain/Loss": 2.1489145755767822, "Pretrain/Loss (Raw)": 2.1475918292999268, "Pretrain/Step": 1499, "Pretrain/Step Time": 8.541774407029152} +{"Pretrain/Learning Rate": 4.790535807528156e-05, "Pretrain/Loss": 2.1465935707092285, "Pretrain/Loss (Raw)": 1.9155020713806152, "Pretrain/Step": 1500, "Pretrain/Step Time": 8.541105976328254} +{"Pretrain/Learning Rate": 4.7901954959613076e-05, "Pretrain/Loss": 2.1478075981140137, "Pretrain/Loss (Raw)": 2.0870003700256348, "Pretrain/Step": 1501, "Pretrain/Step Time": 8.539310086518526} +{"Pretrain/Learning Rate": 4.789854920278323e-05, "Pretrain/Loss": 2.1470370292663574, "Pretrain/Loss (Raw)": 2.0167393684387207, "Pretrain/Step": 1502, "Pretrain/Step Time": 8.540433298796415} +{"Pretrain/Learning Rate": 4.789514080518478e-05, "Pretrain/Loss": 2.144641876220703, "Pretrain/Loss (Raw)": 2.1124985218048096, "Pretrain/Step": 1503, "Pretrain/Step Time": 8.538066128268838} +{"Pretrain/Learning Rate": 4.789172976721081e-05, "Pretrain/Loss": 2.1435017585754395, "Pretrain/Loss (Raw)": 2.113060712814331, "Pretrain/Step": 1504, "Pretrain/Step Time": 8.532406222075224} +{"Pretrain/Learning Rate": 4.7888316089254705e-05, "Pretrain/Loss": 2.1467390060424805, "Pretrain/Loss (Raw)": 2.3101308345794678, "Pretrain/Step": 1505, "Pretrain/Step Time": 8.53813050314784} +{"Pretrain/Learning Rate": 4.7884899771710126e-05, "Pretrain/Loss": 2.1453335285186768, "Pretrain/Loss (Raw)": 2.2860376834869385, "Pretrain/Step": 1506, "Pretrain/Step Time": 8.533980682492256} +{"Pretrain/Learning Rate": 4.788148081497106e-05, "Pretrain/Loss": 2.1417927742004395, "Pretrain/Loss (Raw)": 2.0096917152404785, "Pretrain/Step": 1507, "Pretrain/Step Time": 8.537149015814066} +{"Pretrain/Learning Rate": 4.787805921943181e-05, "Pretrain/Loss": 2.1411867141723633, "Pretrain/Loss (Raw)": 2.1346373558044434, "Pretrain/Step": 1508, "Pretrain/Step Time": 8.533843388780951} +{"Pretrain/Learning Rate": 4.787463498548698e-05, "Pretrain/Loss": 2.141116142272949, "Pretrain/Loss (Raw)": 2.1044201850891113, "Pretrain/Step": 1509, "Pretrain/Step Time": 8.54580381885171} +{"Pretrain/Learning Rate": 4.787120811353144e-05, "Pretrain/Loss": 2.140648365020752, "Pretrain/Loss (Raw)": 2.18304443359375, "Pretrain/Step": 1510, "Pretrain/Step Time": 8.53958060592413} +{"Pretrain/Learning Rate": 4.786777860396041e-05, "Pretrain/Loss": 2.141118049621582, "Pretrain/Loss (Raw)": 2.1118407249450684, "Pretrain/Step": 1511, "Pretrain/Step Time": 8.541268108412623} +{"Pretrain/Learning Rate": 4.78643464571694e-05, "Pretrain/Loss": 2.141200065612793, "Pretrain/Loss (Raw)": 2.1010947227478027, "Pretrain/Step": 1512, "Pretrain/Step Time": 8.533755896613002} +{"Pretrain/Learning Rate": 4.786091167355421e-05, "Pretrain/Loss": 2.1410768032073975, "Pretrain/Loss (Raw)": 2.2099227905273438, "Pretrain/Step": 1513, "Pretrain/Step Time": 8.536346714943647} +{"Pretrain/Learning Rate": 4.785747425351097e-05, "Pretrain/Loss": 2.141841411590576, "Pretrain/Loss (Raw)": 2.0704705715179443, "Pretrain/Step": 1514, "Pretrain/Step Time": 8.531774628907442} +{"Pretrain/Learning Rate": 4.785403419743608e-05, "Pretrain/Loss": 2.1417829990386963, "Pretrain/Loss (Raw)": 2.112915277481079, "Pretrain/Step": 1515, "Pretrain/Step Time": 8.537816436961293} +{"Pretrain/Learning Rate": 4.785059150572628e-05, "Pretrain/Loss": 2.1421778202056885, "Pretrain/Loss (Raw)": 2.1642236709594727, "Pretrain/Step": 1516, "Pretrain/Step Time": 8.531389432027936} +{"Pretrain/Learning Rate": 4.784714617877859e-05, "Pretrain/Loss": 2.1425464153289795, "Pretrain/Loss (Raw)": 2.25791335105896, "Pretrain/Step": 1517, "Pretrain/Step Time": 8.533700171858072} +{"Pretrain/Learning Rate": 4.784369821699035e-05, "Pretrain/Loss": 2.1441540718078613, "Pretrain/Loss (Raw)": 2.250002861022949, "Pretrain/Step": 1518, "Pretrain/Step Time": 8.533398501574993} +{"Pretrain/Learning Rate": 4.784024762075918e-05, "Pretrain/Loss": 2.1440529823303223, "Pretrain/Loss (Raw)": 2.184955596923828, "Pretrain/Step": 1519, "Pretrain/Step Time": 8.536162577569485} +{"Pretrain/Learning Rate": 4.7836794390483035e-05, "Pretrain/Loss": 2.143580436706543, "Pretrain/Loss (Raw)": 2.005869150161743, "Pretrain/Step": 1520, "Pretrain/Step Time": 8.5338567905128} +{"Pretrain/Learning Rate": 4.7833338526560145e-05, "Pretrain/Loss": 2.1467983722686768, "Pretrain/Loss (Raw)": 2.3138468265533447, "Pretrain/Step": 1521, "Pretrain/Step Time": 8.537178698927164} +{"Pretrain/Learning Rate": 4.782988002938907e-05, "Pretrain/Loss": 2.1442787647247314, "Pretrain/Loss (Raw)": 2.0878522396087646, "Pretrain/Step": 1522, "Pretrain/Step Time": 8.530736170709133} +{"Pretrain/Learning Rate": 4.782641889936864e-05, "Pretrain/Loss": 2.1442437171936035, "Pretrain/Loss (Raw)": 2.072152614593506, "Pretrain/Step": 1523, "Pretrain/Step Time": 8.535191217437387} +{"Pretrain/Learning Rate": 4.782295513689803e-05, "Pretrain/Loss": 2.145019769668579, "Pretrain/Loss (Raw)": 2.0671274662017822, "Pretrain/Step": 1524, "Pretrain/Step Time": 8.534636482596397} +{"Pretrain/Learning Rate": 4.7819488742376686e-05, "Pretrain/Loss": 2.1480958461761475, "Pretrain/Loss (Raw)": 2.34614896774292, "Pretrain/Step": 1525, "Pretrain/Step Time": 8.53636834397912} +{"Pretrain/Learning Rate": 4.7816019716204375e-05, "Pretrain/Loss": 2.149142265319824, "Pretrain/Loss (Raw)": 2.5412251949310303, "Pretrain/Step": 1526, "Pretrain/Step Time": 8.534321248531342} +{"Pretrain/Learning Rate": 4.781254805878115e-05, "Pretrain/Loss": 2.1524643898010254, "Pretrain/Loss (Raw)": 2.240948438644409, "Pretrain/Step": 1527, "Pretrain/Step Time": 8.535678090527654} +{"Pretrain/Learning Rate": 4.780907377050739e-05, "Pretrain/Loss": 2.1509270668029785, "Pretrain/Loss (Raw)": 2.077418804168701, "Pretrain/Step": 1528, "Pretrain/Step Time": 8.529632225632668} +{"Pretrain/Learning Rate": 4.780559685178376e-05, "Pretrain/Loss": 2.1519362926483154, "Pretrain/Loss (Raw)": 2.1909549236297607, "Pretrain/Step": 1529, "Pretrain/Step Time": 8.534803805872798} +{"Pretrain/Learning Rate": 4.780211730301124e-05, "Pretrain/Loss": 2.1523332595825195, "Pretrain/Loss (Raw)": 2.0695981979370117, "Pretrain/Step": 1530, "Pretrain/Step Time": 8.532609233632684} +{"Pretrain/Learning Rate": 4.779863512459111e-05, "Pretrain/Loss": 2.1511218547821045, "Pretrain/Loss (Raw)": 2.0763494968414307, "Pretrain/Step": 1531, "Pretrain/Step Time": 8.537990670651197} +{"Pretrain/Learning Rate": 4.779515031692494e-05, "Pretrain/Loss": 2.1521997451782227, "Pretrain/Loss (Raw)": 2.4374964237213135, "Pretrain/Step": 1532, "Pretrain/Step Time": 8.5348093919456} +{"Pretrain/Learning Rate": 4.7791662880414625e-05, "Pretrain/Loss": 2.1541216373443604, "Pretrain/Loss (Raw)": 2.4071176052093506, "Pretrain/Step": 1533, "Pretrain/Step Time": 8.53435118123889} +{"Pretrain/Learning Rate": 4.778817281546235e-05, "Pretrain/Loss": 2.153759002685547, "Pretrain/Loss (Raw)": 2.0878193378448486, "Pretrain/Step": 1534, "Pretrain/Step Time": 8.535868406295776} +{"Pretrain/Learning Rate": 4.7784680122470605e-05, "Pretrain/Loss": 2.156189441680908, "Pretrain/Loss (Raw)": 2.361138343811035, "Pretrain/Step": 1535, "Pretrain/Step Time": 8.542600318789482} +{"Pretrain/Learning Rate": 4.778118480184218e-05, "Pretrain/Loss": 2.1569671630859375, "Pretrain/Loss (Raw)": 2.12139892578125, "Pretrain/Step": 1536, "Pretrain/Step Time": 8.544363183900714} +{"Pretrain/Learning Rate": 4.777768685398017e-05, "Pretrain/Loss": 2.156552791595459, "Pretrain/Loss (Raw)": 1.9505099058151245, "Pretrain/Step": 1537, "Pretrain/Step Time": 8.54284531250596} +{"Pretrain/Learning Rate": 4.777418627928799e-05, "Pretrain/Loss": 2.15712571144104, "Pretrain/Loss (Raw)": 2.1976449489593506, "Pretrain/Step": 1538, "Pretrain/Step Time": 8.539968406781554} +{"Pretrain/Learning Rate": 4.777068307816932e-05, "Pretrain/Loss": 2.1565651893615723, "Pretrain/Loss (Raw)": 2.0721938610076904, "Pretrain/Step": 1539, "Pretrain/Step Time": 8.539773495867848} +{"Pretrain/Learning Rate": 4.776717725102819e-05, "Pretrain/Loss": 2.1568379402160645, "Pretrain/Loss (Raw)": 2.199385166168213, "Pretrain/Step": 1540, "Pretrain/Step Time": 8.539886364713311} +{"Pretrain/Learning Rate": 4.77636687982689e-05, "Pretrain/Loss": 2.156688928604126, "Pretrain/Loss (Raw)": 2.171438217163086, "Pretrain/Step": 1541, "Pretrain/Step Time": 8.53642937168479} +{"Pretrain/Learning Rate": 4.776015772029605e-05, "Pretrain/Loss": 2.155390739440918, "Pretrain/Loss (Raw)": 2.049582004547119, "Pretrain/Step": 1542, "Pretrain/Step Time": 8.544100711122155} +{"Pretrain/Learning Rate": 4.7756644017514564e-05, "Pretrain/Loss": 2.1509482860565186, "Pretrain/Loss (Raw)": 2.0238192081451416, "Pretrain/Step": 1543, "Pretrain/Step Time": 8.546223865821958} +{"Pretrain/Learning Rate": 4.775312769032966e-05, "Pretrain/Loss": 2.1520442962646484, "Pretrain/Loss (Raw)": 2.125272035598755, "Pretrain/Step": 1544, "Pretrain/Step Time": 8.548224372789264} +{"Pretrain/Learning Rate": 4.774960873914685e-05, "Pretrain/Loss": 2.1532490253448486, "Pretrain/Loss (Raw)": 2.2773988246917725, "Pretrain/Step": 1545, "Pretrain/Step Time": 8.549016887322068} +{"Pretrain/Learning Rate": 4.774608716437196e-05, "Pretrain/Loss": 2.1495065689086914, "Pretrain/Loss (Raw)": 2.2719178199768066, "Pretrain/Step": 1546, "Pretrain/Step Time": 8.543081298470497} +{"Pretrain/Learning Rate": 4.7742562966411117e-05, "Pretrain/Loss": 2.151094675064087, "Pretrain/Loss (Raw)": 2.153200387954712, "Pretrain/Step": 1547, "Pretrain/Step Time": 8.54291220754385} +{"Pretrain/Learning Rate": 4.7739036145670744e-05, "Pretrain/Loss": 2.148869514465332, "Pretrain/Loss (Raw)": 2.0799169540405273, "Pretrain/Step": 1548, "Pretrain/Step Time": 8.54672572761774} +{"Pretrain/Learning Rate": 4.773550670255758e-05, "Pretrain/Loss": 2.148789644241333, "Pretrain/Loss (Raw)": 2.1345314979553223, "Pretrain/Step": 1549, "Pretrain/Step Time": 8.54379571042955} +{"Pretrain/Learning Rate": 4.773197463747865e-05, "Pretrain/Loss": 2.147864818572998, "Pretrain/Loss (Raw)": 2.0426881313323975, "Pretrain/Step": 1550, "Pretrain/Step Time": 8.54891406558454} +{"Pretrain/Learning Rate": 4.772843995084128e-05, "Pretrain/Loss": 2.149705648422241, "Pretrain/Loss (Raw)": 2.2825822830200195, "Pretrain/Step": 1551, "Pretrain/Step Time": 8.545664040371776} +{"Pretrain/Learning Rate": 4.7724902643053116e-05, "Pretrain/Loss": 2.1493916511535645, "Pretrain/Loss (Raw)": 2.240713119506836, "Pretrain/Step": 1552, "Pretrain/Step Time": 8.54518892429769} +{"Pretrain/Learning Rate": 4.77213627145221e-05, "Pretrain/Loss": 2.148944854736328, "Pretrain/Loss (Raw)": 2.1417922973632812, "Pretrain/Step": 1553, "Pretrain/Step Time": 8.53870308957994} +{"Pretrain/Learning Rate": 4.771782016565647e-05, "Pretrain/Loss": 2.1522717475891113, "Pretrain/Loss (Raw)": 2.5162768363952637, "Pretrain/Step": 1554, "Pretrain/Step Time": 8.541302049532533} +{"Pretrain/Learning Rate": 4.771427499686477e-05, "Pretrain/Loss": 2.153623580932617, "Pretrain/Loss (Raw)": 2.5201187133789062, "Pretrain/Step": 1555, "Pretrain/Step Time": 8.540582414716482} +{"Pretrain/Learning Rate": 4.771072720855584e-05, "Pretrain/Loss": 2.151214599609375, "Pretrain/Loss (Raw)": 2.2106473445892334, "Pretrain/Step": 1556, "Pretrain/Step Time": 8.545896841213107} +{"Pretrain/Learning Rate": 4.770717680113883e-05, "Pretrain/Loss": 2.148749589920044, "Pretrain/Loss (Raw)": 2.0308613777160645, "Pretrain/Step": 1557, "Pretrain/Step Time": 8.544076396152377} +{"Pretrain/Learning Rate": 4.770362377502319e-05, "Pretrain/Loss": 2.14772891998291, "Pretrain/Loss (Raw)": 2.1454050540924072, "Pretrain/Step": 1558, "Pretrain/Step Time": 8.538423424586654} +{"Pretrain/Learning Rate": 4.770006813061868e-05, "Pretrain/Loss": 2.1500725746154785, "Pretrain/Loss (Raw)": 2.1924731731414795, "Pretrain/Step": 1559, "Pretrain/Step Time": 8.545895595103502} +{"Pretrain/Learning Rate": 4.769650986833535e-05, "Pretrain/Loss": 2.1519579887390137, "Pretrain/Loss (Raw)": 2.2937426567077637, "Pretrain/Step": 1560, "Pretrain/Step Time": 8.54468435794115} +{"Pretrain/Learning Rate": 4.769294898858354e-05, "Pretrain/Loss": 2.149685859680176, "Pretrain/Loss (Raw)": 1.8050512075424194, "Pretrain/Step": 1561, "Pretrain/Step Time": 8.54182692244649} +{"Pretrain/Learning Rate": 4.768938549177393e-05, "Pretrain/Loss": 2.1497788429260254, "Pretrain/Loss (Raw)": 2.182992935180664, "Pretrain/Step": 1562, "Pretrain/Step Time": 8.53959052450955} +{"Pretrain/Learning Rate": 4.768581937831746e-05, "Pretrain/Loss": 2.153179168701172, "Pretrain/Loss (Raw)": 2.3807852268218994, "Pretrain/Step": 1563, "Pretrain/Step Time": 8.54187886044383} +{"Pretrain/Learning Rate": 4.768225064862541e-05, "Pretrain/Loss": 2.154322624206543, "Pretrain/Loss (Raw)": 2.2405598163604736, "Pretrain/Step": 1564, "Pretrain/Step Time": 8.540232120081782} +{"Pretrain/Learning Rate": 4.767867930310933e-05, "Pretrain/Loss": 2.1572413444519043, "Pretrain/Loss (Raw)": 2.4101483821868896, "Pretrain/Step": 1565, "Pretrain/Step Time": 8.543796664103866} +{"Pretrain/Learning Rate": 4.7675105342181084e-05, "Pretrain/Loss": 2.158804416656494, "Pretrain/Loss (Raw)": 2.2946279048919678, "Pretrain/Step": 1566, "Pretrain/Step Time": 8.540622409433126} +{"Pretrain/Learning Rate": 4.767152876625285e-05, "Pretrain/Loss": 2.159708023071289, "Pretrain/Loss (Raw)": 2.185480833053589, "Pretrain/Step": 1567, "Pretrain/Step Time": 8.536075135692954} +{"Pretrain/Learning Rate": 4.766794957573708e-05, "Pretrain/Loss": 2.1637377738952637, "Pretrain/Loss (Raw)": 2.3338825702667236, "Pretrain/Step": 1568, "Pretrain/Step Time": 8.539270492270589} +{"Pretrain/Learning Rate": 4.766436777104655e-05, "Pretrain/Loss": 2.163703203201294, "Pretrain/Loss (Raw)": 2.2897112369537354, "Pretrain/Step": 1569, "Pretrain/Step Time": 8.536892302334309} +{"Pretrain/Learning Rate": 4.766078335259433e-05, "Pretrain/Loss": 2.1610796451568604, "Pretrain/Loss (Raw)": 2.1768839359283447, "Pretrain/Step": 1570, "Pretrain/Step Time": 8.543599044904113} +{"Pretrain/Learning Rate": 4.76571963207938e-05, "Pretrain/Loss": 2.157871723175049, "Pretrain/Loss (Raw)": 2.0648539066314697, "Pretrain/Step": 1571, "Pretrain/Step Time": 8.543434172868729} +{"Pretrain/Learning Rate": 4.765360667605861e-05, "Pretrain/Loss": 2.1573879718780518, "Pretrain/Loss (Raw)": 2.2455976009368896, "Pretrain/Step": 1572, "Pretrain/Step Time": 8.54187842272222} +{"Pretrain/Learning Rate": 4.765001441880276e-05, "Pretrain/Loss": 2.1568822860717773, "Pretrain/Loss (Raw)": 2.040017604827881, "Pretrain/Step": 1573, "Pretrain/Step Time": 8.538991205394268} +{"Pretrain/Learning Rate": 4.764641954944052e-05, "Pretrain/Loss": 2.1561264991760254, "Pretrain/Loss (Raw)": 1.9683486223220825, "Pretrain/Step": 1574, "Pretrain/Step Time": 8.538359204307199} +{"Pretrain/Learning Rate": 4.764282206838646e-05, "Pretrain/Loss": 2.155150890350342, "Pretrain/Loss (Raw)": 2.1304612159729004, "Pretrain/Step": 1575, "Pretrain/Step Time": 8.535387072712183} +{"Pretrain/Learning Rate": 4.763922197605547e-05, "Pretrain/Loss": 2.155653238296509, "Pretrain/Loss (Raw)": 2.085577964782715, "Pretrain/Step": 1576, "Pretrain/Step Time": 8.545154511928558} +{"Pretrain/Learning Rate": 4.763561927286271e-05, "Pretrain/Loss": 2.1546630859375, "Pretrain/Loss (Raw)": 2.0156311988830566, "Pretrain/Step": 1577, "Pretrain/Step Time": 8.546584084630013} +{"Pretrain/Learning Rate": 4.7632013959223684e-05, "Pretrain/Loss": 2.154588460922241, "Pretrain/Loss (Raw)": 2.000403642654419, "Pretrain/Step": 1578, "Pretrain/Step Time": 8.537360882386565} +{"Pretrain/Learning Rate": 4.7628406035554156e-05, "Pretrain/Loss": 2.15316104888916, "Pretrain/Loss (Raw)": 2.1104485988616943, "Pretrain/Step": 1579, "Pretrain/Step Time": 8.534950787201524} +{"Pretrain/Learning Rate": 4.762479550227022e-05, "Pretrain/Loss": 2.154179573059082, "Pretrain/Loss (Raw)": 2.131441831588745, "Pretrain/Step": 1580, "Pretrain/Step Time": 8.5357149168849} +{"Pretrain/Learning Rate": 4.762118235978825e-05, "Pretrain/Loss": 2.1542372703552246, "Pretrain/Loss (Raw)": 2.0856616497039795, "Pretrain/Step": 1581, "Pretrain/Step Time": 8.532878667116165} +{"Pretrain/Learning Rate": 4.7617566608524946e-05, "Pretrain/Loss": 2.156128406524658, "Pretrain/Loss (Raw)": 2.256824493408203, "Pretrain/Step": 1582, "Pretrain/Step Time": 8.539797700941563} +{"Pretrain/Learning Rate": 4.761394824889727e-05, "Pretrain/Loss": 2.154402256011963, "Pretrain/Loss (Raw)": 2.042600393295288, "Pretrain/Step": 1583, "Pretrain/Step Time": 8.536820182576776} +{"Pretrain/Learning Rate": 4.761032728132253e-05, "Pretrain/Loss": 2.1560440063476562, "Pretrain/Loss (Raw)": 2.1926629543304443, "Pretrain/Step": 1584, "Pretrain/Step Time": 8.53418730944395} +{"Pretrain/Learning Rate": 4.76067037062183e-05, "Pretrain/Loss": 2.156912326812744, "Pretrain/Loss (Raw)": 2.1842896938323975, "Pretrain/Step": 1585, "Pretrain/Step Time": 8.533896211534739} +{"Pretrain/Learning Rate": 4.7603077524002474e-05, "Pretrain/Loss": 2.1562955379486084, "Pretrain/Loss (Raw)": 1.9339345693588257, "Pretrain/Step": 1586, "Pretrain/Step Time": 8.529061745852232} +{"Pretrain/Learning Rate": 4.759944873509324e-05, "Pretrain/Loss": 2.156886100769043, "Pretrain/Loss (Raw)": 2.2025015354156494, "Pretrain/Step": 1587, "Pretrain/Step Time": 8.526217574253678} +{"Pretrain/Learning Rate": 4.7595817339909086e-05, "Pretrain/Loss": 2.1568074226379395, "Pretrain/Loss (Raw)": 2.1155052185058594, "Pretrain/Step": 1588, "Pretrain/Step Time": 8.536437191069126} +{"Pretrain/Learning Rate": 4.75921833388688e-05, "Pretrain/Loss": 2.1565122604370117, "Pretrain/Loss (Raw)": 2.110987901687622, "Pretrain/Step": 1589, "Pretrain/Step Time": 8.534905396401882} +{"Pretrain/Learning Rate": 4.758854673239147e-05, "Pretrain/Loss": 2.159569263458252, "Pretrain/Loss (Raw)": 2.3317267894744873, "Pretrain/Step": 1590, "Pretrain/Step Time": 8.53120368346572} +{"Pretrain/Learning Rate": 4.7584907520896495e-05, "Pretrain/Loss": 2.1572041511535645, "Pretrain/Loss (Raw)": 1.9156222343444824, "Pretrain/Step": 1591, "Pretrain/Step Time": 8.529938366264105} +{"Pretrain/Learning Rate": 4.7581265704803554e-05, "Pretrain/Loss": 2.1566829681396484, "Pretrain/Loss (Raw)": 2.0088696479797363, "Pretrain/Step": 1592, "Pretrain/Step Time": 8.529469851404428} +{"Pretrain/Learning Rate": 4.757762128453266e-05, "Pretrain/Loss": 2.157121419906616, "Pretrain/Loss (Raw)": 2.2127559185028076, "Pretrain/Step": 1593, "Pretrain/Step Time": 8.534483823925257} +{"Pretrain/Learning Rate": 4.757397426050408e-05, "Pretrain/Loss": 2.155752420425415, "Pretrain/Loss (Raw)": 1.9402104616165161, "Pretrain/Step": 1594, "Pretrain/Step Time": 8.539996156468987} +{"Pretrain/Learning Rate": 4.757032463313842e-05, "Pretrain/Loss": 2.157041072845459, "Pretrain/Loss (Raw)": 2.2679238319396973, "Pretrain/Step": 1595, "Pretrain/Step Time": 8.532563956454396} +{"Pretrain/Learning Rate": 4.756667240285656e-05, "Pretrain/Loss": 2.1569015979766846, "Pretrain/Loss (Raw)": 2.184894323348999, "Pretrain/Step": 1596, "Pretrain/Step Time": 8.534360649064183} +{"Pretrain/Learning Rate": 4.756301757007971e-05, "Pretrain/Loss": 2.159013509750366, "Pretrain/Loss (Raw)": 2.491302967071533, "Pretrain/Step": 1597, "Pretrain/Step Time": 8.534534677863121} +{"Pretrain/Learning Rate": 4.755936013522935e-05, "Pretrain/Loss": 2.1604561805725098, "Pretrain/Loss (Raw)": 2.245696783065796, "Pretrain/Step": 1598, "Pretrain/Step Time": 8.532428432255983} +{"Pretrain/Learning Rate": 4.7555700098727276e-05, "Pretrain/Loss": 2.1598410606384277, "Pretrain/Loss (Raw)": 2.146218776702881, "Pretrain/Step": 1599, "Pretrain/Step Time": 8.529357058927417} +{"Pretrain/Learning Rate": 4.755203746099558e-05, "Pretrain/Loss": 2.1591968536376953, "Pretrain/Loss (Raw)": 2.192253351211548, "Pretrain/Step": 1600, "Pretrain/Step Time": 8.525886891409755} +{"Pretrain/Learning Rate": 4.754837222245666e-05, "Pretrain/Loss": 2.159583568572998, "Pretrain/Loss (Raw)": 2.1172776222229004, "Pretrain/Step": 1601, "Pretrain/Step Time": 8.525117428973317} +{"Pretrain/Learning Rate": 4.75447043835332e-05, "Pretrain/Loss": 2.1603236198425293, "Pretrain/Loss (Raw)": 2.118112325668335, "Pretrain/Step": 1602, "Pretrain/Step Time": 8.524243647232652} +{"Pretrain/Learning Rate": 4.75410339446482e-05, "Pretrain/Loss": 2.162759304046631, "Pretrain/Loss (Raw)": 2.2559516429901123, "Pretrain/Step": 1603, "Pretrain/Step Time": 8.52404392696917} +{"Pretrain/Learning Rate": 4.753736090622494e-05, "Pretrain/Loss": 2.16312575340271, "Pretrain/Loss (Raw)": 2.1252477169036865, "Pretrain/Step": 1604, "Pretrain/Step Time": 8.525359569117427} +{"Pretrain/Learning Rate": 4.753368526868703e-05, "Pretrain/Loss": 2.164273262023926, "Pretrain/Loss (Raw)": 2.2606849670410156, "Pretrain/Step": 1605, "Pretrain/Step Time": 8.53246733173728} +{"Pretrain/Learning Rate": 4.753000703245834e-05, "Pretrain/Loss": 2.163844347000122, "Pretrain/Loss (Raw)": 2.122361183166504, "Pretrain/Step": 1606, "Pretrain/Step Time": 8.524477591738105} +{"Pretrain/Learning Rate": 4.752632619796309e-05, "Pretrain/Loss": 2.163283348083496, "Pretrain/Loss (Raw)": 2.2255356311798096, "Pretrain/Step": 1607, "Pretrain/Step Time": 8.520769679918885} +{"Pretrain/Learning Rate": 4.752264276562575e-05, "Pretrain/Loss": 2.164304256439209, "Pretrain/Loss (Raw)": 2.226736307144165, "Pretrain/Step": 1608, "Pretrain/Step Time": 8.522625310346484} +{"Pretrain/Learning Rate": 4.751895673587111e-05, "Pretrain/Loss": 2.1640336513519287, "Pretrain/Loss (Raw)": 2.0785560607910156, "Pretrain/Step": 1609, "Pretrain/Step Time": 8.524319019168615} +{"Pretrain/Learning Rate": 4.751526810912427e-05, "Pretrain/Loss": 2.1619653701782227, "Pretrain/Loss (Raw)": 1.9124573469161987, "Pretrain/Step": 1610, "Pretrain/Step Time": 8.524753546342254} +{"Pretrain/Learning Rate": 4.751157688581062e-05, "Pretrain/Loss": 2.1617331504821777, "Pretrain/Loss (Raw)": 2.1059622764587402, "Pretrain/Step": 1611, "Pretrain/Step Time": 8.522319965064526} +{"Pretrain/Learning Rate": 4.750788306635584e-05, "Pretrain/Loss": 2.1620993614196777, "Pretrain/Loss (Raw)": 2.150301694869995, "Pretrain/Step": 1612, "Pretrain/Step Time": 8.526354897767305} +{"Pretrain/Learning Rate": 4.7504186651185926e-05, "Pretrain/Loss": 2.161367893218994, "Pretrain/Loss (Raw)": 2.101936101913452, "Pretrain/Step": 1613, "Pretrain/Step Time": 8.523288041353226} +{"Pretrain/Learning Rate": 4.7500487640727165e-05, "Pretrain/Loss": 2.16206693649292, "Pretrain/Loss (Raw)": 2.3597116470336914, "Pretrain/Step": 1614, "Pretrain/Step Time": 8.518002154305577} +{"Pretrain/Learning Rate": 4.7496786035406144e-05, "Pretrain/Loss": 2.162271499633789, "Pretrain/Loss (Raw)": 2.064692258834839, "Pretrain/Step": 1615, "Pretrain/Step Time": 8.520830992609262} +{"Pretrain/Learning Rate": 4.749308183564974e-05, "Pretrain/Loss": 2.1617205142974854, "Pretrain/Loss (Raw)": 2.053712844848633, "Pretrain/Step": 1616, "Pretrain/Step Time": 8.520273610949516} +{"Pretrain/Learning Rate": 4.748937504188517e-05, "Pretrain/Loss": 2.1620519161224365, "Pretrain/Loss (Raw)": 2.1996214389801025, "Pretrain/Step": 1617, "Pretrain/Step Time": 8.523576654493809} +{"Pretrain/Learning Rate": 4.748566565453988e-05, "Pretrain/Loss": 2.163302421569824, "Pretrain/Loss (Raw)": 2.182864189147949, "Pretrain/Step": 1618, "Pretrain/Step Time": 8.529885621741414} +{"Pretrain/Learning Rate": 4.748195367404167e-05, "Pretrain/Loss": 2.1624791622161865, "Pretrain/Loss (Raw)": 2.1685950756073, "Pretrain/Step": 1619, "Pretrain/Step Time": 8.52521045319736} +{"Pretrain/Learning Rate": 4.747823910081863e-05, "Pretrain/Loss": 2.162487745285034, "Pretrain/Loss (Raw)": 2.0933682918548584, "Pretrain/Step": 1620, "Pretrain/Step Time": 8.531765392050147} +{"Pretrain/Learning Rate": 4.747452193529913e-05, "Pretrain/Loss": 2.1621017456054688, "Pretrain/Loss (Raw)": 2.090822458267212, "Pretrain/Step": 1621, "Pretrain/Step Time": 8.527321288362145} +{"Pretrain/Learning Rate": 4.747080217791187e-05, "Pretrain/Loss": 2.163766384124756, "Pretrain/Loss (Raw)": 2.3287265300750732, "Pretrain/Step": 1622, "Pretrain/Step Time": 8.532780976966023} +{"Pretrain/Learning Rate": 4.7467079829085804e-05, "Pretrain/Loss": 2.164963722229004, "Pretrain/Loss (Raw)": 2.2730236053466797, "Pretrain/Step": 1623, "Pretrain/Step Time": 8.526064570993185} +{"Pretrain/Learning Rate": 4.746335488925022e-05, "Pretrain/Loss": 2.1655726432800293, "Pretrain/Loss (Raw)": 2.2564916610717773, "Pretrain/Step": 1624, "Pretrain/Step Time": 8.536822579801083} +{"Pretrain/Learning Rate": 4.7459627358834716e-05, "Pretrain/Loss": 2.1658637523651123, "Pretrain/Loss (Raw)": 2.2156918048858643, "Pretrain/Step": 1625, "Pretrain/Step Time": 8.546947829425335} +{"Pretrain/Learning Rate": 4.7455897238269134e-05, "Pretrain/Loss": 2.1647582054138184, "Pretrain/Loss (Raw)": 2.1330084800720215, "Pretrain/Step": 1626, "Pretrain/Step Time": 8.544235499575734} +{"Pretrain/Learning Rate": 4.745216452798368e-05, "Pretrain/Loss": 2.1637442111968994, "Pretrain/Loss (Raw)": 2.01777982711792, "Pretrain/Step": 1627, "Pretrain/Step Time": 8.541871970519423} +{"Pretrain/Learning Rate": 4.744842922840881e-05, "Pretrain/Loss": 2.1674933433532715, "Pretrain/Loss (Raw)": 2.395390748977661, "Pretrain/Step": 1628, "Pretrain/Step Time": 8.539590388536453} +{"Pretrain/Learning Rate": 4.74446913399753e-05, "Pretrain/Loss": 2.169337749481201, "Pretrain/Loss (Raw)": 2.323105812072754, "Pretrain/Step": 1629, "Pretrain/Step Time": 8.540300134569407} +{"Pretrain/Learning Rate": 4.744095086311422e-05, "Pretrain/Loss": 2.1709985733032227, "Pretrain/Loss (Raw)": 2.2293014526367188, "Pretrain/Step": 1630, "Pretrain/Step Time": 8.5488036070019} +{"Pretrain/Learning Rate": 4.743720779825694e-05, "Pretrain/Loss": 2.1712656021118164, "Pretrain/Loss (Raw)": 2.1466832160949707, "Pretrain/Step": 1631, "Pretrain/Step Time": 8.544681476429105} +{"Pretrain/Learning Rate": 4.743346214583514e-05, "Pretrain/Loss": 2.1728973388671875, "Pretrain/Loss (Raw)": 2.3219423294067383, "Pretrain/Step": 1632, "Pretrain/Step Time": 8.551940916106105} +{"Pretrain/Learning Rate": 4.742971390628076e-05, "Pretrain/Loss": 2.1716983318328857, "Pretrain/Loss (Raw)": 2.1566267013549805, "Pretrain/Step": 1633, "Pretrain/Step Time": 8.546216811984777} +{"Pretrain/Learning Rate": 4.742596308002609e-05, "Pretrain/Loss": 2.169700860977173, "Pretrain/Loss (Raw)": 2.030383825302124, "Pretrain/Step": 1634, "Pretrain/Step Time": 8.546976614743471} +{"Pretrain/Learning Rate": 4.742220966750368e-05, "Pretrain/Loss": 2.1714377403259277, "Pretrain/Loss (Raw)": 2.2319812774658203, "Pretrain/Step": 1635, "Pretrain/Step Time": 8.549909507855773} +{"Pretrain/Learning Rate": 4.7418453669146404e-05, "Pretrain/Loss": 2.171614646911621, "Pretrain/Loss (Raw)": 2.1572983264923096, "Pretrain/Step": 1636, "Pretrain/Step Time": 8.554015852510929} +{"Pretrain/Learning Rate": 4.74146950853874e-05, "Pretrain/Loss": 2.170536994934082, "Pretrain/Loss (Raw)": 1.9664820432662964, "Pretrain/Step": 1637, "Pretrain/Step Time": 8.549457354471087} +{"Pretrain/Learning Rate": 4.741093391666014e-05, "Pretrain/Loss": 2.1716907024383545, "Pretrain/Loss (Raw)": 2.330721378326416, "Pretrain/Step": 1638, "Pretrain/Step Time": 8.552694410085678} +{"Pretrain/Learning Rate": 4.7407170163398375e-05, "Pretrain/Loss": 2.1723852157592773, "Pretrain/Loss (Raw)": 2.200761318206787, "Pretrain/Step": 1639, "Pretrain/Step Time": 8.547488352283835} +{"Pretrain/Learning Rate": 4.740340382603616e-05, "Pretrain/Loss": 2.1713671684265137, "Pretrain/Loss (Raw)": 1.9707517623901367, "Pretrain/Step": 1640, "Pretrain/Step Time": 8.54930504783988} +{"Pretrain/Learning Rate": 4.739963490500785e-05, "Pretrain/Loss": 2.170823097229004, "Pretrain/Loss (Raw)": 2.1402716636657715, "Pretrain/Step": 1641, "Pretrain/Step Time": 8.54680704139173} +{"Pretrain/Learning Rate": 4.7395863400748096e-05, "Pretrain/Loss": 2.171327590942383, "Pretrain/Loss (Raw)": 2.135035753250122, "Pretrain/Step": 1642, "Pretrain/Step Time": 8.554091110825539} +{"Pretrain/Learning Rate": 4.7392089313691835e-05, "Pretrain/Loss": 2.172743320465088, "Pretrain/Loss (Raw)": 2.2941477298736572, "Pretrain/Step": 1643, "Pretrain/Step Time": 8.55292334407568} +{"Pretrain/Learning Rate": 4.738831264427432e-05, "Pretrain/Loss": 2.173036813735962, "Pretrain/Loss (Raw)": 2.201817512512207, "Pretrain/Step": 1644, "Pretrain/Step Time": 8.552377726882696} +{"Pretrain/Learning Rate": 4.73845333929311e-05, "Pretrain/Loss": 2.1720778942108154, "Pretrain/Loss (Raw)": 2.1351592540740967, "Pretrain/Step": 1645, "Pretrain/Step Time": 8.551701601594687} +{"Pretrain/Learning Rate": 4.738075156009801e-05, "Pretrain/Loss": 2.171276092529297, "Pretrain/Loss (Raw)": 2.1473846435546875, "Pretrain/Step": 1646, "Pretrain/Step Time": 8.55580922588706} +{"Pretrain/Learning Rate": 4.737696714621118e-05, "Pretrain/Loss": 2.172048807144165, "Pretrain/Loss (Raw)": 2.283829689025879, "Pretrain/Step": 1647, "Pretrain/Step Time": 8.553105615079403} +{"Pretrain/Learning Rate": 4.7373180151707065e-05, "Pretrain/Loss": 2.1727919578552246, "Pretrain/Loss (Raw)": 2.10102915763855, "Pretrain/Step": 1648, "Pretrain/Step Time": 8.562858063727617} +{"Pretrain/Learning Rate": 4.7369390577022385e-05, "Pretrain/Loss": 2.1701407432556152, "Pretrain/Loss (Raw)": 1.9744504690170288, "Pretrain/Step": 1649, "Pretrain/Step Time": 8.55986730568111} +{"Pretrain/Learning Rate": 4.736559842259417e-05, "Pretrain/Loss": 2.170621395111084, "Pretrain/Loss (Raw)": 2.1493773460388184, "Pretrain/Step": 1650, "Pretrain/Step Time": 8.555387202650309} +{"Pretrain/Learning Rate": 4.736180368885976e-05, "Pretrain/Loss": 2.1714541912078857, "Pretrain/Loss (Raw)": 2.178764820098877, "Pretrain/Step": 1651, "Pretrain/Step Time": 8.554494109004736} +{"Pretrain/Learning Rate": 4.735800637625678e-05, "Pretrain/Loss": 2.1730306148529053, "Pretrain/Loss (Raw)": 2.2689151763916016, "Pretrain/Step": 1652, "Pretrain/Step Time": 8.555060014128685} +{"Pretrain/Learning Rate": 4.735420648522314e-05, "Pretrain/Loss": 2.1714744567871094, "Pretrain/Loss (Raw)": 2.146941900253296, "Pretrain/Step": 1653, "Pretrain/Step Time": 8.55808719061315} +{"Pretrain/Learning Rate": 4.7350404016197083e-05, "Pretrain/Loss": 2.168842315673828, "Pretrain/Loss (Raw)": 2.2043209075927734, "Pretrain/Step": 1654, "Pretrain/Step Time": 8.565308326855302} +{"Pretrain/Learning Rate": 4.734659896961711e-05, "Pretrain/Loss": 2.165821075439453, "Pretrain/Loss (Raw)": 1.854225754737854, "Pretrain/Step": 1655, "Pretrain/Step Time": 8.558398511260748} +{"Pretrain/Learning Rate": 4.734279134592204e-05, "Pretrain/Loss": 2.1655874252319336, "Pretrain/Loss (Raw)": 2.0475404262542725, "Pretrain/Step": 1656, "Pretrain/Step Time": 8.561904214322567} +{"Pretrain/Learning Rate": 4.7338981145550994e-05, "Pretrain/Loss": 2.1657567024230957, "Pretrain/Loss (Raw)": 2.212594985961914, "Pretrain/Step": 1657, "Pretrain/Step Time": 8.561646165326238} +{"Pretrain/Learning Rate": 4.7335168368943374e-05, "Pretrain/Loss": 2.166853189468384, "Pretrain/Loss (Raw)": 2.2099549770355225, "Pretrain/Step": 1658, "Pretrain/Step Time": 8.558507405221462} +{"Pretrain/Learning Rate": 4.733135301653889e-05, "Pretrain/Loss": 2.1660919189453125, "Pretrain/Loss (Raw)": 1.978907823562622, "Pretrain/Step": 1659, "Pretrain/Step Time": 8.558298235759139} +{"Pretrain/Learning Rate": 4.732753508877755e-05, "Pretrain/Loss": 2.16300368309021, "Pretrain/Loss (Raw)": 2.042206287384033, "Pretrain/Step": 1660, "Pretrain/Step Time": 8.564045967534184} +{"Pretrain/Learning Rate": 4.732371458609966e-05, "Pretrain/Loss": 2.1602141857147217, "Pretrain/Loss (Raw)": 2.0500524044036865, "Pretrain/Step": 1661, "Pretrain/Step Time": 8.569020060822368} +{"Pretrain/Learning Rate": 4.73198915089458e-05, "Pretrain/Loss": 2.161667585372925, "Pretrain/Loss (Raw)": 2.2738537788391113, "Pretrain/Step": 1662, "Pretrain/Step Time": 8.563642354682088} +{"Pretrain/Learning Rate": 4.731606585775689e-05, "Pretrain/Loss": 2.1606383323669434, "Pretrain/Loss (Raw)": 2.229393720626831, "Pretrain/Step": 1663, "Pretrain/Step Time": 8.562868988141418} +{"Pretrain/Learning Rate": 4.731223763297409e-05, "Pretrain/Loss": 2.1590816974639893, "Pretrain/Loss (Raw)": 1.9221670627593994, "Pretrain/Step": 1664, "Pretrain/Step Time": 8.556578539311886} +{"Pretrain/Learning Rate": 4.730840683503892e-05, "Pretrain/Loss": 2.15924334526062, "Pretrain/Loss (Raw)": 1.9711754322052002, "Pretrain/Step": 1665, "Pretrain/Step Time": 8.555556155741215} +{"Pretrain/Learning Rate": 4.730457346439315e-05, "Pretrain/Loss": 2.1597046852111816, "Pretrain/Loss (Raw)": 2.2567331790924072, "Pretrain/Step": 1666, "Pretrain/Step Time": 8.555720472708344} +{"Pretrain/Learning Rate": 4.7300737521478863e-05, "Pretrain/Loss": 2.160926580429077, "Pretrain/Loss (Raw)": 2.2285826206207275, "Pretrain/Step": 1667, "Pretrain/Step Time": 8.562272245064378} +{"Pretrain/Learning Rate": 4.729689900673845e-05, "Pretrain/Loss": 2.159144878387451, "Pretrain/Loss (Raw)": 1.971335530281067, "Pretrain/Step": 1668, "Pretrain/Step Time": 8.56281585805118} +{"Pretrain/Learning Rate": 4.729305792061457e-05, "Pretrain/Loss": 2.1580159664154053, "Pretrain/Loss (Raw)": 2.0269196033477783, "Pretrain/Step": 1669, "Pretrain/Step Time": 8.55784985423088} +{"Pretrain/Learning Rate": 4.72892142635502e-05, "Pretrain/Loss": 2.1589927673339844, "Pretrain/Loss (Raw)": 2.174600124359131, "Pretrain/Step": 1670, "Pretrain/Step Time": 8.5489945653826} +{"Pretrain/Learning Rate": 4.728536803598862e-05, "Pretrain/Loss": 2.1591057777404785, "Pretrain/Loss (Raw)": 2.0382742881774902, "Pretrain/Step": 1671, "Pretrain/Step Time": 8.548498118296266} +{"Pretrain/Learning Rate": 4.728151923837337e-05, "Pretrain/Loss": 2.160722017288208, "Pretrain/Loss (Raw)": 2.3321895599365234, "Pretrain/Step": 1672, "Pretrain/Step Time": 8.551418730989099} +{"Pretrain/Learning Rate": 4.727766787114835e-05, "Pretrain/Loss": 2.15952730178833, "Pretrain/Loss (Raw)": 2.124443769454956, "Pretrain/Step": 1673, "Pretrain/Step Time": 8.5509689822793} +{"Pretrain/Learning Rate": 4.727381393475767e-05, "Pretrain/Loss": 2.1592679023742676, "Pretrain/Loss (Raw)": 2.23873233795166, "Pretrain/Step": 1674, "Pretrain/Step Time": 8.55707316659391} +{"Pretrain/Learning Rate": 4.726995742964583e-05, "Pretrain/Loss": 2.157999038696289, "Pretrain/Loss (Raw)": 1.9908050298690796, "Pretrain/Step": 1675, "Pretrain/Step Time": 8.550706705078483} +{"Pretrain/Learning Rate": 4.726609835625755e-05, "Pretrain/Loss": 2.157735586166382, "Pretrain/Loss (Raw)": 2.0461747646331787, "Pretrain/Step": 1676, "Pretrain/Step Time": 8.545496823266149} +{"Pretrain/Learning Rate": 4.726223671503789e-05, "Pretrain/Loss": 2.157613754272461, "Pretrain/Loss (Raw)": 2.118947982788086, "Pretrain/Step": 1677, "Pretrain/Step Time": 8.550655838102102} +{"Pretrain/Learning Rate": 4.725837250643218e-05, "Pretrain/Loss": 2.15783953666687, "Pretrain/Loss (Raw)": 2.0715630054473877, "Pretrain/Step": 1678, "Pretrain/Step Time": 8.54855596087873} +{"Pretrain/Learning Rate": 4.7254505730886075e-05, "Pretrain/Loss": 2.157789707183838, "Pretrain/Loss (Raw)": 2.276231527328491, "Pretrain/Step": 1679, "Pretrain/Step Time": 8.550383869558573} +{"Pretrain/Learning Rate": 4.725063638884551e-05, "Pretrain/Loss": 2.1573190689086914, "Pretrain/Loss (Raw)": 2.1804416179656982, "Pretrain/Step": 1680, "Pretrain/Step Time": 8.551918083801866} +{"Pretrain/Learning Rate": 4.724676448075669e-05, "Pretrain/Loss": 2.1567983627319336, "Pretrain/Loss (Raw)": 2.0751609802246094, "Pretrain/Step": 1681, "Pretrain/Step Time": 8.548276485875249} +{"Pretrain/Learning Rate": 4.724289000706617e-05, "Pretrain/Loss": 2.1541695594787598, "Pretrain/Loss (Raw)": 2.1798059940338135, "Pretrain/Step": 1682, "Pretrain/Step Time": 8.546225108206272} +{"Pretrain/Learning Rate": 4.723901296822076e-05, "Pretrain/Loss": 2.151158571243286, "Pretrain/Loss (Raw)": 2.134695529937744, "Pretrain/Step": 1683, "Pretrain/Step Time": 8.546661008149385} +{"Pretrain/Learning Rate": 4.723513336466759e-05, "Pretrain/Loss": 2.150700092315674, "Pretrain/Loss (Raw)": 2.1519570350646973, "Pretrain/Step": 1684, "Pretrain/Step Time": 8.546541085466743} +{"Pretrain/Learning Rate": 4.723125119685405e-05, "Pretrain/Loss": 2.1490135192871094, "Pretrain/Loss (Raw)": 1.814992070198059, "Pretrain/Step": 1685, "Pretrain/Step Time": 8.556072762235999} +{"Pretrain/Learning Rate": 4.722736646522788e-05, "Pretrain/Loss": 2.1484827995300293, "Pretrain/Loss (Raw)": 2.0774683952331543, "Pretrain/Step": 1686, "Pretrain/Step Time": 8.56106855161488} +{"Pretrain/Learning Rate": 4.722347917023706e-05, "Pretrain/Loss": 2.1480274200439453, "Pretrain/Loss (Raw)": 2.1341657638549805, "Pretrain/Step": 1687, "Pretrain/Step Time": 8.555744485929608} +{"Pretrain/Learning Rate": 4.72195893123299e-05, "Pretrain/Loss": 2.146541118621826, "Pretrain/Loss (Raw)": 2.1035208702087402, "Pretrain/Step": 1688, "Pretrain/Step Time": 8.555484345182776} +{"Pretrain/Learning Rate": 4.7215696891955006e-05, "Pretrain/Loss": 2.1471762657165527, "Pretrain/Loss (Raw)": 1.88633394241333, "Pretrain/Step": 1689, "Pretrain/Step Time": 8.553195629268885} +{"Pretrain/Learning Rate": 4.721180190956126e-05, "Pretrain/Loss": 2.146637439727783, "Pretrain/Loss (Raw)": 2.1140341758728027, "Pretrain/Step": 1690, "Pretrain/Step Time": 8.560835391283035} +{"Pretrain/Learning Rate": 4.7207904365597855e-05, "Pretrain/Loss": 2.1453418731689453, "Pretrain/Loss (Raw)": 2.2149388790130615, "Pretrain/Step": 1691, "Pretrain/Step Time": 8.557034203782678} +{"Pretrain/Learning Rate": 4.720400426051427e-05, "Pretrain/Loss": 2.1451423168182373, "Pretrain/Loss (Raw)": 2.2150301933288574, "Pretrain/Step": 1692, "Pretrain/Step Time": 8.560705410316586} +{"Pretrain/Learning Rate": 4.720010159476028e-05, "Pretrain/Loss": 2.1455929279327393, "Pretrain/Loss (Raw)": 2.4678380489349365, "Pretrain/Step": 1693, "Pretrain/Step Time": 8.555732471868396} +{"Pretrain/Learning Rate": 4.719619636878597e-05, "Pretrain/Loss": 2.1438605785369873, "Pretrain/Loss (Raw)": 2.072874069213867, "Pretrain/Step": 1694, "Pretrain/Step Time": 8.554465813562274} +{"Pretrain/Learning Rate": 4.71922885830417e-05, "Pretrain/Loss": 2.143921375274658, "Pretrain/Loss (Raw)": 2.1932694911956787, "Pretrain/Step": 1695, "Pretrain/Step Time": 8.557281069457531} +{"Pretrain/Learning Rate": 4.718837823797814e-05, "Pretrain/Loss": 2.1411609649658203, "Pretrain/Loss (Raw)": 1.9805314540863037, "Pretrain/Step": 1696, "Pretrain/Step Time": 8.553973013535142} +{"Pretrain/Learning Rate": 4.7184465334046246e-05, "Pretrain/Loss": 2.1398215293884277, "Pretrain/Loss (Raw)": 2.118264675140381, "Pretrain/Step": 1697, "Pretrain/Step Time": 8.56580263748765} +{"Pretrain/Learning Rate": 4.718054987169727e-05, "Pretrain/Loss": 2.1399080753326416, "Pretrain/Loss (Raw)": 2.187987804412842, "Pretrain/Step": 1698, "Pretrain/Step Time": 8.5585294701159} +{"Pretrain/Learning Rate": 4.717663185138276e-05, "Pretrain/Loss": 2.1391444206237793, "Pretrain/Loss (Raw)": 1.967077374458313, "Pretrain/Step": 1699, "Pretrain/Step Time": 8.561669522896409} +{"Pretrain/Learning Rate": 4.7172711273554576e-05, "Pretrain/Loss": 2.137136459350586, "Pretrain/Loss (Raw)": 1.9885804653167725, "Pretrain/Step": 1700, "Pretrain/Step Time": 8.555771850049496} +{"Pretrain/Learning Rate": 4.7168788138664845e-05, "Pretrain/Loss": 2.137690544128418, "Pretrain/Loss (Raw)": 2.1109466552734375, "Pretrain/Step": 1701, "Pretrain/Step Time": 8.556777147576213} +{"Pretrain/Learning Rate": 4.7164862447165995e-05, "Pretrain/Loss": 2.1389918327331543, "Pretrain/Loss (Raw)": 2.1349337100982666, "Pretrain/Step": 1702, "Pretrain/Step Time": 8.55808843486011} +{"Pretrain/Learning Rate": 4.716093419951077e-05, "Pretrain/Loss": 2.138895273208618, "Pretrain/Loss (Raw)": 2.118081569671631, "Pretrain/Step": 1703, "Pretrain/Step Time": 8.565351901575923} +{"Pretrain/Learning Rate": 4.7157003396152184e-05, "Pretrain/Loss": 2.138885498046875, "Pretrain/Loss (Raw)": 2.0843505859375, "Pretrain/Step": 1704, "Pretrain/Step Time": 8.557544397190213} +{"Pretrain/Learning Rate": 4.715307003754356e-05, "Pretrain/Loss": 2.138612747192383, "Pretrain/Loss (Raw)": 1.9806991815567017, "Pretrain/Step": 1705, "Pretrain/Step Time": 8.560636408627033} +{"Pretrain/Learning Rate": 4.714913412413851e-05, "Pretrain/Loss": 2.139247417449951, "Pretrain/Loss (Raw)": 2.0816471576690674, "Pretrain/Step": 1706, "Pretrain/Step Time": 8.56267517618835} +{"Pretrain/Learning Rate": 4.714519565639095e-05, "Pretrain/Loss": 2.138929843902588, "Pretrain/Loss (Raw)": 2.069779634475708, "Pretrain/Step": 1707, "Pretrain/Step Time": 8.562251396477222} +{"Pretrain/Learning Rate": 4.714125463475506e-05, "Pretrain/Loss": 2.1401498317718506, "Pretrain/Loss (Raw)": 2.287616729736328, "Pretrain/Step": 1708, "Pretrain/Step Time": 8.556778259575367} +{"Pretrain/Learning Rate": 4.713731105968536e-05, "Pretrain/Loss": 2.141890048980713, "Pretrain/Loss (Raw)": 2.308424472808838, "Pretrain/Step": 1709, "Pretrain/Step Time": 8.567448876798153} +{"Pretrain/Learning Rate": 4.7133364931636644e-05, "Pretrain/Loss": 2.1416943073272705, "Pretrain/Loss (Raw)": 2.231743335723877, "Pretrain/Step": 1710, "Pretrain/Step Time": 8.556722078472376} +{"Pretrain/Learning Rate": 4.712941625106398e-05, "Pretrain/Loss": 2.1421866416931152, "Pretrain/Loss (Raw)": 2.105637550354004, "Pretrain/Step": 1711, "Pretrain/Step Time": 8.554704494774342} +{"Pretrain/Learning Rate": 4.7125465018422755e-05, "Pretrain/Loss": 2.139950752258301, "Pretrain/Loss (Raw)": 1.906479835510254, "Pretrain/Step": 1712, "Pretrain/Step Time": 8.552727539092302} +{"Pretrain/Learning Rate": 4.7121511234168644e-05, "Pretrain/Loss": 2.1402368545532227, "Pretrain/Loss (Raw)": 2.2208878993988037, "Pretrain/Step": 1713, "Pretrain/Step Time": 8.551160642877221} +{"Pretrain/Learning Rate": 4.711755489875762e-05, "Pretrain/Loss": 2.1416842937469482, "Pretrain/Loss (Raw)": 2.1192266941070557, "Pretrain/Step": 1714, "Pretrain/Step Time": 8.552965397015214} +{"Pretrain/Learning Rate": 4.711359601264594e-05, "Pretrain/Loss": 2.142033576965332, "Pretrain/Loss (Raw)": 2.2472214698791504, "Pretrain/Step": 1715, "Pretrain/Step Time": 8.560083327814937} +{"Pretrain/Learning Rate": 4.7109634576290175e-05, "Pretrain/Loss": 2.1407880783081055, "Pretrain/Loss (Raw)": 1.956042766571045, "Pretrain/Step": 1716, "Pretrain/Step Time": 8.549730241298676} +{"Pretrain/Learning Rate": 4.710567059014716e-05, "Pretrain/Loss": 2.140803813934326, "Pretrain/Loss (Raw)": 2.113006353378296, "Pretrain/Step": 1717, "Pretrain/Step Time": 8.5516273714602} +{"Pretrain/Learning Rate": 4.710170405467405e-05, "Pretrain/Loss": 2.1403870582580566, "Pretrain/Loss (Raw)": 2.278390407562256, "Pretrain/Step": 1718, "Pretrain/Step Time": 8.55529759824276} +{"Pretrain/Learning Rate": 4.709773497032828e-05, "Pretrain/Loss": 2.144265651702881, "Pretrain/Loss (Raw)": 2.412062406539917, "Pretrain/Step": 1719, "Pretrain/Step Time": 8.552008984610438} +{"Pretrain/Learning Rate": 4.7093763337567585e-05, "Pretrain/Loss": 2.144209384918213, "Pretrain/Loss (Raw)": 2.001680850982666, "Pretrain/Step": 1720, "Pretrain/Step Time": 8.554118942469358} +{"Pretrain/Learning Rate": 4.708978915685e-05, "Pretrain/Loss": 2.1423840522766113, "Pretrain/Loss (Raw)": 1.979123830795288, "Pretrain/Step": 1721, "Pretrain/Step Time": 8.554728230461478} +{"Pretrain/Learning Rate": 4.708581242863382e-05, "Pretrain/Loss": 2.1457152366638184, "Pretrain/Loss (Raw)": 2.3665988445281982, "Pretrain/Step": 1722, "Pretrain/Step Time": 8.548280412331223} +{"Pretrain/Learning Rate": 4.7081833153377694e-05, "Pretrain/Loss": 2.144982099533081, "Pretrain/Loss (Raw)": 2.1740803718566895, "Pretrain/Step": 1723, "Pretrain/Step Time": 8.555134128779173} +{"Pretrain/Learning Rate": 4.707785133154051e-05, "Pretrain/Loss": 2.1443934440612793, "Pretrain/Loss (Raw)": 2.1095359325408936, "Pretrain/Step": 1724, "Pretrain/Step Time": 8.553429834544659} +{"Pretrain/Learning Rate": 4.707386696358148e-05, "Pretrain/Loss": 2.141449213027954, "Pretrain/Loss (Raw)": 2.114450693130493, "Pretrain/Step": 1725, "Pretrain/Step Time": 8.552411353215575} +{"Pretrain/Learning Rate": 4.7069880049960104e-05, "Pretrain/Loss": 2.140822649002075, "Pretrain/Loss (Raw)": 2.165494441986084, "Pretrain/Step": 1726, "Pretrain/Step Time": 8.553453052416444} +{"Pretrain/Learning Rate": 4.7065890591136154e-05, "Pretrain/Loss": 2.1402950286865234, "Pretrain/Loss (Raw)": 2.0786752700805664, "Pretrain/Step": 1727, "Pretrain/Step Time": 8.552906295284629} +{"Pretrain/Learning Rate": 4.706189858756972e-05, "Pretrain/Loss": 2.1373519897460938, "Pretrain/Loss (Raw)": 1.815524935722351, "Pretrain/Step": 1728, "Pretrain/Step Time": 8.554733544588089} +{"Pretrain/Learning Rate": 4.705790403972119e-05, "Pretrain/Loss": 2.136702060699463, "Pretrain/Loss (Raw)": 2.034097671508789, "Pretrain/Step": 1729, "Pretrain/Step Time": 8.558418344706297} +{"Pretrain/Learning Rate": 4.705390694805122e-05, "Pretrain/Loss": 2.135178565979004, "Pretrain/Loss (Raw)": 1.9231206178665161, "Pretrain/Step": 1730, "Pretrain/Step Time": 8.557701345533133} +{"Pretrain/Learning Rate": 4.704990731302078e-05, "Pretrain/Loss": 2.134976863861084, "Pretrain/Loss (Raw)": 2.230128765106201, "Pretrain/Step": 1731, "Pretrain/Step Time": 8.556219328194857} +{"Pretrain/Learning Rate": 4.7045905135091126e-05, "Pretrain/Loss": 2.137911796569824, "Pretrain/Loss (Raw)": 2.500941514968872, "Pretrain/Step": 1732, "Pretrain/Step Time": 8.556326508522034} +{"Pretrain/Learning Rate": 4.704190041472381e-05, "Pretrain/Loss": 2.1373980045318604, "Pretrain/Loss (Raw)": 2.194904327392578, "Pretrain/Step": 1733, "Pretrain/Step Time": 8.551733491942286} +{"Pretrain/Learning Rate": 4.703789315238067e-05, "Pretrain/Loss": 2.135834217071533, "Pretrain/Loss (Raw)": 1.9222114086151123, "Pretrain/Step": 1734, "Pretrain/Step Time": 8.563713600859046} +{"Pretrain/Learning Rate": 4.703388334852385e-05, "Pretrain/Loss": 2.135356903076172, "Pretrain/Loss (Raw)": 2.1643924713134766, "Pretrain/Step": 1735, "Pretrain/Step Time": 8.562526378780603} +{"Pretrain/Learning Rate": 4.7029871003615776e-05, "Pretrain/Loss": 2.1339380741119385, "Pretrain/Loss (Raw)": 2.045149564743042, "Pretrain/Step": 1736, "Pretrain/Step Time": 8.564202388748527} +{"Pretrain/Learning Rate": 4.7025856118119164e-05, "Pretrain/Loss": 2.134097099304199, "Pretrain/Loss (Raw)": 2.0989177227020264, "Pretrain/Step": 1737, "Pretrain/Step Time": 8.560678819194436} +{"Pretrain/Learning Rate": 4.7021838692497046e-05, "Pretrain/Loss": 2.137328624725342, "Pretrain/Loss (Raw)": 2.3260881900787354, "Pretrain/Step": 1738, "Pretrain/Step Time": 8.559898506850004} +{"Pretrain/Learning Rate": 4.70178187272127e-05, "Pretrain/Loss": 2.1386430263519287, "Pretrain/Loss (Raw)": 2.2742202281951904, "Pretrain/Step": 1739, "Pretrain/Step Time": 8.565074782818556} +{"Pretrain/Learning Rate": 4.701379622272977e-05, "Pretrain/Loss": 2.138765811920166, "Pretrain/Loss (Raw)": 2.165998697280884, "Pretrain/Step": 1740, "Pretrain/Step Time": 8.562008308246732} +{"Pretrain/Learning Rate": 4.700977117951211e-05, "Pretrain/Loss": 2.1386752128601074, "Pretrain/Loss (Raw)": 2.0903611183166504, "Pretrain/Step": 1741, "Pretrain/Step Time": 8.565864235162735} +{"Pretrain/Learning Rate": 4.700574359802393e-05, "Pretrain/Loss": 2.1374435424804688, "Pretrain/Loss (Raw)": 2.202066659927368, "Pretrain/Step": 1742, "Pretrain/Step Time": 8.56802824512124} +{"Pretrain/Learning Rate": 4.700171347872971e-05, "Pretrain/Loss": 2.1402745246887207, "Pretrain/Loss (Raw)": 2.4270200729370117, "Pretrain/Step": 1743, "Pretrain/Step Time": 8.562874658033252} +{"Pretrain/Learning Rate": 4.699768082209421e-05, "Pretrain/Loss": 2.139833927154541, "Pretrain/Loss (Raw)": 1.997346043586731, "Pretrain/Step": 1744, "Pretrain/Step Time": 8.563914325088263} +{"Pretrain/Learning Rate": 4.69936456285825e-05, "Pretrain/Loss": 2.139833450317383, "Pretrain/Loss (Raw)": 2.1995694637298584, "Pretrain/Step": 1745, "Pretrain/Step Time": 8.565918885171413} +{"Pretrain/Learning Rate": 4.698960789865994e-05, "Pretrain/Loss": 2.139918804168701, "Pretrain/Loss (Raw)": 2.193758964538574, "Pretrain/Step": 1746, "Pretrain/Step Time": 8.56027670018375} +{"Pretrain/Learning Rate": 4.698556763279218e-05, "Pretrain/Loss": 2.140683650970459, "Pretrain/Loss (Raw)": 2.2664880752563477, "Pretrain/Step": 1747, "Pretrain/Step Time": 8.56616135686636} +{"Pretrain/Learning Rate": 4.698152483144516e-05, "Pretrain/Loss": 2.1415107250213623, "Pretrain/Loss (Raw)": 2.1992650032043457, "Pretrain/Step": 1748, "Pretrain/Step Time": 8.560887260362506} +{"Pretrain/Learning Rate": 4.697747949508512e-05, "Pretrain/Loss": 2.1418509483337402, "Pretrain/Loss (Raw)": 2.1343910694122314, "Pretrain/Step": 1749, "Pretrain/Step Time": 8.562868343666196} +{"Pretrain/Learning Rate": 4.697343162417858e-05, "Pretrain/Loss": 2.140185832977295, "Pretrain/Loss (Raw)": 2.115567207336426, "Pretrain/Step": 1750, "Pretrain/Step Time": 8.558866754174232} +{"Pretrain/Learning Rate": 4.696938121919235e-05, "Pretrain/Loss": 2.1386964321136475, "Pretrain/Loss (Raw)": 2.0823819637298584, "Pretrain/Step": 1751, "Pretrain/Step Time": 8.569212252274156} +{"Pretrain/Learning Rate": 4.696532828059358e-05, "Pretrain/Loss": 2.137575626373291, "Pretrain/Loss (Raw)": 2.1130006313323975, "Pretrain/Step": 1752, "Pretrain/Step Time": 8.558323226869106} +{"Pretrain/Learning Rate": 4.6961272808849634e-05, "Pretrain/Loss": 2.1374921798706055, "Pretrain/Loss (Raw)": 2.2050259113311768, "Pretrain/Step": 1753, "Pretrain/Step Time": 8.555457595735788} +{"Pretrain/Learning Rate": 4.6957214804428217e-05, "Pretrain/Loss": 2.136691093444824, "Pretrain/Loss (Raw)": 2.0304620265960693, "Pretrain/Step": 1754, "Pretrain/Step Time": 8.551404254510999} +{"Pretrain/Learning Rate": 4.695315426779734e-05, "Pretrain/Loss": 2.139209032058716, "Pretrain/Loss (Raw)": 2.340106964111328, "Pretrain/Step": 1755, "Pretrain/Step Time": 8.552485827356577} +{"Pretrain/Learning Rate": 4.694909119942526e-05, "Pretrain/Loss": 2.135097026824951, "Pretrain/Loss (Raw)": 1.869033932685852, "Pretrain/Step": 1756, "Pretrain/Step Time": 8.551398558542132} +{"Pretrain/Learning Rate": 4.694502559978055e-05, "Pretrain/Loss": 2.135190963745117, "Pretrain/Loss (Raw)": 2.335116147994995, "Pretrain/Step": 1757, "Pretrain/Step Time": 8.557356985285878} +{"Pretrain/Learning Rate": 4.694095746933208e-05, "Pretrain/Loss": 2.1351263523101807, "Pretrain/Loss (Raw)": 2.221052646636963, "Pretrain/Step": 1758, "Pretrain/Step Time": 8.551236124709249} +{"Pretrain/Learning Rate": 4.6936886808549004e-05, "Pretrain/Loss": 2.134958028793335, "Pretrain/Loss (Raw)": 2.1251230239868164, "Pretrain/Step": 1759, "Pretrain/Step Time": 8.554372550919652} +{"Pretrain/Learning Rate": 4.693281361790077e-05, "Pretrain/Loss": 2.132599353790283, "Pretrain/Loss (Raw)": 2.020026445388794, "Pretrain/Step": 1760, "Pretrain/Step Time": 8.548240778967738} +{"Pretrain/Learning Rate": 4.6928737897857124e-05, "Pretrain/Loss": 2.1331050395965576, "Pretrain/Loss (Raw)": 2.221379280090332, "Pretrain/Step": 1761, "Pretrain/Step Time": 8.546436376869678} +{"Pretrain/Learning Rate": 4.692465964888809e-05, "Pretrain/Loss": 2.134681224822998, "Pretrain/Loss (Raw)": 2.2321102619171143, "Pretrain/Step": 1762, "Pretrain/Step Time": 8.549300942569971} +{"Pretrain/Learning Rate": 4.692057887146399e-05, "Pretrain/Loss": 2.1341702938079834, "Pretrain/Loss (Raw)": 2.16658353805542, "Pretrain/Step": 1763, "Pretrain/Step Time": 8.549441132694483} +{"Pretrain/Learning Rate": 4.691649556605545e-05, "Pretrain/Loss": 2.1334338188171387, "Pretrain/Loss (Raw)": 2.0630531311035156, "Pretrain/Step": 1764, "Pretrain/Step Time": 8.55032785050571} +{"Pretrain/Learning Rate": 4.691240973313337e-05, "Pretrain/Loss": 2.13450288772583, "Pretrain/Loss (Raw)": 2.103301525115967, "Pretrain/Step": 1765, "Pretrain/Step Time": 8.54578792117536} +{"Pretrain/Learning Rate": 4.690832137316893e-05, "Pretrain/Loss": 2.1324048042297363, "Pretrain/Loss (Raw)": 2.0621538162231445, "Pretrain/Step": 1766, "Pretrain/Step Time": 8.541783360764384} +{"Pretrain/Learning Rate": 4.690423048663364e-05, "Pretrain/Loss": 2.131300449371338, "Pretrain/Loss (Raw)": 2.0594496726989746, "Pretrain/Step": 1767, "Pretrain/Step Time": 8.550401277840137} +{"Pretrain/Learning Rate": 4.690013707399928e-05, "Pretrain/Loss": 2.131995439529419, "Pretrain/Loss (Raw)": 2.0596892833709717, "Pretrain/Step": 1768, "Pretrain/Step Time": 8.548473440110683} +{"Pretrain/Learning Rate": 4.689604113573791e-05, "Pretrain/Loss": 2.1318798065185547, "Pretrain/Loss (Raw)": 2.1254677772521973, "Pretrain/Step": 1769, "Pretrain/Step Time": 8.548692913725972} +{"Pretrain/Learning Rate": 4.68919426723219e-05, "Pretrain/Loss": 2.1314356327056885, "Pretrain/Loss (Raw)": 2.078186511993408, "Pretrain/Step": 1770, "Pretrain/Step Time": 8.549884246662259} +{"Pretrain/Learning Rate": 4.6887841684223905e-05, "Pretrain/Loss": 2.129542350769043, "Pretrain/Loss (Raw)": 2.0517959594726562, "Pretrain/Step": 1771, "Pretrain/Step Time": 8.546060198917985} +{"Pretrain/Learning Rate": 4.688373817191687e-05, "Pretrain/Loss": 2.1288509368896484, "Pretrain/Loss (Raw)": 2.113306760787964, "Pretrain/Step": 1772, "Pretrain/Step Time": 8.543542245402932} +{"Pretrain/Learning Rate": 4.687963213587402e-05, "Pretrain/Loss": 2.127821445465088, "Pretrain/Loss (Raw)": 2.0034093856811523, "Pretrain/Step": 1773, "Pretrain/Step Time": 8.5425682682544} +{"Pretrain/Learning Rate": 4.6875523576568895e-05, "Pretrain/Loss": 2.1313064098358154, "Pretrain/Loss (Raw)": 2.5934433937072754, "Pretrain/Step": 1774, "Pretrain/Step Time": 8.541486650705338} +{"Pretrain/Learning Rate": 4.6871412494475316e-05, "Pretrain/Loss": 2.1301920413970947, "Pretrain/Loss (Raw)": 2.141186237335205, "Pretrain/Step": 1775, "Pretrain/Step Time": 8.539924031123519} +{"Pretrain/Learning Rate": 4.6867298890067377e-05, "Pretrain/Loss": 2.131535530090332, "Pretrain/Loss (Raw)": 2.273000955581665, "Pretrain/Step": 1776, "Pretrain/Step Time": 8.538878405466676} +{"Pretrain/Learning Rate": 4.68631827638195e-05, "Pretrain/Loss": 2.1320409774780273, "Pretrain/Loss (Raw)": 2.039175033569336, "Pretrain/Step": 1777, "Pretrain/Step Time": 8.537741094827652} +{"Pretrain/Learning Rate": 4.6859064116206356e-05, "Pretrain/Loss": 2.1326775550842285, "Pretrain/Loss (Raw)": 2.2308242321014404, "Pretrain/Step": 1778, "Pretrain/Step Time": 8.542664214968681} +{"Pretrain/Learning Rate": 4.685494294770294e-05, "Pretrain/Loss": 2.130995988845825, "Pretrain/Loss (Raw)": 1.9635368585586548, "Pretrain/Step": 1779, "Pretrain/Step Time": 8.539518924430013} +{"Pretrain/Learning Rate": 4.685081925878452e-05, "Pretrain/Loss": 2.1307125091552734, "Pretrain/Loss (Raw)": 2.232649803161621, "Pretrain/Step": 1780, "Pretrain/Step Time": 8.543813325464725} +{"Pretrain/Learning Rate": 4.684669304992665e-05, "Pretrain/Loss": 2.131178617477417, "Pretrain/Loss (Raw)": 2.2065868377685547, "Pretrain/Step": 1781, "Pretrain/Step Time": 8.541188349947333} +{"Pretrain/Learning Rate": 4.6842564321605196e-05, "Pretrain/Loss": 2.13118314743042, "Pretrain/Loss (Raw)": 2.2048826217651367, "Pretrain/Step": 1782, "Pretrain/Step Time": 8.546604871749878} +{"Pretrain/Learning Rate": 4.683843307429631e-05, "Pretrain/Loss": 2.1346960067749023, "Pretrain/Loss (Raw)": 2.3038532733917236, "Pretrain/Step": 1783, "Pretrain/Step Time": 8.548936542123556} +{"Pretrain/Learning Rate": 4.68342993084764e-05, "Pretrain/Loss": 2.1362650394439697, "Pretrain/Loss (Raw)": 2.2484068870544434, "Pretrain/Step": 1784, "Pretrain/Step Time": 8.549719899892807} +{"Pretrain/Learning Rate": 4.683016302462221e-05, "Pretrain/Loss": 2.1362433433532715, "Pretrain/Loss (Raw)": 2.209829092025757, "Pretrain/Step": 1785, "Pretrain/Step Time": 8.545716481283307} +{"Pretrain/Learning Rate": 4.682602422321076e-05, "Pretrain/Loss": 2.1340508460998535, "Pretrain/Loss (Raw)": 1.9293025732040405, "Pretrain/Step": 1786, "Pretrain/Step Time": 8.548225786536932} +{"Pretrain/Learning Rate": 4.6821882904719344e-05, "Pretrain/Loss": 2.1364245414733887, "Pretrain/Loss (Raw)": 2.2827394008636475, "Pretrain/Step": 1787, "Pretrain/Step Time": 8.54977666027844} +{"Pretrain/Learning Rate": 4.6817739069625563e-05, "Pretrain/Loss": 2.1370413303375244, "Pretrain/Loss (Raw)": 2.1211588382720947, "Pretrain/Step": 1788, "Pretrain/Step Time": 8.551454696804285} +{"Pretrain/Learning Rate": 4.681359271840731e-05, "Pretrain/Loss": 2.1370553970336914, "Pretrain/Loss (Raw)": 2.0518555641174316, "Pretrain/Step": 1789, "Pretrain/Step Time": 8.546062503010035} +{"Pretrain/Learning Rate": 4.6809443851542744e-05, "Pretrain/Loss": 2.1351866722106934, "Pretrain/Loss (Raw)": 2.0346498489379883, "Pretrain/Step": 1790, "Pretrain/Step Time": 8.551896590739489} +{"Pretrain/Learning Rate": 4.680529246951035e-05, "Pretrain/Loss": 2.1348836421966553, "Pretrain/Loss (Raw)": 2.1906023025512695, "Pretrain/Step": 1791, "Pretrain/Step Time": 8.545388281345367} +{"Pretrain/Learning Rate": 4.6801138572788885e-05, "Pretrain/Loss": 2.137343645095825, "Pretrain/Loss (Raw)": 2.237053871154785, "Pretrain/Step": 1792, "Pretrain/Step Time": 8.547265173867345} +{"Pretrain/Learning Rate": 4.679698216185738e-05, "Pretrain/Loss": 2.1376442909240723, "Pretrain/Loss (Raw)": 2.009692430496216, "Pretrain/Step": 1793, "Pretrain/Step Time": 8.548840867355466} +{"Pretrain/Learning Rate": 4.6792823237195185e-05, "Pretrain/Loss": 2.136669397354126, "Pretrain/Loss (Raw)": 2.1319072246551514, "Pretrain/Step": 1794, "Pretrain/Step Time": 8.55547091551125} +{"Pretrain/Learning Rate": 4.678866179928193e-05, "Pretrain/Loss": 2.1368134021759033, "Pretrain/Loss (Raw)": 2.2470290660858154, "Pretrain/Step": 1795, "Pretrain/Step Time": 8.54963344708085} +{"Pretrain/Learning Rate": 4.6784497848597516e-05, "Pretrain/Loss": 2.1382012367248535, "Pretrain/Loss (Raw)": 2.14898419380188, "Pretrain/Step": 1796, "Pretrain/Step Time": 8.552930515259504} +{"Pretrain/Learning Rate": 4.678033138562216e-05, "Pretrain/Loss": 2.138840913772583, "Pretrain/Loss (Raw)": 2.108802556991577, "Pretrain/Step": 1797, "Pretrain/Step Time": 8.550405057147145} +{"Pretrain/Learning Rate": 4.6776162410836354e-05, "Pretrain/Loss": 2.137838125228882, "Pretrain/Loss (Raw)": 2.0462281703948975, "Pretrain/Step": 1798, "Pretrain/Step Time": 8.555944167077541} +{"Pretrain/Learning Rate": 4.677199092472089e-05, "Pretrain/Loss": 2.1382977962493896, "Pretrain/Loss (Raw)": 2.097104072570801, "Pretrain/Step": 1799, "Pretrain/Step Time": 8.552054608240724} +{"Pretrain/Learning Rate": 4.6767816927756834e-05, "Pretrain/Loss": 2.1352694034576416, "Pretrain/Loss (Raw)": 1.9445672035217285, "Pretrain/Step": 1800, "Pretrain/Step Time": 8.550131464377046} +{"Pretrain/Learning Rate": 4.6763640420425566e-05, "Pretrain/Loss": 2.134692430496216, "Pretrain/Loss (Raw)": 2.0506045818328857, "Pretrain/Step": 1801, "Pretrain/Step Time": 8.551584733650088} +{"Pretrain/Learning Rate": 4.675946140320873e-05, "Pretrain/Loss": 2.1339974403381348, "Pretrain/Loss (Raw)": 2.149740219116211, "Pretrain/Step": 1802, "Pretrain/Step Time": 8.550170879811049} +{"Pretrain/Learning Rate": 4.6755279876588256e-05, "Pretrain/Loss": 2.135204792022705, "Pretrain/Loss (Raw)": 2.14536452293396, "Pretrain/Step": 1803, "Pretrain/Step Time": 8.550165506079793} +{"Pretrain/Learning Rate": 4.67510958410464e-05, "Pretrain/Loss": 2.13742733001709, "Pretrain/Loss (Raw)": 2.3306827545166016, "Pretrain/Step": 1804, "Pretrain/Step Time": 8.55257355235517} +{"Pretrain/Learning Rate": 4.6746909297065685e-05, "Pretrain/Loss": 2.137598991394043, "Pretrain/Loss (Raw)": 2.140864849090576, "Pretrain/Step": 1805, "Pretrain/Step Time": 8.548736369237304} +{"Pretrain/Learning Rate": 4.674272024512891e-05, "Pretrain/Loss": 2.139975070953369, "Pretrain/Loss (Raw)": 2.375728130340576, "Pretrain/Step": 1806, "Pretrain/Step Time": 8.556078949943185} +{"Pretrain/Learning Rate": 4.6738528685719185e-05, "Pretrain/Loss": 2.138063430786133, "Pretrain/Loss (Raw)": 2.031538248062134, "Pretrain/Step": 1807, "Pretrain/Step Time": 8.555258009582758} +{"Pretrain/Learning Rate": 4.673433461931989e-05, "Pretrain/Loss": 2.1398632526397705, "Pretrain/Loss (Raw)": 2.4108340740203857, "Pretrain/Step": 1808, "Pretrain/Step Time": 8.553078420460224} +{"Pretrain/Learning Rate": 4.6730138046414714e-05, "Pretrain/Loss": 2.140843391418457, "Pretrain/Loss (Raw)": 2.200615644454956, "Pretrain/Step": 1809, "Pretrain/Step Time": 8.556852674111724} +{"Pretrain/Learning Rate": 4.672593896748763e-05, "Pretrain/Loss": 2.1401710510253906, "Pretrain/Loss (Raw)": 2.0937530994415283, "Pretrain/Step": 1810, "Pretrain/Step Time": 8.557685434818268} +{"Pretrain/Learning Rate": 4.6721737383022876e-05, "Pretrain/Loss": 2.1399760246276855, "Pretrain/Loss (Raw)": 2.10970401763916, "Pretrain/Step": 1811, "Pretrain/Step Time": 8.55975766479969} +{"Pretrain/Learning Rate": 4.671753329350502e-05, "Pretrain/Loss": 2.140921115875244, "Pretrain/Loss (Raw)": 2.272963523864746, "Pretrain/Step": 1812, "Pretrain/Step Time": 8.562557082623243} +{"Pretrain/Learning Rate": 4.671332669941888e-05, "Pretrain/Loss": 2.1409575939178467, "Pretrain/Loss (Raw)": 1.8196347951889038, "Pretrain/Step": 1813, "Pretrain/Step Time": 8.554392782971263} +{"Pretrain/Learning Rate": 4.6709117601249596e-05, "Pretrain/Loss": 2.141308307647705, "Pretrain/Loss (Raw)": 2.1223905086517334, "Pretrain/Step": 1814, "Pretrain/Step Time": 8.55519406683743} +{"Pretrain/Learning Rate": 4.6704905999482575e-05, "Pretrain/Loss": 2.141263961791992, "Pretrain/Loss (Raw)": 2.128450393676758, "Pretrain/Step": 1815, "Pretrain/Step Time": 8.55926913022995} +{"Pretrain/Learning Rate": 4.670069189460351e-05, "Pretrain/Loss": 2.1414759159088135, "Pretrain/Loss (Raw)": 2.1306846141815186, "Pretrain/Step": 1816, "Pretrain/Step Time": 8.551626542583108} +{"Pretrain/Learning Rate": 4.6696475287098396e-05, "Pretrain/Loss": 2.142666816711426, "Pretrain/Loss (Raw)": 2.038747787475586, "Pretrain/Step": 1817, "Pretrain/Step Time": 8.5547777954489} +{"Pretrain/Learning Rate": 4.669225617745352e-05, "Pretrain/Loss": 2.1420273780822754, "Pretrain/Loss (Raw)": 2.032216787338257, "Pretrain/Step": 1818, "Pretrain/Step Time": 8.550939561799169} +{"Pretrain/Learning Rate": 4.668803456615545e-05, "Pretrain/Loss": 2.14170503616333, "Pretrain/Loss (Raw)": 2.1736605167388916, "Pretrain/Step": 1819, "Pretrain/Step Time": 8.553021444007754} +{"Pretrain/Learning Rate": 4.668381045369102e-05, "Pretrain/Loss": 2.138760566711426, "Pretrain/Loss (Raw)": 1.8381340503692627, "Pretrain/Step": 1820, "Pretrain/Step Time": 8.553789695724845} +{"Pretrain/Learning Rate": 4.6679583840547405e-05, "Pretrain/Loss": 2.1372828483581543, "Pretrain/Loss (Raw)": 2.278657913208008, "Pretrain/Step": 1821, "Pretrain/Step Time": 8.55425233580172} +{"Pretrain/Learning Rate": 4.667535472721203e-05, "Pretrain/Loss": 2.138601779937744, "Pretrain/Loss (Raw)": 2.241718292236328, "Pretrain/Step": 1822, "Pretrain/Step Time": 8.55098077468574} +{"Pretrain/Learning Rate": 4.66711231141726e-05, "Pretrain/Loss": 2.1376514434814453, "Pretrain/Loss (Raw)": 2.071641683578491, "Pretrain/Step": 1823, "Pretrain/Step Time": 8.552355593070388} +{"Pretrain/Learning Rate": 4.6666889001917136e-05, "Pretrain/Loss": 2.139078140258789, "Pretrain/Loss (Raw)": 2.163144111633301, "Pretrain/Step": 1824, "Pretrain/Step Time": 8.552360204979777} +{"Pretrain/Learning Rate": 4.666265239093393e-05, "Pretrain/Loss": 2.140554904937744, "Pretrain/Loss (Raw)": 2.3072893619537354, "Pretrain/Step": 1825, "Pretrain/Step Time": 8.548107009381056} +{"Pretrain/Learning Rate": 4.665841328171158e-05, "Pretrain/Loss": 2.139224052429199, "Pretrain/Loss (Raw)": 2.01765775680542, "Pretrain/Step": 1826, "Pretrain/Step Time": 8.547114485874772} +{"Pretrain/Learning Rate": 4.665417167473894e-05, "Pretrain/Loss": 2.142411231994629, "Pretrain/Loss (Raw)": 2.3750431537628174, "Pretrain/Step": 1827, "Pretrain/Step Time": 8.548593152314425} +{"Pretrain/Learning Rate": 4.66499275705052e-05, "Pretrain/Loss": 2.14438796043396, "Pretrain/Loss (Raw)": 2.241586208343506, "Pretrain/Step": 1828, "Pretrain/Step Time": 8.548349352553487} +{"Pretrain/Learning Rate": 4.6645680969499795e-05, "Pretrain/Loss": 2.1444201469421387, "Pretrain/Loss (Raw)": 2.1150424480438232, "Pretrain/Step": 1829, "Pretrain/Step Time": 8.5451077837497} +{"Pretrain/Learning Rate": 4.664143187221245e-05, "Pretrain/Loss": 2.1444091796875, "Pretrain/Loss (Raw)": 2.1335368156433105, "Pretrain/Step": 1830, "Pretrain/Step Time": 8.549822779372334} +{"Pretrain/Learning Rate": 4.6637180279133216e-05, "Pretrain/Loss": 2.1453042030334473, "Pretrain/Loss (Raw)": 2.2326292991638184, "Pretrain/Step": 1831, "Pretrain/Step Time": 8.543833766132593} +{"Pretrain/Learning Rate": 4.6632926190752385e-05, "Pretrain/Loss": 2.1458144187927246, "Pretrain/Loss (Raw)": 2.149689197540283, "Pretrain/Step": 1832, "Pretrain/Step Time": 8.541537586599588} +{"Pretrain/Learning Rate": 4.662866960756057e-05, "Pretrain/Loss": 2.148392677307129, "Pretrain/Loss (Raw)": 2.3107051849365234, "Pretrain/Step": 1833, "Pretrain/Step Time": 8.540592404082417} +{"Pretrain/Learning Rate": 4.662441053004866e-05, "Pretrain/Loss": 2.148193120956421, "Pretrain/Loss (Raw)": 2.056105852127075, "Pretrain/Step": 1834, "Pretrain/Step Time": 8.538102228194475} +{"Pretrain/Learning Rate": 4.6620148958707833e-05, "Pretrain/Loss": 2.147460460662842, "Pretrain/Loss (Raw)": 1.9759923219680786, "Pretrain/Step": 1835, "Pretrain/Step Time": 8.539998261258006} +{"Pretrain/Learning Rate": 4.661588489402955e-05, "Pretrain/Loss": 2.1452994346618652, "Pretrain/Loss (Raw)": 2.0110251903533936, "Pretrain/Step": 1836, "Pretrain/Step Time": 8.546847591176629} +{"Pretrain/Learning Rate": 4.661161833650556e-05, "Pretrain/Loss": 2.1463117599487305, "Pretrain/Loss (Raw)": 2.4379639625549316, "Pretrain/Step": 1837, "Pretrain/Step Time": 8.536711165681481} +{"Pretrain/Learning Rate": 4.660734928662791e-05, "Pretrain/Loss": 2.1457955837249756, "Pretrain/Loss (Raw)": 2.165692090988159, "Pretrain/Step": 1838, "Pretrain/Step Time": 8.543712180107832} +{"Pretrain/Learning Rate": 4.660307774488892e-05, "Pretrain/Loss": 2.1463980674743652, "Pretrain/Loss (Raw)": 2.1827545166015625, "Pretrain/Step": 1839, "Pretrain/Step Time": 8.543987296521664} +{"Pretrain/Learning Rate": 4.65988037117812e-05, "Pretrain/Loss": 2.147981643676758, "Pretrain/Loss (Raw)": 2.1091959476470947, "Pretrain/Step": 1840, "Pretrain/Step Time": 8.543371256440878} +{"Pretrain/Learning Rate": 4.659452718779768e-05, "Pretrain/Loss": 2.1480236053466797, "Pretrain/Loss (Raw)": 2.2262685298919678, "Pretrain/Step": 1841, "Pretrain/Step Time": 8.540490228682756} +{"Pretrain/Learning Rate": 4.6590248173431505e-05, "Pretrain/Loss": 2.1482908725738525, "Pretrain/Loss (Raw)": 2.1534135341644287, "Pretrain/Step": 1842, "Pretrain/Step Time": 8.548109808936715} +{"Pretrain/Learning Rate": 4.6585966669176186e-05, "Pretrain/Loss": 2.147394895553589, "Pretrain/Loss (Raw)": 2.1325454711914062, "Pretrain/Step": 1843, "Pretrain/Step Time": 8.540411850437522} +{"Pretrain/Learning Rate": 4.658168267552547e-05, "Pretrain/Loss": 2.147996425628662, "Pretrain/Loss (Raw)": 2.0330162048339844, "Pretrain/Step": 1844, "Pretrain/Step Time": 8.54937351681292} +{"Pretrain/Learning Rate": 4.657739619297342e-05, "Pretrain/Loss": 2.1474409103393555, "Pretrain/Loss (Raw)": 2.0419371128082275, "Pretrain/Step": 1845, "Pretrain/Step Time": 8.550931328907609} +{"Pretrain/Learning Rate": 4.657310722201436e-05, "Pretrain/Loss": 2.1445136070251465, "Pretrain/Loss (Raw)": 1.9036756753921509, "Pretrain/Step": 1846, "Pretrain/Step Time": 8.547029759734869} +{"Pretrain/Learning Rate": 4.6568815763142914e-05, "Pretrain/Loss": 2.1421241760253906, "Pretrain/Loss (Raw)": 2.1062097549438477, "Pretrain/Step": 1847, "Pretrain/Step Time": 8.550143770873547} +{"Pretrain/Learning Rate": 4.6564521816854e-05, "Pretrain/Loss": 2.1436145305633545, "Pretrain/Loss (Raw)": 2.1924495697021484, "Pretrain/Step": 1848, "Pretrain/Step Time": 8.55146493203938} +{"Pretrain/Learning Rate": 4.656022538364282e-05, "Pretrain/Loss": 2.144219398498535, "Pretrain/Loss (Raw)": 2.05655574798584, "Pretrain/Step": 1849, "Pretrain/Step Time": 8.543941536918283} +{"Pretrain/Learning Rate": 4.655592646400485e-05, "Pretrain/Loss": 2.142617702484131, "Pretrain/Loss (Raw)": 2.161569595336914, "Pretrain/Step": 1850, "Pretrain/Step Time": 8.546537032350898} +{"Pretrain/Learning Rate": 4.6551625058435866e-05, "Pretrain/Loss": 2.141162872314453, "Pretrain/Loss (Raw)": 1.9878634214401245, "Pretrain/Step": 1851, "Pretrain/Step Time": 8.54305088892579} +{"Pretrain/Learning Rate": 4.654732116743194e-05, "Pretrain/Loss": 2.1400489807128906, "Pretrain/Loss (Raw)": 1.9669537544250488, "Pretrain/Step": 1852, "Pretrain/Step Time": 8.542555334046483} +{"Pretrain/Learning Rate": 4.654301479148938e-05, "Pretrain/Loss": 2.140558958053589, "Pretrain/Loss (Raw)": 2.179743528366089, "Pretrain/Step": 1853, "Pretrain/Step Time": 8.540860202163458} +{"Pretrain/Learning Rate": 4.653870593110485e-05, "Pretrain/Loss": 2.140012502670288, "Pretrain/Loss (Raw)": 2.0955464839935303, "Pretrain/Step": 1854, "Pretrain/Step Time": 8.539562530815601} +{"Pretrain/Learning Rate": 4.6534394586775254e-05, "Pretrain/Loss": 2.1383605003356934, "Pretrain/Loss (Raw)": 1.8672047853469849, "Pretrain/Step": 1855, "Pretrain/Step Time": 8.549100134521723} +{"Pretrain/Learning Rate": 4.653008075899781e-05, "Pretrain/Loss": 2.137918472290039, "Pretrain/Loss (Raw)": 1.7589436769485474, "Pretrain/Step": 1856, "Pretrain/Step Time": 8.543530905619264} +{"Pretrain/Learning Rate": 4.652576444826999e-05, "Pretrain/Loss": 2.1380977630615234, "Pretrain/Loss (Raw)": 2.057079792022705, "Pretrain/Step": 1857, "Pretrain/Step Time": 8.53501308336854} +{"Pretrain/Learning Rate": 4.652144565508959e-05, "Pretrain/Loss": 2.1403751373291016, "Pretrain/Loss (Raw)": 2.214613676071167, "Pretrain/Step": 1858, "Pretrain/Step Time": 8.539622580632567} +{"Pretrain/Learning Rate": 4.6517124379954655e-05, "Pretrain/Loss": 2.1390304565429688, "Pretrain/Loss (Raw)": 2.058004140853882, "Pretrain/Step": 1859, "Pretrain/Step Time": 8.541454836726189} +{"Pretrain/Learning Rate": 4.651280062336355e-05, "Pretrain/Loss": 2.1371662616729736, "Pretrain/Loss (Raw)": 2.2623064517974854, "Pretrain/Step": 1860, "Pretrain/Step Time": 8.537942573428154} +{"Pretrain/Learning Rate": 4.65084743858149e-05, "Pretrain/Loss": 2.134643793106079, "Pretrain/Loss (Raw)": 1.8720628023147583, "Pretrain/Step": 1861, "Pretrain/Step Time": 8.548680996522307} +{"Pretrain/Learning Rate": 4.6504145667807644e-05, "Pretrain/Loss": 2.135303020477295, "Pretrain/Loss (Raw)": 2.006558895111084, "Pretrain/Step": 1862, "Pretrain/Step Time": 8.540583554655313} +{"Pretrain/Learning Rate": 4.649981446984097e-05, "Pretrain/Loss": 2.135143756866455, "Pretrain/Loss (Raw)": 2.144009590148926, "Pretrain/Step": 1863, "Pretrain/Step Time": 8.539118839427829} +{"Pretrain/Learning Rate": 4.649548079241438e-05, "Pretrain/Loss": 2.1369457244873047, "Pretrain/Loss (Raw)": 2.275810480117798, "Pretrain/Step": 1864, "Pretrain/Step Time": 8.53563791885972} +{"Pretrain/Learning Rate": 4.649114463602766e-05, "Pretrain/Loss": 2.1372432708740234, "Pretrain/Loss (Raw)": 2.1370108127593994, "Pretrain/Step": 1865, "Pretrain/Step Time": 8.536577576771379} +{"Pretrain/Learning Rate": 4.648680600118087e-05, "Pretrain/Loss": 2.1354641914367676, "Pretrain/Loss (Raw)": 2.098367214202881, "Pretrain/Step": 1866, "Pretrain/Step Time": 8.53732599504292} +{"Pretrain/Learning Rate": 4.6482464888374365e-05, "Pretrain/Loss": 2.135711669921875, "Pretrain/Loss (Raw)": 2.305863857269287, "Pretrain/Step": 1867, "Pretrain/Step Time": 8.543953958898783} +{"Pretrain/Learning Rate": 4.6478121298108776e-05, "Pretrain/Loss": 2.1358509063720703, "Pretrain/Loss (Raw)": 2.1838364601135254, "Pretrain/Step": 1868, "Pretrain/Step Time": 8.542900502681732} +{"Pretrain/Learning Rate": 4.647377523088503e-05, "Pretrain/Loss": 2.138030529022217, "Pretrain/Loss (Raw)": 2.3693814277648926, "Pretrain/Step": 1869, "Pretrain/Step Time": 8.539054356515408} +{"Pretrain/Learning Rate": 4.6469426687204346e-05, "Pretrain/Loss": 2.1369004249572754, "Pretrain/Loss (Raw)": 2.0574069023132324, "Pretrain/Step": 1870, "Pretrain/Step Time": 8.53931249678135} +{"Pretrain/Learning Rate": 4.646507566756819e-05, "Pretrain/Loss": 2.1340887546539307, "Pretrain/Loss (Raw)": 2.0671231746673584, "Pretrain/Step": 1871, "Pretrain/Step Time": 8.54013261012733} +{"Pretrain/Learning Rate": 4.646072217247838e-05, "Pretrain/Loss": 2.138179302215576, "Pretrain/Loss (Raw)": 2.520914077758789, "Pretrain/Step": 1872, "Pretrain/Step Time": 8.54223370552063} +{"Pretrain/Learning Rate": 4.645636620243695e-05, "Pretrain/Loss": 2.136896848678589, "Pretrain/Loss (Raw)": 2.0354409217834473, "Pretrain/Step": 1873, "Pretrain/Step Time": 8.540102761238813} +{"Pretrain/Learning Rate": 4.645200775794628e-05, "Pretrain/Loss": 2.1346778869628906, "Pretrain/Loss (Raw)": 1.9097158908843994, "Pretrain/Step": 1874, "Pretrain/Step Time": 8.552870571613312} +{"Pretrain/Learning Rate": 4.6447646839508975e-05, "Pretrain/Loss": 2.1374340057373047, "Pretrain/Loss (Raw)": 2.619300127029419, "Pretrain/Step": 1875, "Pretrain/Step Time": 8.548879105597734} +{"Pretrain/Learning Rate": 4.6443283447627974e-05, "Pretrain/Loss": 2.1365392208099365, "Pretrain/Loss (Raw)": 2.084691047668457, "Pretrain/Step": 1876, "Pretrain/Step Time": 8.549321254715323} +{"Pretrain/Learning Rate": 4.643891758280649e-05, "Pretrain/Loss": 2.1371519565582275, "Pretrain/Loss (Raw)": 2.2128336429595947, "Pretrain/Step": 1877, "Pretrain/Step Time": 8.55336513184011} +{"Pretrain/Learning Rate": 4.6434549245548e-05, "Pretrain/Loss": 2.1365861892700195, "Pretrain/Loss (Raw)": 2.0431432723999023, "Pretrain/Step": 1878, "Pretrain/Step Time": 8.554236525669694} +{"Pretrain/Learning Rate": 4.643017843635629e-05, "Pretrain/Loss": 2.1360256671905518, "Pretrain/Loss (Raw)": 2.010641098022461, "Pretrain/Step": 1879, "Pretrain/Step Time": 8.551476426422596} +{"Pretrain/Learning Rate": 4.6425805155735416e-05, "Pretrain/Loss": 2.138087749481201, "Pretrain/Loss (Raw)": 2.376945734024048, "Pretrain/Step": 1880, "Pretrain/Step Time": 8.549681227654219} +{"Pretrain/Learning Rate": 4.642142940418973e-05, "Pretrain/Loss": 2.137212038040161, "Pretrain/Loss (Raw)": 2.092966079711914, "Pretrain/Step": 1881, "Pretrain/Step Time": 8.542876793071628} +{"Pretrain/Learning Rate": 4.641705118222387e-05, "Pretrain/Loss": 2.1370105743408203, "Pretrain/Loss (Raw)": 2.00465726852417, "Pretrain/Step": 1882, "Pretrain/Step Time": 8.549072988331318} +{"Pretrain/Learning Rate": 4.6412670490342747e-05, "Pretrain/Loss": 2.1347100734710693, "Pretrain/Loss (Raw)": 2.045638084411621, "Pretrain/Step": 1883, "Pretrain/Step Time": 8.547869933769107} +{"Pretrain/Learning Rate": 4.6408287329051556e-05, "Pretrain/Loss": 2.137340545654297, "Pretrain/Loss (Raw)": 2.2057082653045654, "Pretrain/Step": 1884, "Pretrain/Step Time": 8.549822943285108} +{"Pretrain/Learning Rate": 4.64039016988558e-05, "Pretrain/Loss": 2.1351165771484375, "Pretrain/Loss (Raw)": 2.050476312637329, "Pretrain/Step": 1885, "Pretrain/Step Time": 8.549353543668985} +{"Pretrain/Learning Rate": 4.639951360026123e-05, "Pretrain/Loss": 2.1343586444854736, "Pretrain/Loss (Raw)": 2.124039888381958, "Pretrain/Step": 1886, "Pretrain/Step Time": 8.554920893162489} +{"Pretrain/Learning Rate": 4.639512303377393e-05, "Pretrain/Loss": 2.135098934173584, "Pretrain/Loss (Raw)": 2.219865322113037, "Pretrain/Step": 1887, "Pretrain/Step Time": 8.558923842385411} +{"Pretrain/Learning Rate": 4.639072999990022e-05, "Pretrain/Loss": 2.1351523399353027, "Pretrain/Loss (Raw)": 2.0268425941467285, "Pretrain/Step": 1888, "Pretrain/Step Time": 8.557601185515523} +{"Pretrain/Learning Rate": 4.6386334499146724e-05, "Pretrain/Loss": 2.1339240074157715, "Pretrain/Loss (Raw)": 2.0641872882843018, "Pretrain/Step": 1889, "Pretrain/Step Time": 8.559429286047816} +{"Pretrain/Learning Rate": 4.638193653202035e-05, "Pretrain/Loss": 2.133852005004883, "Pretrain/Loss (Raw)": 2.222892999649048, "Pretrain/Step": 1890, "Pretrain/Step Time": 8.557689065113664} +{"Pretrain/Learning Rate": 4.6377536099028315e-05, "Pretrain/Loss": 2.1334524154663086, "Pretrain/Loss (Raw)": 2.1154091358184814, "Pretrain/Step": 1891, "Pretrain/Step Time": 8.557756716385484} +{"Pretrain/Learning Rate": 4.637313320067808e-05, "Pretrain/Loss": 2.1342391967773438, "Pretrain/Loss (Raw)": 2.1637673377990723, "Pretrain/Step": 1892, "Pretrain/Step Time": 8.556671718135476} +{"Pretrain/Learning Rate": 4.636872783747741e-05, "Pretrain/Loss": 2.134246826171875, "Pretrain/Loss (Raw)": 2.1042697429656982, "Pretrain/Step": 1893, "Pretrain/Step Time": 8.55659237317741} +{"Pretrain/Learning Rate": 4.636432000993435e-05, "Pretrain/Loss": 2.13571834564209, "Pretrain/Loss (Raw)": 2.2505407333374023, "Pretrain/Step": 1894, "Pretrain/Step Time": 8.559311682358384} +{"Pretrain/Learning Rate": 4.635990971855724e-05, "Pretrain/Loss": 2.136229991912842, "Pretrain/Loss (Raw)": 2.1249170303344727, "Pretrain/Step": 1895, "Pretrain/Step Time": 8.556037256494164} +{"Pretrain/Learning Rate": 4.6355496963854684e-05, "Pretrain/Loss": 2.1375813484191895, "Pretrain/Loss (Raw)": 2.2326712608337402, "Pretrain/Step": 1896, "Pretrain/Step Time": 8.559635229408741} +{"Pretrain/Learning Rate": 4.635108174633559e-05, "Pretrain/Loss": 2.139552593231201, "Pretrain/Loss (Raw)": 2.3777997493743896, "Pretrain/Step": 1897, "Pretrain/Step Time": 8.56781081110239} +{"Pretrain/Learning Rate": 4.634666406650914e-05, "Pretrain/Loss": 2.139934539794922, "Pretrain/Loss (Raw)": 2.127048969268799, "Pretrain/Step": 1898, "Pretrain/Step Time": 8.560232810676098} +{"Pretrain/Learning Rate": 4.63422439248848e-05, "Pretrain/Loss": 2.1396045684814453, "Pretrain/Loss (Raw)": 2.00957989692688, "Pretrain/Step": 1899, "Pretrain/Step Time": 8.556201266124845} +{"Pretrain/Learning Rate": 4.633782132197232e-05, "Pretrain/Loss": 2.1387906074523926, "Pretrain/Loss (Raw)": 2.0091240406036377, "Pretrain/Step": 1900, "Pretrain/Step Time": 8.558260217308998} +{"Pretrain/Learning Rate": 4.633339625828173e-05, "Pretrain/Loss": 2.139540195465088, "Pretrain/Loss (Raw)": 2.099369525909424, "Pretrain/Step": 1901, "Pretrain/Step Time": 8.557839402928948} +{"Pretrain/Learning Rate": 4.632896873432338e-05, "Pretrain/Loss": 2.1355080604553223, "Pretrain/Loss (Raw)": 2.0773143768310547, "Pretrain/Step": 1902, "Pretrain/Step Time": 8.55730328336358} +{"Pretrain/Learning Rate": 4.632453875060784e-05, "Pretrain/Loss": 2.135106086730957, "Pretrain/Loss (Raw)": 2.089700937271118, "Pretrain/Step": 1903, "Pretrain/Step Time": 8.565789926797152} +{"Pretrain/Learning Rate": 4.6320106307646e-05, "Pretrain/Loss": 2.132991313934326, "Pretrain/Loss (Raw)": 2.0023229122161865, "Pretrain/Step": 1904, "Pretrain/Step Time": 8.555635206401348} +{"Pretrain/Learning Rate": 4.6315671405949046e-05, "Pretrain/Loss": 2.1326794624328613, "Pretrain/Loss (Raw)": 1.9992761611938477, "Pretrain/Step": 1905, "Pretrain/Step Time": 8.558900233358145} +{"Pretrain/Learning Rate": 4.631123404602842e-05, "Pretrain/Loss": 2.131422281265259, "Pretrain/Loss (Raw)": 2.069904327392578, "Pretrain/Step": 1906, "Pretrain/Step Time": 8.554185383021832} +{"Pretrain/Learning Rate": 4.630679422839585e-05, "Pretrain/Loss": 2.1347999572753906, "Pretrain/Loss (Raw)": 2.3958582878112793, "Pretrain/Step": 1907, "Pretrain/Step Time": 8.556976545602083} +{"Pretrain/Learning Rate": 4.6302351953563385e-05, "Pretrain/Loss": 2.1378164291381836, "Pretrain/Loss (Raw)": 2.6188013553619385, "Pretrain/Step": 1908, "Pretrain/Step Time": 8.557444849982858} +{"Pretrain/Learning Rate": 4.629790722204331e-05, "Pretrain/Loss": 2.1381797790527344, "Pretrain/Loss (Raw)": 2.253091812133789, "Pretrain/Step": 1909, "Pretrain/Step Time": 8.563886247575283} +{"Pretrain/Learning Rate": 4.629346003434821e-05, "Pretrain/Loss": 2.137460231781006, "Pretrain/Loss (Raw)": 2.112757444381714, "Pretrain/Step": 1910, "Pretrain/Step Time": 8.550911827012897} +{"Pretrain/Learning Rate": 4.628901039099096e-05, "Pretrain/Loss": 2.1362533569335938, "Pretrain/Loss (Raw)": 2.1493775844573975, "Pretrain/Step": 1911, "Pretrain/Step Time": 8.549852320924401} +{"Pretrain/Learning Rate": 4.6284558292484724e-05, "Pretrain/Loss": 2.134432315826416, "Pretrain/Loss (Raw)": 2.015294075012207, "Pretrain/Step": 1912, "Pretrain/Step Time": 8.544877661392093} +{"Pretrain/Learning Rate": 4.628010373934292e-05, "Pretrain/Loss": 2.1369004249572754, "Pretrain/Loss (Raw)": 2.525803565979004, "Pretrain/Step": 1913, "Pretrain/Step Time": 8.544507367536426} +{"Pretrain/Learning Rate": 4.627564673207928e-05, "Pretrain/Loss": 2.1392202377319336, "Pretrain/Loss (Raw)": 2.2261972427368164, "Pretrain/Step": 1914, "Pretrain/Step Time": 8.543811788782477} +{"Pretrain/Learning Rate": 4.62711872712078e-05, "Pretrain/Loss": 2.137993812561035, "Pretrain/Loss (Raw)": 2.125779628753662, "Pretrain/Step": 1915, "Pretrain/Step Time": 8.54525681771338} +{"Pretrain/Learning Rate": 4.626672535724278e-05, "Pretrain/Loss": 2.136441707611084, "Pretrain/Loss (Raw)": 1.9224915504455566, "Pretrain/Step": 1916, "Pretrain/Step Time": 8.541567677631974} +{"Pretrain/Learning Rate": 4.626226099069878e-05, "Pretrain/Loss": 2.138380527496338, "Pretrain/Loss (Raw)": 2.300027370452881, "Pretrain/Step": 1917, "Pretrain/Step Time": 8.546874672174454} +{"Pretrain/Learning Rate": 4.625779417209065e-05, "Pretrain/Loss": 2.139308214187622, "Pretrain/Loss (Raw)": 2.1533679962158203, "Pretrain/Step": 1918, "Pretrain/Step Time": 8.543738694861531} +{"Pretrain/Learning Rate": 4.625332490193352e-05, "Pretrain/Loss": 2.139591693878174, "Pretrain/Loss (Raw)": 2.226874828338623, "Pretrain/Step": 1919, "Pretrain/Step Time": 8.544079821556807} +{"Pretrain/Learning Rate": 4.624885318074282e-05, "Pretrain/Loss": 2.1418581008911133, "Pretrain/Loss (Raw)": 2.527156352996826, "Pretrain/Step": 1920, "Pretrain/Step Time": 8.543255435302854} +{"Pretrain/Learning Rate": 4.624437900903424e-05, "Pretrain/Loss": 2.1430575847625732, "Pretrain/Loss (Raw)": 2.1632518768310547, "Pretrain/Step": 1921, "Pretrain/Step Time": 8.549556225538254} +{"Pretrain/Learning Rate": 4.623990238732376e-05, "Pretrain/Loss": 2.141981840133667, "Pretrain/Loss (Raw)": 1.9942091703414917, "Pretrain/Step": 1922, "Pretrain/Step Time": 8.547264646738768} +{"Pretrain/Learning Rate": 4.6235423316127655e-05, "Pretrain/Loss": 2.141314744949341, "Pretrain/Loss (Raw)": 2.1616291999816895, "Pretrain/Step": 1923, "Pretrain/Step Time": 8.548716850578785} +{"Pretrain/Learning Rate": 4.623094179596248e-05, "Pretrain/Loss": 2.1404333114624023, "Pretrain/Loss (Raw)": 2.036184787750244, "Pretrain/Step": 1924, "Pretrain/Step Time": 8.542369354516268} +{"Pretrain/Learning Rate": 4.622645782734504e-05, "Pretrain/Loss": 2.140171527862549, "Pretrain/Loss (Raw)": 2.0753018856048584, "Pretrain/Step": 1925, "Pretrain/Step Time": 8.545962005853653} +{"Pretrain/Learning Rate": 4.6221971410792466e-05, "Pretrain/Loss": 2.1405935287475586, "Pretrain/Loss (Raw)": 2.1002213954925537, "Pretrain/Step": 1926, "Pretrain/Step Time": 8.541618375107646} +{"Pretrain/Learning Rate": 4.621748254682214e-05, "Pretrain/Loss": 2.1406447887420654, "Pretrain/Loss (Raw)": 2.1036550998687744, "Pretrain/Step": 1927, "Pretrain/Step Time": 8.553856581449509} +{"Pretrain/Learning Rate": 4.621299123595176e-05, "Pretrain/Loss": 2.1413936614990234, "Pretrain/Loss (Raw)": 2.0404465198516846, "Pretrain/Step": 1928, "Pretrain/Step Time": 8.545459562912583} +{"Pretrain/Learning Rate": 4.620849747869926e-05, "Pretrain/Loss": 2.1415224075317383, "Pretrain/Loss (Raw)": 2.067077398300171, "Pretrain/Step": 1929, "Pretrain/Step Time": 8.548829523846507} +{"Pretrain/Learning Rate": 4.6204001275582904e-05, "Pretrain/Loss": 2.1407785415649414, "Pretrain/Loss (Raw)": 2.054489850997925, "Pretrain/Step": 1930, "Pretrain/Step Time": 8.544132001698017} +{"Pretrain/Learning Rate": 4.61995026271212e-05, "Pretrain/Loss": 2.139807939529419, "Pretrain/Loss (Raw)": 2.02116060256958, "Pretrain/Step": 1931, "Pretrain/Step Time": 8.546763818711042} +{"Pretrain/Learning Rate": 4.619500153383296e-05, "Pretrain/Loss": 2.139591932296753, "Pretrain/Loss (Raw)": 2.303027868270874, "Pretrain/Step": 1932, "Pretrain/Step Time": 8.545450100675225} +{"Pretrain/Learning Rate": 4.619049799623726e-05, "Pretrain/Loss": 2.139681339263916, "Pretrain/Loss (Raw)": 2.152332067489624, "Pretrain/Step": 1933, "Pretrain/Step Time": 8.55245941132307} +{"Pretrain/Learning Rate": 4.618599201485349e-05, "Pretrain/Loss": 2.13681697845459, "Pretrain/Loss (Raw)": 2.0090723037719727, "Pretrain/Step": 1934, "Pretrain/Step Time": 8.543325474485755} +{"Pretrain/Learning Rate": 4.618148359020128e-05, "Pretrain/Loss": 2.137594699859619, "Pretrain/Loss (Raw)": 2.1310646533966064, "Pretrain/Step": 1935, "Pretrain/Step Time": 8.54411968588829} +{"Pretrain/Learning Rate": 4.617697272280057e-05, "Pretrain/Loss": 2.137266159057617, "Pretrain/Loss (Raw)": 2.3688199520111084, "Pretrain/Step": 1936, "Pretrain/Step Time": 8.535688674077392} +{"Pretrain/Learning Rate": 4.6172459413171586e-05, "Pretrain/Loss": 2.137176990509033, "Pretrain/Loss (Raw)": 2.1892104148864746, "Pretrain/Step": 1937, "Pretrain/Step Time": 8.534422617405653} +{"Pretrain/Learning Rate": 4.616794366183481e-05, "Pretrain/Loss": 2.1380577087402344, "Pretrain/Loss (Raw)": 2.2064614295959473, "Pretrain/Step": 1938, "Pretrain/Step Time": 8.535862404853106} +{"Pretrain/Learning Rate": 4.616342546931102e-05, "Pretrain/Loss": 2.1374268531799316, "Pretrain/Loss (Raw)": 2.0289559364318848, "Pretrain/Step": 1939, "Pretrain/Step Time": 8.53860579431057} +{"Pretrain/Learning Rate": 4.6158904836121286e-05, "Pretrain/Loss": 2.1373324394226074, "Pretrain/Loss (Raw)": 2.2608628273010254, "Pretrain/Step": 1940, "Pretrain/Step Time": 8.533349055796862} +{"Pretrain/Learning Rate": 4.6154381762786936e-05, "Pretrain/Loss": 2.1402487754821777, "Pretrain/Loss (Raw)": 2.1929235458374023, "Pretrain/Step": 1941, "Pretrain/Step Time": 8.532332649454474} +{"Pretrain/Learning Rate": 4.6149856249829606e-05, "Pretrain/Loss": 2.1395254135131836, "Pretrain/Loss (Raw)": 2.0297887325286865, "Pretrain/Step": 1942, "Pretrain/Step Time": 8.527531391009688} +{"Pretrain/Learning Rate": 4.6145328297771183e-05, "Pretrain/Loss": 2.1389176845550537, "Pretrain/Loss (Raw)": 2.0506882667541504, "Pretrain/Step": 1943, "Pretrain/Step Time": 8.526365185156465} +{"Pretrain/Learning Rate": 4.614079790713387e-05, "Pretrain/Loss": 2.1394214630126953, "Pretrain/Loss (Raw)": 2.1951446533203125, "Pretrain/Step": 1944, "Pretrain/Step Time": 8.533745646476746} +{"Pretrain/Learning Rate": 4.613626507844012e-05, "Pretrain/Loss": 2.141152858734131, "Pretrain/Loss (Raw)": 2.260369062423706, "Pretrain/Step": 1945, "Pretrain/Step Time": 8.531227465718985} +{"Pretrain/Learning Rate": 4.613172981221268e-05, "Pretrain/Loss": 2.143819808959961, "Pretrain/Loss (Raw)": 2.373577356338501, "Pretrain/Step": 1946, "Pretrain/Step Time": 8.531606703996658} +{"Pretrain/Learning Rate": 4.612719210897459e-05, "Pretrain/Loss": 2.1434378623962402, "Pretrain/Loss (Raw)": 2.1247775554656982, "Pretrain/Step": 1947, "Pretrain/Step Time": 8.540026411414146} +{"Pretrain/Learning Rate": 4.612265196924914e-05, "Pretrain/Loss": 2.1450002193450928, "Pretrain/Loss (Raw)": 2.0381226539611816, "Pretrain/Step": 1948, "Pretrain/Step Time": 8.532026262953877} +{"Pretrain/Learning Rate": 4.611810939355995e-05, "Pretrain/Loss": 2.1439592838287354, "Pretrain/Loss (Raw)": 2.1454217433929443, "Pretrain/Step": 1949, "Pretrain/Step Time": 8.539873570203781} +{"Pretrain/Learning Rate": 4.611356438243085e-05, "Pretrain/Loss": 2.1429572105407715, "Pretrain/Loss (Raw)": 2.1134395599365234, "Pretrain/Step": 1950, "Pretrain/Step Time": 8.538914879783988} +{"Pretrain/Learning Rate": 4.610901693638603e-05, "Pretrain/Loss": 2.142620086669922, "Pretrain/Loss (Raw)": 2.0284996032714844, "Pretrain/Step": 1951, "Pretrain/Step Time": 8.54339787364006} +{"Pretrain/Learning Rate": 4.610446705594991e-05, "Pretrain/Loss": 2.142392873764038, "Pretrain/Loss (Raw)": 2.1340551376342773, "Pretrain/Step": 1952, "Pretrain/Step Time": 8.543717475607991} +{"Pretrain/Learning Rate": 4.6099914741647196e-05, "Pretrain/Loss": 2.141892433166504, "Pretrain/Loss (Raw)": 2.243244171142578, "Pretrain/Step": 1953, "Pretrain/Step Time": 8.54320327937603} +{"Pretrain/Learning Rate": 4.609535999400289e-05, "Pretrain/Loss": 2.1433658599853516, "Pretrain/Loss (Raw)": 2.206230878829956, "Pretrain/Step": 1954, "Pretrain/Step Time": 8.54289992339909} +{"Pretrain/Learning Rate": 4.6090802813542255e-05, "Pretrain/Loss": 2.1421408653259277, "Pretrain/Loss (Raw)": 2.218247175216675, "Pretrain/Step": 1955, "Pretrain/Step Time": 8.542799644172192} +{"Pretrain/Learning Rate": 4.608624320079087e-05, "Pretrain/Loss": 2.1418473720550537, "Pretrain/Loss (Raw)": 2.2040295600891113, "Pretrain/Step": 1956, "Pretrain/Step Time": 8.542799247428775} +{"Pretrain/Learning Rate": 4.608168115627455e-05, "Pretrain/Loss": 2.1433348655700684, "Pretrain/Loss (Raw)": 2.305457353591919, "Pretrain/Step": 1957, "Pretrain/Step Time": 8.543405329808593} +{"Pretrain/Learning Rate": 4.607711668051942e-05, "Pretrain/Loss": 2.144195556640625, "Pretrain/Loss (Raw)": 2.2436928749084473, "Pretrain/Step": 1958, "Pretrain/Step Time": 8.544273905456066} +{"Pretrain/Learning Rate": 4.6072549774051874e-05, "Pretrain/Loss": 2.1445682048797607, "Pretrain/Loss (Raw)": 2.2803287506103516, "Pretrain/Step": 1959, "Pretrain/Step Time": 8.54333620890975} +{"Pretrain/Learning Rate": 4.60679804373986e-05, "Pretrain/Loss": 2.1442694664001465, "Pretrain/Loss (Raw)": 2.111452102661133, "Pretrain/Step": 1960, "Pretrain/Step Time": 8.55434251204133} +{"Pretrain/Learning Rate": 4.606340867108653e-05, "Pretrain/Loss": 2.1429483890533447, "Pretrain/Loss (Raw)": 2.141618490219116, "Pretrain/Step": 1961, "Pretrain/Step Time": 8.555601943284273} +{"Pretrain/Learning Rate": 4.605883447564293e-05, "Pretrain/Loss": 2.1430468559265137, "Pretrain/Loss (Raw)": 2.0686802864074707, "Pretrain/Step": 1962, "Pretrain/Step Time": 8.555543104186654} +{"Pretrain/Learning Rate": 4.6054257851595303e-05, "Pretrain/Loss": 2.1446547508239746, "Pretrain/Loss (Raw)": 2.1817944049835205, "Pretrain/Step": 1963, "Pretrain/Step Time": 8.552188642323017} +{"Pretrain/Learning Rate": 4.604967879947145e-05, "Pretrain/Loss": 2.146357536315918, "Pretrain/Loss (Raw)": 2.2289986610412598, "Pretrain/Step": 1964, "Pretrain/Step Time": 8.559875760227442} +{"Pretrain/Learning Rate": 4.6045097319799447e-05, "Pretrain/Loss": 2.1430139541625977, "Pretrain/Loss (Raw)": 2.0099709033966064, "Pretrain/Step": 1965, "Pretrain/Step Time": 8.565974807366729} +{"Pretrain/Learning Rate": 4.6040513413107655e-05, "Pretrain/Loss": 2.1429343223571777, "Pretrain/Loss (Raw)": 2.155547857284546, "Pretrain/Step": 1966, "Pretrain/Step Time": 8.559670241549611} +{"Pretrain/Learning Rate": 4.603592707992471e-05, "Pretrain/Loss": 2.1443593502044678, "Pretrain/Loss (Raw)": 2.36514949798584, "Pretrain/Step": 1967, "Pretrain/Step Time": 8.562603628262877} +{"Pretrain/Learning Rate": 4.6031338320779534e-05, "Pretrain/Loss": 2.1448516845703125, "Pretrain/Loss (Raw)": 2.172191858291626, "Pretrain/Step": 1968, "Pretrain/Step Time": 8.562572248280048} +{"Pretrain/Learning Rate": 4.602674713620131e-05, "Pretrain/Loss": 2.1436867713928223, "Pretrain/Loss (Raw)": 2.077191114425659, "Pretrain/Step": 1969, "Pretrain/Step Time": 8.569246931001544} +{"Pretrain/Learning Rate": 4.6022153526719536e-05, "Pretrain/Loss": 2.144139051437378, "Pretrain/Loss (Raw)": 2.2112772464752197, "Pretrain/Step": 1970, "Pretrain/Step Time": 8.565041664987803} +{"Pretrain/Learning Rate": 4.601755749286395e-05, "Pretrain/Loss": 2.1425623893737793, "Pretrain/Loss (Raw)": 1.9307352304458618, "Pretrain/Step": 1971, "Pretrain/Step Time": 8.567415239289403} +{"Pretrain/Learning Rate": 4.6012959035164596e-05, "Pretrain/Loss": 2.1427462100982666, "Pretrain/Loss (Raw)": 2.0565531253814697, "Pretrain/Step": 1972, "Pretrain/Step Time": 8.561378125101328} +{"Pretrain/Learning Rate": 4.6008358154151794e-05, "Pretrain/Loss": 2.1431102752685547, "Pretrain/Loss (Raw)": 2.088538885116577, "Pretrain/Step": 1973, "Pretrain/Step Time": 8.553331749513745} +{"Pretrain/Learning Rate": 4.600375485035613e-05, "Pretrain/Loss": 2.1446547508239746, "Pretrain/Loss (Raw)": 2.101367473602295, "Pretrain/Step": 1974, "Pretrain/Step Time": 8.558384973555803} +{"Pretrain/Learning Rate": 4.599914912430849e-05, "Pretrain/Loss": 2.1435742378234863, "Pretrain/Loss (Raw)": 1.9678752422332764, "Pretrain/Step": 1975, "Pretrain/Step Time": 8.55391701683402} +{"Pretrain/Learning Rate": 4.5994540976540013e-05, "Pretrain/Loss": 2.143455982208252, "Pretrain/Loss (Raw)": 2.177359104156494, "Pretrain/Step": 1976, "Pretrain/Step Time": 8.558611260727048} +{"Pretrain/Learning Rate": 4.598993040758215e-05, "Pretrain/Loss": 2.144721269607544, "Pretrain/Loss (Raw)": 2.218492269515991, "Pretrain/Step": 1977, "Pretrain/Step Time": 8.55928673222661} +{"Pretrain/Learning Rate": 4.59853174179666e-05, "Pretrain/Loss": 2.1433684825897217, "Pretrain/Loss (Raw)": 1.9884034395217896, "Pretrain/Step": 1978, "Pretrain/Step Time": 8.557029349729419} +{"Pretrain/Learning Rate": 4.5980702008225365e-05, "Pretrain/Loss": 2.1436400413513184, "Pretrain/Loss (Raw)": 2.022627830505371, "Pretrain/Step": 1979, "Pretrain/Step Time": 8.558407558128238} +{"Pretrain/Learning Rate": 4.59760841788907e-05, "Pretrain/Loss": 2.1446783542633057, "Pretrain/Loss (Raw)": 2.099864959716797, "Pretrain/Step": 1980, "Pretrain/Step Time": 8.561026787385345} +{"Pretrain/Learning Rate": 4.597146393049517e-05, "Pretrain/Loss": 2.144186019897461, "Pretrain/Loss (Raw)": 2.1167337894439697, "Pretrain/Step": 1981, "Pretrain/Step Time": 8.563732339069247} +{"Pretrain/Learning Rate": 4.59668412635716e-05, "Pretrain/Loss": 2.143113136291504, "Pretrain/Loss (Raw)": 1.9582083225250244, "Pretrain/Step": 1982, "Pretrain/Step Time": 8.565022882074118} +{"Pretrain/Learning Rate": 4.5962216178653095e-05, "Pretrain/Loss": 2.144981861114502, "Pretrain/Loss (Raw)": 2.106383800506592, "Pretrain/Step": 1983, "Pretrain/Step Time": 8.559654336422682} +{"Pretrain/Learning Rate": 4.5957588676273046e-05, "Pretrain/Loss": 2.14825439453125, "Pretrain/Loss (Raw)": 2.177827835083008, "Pretrain/Step": 1984, "Pretrain/Step Time": 8.559684664011002} +{"Pretrain/Learning Rate": 4.595295875696511e-05, "Pretrain/Loss": 2.1484620571136475, "Pretrain/Loss (Raw)": 2.0836925506591797, "Pretrain/Step": 1985, "Pretrain/Step Time": 8.564414352178574} +{"Pretrain/Learning Rate": 4.5948326421263244e-05, "Pretrain/Loss": 2.1486339569091797, "Pretrain/Loss (Raw)": 2.2365963459014893, "Pretrain/Step": 1986, "Pretrain/Step Time": 8.563670115545392} +{"Pretrain/Learning Rate": 4.5943691669701654e-05, "Pretrain/Loss": 2.150196075439453, "Pretrain/Loss (Raw)": 2.257982015609741, "Pretrain/Step": 1987, "Pretrain/Step Time": 8.5623446572572} +{"Pretrain/Learning Rate": 4.593905450281486e-05, "Pretrain/Loss": 2.1493775844573975, "Pretrain/Loss (Raw)": 2.1575114727020264, "Pretrain/Step": 1988, "Pretrain/Step Time": 8.574751632288098} +{"Pretrain/Learning Rate": 4.593441492113763e-05, "Pretrain/Loss": 2.1501924991607666, "Pretrain/Loss (Raw)": 1.976380705833435, "Pretrain/Step": 1989, "Pretrain/Step Time": 8.567615559324622} +{"Pretrain/Learning Rate": 4.5929772925205014e-05, "Pretrain/Loss": 2.1497645378112793, "Pretrain/Loss (Raw)": 1.9517725706100464, "Pretrain/Step": 1990, "Pretrain/Step Time": 8.570246767252684} +{"Pretrain/Learning Rate": 4.592512851555237e-05, "Pretrain/Loss": 2.150063991546631, "Pretrain/Loss (Raw)": 2.182337760925293, "Pretrain/Step": 1991, "Pretrain/Step Time": 8.574227575212717} +{"Pretrain/Learning Rate": 4.592048169271531e-05, "Pretrain/Loss": 2.1476101875305176, "Pretrain/Loss (Raw)": 1.9617294073104858, "Pretrain/Step": 1992, "Pretrain/Step Time": 8.572107626125216} +{"Pretrain/Learning Rate": 4.591583245722971e-05, "Pretrain/Loss": 2.147193431854248, "Pretrain/Loss (Raw)": 2.083686113357544, "Pretrain/Step": 1993, "Pretrain/Step Time": 8.575909508392215} +{"Pretrain/Learning Rate": 4.591118080963176e-05, "Pretrain/Loss": 2.147350311279297, "Pretrain/Loss (Raw)": 2.1184308528900146, "Pretrain/Step": 1994, "Pretrain/Step Time": 8.582794854417443} +{"Pretrain/Learning Rate": 4.590652675045789e-05, "Pretrain/Loss": 2.1456289291381836, "Pretrain/Loss (Raw)": 2.0855555534362793, "Pretrain/Step": 1995, "Pretrain/Step Time": 8.57723380997777} +{"Pretrain/Learning Rate": 4.5901870280244855e-05, "Pretrain/Loss": 2.1454710960388184, "Pretrain/Loss (Raw)": 2.163590669631958, "Pretrain/Step": 1996, "Pretrain/Step Time": 8.576195565983653} +{"Pretrain/Learning Rate": 4.589721139952964e-05, "Pretrain/Loss": 2.144648313522339, "Pretrain/Loss (Raw)": 2.2640862464904785, "Pretrain/Step": 1997, "Pretrain/Step Time": 8.575414974242449} +{"Pretrain/Learning Rate": 4.589255010884953e-05, "Pretrain/Loss": 2.145536422729492, "Pretrain/Loss (Raw)": 2.171050786972046, "Pretrain/Step": 1998, "Pretrain/Step Time": 8.572730742394924} +{"Pretrain/Learning Rate": 4.58878864087421e-05, "Pretrain/Loss": 2.146294593811035, "Pretrain/Loss (Raw)": 2.1642098426818848, "Pretrain/Step": 1999, "Pretrain/Step Time": 8.569964427500963} +{"Pretrain/Learning Rate": 4.5883220299745176e-05, "Pretrain/Loss": 2.144120216369629, "Pretrain/Loss (Raw)": 2.24259614944458, "Pretrain/Step": 2000, "Pretrain/Step Time": 8.572537433356047} +{"Pretrain/Learning Rate": 4.587855178239689e-05, "Pretrain/Loss": 2.1454689502716064, "Pretrain/Loss (Raw)": 2.2080700397491455, "Pretrain/Step": 2001, "Pretrain/Step Time": 8.57182395644486} +{"Pretrain/Learning Rate": 4.587388085723562e-05, "Pretrain/Loss": 2.146973133087158, "Pretrain/Loss (Raw)": 2.102222204208374, "Pretrain/Step": 2002, "Pretrain/Step Time": 8.55812842398882} +{"Pretrain/Learning Rate": 4.586920752480006e-05, "Pretrain/Loss": 2.1428074836730957, "Pretrain/Loss (Raw)": 2.0861337184906006, "Pretrain/Step": 2003, "Pretrain/Step Time": 8.553991198539734} +{"Pretrain/Learning Rate": 4.5864531785629136e-05, "Pretrain/Loss": 2.142970561981201, "Pretrain/Loss (Raw)": 2.1055150032043457, "Pretrain/Step": 2004, "Pretrain/Step Time": 8.555130643770099} +{"Pretrain/Learning Rate": 4.5859853640262104e-05, "Pretrain/Loss": 2.142141342163086, "Pretrain/Loss (Raw)": 2.1067168712615967, "Pretrain/Step": 2005, "Pretrain/Step Time": 8.557603687047958} +{"Pretrain/Learning Rate": 4.5855173089238445e-05, "Pretrain/Loss": 2.1418824195861816, "Pretrain/Loss (Raw)": 2.0100038051605225, "Pretrain/Step": 2006, "Pretrain/Step Time": 8.558292083442211} +{"Pretrain/Learning Rate": 4.5850490133097957e-05, "Pretrain/Loss": 2.142918586730957, "Pretrain/Loss (Raw)": 2.143272638320923, "Pretrain/Step": 2007, "Pretrain/Step Time": 8.555974250659347} +{"Pretrain/Learning Rate": 4.584580477238069e-05, "Pretrain/Loss": 2.142000675201416, "Pretrain/Loss (Raw)": 2.259462833404541, "Pretrain/Step": 2008, "Pretrain/Step Time": 8.55630936846137} +{"Pretrain/Learning Rate": 4.5841117007627e-05, "Pretrain/Loss": 2.142568349838257, "Pretrain/Loss (Raw)": 2.1656317710876465, "Pretrain/Step": 2009, "Pretrain/Step Time": 8.555670352652669} +{"Pretrain/Learning Rate": 4.583642683937748e-05, "Pretrain/Loss": 2.1434249877929688, "Pretrain/Loss (Raw)": 2.114286184310913, "Pretrain/Step": 2010, "Pretrain/Step Time": 8.553006241098046} +{"Pretrain/Learning Rate": 4.583173426817304e-05, "Pretrain/Loss": 2.1441588401794434, "Pretrain/Loss (Raw)": 2.1396162509918213, "Pretrain/Step": 2011, "Pretrain/Step Time": 8.557386089116335} +{"Pretrain/Learning Rate": 4.5827039294554833e-05, "Pretrain/Loss": 2.1434578895568848, "Pretrain/Loss (Raw)": 2.1159305572509766, "Pretrain/Step": 2012, "Pretrain/Step Time": 8.558881128206849} +{"Pretrain/Learning Rate": 4.582234191906432e-05, "Pretrain/Loss": 2.1441149711608887, "Pretrain/Loss (Raw)": 2.13460373878479, "Pretrain/Step": 2013, "Pretrain/Step Time": 8.554055087268353} +{"Pretrain/Learning Rate": 4.581764214224322e-05, "Pretrain/Loss": 2.14420223236084, "Pretrain/Loss (Raw)": 2.1351969242095947, "Pretrain/Step": 2014, "Pretrain/Step Time": 8.547963635995984} +{"Pretrain/Learning Rate": 4.581293996463353e-05, "Pretrain/Loss": 2.142266273498535, "Pretrain/Loss (Raw)": 1.9720783233642578, "Pretrain/Step": 2015, "Pretrain/Step Time": 8.541771536692977} +{"Pretrain/Learning Rate": 4.580823538677753e-05, "Pretrain/Loss": 2.142230987548828, "Pretrain/Loss (Raw)": 2.0223286151885986, "Pretrain/Step": 2016, "Pretrain/Step Time": 8.545408437028527} +{"Pretrain/Learning Rate": 4.580352840921777e-05, "Pretrain/Loss": 2.141594886779785, "Pretrain/Loss (Raw)": 1.9827646017074585, "Pretrain/Step": 2017, "Pretrain/Step Time": 8.542873049154878} +{"Pretrain/Learning Rate": 4.579881903249709e-05, "Pretrain/Loss": 2.141676187515259, "Pretrain/Loss (Raw)": 2.2333149909973145, "Pretrain/Step": 2018, "Pretrain/Step Time": 8.544978182762861} +{"Pretrain/Learning Rate": 4.5794107257158595e-05, "Pretrain/Loss": 2.141812324523926, "Pretrain/Loss (Raw)": 2.1328155994415283, "Pretrain/Step": 2019, "Pretrain/Step Time": 8.54548041895032} +{"Pretrain/Learning Rate": 4.578939308374566e-05, "Pretrain/Loss": 2.141909599304199, "Pretrain/Loss (Raw)": 2.17622447013855, "Pretrain/Step": 2020, "Pretrain/Step Time": 8.54205404408276} +{"Pretrain/Learning Rate": 4.578467651280195e-05, "Pretrain/Loss": 2.1428890228271484, "Pretrain/Loss (Raw)": 2.229609727859497, "Pretrain/Step": 2021, "Pretrain/Step Time": 8.543525150045753} +{"Pretrain/Learning Rate": 4.57799575448714e-05, "Pretrain/Loss": 2.142371416091919, "Pretrain/Loss (Raw)": 2.1843109130859375, "Pretrain/Step": 2022, "Pretrain/Step Time": 8.543256500735879} +{"Pretrain/Learning Rate": 4.5775236180498235e-05, "Pretrain/Loss": 2.142916679382324, "Pretrain/Loss (Raw)": 2.194719076156616, "Pretrain/Step": 2023, "Pretrain/Step Time": 8.550331525504589} +{"Pretrain/Learning Rate": 4.5770512420226934e-05, "Pretrain/Loss": 2.1411561965942383, "Pretrain/Loss (Raw)": 2.007288932800293, "Pretrain/Step": 2024, "Pretrain/Step Time": 8.548420699313283} +{"Pretrain/Learning Rate": 4.5765786264602274e-05, "Pretrain/Loss": 2.139669179916382, "Pretrain/Loss (Raw)": 2.1874911785125732, "Pretrain/Step": 2025, "Pretrain/Step Time": 8.541402479633689} +{"Pretrain/Learning Rate": 4.5761057714169284e-05, "Pretrain/Loss": 2.1409664154052734, "Pretrain/Loss (Raw)": 2.293091297149658, "Pretrain/Step": 2026, "Pretrain/Step Time": 8.541612926870584} +{"Pretrain/Learning Rate": 4.575632676947329e-05, "Pretrain/Loss": 2.1422548294067383, "Pretrain/Loss (Raw)": 2.1744937896728516, "Pretrain/Step": 2027, "Pretrain/Step Time": 8.54279369302094} +{"Pretrain/Learning Rate": 4.575159343105988e-05, "Pretrain/Loss": 2.1430959701538086, "Pretrain/Loss (Raw)": 2.1167938709259033, "Pretrain/Step": 2028, "Pretrain/Step Time": 8.542340196669102} +{"Pretrain/Learning Rate": 4.5746857699474946e-05, "Pretrain/Loss": 2.1426572799682617, "Pretrain/Loss (Raw)": 2.0431885719299316, "Pretrain/Step": 2029, "Pretrain/Step Time": 8.544160036370158} +{"Pretrain/Learning Rate": 4.574211957526461e-05, "Pretrain/Loss": 2.144016981124878, "Pretrain/Loss (Raw)": 2.2513809204101562, "Pretrain/Step": 2030, "Pretrain/Step Time": 8.545020245015621} +{"Pretrain/Learning Rate": 4.57373790589753e-05, "Pretrain/Loss": 2.1451406478881836, "Pretrain/Loss (Raw)": 2.2335166931152344, "Pretrain/Step": 2031, "Pretrain/Step Time": 8.539310054853559} +{"Pretrain/Learning Rate": 4.573263615115372e-05, "Pretrain/Loss": 2.1458487510681152, "Pretrain/Loss (Raw)": 2.0929765701293945, "Pretrain/Step": 2032, "Pretrain/Step Time": 8.544887389987707} +{"Pretrain/Learning Rate": 4.572789085234686e-05, "Pretrain/Loss": 2.1471102237701416, "Pretrain/Loss (Raw)": 2.160737991333008, "Pretrain/Step": 2033, "Pretrain/Step Time": 8.542786862701178} +{"Pretrain/Learning Rate": 4.5723143163101934e-05, "Pretrain/Loss": 2.1462059020996094, "Pretrain/Loss (Raw)": 1.9541668891906738, "Pretrain/Step": 2034, "Pretrain/Step Time": 8.54436626471579} +{"Pretrain/Learning Rate": 4.571839308396649e-05, "Pretrain/Loss": 2.1445152759552, "Pretrain/Loss (Raw)": 2.1794257164001465, "Pretrain/Step": 2035, "Pretrain/Step Time": 8.544967422261834} +{"Pretrain/Learning Rate": 4.571364061548834e-05, "Pretrain/Loss": 2.141098976135254, "Pretrain/Loss (Raw)": 2.181542158126831, "Pretrain/Step": 2036, "Pretrain/Step Time": 8.539503287523985} +{"Pretrain/Learning Rate": 4.5708885758215543e-05, "Pretrain/Loss": 2.139723300933838, "Pretrain/Loss (Raw)": 2.076996326446533, "Pretrain/Step": 2037, "Pretrain/Step Time": 8.547061670571566} +{"Pretrain/Learning Rate": 4.570412851269645e-05, "Pretrain/Loss": 2.1398842334747314, "Pretrain/Loss (Raw)": 2.133356809616089, "Pretrain/Step": 2038, "Pretrain/Step Time": 8.546409605070949} +{"Pretrain/Learning Rate": 4.56993688794797e-05, "Pretrain/Loss": 2.1399693489074707, "Pretrain/Loss (Raw)": 2.1602683067321777, "Pretrain/Step": 2039, "Pretrain/Step Time": 8.55244573391974} +{"Pretrain/Learning Rate": 4.5694606859114196e-05, "Pretrain/Loss": 2.140043020248413, "Pretrain/Loss (Raw)": 2.024714231491089, "Pretrain/Step": 2040, "Pretrain/Step Time": 8.551967564970255} +{"Pretrain/Learning Rate": 4.5689842452149114e-05, "Pretrain/Loss": 2.135859966278076, "Pretrain/Loss (Raw)": 1.9903943538665771, "Pretrain/Step": 2041, "Pretrain/Step Time": 8.553562259301543} +{"Pretrain/Learning Rate": 4.56850756591339e-05, "Pretrain/Loss": 2.135253667831421, "Pretrain/Loss (Raw)": 2.148592472076416, "Pretrain/Step": 2042, "Pretrain/Step Time": 8.554266696795821} +{"Pretrain/Learning Rate": 4.56803064806183e-05, "Pretrain/Loss": 2.134964942932129, "Pretrain/Loss (Raw)": 2.0888147354125977, "Pretrain/Step": 2043, "Pretrain/Step Time": 8.56073609367013} +{"Pretrain/Learning Rate": 4.567553491715229e-05, "Pretrain/Loss": 2.135960817337036, "Pretrain/Loss (Raw)": 2.04996395111084, "Pretrain/Step": 2044, "Pretrain/Step Time": 8.557888237759471} +{"Pretrain/Learning Rate": 4.567076096928618e-05, "Pretrain/Loss": 2.134392499923706, "Pretrain/Loss (Raw)": 2.0992729663848877, "Pretrain/Step": 2045, "Pretrain/Step Time": 8.559796836227179} +{"Pretrain/Learning Rate": 4.566598463757051e-05, "Pretrain/Loss": 2.1347403526306152, "Pretrain/Loss (Raw)": 2.1978919506073, "Pretrain/Step": 2046, "Pretrain/Step Time": 8.564329754561186} +{"Pretrain/Learning Rate": 4.56612059225561e-05, "Pretrain/Loss": 2.1335225105285645, "Pretrain/Loss (Raw)": 2.0709855556488037, "Pretrain/Step": 2047, "Pretrain/Step Time": 8.565516740083694} +{"Pretrain/Learning Rate": 4.565642482479408e-05, "Pretrain/Loss": 2.1321234703063965, "Pretrain/Loss (Raw)": 2.3481152057647705, "Pretrain/Step": 2048, "Pretrain/Step Time": 8.568989124149084} +{"Pretrain/Learning Rate": 4.565164134483581e-05, "Pretrain/Loss": 2.133216619491577, "Pretrain/Loss (Raw)": 2.3031649589538574, "Pretrain/Step": 2049, "Pretrain/Step Time": 8.564572039991617} +{"Pretrain/Learning Rate": 4.5646855483232935e-05, "Pretrain/Loss": 2.135626792907715, "Pretrain/Loss (Raw)": 2.30271053314209, "Pretrain/Step": 2050, "Pretrain/Step Time": 8.563814334571362} +{"Pretrain/Learning Rate": 4.56420672405374e-05, "Pretrain/Loss": 2.132948160171509, "Pretrain/Loss (Raw)": 1.8187406063079834, "Pretrain/Step": 2051, "Pretrain/Step Time": 8.564747301861644} +{"Pretrain/Learning Rate": 4.563727661730141e-05, "Pretrain/Loss": 2.1324760913848877, "Pretrain/Loss (Raw)": 1.9757790565490723, "Pretrain/Step": 2052, "Pretrain/Step Time": 8.565431471914053} +{"Pretrain/Learning Rate": 4.563248361407743e-05, "Pretrain/Loss": 2.1330831050872803, "Pretrain/Loss (Raw)": 2.152996301651001, "Pretrain/Step": 2053, "Pretrain/Step Time": 8.5651794411242} +{"Pretrain/Learning Rate": 4.562768823141821e-05, "Pretrain/Loss": 2.1329612731933594, "Pretrain/Loss (Raw)": 2.084611415863037, "Pretrain/Step": 2054, "Pretrain/Step Time": 8.563689295202494} +{"Pretrain/Learning Rate": 4.562289046987679e-05, "Pretrain/Loss": 2.1328463554382324, "Pretrain/Loss (Raw)": 2.088949680328369, "Pretrain/Step": 2055, "Pretrain/Step Time": 8.556595908477902} +{"Pretrain/Learning Rate": 4.561809033000646e-05, "Pretrain/Loss": 2.1334633827209473, "Pretrain/Loss (Raw)": 2.11944842338562, "Pretrain/Step": 2056, "Pretrain/Step Time": 8.559948232024908} +{"Pretrain/Learning Rate": 4.5613287812360796e-05, "Pretrain/Loss": 2.133868455886841, "Pretrain/Loss (Raw)": 2.118921995162964, "Pretrain/Step": 2057, "Pretrain/Step Time": 8.56028925254941} +{"Pretrain/Learning Rate": 4.560848291749365e-05, "Pretrain/Loss": 2.1347150802612305, "Pretrain/Loss (Raw)": 2.162843942642212, "Pretrain/Step": 2058, "Pretrain/Step Time": 8.558213436976075} +{"Pretrain/Learning Rate": 4.560367564595914e-05, "Pretrain/Loss": 2.1347880363464355, "Pretrain/Loss (Raw)": 2.0305116176605225, "Pretrain/Step": 2059, "Pretrain/Step Time": 8.558813283219934} +{"Pretrain/Learning Rate": 4.559886599831167e-05, "Pretrain/Loss": 2.1318795680999756, "Pretrain/Loss (Raw)": 1.930741310119629, "Pretrain/Step": 2060, "Pretrain/Step Time": 8.554043255746365} +{"Pretrain/Learning Rate": 4.559405397510591e-05, "Pretrain/Loss": 2.1329994201660156, "Pretrain/Loss (Raw)": 2.2956855297088623, "Pretrain/Step": 2061, "Pretrain/Step Time": 8.550407974049449} +{"Pretrain/Learning Rate": 4.55892395768968e-05, "Pretrain/Loss": 2.135387897491455, "Pretrain/Loss (Raw)": 2.3147871494293213, "Pretrain/Step": 2062, "Pretrain/Step Time": 8.560103263705969} +{"Pretrain/Learning Rate": 4.5584422804239566e-05, "Pretrain/Loss": 2.1361236572265625, "Pretrain/Loss (Raw)": 2.225254535675049, "Pretrain/Step": 2063, "Pretrain/Step Time": 8.564901050180197} +{"Pretrain/Learning Rate": 4.55796036576897e-05, "Pretrain/Loss": 2.13543963432312, "Pretrain/Loss (Raw)": 2.2812750339508057, "Pretrain/Step": 2064, "Pretrain/Step Time": 8.571112535893917} +{"Pretrain/Learning Rate": 4.557478213780295e-05, "Pretrain/Loss": 2.133565664291382, "Pretrain/Loss (Raw)": 1.9493407011032104, "Pretrain/Step": 2065, "Pretrain/Step Time": 8.569993892684579} +{"Pretrain/Learning Rate": 4.556995824513539e-05, "Pretrain/Loss": 2.1318540573120117, "Pretrain/Loss (Raw)": 1.987370252609253, "Pretrain/Step": 2066, "Pretrain/Step Time": 8.568161027505994} +{"Pretrain/Learning Rate": 4.5565131980243305e-05, "Pretrain/Loss": 2.1342434883117676, "Pretrain/Loss (Raw)": 2.334799289703369, "Pretrain/Step": 2067, "Pretrain/Step Time": 8.566044975072145} +{"Pretrain/Learning Rate": 4.55603033436833e-05, "Pretrain/Loss": 2.133223533630371, "Pretrain/Loss (Raw)": 2.1303203105926514, "Pretrain/Step": 2068, "Pretrain/Step Time": 8.576256653293967} +{"Pretrain/Learning Rate": 4.555547233601223e-05, "Pretrain/Loss": 2.1330676078796387, "Pretrain/Loss (Raw)": 2.1729538440704346, "Pretrain/Step": 2069, "Pretrain/Step Time": 8.578735321760178} +{"Pretrain/Learning Rate": 4.555063895778723e-05, "Pretrain/Loss": 2.1337056159973145, "Pretrain/Loss (Raw)": 2.1114377975463867, "Pretrain/Step": 2070, "Pretrain/Step Time": 8.576219199225307} +{"Pretrain/Learning Rate": 4.5545803209565704e-05, "Pretrain/Loss": 2.1350014209747314, "Pretrain/Loss (Raw)": 2.216552495956421, "Pretrain/Step": 2071, "Pretrain/Step Time": 8.576959190890193} +{"Pretrain/Learning Rate": 4.554096509190534e-05, "Pretrain/Loss": 2.1339588165283203, "Pretrain/Loss (Raw)": 2.0616872310638428, "Pretrain/Step": 2072, "Pretrain/Step Time": 8.571999207139015} +{"Pretrain/Learning Rate": 4.5536124605364085e-05, "Pretrain/Loss": 2.1354918479919434, "Pretrain/Loss (Raw)": 2.4565935134887695, "Pretrain/Step": 2073, "Pretrain/Step Time": 8.579580010846257} +{"Pretrain/Learning Rate": 4.553128175050018e-05, "Pretrain/Loss": 2.1342358589172363, "Pretrain/Loss (Raw)": 2.212831735610962, "Pretrain/Step": 2074, "Pretrain/Step Time": 8.574398927390575} +{"Pretrain/Learning Rate": 4.552643652787211e-05, "Pretrain/Loss": 2.134369373321533, "Pretrain/Loss (Raw)": 2.1418614387512207, "Pretrain/Step": 2075, "Pretrain/Step Time": 8.575688607990742} +{"Pretrain/Learning Rate": 4.552158893803865e-05, "Pretrain/Loss": 2.133873701095581, "Pretrain/Loss (Raw)": 1.9746673107147217, "Pretrain/Step": 2076, "Pretrain/Step Time": 8.573480322957039} +{"Pretrain/Learning Rate": 4.551673898155886e-05, "Pretrain/Loss": 2.1327967643737793, "Pretrain/Loss (Raw)": 2.007566452026367, "Pretrain/Step": 2077, "Pretrain/Step Time": 8.56735043041408} +{"Pretrain/Learning Rate": 4.5511886658992055e-05, "Pretrain/Loss": 2.1321187019348145, "Pretrain/Loss (Raw)": 2.0266330242156982, "Pretrain/Step": 2078, "Pretrain/Step Time": 8.568576585501432} +{"Pretrain/Learning Rate": 4.550703197089782e-05, "Pretrain/Loss": 2.1326537132263184, "Pretrain/Loss (Raw)": 2.096991539001465, "Pretrain/Step": 2079, "Pretrain/Step Time": 8.566395103931427} +{"Pretrain/Learning Rate": 4.550217491783603e-05, "Pretrain/Loss": 2.131606101989746, "Pretrain/Loss (Raw)": 1.9999903440475464, "Pretrain/Step": 2080, "Pretrain/Step Time": 8.565312158316374} +{"Pretrain/Learning Rate": 4.549731550036682e-05, "Pretrain/Loss": 2.130063533782959, "Pretrain/Loss (Raw)": 2.045797348022461, "Pretrain/Step": 2081, "Pretrain/Step Time": 8.564674574881792} +{"Pretrain/Learning Rate": 4.5492453719050596e-05, "Pretrain/Loss": 2.1286187171936035, "Pretrain/Loss (Raw)": 2.0212759971618652, "Pretrain/Step": 2082, "Pretrain/Step Time": 8.561968369409442} +{"Pretrain/Learning Rate": 4.5487589574448046e-05, "Pretrain/Loss": 2.129535675048828, "Pretrain/Loss (Raw)": 2.3356142044067383, "Pretrain/Step": 2083, "Pretrain/Step Time": 8.562174132093787} +{"Pretrain/Learning Rate": 4.5482723067120124e-05, "Pretrain/Loss": 2.1294474601745605, "Pretrain/Loss (Raw)": 2.192763090133667, "Pretrain/Step": 2084, "Pretrain/Step Time": 8.56112165004015} +{"Pretrain/Learning Rate": 4.547785419762807e-05, "Pretrain/Loss": 2.1260204315185547, "Pretrain/Loss (Raw)": 1.866807222366333, "Pretrain/Step": 2085, "Pretrain/Step Time": 8.577088922262192} +{"Pretrain/Learning Rate": 4.547298296653336e-05, "Pretrain/Loss": 2.1255922317504883, "Pretrain/Loss (Raw)": 2.1888363361358643, "Pretrain/Step": 2086, "Pretrain/Step Time": 8.56752461194992} +{"Pretrain/Learning Rate": 4.5468109374397796e-05, "Pretrain/Loss": 2.123976707458496, "Pretrain/Loss (Raw)": 2.0735719203948975, "Pretrain/Step": 2087, "Pretrain/Step Time": 8.571085318922997} +{"Pretrain/Learning Rate": 4.54632334217834e-05, "Pretrain/Loss": 2.1247568130493164, "Pretrain/Loss (Raw)": 2.2113029956817627, "Pretrain/Step": 2088, "Pretrain/Step Time": 8.559538044035435} +{"Pretrain/Learning Rate": 4.545835510925251e-05, "Pretrain/Loss": 2.1244640350341797, "Pretrain/Loss (Raw)": 2.1041452884674072, "Pretrain/Step": 2089, "Pretrain/Step Time": 8.55613580532372} +{"Pretrain/Learning Rate": 4.5453474437367695e-05, "Pretrain/Loss": 2.1252281665802, "Pretrain/Loss (Raw)": 2.166471481323242, "Pretrain/Step": 2090, "Pretrain/Step Time": 8.557031612843275} +{"Pretrain/Learning Rate": 4.544859140669183e-05, "Pretrain/Loss": 2.125669002532959, "Pretrain/Loss (Raw)": 2.2382609844207764, "Pretrain/Step": 2091, "Pretrain/Step Time": 8.567823234945536} +{"Pretrain/Learning Rate": 4.5443706017788054e-05, "Pretrain/Loss": 2.124406576156616, "Pretrain/Loss (Raw)": 2.0673794746398926, "Pretrain/Step": 2092, "Pretrain/Step Time": 8.554972914978862} +{"Pretrain/Learning Rate": 4.5438818271219765e-05, "Pretrain/Loss": 2.125793933868408, "Pretrain/Loss (Raw)": 2.1875343322753906, "Pretrain/Step": 2093, "Pretrain/Step Time": 8.548673324286938} +{"Pretrain/Learning Rate": 4.5433928167550634e-05, "Pretrain/Loss": 2.1269569396972656, "Pretrain/Loss (Raw)": 2.3044097423553467, "Pretrain/Step": 2094, "Pretrain/Step Time": 8.547144090756774} +{"Pretrain/Learning Rate": 4.542903570734463e-05, "Pretrain/Loss": 2.1270413398742676, "Pretrain/Loss (Raw)": 2.3759608268737793, "Pretrain/Step": 2095, "Pretrain/Step Time": 8.545278627425432} +{"Pretrain/Learning Rate": 4.542414089116595e-05, "Pretrain/Loss": 2.127285957336426, "Pretrain/Loss (Raw)": 2.2035088539123535, "Pretrain/Step": 2096, "Pretrain/Step Time": 8.546159200370312} +{"Pretrain/Learning Rate": 4.541924371957911e-05, "Pretrain/Loss": 2.127335548400879, "Pretrain/Loss (Raw)": 2.0835647583007812, "Pretrain/Step": 2097, "Pretrain/Step Time": 8.54799429886043} +{"Pretrain/Learning Rate": 4.5414344193148866e-05, "Pretrain/Loss": 2.12768292427063, "Pretrain/Loss (Raw)": 2.2557151317596436, "Pretrain/Step": 2098, "Pretrain/Step Time": 8.541589664295316} +{"Pretrain/Learning Rate": 4.540944231244025e-05, "Pretrain/Loss": 2.129340171813965, "Pretrain/Loss (Raw)": 2.1428892612457275, "Pretrain/Step": 2099, "Pretrain/Step Time": 8.542604641988873} +{"Pretrain/Learning Rate": 4.540453807801858e-05, "Pretrain/Loss": 2.128366470336914, "Pretrain/Loss (Raw)": 1.931925892829895, "Pretrain/Step": 2100, "Pretrain/Step Time": 8.54246568866074} +{"Pretrain/Learning Rate": 4.539963149044943e-05, "Pretrain/Loss": 2.1270523071289062, "Pretrain/Loss (Raw)": 1.9202879667282104, "Pretrain/Step": 2101, "Pretrain/Step Time": 8.543962391093373} +{"Pretrain/Learning Rate": 4.539472255029864e-05, "Pretrain/Loss": 2.1266589164733887, "Pretrain/Loss (Raw)": 2.0510220527648926, "Pretrain/Step": 2102, "Pretrain/Step Time": 8.542811954393983} +{"Pretrain/Learning Rate": 4.538981125813235e-05, "Pretrain/Loss": 2.127319097518921, "Pretrain/Loss (Raw)": 2.0523793697357178, "Pretrain/Step": 2103, "Pretrain/Step Time": 8.543396620079875} +{"Pretrain/Learning Rate": 4.538489761451694e-05, "Pretrain/Loss": 2.1266517639160156, "Pretrain/Loss (Raw)": 2.0919559001922607, "Pretrain/Step": 2104, "Pretrain/Step Time": 8.541944179683924} +{"Pretrain/Learning Rate": 4.537998162001909e-05, "Pretrain/Loss": 2.1256513595581055, "Pretrain/Loss (Raw)": 2.0904200077056885, "Pretrain/Step": 2105, "Pretrain/Step Time": 8.541962528601289} +{"Pretrain/Learning Rate": 4.537506327520571e-05, "Pretrain/Loss": 2.1288669109344482, "Pretrain/Loss (Raw)": 2.3999977111816406, "Pretrain/Step": 2106, "Pretrain/Step Time": 8.543811364099383} +{"Pretrain/Learning Rate": 4.5370142580644036e-05, "Pretrain/Loss": 2.1295456886291504, "Pretrain/Loss (Raw)": 2.109543561935425, "Pretrain/Step": 2107, "Pretrain/Step Time": 8.540695242583752} +{"Pretrain/Learning Rate": 4.536521953690153e-05, "Pretrain/Loss": 2.128706932067871, "Pretrain/Loss (Raw)": 1.9924689531326294, "Pretrain/Step": 2108, "Pretrain/Step Time": 8.537340890616179} +{"Pretrain/Learning Rate": 4.5360294144545946e-05, "Pretrain/Loss": 2.128723621368408, "Pretrain/Loss (Raw)": 2.1188783645629883, "Pretrain/Step": 2109, "Pretrain/Step Time": 8.547704393044114} +{"Pretrain/Learning Rate": 4.5355366404145294e-05, "Pretrain/Loss": 2.13004469871521, "Pretrain/Loss (Raw)": 2.1273069381713867, "Pretrain/Step": 2110, "Pretrain/Step Time": 8.543477905914187} +{"Pretrain/Learning Rate": 4.5350436316267876e-05, "Pretrain/Loss": 2.132420063018799, "Pretrain/Loss (Raw)": 2.4104275703430176, "Pretrain/Step": 2111, "Pretrain/Step Time": 8.54635095410049} +{"Pretrain/Learning Rate": 4.534550388148224e-05, "Pretrain/Loss": 2.133114814758301, "Pretrain/Loss (Raw)": 2.266749143600464, "Pretrain/Step": 2112, "Pretrain/Step Time": 8.549969544634223} +{"Pretrain/Learning Rate": 4.5340569100357235e-05, "Pretrain/Loss": 2.1325559616088867, "Pretrain/Loss (Raw)": 2.0121419429779053, "Pretrain/Step": 2113, "Pretrain/Step Time": 8.548034213483334} +{"Pretrain/Learning Rate": 4.5335631973461944e-05, "Pretrain/Loss": 2.1322426795959473, "Pretrain/Loss (Raw)": 2.1965208053588867, "Pretrain/Step": 2114, "Pretrain/Step Time": 8.544469116255641} +{"Pretrain/Learning Rate": 4.5330692501365755e-05, "Pretrain/Loss": 2.1297597885131836, "Pretrain/Loss (Raw)": 1.940195918083191, "Pretrain/Step": 2115, "Pretrain/Step Time": 8.544807836413383} +{"Pretrain/Learning Rate": 4.532575068463831e-05, "Pretrain/Loss": 2.129774570465088, "Pretrain/Loss (Raw)": 2.1593821048736572, "Pretrain/Step": 2116, "Pretrain/Step Time": 8.543189438059926} +{"Pretrain/Learning Rate": 4.532080652384951e-05, "Pretrain/Loss": 2.1317343711853027, "Pretrain/Loss (Raw)": 2.2272560596466064, "Pretrain/Step": 2117, "Pretrain/Step Time": 8.53793023712933} +{"Pretrain/Learning Rate": 4.5315860019569546e-05, "Pretrain/Loss": 2.1335341930389404, "Pretrain/Loss (Raw)": 2.182121753692627, "Pretrain/Step": 2118, "Pretrain/Step Time": 8.53156659565866} +{"Pretrain/Learning Rate": 4.531091117236888e-05, "Pretrain/Loss": 2.133753538131714, "Pretrain/Loss (Raw)": 2.21041202545166, "Pretrain/Step": 2119, "Pretrain/Step Time": 8.52993692830205} +{"Pretrain/Learning Rate": 4.530595998281822e-05, "Pretrain/Loss": 2.1356558799743652, "Pretrain/Loss (Raw)": 2.205203056335449, "Pretrain/Step": 2120, "Pretrain/Step Time": 8.530779575929046} +{"Pretrain/Learning Rate": 4.530100645148858e-05, "Pretrain/Loss": 2.134751558303833, "Pretrain/Loss (Raw)": 1.967978596687317, "Pretrain/Step": 2121, "Pretrain/Step Time": 8.528034029528499} +{"Pretrain/Learning Rate": 4.529605057895121e-05, "Pretrain/Loss": 2.1348838806152344, "Pretrain/Loss (Raw)": 2.135359764099121, "Pretrain/Step": 2122, "Pretrain/Step Time": 8.52799073047936} +{"Pretrain/Learning Rate": 4.529109236577764e-05, "Pretrain/Loss": 2.134399890899658, "Pretrain/Loss (Raw)": 2.0235941410064697, "Pretrain/Step": 2123, "Pretrain/Step Time": 8.522619009017944} +{"Pretrain/Learning Rate": 4.5286131812539704e-05, "Pretrain/Loss": 2.1335606575012207, "Pretrain/Loss (Raw)": 2.056192636489868, "Pretrain/Step": 2124, "Pretrain/Step Time": 8.525593761354685} +{"Pretrain/Learning Rate": 4.5281168919809444e-05, "Pretrain/Loss": 2.130814552307129, "Pretrain/Loss (Raw)": 1.9125542640686035, "Pretrain/Step": 2125, "Pretrain/Step Time": 8.528841516003013} +{"Pretrain/Learning Rate": 4.527620368815921e-05, "Pretrain/Loss": 2.129025936126709, "Pretrain/Loss (Raw)": 1.9421255588531494, "Pretrain/Step": 2126, "Pretrain/Step Time": 8.533854611217976} +{"Pretrain/Learning Rate": 4.527123611816163e-05, "Pretrain/Loss": 2.1290206909179688, "Pretrain/Loss (Raw)": 2.163529634475708, "Pretrain/Step": 2127, "Pretrain/Step Time": 8.535291558131576} +{"Pretrain/Learning Rate": 4.526626621038958e-05, "Pretrain/Loss": 2.1267871856689453, "Pretrain/Loss (Raw)": 1.956727147102356, "Pretrain/Step": 2128, "Pretrain/Step Time": 8.542538560926914} +{"Pretrain/Learning Rate": 4.526129396541621e-05, "Pretrain/Loss": 2.1254377365112305, "Pretrain/Loss (Raw)": 2.03532075881958, "Pretrain/Step": 2129, "Pretrain/Step Time": 8.535345653072} +{"Pretrain/Learning Rate": 4.525631938381495e-05, "Pretrain/Loss": 2.125204563140869, "Pretrain/Loss (Raw)": 2.0723886489868164, "Pretrain/Step": 2130, "Pretrain/Step Time": 8.532734245061874} +{"Pretrain/Learning Rate": 4.5251342466159487e-05, "Pretrain/Loss": 2.1273136138916016, "Pretrain/Loss (Raw)": 2.3560516834259033, "Pretrain/Step": 2131, "Pretrain/Step Time": 8.542171604931355} +{"Pretrain/Learning Rate": 4.524636321302378e-05, "Pretrain/Loss": 2.126345634460449, "Pretrain/Loss (Raw)": 1.9816474914550781, "Pretrain/Step": 2132, "Pretrain/Step Time": 8.538725644350052} +{"Pretrain/Learning Rate": 4.524138162498206e-05, "Pretrain/Loss": 2.1269679069519043, "Pretrain/Loss (Raw)": 2.1864044666290283, "Pretrain/Step": 2133, "Pretrain/Step Time": 8.529781671240926} +{"Pretrain/Learning Rate": 4.5236397702608833e-05, "Pretrain/Loss": 2.129896879196167, "Pretrain/Loss (Raw)": 2.3848865032196045, "Pretrain/Step": 2134, "Pretrain/Step Time": 8.542028088122606} +{"Pretrain/Learning Rate": 4.5231411446478865e-05, "Pretrain/Loss": 2.1297249794006348, "Pretrain/Loss (Raw)": 2.1212658882141113, "Pretrain/Step": 2135, "Pretrain/Step Time": 8.539311027154326} +{"Pretrain/Learning Rate": 4.5226422857167207e-05, "Pretrain/Loss": 2.1273365020751953, "Pretrain/Loss (Raw)": 1.953709602355957, "Pretrain/Step": 2136, "Pretrain/Step Time": 8.538824601098895} +{"Pretrain/Learning Rate": 4.5221431935249144e-05, "Pretrain/Loss": 2.126396656036377, "Pretrain/Loss (Raw)": 2.0453484058380127, "Pretrain/Step": 2137, "Pretrain/Step Time": 8.542565368115902} +{"Pretrain/Learning Rate": 4.5216438681300265e-05, "Pretrain/Loss": 2.125495433807373, "Pretrain/Loss (Raw)": 1.998924732208252, "Pretrain/Step": 2138, "Pretrain/Step Time": 8.541587680578232} +{"Pretrain/Learning Rate": 4.521144309589641e-05, "Pretrain/Loss": 2.1250672340393066, "Pretrain/Loss (Raw)": 2.0847864151000977, "Pretrain/Step": 2139, "Pretrain/Step Time": 8.538012094795704} +{"Pretrain/Learning Rate": 4.520644517961371e-05, "Pretrain/Loss": 2.125053882598877, "Pretrain/Loss (Raw)": 2.1142678260803223, "Pretrain/Step": 2140, "Pretrain/Step Time": 8.54805352538824} +{"Pretrain/Learning Rate": 4.520144493302853e-05, "Pretrain/Loss": 2.1253395080566406, "Pretrain/Loss (Raw)": 2.1711513996124268, "Pretrain/Step": 2141, "Pretrain/Step Time": 8.545972803607583} +{"Pretrain/Learning Rate": 4.519644235671752e-05, "Pretrain/Loss": 2.1244359016418457, "Pretrain/Loss (Raw)": 2.019516706466675, "Pretrain/Step": 2142, "Pretrain/Step Time": 8.547796539962292} +{"Pretrain/Learning Rate": 4.519143745125762e-05, "Pretrain/Loss": 2.126875400543213, "Pretrain/Loss (Raw)": 2.2843263149261475, "Pretrain/Step": 2143, "Pretrain/Step Time": 8.54833273589611} +{"Pretrain/Learning Rate": 4.5186430217226004e-05, "Pretrain/Loss": 2.1283388137817383, "Pretrain/Loss (Raw)": 2.2096633911132812, "Pretrain/Step": 2144, "Pretrain/Step Time": 8.547872418537736} +{"Pretrain/Learning Rate": 4.518142065520013e-05, "Pretrain/Loss": 2.1291065216064453, "Pretrain/Loss (Raw)": 2.0810272693634033, "Pretrain/Step": 2145, "Pretrain/Step Time": 8.55020554177463} +{"Pretrain/Learning Rate": 4.5176408765757736e-05, "Pretrain/Loss": 2.1267409324645996, "Pretrain/Loss (Raw)": 1.9305421113967896, "Pretrain/Step": 2146, "Pretrain/Step Time": 8.550956496968865} +{"Pretrain/Learning Rate": 4.5171394549476794e-05, "Pretrain/Loss": 2.125419855117798, "Pretrain/Loss (Raw)": 1.9636809825897217, "Pretrain/Step": 2147, "Pretrain/Step Time": 8.546846503391862} +{"Pretrain/Learning Rate": 4.5166378006935595e-05, "Pretrain/Loss": 2.125056266784668, "Pretrain/Loss (Raw)": 2.1297082901000977, "Pretrain/Step": 2148, "Pretrain/Step Time": 8.549928463995457} +{"Pretrain/Learning Rate": 4.5161359138712655e-05, "Pretrain/Loss": 2.124666690826416, "Pretrain/Loss (Raw)": 2.179745674133301, "Pretrain/Step": 2149, "Pretrain/Step Time": 8.547511242330074} +{"Pretrain/Learning Rate": 4.5156337945386775e-05, "Pretrain/Loss": 2.123466968536377, "Pretrain/Loss (Raw)": 2.030750274658203, "Pretrain/Step": 2150, "Pretrain/Step Time": 8.545734208077192} +{"Pretrain/Learning Rate": 4.515131442753703e-05, "Pretrain/Loss": 2.123136520385742, "Pretrain/Loss (Raw)": 2.1524088382720947, "Pretrain/Step": 2151, "Pretrain/Step Time": 8.539807746186852} +{"Pretrain/Learning Rate": 4.5146288585742737e-05, "Pretrain/Loss": 2.1251423358917236, "Pretrain/Loss (Raw)": 2.26401948928833, "Pretrain/Step": 2152, "Pretrain/Step Time": 8.550056306645274} +{"Pretrain/Learning Rate": 4.514126042058352e-05, "Pretrain/Loss": 2.1251649856567383, "Pretrain/Loss (Raw)": 2.190392017364502, "Pretrain/Step": 2153, "Pretrain/Step Time": 8.547485910356045} +{"Pretrain/Learning Rate": 4.513622993263924e-05, "Pretrain/Loss": 2.122723340988159, "Pretrain/Loss (Raw)": 1.9805893898010254, "Pretrain/Step": 2154, "Pretrain/Step Time": 8.554556788876653} +{"Pretrain/Learning Rate": 4.5131197122490035e-05, "Pretrain/Loss": 2.1217522621154785, "Pretrain/Loss (Raw)": 2.0501770973205566, "Pretrain/Step": 2155, "Pretrain/Step Time": 8.557014044374228} +{"Pretrain/Learning Rate": 4.512616199071632e-05, "Pretrain/Loss": 2.1213645935058594, "Pretrain/Loss (Raw)": 2.067162275314331, "Pretrain/Step": 2156, "Pretrain/Step Time": 8.558241873979568} +{"Pretrain/Learning Rate": 4.512112453789877e-05, "Pretrain/Loss": 2.1210508346557617, "Pretrain/Loss (Raw)": 2.0030486583709717, "Pretrain/Step": 2157, "Pretrain/Step Time": 8.556023646146059} +{"Pretrain/Learning Rate": 4.5116084764618325e-05, "Pretrain/Loss": 2.121511459350586, "Pretrain/Loss (Raw)": 2.3103208541870117, "Pretrain/Step": 2158, "Pretrain/Step Time": 8.563695495948195} +{"Pretrain/Learning Rate": 4.511104267145618e-05, "Pretrain/Loss": 2.119647741317749, "Pretrain/Loss (Raw)": 1.9949833154678345, "Pretrain/Step": 2159, "Pretrain/Step Time": 8.561243426054716} +{"Pretrain/Learning Rate": 4.510599825899384e-05, "Pretrain/Loss": 2.121427059173584, "Pretrain/Loss (Raw)": 2.320697546005249, "Pretrain/Step": 2160, "Pretrain/Step Time": 8.563412822782993} +{"Pretrain/Learning Rate": 4.510095152781304e-05, "Pretrain/Loss": 2.1215267181396484, "Pretrain/Loss (Raw)": 2.1735000610351562, "Pretrain/Step": 2161, "Pretrain/Step Time": 8.564019149169326} +{"Pretrain/Learning Rate": 4.509590247849579e-05, "Pretrain/Loss": 2.1231982707977295, "Pretrain/Loss (Raw)": 2.168147325515747, "Pretrain/Step": 2162, "Pretrain/Step Time": 8.565154587849975} +{"Pretrain/Learning Rate": 4.509085111162437e-05, "Pretrain/Loss": 2.120305299758911, "Pretrain/Loss (Raw)": 1.8091124296188354, "Pretrain/Step": 2163, "Pretrain/Step Time": 8.56223526224494} +{"Pretrain/Learning Rate": 4.508579742778133e-05, "Pretrain/Loss": 2.1205685138702393, "Pretrain/Loss (Raw)": 2.215240001678467, "Pretrain/Step": 2164, "Pretrain/Step Time": 8.572459446266294} +{"Pretrain/Learning Rate": 4.508074142754948e-05, "Pretrain/Loss": 2.1195199489593506, "Pretrain/Loss (Raw)": 1.9427640438079834, "Pretrain/Step": 2165, "Pretrain/Step Time": 8.556687757372856} +{"Pretrain/Learning Rate": 4.507568311151191e-05, "Pretrain/Loss": 2.119490146636963, "Pretrain/Loss (Raw)": 2.129570245742798, "Pretrain/Step": 2166, "Pretrain/Step Time": 8.558768168091774} +{"Pretrain/Learning Rate": 4.5070622480251955e-05, "Pretrain/Loss": 2.11946439743042, "Pretrain/Loss (Raw)": 2.156947135925293, "Pretrain/Step": 2167, "Pretrain/Step Time": 8.554493142291903} +{"Pretrain/Learning Rate": 4.506555953435324e-05, "Pretrain/Loss": 2.1204757690429688, "Pretrain/Loss (Raw)": 2.1541521549224854, "Pretrain/Step": 2168, "Pretrain/Step Time": 8.556351194158196} +{"Pretrain/Learning Rate": 4.5060494274399654e-05, "Pretrain/Loss": 2.121878147125244, "Pretrain/Loss (Raw)": 2.1699392795562744, "Pretrain/Step": 2169, "Pretrain/Step Time": 8.556993912905455} +{"Pretrain/Learning Rate": 4.505542670097534e-05, "Pretrain/Loss": 2.120704412460327, "Pretrain/Loss (Raw)": 1.9983642101287842, "Pretrain/Step": 2170, "Pretrain/Step Time": 8.558179138228297} +{"Pretrain/Learning Rate": 4.505035681466472e-05, "Pretrain/Loss": 2.1194496154785156, "Pretrain/Loss (Raw)": 1.9281737804412842, "Pretrain/Step": 2171, "Pretrain/Step Time": 8.546524874866009} +{"Pretrain/Learning Rate": 4.504528461605247e-05, "Pretrain/Loss": 2.119758367538452, "Pretrain/Loss (Raw)": 2.089494228363037, "Pretrain/Step": 2172, "Pretrain/Step Time": 8.550599655136466} +{"Pretrain/Learning Rate": 4.5040210105723525e-05, "Pretrain/Loss": 2.1194450855255127, "Pretrain/Loss (Raw)": 2.0591683387756348, "Pretrain/Step": 2173, "Pretrain/Step Time": 8.542054295539856} +{"Pretrain/Learning Rate": 4.5035133284263134e-05, "Pretrain/Loss": 2.1173462867736816, "Pretrain/Loss (Raw)": 1.9292277097702026, "Pretrain/Step": 2174, "Pretrain/Step Time": 8.53870370797813} +{"Pretrain/Learning Rate": 4.5030054152256756e-05, "Pretrain/Loss": 2.1183228492736816, "Pretrain/Loss (Raw)": 2.1960179805755615, "Pretrain/Step": 2175, "Pretrain/Step Time": 8.538506412878633} +{"Pretrain/Learning Rate": 4.502497271029015e-05, "Pretrain/Loss": 2.116225242614746, "Pretrain/Loss (Raw)": 2.079598903656006, "Pretrain/Step": 2176, "Pretrain/Step Time": 8.537550808861852} +{"Pretrain/Learning Rate": 4.501988895894933e-05, "Pretrain/Loss": 2.1152665615081787, "Pretrain/Loss (Raw)": 2.18045973777771, "Pretrain/Step": 2177, "Pretrain/Step Time": 8.541937546804547} +{"Pretrain/Learning Rate": 4.501480289882058e-05, "Pretrain/Loss": 2.1131603717803955, "Pretrain/Loss (Raw)": 2.03312611579895, "Pretrain/Step": 2178, "Pretrain/Step Time": 8.538275811821222} +{"Pretrain/Learning Rate": 4.5009714530490455e-05, "Pretrain/Loss": 2.118091583251953, "Pretrain/Loss (Raw)": 2.4499170780181885, "Pretrain/Step": 2179, "Pretrain/Step Time": 8.540006682276726} +{"Pretrain/Learning Rate": 4.5004623854545746e-05, "Pretrain/Loss": 2.1192402839660645, "Pretrain/Loss (Raw)": 2.1228466033935547, "Pretrain/Step": 2180, "Pretrain/Step Time": 8.543543301522732} +{"Pretrain/Learning Rate": 4.4999530871573556e-05, "Pretrain/Loss": 2.118936538696289, "Pretrain/Loss (Raw)": 2.1140949726104736, "Pretrain/Step": 2181, "Pretrain/Step Time": 8.543643537908792} +{"Pretrain/Learning Rate": 4.499443558216123e-05, "Pretrain/Loss": 2.119307518005371, "Pretrain/Loss (Raw)": 2.132079601287842, "Pretrain/Step": 2182, "Pretrain/Step Time": 8.55384336411953} +{"Pretrain/Learning Rate": 4.498933798689638e-05, "Pretrain/Loss": 2.119016647338867, "Pretrain/Loss (Raw)": 2.051748514175415, "Pretrain/Step": 2183, "Pretrain/Step Time": 8.549521327018738} +{"Pretrain/Learning Rate": 4.498423808636687e-05, "Pretrain/Loss": 2.1184473037719727, "Pretrain/Loss (Raw)": 2.046557664871216, "Pretrain/Step": 2184, "Pretrain/Step Time": 8.550285380333662} +{"Pretrain/Learning Rate": 4.497913588116085e-05, "Pretrain/Loss": 2.1179704666137695, "Pretrain/Loss (Raw)": 2.057905912399292, "Pretrain/Step": 2185, "Pretrain/Step Time": 8.549243956804276} +{"Pretrain/Learning Rate": 4.497403137186674e-05, "Pretrain/Loss": 2.117645502090454, "Pretrain/Loss (Raw)": 2.121232748031616, "Pretrain/Step": 2186, "Pretrain/Step Time": 8.553915157914162} +{"Pretrain/Learning Rate": 4.496892455907322e-05, "Pretrain/Loss": 2.119594097137451, "Pretrain/Loss (Raw)": 2.279919147491455, "Pretrain/Step": 2187, "Pretrain/Step Time": 8.553481789305806} +{"Pretrain/Learning Rate": 4.496381544336922e-05, "Pretrain/Loss": 2.1206722259521484, "Pretrain/Loss (Raw)": 2.06876540184021, "Pretrain/Step": 2188, "Pretrain/Step Time": 8.560595873743296} +{"Pretrain/Learning Rate": 4.495870402534394e-05, "Pretrain/Loss": 2.1200008392333984, "Pretrain/Loss (Raw)": 2.2097597122192383, "Pretrain/Step": 2189, "Pretrain/Step Time": 8.558497233316302} +{"Pretrain/Learning Rate": 4.495359030558688e-05, "Pretrain/Loss": 2.1179497241973877, "Pretrain/Loss (Raw)": 2.05222225189209, "Pretrain/Step": 2190, "Pretrain/Step Time": 8.548625316470861} +{"Pretrain/Learning Rate": 4.494847428468775e-05, "Pretrain/Loss": 2.116046190261841, "Pretrain/Loss (Raw)": 1.9816102981567383, "Pretrain/Step": 2191, "Pretrain/Step Time": 8.545903136953712} +{"Pretrain/Learning Rate": 4.494335596323657e-05, "Pretrain/Loss": 2.1166844367980957, "Pretrain/Loss (Raw)": 2.3629603385925293, "Pretrain/Step": 2192, "Pretrain/Step Time": 8.545413322746754} +{"Pretrain/Learning Rate": 4.49382353418236e-05, "Pretrain/Loss": 2.1198387145996094, "Pretrain/Loss (Raw)": 2.353088855743408, "Pretrain/Step": 2193, "Pretrain/Step Time": 8.554512701928616} +{"Pretrain/Learning Rate": 4.493311242103938e-05, "Pretrain/Loss": 2.1188597679138184, "Pretrain/Loss (Raw)": 1.8620789051055908, "Pretrain/Step": 2194, "Pretrain/Step Time": 8.55098314397037} +{"Pretrain/Learning Rate": 4.4927987201474707e-05, "Pretrain/Loss": 2.115654706954956, "Pretrain/Loss (Raw)": 1.9245415925979614, "Pretrain/Step": 2195, "Pretrain/Step Time": 8.552025778219104} +{"Pretrain/Learning Rate": 4.492285968372065e-05, "Pretrain/Loss": 2.11660099029541, "Pretrain/Loss (Raw)": 2.2514264583587646, "Pretrain/Step": 2196, "Pretrain/Step Time": 8.540834613144398} +{"Pretrain/Learning Rate": 4.491772986836853e-05, "Pretrain/Loss": 2.116002082824707, "Pretrain/Loss (Raw)": 2.0963311195373535, "Pretrain/Step": 2197, "Pretrain/Step Time": 8.542122626677155} +{"Pretrain/Learning Rate": 4.4912597756009946e-05, "Pretrain/Loss": 2.1152687072753906, "Pretrain/Loss (Raw)": 2.017537832260132, "Pretrain/Step": 2198, "Pretrain/Step Time": 8.545331517234445} +{"Pretrain/Learning Rate": 4.490746334723677e-05, "Pretrain/Loss": 2.114023208618164, "Pretrain/Loss (Raw)": 2.0571274757385254, "Pretrain/Step": 2199, "Pretrain/Step Time": 8.54303266480565} +{"Pretrain/Learning Rate": 4.4902326642641095e-05, "Pretrain/Loss": 2.1134674549102783, "Pretrain/Loss (Raw)": 1.9905543327331543, "Pretrain/Step": 2200, "Pretrain/Step Time": 8.549667509272695} +{"Pretrain/Learning Rate": 4.489718764281534e-05, "Pretrain/Loss": 2.1118035316467285, "Pretrain/Loss (Raw)": 2.243603467941284, "Pretrain/Step": 2201, "Pretrain/Step Time": 8.540771359577775} +{"Pretrain/Learning Rate": 4.489204634835215e-05, "Pretrain/Loss": 2.109900951385498, "Pretrain/Loss (Raw)": 1.9693021774291992, "Pretrain/Step": 2202, "Pretrain/Step Time": 8.546481275931} +{"Pretrain/Learning Rate": 4.488690275984443e-05, "Pretrain/Loss": 2.1123805046081543, "Pretrain/Loss (Raw)": 2.4592719078063965, "Pretrain/Step": 2203, "Pretrain/Step Time": 8.535348808392882} +{"Pretrain/Learning Rate": 4.488175687788538e-05, "Pretrain/Loss": 2.1134390830993652, "Pretrain/Loss (Raw)": 2.110170364379883, "Pretrain/Step": 2204, "Pretrain/Step Time": 8.541558323428035} +{"Pretrain/Learning Rate": 4.4876608703068434e-05, "Pretrain/Loss": 2.114633798599243, "Pretrain/Loss (Raw)": 2.1604771614074707, "Pretrain/Step": 2205, "Pretrain/Step Time": 8.539385307580233} +{"Pretrain/Learning Rate": 4.487145823598732e-05, "Pretrain/Loss": 2.1159284114837646, "Pretrain/Loss (Raw)": 2.192338466644287, "Pretrain/Step": 2206, "Pretrain/Step Time": 8.548058420419693} +{"Pretrain/Learning Rate": 4.4866305477236e-05, "Pretrain/Loss": 2.1163723468780518, "Pretrain/Loss (Raw)": 2.153813123703003, "Pretrain/Step": 2207, "Pretrain/Step Time": 8.545189717784524} +{"Pretrain/Learning Rate": 4.486115042740872e-05, "Pretrain/Loss": 2.117598533630371, "Pretrain/Loss (Raw)": 2.156935930252075, "Pretrain/Step": 2208, "Pretrain/Step Time": 8.547862078994513} +{"Pretrain/Learning Rate": 4.4855993087099984e-05, "Pretrain/Loss": 2.118748664855957, "Pretrain/Loss (Raw)": 2.193018674850464, "Pretrain/Step": 2209, "Pretrain/Step Time": 8.544859873130918} +{"Pretrain/Learning Rate": 4.485083345690456e-05, "Pretrain/Loss": 2.121284246444702, "Pretrain/Loss (Raw)": 2.3458361625671387, "Pretrain/Step": 2210, "Pretrain/Step Time": 8.547065403312445} +{"Pretrain/Learning Rate": 4.4845671537417486e-05, "Pretrain/Loss": 2.1209349632263184, "Pretrain/Loss (Raw)": 2.2909016609191895, "Pretrain/Step": 2211, "Pretrain/Step Time": 8.548249734565616} +{"Pretrain/Learning Rate": 4.484050732923405e-05, "Pretrain/Loss": 2.1218485832214355, "Pretrain/Loss (Raw)": 2.309708595275879, "Pretrain/Step": 2212, "Pretrain/Step Time": 8.557162525132298} +{"Pretrain/Learning Rate": 4.483534083294982e-05, "Pretrain/Loss": 2.1236958503723145, "Pretrain/Loss (Raw)": 2.103241205215454, "Pretrain/Step": 2213, "Pretrain/Step Time": 8.542191796004772} +{"Pretrain/Learning Rate": 4.483017204916061e-05, "Pretrain/Loss": 2.125124454498291, "Pretrain/Loss (Raw)": 2.371696710586548, "Pretrain/Step": 2214, "Pretrain/Step Time": 8.546123253181577} +{"Pretrain/Learning Rate": 4.482500097846253e-05, "Pretrain/Loss": 2.125217914581299, "Pretrain/Loss (Raw)": 2.085549831390381, "Pretrain/Step": 2215, "Pretrain/Step Time": 8.540956081822515} +{"Pretrain/Learning Rate": 4.4819827621451906e-05, "Pretrain/Loss": 2.124680519104004, "Pretrain/Loss (Raw)": 2.1425139904022217, "Pretrain/Step": 2216, "Pretrain/Step Time": 8.542324049398303} +{"Pretrain/Learning Rate": 4.481465197872538e-05, "Pretrain/Loss": 2.1232337951660156, "Pretrain/Loss (Raw)": 1.9189739227294922, "Pretrain/Step": 2217, "Pretrain/Step Time": 8.540777025744319} +{"Pretrain/Learning Rate": 4.4809474050879806e-05, "Pretrain/Loss": 2.123227596282959, "Pretrain/Loss (Raw)": 2.165665626525879, "Pretrain/Step": 2218, "Pretrain/Step Time": 8.547364765778184} +{"Pretrain/Learning Rate": 4.4804293838512346e-05, "Pretrain/Loss": 2.122126817703247, "Pretrain/Loss (Raw)": 2.0973663330078125, "Pretrain/Step": 2219, "Pretrain/Step Time": 8.540209244936705} +{"Pretrain/Learning Rate": 4.47991113422204e-05, "Pretrain/Loss": 2.122436046600342, "Pretrain/Loss (Raw)": 2.10697603225708, "Pretrain/Step": 2220, "Pretrain/Step Time": 8.540477428585291} +{"Pretrain/Learning Rate": 4.479392656260163e-05, "Pretrain/Loss": 2.1220922470092773, "Pretrain/Loss (Raw)": 2.1435387134552, "Pretrain/Step": 2221, "Pretrain/Step Time": 8.544648284092546} +{"Pretrain/Learning Rate": 4.4788739500253986e-05, "Pretrain/Loss": 2.1188902854919434, "Pretrain/Loss (Raw)": 1.8945249319076538, "Pretrain/Step": 2222, "Pretrain/Step Time": 8.545325301587582} +{"Pretrain/Learning Rate": 4.4783550155775647e-05, "Pretrain/Loss": 2.1180405616760254, "Pretrain/Loss (Raw)": 2.2671873569488525, "Pretrain/Step": 2223, "Pretrain/Step Time": 8.545857166871428} +{"Pretrain/Learning Rate": 4.4778358529765085e-05, "Pretrain/Loss": 2.117936372756958, "Pretrain/Loss (Raw)": 2.190185785293579, "Pretrain/Step": 2224, "Pretrain/Step Time": 8.54701998271048} +{"Pretrain/Learning Rate": 4.477316462282102e-05, "Pretrain/Loss": 2.1185193061828613, "Pretrain/Loss (Raw)": 2.1581671237945557, "Pretrain/Step": 2225, "Pretrain/Step Time": 8.540014749392867} +{"Pretrain/Learning Rate": 4.476796843554243e-05, "Pretrain/Loss": 2.1171441078186035, "Pretrain/Loss (Raw)": 2.0797157287597656, "Pretrain/Step": 2226, "Pretrain/Step Time": 8.551835227757692} +{"Pretrain/Learning Rate": 4.4762769968528575e-05, "Pretrain/Loss": 2.11687970161438, "Pretrain/Loss (Raw)": 2.109034538269043, "Pretrain/Step": 2227, "Pretrain/Step Time": 8.550333807244897} +{"Pretrain/Learning Rate": 4.475756922237896e-05, "Pretrain/Loss": 2.1186671257019043, "Pretrain/Loss (Raw)": 2.1607308387756348, "Pretrain/Step": 2228, "Pretrain/Step Time": 8.553429583087564} +{"Pretrain/Learning Rate": 4.4752366197693365e-05, "Pretrain/Loss": 2.1210765838623047, "Pretrain/Loss (Raw)": 2.228668451309204, "Pretrain/Step": 2229, "Pretrain/Step Time": 8.553537085652351} +{"Pretrain/Learning Rate": 4.474716089507182e-05, "Pretrain/Loss": 2.121548652648926, "Pretrain/Loss (Raw)": 2.1114675998687744, "Pretrain/Step": 2230, "Pretrain/Step Time": 8.55003553070128} +{"Pretrain/Learning Rate": 4.474195331511464e-05, "Pretrain/Loss": 2.12333607673645, "Pretrain/Loss (Raw)": 2.28116512298584, "Pretrain/Step": 2231, "Pretrain/Step Time": 8.558207454159856} +{"Pretrain/Learning Rate": 4.473674345842236e-05, "Pretrain/Loss": 2.1239213943481445, "Pretrain/Loss (Raw)": 2.1668903827667236, "Pretrain/Step": 2232, "Pretrain/Step Time": 8.553669665008783} +{"Pretrain/Learning Rate": 4.4731531325595835e-05, "Pretrain/Loss": 2.125262498855591, "Pretrain/Loss (Raw)": 2.2620608806610107, "Pretrain/Step": 2233, "Pretrain/Step Time": 8.556316943839192} +{"Pretrain/Learning Rate": 4.472631691723613e-05, "Pretrain/Loss": 2.1246542930603027, "Pretrain/Loss (Raw)": 2.322155237197876, "Pretrain/Step": 2234, "Pretrain/Step Time": 8.557636572048068} +{"Pretrain/Learning Rate": 4.4721100233944606e-05, "Pretrain/Loss": 2.1266019344329834, "Pretrain/Loss (Raw)": 2.35884165763855, "Pretrain/Step": 2235, "Pretrain/Step Time": 8.556656701490283} +{"Pretrain/Learning Rate": 4.471588127632288e-05, "Pretrain/Loss": 2.128561019897461, "Pretrain/Loss (Raw)": 2.2432384490966797, "Pretrain/Step": 2236, "Pretrain/Step Time": 8.558348188176751} +{"Pretrain/Learning Rate": 4.471066004497282e-05, "Pretrain/Loss": 2.131511688232422, "Pretrain/Loss (Raw)": 2.4965837001800537, "Pretrain/Step": 2237, "Pretrain/Step Time": 8.55957137234509} +{"Pretrain/Learning Rate": 4.470543654049656e-05, "Pretrain/Loss": 2.132066249847412, "Pretrain/Loss (Raw)": 2.198256731033325, "Pretrain/Step": 2238, "Pretrain/Step Time": 8.560977948829532} +{"Pretrain/Learning Rate": 4.47002107634965e-05, "Pretrain/Loss": 2.1288681030273438, "Pretrain/Loss (Raw)": 2.0010688304901123, "Pretrain/Step": 2239, "Pretrain/Step Time": 8.554715357720852} +{"Pretrain/Learning Rate": 4.469498271457531e-05, "Pretrain/Loss": 2.127286911010742, "Pretrain/Loss (Raw)": 2.0643551349639893, "Pretrain/Step": 2240, "Pretrain/Step Time": 8.55180824920535} +{"Pretrain/Learning Rate": 4.468975239433591e-05, "Pretrain/Loss": 2.127420425415039, "Pretrain/Loss (Raw)": 2.0292558670043945, "Pretrain/Step": 2241, "Pretrain/Step Time": 8.551887834444642} +{"Pretrain/Learning Rate": 4.468451980338148e-05, "Pretrain/Loss": 2.1256532669067383, "Pretrain/Loss (Raw)": 1.9703350067138672, "Pretrain/Step": 2242, "Pretrain/Step Time": 8.557037245482206} +{"Pretrain/Learning Rate": 4.467928494231547e-05, "Pretrain/Loss": 2.1281442642211914, "Pretrain/Loss (Raw)": 2.259028196334839, "Pretrain/Step": 2243, "Pretrain/Step Time": 8.55788343027234} +{"Pretrain/Learning Rate": 4.4674047811741585e-05, "Pretrain/Loss": 2.1288411617279053, "Pretrain/Loss (Raw)": 2.248586654663086, "Pretrain/Step": 2244, "Pretrain/Step Time": 8.554855190217495} +{"Pretrain/Learning Rate": 4.466880841226381e-05, "Pretrain/Loss": 2.129636764526367, "Pretrain/Loss (Raw)": 2.3290884494781494, "Pretrain/Step": 2245, "Pretrain/Step Time": 8.55619658343494} +{"Pretrain/Learning Rate": 4.466356674448635e-05, "Pretrain/Loss": 2.1289303302764893, "Pretrain/Loss (Raw)": 2.091703414916992, "Pretrain/Step": 2246, "Pretrain/Step Time": 8.558359421789646} +{"Pretrain/Learning Rate": 4.4658322809013723e-05, "Pretrain/Loss": 2.1272075176239014, "Pretrain/Loss (Raw)": 1.9898930788040161, "Pretrain/Step": 2247, "Pretrain/Step Time": 8.5586520973593} +{"Pretrain/Learning Rate": 4.465307660645068e-05, "Pretrain/Loss": 2.1267311573028564, "Pretrain/Loss (Raw)": 2.1442043781280518, "Pretrain/Step": 2248, "Pretrain/Step Time": 8.5597401317209} +{"Pretrain/Learning Rate": 4.464782813740223e-05, "Pretrain/Loss": 2.127797842025757, "Pretrain/Loss (Raw)": 2.104537010192871, "Pretrain/Step": 2249, "Pretrain/Step Time": 8.563168983906507} +{"Pretrain/Learning Rate": 4.464257740247366e-05, "Pretrain/Loss": 2.1264355182647705, "Pretrain/Loss (Raw)": 1.9609776735305786, "Pretrain/Step": 2250, "Pretrain/Step Time": 8.563271384686232} +{"Pretrain/Learning Rate": 4.4637324402270495e-05, "Pretrain/Loss": 2.124880790710449, "Pretrain/Loss (Raw)": 1.8245657682418823, "Pretrain/Step": 2251, "Pretrain/Step Time": 8.562472961843014} +{"Pretrain/Learning Rate": 4.463206913739856e-05, "Pretrain/Loss": 2.124440908432007, "Pretrain/Loss (Raw)": 1.9999136924743652, "Pretrain/Step": 2252, "Pretrain/Step Time": 8.563947996124625} +{"Pretrain/Learning Rate": 4.462681160846389e-05, "Pretrain/Loss": 2.1255078315734863, "Pretrain/Loss (Raw)": 2.0491364002227783, "Pretrain/Step": 2253, "Pretrain/Step Time": 8.562153428792953} +{"Pretrain/Learning Rate": 4.4621551816072835e-05, "Pretrain/Loss": 2.127047061920166, "Pretrain/Loss (Raw)": 2.1391189098358154, "Pretrain/Step": 2254, "Pretrain/Step Time": 8.559948846697807} +{"Pretrain/Learning Rate": 4.4616289760831954e-05, "Pretrain/Loss": 2.1296310424804688, "Pretrain/Loss (Raw)": 2.494293451309204, "Pretrain/Step": 2255, "Pretrain/Step Time": 8.564697079360485} +{"Pretrain/Learning Rate": 4.46110254433481e-05, "Pretrain/Loss": 2.1307692527770996, "Pretrain/Loss (Raw)": 2.1024184226989746, "Pretrain/Step": 2256, "Pretrain/Step Time": 8.556345090270042} +{"Pretrain/Learning Rate": 4.4605758864228384e-05, "Pretrain/Loss": 2.1301305294036865, "Pretrain/Loss (Raw)": 1.953548789024353, "Pretrain/Step": 2257, "Pretrain/Step Time": 8.559164296835661} +{"Pretrain/Learning Rate": 4.460049002408018e-05, "Pretrain/Loss": 2.1308064460754395, "Pretrain/Loss (Raw)": 2.158921480178833, "Pretrain/Step": 2258, "Pretrain/Step Time": 8.56771406903863} +{"Pretrain/Learning Rate": 4.45952189235111e-05, "Pretrain/Loss": 2.12880802154541, "Pretrain/Loss (Raw)": 2.10023832321167, "Pretrain/Step": 2259, "Pretrain/Step Time": 8.563473651185632} +{"Pretrain/Learning Rate": 4.458994556312903e-05, "Pretrain/Loss": 2.1295948028564453, "Pretrain/Loss (Raw)": 2.082383155822754, "Pretrain/Step": 2260, "Pretrain/Step Time": 8.562878865748644} +{"Pretrain/Learning Rate": 4.458466994354214e-05, "Pretrain/Loss": 2.1287026405334473, "Pretrain/Loss (Raw)": 2.072166919708252, "Pretrain/Step": 2261, "Pretrain/Step Time": 8.574028555303812} +{"Pretrain/Learning Rate": 4.457939206535882e-05, "Pretrain/Loss": 2.125331401824951, "Pretrain/Loss (Raw)": 1.9533716440200806, "Pretrain/Step": 2262, "Pretrain/Step Time": 8.558300890028477} +{"Pretrain/Learning Rate": 4.4574111929187744e-05, "Pretrain/Loss": 2.1264657974243164, "Pretrain/Loss (Raw)": 2.266490936279297, "Pretrain/Step": 2263, "Pretrain/Step Time": 8.557641556486487} +{"Pretrain/Learning Rate": 4.4568829535637844e-05, "Pretrain/Loss": 2.128324270248413, "Pretrain/Loss (Raw)": 2.1915857791900635, "Pretrain/Step": 2264, "Pretrain/Step Time": 8.55775204114616} +{"Pretrain/Learning Rate": 4.456354488531832e-05, "Pretrain/Loss": 2.130585193634033, "Pretrain/Loss (Raw)": 2.3347411155700684, "Pretrain/Step": 2265, "Pretrain/Step Time": 8.558356143534184} +{"Pretrain/Learning Rate": 4.4558257978838605e-05, "Pretrain/Loss": 2.1301498413085938, "Pretrain/Loss (Raw)": 1.9431989192962646, "Pretrain/Step": 2266, "Pretrain/Step Time": 8.555193880572915} +{"Pretrain/Learning Rate": 4.455296881680842e-05, "Pretrain/Loss": 2.1292452812194824, "Pretrain/Loss (Raw)": 1.9690204858779907, "Pretrain/Step": 2267, "Pretrain/Step Time": 8.562914108857512} +{"Pretrain/Learning Rate": 4.4547677399837726e-05, "Pretrain/Loss": 2.1300406455993652, "Pretrain/Loss (Raw)": 2.216075897216797, "Pretrain/Step": 2268, "Pretrain/Step Time": 8.55149645730853} +{"Pretrain/Learning Rate": 4.4542383728536774e-05, "Pretrain/Loss": 2.128798007965088, "Pretrain/Loss (Raw)": 2.0120816230773926, "Pretrain/Step": 2269, "Pretrain/Step Time": 8.55077026039362} +{"Pretrain/Learning Rate": 4.453708780351604e-05, "Pretrain/Loss": 2.1293752193450928, "Pretrain/Loss (Raw)": 2.0933961868286133, "Pretrain/Step": 2270, "Pretrain/Step Time": 8.546939646825194} +{"Pretrain/Learning Rate": 4.4531789625386274e-05, "Pretrain/Loss": 2.127169132232666, "Pretrain/Loss (Raw)": 2.0019662380218506, "Pretrain/Step": 2271, "Pretrain/Step Time": 8.54813127592206} +{"Pretrain/Learning Rate": 4.45264891947585e-05, "Pretrain/Loss": 2.126967191696167, "Pretrain/Loss (Raw)": 2.183802604675293, "Pretrain/Step": 2272, "Pretrain/Step Time": 8.546373950317502} +{"Pretrain/Learning Rate": 4.452118651224398e-05, "Pretrain/Loss": 2.128054618835449, "Pretrain/Loss (Raw)": 2.2201952934265137, "Pretrain/Step": 2273, "Pretrain/Step Time": 8.552980782464147} +{"Pretrain/Learning Rate": 4.451588157845424e-05, "Pretrain/Loss": 2.1278765201568604, "Pretrain/Loss (Raw)": 1.907759666442871, "Pretrain/Step": 2274, "Pretrain/Step Time": 8.55429757758975} +{"Pretrain/Learning Rate": 4.451057439400108e-05, "Pretrain/Loss": 2.128338575363159, "Pretrain/Loss (Raw)": 2.0228168964385986, "Pretrain/Step": 2275, "Pretrain/Step Time": 8.556573620066047} +{"Pretrain/Learning Rate": 4.450526495949653e-05, "Pretrain/Loss": 2.1296944618225098, "Pretrain/Loss (Raw)": 2.3032522201538086, "Pretrain/Step": 2276, "Pretrain/Step Time": 8.555076353251934} +{"Pretrain/Learning Rate": 4.449995327555293e-05, "Pretrain/Loss": 2.130014419555664, "Pretrain/Loss (Raw)": 2.220693588256836, "Pretrain/Step": 2277, "Pretrain/Step Time": 8.553421014919877} +{"Pretrain/Learning Rate": 4.449463934278282e-05, "Pretrain/Loss": 2.1314549446105957, "Pretrain/Loss (Raw)": 2.2151479721069336, "Pretrain/Step": 2278, "Pretrain/Step Time": 8.55058840289712} +{"Pretrain/Learning Rate": 4.4489323161799045e-05, "Pretrain/Loss": 2.1309945583343506, "Pretrain/Loss (Raw)": 2.093487024307251, "Pretrain/Step": 2279, "Pretrain/Step Time": 8.562802435830235} +{"Pretrain/Learning Rate": 4.4484004733214685e-05, "Pretrain/Loss": 2.129666805267334, "Pretrain/Loss (Raw)": 2.0940887928009033, "Pretrain/Step": 2280, "Pretrain/Step Time": 8.551516933366656} +{"Pretrain/Learning Rate": 4.447868405764309e-05, "Pretrain/Loss": 2.128744125366211, "Pretrain/Loss (Raw)": 2.0722827911376953, "Pretrain/Step": 2281, "Pretrain/Step Time": 8.55302570015192} +{"Pretrain/Learning Rate": 4.4473361135697856e-05, "Pretrain/Loss": 2.128180980682373, "Pretrain/Loss (Raw)": 1.9084782600402832, "Pretrain/Step": 2282, "Pretrain/Step Time": 8.54683799855411} +{"Pretrain/Learning Rate": 4.446803596799286e-05, "Pretrain/Loss": 2.128196954727173, "Pretrain/Loss (Raw)": 2.052229404449463, "Pretrain/Step": 2283, "Pretrain/Step Time": 8.546126559376717} +{"Pretrain/Learning Rate": 4.446270855514222e-05, "Pretrain/Loss": 2.1283483505249023, "Pretrain/Loss (Raw)": 2.086559772491455, "Pretrain/Step": 2284, "Pretrain/Step Time": 8.544210247695446} +{"Pretrain/Learning Rate": 4.445737889776031e-05, "Pretrain/Loss": 2.1292455196380615, "Pretrain/Loss (Raw)": 2.117859363555908, "Pretrain/Step": 2285, "Pretrain/Step Time": 8.55103156901896} +{"Pretrain/Learning Rate": 4.44520469964618e-05, "Pretrain/Loss": 2.124790668487549, "Pretrain/Loss (Raw)": 1.7400987148284912, "Pretrain/Step": 2286, "Pretrain/Step Time": 8.541426056995988} +{"Pretrain/Learning Rate": 4.444671285186155e-05, "Pretrain/Loss": 2.125605583190918, "Pretrain/Loss (Raw)": 2.0992770195007324, "Pretrain/Step": 2287, "Pretrain/Step Time": 8.543131468817592} +{"Pretrain/Learning Rate": 4.444137646457474e-05, "Pretrain/Loss": 2.126959800720215, "Pretrain/Loss (Raw)": 2.494062662124634, "Pretrain/Step": 2288, "Pretrain/Step Time": 8.540140552446246} +{"Pretrain/Learning Rate": 4.4436037835216784e-05, "Pretrain/Loss": 2.1261491775512695, "Pretrain/Loss (Raw)": 2.06976318359375, "Pretrain/Step": 2289, "Pretrain/Step Time": 8.542307140305638} +{"Pretrain/Learning Rate": 4.4430696964403366e-05, "Pretrain/Loss": 2.123391628265381, "Pretrain/Loss (Raw)": 1.8151792287826538, "Pretrain/Step": 2290, "Pretrain/Step Time": 8.540679007768631} +{"Pretrain/Learning Rate": 4.4425353852750414e-05, "Pretrain/Loss": 2.1253957748413086, "Pretrain/Loss (Raw)": 2.0656304359436035, "Pretrain/Step": 2291, "Pretrain/Step Time": 8.5481270942837} +{"Pretrain/Learning Rate": 4.4420008500874116e-05, "Pretrain/Loss": 2.1239356994628906, "Pretrain/Loss (Raw)": 2.0283405780792236, "Pretrain/Step": 2292, "Pretrain/Step Time": 8.539140522480011} +{"Pretrain/Learning Rate": 4.441466090939093e-05, "Pretrain/Loss": 2.126741409301758, "Pretrain/Loss (Raw)": 2.301905870437622, "Pretrain/Step": 2293, "Pretrain/Step Time": 8.54163832589984} +{"Pretrain/Learning Rate": 4.440931107891756e-05, "Pretrain/Loss": 2.1285557746887207, "Pretrain/Loss (Raw)": 2.361793279647827, "Pretrain/Step": 2294, "Pretrain/Step Time": 8.539765214547515} +{"Pretrain/Learning Rate": 4.440395901007098e-05, "Pretrain/Loss": 2.128420114517212, "Pretrain/Loss (Raw)": 2.139578342437744, "Pretrain/Step": 2295, "Pretrain/Step Time": 8.54021169245243} +{"Pretrain/Learning Rate": 4.4398604703468415e-05, "Pretrain/Loss": 2.1275734901428223, "Pretrain/Loss (Raw)": 2.0458242893218994, "Pretrain/Step": 2296, "Pretrain/Step Time": 8.538707286119461} +{"Pretrain/Learning Rate": 4.439324815972734e-05, "Pretrain/Loss": 2.1267929077148438, "Pretrain/Loss (Raw)": 2.070011615753174, "Pretrain/Step": 2297, "Pretrain/Step Time": 8.542735932394862} +{"Pretrain/Learning Rate": 4.438788937946551e-05, "Pretrain/Loss": 2.1275649070739746, "Pretrain/Loss (Raw)": 2.097170114517212, "Pretrain/Step": 2298, "Pretrain/Step Time": 8.538159785792232} +{"Pretrain/Learning Rate": 4.4382528363300916e-05, "Pretrain/Loss": 2.1285207271575928, "Pretrain/Loss (Raw)": 2.0505053997039795, "Pretrain/Step": 2299, "Pretrain/Step Time": 8.544227289035916} +{"Pretrain/Learning Rate": 4.437716511185181e-05, "Pretrain/Loss": 2.1293442249298096, "Pretrain/Loss (Raw)": 2.194918394088745, "Pretrain/Step": 2300, "Pretrain/Step Time": 8.545314326882362} +{"Pretrain/Learning Rate": 4.437179962573672e-05, "Pretrain/Loss": 2.1299893856048584, "Pretrain/Loss (Raw)": 2.141740322113037, "Pretrain/Step": 2301, "Pretrain/Step Time": 8.545338777825236} +{"Pretrain/Learning Rate": 4.436643190557441e-05, "Pretrain/Loss": 2.129763603210449, "Pretrain/Loss (Raw)": 1.9003514051437378, "Pretrain/Step": 2302, "Pretrain/Step Time": 8.541334185749292} +{"Pretrain/Learning Rate": 4.4361061951983925e-05, "Pretrain/Loss": 2.1313881874084473, "Pretrain/Loss (Raw)": 2.4039347171783447, "Pretrain/Step": 2303, "Pretrain/Step Time": 8.549181187525392} +{"Pretrain/Learning Rate": 4.435568976558454e-05, "Pretrain/Loss": 2.130969524383545, "Pretrain/Loss (Raw)": 2.0260231494903564, "Pretrain/Step": 2304, "Pretrain/Step Time": 8.549269372597337} +{"Pretrain/Learning Rate": 4.4350315346995804e-05, "Pretrain/Loss": 2.1320414543151855, "Pretrain/Loss (Raw)": 2.31768536567688, "Pretrain/Step": 2305, "Pretrain/Step Time": 8.542056668549776} +{"Pretrain/Learning Rate": 4.434493869683752e-05, "Pretrain/Loss": 2.132957935333252, "Pretrain/Loss (Raw)": 2.1504297256469727, "Pretrain/Step": 2306, "Pretrain/Step Time": 8.545248815789819} +{"Pretrain/Learning Rate": 4.4339559815729746e-05, "Pretrain/Loss": 2.1279306411743164, "Pretrain/Loss (Raw)": 1.806426763534546, "Pretrain/Step": 2307, "Pretrain/Step Time": 8.547605838626623} +{"Pretrain/Learning Rate": 4.4334178704292805e-05, "Pretrain/Loss": 2.128232955932617, "Pretrain/Loss (Raw)": 2.161531686782837, "Pretrain/Step": 2308, "Pretrain/Step Time": 8.545260412618518} +{"Pretrain/Learning Rate": 4.432879536314727e-05, "Pretrain/Loss": 2.1268362998962402, "Pretrain/Loss (Raw)": 1.9353053569793701, "Pretrain/Step": 2309, "Pretrain/Step Time": 8.541200339794159} +{"Pretrain/Learning Rate": 4.4323409792913974e-05, "Pretrain/Loss": 2.125488042831421, "Pretrain/Loss (Raw)": 1.959505319595337, "Pretrain/Step": 2310, "Pretrain/Step Time": 8.541843712329865} +{"Pretrain/Learning Rate": 4.431802199421401e-05, "Pretrain/Loss": 2.1239795684814453, "Pretrain/Loss (Raw)": 1.8586870431900024, "Pretrain/Step": 2311, "Pretrain/Step Time": 8.543861720710993} +{"Pretrain/Learning Rate": 4.431263196766872e-05, "Pretrain/Loss": 2.124141216278076, "Pretrain/Loss (Raw)": 2.0672338008880615, "Pretrain/Step": 2312, "Pretrain/Step Time": 8.540696397423744} +{"Pretrain/Learning Rate": 4.43072397138997e-05, "Pretrain/Loss": 2.122452735900879, "Pretrain/Loss (Raw)": 1.8417898416519165, "Pretrain/Step": 2313, "Pretrain/Step Time": 8.544399635866284} +{"Pretrain/Learning Rate": 4.430184523352881e-05, "Pretrain/Loss": 2.1219840049743652, "Pretrain/Loss (Raw)": 2.0612502098083496, "Pretrain/Step": 2314, "Pretrain/Step Time": 8.541962832212448} +{"Pretrain/Learning Rate": 4.429644852717819e-05, "Pretrain/Loss": 2.1200900077819824, "Pretrain/Loss (Raw)": 2.037456750869751, "Pretrain/Step": 2315, "Pretrain/Step Time": 8.541247088462114} +{"Pretrain/Learning Rate": 4.4291049595470193e-05, "Pretrain/Loss": 2.1203393936157227, "Pretrain/Loss (Raw)": 2.1006858348846436, "Pretrain/Step": 2316, "Pretrain/Step Time": 8.540707869455218} +{"Pretrain/Learning Rate": 4.428564843902746e-05, "Pretrain/Loss": 2.1198391914367676, "Pretrain/Loss (Raw)": 2.145737409591675, "Pretrain/Step": 2317, "Pretrain/Step Time": 8.545290326699615} +{"Pretrain/Learning Rate": 4.4280245058472866e-05, "Pretrain/Loss": 2.1210954189300537, "Pretrain/Loss (Raw)": 2.213038206100464, "Pretrain/Step": 2318, "Pretrain/Step Time": 8.548063088208437} +{"Pretrain/Learning Rate": 4.427483945442956e-05, "Pretrain/Loss": 2.122206211090088, "Pretrain/Loss (Raw)": 2.123781681060791, "Pretrain/Step": 2319, "Pretrain/Step Time": 8.548933256417513} +{"Pretrain/Learning Rate": 4.426943162752094e-05, "Pretrain/Loss": 2.118351697921753, "Pretrain/Loss (Raw)": 1.8695873022079468, "Pretrain/Step": 2320, "Pretrain/Step Time": 8.547775922343135} +{"Pretrain/Learning Rate": 4.426402157837067e-05, "Pretrain/Loss": 2.1162109375, "Pretrain/Loss (Raw)": 2.0790774822235107, "Pretrain/Step": 2321, "Pretrain/Step Time": 8.538095369935036} +{"Pretrain/Learning Rate": 4.425860930760265e-05, "Pretrain/Loss": 2.1183927059173584, "Pretrain/Loss (Raw)": 2.1413445472717285, "Pretrain/Step": 2322, "Pretrain/Step Time": 8.546037163585424} +{"Pretrain/Learning Rate": 4.4253194815841056e-05, "Pretrain/Loss": 2.119905471801758, "Pretrain/Loss (Raw)": 2.118187427520752, "Pretrain/Step": 2323, "Pretrain/Step Time": 8.545438891276717} +{"Pretrain/Learning Rate": 4.424777810371032e-05, "Pretrain/Loss": 2.1184017658233643, "Pretrain/Loss (Raw)": 2.0589377880096436, "Pretrain/Step": 2324, "Pretrain/Step Time": 8.5462526679039} +{"Pretrain/Learning Rate": 4.424235917183511e-05, "Pretrain/Loss": 2.121072769165039, "Pretrain/Loss (Raw)": 2.4382100105285645, "Pretrain/Step": 2325, "Pretrain/Step Time": 8.543767081573606} +{"Pretrain/Learning Rate": 4.4236938020840365e-05, "Pretrain/Loss": 2.122075080871582, "Pretrain/Loss (Raw)": 2.1458561420440674, "Pretrain/Step": 2326, "Pretrain/Step Time": 8.542345713824034} +{"Pretrain/Learning Rate": 4.423151465135128e-05, "Pretrain/Loss": 2.1212263107299805, "Pretrain/Loss (Raw)": 1.9484539031982422, "Pretrain/Step": 2327, "Pretrain/Step Time": 8.541867734864354} +{"Pretrain/Learning Rate": 4.422608906399331e-05, "Pretrain/Loss": 2.12249755859375, "Pretrain/Loss (Raw)": 2.153287887573242, "Pretrain/Step": 2328, "Pretrain/Step Time": 8.541585981845856} +{"Pretrain/Learning Rate": 4.4220661259392146e-05, "Pretrain/Loss": 2.119933605194092, "Pretrain/Loss (Raw)": 1.9153937101364136, "Pretrain/Step": 2329, "Pretrain/Step Time": 8.544304568320513} +{"Pretrain/Learning Rate": 4.421523123817376e-05, "Pretrain/Loss": 2.122103452682495, "Pretrain/Loss (Raw)": 2.247083902359009, "Pretrain/Step": 2330, "Pretrain/Step Time": 8.540116220712662} +{"Pretrain/Learning Rate": 4.420979900096436e-05, "Pretrain/Loss": 2.1197261810302734, "Pretrain/Loss (Raw)": 2.1549596786499023, "Pretrain/Step": 2331, "Pretrain/Step Time": 8.546258382499218} +{"Pretrain/Learning Rate": 4.420436454839041e-05, "Pretrain/Loss": 2.1219136714935303, "Pretrain/Loss (Raw)": 2.3901751041412354, "Pretrain/Step": 2332, "Pretrain/Step Time": 8.542636912316084} +{"Pretrain/Learning Rate": 4.419892788107865e-05, "Pretrain/Loss": 2.1210052967071533, "Pretrain/Loss (Raw)": 2.044201374053955, "Pretrain/Step": 2333, "Pretrain/Step Time": 8.546520495787263} +{"Pretrain/Learning Rate": 4.419348899965608e-05, "Pretrain/Loss": 2.119953155517578, "Pretrain/Loss (Raw)": 2.0576565265655518, "Pretrain/Step": 2334, "Pretrain/Step Time": 8.547719359397888} +{"Pretrain/Learning Rate": 4.4188047904749894e-05, "Pretrain/Loss": 2.1186575889587402, "Pretrain/Loss (Raw)": 1.988011121749878, "Pretrain/Step": 2335, "Pretrain/Step Time": 8.547180239111185} +{"Pretrain/Learning Rate": 4.418260459698761e-05, "Pretrain/Loss": 2.119076728820801, "Pretrain/Loss (Raw)": 2.2105562686920166, "Pretrain/Step": 2336, "Pretrain/Step Time": 8.545424649491906} +{"Pretrain/Learning Rate": 4.417715907699698e-05, "Pretrain/Loss": 2.1202402114868164, "Pretrain/Loss (Raw)": 2.3419437408447266, "Pretrain/Step": 2337, "Pretrain/Step Time": 8.544336225837469} +{"Pretrain/Learning Rate": 4.417171134540599e-05, "Pretrain/Loss": 2.11812686920166, "Pretrain/Loss (Raw)": 2.0753331184387207, "Pretrain/Step": 2338, "Pretrain/Step Time": 8.548496389761567} +{"Pretrain/Learning Rate": 4.416626140284291e-05, "Pretrain/Loss": 2.11580228805542, "Pretrain/Loss (Raw)": 1.9933782815933228, "Pretrain/Step": 2339, "Pretrain/Step Time": 8.548839297145605} +{"Pretrain/Learning Rate": 4.416080924993625e-05, "Pretrain/Loss": 2.114234209060669, "Pretrain/Loss (Raw)": 2.1089723110198975, "Pretrain/Step": 2340, "Pretrain/Step Time": 8.54499526321888} +{"Pretrain/Learning Rate": 4.415535488731478e-05, "Pretrain/Loss": 2.1153955459594727, "Pretrain/Loss (Raw)": 2.251889944076538, "Pretrain/Step": 2341, "Pretrain/Step Time": 8.549236295744777} +{"Pretrain/Learning Rate": 4.414989831560753e-05, "Pretrain/Loss": 2.1139440536499023, "Pretrain/Loss (Raw)": 2.1859240531921387, "Pretrain/Step": 2342, "Pretrain/Step Time": 8.551542507484555} +{"Pretrain/Learning Rate": 4.4144439535443763e-05, "Pretrain/Loss": 2.1151137351989746, "Pretrain/Loss (Raw)": 2.235276699066162, "Pretrain/Step": 2343, "Pretrain/Step Time": 8.551413487643003} +{"Pretrain/Learning Rate": 4.413897854745301e-05, "Pretrain/Loss": 2.1137571334838867, "Pretrain/Loss (Raw)": 1.9688550233840942, "Pretrain/Step": 2344, "Pretrain/Step Time": 8.551930766552687} +{"Pretrain/Learning Rate": 4.413351535226507e-05, "Pretrain/Loss": 2.117192506790161, "Pretrain/Loss (Raw)": 2.358689069747925, "Pretrain/Step": 2345, "Pretrain/Step Time": 8.556038307026029} +{"Pretrain/Learning Rate": 4.4128049950509984e-05, "Pretrain/Loss": 2.1163463592529297, "Pretrain/Loss (Raw)": 2.057377576828003, "Pretrain/Step": 2346, "Pretrain/Step Time": 8.555375277996063} +{"Pretrain/Learning Rate": 4.412258234281804e-05, "Pretrain/Loss": 2.1169564723968506, "Pretrain/Loss (Raw)": 2.1754398345947266, "Pretrain/Step": 2347, "Pretrain/Step Time": 8.552466159686446} +{"Pretrain/Learning Rate": 4.411711252981979e-05, "Pretrain/Loss": 2.1153321266174316, "Pretrain/Loss (Raw)": 1.8990544080734253, "Pretrain/Step": 2348, "Pretrain/Step Time": 8.550327200442553} +{"Pretrain/Learning Rate": 4.411164051214603e-05, "Pretrain/Loss": 2.1159486770629883, "Pretrain/Loss (Raw)": 2.2224998474121094, "Pretrain/Step": 2349, "Pretrain/Step Time": 8.546039216220379} +{"Pretrain/Learning Rate": 4.4106166290427846e-05, "Pretrain/Loss": 2.1157383918762207, "Pretrain/Loss (Raw)": 1.8676005601882935, "Pretrain/Step": 2350, "Pretrain/Step Time": 8.547616021707654} +{"Pretrain/Learning Rate": 4.410068986529653e-05, "Pretrain/Loss": 2.114528179168701, "Pretrain/Loss (Raw)": 2.112257719039917, "Pretrain/Step": 2351, "Pretrain/Step Time": 8.550268925726414} +{"Pretrain/Learning Rate": 4.409521123738365e-05, "Pretrain/Loss": 2.114208698272705, "Pretrain/Loss (Raw)": 2.149299383163452, "Pretrain/Step": 2352, "Pretrain/Step Time": 8.55088852532208} +{"Pretrain/Learning Rate": 4.4089730407321035e-05, "Pretrain/Loss": 2.1131458282470703, "Pretrain/Loss (Raw)": 2.0221290588378906, "Pretrain/Step": 2353, "Pretrain/Step Time": 8.554722405970097} +{"Pretrain/Learning Rate": 4.408424737574075e-05, "Pretrain/Loss": 2.1137890815734863, "Pretrain/Loss (Raw)": 2.1620471477508545, "Pretrain/Step": 2354, "Pretrain/Step Time": 8.5466982498765} +{"Pretrain/Learning Rate": 4.407876214327513e-05, "Pretrain/Loss": 2.114133834838867, "Pretrain/Loss (Raw)": 2.1531598567962646, "Pretrain/Step": 2355, "Pretrain/Step Time": 8.553325701504946} +{"Pretrain/Learning Rate": 4.407327471055677e-05, "Pretrain/Loss": 2.1112804412841797, "Pretrain/Loss (Raw)": 1.7954829931259155, "Pretrain/Step": 2356, "Pretrain/Step Time": 8.549642205238342} +{"Pretrain/Learning Rate": 4.406778507821848e-05, "Pretrain/Loss": 2.1119441986083984, "Pretrain/Loss (Raw)": 2.3136227130889893, "Pretrain/Step": 2357, "Pretrain/Step Time": 8.54865530692041} +{"Pretrain/Learning Rate": 4.4062293246893374e-05, "Pretrain/Loss": 2.1107215881347656, "Pretrain/Loss (Raw)": 1.9549884796142578, "Pretrain/Step": 2358, "Pretrain/Step Time": 8.553007818758488} +{"Pretrain/Learning Rate": 4.4056799217214774e-05, "Pretrain/Loss": 2.1100893020629883, "Pretrain/Loss (Raw)": 2.200244188308716, "Pretrain/Step": 2359, "Pretrain/Step Time": 8.54939972795546} +{"Pretrain/Learning Rate": 4.4051302989816304e-05, "Pretrain/Loss": 2.1095974445343018, "Pretrain/Loss (Raw)": 2.1039061546325684, "Pretrain/Step": 2360, "Pretrain/Step Time": 8.545681333169341} +{"Pretrain/Learning Rate": 4.404580456533179e-05, "Pretrain/Loss": 2.1087944507598877, "Pretrain/Loss (Raw)": 2.159290313720703, "Pretrain/Step": 2361, "Pretrain/Step Time": 8.545635212212801} +{"Pretrain/Learning Rate": 4.404030394439535e-05, "Pretrain/Loss": 2.106541156768799, "Pretrain/Loss (Raw)": 2.0337393283843994, "Pretrain/Step": 2362, "Pretrain/Step Time": 8.54460928030312} +{"Pretrain/Learning Rate": 4.4034801127641336e-05, "Pretrain/Loss": 2.104280948638916, "Pretrain/Loss (Raw)": 2.0695106983184814, "Pretrain/Step": 2363, "Pretrain/Step Time": 8.544045638293028} +{"Pretrain/Learning Rate": 4.4029296115704366e-05, "Pretrain/Loss": 2.103646755218506, "Pretrain/Loss (Raw)": 2.1620965003967285, "Pretrain/Step": 2364, "Pretrain/Step Time": 8.550284752622247} +{"Pretrain/Learning Rate": 4.40237889092193e-05, "Pretrain/Loss": 2.1023752689361572, "Pretrain/Loss (Raw)": 2.3338212966918945, "Pretrain/Step": 2365, "Pretrain/Step Time": 8.537286331877112} +{"Pretrain/Learning Rate": 4.401827950882125e-05, "Pretrain/Loss": 2.101715564727783, "Pretrain/Loss (Raw)": 2.113828659057617, "Pretrain/Step": 2366, "Pretrain/Step Time": 8.537367420271039} +{"Pretrain/Learning Rate": 4.4012767915145594e-05, "Pretrain/Loss": 2.1037256717681885, "Pretrain/Loss (Raw)": 2.258336305618286, "Pretrain/Step": 2367, "Pretrain/Step Time": 8.539810819551349} +{"Pretrain/Learning Rate": 4.400725412882794e-05, "Pretrain/Loss": 2.1040303707122803, "Pretrain/Loss (Raw)": 2.1033623218536377, "Pretrain/Step": 2368, "Pretrain/Step Time": 8.544791337102652} +{"Pretrain/Learning Rate": 4.400173815050418e-05, "Pretrain/Loss": 2.1053009033203125, "Pretrain/Loss (Raw)": 2.1919069290161133, "Pretrain/Step": 2369, "Pretrain/Step Time": 8.543453395366669} +{"Pretrain/Learning Rate": 4.399621998081045e-05, "Pretrain/Loss": 2.1074459552764893, "Pretrain/Loss (Raw)": 2.2448909282684326, "Pretrain/Step": 2370, "Pretrain/Step Time": 8.53967198729515} +{"Pretrain/Learning Rate": 4.39906996203831e-05, "Pretrain/Loss": 2.107025384902954, "Pretrain/Loss (Raw)": 2.2051916122436523, "Pretrain/Step": 2371, "Pretrain/Step Time": 8.541342383250594} +{"Pretrain/Learning Rate": 4.398517706985879e-05, "Pretrain/Loss": 2.1065378189086914, "Pretrain/Loss (Raw)": 2.1861748695373535, "Pretrain/Step": 2372, "Pretrain/Step Time": 8.53782432153821} +{"Pretrain/Learning Rate": 4.39796523298744e-05, "Pretrain/Loss": 2.1084537506103516, "Pretrain/Loss (Raw)": 2.574310064315796, "Pretrain/Step": 2373, "Pretrain/Step Time": 8.541095562279224} +{"Pretrain/Learning Rate": 4.397412540106707e-05, "Pretrain/Loss": 2.110443353652954, "Pretrain/Loss (Raw)": 2.346400737762451, "Pretrain/Step": 2374, "Pretrain/Step Time": 8.538457477465272} +{"Pretrain/Learning Rate": 4.396859628407418e-05, "Pretrain/Loss": 2.110787868499756, "Pretrain/Loss (Raw)": 2.033961772918701, "Pretrain/Step": 2375, "Pretrain/Step Time": 8.535527611151338} +{"Pretrain/Learning Rate": 4.39630649795334e-05, "Pretrain/Loss": 2.1098952293395996, "Pretrain/Loss (Raw)": 2.0299620628356934, "Pretrain/Step": 2376, "Pretrain/Step Time": 8.535401297733188} +{"Pretrain/Learning Rate": 4.3957531488082595e-05, "Pretrain/Loss": 2.1097493171691895, "Pretrain/Loss (Raw)": 2.085855007171631, "Pretrain/Step": 2377, "Pretrain/Step Time": 8.534679995849729} +{"Pretrain/Learning Rate": 4.395199581035994e-05, "Pretrain/Loss": 2.1126933097839355, "Pretrain/Loss (Raw)": 2.337820529937744, "Pretrain/Step": 2378, "Pretrain/Step Time": 8.52853687480092} +{"Pretrain/Learning Rate": 4.3946457947003813e-05, "Pretrain/Loss": 2.1146774291992188, "Pretrain/Loss (Raw)": 2.078502893447876, "Pretrain/Step": 2379, "Pretrain/Step Time": 8.527694130316377} +{"Pretrain/Learning Rate": 4.394091789865288e-05, "Pretrain/Loss": 2.1150355339050293, "Pretrain/Loss (Raw)": 2.0457746982574463, "Pretrain/Step": 2380, "Pretrain/Step Time": 8.524001827463508} +{"Pretrain/Learning Rate": 4.393537566594605e-05, "Pretrain/Loss": 2.114828586578369, "Pretrain/Loss (Raw)": 2.0226457118988037, "Pretrain/Step": 2381, "Pretrain/Step Time": 8.523316740989685} +{"Pretrain/Learning Rate": 4.392983124952246e-05, "Pretrain/Loss": 2.114362955093384, "Pretrain/Loss (Raw)": 2.0795302391052246, "Pretrain/Step": 2382, "Pretrain/Step Time": 8.528551975265145} +{"Pretrain/Learning Rate": 4.392428465002154e-05, "Pretrain/Loss": 2.112206220626831, "Pretrain/Loss (Raw)": 2.2182021141052246, "Pretrain/Step": 2383, "Pretrain/Step Time": 8.527195954695344} +{"Pretrain/Learning Rate": 4.391873586808294e-05, "Pretrain/Loss": 2.1132631301879883, "Pretrain/Loss (Raw)": 2.237722873687744, "Pretrain/Step": 2384, "Pretrain/Step Time": 8.527946712449193} +{"Pretrain/Learning Rate": 4.391318490434656e-05, "Pretrain/Loss": 2.1148619651794434, "Pretrain/Loss (Raw)": 2.158188819885254, "Pretrain/Step": 2385, "Pretrain/Step Time": 8.52448157966137} +{"Pretrain/Learning Rate": 4.3907631759452584e-05, "Pretrain/Loss": 2.1138930320739746, "Pretrain/Loss (Raw)": 2.0349233150482178, "Pretrain/Step": 2386, "Pretrain/Step Time": 8.519831335172057} +{"Pretrain/Learning Rate": 4.3902076434041416e-05, "Pretrain/Loss": 2.118788242340088, "Pretrain/Loss (Raw)": 2.72683048248291, "Pretrain/Step": 2387, "Pretrain/Step Time": 8.521596487611532} +{"Pretrain/Learning Rate": 4.389651892875373e-05, "Pretrain/Loss": 2.1182470321655273, "Pretrain/Loss (Raw)": 2.013091564178467, "Pretrain/Step": 2388, "Pretrain/Step Time": 8.533017221838236} +{"Pretrain/Learning Rate": 4.389095924423043e-05, "Pretrain/Loss": 2.117337226867676, "Pretrain/Loss (Raw)": 1.9557008743286133, "Pretrain/Step": 2389, "Pretrain/Step Time": 8.52137435413897} +{"Pretrain/Learning Rate": 4.388539738111269e-05, "Pretrain/Loss": 2.1193833351135254, "Pretrain/Loss (Raw)": 2.2152798175811768, "Pretrain/Step": 2390, "Pretrain/Step Time": 8.53008016385138} +{"Pretrain/Learning Rate": 4.387983334004194e-05, "Pretrain/Loss": 2.116767406463623, "Pretrain/Loss (Raw)": 1.9316389560699463, "Pretrain/Step": 2391, "Pretrain/Step Time": 8.532397715374827} +{"Pretrain/Learning Rate": 4.387426712165984e-05, "Pretrain/Loss": 2.1167876720428467, "Pretrain/Loss (Raw)": 2.1941778659820557, "Pretrain/Step": 2392, "Pretrain/Step Time": 8.533581897616386} +{"Pretrain/Learning Rate": 4.3868698726608325e-05, "Pretrain/Loss": 2.1160523891448975, "Pretrain/Loss (Raw)": 2.2406392097473145, "Pretrain/Step": 2393, "Pretrain/Step Time": 8.532586801797152} +{"Pretrain/Learning Rate": 4.3863128155529554e-05, "Pretrain/Loss": 2.116424560546875, "Pretrain/Loss (Raw)": 1.9908316135406494, "Pretrain/Step": 2394, "Pretrain/Step Time": 8.54624280706048} +{"Pretrain/Learning Rate": 4.385755540906595e-05, "Pretrain/Loss": 2.1183016300201416, "Pretrain/Loss (Raw)": 2.20928692817688, "Pretrain/Step": 2395, "Pretrain/Step Time": 8.536329401656985} +{"Pretrain/Learning Rate": 4.385198048786021e-05, "Pretrain/Loss": 2.1155877113342285, "Pretrain/Loss (Raw)": 1.8687063455581665, "Pretrain/Step": 2396, "Pretrain/Step Time": 8.537295795977116} +{"Pretrain/Learning Rate": 4.384640339255525e-05, "Pretrain/Loss": 2.117522716522217, "Pretrain/Loss (Raw)": 2.2597577571868896, "Pretrain/Step": 2397, "Pretrain/Step Time": 8.537888545542955} +{"Pretrain/Learning Rate": 4.384082412379423e-05, "Pretrain/Loss": 2.118126630783081, "Pretrain/Loss (Raw)": 2.170694589614868, "Pretrain/Step": 2398, "Pretrain/Step Time": 8.539471400901675} +{"Pretrain/Learning Rate": 4.38352426822206e-05, "Pretrain/Loss": 2.117063045501709, "Pretrain/Loss (Raw)": 1.8658138513565063, "Pretrain/Step": 2399, "Pretrain/Step Time": 8.537048030644655} +{"Pretrain/Learning Rate": 4.3829659068478026e-05, "Pretrain/Loss": 2.1196844577789307, "Pretrain/Loss (Raw)": 2.5193560123443604, "Pretrain/Step": 2400, "Pretrain/Step Time": 8.544994873926044} +{"Pretrain/Learning Rate": 4.3824073283210445e-05, "Pretrain/Loss": 2.118467330932617, "Pretrain/Loss (Raw)": 2.064392566680908, "Pretrain/Step": 2401, "Pretrain/Step Time": 8.537863213568926} +{"Pretrain/Learning Rate": 4.381848532706202e-05, "Pretrain/Loss": 2.1199445724487305, "Pretrain/Loss (Raw)": 2.096855640411377, "Pretrain/Step": 2402, "Pretrain/Step Time": 8.53673173300922} +{"Pretrain/Learning Rate": 4.38128952006772e-05, "Pretrain/Loss": 2.1208038330078125, "Pretrain/Loss (Raw)": 2.132803201675415, "Pretrain/Step": 2403, "Pretrain/Step Time": 8.535461695864797} +{"Pretrain/Learning Rate": 4.380730290470065e-05, "Pretrain/Loss": 2.1190707683563232, "Pretrain/Loss (Raw)": 2.081418514251709, "Pretrain/Step": 2404, "Pretrain/Step Time": 8.540160397067666} +{"Pretrain/Learning Rate": 4.380170843977731e-05, "Pretrain/Loss": 2.117593288421631, "Pretrain/Loss (Raw)": 2.031574249267578, "Pretrain/Step": 2405, "Pretrain/Step Time": 8.540630908682942} +{"Pretrain/Learning Rate": 4.3796111806552364e-05, "Pretrain/Loss": 2.117526054382324, "Pretrain/Loss (Raw)": 2.206566333770752, "Pretrain/Step": 2406, "Pretrain/Step Time": 8.557258738204837} +{"Pretrain/Learning Rate": 4.379051300567123e-05, "Pretrain/Loss": 2.1204605102539062, "Pretrain/Loss (Raw)": 2.46905779838562, "Pretrain/Step": 2407, "Pretrain/Step Time": 8.54235289990902} +{"Pretrain/Learning Rate": 4.378491203777958e-05, "Pretrain/Loss": 2.1195995807647705, "Pretrain/Loss (Raw)": 1.983883261680603, "Pretrain/Step": 2408, "Pretrain/Step Time": 8.542171325534582} +{"Pretrain/Learning Rate": 4.377930890352337e-05, "Pretrain/Loss": 2.118971109390259, "Pretrain/Loss (Raw)": 1.9918663501739502, "Pretrain/Step": 2409, "Pretrain/Step Time": 8.544022388756275} +{"Pretrain/Learning Rate": 4.3773703603548765e-05, "Pretrain/Loss": 2.119899272918701, "Pretrain/Loss (Raw)": 2.027315139770508, "Pretrain/Step": 2410, "Pretrain/Step Time": 8.542992504313588} +{"Pretrain/Learning Rate": 4.3768096138502194e-05, "Pretrain/Loss": 2.121076822280884, "Pretrain/Loss (Raw)": 2.202911853790283, "Pretrain/Step": 2411, "Pretrain/Step Time": 8.54188453219831} +{"Pretrain/Learning Rate": 4.376248650903033e-05, "Pretrain/Loss": 2.123539686203003, "Pretrain/Loss (Raw)": 2.4018073081970215, "Pretrain/Step": 2412, "Pretrain/Step Time": 8.551386918872595} +{"Pretrain/Learning Rate": 4.375687471578011e-05, "Pretrain/Loss": 2.1252782344818115, "Pretrain/Loss (Raw)": 2.340378761291504, "Pretrain/Step": 2413, "Pretrain/Step Time": 8.541056403890252} +{"Pretrain/Learning Rate": 4.375126075939873e-05, "Pretrain/Loss": 2.1272850036621094, "Pretrain/Loss (Raw)": 1.9969946146011353, "Pretrain/Step": 2414, "Pretrain/Step Time": 8.549353990703821} +{"Pretrain/Learning Rate": 4.374564464053359e-05, "Pretrain/Loss": 2.1263890266418457, "Pretrain/Loss (Raw)": 1.984569787979126, "Pretrain/Step": 2415, "Pretrain/Step Time": 8.55114651657641} +{"Pretrain/Learning Rate": 4.374002635983238e-05, "Pretrain/Loss": 2.124044179916382, "Pretrain/Loss (Raw)": 2.1939446926116943, "Pretrain/Step": 2416, "Pretrain/Step Time": 8.546292521059513} +{"Pretrain/Learning Rate": 4.373440591794301e-05, "Pretrain/Loss": 2.124030590057373, "Pretrain/Loss (Raw)": 2.068012237548828, "Pretrain/Step": 2417, "Pretrain/Step Time": 8.545453500002623} +{"Pretrain/Learning Rate": 4.372878331551369e-05, "Pretrain/Loss": 2.126363754272461, "Pretrain/Loss (Raw)": 2.113809585571289, "Pretrain/Step": 2418, "Pretrain/Step Time": 8.550585249438882} +{"Pretrain/Learning Rate": 4.3723158553192813e-05, "Pretrain/Loss": 2.1272153854370117, "Pretrain/Loss (Raw)": 2.174668073654175, "Pretrain/Step": 2419, "Pretrain/Step Time": 8.546924272552133} +{"Pretrain/Learning Rate": 4.3717531631629075e-05, "Pretrain/Loss": 2.127915382385254, "Pretrain/Loss (Raw)": 2.117905616760254, "Pretrain/Step": 2420, "Pretrain/Step Time": 8.543619342148304} +{"Pretrain/Learning Rate": 4.371190255147138e-05, "Pretrain/Loss": 2.1251516342163086, "Pretrain/Loss (Raw)": 1.9481664896011353, "Pretrain/Step": 2421, "Pretrain/Step Time": 8.545769553631544} +{"Pretrain/Learning Rate": 4.370627131336891e-05, "Pretrain/Loss": 2.1219615936279297, "Pretrain/Loss (Raw)": 1.953471302986145, "Pretrain/Step": 2422, "Pretrain/Step Time": 8.548606546595693} +{"Pretrain/Learning Rate": 4.370063791797109e-05, "Pretrain/Loss": 2.120577335357666, "Pretrain/Loss (Raw)": 1.9623799324035645, "Pretrain/Step": 2423, "Pretrain/Step Time": 8.547577248886228} +{"Pretrain/Learning Rate": 4.3695002365927584e-05, "Pretrain/Loss": 2.120602607727051, "Pretrain/Loss (Raw)": 2.049076557159424, "Pretrain/Step": 2424, "Pretrain/Step Time": 8.550523079931736} +{"Pretrain/Learning Rate": 4.368936465788831e-05, "Pretrain/Loss": 2.1202754974365234, "Pretrain/Loss (Raw)": 2.028146743774414, "Pretrain/Step": 2425, "Pretrain/Step Time": 8.548016119748354} +{"Pretrain/Learning Rate": 4.3683724794503436e-05, "Pretrain/Loss": 2.120493173599243, "Pretrain/Loss (Raw)": 2.1250364780426025, "Pretrain/Step": 2426, "Pretrain/Step Time": 8.553901696577668} +{"Pretrain/Learning Rate": 4.367808277642338e-05, "Pretrain/Loss": 2.1210289001464844, "Pretrain/Loss (Raw)": 2.1190738677978516, "Pretrain/Step": 2427, "Pretrain/Step Time": 8.549200508743525} +{"Pretrain/Learning Rate": 4.3672438604298806e-05, "Pretrain/Loss": 2.1228933334350586, "Pretrain/Loss (Raw)": 2.4335622787475586, "Pretrain/Step": 2428, "Pretrain/Step Time": 8.543892255052924} +{"Pretrain/Learning Rate": 4.3666792278780625e-05, "Pretrain/Loss": 2.122112274169922, "Pretrain/Loss (Raw)": 2.041729688644409, "Pretrain/Step": 2429, "Pretrain/Step Time": 8.549644598737359} +{"Pretrain/Learning Rate": 4.366114380051999e-05, "Pretrain/Loss": 2.124342203140259, "Pretrain/Loss (Raw)": 2.185826301574707, "Pretrain/Step": 2430, "Pretrain/Step Time": 8.554990602657199} +{"Pretrain/Learning Rate": 4.365549317016832e-05, "Pretrain/Loss": 2.122957706451416, "Pretrain/Loss (Raw)": 2.226694107055664, "Pretrain/Step": 2431, "Pretrain/Step Time": 8.547342235222459} +{"Pretrain/Learning Rate": 4.364984038837727e-05, "Pretrain/Loss": 2.123138189315796, "Pretrain/Loss (Raw)": 2.049140691757202, "Pretrain/Step": 2432, "Pretrain/Step Time": 8.550565399229527} +{"Pretrain/Learning Rate": 4.364418545579875e-05, "Pretrain/Loss": 2.122490882873535, "Pretrain/Loss (Raw)": 2.2348055839538574, "Pretrain/Step": 2433, "Pretrain/Step Time": 8.553109221160412} +{"Pretrain/Learning Rate": 4.363852837308491e-05, "Pretrain/Loss": 2.1220645904541016, "Pretrain/Loss (Raw)": 2.095890760421753, "Pretrain/Step": 2434, "Pretrain/Step Time": 8.554394269362092} +{"Pretrain/Learning Rate": 4.3632869140888144e-05, "Pretrain/Loss": 2.1248581409454346, "Pretrain/Loss (Raw)": 2.1639833450317383, "Pretrain/Step": 2435, "Pretrain/Step Time": 8.551719045266509} +{"Pretrain/Learning Rate": 4.362720775986111e-05, "Pretrain/Loss": 2.1240439414978027, "Pretrain/Loss (Raw)": 2.0573203563690186, "Pretrain/Step": 2436, "Pretrain/Step Time": 8.556579219177365} +{"Pretrain/Learning Rate": 4.362154423065671e-05, "Pretrain/Loss": 2.1262130737304688, "Pretrain/Loss (Raw)": 2.2129688262939453, "Pretrain/Step": 2437, "Pretrain/Step Time": 8.555659545585513} +{"Pretrain/Learning Rate": 4.361587855392807e-05, "Pretrain/Loss": 2.1273300647735596, "Pretrain/Loss (Raw)": 2.102487087249756, "Pretrain/Step": 2438, "Pretrain/Step Time": 8.548158952966332} +{"Pretrain/Learning Rate": 4.3610210730328604e-05, "Pretrain/Loss": 2.128142833709717, "Pretrain/Loss (Raw)": 1.9626903533935547, "Pretrain/Step": 2439, "Pretrain/Step Time": 8.549125026911497} +{"Pretrain/Learning Rate": 4.3604540760511935e-05, "Pretrain/Loss": 2.132906436920166, "Pretrain/Loss (Raw)": 2.6769604682922363, "Pretrain/Step": 2440, "Pretrain/Step Time": 8.552068317309022} +{"Pretrain/Learning Rate": 4.3598868645131964e-05, "Pretrain/Loss": 2.1351258754730225, "Pretrain/Loss (Raw)": 2.1259074211120605, "Pretrain/Step": 2441, "Pretrain/Step Time": 8.546090368181467} +{"Pretrain/Learning Rate": 4.359319438484282e-05, "Pretrain/Loss": 2.135572910308838, "Pretrain/Loss (Raw)": 2.118469476699829, "Pretrain/Step": 2442, "Pretrain/Step Time": 8.54999496974051} +{"Pretrain/Learning Rate": 4.358751798029887e-05, "Pretrain/Loss": 2.136563777923584, "Pretrain/Loss (Raw)": 2.164301872253418, "Pretrain/Step": 2443, "Pretrain/Step Time": 8.550851374864578} +{"Pretrain/Learning Rate": 4.358183943215478e-05, "Pretrain/Loss": 2.1380319595336914, "Pretrain/Loss (Raw)": 2.288602113723755, "Pretrain/Step": 2444, "Pretrain/Step Time": 8.549938945099711} +{"Pretrain/Learning Rate": 4.3576158741065395e-05, "Pretrain/Loss": 2.1361474990844727, "Pretrain/Loss (Raw)": 1.9045279026031494, "Pretrain/Step": 2445, "Pretrain/Step Time": 8.549385361373425} +{"Pretrain/Learning Rate": 4.357047590768586e-05, "Pretrain/Loss": 2.135573387145996, "Pretrain/Loss (Raw)": 2.139561414718628, "Pretrain/Step": 2446, "Pretrain/Step Time": 8.548231817781925} +{"Pretrain/Learning Rate": 4.356479093267153e-05, "Pretrain/Loss": 2.136888265609741, "Pretrain/Loss (Raw)": 2.292058229446411, "Pretrain/Step": 2447, "Pretrain/Step Time": 8.544183338060975} +{"Pretrain/Learning Rate": 4.355910381667803e-05, "Pretrain/Loss": 2.138923168182373, "Pretrain/Loss (Raw)": 2.13008451461792, "Pretrain/Step": 2448, "Pretrain/Step Time": 8.545346884056926} +{"Pretrain/Learning Rate": 4.355341456036122e-05, "Pretrain/Loss": 2.1391425132751465, "Pretrain/Loss (Raw)": 2.1071205139160156, "Pretrain/Step": 2449, "Pretrain/Step Time": 8.544876834377646} +{"Pretrain/Learning Rate": 4.354772316437722e-05, "Pretrain/Loss": 2.140268087387085, "Pretrain/Loss (Raw)": 2.2854437828063965, "Pretrain/Step": 2450, "Pretrain/Step Time": 8.541390266269445} +{"Pretrain/Learning Rate": 4.354202962938239e-05, "Pretrain/Loss": 2.140441417694092, "Pretrain/Loss (Raw)": 2.1403439044952393, "Pretrain/Step": 2451, "Pretrain/Step Time": 8.54081279039383} +{"Pretrain/Learning Rate": 4.353633395603332e-05, "Pretrain/Loss": 2.1407108306884766, "Pretrain/Loss (Raw)": 2.0934648513793945, "Pretrain/Step": 2452, "Pretrain/Step Time": 8.541334947571158} +{"Pretrain/Learning Rate": 4.353063614498688e-05, "Pretrain/Loss": 2.138202667236328, "Pretrain/Loss (Raw)": 2.1171374320983887, "Pretrain/Step": 2453, "Pretrain/Step Time": 8.545249078422785} +{"Pretrain/Learning Rate": 4.352493619690016e-05, "Pretrain/Loss": 2.1390504837036133, "Pretrain/Loss (Raw)": 2.254413604736328, "Pretrain/Step": 2454, "Pretrain/Step Time": 8.544869476929307} +{"Pretrain/Learning Rate": 4.351923411243049e-05, "Pretrain/Loss": 2.1386866569519043, "Pretrain/Loss (Raw)": 1.9018433094024658, "Pretrain/Step": 2455, "Pretrain/Step Time": 8.54880952462554} +{"Pretrain/Learning Rate": 4.35135298922355e-05, "Pretrain/Loss": 2.138880491256714, "Pretrain/Loss (Raw)": 2.1780991554260254, "Pretrain/Step": 2456, "Pretrain/Step Time": 8.542467365041375} +{"Pretrain/Learning Rate": 4.350782353697299e-05, "Pretrain/Loss": 2.140486478805542, "Pretrain/Loss (Raw)": 2.120974540710449, "Pretrain/Step": 2457, "Pretrain/Step Time": 8.540139416232705} +{"Pretrain/Learning Rate": 4.350211504730106e-05, "Pretrain/Loss": 2.1375670433044434, "Pretrain/Loss (Raw)": 1.8733880519866943, "Pretrain/Step": 2458, "Pretrain/Step Time": 8.543273879215121} +{"Pretrain/Learning Rate": 4.3496404423878045e-05, "Pretrain/Loss": 2.136465311050415, "Pretrain/Loss (Raw)": 2.013942003250122, "Pretrain/Step": 2459, "Pretrain/Step Time": 8.543669320642948} +{"Pretrain/Learning Rate": 4.349069166736251e-05, "Pretrain/Loss": 2.136364459991455, "Pretrain/Loss (Raw)": 2.3772404193878174, "Pretrain/Step": 2460, "Pretrain/Step Time": 8.545551061630249} +{"Pretrain/Learning Rate": 4.348497677841328e-05, "Pretrain/Loss": 2.1367015838623047, "Pretrain/Loss (Raw)": 2.0873849391937256, "Pretrain/Step": 2461, "Pretrain/Step Time": 8.544889472424984} +{"Pretrain/Learning Rate": 4.3479259757689427e-05, "Pretrain/Loss": 2.1360256671905518, "Pretrain/Loss (Raw)": 1.9711354970932007, "Pretrain/Step": 2462, "Pretrain/Step Time": 8.533275408670306} +{"Pretrain/Learning Rate": 4.347354060585026e-05, "Pretrain/Loss": 2.137007236480713, "Pretrain/Loss (Raw)": 2.113635540008545, "Pretrain/Step": 2463, "Pretrain/Step Time": 8.532494273036718} +{"Pretrain/Learning Rate": 4.346781932355533e-05, "Pretrain/Loss": 2.1362667083740234, "Pretrain/Loss (Raw)": 2.115798234939575, "Pretrain/Step": 2464, "Pretrain/Step Time": 8.534928560256958} +{"Pretrain/Learning Rate": 4.3462095911464465e-05, "Pretrain/Loss": 2.134183883666992, "Pretrain/Loss (Raw)": 2.075336217880249, "Pretrain/Step": 2465, "Pretrain/Step Time": 8.53333481401205} +{"Pretrain/Learning Rate": 4.34563703702377e-05, "Pretrain/Loss": 2.1351304054260254, "Pretrain/Loss (Raw)": 2.196500539779663, "Pretrain/Step": 2466, "Pretrain/Step Time": 8.542495282366872} +{"Pretrain/Learning Rate": 4.3450642700535335e-05, "Pretrain/Loss": 2.1356210708618164, "Pretrain/Loss (Raw)": 2.0561890602111816, "Pretrain/Step": 2467, "Pretrain/Step Time": 8.537848206236959} +{"Pretrain/Learning Rate": 4.344491290301791e-05, "Pretrain/Loss": 2.1340231895446777, "Pretrain/Loss (Raw)": 1.9044320583343506, "Pretrain/Step": 2468, "Pretrain/Step Time": 8.537359880283475} +{"Pretrain/Learning Rate": 4.3439180978346216e-05, "Pretrain/Loss": 2.133098602294922, "Pretrain/Loss (Raw)": 2.133547782897949, "Pretrain/Step": 2469, "Pretrain/Step Time": 8.5332095567137} +{"Pretrain/Learning Rate": 4.3433446927181274e-05, "Pretrain/Loss": 2.1327738761901855, "Pretrain/Loss (Raw)": 2.144315719604492, "Pretrain/Step": 2470, "Pretrain/Step Time": 8.529541881754994} +{"Pretrain/Learning Rate": 4.342771075018438e-05, "Pretrain/Loss": 2.134321928024292, "Pretrain/Loss (Raw)": 2.433457612991333, "Pretrain/Step": 2471, "Pretrain/Step Time": 8.53214524872601} +{"Pretrain/Learning Rate": 4.342197244801705e-05, "Pretrain/Loss": 2.136293411254883, "Pretrain/Loss (Raw)": 2.2211930751800537, "Pretrain/Step": 2472, "Pretrain/Step Time": 8.542880814522505} +{"Pretrain/Learning Rate": 4.341623202134105e-05, "Pretrain/Loss": 2.1345176696777344, "Pretrain/Loss (Raw)": 2.131401538848877, "Pretrain/Step": 2473, "Pretrain/Step Time": 8.540683902800083} +{"Pretrain/Learning Rate": 4.341048947081839e-05, "Pretrain/Loss": 2.134368896484375, "Pretrain/Loss (Raw)": 2.0383331775665283, "Pretrain/Step": 2474, "Pretrain/Step Time": 8.531597573310137} +{"Pretrain/Learning Rate": 4.340474479711133e-05, "Pretrain/Loss": 2.132997989654541, "Pretrain/Loss (Raw)": 1.9999579191207886, "Pretrain/Step": 2475, "Pretrain/Step Time": 8.534958155825734} +{"Pretrain/Learning Rate": 4.3398998000882375e-05, "Pretrain/Loss": 2.1338982582092285, "Pretrain/Loss (Raw)": 2.014310836791992, "Pretrain/Step": 2476, "Pretrain/Step Time": 8.539135007187724} +{"Pretrain/Learning Rate": 4.339324908279427e-05, "Pretrain/Loss": 2.1336617469787598, "Pretrain/Loss (Raw)": 2.192228078842163, "Pretrain/Step": 2477, "Pretrain/Step Time": 8.544189620763063} +{"Pretrain/Learning Rate": 4.338749804351001e-05, "Pretrain/Loss": 2.135565996170044, "Pretrain/Loss (Raw)": 2.1113061904907227, "Pretrain/Step": 2478, "Pretrain/Step Time": 8.542052475735545} +{"Pretrain/Learning Rate": 4.338174488369283e-05, "Pretrain/Loss": 2.1349129676818848, "Pretrain/Loss (Raw)": 2.0286715030670166, "Pretrain/Step": 2479, "Pretrain/Step Time": 8.541125077754259} +{"Pretrain/Learning Rate": 4.337598960400622e-05, "Pretrain/Loss": 2.1348893642425537, "Pretrain/Loss (Raw)": 2.146287441253662, "Pretrain/Step": 2480, "Pretrain/Step Time": 8.541371896862984} +{"Pretrain/Learning Rate": 4.337023220511389e-05, "Pretrain/Loss": 2.1344292163848877, "Pretrain/Loss (Raw)": 1.9632208347320557, "Pretrain/Step": 2481, "Pretrain/Step Time": 8.538968831300735} +{"Pretrain/Learning Rate": 4.336447268767982e-05, "Pretrain/Loss": 2.1344385147094727, "Pretrain/Loss (Raw)": 2.1632416248321533, "Pretrain/Step": 2482, "Pretrain/Step Time": 8.540360992774367} +{"Pretrain/Learning Rate": 4.3358711052368224e-05, "Pretrain/Loss": 2.134324789047241, "Pretrain/Loss (Raw)": 2.1386334896087646, "Pretrain/Step": 2483, "Pretrain/Step Time": 8.537285195663571} +{"Pretrain/Learning Rate": 4.335294729984356e-05, "Pretrain/Loss": 2.1353724002838135, "Pretrain/Loss (Raw)": 1.9295599460601807, "Pretrain/Step": 2484, "Pretrain/Step Time": 8.537295879796147} +{"Pretrain/Learning Rate": 4.334718143077054e-05, "Pretrain/Loss": 2.1328983306884766, "Pretrain/Loss (Raw)": 1.9969362020492554, "Pretrain/Step": 2485, "Pretrain/Step Time": 8.539081234484911} +{"Pretrain/Learning Rate": 4.334141344581408e-05, "Pretrain/Loss": 2.1335902214050293, "Pretrain/Loss (Raw)": 2.0435612201690674, "Pretrain/Step": 2486, "Pretrain/Step Time": 8.53935844823718} +{"Pretrain/Learning Rate": 4.3335643345639414e-05, "Pretrain/Loss": 2.1337218284606934, "Pretrain/Loss (Raw)": 2.217106819152832, "Pretrain/Step": 2487, "Pretrain/Step Time": 8.535062529146671} +{"Pretrain/Learning Rate": 4.332987113091195e-05, "Pretrain/Loss": 2.1337392330169678, "Pretrain/Loss (Raw)": 2.1061205863952637, "Pretrain/Step": 2488, "Pretrain/Step Time": 8.537807589396834} +{"Pretrain/Learning Rate": 4.332409680229737e-05, "Pretrain/Loss": 2.1324000358581543, "Pretrain/Loss (Raw)": 1.9878644943237305, "Pretrain/Step": 2489, "Pretrain/Step Time": 8.538612673059106} +{"Pretrain/Learning Rate": 4.3318320360461616e-05, "Pretrain/Loss": 2.1318254470825195, "Pretrain/Loss (Raw)": 1.9601936340332031, "Pretrain/Step": 2490, "Pretrain/Step Time": 8.534967299550772} +{"Pretrain/Learning Rate": 4.331254180607083e-05, "Pretrain/Loss": 2.1331746578216553, "Pretrain/Loss (Raw)": 2.2422168254852295, "Pretrain/Step": 2491, "Pretrain/Step Time": 8.544408341869712} +{"Pretrain/Learning Rate": 4.330676113979143e-05, "Pretrain/Loss": 2.1343183517456055, "Pretrain/Loss (Raw)": 2.3084840774536133, "Pretrain/Step": 2492, "Pretrain/Step Time": 8.54040308482945} +{"Pretrain/Learning Rate": 4.330097836229007e-05, "Pretrain/Loss": 2.132295608520508, "Pretrain/Loss (Raw)": 2.074908971786499, "Pretrain/Step": 2493, "Pretrain/Step Time": 8.540685128420591} +{"Pretrain/Learning Rate": 4.3295193474233655e-05, "Pretrain/Loss": 2.131701707839966, "Pretrain/Loss (Raw)": 2.037802219390869, "Pretrain/Step": 2494, "Pretrain/Step Time": 8.543745124712586} +{"Pretrain/Learning Rate": 4.328940647628931e-05, "Pretrain/Loss": 2.130526542663574, "Pretrain/Loss (Raw)": 2.1078929901123047, "Pretrain/Step": 2495, "Pretrain/Step Time": 8.539157198742032} +{"Pretrain/Learning Rate": 4.328361736912443e-05, "Pretrain/Loss": 2.1310434341430664, "Pretrain/Loss (Raw)": 2.169550657272339, "Pretrain/Step": 2496, "Pretrain/Step Time": 8.53542996570468} +{"Pretrain/Learning Rate": 4.3277826153406644e-05, "Pretrain/Loss": 2.12868070602417, "Pretrain/Loss (Raw)": 1.8894798755645752, "Pretrain/Step": 2497, "Pretrain/Step Time": 8.543118523433805} +{"Pretrain/Learning Rate": 4.327203282980382e-05, "Pretrain/Loss": 2.1258156299591064, "Pretrain/Loss (Raw)": 1.8781636953353882, "Pretrain/Step": 2498, "Pretrain/Step Time": 8.545362569391727} +{"Pretrain/Learning Rate": 4.326623739898406e-05, "Pretrain/Loss": 2.125253677368164, "Pretrain/Loss (Raw)": 2.1332693099975586, "Pretrain/Step": 2499, "Pretrain/Step Time": 8.546018708497286} +{"Pretrain/Learning Rate": 4.3260439861615734e-05, "Pretrain/Loss": 2.1226277351379395, "Pretrain/Loss (Raw)": 1.8500585556030273, "Pretrain/Step": 2500, "Pretrain/Step Time": 8.545567845925689} +{"Pretrain/Learning Rate": 4.325464021836744e-05, "Pretrain/Loss": 2.1183643341064453, "Pretrain/Loss (Raw)": 2.0286006927490234, "Pretrain/Step": 2501, "Pretrain/Step Time": 8.541662838310003} +{"Pretrain/Learning Rate": 4.3248838469908016e-05, "Pretrain/Loss": 2.116779088973999, "Pretrain/Loss (Raw)": 2.143465042114258, "Pretrain/Step": 2502, "Pretrain/Step Time": 8.546593518927693} +{"Pretrain/Learning Rate": 4.324303461690655e-05, "Pretrain/Loss": 2.1166882514953613, "Pretrain/Loss (Raw)": 2.0223536491394043, "Pretrain/Step": 2503, "Pretrain/Step Time": 8.558089077472687} +{"Pretrain/Learning Rate": 4.3237228660032355e-05, "Pretrain/Loss": 2.11796498298645, "Pretrain/Loss (Raw)": 2.193368434906006, "Pretrain/Step": 2504, "Pretrain/Step Time": 8.559405336156487} +{"Pretrain/Learning Rate": 4.323142059995503e-05, "Pretrain/Loss": 2.1195311546325684, "Pretrain/Loss (Raw)": 2.2863223552703857, "Pretrain/Step": 2505, "Pretrain/Step Time": 8.558328220620751} +{"Pretrain/Learning Rate": 4.3225610437344363e-05, "Pretrain/Loss": 2.11860990524292, "Pretrain/Loss (Raw)": 2.219897747039795, "Pretrain/Step": 2506, "Pretrain/Step Time": 8.557561043649912} +{"Pretrain/Learning Rate": 4.321979817287043e-05, "Pretrain/Loss": 2.1211905479431152, "Pretrain/Loss (Raw)": 2.4088194370269775, "Pretrain/Step": 2507, "Pretrain/Step Time": 8.5621595736593} +{"Pretrain/Learning Rate": 4.32139838072035e-05, "Pretrain/Loss": 2.1222405433654785, "Pretrain/Loss (Raw)": 2.180187702178955, "Pretrain/Step": 2508, "Pretrain/Step Time": 8.56191104836762} +{"Pretrain/Learning Rate": 4.320816734101415e-05, "Pretrain/Loss": 2.1208345890045166, "Pretrain/Loss (Raw)": 1.8426822423934937, "Pretrain/Step": 2509, "Pretrain/Step Time": 8.573998101055622} +{"Pretrain/Learning Rate": 4.320234877497313e-05, "Pretrain/Loss": 2.1213300228118896, "Pretrain/Loss (Raw)": 2.1429455280303955, "Pretrain/Step": 2510, "Pretrain/Step Time": 8.565806617960334} +{"Pretrain/Learning Rate": 4.319652810975148e-05, "Pretrain/Loss": 2.1191678047180176, "Pretrain/Loss (Raw)": 1.9414528608322144, "Pretrain/Step": 2511, "Pretrain/Step Time": 8.568090939894319} +{"Pretrain/Learning Rate": 4.319070534602047e-05, "Pretrain/Loss": 2.1177313327789307, "Pretrain/Loss (Raw)": 2.053831100463867, "Pretrain/Step": 2512, "Pretrain/Step Time": 8.561932068318129} +{"Pretrain/Learning Rate": 4.318488048445158e-05, "Pretrain/Loss": 2.115873098373413, "Pretrain/Loss (Raw)": 1.9203475713729858, "Pretrain/Step": 2513, "Pretrain/Step Time": 8.566291581839323} +{"Pretrain/Learning Rate": 4.317905352571661e-05, "Pretrain/Loss": 2.1161441802978516, "Pretrain/Loss (Raw)": 2.069636821746826, "Pretrain/Step": 2514, "Pretrain/Step Time": 8.565958302468061} +{"Pretrain/Learning Rate": 4.317322447048751e-05, "Pretrain/Loss": 2.110438585281372, "Pretrain/Loss (Raw)": 1.9965057373046875, "Pretrain/Step": 2515, "Pretrain/Step Time": 8.570229429751635} +{"Pretrain/Learning Rate": 4.316739331943653e-05, "Pretrain/Loss": 2.1130523681640625, "Pretrain/Loss (Raw)": 2.347651720046997, "Pretrain/Step": 2516, "Pretrain/Step Time": 8.557202642783523} +{"Pretrain/Learning Rate": 4.316156007323614e-05, "Pretrain/Loss": 2.1143128871917725, "Pretrain/Loss (Raw)": 2.117037534713745, "Pretrain/Step": 2517, "Pretrain/Step Time": 8.563957717269659} +{"Pretrain/Learning Rate": 4.315572473255908e-05, "Pretrain/Loss": 2.1130664348602295, "Pretrain/Loss (Raw)": 2.0557289123535156, "Pretrain/Step": 2518, "Pretrain/Step Time": 8.556189497932792} +{"Pretrain/Learning Rate": 4.3149887298078276e-05, "Pretrain/Loss": 2.11430025100708, "Pretrain/Loss (Raw)": 2.0895910263061523, "Pretrain/Step": 2519, "Pretrain/Step Time": 8.551006326451898} +{"Pretrain/Learning Rate": 4.314404777046694e-05, "Pretrain/Loss": 2.113450050354004, "Pretrain/Loss (Raw)": 2.0853428840637207, "Pretrain/Step": 2520, "Pretrain/Step Time": 8.558998201042414} +{"Pretrain/Learning Rate": 4.313820615039853e-05, "Pretrain/Loss": 2.1126904487609863, "Pretrain/Loss (Raw)": 2.1433889865875244, "Pretrain/Step": 2521, "Pretrain/Step Time": 8.555725492537022} +{"Pretrain/Learning Rate": 4.313236243854671e-05, "Pretrain/Loss": 2.112034797668457, "Pretrain/Loss (Raw)": 1.9069085121154785, "Pretrain/Step": 2522, "Pretrain/Step Time": 8.54805682040751} +{"Pretrain/Learning Rate": 4.3126516635585414e-05, "Pretrain/Loss": 2.1127305030822754, "Pretrain/Loss (Raw)": 2.298348903656006, "Pretrain/Step": 2523, "Pretrain/Step Time": 8.551563953980803} +{"Pretrain/Learning Rate": 4.312066874218881e-05, "Pretrain/Loss": 2.115760326385498, "Pretrain/Loss (Raw)": 2.256517171859741, "Pretrain/Step": 2524, "Pretrain/Step Time": 8.548694096505642} +{"Pretrain/Learning Rate": 4.3114818759031284e-05, "Pretrain/Loss": 2.1154422760009766, "Pretrain/Loss (Raw)": 2.219059467315674, "Pretrain/Step": 2525, "Pretrain/Step Time": 8.55280421115458} +{"Pretrain/Learning Rate": 4.310896668678751e-05, "Pretrain/Loss": 2.1142611503601074, "Pretrain/Loss (Raw)": 2.0195114612579346, "Pretrain/Step": 2526, "Pretrain/Step Time": 8.551809556782246} +{"Pretrain/Learning Rate": 4.3103112526132364e-05, "Pretrain/Loss": 2.118838310241699, "Pretrain/Loss (Raw)": 2.45170259475708, "Pretrain/Step": 2527, "Pretrain/Step Time": 8.556153832003474} +{"Pretrain/Learning Rate": 4.3097256277740976e-05, "Pretrain/Loss": 2.1164300441741943, "Pretrain/Loss (Raw)": 2.2110843658447266, "Pretrain/Step": 2528, "Pretrain/Step Time": 8.550783444195986} +{"Pretrain/Learning Rate": 4.309139794228871e-05, "Pretrain/Loss": 2.118006706237793, "Pretrain/Loss (Raw)": 2.2662103176116943, "Pretrain/Step": 2529, "Pretrain/Step Time": 8.551038011908531} +{"Pretrain/Learning Rate": 4.3085537520451196e-05, "Pretrain/Loss": 2.119091510772705, "Pretrain/Loss (Raw)": 2.235720157623291, "Pretrain/Step": 2530, "Pretrain/Step Time": 8.546758715063334} +{"Pretrain/Learning Rate": 4.307967501290427e-05, "Pretrain/Loss": 2.119701385498047, "Pretrain/Loss (Raw)": 2.2108609676361084, "Pretrain/Step": 2531, "Pretrain/Step Time": 8.551107423380017} +{"Pretrain/Learning Rate": 4.307381042032402e-05, "Pretrain/Loss": 2.119462251663208, "Pretrain/Loss (Raw)": 2.0508017539978027, "Pretrain/Step": 2532, "Pretrain/Step Time": 8.547880860045552} +{"Pretrain/Learning Rate": 4.3067943743386796e-05, "Pretrain/Loss": 2.121145248413086, "Pretrain/Loss (Raw)": 2.246969699859619, "Pretrain/Step": 2533, "Pretrain/Step Time": 8.552071563899517} +{"Pretrain/Learning Rate": 4.3062074982769155e-05, "Pretrain/Loss": 2.125293731689453, "Pretrain/Loss (Raw)": 2.737576961517334, "Pretrain/Step": 2534, "Pretrain/Step Time": 8.5422976706177} +{"Pretrain/Learning Rate": 4.305620413914792e-05, "Pretrain/Loss": 2.122396945953369, "Pretrain/Loss (Raw)": 2.0983150005340576, "Pretrain/Step": 2535, "Pretrain/Step Time": 8.539687333628535} +{"Pretrain/Learning Rate": 4.305033121320013e-05, "Pretrain/Loss": 2.1226038932800293, "Pretrain/Loss (Raw)": 2.0103349685668945, "Pretrain/Step": 2536, "Pretrain/Step Time": 8.541434908285737} +{"Pretrain/Learning Rate": 4.30444562056031e-05, "Pretrain/Loss": 2.125039577484131, "Pretrain/Loss (Raw)": 2.303673505783081, "Pretrain/Step": 2537, "Pretrain/Step Time": 8.540066976100206} +{"Pretrain/Learning Rate": 4.3038579117034347e-05, "Pretrain/Loss": 2.125586986541748, "Pretrain/Loss (Raw)": 2.097346305847168, "Pretrain/Step": 2538, "Pretrain/Step Time": 8.53922776132822} +{"Pretrain/Learning Rate": 4.303269994817165e-05, "Pretrain/Loss": 2.123728036880493, "Pretrain/Loss (Raw)": 1.9649780988693237, "Pretrain/Step": 2539, "Pretrain/Step Time": 8.547304222360253} +{"Pretrain/Learning Rate": 4.302681869969302e-05, "Pretrain/Loss": 2.119863986968994, "Pretrain/Loss (Raw)": 1.9072022438049316, "Pretrain/Step": 2540, "Pretrain/Step Time": 8.53666832856834} +{"Pretrain/Learning Rate": 4.3020935372276716e-05, "Pretrain/Loss": 2.119386911392212, "Pretrain/Loss (Raw)": 2.2793145179748535, "Pretrain/Step": 2541, "Pretrain/Step Time": 8.542050616815686} +{"Pretrain/Learning Rate": 4.3015049966601224e-05, "Pretrain/Loss": 2.119352340698242, "Pretrain/Loss (Raw)": 1.9925658702850342, "Pretrain/Step": 2542, "Pretrain/Step Time": 8.534172939136624} +{"Pretrain/Learning Rate": 4.3009162483345275e-05, "Pretrain/Loss": 2.121774673461914, "Pretrain/Loss (Raw)": 2.2946360111236572, "Pretrain/Step": 2543, "Pretrain/Step Time": 8.532453274354339} +{"Pretrain/Learning Rate": 4.300327292318786e-05, "Pretrain/Loss": 2.1228575706481934, "Pretrain/Loss (Raw)": 2.3325867652893066, "Pretrain/Step": 2544, "Pretrain/Step Time": 8.53659744746983} +{"Pretrain/Learning Rate": 4.299738128680817e-05, "Pretrain/Loss": 2.1249961853027344, "Pretrain/Loss (Raw)": 2.3417162895202637, "Pretrain/Step": 2545, "Pretrain/Step Time": 8.543942838907242} +{"Pretrain/Learning Rate": 4.299148757488567e-05, "Pretrain/Loss": 2.125138759613037, "Pretrain/Loss (Raw)": 2.1320595741271973, "Pretrain/Step": 2546, "Pretrain/Step Time": 8.539909226819873} +{"Pretrain/Learning Rate": 4.298559178810003e-05, "Pretrain/Loss": 2.12331223487854, "Pretrain/Loss (Raw)": 1.9408875703811646, "Pretrain/Step": 2547, "Pretrain/Step Time": 8.538335995748639} +{"Pretrain/Learning Rate": 4.297969392713121e-05, "Pretrain/Loss": 2.123347282409668, "Pretrain/Loss (Raw)": 2.1224029064178467, "Pretrain/Step": 2548, "Pretrain/Step Time": 8.540989197790623} +{"Pretrain/Learning Rate": 4.297379399265935e-05, "Pretrain/Loss": 2.1239004135131836, "Pretrain/Loss (Raw)": 2.018925905227661, "Pretrain/Step": 2549, "Pretrain/Step Time": 8.53850574977696} +{"Pretrain/Learning Rate": 4.296789198536488e-05, "Pretrain/Loss": 2.1268198490142822, "Pretrain/Loss (Raw)": 2.3271901607513428, "Pretrain/Step": 2550, "Pretrain/Step Time": 8.536134919151664} +{"Pretrain/Learning Rate": 4.296198790592843e-05, "Pretrain/Loss": 2.129197120666504, "Pretrain/Loss (Raw)": 2.266691207885742, "Pretrain/Step": 2551, "Pretrain/Step Time": 8.544819293543696} +{"Pretrain/Learning Rate": 4.295608175503091e-05, "Pretrain/Loss": 2.128831624984741, "Pretrain/Loss (Raw)": 2.002269744873047, "Pretrain/Step": 2552, "Pretrain/Step Time": 8.540270602330565} +{"Pretrain/Learning Rate": 4.295017353335342e-05, "Pretrain/Loss": 2.1286303997039795, "Pretrain/Loss (Raw)": 2.002389430999756, "Pretrain/Step": 2553, "Pretrain/Step Time": 8.539592185989022} +{"Pretrain/Learning Rate": 4.2944263241577334e-05, "Pretrain/Loss": 2.128326654434204, "Pretrain/Loss (Raw)": 2.086151361465454, "Pretrain/Step": 2554, "Pretrain/Step Time": 8.537334479391575} +{"Pretrain/Learning Rate": 4.293835088038425e-05, "Pretrain/Loss": 2.1289002895355225, "Pretrain/Loss (Raw)": 2.192519426345825, "Pretrain/Step": 2555, "Pretrain/Step Time": 8.537038961425424} +{"Pretrain/Learning Rate": 4.2932436450456025e-05, "Pretrain/Loss": 2.1251931190490723, "Pretrain/Loss (Raw)": 1.9590380191802979, "Pretrain/Step": 2556, "Pretrain/Step Time": 8.538549093529582} +{"Pretrain/Learning Rate": 4.292651995247472e-05, "Pretrain/Loss": 2.1265387535095215, "Pretrain/Loss (Raw)": 2.213956832885742, "Pretrain/Step": 2557, "Pretrain/Step Time": 8.543683098629117} +{"Pretrain/Learning Rate": 4.292060138712266e-05, "Pretrain/Loss": 2.1259427070617676, "Pretrain/Loss (Raw)": 2.109537363052368, "Pretrain/Step": 2558, "Pretrain/Step Time": 8.539510685950518} +{"Pretrain/Learning Rate": 4.2914680755082414e-05, "Pretrain/Loss": 2.1241183280944824, "Pretrain/Loss (Raw)": 1.993172526359558, "Pretrain/Step": 2559, "Pretrain/Step Time": 8.54062601365149} +{"Pretrain/Learning Rate": 4.2908758057036756e-05, "Pretrain/Loss": 2.1255478858947754, "Pretrain/Loss (Raw)": 2.232131004333496, "Pretrain/Step": 2560, "Pretrain/Step Time": 8.533908447250724} +{"Pretrain/Learning Rate": 4.2902833293668744e-05, "Pretrain/Loss": 2.1247944831848145, "Pretrain/Loss (Raw)": 2.1383697986602783, "Pretrain/Step": 2561, "Pretrain/Step Time": 8.529743937775493} +{"Pretrain/Learning Rate": 4.2896906465661623e-05, "Pretrain/Loss": 2.125354528427124, "Pretrain/Loss (Raw)": 2.1675713062286377, "Pretrain/Step": 2562, "Pretrain/Step Time": 8.531132297590375} +{"Pretrain/Learning Rate": 4.289097757369892e-05, "Pretrain/Loss": 2.1260924339294434, "Pretrain/Loss (Raw)": 2.258436679840088, "Pretrain/Step": 2563, "Pretrain/Step Time": 8.536669433116913} +{"Pretrain/Learning Rate": 4.288504661846437e-05, "Pretrain/Loss": 2.1274704933166504, "Pretrain/Loss (Raw)": 2.233689546585083, "Pretrain/Step": 2564, "Pretrain/Step Time": 8.530641756951809} +{"Pretrain/Learning Rate": 4.2879113600641976e-05, "Pretrain/Loss": 2.127168655395508, "Pretrain/Loss (Raw)": 2.1743381023406982, "Pretrain/Step": 2565, "Pretrain/Step Time": 8.53520867228508} +{"Pretrain/Learning Rate": 4.287317852091595e-05, "Pretrain/Loss": 2.1277923583984375, "Pretrain/Loss (Raw)": 2.1823482513427734, "Pretrain/Step": 2566, "Pretrain/Step Time": 8.532116275280714} +{"Pretrain/Learning Rate": 4.2867241379970754e-05, "Pretrain/Loss": 2.1277570724487305, "Pretrain/Loss (Raw)": 1.958177089691162, "Pretrain/Step": 2567, "Pretrain/Step Time": 8.529122907668352} +{"Pretrain/Learning Rate": 4.2861302178491094e-05, "Pretrain/Loss": 2.1222236156463623, "Pretrain/Loss (Raw)": 1.9686676263809204, "Pretrain/Step": 2568, "Pretrain/Step Time": 8.528902117162943} +{"Pretrain/Learning Rate": 4.28553609171619e-05, "Pretrain/Loss": 2.1219663619995117, "Pretrain/Loss (Raw)": 2.092958450317383, "Pretrain/Step": 2569, "Pretrain/Step Time": 8.544692227616906} +{"Pretrain/Learning Rate": 4.284941759666835e-05, "Pretrain/Loss": 2.121415138244629, "Pretrain/Loss (Raw)": 2.047905921936035, "Pretrain/Step": 2570, "Pretrain/Step Time": 8.53907254524529} +{"Pretrain/Learning Rate": 4.2843472217695844e-05, "Pretrain/Loss": 2.1213037967681885, "Pretrain/Loss (Raw)": 2.15008544921875, "Pretrain/Step": 2571, "Pretrain/Step Time": 8.543020674958825} +{"Pretrain/Learning Rate": 4.283752478093005e-05, "Pretrain/Loss": 2.1201915740966797, "Pretrain/Loss (Raw)": 2.146230936050415, "Pretrain/Step": 2572, "Pretrain/Step Time": 8.5378308724612} +{"Pretrain/Learning Rate": 4.283157528705683e-05, "Pretrain/Loss": 2.122232675552368, "Pretrain/Loss (Raw)": 2.165785074234009, "Pretrain/Step": 2573, "Pretrain/Step Time": 8.536313563585281} +{"Pretrain/Learning Rate": 4.2825623736762344e-05, "Pretrain/Loss": 2.1183242797851562, "Pretrain/Loss (Raw)": 1.6392920017242432, "Pretrain/Step": 2574, "Pretrain/Step Time": 8.536174561828375} +{"Pretrain/Learning Rate": 4.2819670130732926e-05, "Pretrain/Loss": 2.117609977722168, "Pretrain/Loss (Raw)": 2.200634241104126, "Pretrain/Step": 2575, "Pretrain/Step Time": 8.546442672610283} +{"Pretrain/Learning Rate": 4.2813714469655176e-05, "Pretrain/Loss": 2.1159281730651855, "Pretrain/Loss (Raw)": 1.9147990942001343, "Pretrain/Step": 2576, "Pretrain/Step Time": 8.545211609452963} +{"Pretrain/Learning Rate": 4.280775675421593e-05, "Pretrain/Loss": 2.1174983978271484, "Pretrain/Loss (Raw)": 2.3081226348876953, "Pretrain/Step": 2577, "Pretrain/Step Time": 8.55204633064568} +{"Pretrain/Learning Rate": 4.280179698510226e-05, "Pretrain/Loss": 2.1163244247436523, "Pretrain/Loss (Raw)": 2.135134220123291, "Pretrain/Step": 2578, "Pretrain/Step Time": 8.552298709750175} +{"Pretrain/Learning Rate": 4.279583516300148e-05, "Pretrain/Loss": 2.1183767318725586, "Pretrain/Loss (Raw)": 2.4030778408050537, "Pretrain/Step": 2579, "Pretrain/Step Time": 8.55166931450367} +{"Pretrain/Learning Rate": 4.2789871288601136e-05, "Pretrain/Loss": 2.1175198554992676, "Pretrain/Loss (Raw)": 1.9837449789047241, "Pretrain/Step": 2580, "Pretrain/Step Time": 8.55010954476893} +{"Pretrain/Learning Rate": 4.2783905362589e-05, "Pretrain/Loss": 2.119053363800049, "Pretrain/Loss (Raw)": 2.3134512901306152, "Pretrain/Step": 2581, "Pretrain/Step Time": 8.547595515847206} +{"Pretrain/Learning Rate": 4.27779373856531e-05, "Pretrain/Loss": 2.11621356010437, "Pretrain/Loss (Raw)": 1.8909265995025635, "Pretrain/Step": 2582, "Pretrain/Step Time": 8.559483179822564} +{"Pretrain/Learning Rate": 4.277196735848169e-05, "Pretrain/Loss": 2.1166515350341797, "Pretrain/Loss (Raw)": 1.9578903913497925, "Pretrain/Step": 2583, "Pretrain/Step Time": 8.553744545206428} +{"Pretrain/Learning Rate": 4.2765995281763263e-05, "Pretrain/Loss": 2.116258144378662, "Pretrain/Loss (Raw)": 2.127743721008301, "Pretrain/Step": 2584, "Pretrain/Step Time": 8.556197071447968} +{"Pretrain/Learning Rate": 4.2760021156186534e-05, "Pretrain/Loss": 2.1152987480163574, "Pretrain/Loss (Raw)": 1.998193621635437, "Pretrain/Step": 2585, "Pretrain/Step Time": 8.553279891610146} +{"Pretrain/Learning Rate": 4.2754044982440486e-05, "Pretrain/Loss": 2.116858720779419, "Pretrain/Loss (Raw)": 2.073026418685913, "Pretrain/Step": 2586, "Pretrain/Step Time": 8.555009480565786} +{"Pretrain/Learning Rate": 4.2748066761214305e-05, "Pretrain/Loss": 2.116549015045166, "Pretrain/Loss (Raw)": 1.9743428230285645, "Pretrain/Step": 2587, "Pretrain/Step Time": 8.548099461942911} +{"Pretrain/Learning Rate": 4.274208649319744e-05, "Pretrain/Loss": 2.1133954524993896, "Pretrain/Loss (Raw)": 1.9735649824142456, "Pretrain/Step": 2588, "Pretrain/Step Time": 8.55411527864635} +{"Pretrain/Learning Rate": 4.273610417907955e-05, "Pretrain/Loss": 2.1147944927215576, "Pretrain/Loss (Raw)": 2.2664637565612793, "Pretrain/Step": 2589, "Pretrain/Step Time": 8.55309253744781} +{"Pretrain/Learning Rate": 4.2730119819550555e-05, "Pretrain/Loss": 2.1147642135620117, "Pretrain/Loss (Raw)": 1.9672356843948364, "Pretrain/Step": 2590, "Pretrain/Step Time": 8.556203389540315} +{"Pretrain/Learning Rate": 4.2724133415300596e-05, "Pretrain/Loss": 2.114166021347046, "Pretrain/Loss (Raw)": 2.0370864868164062, "Pretrain/Step": 2591, "Pretrain/Step Time": 8.559115195646882} +{"Pretrain/Learning Rate": 4.271814496702005e-05, "Pretrain/Loss": 2.113416910171509, "Pretrain/Loss (Raw)": 2.0199217796325684, "Pretrain/Step": 2592, "Pretrain/Step Time": 8.56130295060575} +{"Pretrain/Learning Rate": 4.2712154475399534e-05, "Pretrain/Loss": 2.1127543449401855, "Pretrain/Loss (Raw)": 1.990500569343567, "Pretrain/Step": 2593, "Pretrain/Step Time": 8.567926157265902} +{"Pretrain/Learning Rate": 4.2706161941129906e-05, "Pretrain/Loss": 2.1135292053222656, "Pretrain/Loss (Raw)": 2.295698881149292, "Pretrain/Step": 2594, "Pretrain/Step Time": 8.551816023886204} +{"Pretrain/Learning Rate": 4.270016736490225e-05, "Pretrain/Loss": 2.1150922775268555, "Pretrain/Loss (Raw)": 2.2562499046325684, "Pretrain/Step": 2595, "Pretrain/Step Time": 8.558807576075196} +{"Pretrain/Learning Rate": 4.2694170747407886e-05, "Pretrain/Loss": 2.11857008934021, "Pretrain/Loss (Raw)": 2.349611520767212, "Pretrain/Step": 2596, "Pretrain/Step Time": 8.556805120781064} +{"Pretrain/Learning Rate": 4.268817208933837e-05, "Pretrain/Loss": 2.11739444732666, "Pretrain/Loss (Raw)": 1.9830917119979858, "Pretrain/Step": 2597, "Pretrain/Step Time": 8.55798694677651} +{"Pretrain/Learning Rate": 4.268217139138551e-05, "Pretrain/Loss": 2.115549087524414, "Pretrain/Loss (Raw)": 1.90809166431427, "Pretrain/Step": 2598, "Pretrain/Step Time": 8.557018555700779} +{"Pretrain/Learning Rate": 4.267616865424131e-05, "Pretrain/Loss": 2.1131935119628906, "Pretrain/Loss (Raw)": 2.131911039352417, "Pretrain/Step": 2599, "Pretrain/Step Time": 8.564523108303547} +{"Pretrain/Learning Rate": 4.267016387859806e-05, "Pretrain/Loss": 2.1129298210144043, "Pretrain/Loss (Raw)": 2.1874465942382812, "Pretrain/Step": 2600, "Pretrain/Step Time": 8.553377524018288} +{"Pretrain/Learning Rate": 4.266415706514824e-05, "Pretrain/Loss": 2.112154006958008, "Pretrain/Loss (Raw)": 2.0320990085601807, "Pretrain/Step": 2601, "Pretrain/Step Time": 8.555673316121101} +{"Pretrain/Learning Rate": 4.2658148214584585e-05, "Pretrain/Loss": 2.1130542755126953, "Pretrain/Loss (Raw)": 2.153566837310791, "Pretrain/Step": 2602, "Pretrain/Step Time": 8.556853288784623} +{"Pretrain/Learning Rate": 4.265213732760008e-05, "Pretrain/Loss": 2.114750623703003, "Pretrain/Loss (Raw)": 2.2171075344085693, "Pretrain/Step": 2603, "Pretrain/Step Time": 8.554742693901062} +{"Pretrain/Learning Rate": 4.264612440488791e-05, "Pretrain/Loss": 2.1137819290161133, "Pretrain/Loss (Raw)": 1.8903019428253174, "Pretrain/Step": 2604, "Pretrain/Step Time": 8.552466681227088} +{"Pretrain/Learning Rate": 4.264010944714153e-05, "Pretrain/Loss": 2.113204002380371, "Pretrain/Loss (Raw)": 2.118250846862793, "Pretrain/Step": 2605, "Pretrain/Step Time": 8.55475022085011} +{"Pretrain/Learning Rate": 4.263409245505461e-05, "Pretrain/Loss": 2.1132850646972656, "Pretrain/Loss (Raw)": 2.121687173843384, "Pretrain/Step": 2606, "Pretrain/Step Time": 8.552416501566768} +{"Pretrain/Learning Rate": 4.262807342932105e-05, "Pretrain/Loss": 2.115729331970215, "Pretrain/Loss (Raw)": 2.341536045074463, "Pretrain/Step": 2607, "Pretrain/Step Time": 8.55363179370761} +{"Pretrain/Learning Rate": 4.262205237063499e-05, "Pretrain/Loss": 2.1142690181732178, "Pretrain/Loss (Raw)": 1.9593706130981445, "Pretrain/Step": 2608, "Pretrain/Step Time": 8.553020613268018} +{"Pretrain/Learning Rate": 4.2616029279690814e-05, "Pretrain/Loss": 2.114795207977295, "Pretrain/Loss (Raw)": 2.0305562019348145, "Pretrain/Step": 2609, "Pretrain/Step Time": 8.550796184688807} +{"Pretrain/Learning Rate": 4.261000415718312e-05, "Pretrain/Loss": 2.111586093902588, "Pretrain/Loss (Raw)": 1.7525044679641724, "Pretrain/Step": 2610, "Pretrain/Step Time": 8.55167342722416} +{"Pretrain/Learning Rate": 4.260397700380679e-05, "Pretrain/Loss": 2.112196445465088, "Pretrain/Loss (Raw)": 2.2167770862579346, "Pretrain/Step": 2611, "Pretrain/Step Time": 8.560949677601457} +{"Pretrain/Learning Rate": 4.259794782025687e-05, "Pretrain/Loss": 2.112881660461426, "Pretrain/Loss (Raw)": 2.017225503921509, "Pretrain/Step": 2612, "Pretrain/Step Time": 8.560607260093093} +{"Pretrain/Learning Rate": 4.2591916607228675e-05, "Pretrain/Loss": 2.113011360168457, "Pretrain/Loss (Raw)": 2.0135602951049805, "Pretrain/Step": 2613, "Pretrain/Step Time": 8.559016218408942} +{"Pretrain/Learning Rate": 4.2585883365417774e-05, "Pretrain/Loss": 2.113943099975586, "Pretrain/Loss (Raw)": 2.162825345993042, "Pretrain/Step": 2614, "Pretrain/Step Time": 8.554168820381165} +{"Pretrain/Learning Rate": 4.2579848095519926e-05, "Pretrain/Loss": 2.113222599029541, "Pretrain/Loss (Raw)": 2.124866247177124, "Pretrain/Step": 2615, "Pretrain/Step Time": 8.552703358232975} +{"Pretrain/Learning Rate": 4.257381079823116e-05, "Pretrain/Loss": 2.111048698425293, "Pretrain/Loss (Raw)": 1.8278709650039673, "Pretrain/Step": 2616, "Pretrain/Step Time": 8.552167888730764} +{"Pretrain/Learning Rate": 4.2567771474247726e-05, "Pretrain/Loss": 2.111445426940918, "Pretrain/Loss (Raw)": 2.0386476516723633, "Pretrain/Step": 2617, "Pretrain/Step Time": 8.556780880317092} +{"Pretrain/Learning Rate": 4.2561730124266094e-05, "Pretrain/Loss": 2.1128365993499756, "Pretrain/Loss (Raw)": 2.1382641792297363, "Pretrain/Step": 2618, "Pretrain/Step Time": 8.56759007833898} +{"Pretrain/Learning Rate": 4.255568674898301e-05, "Pretrain/Loss": 2.1134438514709473, "Pretrain/Loss (Raw)": 2.3199477195739746, "Pretrain/Step": 2619, "Pretrain/Step Time": 8.557773012667894} +{"Pretrain/Learning Rate": 4.254964134909538e-05, "Pretrain/Loss": 2.1112189292907715, "Pretrain/Loss (Raw)": 2.023679733276367, "Pretrain/Step": 2620, "Pretrain/Step Time": 8.556004341691732} +{"Pretrain/Learning Rate": 4.254359392530043e-05, "Pretrain/Loss": 2.109186887741089, "Pretrain/Loss (Raw)": 1.8148072957992554, "Pretrain/Step": 2621, "Pretrain/Step Time": 8.55607539601624} +{"Pretrain/Learning Rate": 4.2537544478295556e-05, "Pretrain/Loss": 2.110593318939209, "Pretrain/Loss (Raw)": 2.2178261280059814, "Pretrain/Step": 2622, "Pretrain/Step Time": 8.555118469521403} +{"Pretrain/Learning Rate": 4.253149300877841e-05, "Pretrain/Loss": 2.110769748687744, "Pretrain/Loss (Raw)": 2.130472183227539, "Pretrain/Step": 2623, "Pretrain/Step Time": 8.56666823476553} +{"Pretrain/Learning Rate": 4.252543951744688e-05, "Pretrain/Loss": 2.1112520694732666, "Pretrain/Loss (Raw)": 2.2312846183776855, "Pretrain/Step": 2624, "Pretrain/Step Time": 8.566944148391485} +{"Pretrain/Learning Rate": 4.251938400499909e-05, "Pretrain/Loss": 2.112144947052002, "Pretrain/Loss (Raw)": 2.003791093826294, "Pretrain/Step": 2625, "Pretrain/Step Time": 8.5609215721488} +{"Pretrain/Learning Rate": 4.251332647213337e-05, "Pretrain/Loss": 2.115294933319092, "Pretrain/Loss (Raw)": 2.281343936920166, "Pretrain/Step": 2626, "Pretrain/Step Time": 8.559741159901023} +{"Pretrain/Learning Rate": 4.250726691954832e-05, "Pretrain/Loss": 2.1156795024871826, "Pretrain/Loss (Raw)": 2.1825168132781982, "Pretrain/Step": 2627, "Pretrain/Step Time": 8.55507213063538} +{"Pretrain/Learning Rate": 4.250120534794275e-05, "Pretrain/Loss": 2.117999792098999, "Pretrain/Loss (Raw)": 2.1470320224761963, "Pretrain/Step": 2628, "Pretrain/Step Time": 8.559482319280505} +{"Pretrain/Learning Rate": 4.249514175801572e-05, "Pretrain/Loss": 2.11867094039917, "Pretrain/Loss (Raw)": 2.1145193576812744, "Pretrain/Step": 2629, "Pretrain/Step Time": 8.562040075659752} +{"Pretrain/Learning Rate": 4.248907615046649e-05, "Pretrain/Loss": 2.119298219680786, "Pretrain/Loss (Raw)": 2.2237539291381836, "Pretrain/Step": 2630, "Pretrain/Step Time": 8.558552965521812} +{"Pretrain/Learning Rate": 4.24830085259946e-05, "Pretrain/Loss": 2.121339797973633, "Pretrain/Loss (Raw)": 2.2836833000183105, "Pretrain/Step": 2631, "Pretrain/Step Time": 8.551841918379068} +{"Pretrain/Learning Rate": 4.247693888529978e-05, "Pretrain/Loss": 2.1185503005981445, "Pretrain/Loss (Raw)": 1.8362988233566284, "Pretrain/Step": 2632, "Pretrain/Step Time": 8.549448335543275} +{"Pretrain/Learning Rate": 4.247086722908201e-05, "Pretrain/Loss": 2.1174111366271973, "Pretrain/Loss (Raw)": 2.1405208110809326, "Pretrain/Step": 2633, "Pretrain/Step Time": 8.547686168923974} +{"Pretrain/Learning Rate": 4.24647935580415e-05, "Pretrain/Loss": 2.117541551589966, "Pretrain/Loss (Raw)": 2.2365963459014893, "Pretrain/Step": 2634, "Pretrain/Step Time": 8.55344919115305} +{"Pretrain/Learning Rate": 4.2458717872878715e-05, "Pretrain/Loss": 2.1156413555145264, "Pretrain/Loss (Raw)": 2.1656007766723633, "Pretrain/Step": 2635, "Pretrain/Step Time": 8.552829021587968} +{"Pretrain/Learning Rate": 4.245264017429431e-05, "Pretrain/Loss": 2.115077018737793, "Pretrain/Loss (Raw)": 2.107943058013916, "Pretrain/Step": 2636, "Pretrain/Step Time": 8.553339652717113} +{"Pretrain/Learning Rate": 4.2446560462989203e-05, "Pretrain/Loss": 2.11749267578125, "Pretrain/Loss (Raw)": 2.151895761489868, "Pretrain/Step": 2637, "Pretrain/Step Time": 8.542865566909313} +{"Pretrain/Learning Rate": 4.244047873966452e-05, "Pretrain/Loss": 2.118192434310913, "Pretrain/Loss (Raw)": 2.2324836254119873, "Pretrain/Step": 2638, "Pretrain/Step Time": 8.54499138891697} +{"Pretrain/Learning Rate": 4.2434395005021666e-05, "Pretrain/Loss": 2.1184539794921875, "Pretrain/Loss (Raw)": 1.974950909614563, "Pretrain/Step": 2639, "Pretrain/Step Time": 8.543235532939434} +{"Pretrain/Learning Rate": 4.242830925976221e-05, "Pretrain/Loss": 2.1175386905670166, "Pretrain/Loss (Raw)": 1.936660647392273, "Pretrain/Step": 2640, "Pretrain/Step Time": 8.547280123457313} +{"Pretrain/Learning Rate": 4.2422221504588016e-05, "Pretrain/Loss": 2.12226939201355, "Pretrain/Loss (Raw)": 2.5258896350860596, "Pretrain/Step": 2641, "Pretrain/Step Time": 8.54903713800013} +{"Pretrain/Learning Rate": 4.2416131740201134e-05, "Pretrain/Loss": 2.122685432434082, "Pretrain/Loss (Raw)": 2.1229026317596436, "Pretrain/Step": 2642, "Pretrain/Step Time": 8.545066237449646} +{"Pretrain/Learning Rate": 4.241003996730388e-05, "Pretrain/Loss": 2.1258325576782227, "Pretrain/Loss (Raw)": 2.399332284927368, "Pretrain/Step": 2643, "Pretrain/Step Time": 8.546267053112388} +{"Pretrain/Learning Rate": 4.240394618659878e-05, "Pretrain/Loss": 2.125762939453125, "Pretrain/Loss (Raw)": 2.3387441635131836, "Pretrain/Step": 2644, "Pretrain/Step Time": 8.548605397343636} +{"Pretrain/Learning Rate": 4.2397850398788586e-05, "Pretrain/Loss": 2.1234254837036133, "Pretrain/Loss (Raw)": 1.8178105354309082, "Pretrain/Step": 2645, "Pretrain/Step Time": 8.545535603538156} +{"Pretrain/Learning Rate": 4.239175260457631e-05, "Pretrain/Loss": 2.1214919090270996, "Pretrain/Loss (Raw)": 1.8082330226898193, "Pretrain/Step": 2646, "Pretrain/Step Time": 8.549688743427396} +{"Pretrain/Learning Rate": 4.2385652804665164e-05, "Pretrain/Loss": 2.1210765838623047, "Pretrain/Loss (Raw)": 2.0364480018615723, "Pretrain/Step": 2647, "Pretrain/Step Time": 8.552893428131938} +{"Pretrain/Learning Rate": 4.237955099975862e-05, "Pretrain/Loss": 2.121542453765869, "Pretrain/Loss (Raw)": 2.144949197769165, "Pretrain/Step": 2648, "Pretrain/Step Time": 8.548692857846618} +{"Pretrain/Learning Rate": 4.237344719056035e-05, "Pretrain/Loss": 2.1209492683410645, "Pretrain/Loss (Raw)": 2.067460060119629, "Pretrain/Step": 2649, "Pretrain/Step Time": 8.548739010468125} +{"Pretrain/Learning Rate": 4.236734137777429e-05, "Pretrain/Loss": 2.1238880157470703, "Pretrain/Loss (Raw)": 2.2831006050109863, "Pretrain/Step": 2650, "Pretrain/Step Time": 8.550065949559212} +{"Pretrain/Learning Rate": 4.236123356210458e-05, "Pretrain/Loss": 2.1217336654663086, "Pretrain/Loss (Raw)": 2.022571086883545, "Pretrain/Step": 2651, "Pretrain/Step Time": 8.548128753900528} +{"Pretrain/Learning Rate": 4.235512374425561e-05, "Pretrain/Loss": 2.118692398071289, "Pretrain/Loss (Raw)": 1.8672312498092651, "Pretrain/Step": 2652, "Pretrain/Step Time": 8.551027584820986} +{"Pretrain/Learning Rate": 4.234901192493199e-05, "Pretrain/Loss": 2.1179380416870117, "Pretrain/Loss (Raw)": 2.122539520263672, "Pretrain/Step": 2653, "Pretrain/Step Time": 8.548341948539019} +{"Pretrain/Learning Rate": 4.234289810483857e-05, "Pretrain/Loss": 2.1190218925476074, "Pretrain/Loss (Raw)": 2.158198118209839, "Pretrain/Step": 2654, "Pretrain/Step Time": 8.554436147212982} +{"Pretrain/Learning Rate": 4.233678228468041e-05, "Pretrain/Loss": 2.117053985595703, "Pretrain/Loss (Raw)": 2.1998512744903564, "Pretrain/Step": 2655, "Pretrain/Step Time": 8.551325161010027} +{"Pretrain/Learning Rate": 4.2330664465162826e-05, "Pretrain/Loss": 2.1176745891571045, "Pretrain/Loss (Raw)": 2.290513038635254, "Pretrain/Step": 2656, "Pretrain/Step Time": 8.554288705810905} +{"Pretrain/Learning Rate": 4.232454464699135e-05, "Pretrain/Loss": 2.116861581802368, "Pretrain/Loss (Raw)": 2.162137985229492, "Pretrain/Step": 2657, "Pretrain/Step Time": 8.551779802888632} +{"Pretrain/Learning Rate": 4.231842283087175e-05, "Pretrain/Loss": 2.1152865886688232, "Pretrain/Loss (Raw)": 2.034132480621338, "Pretrain/Step": 2658, "Pretrain/Step Time": 8.555126827210188} +{"Pretrain/Learning Rate": 4.231229901751002e-05, "Pretrain/Loss": 2.1137537956237793, "Pretrain/Loss (Raw)": 2.0146284103393555, "Pretrain/Step": 2659, "Pretrain/Step Time": 8.551351299509406} +{"Pretrain/Learning Rate": 4.2306173207612394e-05, "Pretrain/Loss": 2.115440607070923, "Pretrain/Loss (Raw)": 2.2667362689971924, "Pretrain/Step": 2660, "Pretrain/Step Time": 8.553872687742114} +{"Pretrain/Learning Rate": 4.230004540188533e-05, "Pretrain/Loss": 2.1166765689849854, "Pretrain/Loss (Raw)": 2.405182123184204, "Pretrain/Step": 2661, "Pretrain/Step Time": 8.549582781270146} +{"Pretrain/Learning Rate": 4.22939156010355e-05, "Pretrain/Loss": 2.1117048263549805, "Pretrain/Loss (Raw)": 2.101186752319336, "Pretrain/Step": 2662, "Pretrain/Step Time": 8.550013018772006} +{"Pretrain/Learning Rate": 4.2287783805769824e-05, "Pretrain/Loss": 2.1132073402404785, "Pretrain/Loss (Raw)": 2.2906494140625, "Pretrain/Step": 2663, "Pretrain/Step Time": 8.552353717386723} +{"Pretrain/Learning Rate": 4.2281650016795466e-05, "Pretrain/Loss": 2.1150169372558594, "Pretrain/Loss (Raw)": 2.241941452026367, "Pretrain/Step": 2664, "Pretrain/Step Time": 8.55399027839303} +{"Pretrain/Learning Rate": 4.227551423481979e-05, "Pretrain/Loss": 2.1124649047851562, "Pretrain/Loss (Raw)": 1.9769964218139648, "Pretrain/Step": 2665, "Pretrain/Step Time": 8.55458428710699} +{"Pretrain/Learning Rate": 4.2269376460550414e-05, "Pretrain/Loss": 2.112671375274658, "Pretrain/Loss (Raw)": 2.1238110065460205, "Pretrain/Step": 2666, "Pretrain/Step Time": 8.561017090454698} +{"Pretrain/Learning Rate": 4.226323669469516e-05, "Pretrain/Loss": 2.1140403747558594, "Pretrain/Loss (Raw)": 2.140186071395874, "Pretrain/Step": 2667, "Pretrain/Step Time": 8.55524254962802} +{"Pretrain/Learning Rate": 4.225709493796211e-05, "Pretrain/Loss": 2.116384506225586, "Pretrain/Loss (Raw)": 2.207273483276367, "Pretrain/Step": 2668, "Pretrain/Step Time": 8.562714153900743} +{"Pretrain/Learning Rate": 4.225095119105956e-05, "Pretrain/Loss": 2.1161632537841797, "Pretrain/Loss (Raw)": 2.2509958744049072, "Pretrain/Step": 2669, "Pretrain/Step Time": 8.56201246380806} +{"Pretrain/Learning Rate": 4.224480545469603e-05, "Pretrain/Loss": 2.1174306869506836, "Pretrain/Loss (Raw)": 2.1547486782073975, "Pretrain/Step": 2670, "Pretrain/Step Time": 8.56145928800106} +{"Pretrain/Learning Rate": 4.223865772958026e-05, "Pretrain/Loss": 2.116375684738159, "Pretrain/Loss (Raw)": 2.159646987915039, "Pretrain/Step": 2671, "Pretrain/Step Time": 8.565902253612876} +{"Pretrain/Learning Rate": 4.223250801642126e-05, "Pretrain/Loss": 2.1137685775756836, "Pretrain/Loss (Raw)": 1.9988739490509033, "Pretrain/Step": 2672, "Pretrain/Step Time": 8.565992202609777} +{"Pretrain/Learning Rate": 4.222635631592823e-05, "Pretrain/Loss": 2.1122117042541504, "Pretrain/Loss (Raw)": 2.1424291133880615, "Pretrain/Step": 2673, "Pretrain/Step Time": 8.556089961901307} +{"Pretrain/Learning Rate": 4.2220202628810614e-05, "Pretrain/Loss": 2.1118037700653076, "Pretrain/Loss (Raw)": 2.0798330307006836, "Pretrain/Step": 2674, "Pretrain/Step Time": 8.55979915894568} +{"Pretrain/Learning Rate": 4.2214046955778085e-05, "Pretrain/Loss": 2.1120829582214355, "Pretrain/Loss (Raw)": 1.9766316413879395, "Pretrain/Step": 2675, "Pretrain/Step Time": 8.556997517123818} +{"Pretrain/Learning Rate": 4.2207889297540546e-05, "Pretrain/Loss": 2.1117324829101562, "Pretrain/Loss (Raw)": 2.0775325298309326, "Pretrain/Step": 2676, "Pretrain/Step Time": 8.561768921092153} +{"Pretrain/Learning Rate": 4.2201729654808136e-05, "Pretrain/Loss": 2.1129252910614014, "Pretrain/Loss (Raw)": 2.1716256141662598, "Pretrain/Step": 2677, "Pretrain/Step Time": 8.561315286904573} +{"Pretrain/Learning Rate": 4.21955680282912e-05, "Pretrain/Loss": 2.111412286758423, "Pretrain/Loss (Raw)": 2.1335108280181885, "Pretrain/Step": 2678, "Pretrain/Step Time": 8.563109813258052} +{"Pretrain/Learning Rate": 4.218940441870033e-05, "Pretrain/Loss": 2.1106224060058594, "Pretrain/Loss (Raw)": 2.1655776500701904, "Pretrain/Step": 2679, "Pretrain/Step Time": 8.558437226340175} +{"Pretrain/Learning Rate": 4.218323882674634e-05, "Pretrain/Loss": 2.1129417419433594, "Pretrain/Loss (Raw)": 2.2991669178009033, "Pretrain/Step": 2680, "Pretrain/Step Time": 8.559180045500398} +{"Pretrain/Learning Rate": 4.217707125314029e-05, "Pretrain/Loss": 2.113346576690674, "Pretrain/Loss (Raw)": 2.054190158843994, "Pretrain/Step": 2681, "Pretrain/Step Time": 8.558432046324015} +{"Pretrain/Learning Rate": 4.217090169859343e-05, "Pretrain/Loss": 2.1131086349487305, "Pretrain/Loss (Raw)": 2.055730104446411, "Pretrain/Step": 2682, "Pretrain/Step Time": 8.559276007115841} +{"Pretrain/Learning Rate": 4.216473016381728e-05, "Pretrain/Loss": 2.1121389865875244, "Pretrain/Loss (Raw)": 2.068382740020752, "Pretrain/Step": 2683, "Pretrain/Step Time": 8.555878879502416} +{"Pretrain/Learning Rate": 4.215855664952356e-05, "Pretrain/Loss": 2.113938093185425, "Pretrain/Loss (Raw)": 2.1893362998962402, "Pretrain/Step": 2684, "Pretrain/Step Time": 8.562944740056992} +{"Pretrain/Learning Rate": 4.215238115642424e-05, "Pretrain/Loss": 2.114686965942383, "Pretrain/Loss (Raw)": 2.3097879886627197, "Pretrain/Step": 2685, "Pretrain/Step Time": 8.551434896886349} +{"Pretrain/Learning Rate": 4.2146203685231495e-05, "Pretrain/Loss": 2.1146392822265625, "Pretrain/Loss (Raw)": 2.1034069061279297, "Pretrain/Step": 2686, "Pretrain/Step Time": 8.560778837651014} +{"Pretrain/Learning Rate": 4.214002423665775e-05, "Pretrain/Loss": 2.114849328994751, "Pretrain/Loss (Raw)": 2.0200960636138916, "Pretrain/Step": 2687, "Pretrain/Step Time": 8.561841540038586} +{"Pretrain/Learning Rate": 4.213384281141563e-05, "Pretrain/Loss": 2.1121273040771484, "Pretrain/Loss (Raw)": 1.883697748184204, "Pretrain/Step": 2688, "Pretrain/Step Time": 8.56155645288527} +{"Pretrain/Learning Rate": 4.212765941021804e-05, "Pretrain/Loss": 2.1112723350524902, "Pretrain/Loss (Raw)": 2.0289316177368164, "Pretrain/Step": 2689, "Pretrain/Step Time": 8.565028123557568} +{"Pretrain/Learning Rate": 4.212147403377805e-05, "Pretrain/Loss": 2.1092207431793213, "Pretrain/Loss (Raw)": 1.9049776792526245, "Pretrain/Step": 2690, "Pretrain/Step Time": 8.560811338946223} +{"Pretrain/Learning Rate": 4.2115286682808995e-05, "Pretrain/Loss": 2.10695743560791, "Pretrain/Loss (Raw)": 1.9687579870224, "Pretrain/Step": 2691, "Pretrain/Step Time": 8.554577600210905} +{"Pretrain/Learning Rate": 4.210909735802442e-05, "Pretrain/Loss": 2.103208065032959, "Pretrain/Loss (Raw)": 1.7537521123886108, "Pretrain/Step": 2692, "Pretrain/Step Time": 8.559132795780897} +{"Pretrain/Learning Rate": 4.210290606013812e-05, "Pretrain/Loss": 2.1041712760925293, "Pretrain/Loss (Raw)": 2.2976245880126953, "Pretrain/Step": 2693, "Pretrain/Step Time": 8.555796997621655} +{"Pretrain/Learning Rate": 4.209671278986412e-05, "Pretrain/Loss": 2.1012609004974365, "Pretrain/Loss (Raw)": 1.8098169565200806, "Pretrain/Step": 2694, "Pretrain/Step Time": 8.558793449774384} +{"Pretrain/Learning Rate": 4.209051754791662e-05, "Pretrain/Loss": 2.1034460067749023, "Pretrain/Loss (Raw)": 2.2378649711608887, "Pretrain/Step": 2695, "Pretrain/Step Time": 8.564025709405541} +{"Pretrain/Learning Rate": 4.208432033501011e-05, "Pretrain/Loss": 2.1058144569396973, "Pretrain/Loss (Raw)": 2.2718541622161865, "Pretrain/Step": 2696, "Pretrain/Step Time": 8.563069785013795} +{"Pretrain/Learning Rate": 4.2078121151859276e-05, "Pretrain/Loss": 2.106138229370117, "Pretrain/Loss (Raw)": 2.134406328201294, "Pretrain/Step": 2697, "Pretrain/Step Time": 8.556757815182209} +{"Pretrain/Learning Rate": 4.2071919999179036e-05, "Pretrain/Loss": 2.108160972595215, "Pretrain/Loss (Raw)": 2.3067915439605713, "Pretrain/Step": 2698, "Pretrain/Step Time": 8.555670002475381} +{"Pretrain/Learning Rate": 4.206571687768454e-05, "Pretrain/Loss": 2.108025074005127, "Pretrain/Loss (Raw)": 2.1327226161956787, "Pretrain/Step": 2699, "Pretrain/Step Time": 8.55008733831346} +{"Pretrain/Learning Rate": 4.2059511788091146e-05, "Pretrain/Loss": 2.10617733001709, "Pretrain/Loss (Raw)": 1.9097174406051636, "Pretrain/Step": 2700, "Pretrain/Step Time": 8.555075837299228} +{"Pretrain/Learning Rate": 4.205330473111447e-05, "Pretrain/Loss": 2.1043596267700195, "Pretrain/Loss (Raw)": 1.933078646659851, "Pretrain/Step": 2701, "Pretrain/Step Time": 8.553867112845182} +{"Pretrain/Learning Rate": 4.204709570747034e-05, "Pretrain/Loss": 2.108851432800293, "Pretrain/Loss (Raw)": 2.214282512664795, "Pretrain/Step": 2702, "Pretrain/Step Time": 8.550893802195787} +{"Pretrain/Learning Rate": 4.2040884717874804e-05, "Pretrain/Loss": 2.1082968711853027, "Pretrain/Loss (Raw)": 2.1296255588531494, "Pretrain/Step": 2703, "Pretrain/Step Time": 8.553219797089696} +{"Pretrain/Learning Rate": 4.203467176304414e-05, "Pretrain/Loss": 2.1098361015319824, "Pretrain/Loss (Raw)": 2.111849308013916, "Pretrain/Step": 2704, "Pretrain/Step Time": 8.556478705257177} +{"Pretrain/Learning Rate": 4.202845684369486e-05, "Pretrain/Loss": 2.109635829925537, "Pretrain/Loss (Raw)": 2.282451868057251, "Pretrain/Step": 2705, "Pretrain/Step Time": 8.549510503187776} +{"Pretrain/Learning Rate": 4.202223996054369e-05, "Pretrain/Loss": 2.111959457397461, "Pretrain/Loss (Raw)": 2.432589054107666, "Pretrain/Step": 2706, "Pretrain/Step Time": 8.5472292304039} +{"Pretrain/Learning Rate": 4.20160211143076e-05, "Pretrain/Loss": 2.1107311248779297, "Pretrain/Loss (Raw)": 2.2458555698394775, "Pretrain/Step": 2707, "Pretrain/Step Time": 8.545246180146933} +{"Pretrain/Learning Rate": 4.200980030570377e-05, "Pretrain/Loss": 2.1131656169891357, "Pretrain/Loss (Raw)": 2.2953479290008545, "Pretrain/Step": 2708, "Pretrain/Step Time": 8.548465615138412} +{"Pretrain/Learning Rate": 4.2003577535449624e-05, "Pretrain/Loss": 2.1104531288146973, "Pretrain/Loss (Raw)": 1.966247320175171, "Pretrain/Step": 2709, "Pretrain/Step Time": 8.557235345244408} +{"Pretrain/Learning Rate": 4.199735280426279e-05, "Pretrain/Loss": 2.111427068710327, "Pretrain/Loss (Raw)": 2.0155770778656006, "Pretrain/Step": 2710, "Pretrain/Step Time": 8.545725351199508} +{"Pretrain/Learning Rate": 4.199112611286113e-05, "Pretrain/Loss": 2.1112589836120605, "Pretrain/Loss (Raw)": 1.9363629817962646, "Pretrain/Step": 2711, "Pretrain/Step Time": 8.548495644703507} +{"Pretrain/Learning Rate": 4.1984897461962754e-05, "Pretrain/Loss": 2.1109442710876465, "Pretrain/Loss (Raw)": 2.0874855518341064, "Pretrain/Step": 2712, "Pretrain/Step Time": 8.545552046969533} +{"Pretrain/Learning Rate": 4.197866685228596e-05, "Pretrain/Loss": 2.1103146076202393, "Pretrain/Loss (Raw)": 1.9176005125045776, "Pretrain/Step": 2713, "Pretrain/Step Time": 8.552933041006327} +{"Pretrain/Learning Rate": 4.19724342845493e-05, "Pretrain/Loss": 2.108945846557617, "Pretrain/Loss (Raw)": 1.8978147506713867, "Pretrain/Step": 2714, "Pretrain/Step Time": 8.54820504784584} +{"Pretrain/Learning Rate": 4.1966199759471535e-05, "Pretrain/Loss": 2.110218048095703, "Pretrain/Loss (Raw)": 2.137171983718872, "Pretrain/Step": 2715, "Pretrain/Step Time": 8.559875121340156} +{"Pretrain/Learning Rate": 4.195996327777167e-05, "Pretrain/Loss": 2.112748384475708, "Pretrain/Loss (Raw)": 2.2974696159362793, "Pretrain/Step": 2716, "Pretrain/Step Time": 8.553117165341973} +{"Pretrain/Learning Rate": 4.195372484016893e-05, "Pretrain/Loss": 2.1120190620422363, "Pretrain/Loss (Raw)": 2.1730797290802, "Pretrain/Step": 2717, "Pretrain/Step Time": 8.55233969539404} +{"Pretrain/Learning Rate": 4.1947484447382746e-05, "Pretrain/Loss": 2.1132254600524902, "Pretrain/Loss (Raw)": 2.121676445007324, "Pretrain/Step": 2718, "Pretrain/Step Time": 8.551627503708005} +{"Pretrain/Learning Rate": 4.194124210013279e-05, "Pretrain/Loss": 2.113961696624756, "Pretrain/Loss (Raw)": 2.1313271522521973, "Pretrain/Step": 2719, "Pretrain/Step Time": 8.550184870138764} +{"Pretrain/Learning Rate": 4.1934997799138976e-05, "Pretrain/Loss": 2.1136348247528076, "Pretrain/Loss (Raw)": 1.9780874252319336, "Pretrain/Step": 2720, "Pretrain/Step Time": 8.546192014589906} +{"Pretrain/Learning Rate": 4.192875154512141e-05, "Pretrain/Loss": 2.114945888519287, "Pretrain/Loss (Raw)": 2.158287525177002, "Pretrain/Step": 2721, "Pretrain/Step Time": 8.548304226249456} +{"Pretrain/Learning Rate": 4.192250333880045e-05, "Pretrain/Loss": 2.1129584312438965, "Pretrain/Loss (Raw)": 2.041339874267578, "Pretrain/Step": 2722, "Pretrain/Step Time": 8.552654882892966} +{"Pretrain/Learning Rate": 4.191625318089666e-05, "Pretrain/Loss": 2.1111345291137695, "Pretrain/Loss (Raw)": 2.022763967514038, "Pretrain/Step": 2723, "Pretrain/Step Time": 8.547926049679518} +{"Pretrain/Learning Rate": 4.191000107213084e-05, "Pretrain/Loss": 2.108659505844116, "Pretrain/Loss (Raw)": 2.0328400135040283, "Pretrain/Step": 2724, "Pretrain/Step Time": 8.547565836459398} +{"Pretrain/Learning Rate": 4.190374701322401e-05, "Pretrain/Loss": 2.109905242919922, "Pretrain/Loss (Raw)": 2.142540693283081, "Pretrain/Step": 2725, "Pretrain/Step Time": 8.547500705346465} +{"Pretrain/Learning Rate": 4.1897491004897435e-05, "Pretrain/Loss": 2.111917495727539, "Pretrain/Loss (Raw)": 2.165654182434082, "Pretrain/Step": 2726, "Pretrain/Step Time": 8.548124985769391} +{"Pretrain/Learning Rate": 4.189123304787256e-05, "Pretrain/Loss": 2.1127119064331055, "Pretrain/Loss (Raw)": 2.2335898876190186, "Pretrain/Step": 2727, "Pretrain/Step Time": 8.548484122380614} +{"Pretrain/Learning Rate": 4.1884973142871096e-05, "Pretrain/Loss": 2.113605499267578, "Pretrain/Loss (Raw)": 2.3018312454223633, "Pretrain/Step": 2728, "Pretrain/Step Time": 8.553024150431156} +{"Pretrain/Learning Rate": 4.187871129061498e-05, "Pretrain/Loss": 2.1133832931518555, "Pretrain/Loss (Raw)": 2.003667116165161, "Pretrain/Step": 2729, "Pretrain/Step Time": 8.54883493669331} +{"Pretrain/Learning Rate": 4.187244749182633e-05, "Pretrain/Loss": 2.1120262145996094, "Pretrain/Loss (Raw)": 1.9798250198364258, "Pretrain/Step": 2730, "Pretrain/Step Time": 8.552324462682009} +{"Pretrain/Learning Rate": 4.1866181747227526e-05, "Pretrain/Loss": 2.1107635498046875, "Pretrain/Loss (Raw)": 2.0555057525634766, "Pretrain/Step": 2731, "Pretrain/Step Time": 8.551631009206176} +{"Pretrain/Learning Rate": 4.185991405754118e-05, "Pretrain/Loss": 2.1126880645751953, "Pretrain/Loss (Raw)": 2.1366426944732666, "Pretrain/Step": 2732, "Pretrain/Step Time": 8.54742588289082} +{"Pretrain/Learning Rate": 4.185364442349008e-05, "Pretrain/Loss": 2.111052989959717, "Pretrain/Loss (Raw)": 1.908929705619812, "Pretrain/Step": 2733, "Pretrain/Step Time": 8.554657895117998} +{"Pretrain/Learning Rate": 4.184737284579731e-05, "Pretrain/Loss": 2.111854076385498, "Pretrain/Loss (Raw)": 2.2242724895477295, "Pretrain/Step": 2734, "Pretrain/Step Time": 8.555345192551613} +{"Pretrain/Learning Rate": 4.18410993251861e-05, "Pretrain/Loss": 2.1088786125183105, "Pretrain/Loss (Raw)": 1.9606497287750244, "Pretrain/Step": 2735, "Pretrain/Step Time": 8.554340414702892} +{"Pretrain/Learning Rate": 4.183482386237996e-05, "Pretrain/Loss": 2.1102118492126465, "Pretrain/Loss (Raw)": 2.1300227642059326, "Pretrain/Step": 2736, "Pretrain/Step Time": 8.55208401940763} +{"Pretrain/Learning Rate": 4.182854645810261e-05, "Pretrain/Loss": 2.111201524734497, "Pretrain/Loss (Raw)": 2.15724515914917, "Pretrain/Step": 2737, "Pretrain/Step Time": 8.555154709145427} +{"Pretrain/Learning Rate": 4.182226711307798e-05, "Pretrain/Loss": 2.1128389835357666, "Pretrain/Loss (Raw)": 1.9621047973632812, "Pretrain/Step": 2738, "Pretrain/Step Time": 8.552578365430236} +{"Pretrain/Learning Rate": 4.181598582803024e-05, "Pretrain/Loss": 2.1152701377868652, "Pretrain/Loss (Raw)": 2.527958393096924, "Pretrain/Step": 2739, "Pretrain/Step Time": 8.548287661746144} +{"Pretrain/Learning Rate": 4.1809702603683776e-05, "Pretrain/Loss": 2.1174564361572266, "Pretrain/Loss (Raw)": 2.2970850467681885, "Pretrain/Step": 2740, "Pretrain/Step Time": 8.548985781148076} +{"Pretrain/Learning Rate": 4.1803417440763196e-05, "Pretrain/Loss": 2.119013547897339, "Pretrain/Loss (Raw)": 2.2128682136535645, "Pretrain/Step": 2741, "Pretrain/Step Time": 8.549154100939631} +{"Pretrain/Learning Rate": 4.179713033999333e-05, "Pretrain/Loss": 2.117583751678467, "Pretrain/Loss (Raw)": 1.9798070192337036, "Pretrain/Step": 2742, "Pretrain/Step Time": 8.547618871554732} +{"Pretrain/Learning Rate": 4.1790841302099246e-05, "Pretrain/Loss": 2.117154598236084, "Pretrain/Loss (Raw)": 2.06994891166687, "Pretrain/Step": 2743, "Pretrain/Step Time": 8.550028551369905} +{"Pretrain/Learning Rate": 4.1784550327806226e-05, "Pretrain/Loss": 2.1186230182647705, "Pretrain/Loss (Raw)": 2.0158207416534424, "Pretrain/Step": 2744, "Pretrain/Step Time": 8.551181625574827} +{"Pretrain/Learning Rate": 4.177825741783977e-05, "Pretrain/Loss": 2.11836576461792, "Pretrain/Loss (Raw)": 2.005686044692993, "Pretrain/Step": 2745, "Pretrain/Step Time": 8.554700788110495} +{"Pretrain/Learning Rate": 4.1771962572925606e-05, "Pretrain/Loss": 2.116910457611084, "Pretrain/Loss (Raw)": 1.9520376920700073, "Pretrain/Step": 2746, "Pretrain/Step Time": 8.546459786593914} +{"Pretrain/Learning Rate": 4.176566579378968e-05, "Pretrain/Loss": 2.1137044429779053, "Pretrain/Loss (Raw)": 1.9095405340194702, "Pretrain/Step": 2747, "Pretrain/Step Time": 8.5479945987463} +{"Pretrain/Learning Rate": 4.175936708115818e-05, "Pretrain/Loss": 2.1146762371063232, "Pretrain/Loss (Raw)": 2.1480860710144043, "Pretrain/Step": 2748, "Pretrain/Step Time": 8.548597659915686} +{"Pretrain/Learning Rate": 4.1753066435757494e-05, "Pretrain/Loss": 2.1159112453460693, "Pretrain/Loss (Raw)": 1.9728631973266602, "Pretrain/Step": 2749, "Pretrain/Step Time": 8.550528762862086} +{"Pretrain/Learning Rate": 4.1746763858314244e-05, "Pretrain/Loss": 2.1139445304870605, "Pretrain/Loss (Raw)": 1.9661134481430054, "Pretrain/Step": 2750, "Pretrain/Step Time": 8.548133958131075} +{"Pretrain/Learning Rate": 4.174045934955527e-05, "Pretrain/Loss": 2.112987995147705, "Pretrain/Loss (Raw)": 2.0080184936523438, "Pretrain/Step": 2751, "Pretrain/Step Time": 8.548833668231964} +{"Pretrain/Learning Rate": 4.173415291020764e-05, "Pretrain/Loss": 2.1121323108673096, "Pretrain/Loss (Raw)": 2.12176513671875, "Pretrain/Step": 2752, "Pretrain/Step Time": 8.548323346301913} +{"Pretrain/Learning Rate": 4.172784454099865e-05, "Pretrain/Loss": 2.111130714416504, "Pretrain/Loss (Raw)": 1.8755899667739868, "Pretrain/Step": 2753, "Pretrain/Step Time": 8.549826456233859} +{"Pretrain/Learning Rate": 4.172153424265579e-05, "Pretrain/Loss": 2.1092841625213623, "Pretrain/Loss (Raw)": 2.04498028755188, "Pretrain/Step": 2754, "Pretrain/Step Time": 8.549773683771491} +{"Pretrain/Learning Rate": 4.171522201590682e-05, "Pretrain/Loss": 2.1079907417297363, "Pretrain/Loss (Raw)": 2.0169341564178467, "Pretrain/Step": 2755, "Pretrain/Step Time": 8.549556674435735} +{"Pretrain/Learning Rate": 4.170890786147967e-05, "Pretrain/Loss": 2.1069223880767822, "Pretrain/Loss (Raw)": 2.010298013687134, "Pretrain/Step": 2756, "Pretrain/Step Time": 8.543021004647017} +{"Pretrain/Learning Rate": 4.170259178010254e-05, "Pretrain/Loss": 2.105588912963867, "Pretrain/Loss (Raw)": 1.9438388347625732, "Pretrain/Step": 2757, "Pretrain/Step Time": 8.550342943519354} +{"Pretrain/Learning Rate": 4.169627377250382e-05, "Pretrain/Loss": 2.10520601272583, "Pretrain/Loss (Raw)": 2.1747584342956543, "Pretrain/Step": 2758, "Pretrain/Step Time": 8.548272997140884} +{"Pretrain/Learning Rate": 4.1689953839412124e-05, "Pretrain/Loss": 2.104884147644043, "Pretrain/Loss (Raw)": 2.2424468994140625, "Pretrain/Step": 2759, "Pretrain/Step Time": 8.54734748415649} +{"Pretrain/Learning Rate": 4.1683631981556314e-05, "Pretrain/Loss": 2.1067910194396973, "Pretrain/Loss (Raw)": 2.0803894996643066, "Pretrain/Step": 2760, "Pretrain/Step Time": 8.550960019230843} +{"Pretrain/Learning Rate": 4.167730819966545e-05, "Pretrain/Loss": 2.107138156890869, "Pretrain/Loss (Raw)": 2.184955358505249, "Pretrain/Step": 2761, "Pretrain/Step Time": 8.551707923412323} +{"Pretrain/Learning Rate": 4.167098249446881e-05, "Pretrain/Loss": 2.105151653289795, "Pretrain/Loss (Raw)": 1.9823360443115234, "Pretrain/Step": 2762, "Pretrain/Step Time": 8.54471699334681} +{"Pretrain/Learning Rate": 4.166465486669592e-05, "Pretrain/Loss": 2.1046369075775146, "Pretrain/Loss (Raw)": 2.099698543548584, "Pretrain/Step": 2763, "Pretrain/Step Time": 8.548441281542182} +{"Pretrain/Learning Rate": 4.16583253170765e-05, "Pretrain/Loss": 2.1041054725646973, "Pretrain/Loss (Raw)": 2.0399489402770996, "Pretrain/Step": 2764, "Pretrain/Step Time": 8.547406485304236} +{"Pretrain/Learning Rate": 4.165199384634051e-05, "Pretrain/Loss": 2.102790355682373, "Pretrain/Loss (Raw)": 1.9835330247879028, "Pretrain/Step": 2765, "Pretrain/Step Time": 8.54947148822248} +{"Pretrain/Learning Rate": 4.164566045521812e-05, "Pretrain/Loss": 2.1013364791870117, "Pretrain/Loss (Raw)": 2.0463902950286865, "Pretrain/Step": 2766, "Pretrain/Step Time": 8.547129221260548} +{"Pretrain/Learning Rate": 4.163932514443973e-05, "Pretrain/Loss": 2.1035332679748535, "Pretrain/Loss (Raw)": 2.2561583518981934, "Pretrain/Step": 2767, "Pretrain/Step Time": 8.545512948185205} +{"Pretrain/Learning Rate": 4.163298791473596e-05, "Pretrain/Loss": 2.1054768562316895, "Pretrain/Loss (Raw)": 2.185431957244873, "Pretrain/Step": 2768, "Pretrain/Step Time": 8.543732114136219} +{"Pretrain/Learning Rate": 4.1626648766837654e-05, "Pretrain/Loss": 2.102686882019043, "Pretrain/Loss (Raw)": 2.1687777042388916, "Pretrain/Step": 2769, "Pretrain/Step Time": 8.54789287596941} +{"Pretrain/Learning Rate": 4.162030770147585e-05, "Pretrain/Loss": 2.10322904586792, "Pretrain/Loss (Raw)": 2.1922826766967773, "Pretrain/Step": 2770, "Pretrain/Step Time": 8.550491193309426} +{"Pretrain/Learning Rate": 4.161396471938185e-05, "Pretrain/Loss": 2.1007635593414307, "Pretrain/Loss (Raw)": 2.0837514400482178, "Pretrain/Step": 2771, "Pretrain/Step Time": 8.547813368961215} +{"Pretrain/Learning Rate": 4.1607619821287154e-05, "Pretrain/Loss": 2.0984511375427246, "Pretrain/Loss (Raw)": 2.0427730083465576, "Pretrain/Step": 2772, "Pretrain/Step Time": 8.544793659821153} +{"Pretrain/Learning Rate": 4.160127300792348e-05, "Pretrain/Loss": 2.1004090309143066, "Pretrain/Loss (Raw)": 2.068408966064453, "Pretrain/Step": 2773, "Pretrain/Step Time": 8.549440298229456} +{"Pretrain/Learning Rate": 4.159492428002277e-05, "Pretrain/Loss": 2.102998733520508, "Pretrain/Loss (Raw)": 2.1397368907928467, "Pretrain/Step": 2774, "Pretrain/Step Time": 8.545649087056518} +{"Pretrain/Learning Rate": 4.1588573638317195e-05, "Pretrain/Loss": 2.1039812564849854, "Pretrain/Loss (Raw)": 2.1621944904327393, "Pretrain/Step": 2775, "Pretrain/Step Time": 8.551366977393627} +{"Pretrain/Learning Rate": 4.158222108353915e-05, "Pretrain/Loss": 2.1006414890289307, "Pretrain/Loss (Raw)": 1.7174575328826904, "Pretrain/Step": 2776, "Pretrain/Step Time": 8.549389980733395} +{"Pretrain/Learning Rate": 4.1575866616421224e-05, "Pretrain/Loss": 2.1018834114074707, "Pretrain/Loss (Raw)": 2.2264208793640137, "Pretrain/Step": 2777, "Pretrain/Step Time": 8.55378165282309} +{"Pretrain/Learning Rate": 4.156951023769625e-05, "Pretrain/Loss": 2.101263999938965, "Pretrain/Loss (Raw)": 2.203819513320923, "Pretrain/Step": 2778, "Pretrain/Step Time": 8.552983473986387} +{"Pretrain/Learning Rate": 4.156315194809728e-05, "Pretrain/Loss": 2.103148937225342, "Pretrain/Loss (Raw)": 2.263835906982422, "Pretrain/Step": 2779, "Pretrain/Step Time": 8.552850555628538} +{"Pretrain/Learning Rate": 4.1556791748357584e-05, "Pretrain/Loss": 2.1059672832489014, "Pretrain/Loss (Raw)": 2.2279999256134033, "Pretrain/Step": 2780, "Pretrain/Step Time": 8.549675026908517} +{"Pretrain/Learning Rate": 4.155042963921064e-05, "Pretrain/Loss": 2.1052346229553223, "Pretrain/Loss (Raw)": 2.0287489891052246, "Pretrain/Step": 2781, "Pretrain/Step Time": 8.555480228736997} +{"Pretrain/Learning Rate": 4.1544065621390165e-05, "Pretrain/Loss": 2.1039042472839355, "Pretrain/Loss (Raw)": 1.9879323244094849, "Pretrain/Step": 2782, "Pretrain/Step Time": 8.5479826759547} +{"Pretrain/Learning Rate": 4.153769969563008e-05, "Pretrain/Loss": 2.1020023822784424, "Pretrain/Loss (Raw)": 1.956398367881775, "Pretrain/Step": 2783, "Pretrain/Step Time": 8.555980417877436} +{"Pretrain/Learning Rate": 4.1531331862664545e-05, "Pretrain/Loss": 2.0999250411987305, "Pretrain/Loss (Raw)": 2.0246293544769287, "Pretrain/Step": 2784, "Pretrain/Step Time": 8.549387307837605} +{"Pretrain/Learning Rate": 4.1524962123227914e-05, "Pretrain/Loss": 2.0973126888275146, "Pretrain/Loss (Raw)": 1.827723503112793, "Pretrain/Step": 2785, "Pretrain/Step Time": 8.553414450958371} +{"Pretrain/Learning Rate": 4.151859047805479e-05, "Pretrain/Loss": 2.098837375640869, "Pretrain/Loss (Raw)": 2.2293124198913574, "Pretrain/Step": 2786, "Pretrain/Step Time": 8.549527229741216} +{"Pretrain/Learning Rate": 4.151221692787997e-05, "Pretrain/Loss": 2.099000930786133, "Pretrain/Loss (Raw)": 2.035541534423828, "Pretrain/Step": 2787, "Pretrain/Step Time": 8.55033316463232} +{"Pretrain/Learning Rate": 4.1505841473438485e-05, "Pretrain/Loss": 2.0968313217163086, "Pretrain/Loss (Raw)": 1.9890466928482056, "Pretrain/Step": 2788, "Pretrain/Step Time": 8.547885144129395} +{"Pretrain/Learning Rate": 4.149946411546558e-05, "Pretrain/Loss": 2.097297191619873, "Pretrain/Loss (Raw)": 2.4648239612579346, "Pretrain/Step": 2789, "Pretrain/Step Time": 8.553167758509517} +{"Pretrain/Learning Rate": 4.1493084854696726e-05, "Pretrain/Loss": 2.097170352935791, "Pretrain/Loss (Raw)": 2.0849413871765137, "Pretrain/Step": 2790, "Pretrain/Step Time": 8.554906075820327} +{"Pretrain/Learning Rate": 4.1486703691867616e-05, "Pretrain/Loss": 2.0960192680358887, "Pretrain/Loss (Raw)": 2.143315553665161, "Pretrain/Step": 2791, "Pretrain/Step Time": 8.554095949977636} +{"Pretrain/Learning Rate": 4.148032062771414e-05, "Pretrain/Loss": 2.0951285362243652, "Pretrain/Loss (Raw)": 2.1279051303863525, "Pretrain/Step": 2792, "Pretrain/Step Time": 8.555493099614978} +{"Pretrain/Learning Rate": 4.147393566297244e-05, "Pretrain/Loss": 2.094367027282715, "Pretrain/Loss (Raw)": 1.8795222043991089, "Pretrain/Step": 2793, "Pretrain/Step Time": 8.55431674234569} +{"Pretrain/Learning Rate": 4.1467548798378847e-05, "Pretrain/Loss": 2.094297409057617, "Pretrain/Loss (Raw)": 2.114915370941162, "Pretrain/Step": 2794, "Pretrain/Step Time": 8.557939006015658} +{"Pretrain/Learning Rate": 4.1461160034669925e-05, "Pretrain/Loss": 2.093066692352295, "Pretrain/Loss (Raw)": 1.9826256036758423, "Pretrain/Step": 2795, "Pretrain/Step Time": 8.555687505751848} +{"Pretrain/Learning Rate": 4.145476937258247e-05, "Pretrain/Loss": 2.0919618606567383, "Pretrain/Loss (Raw)": 2.0658669471740723, "Pretrain/Step": 2796, "Pretrain/Step Time": 8.548614839091897} +{"Pretrain/Learning Rate": 4.144837681285346e-05, "Pretrain/Loss": 2.092478036880493, "Pretrain/Loss (Raw)": 2.31707763671875, "Pretrain/Step": 2797, "Pretrain/Step Time": 8.550232119858265} +{"Pretrain/Learning Rate": 4.1441982356220144e-05, "Pretrain/Loss": 2.090729236602783, "Pretrain/Loss (Raw)": 1.9309226274490356, "Pretrain/Step": 2798, "Pretrain/Step Time": 8.551595272496343} +{"Pretrain/Learning Rate": 4.1435586003419935e-05, "Pretrain/Loss": 2.089716911315918, "Pretrain/Loss (Raw)": 2.030043601989746, "Pretrain/Step": 2799, "Pretrain/Step Time": 8.54442653991282} +{"Pretrain/Learning Rate": 4.1429187755190504e-05, "Pretrain/Loss": 2.0900018215179443, "Pretrain/Loss (Raw)": 2.035353422164917, "Pretrain/Step": 2800, "Pretrain/Step Time": 8.553377766162157} +{"Pretrain/Learning Rate": 4.1422787612269726e-05, "Pretrain/Loss": 2.089416027069092, "Pretrain/Loss (Raw)": 2.0674378871917725, "Pretrain/Step": 2801, "Pretrain/Step Time": 8.562703255563974} +{"Pretrain/Learning Rate": 4.1416385575395686e-05, "Pretrain/Loss": 2.089589834213257, "Pretrain/Loss (Raw)": 2.102085590362549, "Pretrain/Step": 2802, "Pretrain/Step Time": 8.555452963337302} +{"Pretrain/Learning Rate": 4.140998164530672e-05, "Pretrain/Loss": 2.089754581451416, "Pretrain/Loss (Raw)": 1.9977282285690308, "Pretrain/Step": 2803, "Pretrain/Step Time": 8.55512234941125} +{"Pretrain/Learning Rate": 4.140357582274133e-05, "Pretrain/Loss": 2.088470697402954, "Pretrain/Loss (Raw)": 1.913183331489563, "Pretrain/Step": 2804, "Pretrain/Step Time": 8.550610762089491} +{"Pretrain/Learning Rate": 4.1397168108438286e-05, "Pretrain/Loss": 2.088026523590088, "Pretrain/Loss (Raw)": 2.114750385284424, "Pretrain/Step": 2805, "Pretrain/Step Time": 8.553674744442105} +{"Pretrain/Learning Rate": 4.139075850313655e-05, "Pretrain/Loss": 2.087883472442627, "Pretrain/Loss (Raw)": 2.1152281761169434, "Pretrain/Step": 2806, "Pretrain/Step Time": 8.551498472690582} +{"Pretrain/Learning Rate": 4.1384347007575305e-05, "Pretrain/Loss": 2.0876545906066895, "Pretrain/Loss (Raw)": 2.136265277862549, "Pretrain/Step": 2807, "Pretrain/Step Time": 8.551576627418399} +{"Pretrain/Learning Rate": 4.137793362249396e-05, "Pretrain/Loss": 2.0872864723205566, "Pretrain/Loss (Raw)": 2.2520458698272705, "Pretrain/Step": 2808, "Pretrain/Step Time": 8.553731966763735} +{"Pretrain/Learning Rate": 4.137151834863213e-05, "Pretrain/Loss": 2.08786678314209, "Pretrain/Loss (Raw)": 2.128502130508423, "Pretrain/Step": 2809, "Pretrain/Step Time": 8.556030863896012} +{"Pretrain/Learning Rate": 4.136510118672966e-05, "Pretrain/Loss": 2.0873634815216064, "Pretrain/Loss (Raw)": 1.99129056930542, "Pretrain/Step": 2810, "Pretrain/Step Time": 8.556881664320827} +{"Pretrain/Learning Rate": 4.135868213752661e-05, "Pretrain/Loss": 2.0884342193603516, "Pretrain/Loss (Raw)": 2.2054331302642822, "Pretrain/Step": 2811, "Pretrain/Step Time": 8.55723381228745} +{"Pretrain/Learning Rate": 4.135226120176325e-05, "Pretrain/Loss": 2.0875487327575684, "Pretrain/Loss (Raw)": 2.0759735107421875, "Pretrain/Step": 2812, "Pretrain/Step Time": 8.560464968904853} +{"Pretrain/Learning Rate": 4.134583838018007e-05, "Pretrain/Loss": 2.0868892669677734, "Pretrain/Loss (Raw)": 2.2253897190093994, "Pretrain/Step": 2813, "Pretrain/Step Time": 8.56153323687613} +{"Pretrain/Learning Rate": 4.133941367351779e-05, "Pretrain/Loss": 2.088118314743042, "Pretrain/Loss (Raw)": 2.2607429027557373, "Pretrain/Step": 2814, "Pretrain/Step Time": 8.55024941265583} +{"Pretrain/Learning Rate": 4.133298708251733e-05, "Pretrain/Loss": 2.0888848304748535, "Pretrain/Loss (Raw)": 2.1182122230529785, "Pretrain/Step": 2815, "Pretrain/Step Time": 8.552998777478933} +{"Pretrain/Learning Rate": 4.132655860791983e-05, "Pretrain/Loss": 2.091327667236328, "Pretrain/Loss (Raw)": 2.1963512897491455, "Pretrain/Step": 2816, "Pretrain/Step Time": 8.553278455510736} +{"Pretrain/Learning Rate": 4.132012825046666e-05, "Pretrain/Loss": 2.0917277336120605, "Pretrain/Loss (Raw)": 2.0801429748535156, "Pretrain/Step": 2817, "Pretrain/Step Time": 8.552128864452243} +{"Pretrain/Learning Rate": 4.13136960108994e-05, "Pretrain/Loss": 2.0937678813934326, "Pretrain/Loss (Raw)": 2.16613507270813, "Pretrain/Step": 2818, "Pretrain/Step Time": 8.562278043478727} +{"Pretrain/Learning Rate": 4.130726188995985e-05, "Pretrain/Loss": 2.0952067375183105, "Pretrain/Loss (Raw)": 2.1529080867767334, "Pretrain/Step": 2819, "Pretrain/Step Time": 8.559911727905273} +{"Pretrain/Learning Rate": 4.1300825888390006e-05, "Pretrain/Loss": 2.09850811958313, "Pretrain/Loss (Raw)": 2.1763556003570557, "Pretrain/Step": 2820, "Pretrain/Step Time": 8.558403993025422} +{"Pretrain/Learning Rate": 4.1294388006932114e-05, "Pretrain/Loss": 2.0985841751098633, "Pretrain/Loss (Raw)": 2.307325601577759, "Pretrain/Step": 2821, "Pretrain/Step Time": 8.559492040425539} +{"Pretrain/Learning Rate": 4.128794824632861e-05, "Pretrain/Loss": 2.100228786468506, "Pretrain/Loss (Raw)": 2.020343065261841, "Pretrain/Step": 2822, "Pretrain/Step Time": 8.559774819761515} +{"Pretrain/Learning Rate": 4.1281506607322167e-05, "Pretrain/Loss": 2.099029541015625, "Pretrain/Loss (Raw)": 2.0843794345855713, "Pretrain/Step": 2823, "Pretrain/Step Time": 8.558247093111277} +{"Pretrain/Learning Rate": 4.1275063090655666e-05, "Pretrain/Loss": 2.099377155303955, "Pretrain/Loss (Raw)": 2.316335678100586, "Pretrain/Step": 2824, "Pretrain/Step Time": 8.568049425259233} +{"Pretrain/Learning Rate": 4.126861769707219e-05, "Pretrain/Loss": 2.098360776901245, "Pretrain/Loss (Raw)": 2.004314661026001, "Pretrain/Step": 2825, "Pretrain/Step Time": 8.560745395720005} +{"Pretrain/Learning Rate": 4.126217042731507e-05, "Pretrain/Loss": 2.097062349319458, "Pretrain/Loss (Raw)": 2.1406049728393555, "Pretrain/Step": 2826, "Pretrain/Step Time": 8.565067613497376} +{"Pretrain/Learning Rate": 4.125572128212781e-05, "Pretrain/Loss": 2.0974080562591553, "Pretrain/Loss (Raw)": 2.1769566535949707, "Pretrain/Step": 2827, "Pretrain/Step Time": 8.564213460311294} +{"Pretrain/Learning Rate": 4.124927026225419e-05, "Pretrain/Loss": 2.0979232788085938, "Pretrain/Loss (Raw)": 1.9756680727005005, "Pretrain/Step": 2828, "Pretrain/Step Time": 8.563468620181084} +{"Pretrain/Learning Rate": 4.124281736843815e-05, "Pretrain/Loss": 2.0974302291870117, "Pretrain/Loss (Raw)": 1.8699930906295776, "Pretrain/Step": 2829, "Pretrain/Step Time": 8.561056479811668} +{"Pretrain/Learning Rate": 4.1236362601423865e-05, "Pretrain/Loss": 2.096189260482788, "Pretrain/Loss (Raw)": 2.0554158687591553, "Pretrain/Step": 2830, "Pretrain/Step Time": 8.572172237560153} +{"Pretrain/Learning Rate": 4.122990596195574e-05, "Pretrain/Loss": 2.095336675643921, "Pretrain/Loss (Raw)": 2.0204832553863525, "Pretrain/Step": 2831, "Pretrain/Step Time": 8.558200465515256} +{"Pretrain/Learning Rate": 4.122344745077838e-05, "Pretrain/Loss": 2.0941104888916016, "Pretrain/Loss (Raw)": 1.954924464225769, "Pretrain/Step": 2832, "Pretrain/Step Time": 8.559069514274597} +{"Pretrain/Learning Rate": 4.121698706863662e-05, "Pretrain/Loss": 2.0945162773132324, "Pretrain/Loss (Raw)": 2.334383964538574, "Pretrain/Step": 2833, "Pretrain/Step Time": 8.557586451992393} +{"Pretrain/Learning Rate": 4.121052481627549e-05, "Pretrain/Loss": 2.0900282859802246, "Pretrain/Loss (Raw)": 1.8581428527832031, "Pretrain/Step": 2834, "Pretrain/Step Time": 8.561769800260663} +{"Pretrain/Learning Rate": 4.120406069444025e-05, "Pretrain/Loss": 2.0879154205322266, "Pretrain/Loss (Raw)": 1.9753851890563965, "Pretrain/Step": 2835, "Pretrain/Step Time": 8.560958353802562} +{"Pretrain/Learning Rate": 4.119759470387637e-05, "Pretrain/Loss": 2.087501049041748, "Pretrain/Loss (Raw)": 2.242321014404297, "Pretrain/Step": 2836, "Pretrain/Step Time": 8.569790692999959} +{"Pretrain/Learning Rate": 4.1191126845329554e-05, "Pretrain/Loss": 2.0898425579071045, "Pretrain/Loss (Raw)": 2.2659401893615723, "Pretrain/Step": 2837, "Pretrain/Step Time": 8.55959264934063} +{"Pretrain/Learning Rate": 4.118465711954569e-05, "Pretrain/Loss": 2.0901145935058594, "Pretrain/Loss (Raw)": 2.050410270690918, "Pretrain/Step": 2838, "Pretrain/Step Time": 8.559081118553877} +{"Pretrain/Learning Rate": 4.1178185527270905e-05, "Pretrain/Loss": 2.0912365913391113, "Pretrain/Loss (Raw)": 2.0799708366394043, "Pretrain/Step": 2839, "Pretrain/Step Time": 8.55718463473022} +{"Pretrain/Learning Rate": 4.1171712069251534e-05, "Pretrain/Loss": 2.0895211696624756, "Pretrain/Loss (Raw)": 1.8679289817810059, "Pretrain/Step": 2840, "Pretrain/Step Time": 8.560630330815911} +{"Pretrain/Learning Rate": 4.116523674623412e-05, "Pretrain/Loss": 2.0913186073303223, "Pretrain/Loss (Raw)": 2.147639036178589, "Pretrain/Step": 2841, "Pretrain/Step Time": 8.557448418810964} +{"Pretrain/Learning Rate": 4.115875955896543e-05, "Pretrain/Loss": 2.0915238857269287, "Pretrain/Loss (Raw)": 1.9241247177124023, "Pretrain/Step": 2842, "Pretrain/Step Time": 8.569104498252273} +{"Pretrain/Learning Rate": 4.115228050819244e-05, "Pretrain/Loss": 2.0913219451904297, "Pretrain/Loss (Raw)": 2.1112937927246094, "Pretrain/Step": 2843, "Pretrain/Step Time": 8.557275734841824} +{"Pretrain/Learning Rate": 4.114579959466235e-05, "Pretrain/Loss": 2.0907461643218994, "Pretrain/Loss (Raw)": 2.223801612854004, "Pretrain/Step": 2844, "Pretrain/Step Time": 8.555760579183698} +{"Pretrain/Learning Rate": 4.113931681912257e-05, "Pretrain/Loss": 2.0921683311462402, "Pretrain/Loss (Raw)": 2.3551106452941895, "Pretrain/Step": 2845, "Pretrain/Step Time": 8.556594612076879} +{"Pretrain/Learning Rate": 4.113283218232073e-05, "Pretrain/Loss": 2.0925545692443848, "Pretrain/Loss (Raw)": 2.1710944175720215, "Pretrain/Step": 2846, "Pretrain/Step Time": 8.55460423976183} +{"Pretrain/Learning Rate": 4.112634568500466e-05, "Pretrain/Loss": 2.0940513610839844, "Pretrain/Loss (Raw)": 2.322935104370117, "Pretrain/Step": 2847, "Pretrain/Step Time": 8.555519297719002} +{"Pretrain/Learning Rate": 4.111985732792242e-05, "Pretrain/Loss": 2.0942304134368896, "Pretrain/Loss (Raw)": 2.0009891986846924, "Pretrain/Step": 2848, "Pretrain/Step Time": 8.561281083151698} +{"Pretrain/Learning Rate": 4.111336711182226e-05, "Pretrain/Loss": 2.0948562622070312, "Pretrain/Loss (Raw)": 2.238407611846924, "Pretrain/Step": 2849, "Pretrain/Step Time": 8.552255567163229} +{"Pretrain/Learning Rate": 4.110687503745269e-05, "Pretrain/Loss": 2.096351146697998, "Pretrain/Loss (Raw)": 2.232710123062134, "Pretrain/Step": 2850, "Pretrain/Step Time": 8.555697912350297} +{"Pretrain/Learning Rate": 4.1100381105562394e-05, "Pretrain/Loss": 2.0971665382385254, "Pretrain/Loss (Raw)": 2.127082347869873, "Pretrain/Step": 2851, "Pretrain/Step Time": 8.551850829273462} +{"Pretrain/Learning Rate": 4.109388531690027e-05, "Pretrain/Loss": 2.0981497764587402, "Pretrain/Loss (Raw)": 2.1587188243865967, "Pretrain/Step": 2852, "Pretrain/Step Time": 8.551025556400418} +{"Pretrain/Learning Rate": 4.108738767221546e-05, "Pretrain/Loss": 2.098165512084961, "Pretrain/Loss (Raw)": 2.1445600986480713, "Pretrain/Step": 2853, "Pretrain/Step Time": 8.552165247499943} +{"Pretrain/Learning Rate": 4.108088817225729e-05, "Pretrain/Loss": 2.0989794731140137, "Pretrain/Loss (Raw)": 2.2698326110839844, "Pretrain/Step": 2854, "Pretrain/Step Time": 8.557384325191379} +{"Pretrain/Learning Rate": 4.1074386817775334e-05, "Pretrain/Loss": 2.0975050926208496, "Pretrain/Loss (Raw)": 2.0448906421661377, "Pretrain/Step": 2855, "Pretrain/Step Time": 8.548468090593815} +{"Pretrain/Learning Rate": 4.106788360951934e-05, "Pretrain/Loss": 2.0953917503356934, "Pretrain/Loss (Raw)": 2.031308650970459, "Pretrain/Step": 2856, "Pretrain/Step Time": 8.546280279755592} +{"Pretrain/Learning Rate": 4.106137854823929e-05, "Pretrain/Loss": 2.095297336578369, "Pretrain/Loss (Raw)": 1.9915733337402344, "Pretrain/Step": 2857, "Pretrain/Step Time": 8.550949091091752} +{"Pretrain/Learning Rate": 4.1054871634685385e-05, "Pretrain/Loss": 2.096156358718872, "Pretrain/Loss (Raw)": 2.089796781539917, "Pretrain/Step": 2858, "Pretrain/Step Time": 8.548542918637395} +{"Pretrain/Learning Rate": 4.104836286960802e-05, "Pretrain/Loss": 2.0951130390167236, "Pretrain/Loss (Raw)": 1.9219619035720825, "Pretrain/Step": 2859, "Pretrain/Step Time": 8.549284579232335} +{"Pretrain/Learning Rate": 4.1041852253757836e-05, "Pretrain/Loss": 2.0938258171081543, "Pretrain/Loss (Raw)": 1.9718612432479858, "Pretrain/Step": 2860, "Pretrain/Step Time": 8.557575795799494} +{"Pretrain/Learning Rate": 4.103533978788566e-05, "Pretrain/Loss": 2.0941507816314697, "Pretrain/Loss (Raw)": 1.9505159854888916, "Pretrain/Step": 2861, "Pretrain/Step Time": 8.543737916275859} +{"Pretrain/Learning Rate": 4.1028825472742536e-05, "Pretrain/Loss": 2.090662956237793, "Pretrain/Loss (Raw)": 1.7778383493423462, "Pretrain/Step": 2862, "Pretrain/Step Time": 8.547823520377278} +{"Pretrain/Learning Rate": 4.1022309309079734e-05, "Pretrain/Loss": 2.093270778656006, "Pretrain/Loss (Raw)": 2.29449462890625, "Pretrain/Step": 2863, "Pretrain/Step Time": 8.543771103024483} +{"Pretrain/Learning Rate": 4.1015791297648716e-05, "Pretrain/Loss": 2.0931222438812256, "Pretrain/Loss (Raw)": 2.1109695434570312, "Pretrain/Step": 2864, "Pretrain/Step Time": 8.546994987875223} +{"Pretrain/Learning Rate": 4.100927143920118e-05, "Pretrain/Loss": 2.0922279357910156, "Pretrain/Loss (Raw)": 2.0427920818328857, "Pretrain/Step": 2865, "Pretrain/Step Time": 8.546090329065919} +{"Pretrain/Learning Rate": 4.100274973448902e-05, "Pretrain/Loss": 2.094162940979004, "Pretrain/Loss (Raw)": 2.2097840309143066, "Pretrain/Step": 2866, "Pretrain/Step Time": 8.551508976146579} +{"Pretrain/Learning Rate": 4.099622618426436e-05, "Pretrain/Loss": 2.091520309448242, "Pretrain/Loss (Raw)": 2.189685344696045, "Pretrain/Step": 2867, "Pretrain/Step Time": 8.54245730675757} +{"Pretrain/Learning Rate": 4.098970078927951e-05, "Pretrain/Loss": 2.0900797843933105, "Pretrain/Loss (Raw)": 2.1126980781555176, "Pretrain/Step": 2868, "Pretrain/Step Time": 8.551761215552688} +{"Pretrain/Learning Rate": 4.0983173550287026e-05, "Pretrain/Loss": 2.0894346237182617, "Pretrain/Loss (Raw)": 2.1302757263183594, "Pretrain/Step": 2869, "Pretrain/Step Time": 8.550208568572998} +{"Pretrain/Learning Rate": 4.0976644468039646e-05, "Pretrain/Loss": 2.0907042026519775, "Pretrain/Loss (Raw)": 2.1423392295837402, "Pretrain/Step": 2870, "Pretrain/Step Time": 8.551169954240322} +{"Pretrain/Learning Rate": 4.097011354329035e-05, "Pretrain/Loss": 2.0918285846710205, "Pretrain/Loss (Raw)": 2.2138662338256836, "Pretrain/Step": 2871, "Pretrain/Step Time": 8.552570421248674} +{"Pretrain/Learning Rate": 4.096358077679231e-05, "Pretrain/Loss": 2.09226655960083, "Pretrain/Loss (Raw)": 2.071885824203491, "Pretrain/Step": 2872, "Pretrain/Step Time": 8.553001379594207} +{"Pretrain/Learning Rate": 4.0957046169298895e-05, "Pretrain/Loss": 2.0939526557922363, "Pretrain/Loss (Raw)": 2.2215001583099365, "Pretrain/Step": 2873, "Pretrain/Step Time": 8.55026687681675} +{"Pretrain/Learning Rate": 4.095050972156374e-05, "Pretrain/Loss": 2.0952553749084473, "Pretrain/Loss (Raw)": 2.1187567710876465, "Pretrain/Step": 2874, "Pretrain/Step Time": 8.548311388120055} +{"Pretrain/Learning Rate": 4.0943971434340633e-05, "Pretrain/Loss": 2.096182107925415, "Pretrain/Loss (Raw)": 2.0281732082366943, "Pretrain/Step": 2875, "Pretrain/Step Time": 8.547980435192585} +{"Pretrain/Learning Rate": 4.093743130838361e-05, "Pretrain/Loss": 2.0969953536987305, "Pretrain/Loss (Raw)": 2.252223014831543, "Pretrain/Step": 2876, "Pretrain/Step Time": 8.548713956028223} +{"Pretrain/Learning Rate": 4.093088934444692e-05, "Pretrain/Loss": 2.0974278450012207, "Pretrain/Loss (Raw)": 2.0281972885131836, "Pretrain/Step": 2877, "Pretrain/Step Time": 8.544395392760634} +{"Pretrain/Learning Rate": 4.092434554328499e-05, "Pretrain/Loss": 2.098118543624878, "Pretrain/Loss (Raw)": 2.0545122623443604, "Pretrain/Step": 2878, "Pretrain/Step Time": 8.55061861500144} +{"Pretrain/Learning Rate": 4.09177999056525e-05, "Pretrain/Loss": 2.0991361141204834, "Pretrain/Loss (Raw)": 2.138270616531372, "Pretrain/Step": 2879, "Pretrain/Step Time": 8.541895037516952} +{"Pretrain/Learning Rate": 4.0911252432304316e-05, "Pretrain/Loss": 2.0989744663238525, "Pretrain/Loss (Raw)": 2.1010806560516357, "Pretrain/Step": 2880, "Pretrain/Step Time": 8.54497393220663} +{"Pretrain/Learning Rate": 4.0904703123995516e-05, "Pretrain/Loss": 2.099597930908203, "Pretrain/Loss (Raw)": 1.9553799629211426, "Pretrain/Step": 2881, "Pretrain/Step Time": 8.54288387671113} +{"Pretrain/Learning Rate": 4.0898151981481416e-05, "Pretrain/Loss": 2.1007866859436035, "Pretrain/Loss (Raw)": 2.1971421241760254, "Pretrain/Step": 2882, "Pretrain/Step Time": 8.54279424622655} +{"Pretrain/Learning Rate": 4.089159900551752e-05, "Pretrain/Loss": 2.101484775543213, "Pretrain/Loss (Raw)": 2.106285572052002, "Pretrain/Step": 2883, "Pretrain/Step Time": 8.545370254665613} +{"Pretrain/Learning Rate": 4.0885044196859537e-05, "Pretrain/Loss": 2.1004538536071777, "Pretrain/Loss (Raw)": 1.8783626556396484, "Pretrain/Step": 2884, "Pretrain/Step Time": 8.547242039814591} +{"Pretrain/Learning Rate": 4.08784875562634e-05, "Pretrain/Loss": 2.1011056900024414, "Pretrain/Loss (Raw)": 2.0272409915924072, "Pretrain/Step": 2885, "Pretrain/Step Time": 8.542692877352238} +{"Pretrain/Learning Rate": 4.087192908448526e-05, "Pretrain/Loss": 2.1004722118377686, "Pretrain/Loss (Raw)": 2.0936927795410156, "Pretrain/Step": 2886, "Pretrain/Step Time": 8.549622360616922} +{"Pretrain/Learning Rate": 4.086536878228147e-05, "Pretrain/Loss": 2.09907603263855, "Pretrain/Loss (Raw)": 2.0637295246124268, "Pretrain/Step": 2887, "Pretrain/Step Time": 8.546244632452726} +{"Pretrain/Learning Rate": 4.0858806650408586e-05, "Pretrain/Loss": 2.098330020904541, "Pretrain/Loss (Raw)": 1.984928011894226, "Pretrain/Step": 2888, "Pretrain/Step Time": 8.545479776337743} +{"Pretrain/Learning Rate": 4.08522426896234e-05, "Pretrain/Loss": 2.0970845222473145, "Pretrain/Loss (Raw)": 2.025500535964966, "Pretrain/Step": 2889, "Pretrain/Step Time": 8.54269222728908} +{"Pretrain/Learning Rate": 4.0845676900682884e-05, "Pretrain/Loss": 2.098526954650879, "Pretrain/Loss (Raw)": 2.1669869422912598, "Pretrain/Step": 2890, "Pretrain/Step Time": 8.545357117429376} +{"Pretrain/Learning Rate": 4.0839109284344235e-05, "Pretrain/Loss": 2.099625587463379, "Pretrain/Loss (Raw)": 2.240288019180298, "Pretrain/Step": 2891, "Pretrain/Step Time": 8.547661505639553} +{"Pretrain/Learning Rate": 4.083253984136487e-05, "Pretrain/Loss": 2.0982627868652344, "Pretrain/Loss (Raw)": 1.865532398223877, "Pretrain/Step": 2892, "Pretrain/Step Time": 8.549183879047632} +{"Pretrain/Learning Rate": 4.0825968572502404e-05, "Pretrain/Loss": 2.0986053943634033, "Pretrain/Loss (Raw)": 2.0273916721343994, "Pretrain/Step": 2893, "Pretrain/Step Time": 8.54734655097127} +{"Pretrain/Learning Rate": 4.081939547851467e-05, "Pretrain/Loss": 2.100813150405884, "Pretrain/Loss (Raw)": 2.328984260559082, "Pretrain/Step": 2894, "Pretrain/Step Time": 8.548735881224275} +{"Pretrain/Learning Rate": 4.0812820560159705e-05, "Pretrain/Loss": 2.0999841690063477, "Pretrain/Loss (Raw)": 2.150043487548828, "Pretrain/Step": 2895, "Pretrain/Step Time": 8.548656914383173} +{"Pretrain/Learning Rate": 4.0806243818195765e-05, "Pretrain/Loss": 2.0992989540100098, "Pretrain/Loss (Raw)": 2.0977253913879395, "Pretrain/Step": 2896, "Pretrain/Step Time": 8.549061369150877} +{"Pretrain/Learning Rate": 4.07996652533813e-05, "Pretrain/Loss": 2.098499298095703, "Pretrain/Loss (Raw)": 2.0664255619049072, "Pretrain/Step": 2897, "Pretrain/Step Time": 8.54194306395948} +{"Pretrain/Learning Rate": 4.0793084866474986e-05, "Pretrain/Loss": 2.0979232788085938, "Pretrain/Loss (Raw)": 2.118549346923828, "Pretrain/Step": 2898, "Pretrain/Step Time": 8.540278982371092} +{"Pretrain/Learning Rate": 4.078650265823571e-05, "Pretrain/Loss": 2.1000397205352783, "Pretrain/Loss (Raw)": 2.3546459674835205, "Pretrain/Step": 2899, "Pretrain/Step Time": 8.544887240976095} +{"Pretrain/Learning Rate": 4.077991862942256e-05, "Pretrain/Loss": 2.099266290664673, "Pretrain/Loss (Raw)": 1.9437825679779053, "Pretrain/Step": 2900, "Pretrain/Step Time": 8.54987332969904} +{"Pretrain/Learning Rate": 4.0773332780794834e-05, "Pretrain/Loss": 2.0984127521514893, "Pretrain/Loss (Raw)": 1.959163784980774, "Pretrain/Step": 2901, "Pretrain/Step Time": 8.54534874483943} +{"Pretrain/Learning Rate": 4.076674511311205e-05, "Pretrain/Loss": 2.096743106842041, "Pretrain/Loss (Raw)": 1.9260140657424927, "Pretrain/Step": 2902, "Pretrain/Step Time": 8.547929380089045} +{"Pretrain/Learning Rate": 4.0760155627133924e-05, "Pretrain/Loss": 2.0965607166290283, "Pretrain/Loss (Raw)": 2.138840675354004, "Pretrain/Step": 2903, "Pretrain/Step Time": 8.55290555022657} +{"Pretrain/Learning Rate": 4.075356432362037e-05, "Pretrain/Loss": 2.0987796783447266, "Pretrain/Loss (Raw)": 2.0014901161193848, "Pretrain/Step": 2904, "Pretrain/Step Time": 8.551902404055} +{"Pretrain/Learning Rate": 4.074697120333156e-05, "Pretrain/Loss": 2.099414825439453, "Pretrain/Loss (Raw)": 2.3077385425567627, "Pretrain/Step": 2905, "Pretrain/Step Time": 8.54994723573327} +{"Pretrain/Learning Rate": 4.0740376267027836e-05, "Pretrain/Loss": 2.1002724170684814, "Pretrain/Loss (Raw)": 2.3135762214660645, "Pretrain/Step": 2906, "Pretrain/Step Time": 8.545075507834554} +{"Pretrain/Learning Rate": 4.0733779515469736e-05, "Pretrain/Loss": 2.0987679958343506, "Pretrain/Loss (Raw)": 2.0712716579437256, "Pretrain/Step": 2907, "Pretrain/Step Time": 8.549206405878067} +{"Pretrain/Learning Rate": 4.072718094941805e-05, "Pretrain/Loss": 2.0971598625183105, "Pretrain/Loss (Raw)": 2.0221564769744873, "Pretrain/Step": 2908, "Pretrain/Step Time": 8.549684250727296} +{"Pretrain/Learning Rate": 4.0720580569633746e-05, "Pretrain/Loss": 2.0973424911499023, "Pretrain/Loss (Raw)": 2.052109479904175, "Pretrain/Step": 2909, "Pretrain/Step Time": 8.552548684179783} +{"Pretrain/Learning Rate": 4.0713978376878016e-05, "Pretrain/Loss": 2.097429037094116, "Pretrain/Loss (Raw)": 1.9990439414978027, "Pretrain/Step": 2910, "Pretrain/Step Time": 8.550504134967923} +{"Pretrain/Learning Rate": 4.070737437191224e-05, "Pretrain/Loss": 2.0987415313720703, "Pretrain/Loss (Raw)": 2.124366521835327, "Pretrain/Step": 2911, "Pretrain/Step Time": 8.550848923623562} +{"Pretrain/Learning Rate": 4.0700768555498045e-05, "Pretrain/Loss": 2.098738670349121, "Pretrain/Loss (Raw)": 2.0242860317230225, "Pretrain/Step": 2912, "Pretrain/Step Time": 8.55087436363101} +{"Pretrain/Learning Rate": 4.069416092839724e-05, "Pretrain/Loss": 2.100735902786255, "Pretrain/Loss (Raw)": 2.083346128463745, "Pretrain/Step": 2913, "Pretrain/Step Time": 8.548175811767578} +{"Pretrain/Learning Rate": 4.068755149137184e-05, "Pretrain/Loss": 2.0994625091552734, "Pretrain/Loss (Raw)": 2.0663275718688965, "Pretrain/Step": 2914, "Pretrain/Step Time": 8.551492238417268} +{"Pretrain/Learning Rate": 4.0680940245184076e-05, "Pretrain/Loss": 2.0991711616516113, "Pretrain/Loss (Raw)": 1.9982738494873047, "Pretrain/Step": 2915, "Pretrain/Step Time": 8.551685953512788} +{"Pretrain/Learning Rate": 4.06743271905964e-05, "Pretrain/Loss": 2.0995826721191406, "Pretrain/Loss (Raw)": 2.0417025089263916, "Pretrain/Step": 2916, "Pretrain/Step Time": 8.549221374094486} +{"Pretrain/Learning Rate": 4.066771232837144e-05, "Pretrain/Loss": 2.096369743347168, "Pretrain/Loss (Raw)": 2.0535640716552734, "Pretrain/Step": 2917, "Pretrain/Step Time": 8.549942756071687} +{"Pretrain/Learning Rate": 4.066109565927208e-05, "Pretrain/Loss": 2.095306158065796, "Pretrain/Loss (Raw)": 1.9487919807434082, "Pretrain/Step": 2918, "Pretrain/Step Time": 8.544077016413212} +{"Pretrain/Learning Rate": 4.0654477184061356e-05, "Pretrain/Loss": 2.095470666885376, "Pretrain/Loss (Raw)": 2.164370059967041, "Pretrain/Step": 2919, "Pretrain/Step Time": 8.54471093416214} +{"Pretrain/Learning Rate": 4.064785690350257e-05, "Pretrain/Loss": 2.0955047607421875, "Pretrain/Loss (Raw)": 2.1322882175445557, "Pretrain/Step": 2920, "Pretrain/Step Time": 8.543207133188844} +{"Pretrain/Learning Rate": 4.064123481835919e-05, "Pretrain/Loss": 2.096950054168701, "Pretrain/Loss (Raw)": 2.0645086765289307, "Pretrain/Step": 2921, "Pretrain/Step Time": 8.556338211521506} +{"Pretrain/Learning Rate": 4.0634610929394893e-05, "Pretrain/Loss": 2.097200393676758, "Pretrain/Loss (Raw)": 2.1469521522521973, "Pretrain/Step": 2922, "Pretrain/Step Time": 8.545659866183996} +{"Pretrain/Learning Rate": 4.06279852373736e-05, "Pretrain/Loss": 2.097641944885254, "Pretrain/Loss (Raw)": 2.0391602516174316, "Pretrain/Step": 2923, "Pretrain/Step Time": 8.548603853210807} +{"Pretrain/Learning Rate": 4.0621357743059415e-05, "Pretrain/Loss": 2.097829818725586, "Pretrain/Loss (Raw)": 2.0899384021759033, "Pretrain/Step": 2924, "Pretrain/Step Time": 8.55025957338512} +{"Pretrain/Learning Rate": 4.061472844721664e-05, "Pretrain/Loss": 2.09735369682312, "Pretrain/Loss (Raw)": 2.256110906600952, "Pretrain/Step": 2925, "Pretrain/Step Time": 8.548335388302803} +{"Pretrain/Learning Rate": 4.06080973506098e-05, "Pretrain/Loss": 2.095766544342041, "Pretrain/Loss (Raw)": 1.7277895212173462, "Pretrain/Step": 2926, "Pretrain/Step Time": 8.54779008589685} +{"Pretrain/Learning Rate": 4.0601464454003624e-05, "Pretrain/Loss": 2.0982673168182373, "Pretrain/Loss (Raw)": 2.350107431411743, "Pretrain/Step": 2927, "Pretrain/Step Time": 8.562149941921234} +{"Pretrain/Learning Rate": 4.059482975816305e-05, "Pretrain/Loss": 2.099672317504883, "Pretrain/Loss (Raw)": 2.2152233123779297, "Pretrain/Step": 2928, "Pretrain/Step Time": 8.549183124676347} +{"Pretrain/Learning Rate": 4.058819326385322e-05, "Pretrain/Loss": 2.1032118797302246, "Pretrain/Loss (Raw)": 2.5204854011535645, "Pretrain/Step": 2929, "Pretrain/Step Time": 8.5470552444458} +{"Pretrain/Learning Rate": 4.05815549718395e-05, "Pretrain/Loss": 2.1020195484161377, "Pretrain/Loss (Raw)": 1.9494550228118896, "Pretrain/Step": 2930, "Pretrain/Step Time": 8.545939242467284} +{"Pretrain/Learning Rate": 4.057491488288743e-05, "Pretrain/Loss": 2.1039366722106934, "Pretrain/Loss (Raw)": 2.2431528568267822, "Pretrain/Step": 2931, "Pretrain/Step Time": 8.544798497110605} +{"Pretrain/Learning Rate": 4.0568272997762785e-05, "Pretrain/Loss": 2.10578989982605, "Pretrain/Loss (Raw)": 2.1503775119781494, "Pretrain/Step": 2932, "Pretrain/Step Time": 8.546423899009824} +{"Pretrain/Learning Rate": 4.056162931723154e-05, "Pretrain/Loss": 2.104839324951172, "Pretrain/Loss (Raw)": 1.9930683374404907, "Pretrain/Step": 2933, "Pretrain/Step Time": 8.551303999498487} +{"Pretrain/Learning Rate": 4.055498384205987e-05, "Pretrain/Loss": 2.105351209640503, "Pretrain/Loss (Raw)": 2.1807377338409424, "Pretrain/Step": 2934, "Pretrain/Step Time": 8.55254427716136} +{"Pretrain/Learning Rate": 4.054833657301417e-05, "Pretrain/Loss": 2.104243040084839, "Pretrain/Loss (Raw)": 1.994444489479065, "Pretrain/Step": 2935, "Pretrain/Step Time": 8.55078985542059} +{"Pretrain/Learning Rate": 4.054168751086102e-05, "Pretrain/Loss": 2.103799343109131, "Pretrain/Loss (Raw)": 2.195239782333374, "Pretrain/Step": 2936, "Pretrain/Step Time": 8.549993366003036} +{"Pretrain/Learning Rate": 4.053503665636724e-05, "Pretrain/Loss": 2.105400562286377, "Pretrain/Loss (Raw)": 2.3334591388702393, "Pretrain/Step": 2937, "Pretrain/Step Time": 8.546063071116805} +{"Pretrain/Learning Rate": 4.052838401029984e-05, "Pretrain/Loss": 2.1058342456817627, "Pretrain/Loss (Raw)": 2.0467782020568848, "Pretrain/Step": 2938, "Pretrain/Step Time": 8.54224213026464} +{"Pretrain/Learning Rate": 4.0521729573426006e-05, "Pretrain/Loss": 2.1040120124816895, "Pretrain/Loss (Raw)": 1.9721999168395996, "Pretrain/Step": 2939, "Pretrain/Step Time": 8.553410351276398} +{"Pretrain/Learning Rate": 4.051507334651318e-05, "Pretrain/Loss": 2.103088855743408, "Pretrain/Loss (Raw)": 1.957831859588623, "Pretrain/Step": 2940, "Pretrain/Step Time": 8.548282677307725} +{"Pretrain/Learning Rate": 4.050841533032899e-05, "Pretrain/Loss": 2.1055748462677, "Pretrain/Loss (Raw)": 2.5435991287231445, "Pretrain/Step": 2941, "Pretrain/Step Time": 8.553649129346013} +{"Pretrain/Learning Rate": 4.050175552564127e-05, "Pretrain/Loss": 2.1046829223632812, "Pretrain/Loss (Raw)": 2.146533727645874, "Pretrain/Step": 2942, "Pretrain/Step Time": 8.557308267802} +{"Pretrain/Learning Rate": 4.049509393321805e-05, "Pretrain/Loss": 2.1050009727478027, "Pretrain/Loss (Raw)": 2.1589572429656982, "Pretrain/Step": 2943, "Pretrain/Step Time": 8.554906388744712} +{"Pretrain/Learning Rate": 4.0488430553827585e-05, "Pretrain/Loss": 2.103902578353882, "Pretrain/Loss (Raw)": 2.0557618141174316, "Pretrain/Step": 2944, "Pretrain/Step Time": 8.555356903001666} +{"Pretrain/Learning Rate": 4.0481765388238324e-05, "Pretrain/Loss": 2.101177453994751, "Pretrain/Loss (Raw)": 1.7313395738601685, "Pretrain/Step": 2945, "Pretrain/Step Time": 8.567782416939735} +{"Pretrain/Learning Rate": 4.047509843721893e-05, "Pretrain/Loss": 2.103609800338745, "Pretrain/Loss (Raw)": 2.4774482250213623, "Pretrain/Step": 2946, "Pretrain/Step Time": 8.556934190914035} +{"Pretrain/Learning Rate": 4.0468429701538253e-05, "Pretrain/Loss": 2.1018311977386475, "Pretrain/Loss (Raw)": 1.9252678155899048, "Pretrain/Step": 2947, "Pretrain/Step Time": 8.555397879332304} +{"Pretrain/Learning Rate": 4.046175918196538e-05, "Pretrain/Loss": 2.100294589996338, "Pretrain/Loss (Raw)": 1.9796282052993774, "Pretrain/Step": 2948, "Pretrain/Step Time": 8.550462670624256} +{"Pretrain/Learning Rate": 4.045508687926958e-05, "Pretrain/Loss": 2.0982847213745117, "Pretrain/Loss (Raw)": 2.0500693321228027, "Pretrain/Step": 2949, "Pretrain/Step Time": 8.553040431812406} +{"Pretrain/Learning Rate": 4.044841279422034e-05, "Pretrain/Loss": 2.0989937782287598, "Pretrain/Loss (Raw)": 2.1111159324645996, "Pretrain/Step": 2950, "Pretrain/Step Time": 8.55239805392921} +{"Pretrain/Learning Rate": 4.044173692758733e-05, "Pretrain/Loss": 2.0973877906799316, "Pretrain/Loss (Raw)": 1.8788580894470215, "Pretrain/Step": 2951, "Pretrain/Step Time": 8.56178255751729} +{"Pretrain/Learning Rate": 4.043505928014045e-05, "Pretrain/Loss": 2.0933289527893066, "Pretrain/Loss (Raw)": 1.7967838048934937, "Pretrain/Step": 2952, "Pretrain/Step Time": 8.551593441516161} +{"Pretrain/Learning Rate": 4.0428379852649816e-05, "Pretrain/Loss": 2.093148946762085, "Pretrain/Loss (Raw)": 1.9812657833099365, "Pretrain/Step": 2953, "Pretrain/Step Time": 8.549086133018136} +{"Pretrain/Learning Rate": 4.042169864588571e-05, "Pretrain/Loss": 2.093832015991211, "Pretrain/Loss (Raw)": 2.2280168533325195, "Pretrain/Step": 2954, "Pretrain/Step Time": 8.549256142228842} +{"Pretrain/Learning Rate": 4.041501566061865e-05, "Pretrain/Loss": 2.092543840408325, "Pretrain/Loss (Raw)": 2.012077808380127, "Pretrain/Step": 2955, "Pretrain/Step Time": 8.54887024499476} +{"Pretrain/Learning Rate": 4.040833089761934e-05, "Pretrain/Loss": 2.093967914581299, "Pretrain/Loss (Raw)": 2.1579742431640625, "Pretrain/Step": 2956, "Pretrain/Step Time": 8.547451820224524} +{"Pretrain/Learning Rate": 4.040164435765871e-05, "Pretrain/Loss": 2.0961833000183105, "Pretrain/Loss (Raw)": 2.153532028198242, "Pretrain/Step": 2957, "Pretrain/Step Time": 8.552892664447427} +{"Pretrain/Learning Rate": 4.039495604150787e-05, "Pretrain/Loss": 2.0969390869140625, "Pretrain/Loss (Raw)": 2.152148485183716, "Pretrain/Step": 2958, "Pretrain/Step Time": 8.540933355689049} +{"Pretrain/Learning Rate": 4.0388265949938165e-05, "Pretrain/Loss": 2.0977442264556885, "Pretrain/Loss (Raw)": 2.1235837936401367, "Pretrain/Step": 2959, "Pretrain/Step Time": 8.546322086825967} +{"Pretrain/Learning Rate": 4.038157408372111e-05, "Pretrain/Loss": 2.0989842414855957, "Pretrain/Loss (Raw)": 2.1136085987091064, "Pretrain/Step": 2960, "Pretrain/Step Time": 8.540262300521135} +{"Pretrain/Learning Rate": 4.037488044362846e-05, "Pretrain/Loss": 2.097332239151001, "Pretrain/Loss (Raw)": 2.12296724319458, "Pretrain/Step": 2961, "Pretrain/Step Time": 8.545417327433825} +{"Pretrain/Learning Rate": 4.036818503043214e-05, "Pretrain/Loss": 2.0997190475463867, "Pretrain/Loss (Raw)": 2.163630723953247, "Pretrain/Step": 2962, "Pretrain/Step Time": 8.541025467216969} +{"Pretrain/Learning Rate": 4.0361487844904314e-05, "Pretrain/Loss": 2.101503610610962, "Pretrain/Loss (Raw)": 2.2038168907165527, "Pretrain/Step": 2963, "Pretrain/Step Time": 8.545822257176042} +{"Pretrain/Learning Rate": 4.035478888781732e-05, "Pretrain/Loss": 2.1002845764160156, "Pretrain/Loss (Raw)": 2.0862653255462646, "Pretrain/Step": 2964, "Pretrain/Step Time": 8.535937691107392} +{"Pretrain/Learning Rate": 4.034808815994372e-05, "Pretrain/Loss": 2.099924087524414, "Pretrain/Loss (Raw)": 2.2198126316070557, "Pretrain/Step": 2965, "Pretrain/Step Time": 8.536115163937211} +{"Pretrain/Learning Rate": 4.0341385662056265e-05, "Pretrain/Loss": 2.100409507751465, "Pretrain/Loss (Raw)": 2.1125388145446777, "Pretrain/Step": 2966, "Pretrain/Step Time": 8.537415191531181} +{"Pretrain/Learning Rate": 4.033468139492793e-05, "Pretrain/Loss": 2.1013236045837402, "Pretrain/Loss (Raw)": 2.1969738006591797, "Pretrain/Step": 2967, "Pretrain/Step Time": 8.537631759420037} +{"Pretrain/Learning Rate": 4.032797535933187e-05, "Pretrain/Loss": 2.1029257774353027, "Pretrain/Loss (Raw)": 2.073023557662964, "Pretrain/Step": 2968, "Pretrain/Step Time": 8.541191117838025} +{"Pretrain/Learning Rate": 4.032126755604147e-05, "Pretrain/Loss": 2.102029800415039, "Pretrain/Loss (Raw)": 2.0329506397247314, "Pretrain/Step": 2969, "Pretrain/Step Time": 8.54059075191617} +{"Pretrain/Learning Rate": 4.03145579858303e-05, "Pretrain/Loss": 2.1043713092803955, "Pretrain/Loss (Raw)": 2.22383451461792, "Pretrain/Step": 2970, "Pretrain/Step Time": 8.535786684602499} +{"Pretrain/Learning Rate": 4.0307846649472134e-05, "Pretrain/Loss": 2.1069514751434326, "Pretrain/Loss (Raw)": 2.44155216217041, "Pretrain/Step": 2971, "Pretrain/Step Time": 8.536352140828967} +{"Pretrain/Learning Rate": 4.030113354774096e-05, "Pretrain/Loss": 2.1049370765686035, "Pretrain/Loss (Raw)": 1.9659861326217651, "Pretrain/Step": 2972, "Pretrain/Step Time": 8.537205338478088} +{"Pretrain/Learning Rate": 4.029441868141096e-05, "Pretrain/Loss": 2.1024160385131836, "Pretrain/Loss (Raw)": 2.0323941707611084, "Pretrain/Step": 2973, "Pretrain/Step Time": 8.536636205390096} +{"Pretrain/Learning Rate": 4.0287702051256535e-05, "Pretrain/Loss": 2.100955009460449, "Pretrain/Loss (Raw)": 1.9840773344039917, "Pretrain/Step": 2974, "Pretrain/Step Time": 8.540738554671407} +{"Pretrain/Learning Rate": 4.0280983658052276e-05, "Pretrain/Loss": 2.098379135131836, "Pretrain/Loss (Raw)": 1.9932348728179932, "Pretrain/Step": 2975, "Pretrain/Step Time": 8.542587008327246} +{"Pretrain/Learning Rate": 4.0274263502572966e-05, "Pretrain/Loss": 2.098513603210449, "Pretrain/Loss (Raw)": 2.01820969581604, "Pretrain/Step": 2976, "Pretrain/Step Time": 8.53666684217751} +{"Pretrain/Learning Rate": 4.026754158559362e-05, "Pretrain/Loss": 2.09712290763855, "Pretrain/Loss (Raw)": 2.0603973865509033, "Pretrain/Step": 2977, "Pretrain/Step Time": 8.545997679233551} +{"Pretrain/Learning Rate": 4.026081790788943e-05, "Pretrain/Loss": 2.0964133739471436, "Pretrain/Loss (Raw)": 2.1418704986572266, "Pretrain/Step": 2978, "Pretrain/Step Time": 8.538721514865756} +{"Pretrain/Learning Rate": 4.025409247023581e-05, "Pretrain/Loss": 2.0968940258026123, "Pretrain/Loss (Raw)": 2.1886186599731445, "Pretrain/Step": 2979, "Pretrain/Step Time": 8.544819021597505} +{"Pretrain/Learning Rate": 4.0247365273408366e-05, "Pretrain/Loss": 2.096301555633545, "Pretrain/Loss (Raw)": 2.0828635692596436, "Pretrain/Step": 2980, "Pretrain/Step Time": 8.544301588088274} +{"Pretrain/Learning Rate": 4.024063631818291e-05, "Pretrain/Loss": 2.0961055755615234, "Pretrain/Loss (Raw)": 2.119497299194336, "Pretrain/Step": 2981, "Pretrain/Step Time": 8.546747470274568} +{"Pretrain/Learning Rate": 4.023390560533546e-05, "Pretrain/Loss": 2.0943922996520996, "Pretrain/Loss (Raw)": 2.0505266189575195, "Pretrain/Step": 2982, "Pretrain/Step Time": 8.540546478703618} +{"Pretrain/Learning Rate": 4.022717313564223e-05, "Pretrain/Loss": 2.094602584838867, "Pretrain/Loss (Raw)": 2.0717885494232178, "Pretrain/Step": 2983, "Pretrain/Step Time": 8.544600607827306} +{"Pretrain/Learning Rate": 4.0220438909879644e-05, "Pretrain/Loss": 2.0957274436950684, "Pretrain/Loss (Raw)": 2.175318717956543, "Pretrain/Step": 2984, "Pretrain/Step Time": 8.544626155868173} +{"Pretrain/Learning Rate": 4.0213702928824315e-05, "Pretrain/Loss": 2.0948832035064697, "Pretrain/Loss (Raw)": 1.8834912776947021, "Pretrain/Step": 2985, "Pretrain/Step Time": 8.543342411518097} +{"Pretrain/Learning Rate": 4.0206965193253075e-05, "Pretrain/Loss": 2.095855712890625, "Pretrain/Loss (Raw)": 2.2142703533172607, "Pretrain/Step": 2986, "Pretrain/Step Time": 8.541905542835593} +{"Pretrain/Learning Rate": 4.0200225703942964e-05, "Pretrain/Loss": 2.095198392868042, "Pretrain/Loss (Raw)": 1.837828278541565, "Pretrain/Step": 2987, "Pretrain/Step Time": 8.544516613706946} +{"Pretrain/Learning Rate": 4.0193484461671185e-05, "Pretrain/Loss": 2.094780206680298, "Pretrain/Loss (Raw)": 1.918349027633667, "Pretrain/Step": 2988, "Pretrain/Step Time": 8.53811590373516} +{"Pretrain/Learning Rate": 4.0186741467215186e-05, "Pretrain/Loss": 2.094402551651001, "Pretrain/Loss (Raw)": 1.902148723602295, "Pretrain/Step": 2989, "Pretrain/Step Time": 8.548203511163592} +{"Pretrain/Learning Rate": 4.017999672135261e-05, "Pretrain/Loss": 2.096714496612549, "Pretrain/Loss (Raw)": 2.0738024711608887, "Pretrain/Step": 2990, "Pretrain/Step Time": 8.54825890623033} +{"Pretrain/Learning Rate": 4.017325022486127e-05, "Pretrain/Loss": 2.09472393989563, "Pretrain/Loss (Raw)": 2.0396804809570312, "Pretrain/Step": 2991, "Pretrain/Step Time": 8.550611397251487} +{"Pretrain/Learning Rate": 4.0166501978519225e-05, "Pretrain/Loss": 2.09279727935791, "Pretrain/Loss (Raw)": 1.8643771409988403, "Pretrain/Step": 2992, "Pretrain/Step Time": 8.548177685588598} +{"Pretrain/Learning Rate": 4.015975198310469e-05, "Pretrain/Loss": 2.093287944793701, "Pretrain/Loss (Raw)": 2.1056034564971924, "Pretrain/Step": 2993, "Pretrain/Step Time": 8.549631686881185} +{"Pretrain/Learning Rate": 4.0153000239396136e-05, "Pretrain/Loss": 2.090876579284668, "Pretrain/Loss (Raw)": 1.9011038541793823, "Pretrain/Step": 2994, "Pretrain/Step Time": 8.54272374138236} +{"Pretrain/Learning Rate": 4.014624674817218e-05, "Pretrain/Loss": 2.0889101028442383, "Pretrain/Loss (Raw)": 1.9379692077636719, "Pretrain/Step": 2995, "Pretrain/Step Time": 8.548137636855245} +{"Pretrain/Learning Rate": 4.0139491510211684e-05, "Pretrain/Loss": 2.089578628540039, "Pretrain/Loss (Raw)": 2.1982810497283936, "Pretrain/Step": 2996, "Pretrain/Step Time": 8.537927573546767} +{"Pretrain/Learning Rate": 4.0132734526293685e-05, "Pretrain/Loss": 2.088926315307617, "Pretrain/Loss (Raw)": 2.0467638969421387, "Pretrain/Step": 2997, "Pretrain/Step Time": 8.53947195224464} +{"Pretrain/Learning Rate": 4.012597579719743e-05, "Pretrain/Loss": 2.089362144470215, "Pretrain/Loss (Raw)": 2.1981475353240967, "Pretrain/Step": 2998, "Pretrain/Step Time": 8.541169963777065} +{"Pretrain/Learning Rate": 4.011921532370238e-05, "Pretrain/Loss": 2.0877199172973633, "Pretrain/Loss (Raw)": 2.003641128540039, "Pretrain/Step": 2999, "Pretrain/Step Time": 8.539642157033086} +{"Pretrain/Learning Rate": 4.0112453106588164e-05, "Pretrain/Loss": 2.088794231414795, "Pretrain/Loss (Raw)": 2.20941162109375, "Pretrain/Step": 3000, "Pretrain/Step Time": 8.545734722167253} +{"Pretrain/Learning Rate": 4.010568914663465e-05, "Pretrain/Loss": 2.087392807006836, "Pretrain/Loss (Raw)": 2.042092800140381, "Pretrain/Step": 3001, "Pretrain/Step Time": 8.539032340049744} +{"Pretrain/Learning Rate": 4.0098923444621885e-05, "Pretrain/Loss": 2.0889081954956055, "Pretrain/Loss (Raw)": 2.312753677368164, "Pretrain/Step": 3002, "Pretrain/Step Time": 8.540312064811587} +{"Pretrain/Learning Rate": 4.0092156001330115e-05, "Pretrain/Loss": 2.089148998260498, "Pretrain/Loss (Raw)": 2.059002637863159, "Pretrain/Step": 3003, "Pretrain/Step Time": 8.542582714930177} +{"Pretrain/Learning Rate": 4.00853868175398e-05, "Pretrain/Loss": 2.0873517990112305, "Pretrain/Loss (Raw)": 2.0221927165985107, "Pretrain/Step": 3004, "Pretrain/Step Time": 8.538274681195617} +{"Pretrain/Learning Rate": 4.007861589403159e-05, "Pretrain/Loss": 2.088846206665039, "Pretrain/Loss (Raw)": 2.2194535732269287, "Pretrain/Step": 3005, "Pretrain/Step Time": 8.538993446156383} +{"Pretrain/Learning Rate": 4.0071843231586345e-05, "Pretrain/Loss": 2.0901939868927, "Pretrain/Loss (Raw)": 2.2270400524139404, "Pretrain/Step": 3006, "Pretrain/Step Time": 8.544042222201824} +{"Pretrain/Learning Rate": 4.006506883098512e-05, "Pretrain/Loss": 2.089942693710327, "Pretrain/Loss (Raw)": 2.1061060428619385, "Pretrain/Step": 3007, "Pretrain/Step Time": 8.543943006545305} +{"Pretrain/Learning Rate": 4.005829269300917e-05, "Pretrain/Loss": 2.092111110687256, "Pretrain/Loss (Raw)": 2.3786251544952393, "Pretrain/Step": 3008, "Pretrain/Step Time": 8.54023826122284} +{"Pretrain/Learning Rate": 4.005151481843994e-05, "Pretrain/Loss": 2.0909652709960938, "Pretrain/Loss (Raw)": 1.8087421655654907, "Pretrain/Step": 3009, "Pretrain/Step Time": 8.54811442643404} +{"Pretrain/Learning Rate": 4.0044735208059104e-05, "Pretrain/Loss": 2.090609550476074, "Pretrain/Loss (Raw)": 2.1515750885009766, "Pretrain/Step": 3010, "Pretrain/Step Time": 8.544349934905767} +{"Pretrain/Learning Rate": 4.0037953862648504e-05, "Pretrain/Loss": 2.088798761367798, "Pretrain/Loss (Raw)": 1.8745180368423462, "Pretrain/Step": 3011, "Pretrain/Step Time": 8.542266763746738} +{"Pretrain/Learning Rate": 4.003117078299021e-05, "Pretrain/Loss": 2.090005397796631, "Pretrain/Loss (Raw)": 2.0328316688537598, "Pretrain/Step": 3012, "Pretrain/Step Time": 8.54881932772696} +{"Pretrain/Learning Rate": 4.002438596986647e-05, "Pretrain/Loss": 2.089217185974121, "Pretrain/Loss (Raw)": 1.9263283014297485, "Pretrain/Step": 3013, "Pretrain/Step Time": 8.543487032875419} +{"Pretrain/Learning Rate": 4.001759942405974e-05, "Pretrain/Loss": 2.0908751487731934, "Pretrain/Loss (Raw)": 2.3059284687042236, "Pretrain/Step": 3014, "Pretrain/Step Time": 8.546886082738638} +{"Pretrain/Learning Rate": 4.001081114635268e-05, "Pretrain/Loss": 2.0930304527282715, "Pretrain/Loss (Raw)": 2.339601993560791, "Pretrain/Step": 3015, "Pretrain/Step Time": 8.553307006135583} +{"Pretrain/Learning Rate": 4.000402113752815e-05, "Pretrain/Loss": 2.095451831817627, "Pretrain/Loss (Raw)": 2.2948708534240723, "Pretrain/Step": 3016, "Pretrain/Step Time": 8.550574017688632} +{"Pretrain/Learning Rate": 3.9997229398369194e-05, "Pretrain/Loss": 2.096555233001709, "Pretrain/Loss (Raw)": 2.1667139530181885, "Pretrain/Step": 3017, "Pretrain/Step Time": 8.556059755384922} +{"Pretrain/Learning Rate": 3.999043592965908e-05, "Pretrain/Loss": 2.09483003616333, "Pretrain/Loss (Raw)": 1.9461688995361328, "Pretrain/Step": 3018, "Pretrain/Step Time": 8.555110501125455} +{"Pretrain/Learning Rate": 3.998364073218126e-05, "Pretrain/Loss": 2.0943541526794434, "Pretrain/Loss (Raw)": 2.1793599128723145, "Pretrain/Step": 3019, "Pretrain/Step Time": 8.54743160866201} +{"Pretrain/Learning Rate": 3.997684380671938e-05, "Pretrain/Loss": 2.0959901809692383, "Pretrain/Loss (Raw)": 2.0749809741973877, "Pretrain/Step": 3020, "Pretrain/Step Time": 8.553745543584228} +{"Pretrain/Learning Rate": 3.9970045154057304e-05, "Pretrain/Loss": 2.094888210296631, "Pretrain/Loss (Raw)": 1.8863186836242676, "Pretrain/Step": 3021, "Pretrain/Step Time": 8.55338286422193} +{"Pretrain/Learning Rate": 3.996324477497907e-05, "Pretrain/Loss": 2.091986656188965, "Pretrain/Loss (Raw)": 1.9575873613357544, "Pretrain/Step": 3022, "Pretrain/Step Time": 8.553869970142841} +{"Pretrain/Learning Rate": 3.9956442670268946e-05, "Pretrain/Loss": 2.0932252407073975, "Pretrain/Loss (Raw)": 2.3085923194885254, "Pretrain/Step": 3023, "Pretrain/Step Time": 8.554095171391964} +{"Pretrain/Learning Rate": 3.9949638840711376e-05, "Pretrain/Loss": 2.093440055847168, "Pretrain/Loss (Raw)": 2.125213623046875, "Pretrain/Step": 3024, "Pretrain/Step Time": 8.55620296113193} +{"Pretrain/Learning Rate": 3.9942833287091006e-05, "Pretrain/Loss": 2.0950136184692383, "Pretrain/Loss (Raw)": 2.267852783203125, "Pretrain/Step": 3025, "Pretrain/Step Time": 8.560511847957969} +{"Pretrain/Learning Rate": 3.9936026010192696e-05, "Pretrain/Loss": 2.095090389251709, "Pretrain/Loss (Raw)": 2.1283650398254395, "Pretrain/Step": 3026, "Pretrain/Step Time": 8.560842551290989} +{"Pretrain/Learning Rate": 3.9929217010801476e-05, "Pretrain/Loss": 2.092569351196289, "Pretrain/Loss (Raw)": 2.031926155090332, "Pretrain/Step": 3027, "Pretrain/Step Time": 8.550530293956399} +{"Pretrain/Learning Rate": 3.992240628970261e-05, "Pretrain/Loss": 2.0933470726013184, "Pretrain/Loss (Raw)": 2.043358325958252, "Pretrain/Step": 3028, "Pretrain/Step Time": 8.552365126088262} +{"Pretrain/Learning Rate": 3.991559384768153e-05, "Pretrain/Loss": 2.0944390296936035, "Pretrain/Loss (Raw)": 2.0989317893981934, "Pretrain/Step": 3029, "Pretrain/Step Time": 8.546660162508488} +{"Pretrain/Learning Rate": 3.9908779685523885e-05, "Pretrain/Loss": 2.096392869949341, "Pretrain/Loss (Raw)": 2.176111936569214, "Pretrain/Step": 3030, "Pretrain/Step Time": 8.557577848434448} +{"Pretrain/Learning Rate": 3.9901963804015516e-05, "Pretrain/Loss": 2.097090721130371, "Pretrain/Loss (Raw)": 2.228161573410034, "Pretrain/Step": 3031, "Pretrain/Step Time": 8.549105025827885} +{"Pretrain/Learning Rate": 3.9895146203942457e-05, "Pretrain/Loss": 2.0988881587982178, "Pretrain/Loss (Raw)": 2.2315454483032227, "Pretrain/Step": 3032, "Pretrain/Step Time": 8.54768343269825} +{"Pretrain/Learning Rate": 3.988832688609095e-05, "Pretrain/Loss": 2.098346471786499, "Pretrain/Loss (Raw)": 2.2384018898010254, "Pretrain/Step": 3033, "Pretrain/Step Time": 8.549185620620847} +{"Pretrain/Learning Rate": 3.988150585124743e-05, "Pretrain/Loss": 2.0979068279266357, "Pretrain/Loss (Raw)": 2.2573294639587402, "Pretrain/Step": 3034, "Pretrain/Step Time": 8.549970610067248} +{"Pretrain/Learning Rate": 3.987468310019853e-05, "Pretrain/Loss": 2.0978002548217773, "Pretrain/Loss (Raw)": 2.0576083660125732, "Pretrain/Step": 3035, "Pretrain/Step Time": 8.548307565972209} +{"Pretrain/Learning Rate": 3.986785863373109e-05, "Pretrain/Loss": 2.0978446006774902, "Pretrain/Loss (Raw)": 2.0278306007385254, "Pretrain/Step": 3036, "Pretrain/Step Time": 8.555073587223887} +{"Pretrain/Learning Rate": 3.9861032452632124e-05, "Pretrain/Loss": 2.1005094051361084, "Pretrain/Loss (Raw)": 2.393205404281616, "Pretrain/Step": 3037, "Pretrain/Step Time": 8.552133359014988} +{"Pretrain/Learning Rate": 3.985420455768887e-05, "Pretrain/Loss": 2.1014397144317627, "Pretrain/Loss (Raw)": 2.118129253387451, "Pretrain/Step": 3038, "Pretrain/Step Time": 8.555203976109624} +{"Pretrain/Learning Rate": 3.9847374949688756e-05, "Pretrain/Loss": 2.100935459136963, "Pretrain/Loss (Raw)": 2.059823513031006, "Pretrain/Step": 3039, "Pretrain/Step Time": 8.545489622280002} +{"Pretrain/Learning Rate": 3.98405436294194e-05, "Pretrain/Loss": 2.100766658782959, "Pretrain/Loss (Raw)": 2.002673864364624, "Pretrain/Step": 3040, "Pretrain/Step Time": 8.552325071766973} +{"Pretrain/Learning Rate": 3.9833710597668614e-05, "Pretrain/Loss": 2.102372169494629, "Pretrain/Loss (Raw)": 2.2888317108154297, "Pretrain/Step": 3041, "Pretrain/Step Time": 8.550759704783559} +{"Pretrain/Learning Rate": 3.9826875855224435e-05, "Pretrain/Loss": 2.102764129638672, "Pretrain/Loss (Raw)": 2.1165521144866943, "Pretrain/Step": 3042, "Pretrain/Step Time": 8.5598353035748} +{"Pretrain/Learning Rate": 3.9820039402875055e-05, "Pretrain/Loss": 2.1039934158325195, "Pretrain/Loss (Raw)": 2.15557599067688, "Pretrain/Step": 3043, "Pretrain/Step Time": 8.55619571171701} +{"Pretrain/Learning Rate": 3.98132012414089e-05, "Pretrain/Loss": 2.103487730026245, "Pretrain/Loss (Raw)": 1.976996898651123, "Pretrain/Step": 3044, "Pretrain/Step Time": 8.553159018978477} +{"Pretrain/Learning Rate": 3.9806361371614576e-05, "Pretrain/Loss": 2.104116439819336, "Pretrain/Loss (Raw)": 2.1340081691741943, "Pretrain/Step": 3045, "Pretrain/Step Time": 8.549646101891994} +{"Pretrain/Learning Rate": 3.979951979428089e-05, "Pretrain/Loss": 2.105465888977051, "Pretrain/Loss (Raw)": 2.121553421020508, "Pretrain/Step": 3046, "Pretrain/Step Time": 8.556658364832401} +{"Pretrain/Learning Rate": 3.9792676510196835e-05, "Pretrain/Loss": 2.1052780151367188, "Pretrain/Loss (Raw)": 2.1403377056121826, "Pretrain/Step": 3047, "Pretrain/Step Time": 8.557691534981132} +{"Pretrain/Learning Rate": 3.978583152015163e-05, "Pretrain/Loss": 2.105182409286499, "Pretrain/Loss (Raw)": 2.1200244426727295, "Pretrain/Step": 3048, "Pretrain/Step Time": 8.558474557474256} +{"Pretrain/Learning Rate": 3.977898482493466e-05, "Pretrain/Loss": 2.1061289310455322, "Pretrain/Loss (Raw)": 2.1856529712677, "Pretrain/Step": 3049, "Pretrain/Step Time": 8.544609628617764} +{"Pretrain/Learning Rate": 3.977213642533552e-05, "Pretrain/Loss": 2.104642868041992, "Pretrain/Loss (Raw)": 1.9567537307739258, "Pretrain/Step": 3050, "Pretrain/Step Time": 8.548116689547896} +{"Pretrain/Learning Rate": 3.976528632214399e-05, "Pretrain/Loss": 2.1051619052886963, "Pretrain/Loss (Raw)": 2.1055991649627686, "Pretrain/Step": 3051, "Pretrain/Step Time": 8.546154135838151} +{"Pretrain/Learning Rate": 3.975843451615007e-05, "Pretrain/Loss": 2.103879690170288, "Pretrain/Loss (Raw)": 1.9258010387420654, "Pretrain/Step": 3052, "Pretrain/Step Time": 8.545744145289063} +{"Pretrain/Learning Rate": 3.9751581008143946e-05, "Pretrain/Loss": 2.1009159088134766, "Pretrain/Loss (Raw)": 1.876749038696289, "Pretrain/Step": 3053, "Pretrain/Step Time": 8.548114793375134} +{"Pretrain/Learning Rate": 3.9744725798915974e-05, "Pretrain/Loss": 2.1033124923706055, "Pretrain/Loss (Raw)": 2.0345401763916016, "Pretrain/Step": 3054, "Pretrain/Step Time": 8.55001638457179} +{"Pretrain/Learning Rate": 3.973786888925675e-05, "Pretrain/Loss": 2.1012606620788574, "Pretrain/Loss (Raw)": 2.0875089168548584, "Pretrain/Step": 3055, "Pretrain/Step Time": 8.542688392102718} +{"Pretrain/Learning Rate": 3.973101027995704e-05, "Pretrain/Loss": 2.1000638008117676, "Pretrain/Loss (Raw)": 2.0619895458221436, "Pretrain/Step": 3056, "Pretrain/Step Time": 8.54558864608407} +{"Pretrain/Learning Rate": 3.9724149971807814e-05, "Pretrain/Loss": 2.0965325832366943, "Pretrain/Loss (Raw)": 2.068507194519043, "Pretrain/Step": 3057, "Pretrain/Step Time": 8.541545990854502} +{"Pretrain/Learning Rate": 3.9717287965600224e-05, "Pretrain/Loss": 2.0970029830932617, "Pretrain/Loss (Raw)": 2.0096535682678223, "Pretrain/Step": 3058, "Pretrain/Step Time": 8.543383348733187} +{"Pretrain/Learning Rate": 3.971042426212563e-05, "Pretrain/Loss": 2.097053050994873, "Pretrain/Loss (Raw)": 2.249572515487671, "Pretrain/Step": 3059, "Pretrain/Step Time": 8.54286035336554} +{"Pretrain/Learning Rate": 3.970355886217561e-05, "Pretrain/Loss": 2.097443103790283, "Pretrain/Loss (Raw)": 2.2002882957458496, "Pretrain/Step": 3060, "Pretrain/Step Time": 8.548036126419902} +{"Pretrain/Learning Rate": 3.9696691766541884e-05, "Pretrain/Loss": 2.0972836017608643, "Pretrain/Loss (Raw)": 1.9726711511611938, "Pretrain/Step": 3061, "Pretrain/Step Time": 8.539701180532575} +{"Pretrain/Learning Rate": 3.968982297601641e-05, "Pretrain/Loss": 2.0953617095947266, "Pretrain/Loss (Raw)": 1.9347481727600098, "Pretrain/Step": 3062, "Pretrain/Step Time": 8.542586522176862} +{"Pretrain/Learning Rate": 3.9682952491391326e-05, "Pretrain/Loss": 2.0959856510162354, "Pretrain/Loss (Raw)": 2.0743021965026855, "Pretrain/Step": 3063, "Pretrain/Step Time": 8.540321407839656} +{"Pretrain/Learning Rate": 3.967608031345898e-05, "Pretrain/Loss": 2.095730781555176, "Pretrain/Loss (Raw)": 2.162609100341797, "Pretrain/Step": 3064, "Pretrain/Step Time": 8.540320113301277} +{"Pretrain/Learning Rate": 3.96692064430119e-05, "Pretrain/Loss": 2.093186140060425, "Pretrain/Loss (Raw)": 2.0077595710754395, "Pretrain/Step": 3065, "Pretrain/Step Time": 8.541859393939376} +{"Pretrain/Learning Rate": 3.96623308808428e-05, "Pretrain/Loss": 2.0928547382354736, "Pretrain/Loss (Raw)": 2.004335880279541, "Pretrain/Step": 3066, "Pretrain/Step Time": 8.550011502578855} +{"Pretrain/Learning Rate": 3.965545362774461e-05, "Pretrain/Loss": 2.093341827392578, "Pretrain/Loss (Raw)": 2.034572124481201, "Pretrain/Step": 3067, "Pretrain/Step Time": 8.543789736926556} +{"Pretrain/Learning Rate": 3.964857468451045e-05, "Pretrain/Loss": 2.097297191619873, "Pretrain/Loss (Raw)": 2.4641027450561523, "Pretrain/Step": 3068, "Pretrain/Step Time": 8.536292685195804} +{"Pretrain/Learning Rate": 3.9641694051933644e-05, "Pretrain/Loss": 2.095399856567383, "Pretrain/Loss (Raw)": 2.3007595539093018, "Pretrain/Step": 3069, "Pretrain/Step Time": 8.536535443738103} +{"Pretrain/Learning Rate": 3.963481173080767e-05, "Pretrain/Loss": 2.0940911769866943, "Pretrain/Loss (Raw)": 1.9790009260177612, "Pretrain/Step": 3070, "Pretrain/Step Time": 8.538530537858605} +{"Pretrain/Learning Rate": 3.962792772192626e-05, "Pretrain/Loss": 2.095428466796875, "Pretrain/Loss (Raw)": 2.3301305770874023, "Pretrain/Step": 3071, "Pretrain/Step Time": 8.537091432139277} +{"Pretrain/Learning Rate": 3.962104202608329e-05, "Pretrain/Loss": 2.095839023590088, "Pretrain/Loss (Raw)": 2.108320713043213, "Pretrain/Step": 3072, "Pretrain/Step Time": 8.539022060111165} +{"Pretrain/Learning Rate": 3.9614154644072854e-05, "Pretrain/Loss": 2.0982327461242676, "Pretrain/Loss (Raw)": 2.037714958190918, "Pretrain/Step": 3073, "Pretrain/Step Time": 8.527482338249683} +{"Pretrain/Learning Rate": 3.960726557668924e-05, "Pretrain/Loss": 2.095613479614258, "Pretrain/Loss (Raw)": 2.1422200202941895, "Pretrain/Step": 3074, "Pretrain/Step Time": 8.531734568998218} +{"Pretrain/Learning Rate": 3.960037482472694e-05, "Pretrain/Loss": 2.0967726707458496, "Pretrain/Loss (Raw)": 2.0736160278320312, "Pretrain/Step": 3075, "Pretrain/Step Time": 8.531640574336052} +{"Pretrain/Learning Rate": 3.95934823889806e-05, "Pretrain/Loss": 2.0983898639678955, "Pretrain/Loss (Raw)": 2.1866374015808105, "Pretrain/Step": 3076, "Pretrain/Step Time": 8.535263804718852} +{"Pretrain/Learning Rate": 3.9586588270245115e-05, "Pretrain/Loss": 2.098864793777466, "Pretrain/Loss (Raw)": 2.1108548641204834, "Pretrain/Step": 3077, "Pretrain/Step Time": 8.536373438313603} +{"Pretrain/Learning Rate": 3.957969246931553e-05, "Pretrain/Loss": 2.1000895500183105, "Pretrain/Loss (Raw)": 2.267913579940796, "Pretrain/Step": 3078, "Pretrain/Step Time": 8.5369366183877} +{"Pretrain/Learning Rate": 3.95727949869871e-05, "Pretrain/Loss": 2.0997514724731445, "Pretrain/Loss (Raw)": 1.8355791568756104, "Pretrain/Step": 3079, "Pretrain/Step Time": 8.528657406568527} +{"Pretrain/Learning Rate": 3.95658958240553e-05, "Pretrain/Loss": 2.1017775535583496, "Pretrain/Loss (Raw)": 2.056093454360962, "Pretrain/Step": 3080, "Pretrain/Step Time": 8.531170144677162} +{"Pretrain/Learning Rate": 3.955899498131575e-05, "Pretrain/Loss": 2.1023380756378174, "Pretrain/Loss (Raw)": 2.053018093109131, "Pretrain/Step": 3081, "Pretrain/Step Time": 8.531526444479823} +{"Pretrain/Learning Rate": 3.9552092459564294e-05, "Pretrain/Loss": 2.1017746925354004, "Pretrain/Loss (Raw)": 2.1558985710144043, "Pretrain/Step": 3082, "Pretrain/Step Time": 8.528704818338156} +{"Pretrain/Learning Rate": 3.9545188259596966e-05, "Pretrain/Loss": 2.101332187652588, "Pretrain/Loss (Raw)": 1.955436110496521, "Pretrain/Step": 3083, "Pretrain/Step Time": 8.528146667405963} +{"Pretrain/Learning Rate": 3.953828238220998e-05, "Pretrain/Loss": 2.1007490158081055, "Pretrain/Loss (Raw)": 2.0833468437194824, "Pretrain/Step": 3084, "Pretrain/Step Time": 8.53397249802947} +{"Pretrain/Learning Rate": 3.9531374828199774e-05, "Pretrain/Loss": 2.1000802516937256, "Pretrain/Loss (Raw)": 2.0679194927215576, "Pretrain/Step": 3085, "Pretrain/Step Time": 8.52937208674848} +{"Pretrain/Learning Rate": 3.952446559836295e-05, "Pretrain/Loss": 2.1012301445007324, "Pretrain/Loss (Raw)": 2.299344778060913, "Pretrain/Step": 3086, "Pretrain/Step Time": 8.537352379411459} +{"Pretrain/Learning Rate": 3.95175546934963e-05, "Pretrain/Loss": 2.098881721496582, "Pretrain/Loss (Raw)": 1.8229693174362183, "Pretrain/Step": 3087, "Pretrain/Step Time": 8.540105402469635} +{"Pretrain/Learning Rate": 3.951064211439684e-05, "Pretrain/Loss": 2.098407506942749, "Pretrain/Loss (Raw)": 2.052910566329956, "Pretrain/Step": 3088, "Pretrain/Step Time": 8.543241938576102} +{"Pretrain/Learning Rate": 3.9503727861861756e-05, "Pretrain/Loss": 2.0987353324890137, "Pretrain/Loss (Raw)": 2.1649510860443115, "Pretrain/Step": 3089, "Pretrain/Step Time": 8.538867009803653} +{"Pretrain/Learning Rate": 3.9496811936688425e-05, "Pretrain/Loss": 2.100553035736084, "Pretrain/Loss (Raw)": 2.396287441253662, "Pretrain/Step": 3090, "Pretrain/Step Time": 8.540994485840201} +{"Pretrain/Learning Rate": 3.9489894339674435e-05, "Pretrain/Loss": 2.0992870330810547, "Pretrain/Loss (Raw)": 2.04177188873291, "Pretrain/Step": 3091, "Pretrain/Step Time": 8.535025678575039} +{"Pretrain/Learning Rate": 3.948297507161756e-05, "Pretrain/Loss": 2.0994009971618652, "Pretrain/Loss (Raw)": 2.1008598804473877, "Pretrain/Step": 3092, "Pretrain/Step Time": 8.53351690620184} +{"Pretrain/Learning Rate": 3.947605413331574e-05, "Pretrain/Loss": 2.0988516807556152, "Pretrain/Loss (Raw)": 2.149458646774292, "Pretrain/Step": 3093, "Pretrain/Step Time": 8.53538578003645} +{"Pretrain/Learning Rate": 3.946913152556715e-05, "Pretrain/Loss": 2.0984201431274414, "Pretrain/Loss (Raw)": 2.0573325157165527, "Pretrain/Step": 3094, "Pretrain/Step Time": 8.54117732681334} +{"Pretrain/Learning Rate": 3.946220724917013e-05, "Pretrain/Loss": 2.097744941711426, "Pretrain/Loss (Raw)": 2.1105523109436035, "Pretrain/Step": 3095, "Pretrain/Step Time": 8.541050802916288} +{"Pretrain/Learning Rate": 3.945528130492322e-05, "Pretrain/Loss": 2.0972442626953125, "Pretrain/Loss (Raw)": 2.008925676345825, "Pretrain/Step": 3096, "Pretrain/Step Time": 8.545479156076908} +{"Pretrain/Learning Rate": 3.944835369362516e-05, "Pretrain/Loss": 2.0973997116088867, "Pretrain/Loss (Raw)": 2.052842855453491, "Pretrain/Step": 3097, "Pretrain/Step Time": 8.545305289328098} +{"Pretrain/Learning Rate": 3.9441424416074866e-05, "Pretrain/Loss": 2.0960757732391357, "Pretrain/Loss (Raw)": 2.054375171661377, "Pretrain/Step": 3098, "Pretrain/Step Time": 8.541568264365196} +{"Pretrain/Learning Rate": 3.9434493473071456e-05, "Pretrain/Loss": 2.095353126525879, "Pretrain/Loss (Raw)": 2.3490636348724365, "Pretrain/Step": 3099, "Pretrain/Step Time": 8.54250568524003} +{"Pretrain/Learning Rate": 3.9427560865414246e-05, "Pretrain/Loss": 2.095644235610962, "Pretrain/Loss (Raw)": 2.003251791000366, "Pretrain/Step": 3100, "Pretrain/Step Time": 8.54668664932251} +{"Pretrain/Learning Rate": 3.942062659390273e-05, "Pretrain/Loss": 2.0961804389953613, "Pretrain/Loss (Raw)": 2.101013422012329, "Pretrain/Step": 3101, "Pretrain/Step Time": 8.545141188427806} +{"Pretrain/Learning Rate": 3.94136906593366e-05, "Pretrain/Loss": 2.0983378887176514, "Pretrain/Loss (Raw)": 2.260237455368042, "Pretrain/Step": 3102, "Pretrain/Step Time": 8.548862719908357} +{"Pretrain/Learning Rate": 3.940675306251574e-05, "Pretrain/Loss": 2.098874807357788, "Pretrain/Loss (Raw)": 2.061958074569702, "Pretrain/Step": 3103, "Pretrain/Step Time": 8.54308969527483} +{"Pretrain/Learning Rate": 3.939981380424024e-05, "Pretrain/Loss": 2.100325584411621, "Pretrain/Loss (Raw)": 2.203911781311035, "Pretrain/Step": 3104, "Pretrain/Step Time": 8.549444317817688} +{"Pretrain/Learning Rate": 3.939287288531035e-05, "Pretrain/Loss": 2.10056209564209, "Pretrain/Loss (Raw)": 2.0906729698181152, "Pretrain/Step": 3105, "Pretrain/Step Time": 8.545611524954438} +{"Pretrain/Learning Rate": 3.938593030652654e-05, "Pretrain/Loss": 2.1019601821899414, "Pretrain/Loss (Raw)": 2.3208231925964355, "Pretrain/Step": 3106, "Pretrain/Step Time": 8.54843326471746} +{"Pretrain/Learning Rate": 3.937898606868946e-05, "Pretrain/Loss": 2.098092555999756, "Pretrain/Loss (Raw)": 1.6935625076293945, "Pretrain/Step": 3107, "Pretrain/Step Time": 8.547242829576135} +{"Pretrain/Learning Rate": 3.9372040172599956e-05, "Pretrain/Loss": 2.0964298248291016, "Pretrain/Loss (Raw)": 1.870012640953064, "Pretrain/Step": 3108, "Pretrain/Step Time": 8.551687663421035} +{"Pretrain/Learning Rate": 3.936509261905905e-05, "Pretrain/Loss": 2.097377061843872, "Pretrain/Loss (Raw)": 2.2407450675964355, "Pretrain/Step": 3109, "Pretrain/Step Time": 8.550927175208926} +{"Pretrain/Learning Rate": 3.935814340886797e-05, "Pretrain/Loss": 2.097935914993286, "Pretrain/Loss (Raw)": 2.122066020965576, "Pretrain/Step": 3110, "Pretrain/Step Time": 8.556274246424437} +{"Pretrain/Learning Rate": 3.935119254282814e-05, "Pretrain/Loss": 2.097470998764038, "Pretrain/Loss (Raw)": 2.0122861862182617, "Pretrain/Step": 3111, "Pretrain/Step Time": 8.554824410006404} +{"Pretrain/Learning Rate": 3.934424002174115e-05, "Pretrain/Loss": 2.0971829891204834, "Pretrain/Loss (Raw)": 2.1384594440460205, "Pretrain/Step": 3112, "Pretrain/Step Time": 8.552668975666165} +{"Pretrain/Learning Rate": 3.9337285846408826e-05, "Pretrain/Loss": 2.0986804962158203, "Pretrain/Loss (Raw)": 2.0751612186431885, "Pretrain/Step": 3113, "Pretrain/Step Time": 8.55374538898468} +{"Pretrain/Learning Rate": 3.9330330017633126e-05, "Pretrain/Loss": 2.0984349250793457, "Pretrain/Loss (Raw)": 2.182859182357788, "Pretrain/Step": 3114, "Pretrain/Step Time": 8.554251303896308} +{"Pretrain/Learning Rate": 3.932337253621624e-05, "Pretrain/Loss": 2.1028618812561035, "Pretrain/Loss (Raw)": 2.404438018798828, "Pretrain/Step": 3115, "Pretrain/Step Time": 8.558506656438112} +{"Pretrain/Learning Rate": 3.9316413402960553e-05, "Pretrain/Loss": 2.102764129638672, "Pretrain/Loss (Raw)": 1.9058703184127808, "Pretrain/Step": 3116, "Pretrain/Step Time": 8.565349524840713} +{"Pretrain/Learning Rate": 3.93094526186686e-05, "Pretrain/Loss": 2.103534698486328, "Pretrain/Loss (Raw)": 2.000762462615967, "Pretrain/Step": 3117, "Pretrain/Step Time": 8.55533549003303} +{"Pretrain/Learning Rate": 3.930249018414315e-05, "Pretrain/Loss": 2.104191303253174, "Pretrain/Loss (Raw)": 2.1578733921051025, "Pretrain/Step": 3118, "Pretrain/Step Time": 8.555521422997117} +{"Pretrain/Learning Rate": 3.9295526100187126e-05, "Pretrain/Loss": 2.1065244674682617, "Pretrain/Loss (Raw)": 2.338329792022705, "Pretrain/Step": 3119, "Pretrain/Step Time": 8.55526339635253} +{"Pretrain/Learning Rate": 3.928856036760368e-05, "Pretrain/Loss": 2.111471652984619, "Pretrain/Loss (Raw)": 2.49761700630188, "Pretrain/Step": 3120, "Pretrain/Step Time": 8.556927500292659} +{"Pretrain/Learning Rate": 3.9281592987196115e-05, "Pretrain/Loss": 2.112992286682129, "Pretrain/Loss (Raw)": 2.300236701965332, "Pretrain/Step": 3121, "Pretrain/Step Time": 8.561071671545506} +{"Pretrain/Learning Rate": 3.9274623959767945e-05, "Pretrain/Loss": 2.1136457920074463, "Pretrain/Loss (Raw)": 1.9847509860992432, "Pretrain/Step": 3122, "Pretrain/Step Time": 8.562166672199965} +{"Pretrain/Learning Rate": 3.9267653286122886e-05, "Pretrain/Loss": 2.114501953125, "Pretrain/Loss (Raw)": 2.047544240951538, "Pretrain/Step": 3123, "Pretrain/Step Time": 8.55633963830769} +{"Pretrain/Learning Rate": 3.9260680967064814e-05, "Pretrain/Loss": 2.111053228378296, "Pretrain/Loss (Raw)": 1.7568397521972656, "Pretrain/Step": 3124, "Pretrain/Step Time": 8.557675551623106} +{"Pretrain/Learning Rate": 3.9253707003397814e-05, "Pretrain/Loss": 2.111107587814331, "Pretrain/Loss (Raw)": 2.0537161827087402, "Pretrain/Step": 3125, "Pretrain/Step Time": 8.556205604225397} +{"Pretrain/Learning Rate": 3.924673139592616e-05, "Pretrain/Loss": 2.109516143798828, "Pretrain/Loss (Raw)": 1.994463324546814, "Pretrain/Step": 3126, "Pretrain/Step Time": 8.555558817461133} +{"Pretrain/Learning Rate": 3.9239754145454304e-05, "Pretrain/Loss": 2.110262155532837, "Pretrain/Loss (Raw)": 2.0991103649139404, "Pretrain/Step": 3127, "Pretrain/Step Time": 8.560081236064434} +{"Pretrain/Learning Rate": 3.92327752527869e-05, "Pretrain/Loss": 2.110158920288086, "Pretrain/Loss (Raw)": 2.1962015628814697, "Pretrain/Step": 3128, "Pretrain/Step Time": 8.557403208687901} +{"Pretrain/Learning Rate": 3.922579471872879e-05, "Pretrain/Loss": 2.110487699508667, "Pretrain/Loss (Raw)": 2.084174871444702, "Pretrain/Step": 3129, "Pretrain/Step Time": 8.558265065774322} +{"Pretrain/Learning Rate": 3.9218812544085004e-05, "Pretrain/Loss": 2.1088333129882812, "Pretrain/Loss (Raw)": 2.1010022163391113, "Pretrain/Step": 3130, "Pretrain/Step Time": 8.556390758603811} +{"Pretrain/Learning Rate": 3.921182872966075e-05, "Pretrain/Loss": 2.10914945602417, "Pretrain/Loss (Raw)": 2.099461555480957, "Pretrain/Step": 3131, "Pretrain/Step Time": 8.556279312819242} +{"Pretrain/Learning Rate": 3.920484327626144e-05, "Pretrain/Loss": 2.110067844390869, "Pretrain/Loss (Raw)": 2.139763832092285, "Pretrain/Step": 3132, "Pretrain/Step Time": 8.56387827731669} +{"Pretrain/Learning Rate": 3.919785618469266e-05, "Pretrain/Loss": 2.1089155673980713, "Pretrain/Loss (Raw)": 2.0719408988952637, "Pretrain/Step": 3133, "Pretrain/Step Time": 8.560993891209364} +{"Pretrain/Learning Rate": 3.9190867455760213e-05, "Pretrain/Loss": 2.1054916381835938, "Pretrain/Loss (Raw)": 1.7888050079345703, "Pretrain/Step": 3134, "Pretrain/Step Time": 8.556176913902164} +{"Pretrain/Learning Rate": 3.918387709027005e-05, "Pretrain/Loss": 2.105855941772461, "Pretrain/Loss (Raw)": 2.152740716934204, "Pretrain/Step": 3135, "Pretrain/Step Time": 8.553521936759353} +{"Pretrain/Learning Rate": 3.917688508902835e-05, "Pretrain/Loss": 2.1046018600463867, "Pretrain/Loss (Raw)": 2.2180581092834473, "Pretrain/Step": 3136, "Pretrain/Step Time": 8.552351079881191} +{"Pretrain/Learning Rate": 3.916989145284146e-05, "Pretrain/Loss": 2.108165740966797, "Pretrain/Loss (Raw)": 2.2649152278900146, "Pretrain/Step": 3137, "Pretrain/Step Time": 8.546135880053043} +{"Pretrain/Learning Rate": 3.9162896182515915e-05, "Pretrain/Loss": 2.107848644256592, "Pretrain/Loss (Raw)": 2.1110355854034424, "Pretrain/Step": 3138, "Pretrain/Step Time": 8.55213825404644} +{"Pretrain/Learning Rate": 3.9155899278858445e-05, "Pretrain/Loss": 2.1095056533813477, "Pretrain/Loss (Raw)": 2.0865676403045654, "Pretrain/Step": 3139, "Pretrain/Step Time": 8.555640203878284} +{"Pretrain/Learning Rate": 3.914890074267597e-05, "Pretrain/Loss": 2.1100072860717773, "Pretrain/Loss (Raw)": 2.09704852104187, "Pretrain/Step": 3140, "Pretrain/Step Time": 8.5551797170192} +{"Pretrain/Learning Rate": 3.914190057477558e-05, "Pretrain/Loss": 2.110924243927002, "Pretrain/Loss (Raw)": 2.043712615966797, "Pretrain/Step": 3141, "Pretrain/Step Time": 8.554305771365762} +{"Pretrain/Learning Rate": 3.913489877596458e-05, "Pretrain/Loss": 2.109142780303955, "Pretrain/Loss (Raw)": 2.0779006481170654, "Pretrain/Step": 3142, "Pretrain/Step Time": 8.54843232408166} +{"Pretrain/Learning Rate": 3.912789534705045e-05, "Pretrain/Loss": 2.1073098182678223, "Pretrain/Loss (Raw)": 2.104997396469116, "Pretrain/Step": 3143, "Pretrain/Step Time": 8.542308617383242} +{"Pretrain/Learning Rate": 3.912089028884085e-05, "Pretrain/Loss": 2.104861259460449, "Pretrain/Loss (Raw)": 1.9814376831054688, "Pretrain/Step": 3144, "Pretrain/Step Time": 8.546742463484406} +{"Pretrain/Learning Rate": 3.9113883602143645e-05, "Pretrain/Loss": 2.103144645690918, "Pretrain/Loss (Raw)": 1.9469937086105347, "Pretrain/Step": 3145, "Pretrain/Step Time": 8.55423871986568} +{"Pretrain/Learning Rate": 3.910687528776688e-05, "Pretrain/Loss": 2.1042709350585938, "Pretrain/Loss (Raw)": 2.090327739715576, "Pretrain/Step": 3146, "Pretrain/Step Time": 8.549127196893096} +{"Pretrain/Learning Rate": 3.9099865346518786e-05, "Pretrain/Loss": 2.105935573577881, "Pretrain/Loss (Raw)": 2.3924400806427, "Pretrain/Step": 3147, "Pretrain/Step Time": 8.549716686829925} +{"Pretrain/Learning Rate": 3.909285377920777e-05, "Pretrain/Loss": 2.105414390563965, "Pretrain/Loss (Raw)": 2.0082788467407227, "Pretrain/Step": 3148, "Pretrain/Step Time": 8.547784207388759} +{"Pretrain/Learning Rate": 3.908584058664245e-05, "Pretrain/Loss": 2.1075425148010254, "Pretrain/Loss (Raw)": 2.158712148666382, "Pretrain/Step": 3149, "Pretrain/Step Time": 8.547110050916672} +{"Pretrain/Learning Rate": 3.907882576963162e-05, "Pretrain/Loss": 2.109282970428467, "Pretrain/Loss (Raw)": 2.180349826812744, "Pretrain/Step": 3150, "Pretrain/Step Time": 8.552789064124227} +{"Pretrain/Learning Rate": 3.907180932898427e-05, "Pretrain/Loss": 2.1079578399658203, "Pretrain/Loss (Raw)": 2.1389899253845215, "Pretrain/Step": 3151, "Pretrain/Step Time": 8.5503917504102} +{"Pretrain/Learning Rate": 3.9064791265509546e-05, "Pretrain/Loss": 2.107053518295288, "Pretrain/Loss (Raw)": 2.0094456672668457, "Pretrain/Step": 3152, "Pretrain/Step Time": 8.553083879873157} +{"Pretrain/Learning Rate": 3.905777158001682e-05, "Pretrain/Loss": 2.105773448944092, "Pretrain/Loss (Raw)": 2.1040122509002686, "Pretrain/Step": 3153, "Pretrain/Step Time": 8.548030257225037} +{"Pretrain/Learning Rate": 3.905075027331564e-05, "Pretrain/Loss": 2.105830192565918, "Pretrain/Loss (Raw)": 2.135627508163452, "Pretrain/Step": 3154, "Pretrain/Step Time": 8.549759432673454} +{"Pretrain/Learning Rate": 3.9043727346215726e-05, "Pretrain/Loss": 2.1065101623535156, "Pretrain/Loss (Raw)": 2.118966579437256, "Pretrain/Step": 3155, "Pretrain/Step Time": 8.548354541882873} +{"Pretrain/Learning Rate": 3.9036702799527e-05, "Pretrain/Loss": 2.1059718132019043, "Pretrain/Loss (Raw)": 1.97442626953125, "Pretrain/Step": 3156, "Pretrain/Step Time": 8.550846939906478} +{"Pretrain/Learning Rate": 3.902967663405956e-05, "Pretrain/Loss": 2.1065545082092285, "Pretrain/Loss (Raw)": 2.173543930053711, "Pretrain/Step": 3157, "Pretrain/Step Time": 8.557358311489224} +{"Pretrain/Learning Rate": 3.90226488506237e-05, "Pretrain/Loss": 2.106416702270508, "Pretrain/Loss (Raw)": 2.158465623855591, "Pretrain/Step": 3158, "Pretrain/Step Time": 8.546614510938525} +{"Pretrain/Learning Rate": 3.9015619450029904e-05, "Pretrain/Loss": 2.1056768894195557, "Pretrain/Loss (Raw)": 2.133474826812744, "Pretrain/Step": 3159, "Pretrain/Step Time": 8.548177413642406} +{"Pretrain/Learning Rate": 3.9008588433088825e-05, "Pretrain/Loss": 2.1058754920959473, "Pretrain/Loss (Raw)": 2.2569470405578613, "Pretrain/Step": 3160, "Pretrain/Step Time": 8.549287363886833} +{"Pretrain/Learning Rate": 3.900155580061132e-05, "Pretrain/Loss": 2.105924367904663, "Pretrain/Loss (Raw)": 2.2446720600128174, "Pretrain/Step": 3161, "Pretrain/Step Time": 8.547678291797638} +{"Pretrain/Learning Rate": 3.899452155340842e-05, "Pretrain/Loss": 2.10491681098938, "Pretrain/Loss (Raw)": 2.128375768661499, "Pretrain/Step": 3162, "Pretrain/Step Time": 8.558725018054247} +{"Pretrain/Learning Rate": 3.898748569229135e-05, "Pretrain/Loss": 2.1063232421875, "Pretrain/Loss (Raw)": 2.237607717514038, "Pretrain/Step": 3163, "Pretrain/Step Time": 8.556281436234713} +{"Pretrain/Learning Rate": 3.898044821807152e-05, "Pretrain/Loss": 2.106142520904541, "Pretrain/Loss (Raw)": 2.0046820640563965, "Pretrain/Step": 3164, "Pretrain/Step Time": 8.553455960005522} +{"Pretrain/Learning Rate": 3.897340913156052e-05, "Pretrain/Loss": 2.1035923957824707, "Pretrain/Loss (Raw)": 2.0668299198150635, "Pretrain/Step": 3165, "Pretrain/Step Time": 8.55081182345748} +{"Pretrain/Learning Rate": 3.896636843357014e-05, "Pretrain/Loss": 2.1035594940185547, "Pretrain/Loss (Raw)": 2.1139042377471924, "Pretrain/Step": 3166, "Pretrain/Step Time": 8.547631908208132} +{"Pretrain/Learning Rate": 3.895932612491233e-05, "Pretrain/Loss": 2.104025363922119, "Pretrain/Loss (Raw)": 2.119467258453369, "Pretrain/Step": 3167, "Pretrain/Step Time": 8.555259991437197} +{"Pretrain/Learning Rate": 3.895228220639926e-05, "Pretrain/Loss": 2.1051723957061768, "Pretrain/Loss (Raw)": 2.1494858264923096, "Pretrain/Step": 3168, "Pretrain/Step Time": 8.546828303486109} +{"Pretrain/Learning Rate": 3.8945236678843266e-05, "Pretrain/Loss": 2.103266716003418, "Pretrain/Loss (Raw)": 2.044893264770508, "Pretrain/Step": 3169, "Pretrain/Step Time": 8.552864365279675} +{"Pretrain/Learning Rate": 3.893818954305686e-05, "Pretrain/Loss": 2.104177474975586, "Pretrain/Loss (Raw)": 2.2331175804138184, "Pretrain/Step": 3170, "Pretrain/Step Time": 8.54732414893806} +{"Pretrain/Learning Rate": 3.893114079985276e-05, "Pretrain/Loss": 2.104220390319824, "Pretrain/Loss (Raw)": 2.161067247390747, "Pretrain/Step": 3171, "Pretrain/Step Time": 8.544947925955057} +{"Pretrain/Learning Rate": 3.892409045004385e-05, "Pretrain/Loss": 2.104668140411377, "Pretrain/Loss (Raw)": 2.034332752227783, "Pretrain/Step": 3172, "Pretrain/Step Time": 8.547394139692187} +{"Pretrain/Learning Rate": 3.891703849444322e-05, "Pretrain/Loss": 2.1063921451568604, "Pretrain/Loss (Raw)": 2.3546831607818604, "Pretrain/Step": 3173, "Pretrain/Step Time": 8.55012559145689} +{"Pretrain/Learning Rate": 3.890998493386414e-05, "Pretrain/Loss": 2.1080706119537354, "Pretrain/Loss (Raw)": 2.3364057540893555, "Pretrain/Step": 3174, "Pretrain/Step Time": 8.546070758253336} +{"Pretrain/Learning Rate": 3.890292976912005e-05, "Pretrain/Loss": 2.107475757598877, "Pretrain/Loss (Raw)": 2.0641930103302, "Pretrain/Step": 3175, "Pretrain/Step Time": 8.54709979146719} +{"Pretrain/Learning Rate": 3.889587300102457e-05, "Pretrain/Loss": 2.108107566833496, "Pretrain/Loss (Raw)": 2.2008724212646484, "Pretrain/Step": 3176, "Pretrain/Step Time": 8.544305298477411} +{"Pretrain/Learning Rate": 3.8888814630391556e-05, "Pretrain/Loss": 2.106830596923828, "Pretrain/Loss (Raw)": 2.0222086906433105, "Pretrain/Step": 3177, "Pretrain/Step Time": 8.545643538236618} +{"Pretrain/Learning Rate": 3.8881754658034986e-05, "Pretrain/Loss": 2.106102705001831, "Pretrain/Loss (Raw)": 1.8635900020599365, "Pretrain/Step": 3178, "Pretrain/Step Time": 8.543698126450181} +{"Pretrain/Learning Rate": 3.8874693084769055e-05, "Pretrain/Loss": 2.1067988872528076, "Pretrain/Loss (Raw)": 2.1947150230407715, "Pretrain/Step": 3179, "Pretrain/Step Time": 8.543355118483305} +{"Pretrain/Learning Rate": 3.8867629911408135e-05, "Pretrain/Loss": 2.1097517013549805, "Pretrain/Loss (Raw)": 2.3037545680999756, "Pretrain/Step": 3180, "Pretrain/Step Time": 8.54571995139122} +{"Pretrain/Learning Rate": 3.886056513876679e-05, "Pretrain/Loss": 2.1103522777557373, "Pretrain/Loss (Raw)": 1.9536340236663818, "Pretrain/Step": 3181, "Pretrain/Step Time": 8.54707758128643} +{"Pretrain/Learning Rate": 3.885349876765976e-05, "Pretrain/Loss": 2.1111040115356445, "Pretrain/Loss (Raw)": 2.1307568550109863, "Pretrain/Step": 3182, "Pretrain/Step Time": 8.543528955429792} +{"Pretrain/Learning Rate": 3.884643079890197e-05, "Pretrain/Loss": 2.109433174133301, "Pretrain/Loss (Raw)": 1.873647928237915, "Pretrain/Step": 3183, "Pretrain/Step Time": 8.541721185669303} +{"Pretrain/Learning Rate": 3.883936123330853e-05, "Pretrain/Loss": 2.109736204147339, "Pretrain/Loss (Raw)": 2.100771903991699, "Pretrain/Step": 3184, "Pretrain/Step Time": 8.53946178033948} +{"Pretrain/Learning Rate": 3.883229007169474e-05, "Pretrain/Loss": 2.1099905967712402, "Pretrain/Loss (Raw)": 2.1010704040527344, "Pretrain/Step": 3185, "Pretrain/Step Time": 8.538121340796351} +{"Pretrain/Learning Rate": 3.8825217314876084e-05, "Pretrain/Loss": 2.1119420528411865, "Pretrain/Loss (Raw)": 2.2594408988952637, "Pretrain/Step": 3186, "Pretrain/Step Time": 8.54331400245428} +{"Pretrain/Learning Rate": 3.881814296366822e-05, "Pretrain/Loss": 2.111459732055664, "Pretrain/Loss (Raw)": 2.187845468521118, "Pretrain/Step": 3187, "Pretrain/Step Time": 8.548698090016842} +{"Pretrain/Learning Rate": 3.881106701888699e-05, "Pretrain/Loss": 2.111130714416504, "Pretrain/Loss (Raw)": 2.158153533935547, "Pretrain/Step": 3188, "Pretrain/Step Time": 8.541187243536115} +{"Pretrain/Learning Rate": 3.880398948134845e-05, "Pretrain/Loss": 2.113170623779297, "Pretrain/Loss (Raw)": 2.233788251876831, "Pretrain/Step": 3189, "Pretrain/Step Time": 8.545656377449632} +{"Pretrain/Learning Rate": 3.879691035186878e-05, "Pretrain/Loss": 2.1131060123443604, "Pretrain/Loss (Raw)": 1.9265021085739136, "Pretrain/Step": 3190, "Pretrain/Step Time": 8.547328660264611} +{"Pretrain/Learning Rate": 3.8789829631264394e-05, "Pretrain/Loss": 2.114483594894409, "Pretrain/Loss (Raw)": 2.250593662261963, "Pretrain/Step": 3191, "Pretrain/Step Time": 8.548580080270767} +{"Pretrain/Learning Rate": 3.878274732035188e-05, "Pretrain/Loss": 2.114337205886841, "Pretrain/Loss (Raw)": 2.143885612487793, "Pretrain/Step": 3192, "Pretrain/Step Time": 8.54798262566328} +{"Pretrain/Learning Rate": 3.8775663419948e-05, "Pretrain/Loss": 2.116373062133789, "Pretrain/Loss (Raw)": 2.268326997756958, "Pretrain/Step": 3193, "Pretrain/Step Time": 8.552380653098226} +{"Pretrain/Learning Rate": 3.87685779308697e-05, "Pretrain/Loss": 2.117283821105957, "Pretrain/Loss (Raw)": 2.120917320251465, "Pretrain/Step": 3194, "Pretrain/Step Time": 8.547163365408778} +{"Pretrain/Learning Rate": 3.8761490853934115e-05, "Pretrain/Loss": 2.1179022789001465, "Pretrain/Loss (Raw)": 2.1137547492980957, "Pretrain/Step": 3195, "Pretrain/Step Time": 8.546441661193967} +{"Pretrain/Learning Rate": 3.875440218995856e-05, "Pretrain/Loss": 2.1127729415893555, "Pretrain/Loss (Raw)": 1.8075312376022339, "Pretrain/Step": 3196, "Pretrain/Step Time": 8.551769027486444} +{"Pretrain/Learning Rate": 3.874731193976052e-05, "Pretrain/Loss": 2.110140085220337, "Pretrain/Loss (Raw)": 1.9637850522994995, "Pretrain/Step": 3197, "Pretrain/Step Time": 8.54717873595655} +{"Pretrain/Learning Rate": 3.87402201041577e-05, "Pretrain/Loss": 2.108761787414551, "Pretrain/Loss (Raw)": 1.802565574645996, "Pretrain/Step": 3198, "Pretrain/Step Time": 8.542697802186012} +{"Pretrain/Learning Rate": 3.8733126683967946e-05, "Pretrain/Loss": 2.1078624725341797, "Pretrain/Loss (Raw)": 2.214994192123413, "Pretrain/Step": 3199, "Pretrain/Step Time": 8.546123519539833} +{"Pretrain/Learning Rate": 3.872603168000931e-05, "Pretrain/Loss": 2.1073880195617676, "Pretrain/Loss (Raw)": 2.0476064682006836, "Pretrain/Step": 3200, "Pretrain/Step Time": 8.54071019589901} +{"Pretrain/Learning Rate": 3.871893509310003e-05, "Pretrain/Loss": 2.1085283756256104, "Pretrain/Loss (Raw)": 2.1836886405944824, "Pretrain/Step": 3201, "Pretrain/Step Time": 8.549584038555622} +{"Pretrain/Learning Rate": 3.87118369240585e-05, "Pretrain/Loss": 2.1081347465515137, "Pretrain/Loss (Raw)": 2.0918211936950684, "Pretrain/Step": 3202, "Pretrain/Step Time": 8.545129489153624} +{"Pretrain/Learning Rate": 3.870473717370333e-05, "Pretrain/Loss": 2.108837842941284, "Pretrain/Loss (Raw)": 2.163632869720459, "Pretrain/Step": 3203, "Pretrain/Step Time": 8.546638479456306} +{"Pretrain/Learning Rate": 3.869763584285328e-05, "Pretrain/Loss": 2.1083807945251465, "Pretrain/Loss (Raw)": 2.128138303756714, "Pretrain/Step": 3204, "Pretrain/Step Time": 8.544599384069443} +{"Pretrain/Learning Rate": 3.869053293232733e-05, "Pretrain/Loss": 2.1088790893554688, "Pretrain/Loss (Raw)": 2.1746039390563965, "Pretrain/Step": 3205, "Pretrain/Step Time": 8.548603409901261} +{"Pretrain/Learning Rate": 3.8683428442944604e-05, "Pretrain/Loss": 2.1074795722961426, "Pretrain/Loss (Raw)": 2.088793992996216, "Pretrain/Step": 3206, "Pretrain/Step Time": 8.544363472610712} +{"Pretrain/Learning Rate": 3.8676322375524435e-05, "Pretrain/Loss": 2.109389305114746, "Pretrain/Loss (Raw)": 2.080040454864502, "Pretrain/Step": 3207, "Pretrain/Step Time": 8.550175487995148} +{"Pretrain/Learning Rate": 3.866921473088632e-05, "Pretrain/Loss": 2.111064910888672, "Pretrain/Loss (Raw)": 2.2705676555633545, "Pretrain/Step": 3208, "Pretrain/Step Time": 8.550609009340405} +{"Pretrain/Learning Rate": 3.866210550984996e-05, "Pretrain/Loss": 2.110395669937134, "Pretrain/Loss (Raw)": 1.9673486948013306, "Pretrain/Step": 3209, "Pretrain/Step Time": 8.5517812166363} +{"Pretrain/Learning Rate": 3.86549947132352e-05, "Pretrain/Loss": 2.1103761196136475, "Pretrain/Loss (Raw)": 2.1533966064453125, "Pretrain/Step": 3210, "Pretrain/Step Time": 8.549065709114075} +{"Pretrain/Learning Rate": 3.8647882341862115e-05, "Pretrain/Loss": 2.1109371185302734, "Pretrain/Loss (Raw)": 2.027242660522461, "Pretrain/Step": 3211, "Pretrain/Step Time": 8.556709678843617} +{"Pretrain/Learning Rate": 3.864076839655093e-05, "Pretrain/Loss": 2.1102139949798584, "Pretrain/Loss (Raw)": 1.9907907247543335, "Pretrain/Step": 3212, "Pretrain/Step Time": 8.55720466375351} +{"Pretrain/Learning Rate": 3.863365287812205e-05, "Pretrain/Loss": 2.1108410358428955, "Pretrain/Loss (Raw)": 2.1481783390045166, "Pretrain/Step": 3213, "Pretrain/Step Time": 8.55766629241407} +{"Pretrain/Learning Rate": 3.862653578739608e-05, "Pretrain/Loss": 2.1084771156311035, "Pretrain/Loss (Raw)": 1.9967671632766724, "Pretrain/Step": 3214, "Pretrain/Step Time": 8.551000081002712} +{"Pretrain/Learning Rate": 3.861941712519379e-05, "Pretrain/Loss": 2.1111998558044434, "Pretrain/Loss (Raw)": 2.1714577674865723, "Pretrain/Step": 3215, "Pretrain/Step Time": 8.548318522050977} +{"Pretrain/Learning Rate": 3.8612296892336144e-05, "Pretrain/Loss": 2.110119342803955, "Pretrain/Loss (Raw)": 1.9146170616149902, "Pretrain/Step": 3216, "Pretrain/Step Time": 8.543767543509603} +{"Pretrain/Learning Rate": 3.8605175089644274e-05, "Pretrain/Loss": 2.1108744144439697, "Pretrain/Loss (Raw)": 2.261598825454712, "Pretrain/Step": 3217, "Pretrain/Step Time": 8.551403595134616} +{"Pretrain/Learning Rate": 3.859805171793951e-05, "Pretrain/Loss": 2.1098685264587402, "Pretrain/Loss (Raw)": 2.267549514770508, "Pretrain/Step": 3218, "Pretrain/Step Time": 8.550344424322248} +{"Pretrain/Learning Rate": 3.8590926778043335e-05, "Pretrain/Loss": 2.109553337097168, "Pretrain/Loss (Raw)": 2.0013880729675293, "Pretrain/Step": 3219, "Pretrain/Step Time": 8.556083463132381} +{"Pretrain/Learning Rate": 3.858380027077745e-05, "Pretrain/Loss": 2.1107702255249023, "Pretrain/Loss (Raw)": 2.256648302078247, "Pretrain/Step": 3220, "Pretrain/Step Time": 8.5570854768157} +{"Pretrain/Learning Rate": 3.8576672196963705e-05, "Pretrain/Loss": 2.110060214996338, "Pretrain/Loss (Raw)": 2.058567523956299, "Pretrain/Step": 3221, "Pretrain/Step Time": 8.557682117447257} +{"Pretrain/Learning Rate": 3.856954255742414e-05, "Pretrain/Loss": 2.109581470489502, "Pretrain/Loss (Raw)": 1.9960335493087769, "Pretrain/Step": 3222, "Pretrain/Step Time": 8.550416674464941} +{"Pretrain/Learning Rate": 3.8562411352980996e-05, "Pretrain/Loss": 2.1096701622009277, "Pretrain/Loss (Raw)": 2.121945858001709, "Pretrain/Step": 3223, "Pretrain/Step Time": 8.553743056952953} +{"Pretrain/Learning Rate": 3.8555278584456664e-05, "Pretrain/Loss": 2.111970901489258, "Pretrain/Loss (Raw)": 2.303420305252075, "Pretrain/Step": 3224, "Pretrain/Step Time": 8.543541697785258} +{"Pretrain/Learning Rate": 3.854814425267373e-05, "Pretrain/Loss": 2.1113691329956055, "Pretrain/Loss (Raw)": 1.9758195877075195, "Pretrain/Step": 3225, "Pretrain/Step Time": 8.546993339434266} +{"Pretrain/Learning Rate": 3.8541008358454956e-05, "Pretrain/Loss": 2.1103010177612305, "Pretrain/Loss (Raw)": 1.9176199436187744, "Pretrain/Step": 3226, "Pretrain/Step Time": 8.543593799695373} +{"Pretrain/Learning Rate": 3.853387090262329e-05, "Pretrain/Loss": 2.1084413528442383, "Pretrain/Loss (Raw)": 2.111027479171753, "Pretrain/Step": 3227, "Pretrain/Step Time": 8.544279048219323} +{"Pretrain/Learning Rate": 3.852673188600187e-05, "Pretrain/Loss": 2.110680103302002, "Pretrain/Loss (Raw)": 2.289820909500122, "Pretrain/Step": 3228, "Pretrain/Step Time": 8.5427171215415} +{"Pretrain/Learning Rate": 3.851959130941398e-05, "Pretrain/Loss": 2.1094722747802734, "Pretrain/Loss (Raw)": 1.9464073181152344, "Pretrain/Step": 3229, "Pretrain/Step Time": 8.547811152413487} +{"Pretrain/Learning Rate": 3.851244917368311e-05, "Pretrain/Loss": 2.1081275939941406, "Pretrain/Loss (Raw)": 2.088104009628296, "Pretrain/Step": 3230, "Pretrain/Step Time": 8.538314297795296} +{"Pretrain/Learning Rate": 3.8505305479632934e-05, "Pretrain/Loss": 2.10707426071167, "Pretrain/Loss (Raw)": 1.9271703958511353, "Pretrain/Step": 3231, "Pretrain/Step Time": 8.544429764151573} +{"Pretrain/Learning Rate": 3.8498160228087284e-05, "Pretrain/Loss": 2.1065149307250977, "Pretrain/Loss (Raw)": 2.1323165893554688, "Pretrain/Step": 3232, "Pretrain/Step Time": 8.537501713261008} +{"Pretrain/Learning Rate": 3.8491013419870204e-05, "Pretrain/Loss": 2.1053240299224854, "Pretrain/Loss (Raw)": 1.9382275342941284, "Pretrain/Step": 3233, "Pretrain/Step Time": 8.533203702419996} +{"Pretrain/Learning Rate": 3.848386505580588e-05, "Pretrain/Loss": 2.1028730869293213, "Pretrain/Loss (Raw)": 2.007112979888916, "Pretrain/Step": 3234, "Pretrain/Step Time": 8.531361855566502} +{"Pretrain/Learning Rate": 3.84767151367187e-05, "Pretrain/Loss": 2.110147476196289, "Pretrain/Loss (Raw)": 2.6246776580810547, "Pretrain/Step": 3235, "Pretrain/Step Time": 8.531825160607696} +{"Pretrain/Learning Rate": 3.846956366343322e-05, "Pretrain/Loss": 2.1112523078918457, "Pretrain/Loss (Raw)": 2.011420488357544, "Pretrain/Step": 3236, "Pretrain/Step Time": 8.53347017429769} +{"Pretrain/Learning Rate": 3.8462410636774196e-05, "Pretrain/Loss": 2.11023211479187, "Pretrain/Loss (Raw)": 2.110167980194092, "Pretrain/Step": 3237, "Pretrain/Step Time": 8.53142667375505} +{"Pretrain/Learning Rate": 3.845525605756653e-05, "Pretrain/Loss": 2.110290050506592, "Pretrain/Loss (Raw)": 2.1294853687286377, "Pretrain/Step": 3238, "Pretrain/Step Time": 8.531981525942683} +{"Pretrain/Learning Rate": 3.844809992663534e-05, "Pretrain/Loss": 2.1110000610351562, "Pretrain/Loss (Raw)": 2.103172779083252, "Pretrain/Step": 3239, "Pretrain/Step Time": 8.53390114940703} +{"Pretrain/Learning Rate": 3.844094224480589e-05, "Pretrain/Loss": 2.1108012199401855, "Pretrain/Loss (Raw)": 2.1129987239837646, "Pretrain/Step": 3240, "Pretrain/Step Time": 8.529348788782954} +{"Pretrain/Learning Rate": 3.843378301290366e-05, "Pretrain/Loss": 2.112398386001587, "Pretrain/Loss (Raw)": 2.2795891761779785, "Pretrain/Step": 3241, "Pretrain/Step Time": 8.525362392887473} +{"Pretrain/Learning Rate": 3.8426622231754255e-05, "Pretrain/Loss": 2.112396001815796, "Pretrain/Loss (Raw)": 2.18255615234375, "Pretrain/Step": 3242, "Pretrain/Step Time": 8.538778826594353} +{"Pretrain/Learning Rate": 3.8419459902183515e-05, "Pretrain/Loss": 2.107123851776123, "Pretrain/Loss (Raw)": 1.7295925617218018, "Pretrain/Step": 3243, "Pretrain/Step Time": 8.53315650112927} +{"Pretrain/Learning Rate": 3.841229602501742e-05, "Pretrain/Loss": 2.1091456413269043, "Pretrain/Loss (Raw)": 2.1646764278411865, "Pretrain/Step": 3244, "Pretrain/Step Time": 8.526738187298179} +{"Pretrain/Learning Rate": 3.840513060108214e-05, "Pretrain/Loss": 2.1088919639587402, "Pretrain/Loss (Raw)": 1.9682952165603638, "Pretrain/Step": 3245, "Pretrain/Step Time": 8.52815323881805} +{"Pretrain/Learning Rate": 3.8397963631204046e-05, "Pretrain/Loss": 2.107860565185547, "Pretrain/Loss (Raw)": 2.0258688926696777, "Pretrain/Step": 3246, "Pretrain/Step Time": 8.526963965967298} +{"Pretrain/Learning Rate": 3.8390795116209645e-05, "Pretrain/Loss": 2.105715274810791, "Pretrain/Loss (Raw)": 2.06369686126709, "Pretrain/Step": 3247, "Pretrain/Step Time": 8.527846843004227} +{"Pretrain/Learning Rate": 3.8383625056925654e-05, "Pretrain/Loss": 2.1030502319335938, "Pretrain/Loss (Raw)": 2.1565346717834473, "Pretrain/Step": 3248, "Pretrain/Step Time": 8.537957502529025} +{"Pretrain/Learning Rate": 3.837645345417895e-05, "Pretrain/Loss": 2.101276159286499, "Pretrain/Loss (Raw)": 2.0731141567230225, "Pretrain/Step": 3249, "Pretrain/Step Time": 8.529234809800982} +{"Pretrain/Learning Rate": 3.836928030879661e-05, "Pretrain/Loss": 2.1018195152282715, "Pretrain/Loss (Raw)": 2.0543270111083984, "Pretrain/Step": 3250, "Pretrain/Step Time": 8.530512321740389} +{"Pretrain/Learning Rate": 3.8362105621605866e-05, "Pretrain/Loss": 2.1038098335266113, "Pretrain/Loss (Raw)": 2.302290678024292, "Pretrain/Step": 3251, "Pretrain/Step Time": 8.53051364608109} +{"Pretrain/Learning Rate": 3.835492939343413e-05, "Pretrain/Loss": 2.1058008670806885, "Pretrain/Loss (Raw)": 2.011695623397827, "Pretrain/Step": 3252, "Pretrain/Step Time": 8.528925195336342} +{"Pretrain/Learning Rate": 3.834775162510901e-05, "Pretrain/Loss": 2.10497784614563, "Pretrain/Loss (Raw)": 1.9483683109283447, "Pretrain/Step": 3253, "Pretrain/Step Time": 8.537294682115316} +{"Pretrain/Learning Rate": 3.834057231745828e-05, "Pretrain/Loss": 2.105558395385742, "Pretrain/Loss (Raw)": 2.0687639713287354, "Pretrain/Step": 3254, "Pretrain/Step Time": 8.535082716494799} +{"Pretrain/Learning Rate": 3.8333391471309884e-05, "Pretrain/Loss": 2.1053662300109863, "Pretrain/Loss (Raw)": 2.074535369873047, "Pretrain/Step": 3255, "Pretrain/Step Time": 8.53644391708076} +{"Pretrain/Learning Rate": 3.8326209087491955e-05, "Pretrain/Loss": 2.1044716835021973, "Pretrain/Loss (Raw)": 2.0816805362701416, "Pretrain/Step": 3256, "Pretrain/Step Time": 8.53379475325346} +{"Pretrain/Learning Rate": 3.8319025166832794e-05, "Pretrain/Loss": 2.1027355194091797, "Pretrain/Loss (Raw)": 1.8619235754013062, "Pretrain/Step": 3257, "Pretrain/Step Time": 8.52814169973135} +{"Pretrain/Learning Rate": 3.83118397101609e-05, "Pretrain/Loss": 2.1009128093719482, "Pretrain/Loss (Raw)": 1.867730975151062, "Pretrain/Step": 3258, "Pretrain/Step Time": 8.533114559948444} +{"Pretrain/Learning Rate": 3.830465271830491e-05, "Pretrain/Loss": 2.1000356674194336, "Pretrain/Loss (Raw)": 1.9871677160263062, "Pretrain/Step": 3259, "Pretrain/Step Time": 8.533676650375128} +{"Pretrain/Learning Rate": 3.829746419209369e-05, "Pretrain/Loss": 2.098816394805908, "Pretrain/Loss (Raw)": 1.9837027788162231, "Pretrain/Step": 3260, "Pretrain/Step Time": 8.528122140094638} +{"Pretrain/Learning Rate": 3.829027413235623e-05, "Pretrain/Loss": 2.0989904403686523, "Pretrain/Loss (Raw)": 2.094231128692627, "Pretrain/Step": 3261, "Pretrain/Step Time": 8.53350037150085} +{"Pretrain/Learning Rate": 3.8283082539921735e-05, "Pretrain/Loss": 2.1000256538391113, "Pretrain/Loss (Raw)": 1.9213272333145142, "Pretrain/Step": 3262, "Pretrain/Step Time": 8.528843915089965} +{"Pretrain/Learning Rate": 3.827588941561956e-05, "Pretrain/Loss": 2.097806930541992, "Pretrain/Loss (Raw)": 1.868719220161438, "Pretrain/Step": 3263, "Pretrain/Step Time": 8.533316060900688} +{"Pretrain/Learning Rate": 3.826869476027927e-05, "Pretrain/Loss": 2.0969462394714355, "Pretrain/Loss (Raw)": 2.107884168624878, "Pretrain/Step": 3264, "Pretrain/Step Time": 8.53645539842546} +{"Pretrain/Learning Rate": 3.826149857473057e-05, "Pretrain/Loss": 2.09751558303833, "Pretrain/Loss (Raw)": 2.3377890586853027, "Pretrain/Step": 3265, "Pretrain/Step Time": 8.53204132989049} +{"Pretrain/Learning Rate": 3.825430085980337e-05, "Pretrain/Loss": 2.096860408782959, "Pretrain/Loss (Raw)": 2.0271880626678467, "Pretrain/Step": 3266, "Pretrain/Step Time": 8.533649059012532} +{"Pretrain/Learning Rate": 3.8247101616327726e-05, "Pretrain/Loss": 2.0977954864501953, "Pretrain/Loss (Raw)": 2.2062697410583496, "Pretrain/Step": 3267, "Pretrain/Step Time": 8.533591013401747} +{"Pretrain/Learning Rate": 3.823990084513391e-05, "Pretrain/Loss": 2.0986404418945312, "Pretrain/Loss (Raw)": 2.205170154571533, "Pretrain/Step": 3268, "Pretrain/Step Time": 8.528644206002355} +{"Pretrain/Learning Rate": 3.8232698547052345e-05, "Pretrain/Loss": 2.099046230316162, "Pretrain/Loss (Raw)": 2.095703125, "Pretrain/Step": 3269, "Pretrain/Step Time": 8.535594517365098} +{"Pretrain/Learning Rate": 3.8225494722913624e-05, "Pretrain/Loss": 2.0987160205841064, "Pretrain/Loss (Raw)": 2.035602331161499, "Pretrain/Step": 3270, "Pretrain/Step Time": 8.539067540317774} +{"Pretrain/Learning Rate": 3.821828937354853e-05, "Pretrain/Loss": 2.0991621017456055, "Pretrain/Loss (Raw)": 2.1620757579803467, "Pretrain/Step": 3271, "Pretrain/Step Time": 8.537002740427852} +{"Pretrain/Learning Rate": 3.821108249978802e-05, "Pretrain/Loss": 2.1002399921417236, "Pretrain/Loss (Raw)": 2.119410514831543, "Pretrain/Step": 3272, "Pretrain/Step Time": 8.539880068972707} +{"Pretrain/Learning Rate": 3.8203874102463235e-05, "Pretrain/Loss": 2.0996570587158203, "Pretrain/Loss (Raw)": 1.872390627861023, "Pretrain/Step": 3273, "Pretrain/Step Time": 8.533684825524688} +{"Pretrain/Learning Rate": 3.819666418240545e-05, "Pretrain/Loss": 2.099527597427368, "Pretrain/Loss (Raw)": 2.0737719535827637, "Pretrain/Step": 3274, "Pretrain/Step Time": 8.536831755191088} +{"Pretrain/Learning Rate": 3.818945274044618e-05, "Pretrain/Loss": 2.0971546173095703, "Pretrain/Loss (Raw)": 2.0886874198913574, "Pretrain/Step": 3275, "Pretrain/Step Time": 8.535277446731925} +{"Pretrain/Learning Rate": 3.8182239777417066e-05, "Pretrain/Loss": 2.0965166091918945, "Pretrain/Loss (Raw)": 1.9266139268875122, "Pretrain/Step": 3276, "Pretrain/Step Time": 8.531537430360913} +{"Pretrain/Learning Rate": 3.817502529414994e-05, "Pretrain/Loss": 2.0972161293029785, "Pretrain/Loss (Raw)": 2.248267412185669, "Pretrain/Step": 3277, "Pretrain/Step Time": 8.52872160077095} +{"Pretrain/Learning Rate": 3.816780929147682e-05, "Pretrain/Loss": 2.096972942352295, "Pretrain/Loss (Raw)": 2.1491785049438477, "Pretrain/Step": 3278, "Pretrain/Step Time": 8.530030338093638} +{"Pretrain/Learning Rate": 3.816059177022988e-05, "Pretrain/Loss": 2.095824718475342, "Pretrain/Loss (Raw)": 1.9920262098312378, "Pretrain/Step": 3279, "Pretrain/Step Time": 8.532086335122585} +{"Pretrain/Learning Rate": 3.8153372731241486e-05, "Pretrain/Loss": 2.097954273223877, "Pretrain/Loss (Raw)": 2.2820498943328857, "Pretrain/Step": 3280, "Pretrain/Step Time": 8.532747900113463} +{"Pretrain/Learning Rate": 3.814615217534416e-05, "Pretrain/Loss": 2.098569393157959, "Pretrain/Loss (Raw)": 2.1827659606933594, "Pretrain/Step": 3281, "Pretrain/Step Time": 8.533699875697494} +{"Pretrain/Learning Rate": 3.813893010337063e-05, "Pretrain/Loss": 2.0973386764526367, "Pretrain/Loss (Raw)": 1.978074312210083, "Pretrain/Step": 3282, "Pretrain/Step Time": 8.53198317065835} +{"Pretrain/Learning Rate": 3.813170651615376e-05, "Pretrain/Loss": 2.0980470180511475, "Pretrain/Loss (Raw)": 2.2096261978149414, "Pretrain/Step": 3283, "Pretrain/Step Time": 8.535649115219712} +{"Pretrain/Learning Rate": 3.8124481414526613e-05, "Pretrain/Loss": 2.101233720779419, "Pretrain/Loss (Raw)": 2.3823306560516357, "Pretrain/Step": 3284, "Pretrain/Step Time": 8.539709158241749} +{"Pretrain/Learning Rate": 3.811725479932243e-05, "Pretrain/Loss": 2.101223945617676, "Pretrain/Loss (Raw)": 2.1723294258117676, "Pretrain/Step": 3285, "Pretrain/Step Time": 8.536451241001487} +{"Pretrain/Learning Rate": 3.8110026671374615e-05, "Pretrain/Loss": 2.099952220916748, "Pretrain/Loss (Raw)": 1.9956552982330322, "Pretrain/Step": 3286, "Pretrain/Step Time": 8.537488680332899} +{"Pretrain/Learning Rate": 3.810279703151674e-05, "Pretrain/Loss": 2.0980236530303955, "Pretrain/Loss (Raw)": 1.886608362197876, "Pretrain/Step": 3287, "Pretrain/Step Time": 8.534398881718516} +{"Pretrain/Learning Rate": 3.809556588058258e-05, "Pretrain/Loss": 2.097745418548584, "Pretrain/Loss (Raw)": 2.221323251724243, "Pretrain/Step": 3288, "Pretrain/Step Time": 8.539218252524734} +{"Pretrain/Learning Rate": 3.8088333219406046e-05, "Pretrain/Loss": 2.0967230796813965, "Pretrain/Loss (Raw)": 2.1138625144958496, "Pretrain/Step": 3289, "Pretrain/Step Time": 8.534415816888213} +{"Pretrain/Learning Rate": 3.808109904882126e-05, "Pretrain/Loss": 2.0965688228607178, "Pretrain/Loss (Raw)": 2.108602285385132, "Pretrain/Step": 3290, "Pretrain/Step Time": 8.53364186361432} +{"Pretrain/Learning Rate": 3.807386336966248e-05, "Pretrain/Loss": 2.0949528217315674, "Pretrain/Loss (Raw)": 2.030735969543457, "Pretrain/Step": 3291, "Pretrain/Step Time": 8.530588505789638} +{"Pretrain/Learning Rate": 3.8066626182764174e-05, "Pretrain/Loss": 2.095848560333252, "Pretrain/Loss (Raw)": 2.1193432807922363, "Pretrain/Step": 3292, "Pretrain/Step Time": 8.531770894303918} +{"Pretrain/Learning Rate": 3.805938748896097e-05, "Pretrain/Loss": 2.097566843032837, "Pretrain/Loss (Raw)": 2.2867941856384277, "Pretrain/Step": 3293, "Pretrain/Step Time": 8.530759491026402} +{"Pretrain/Learning Rate": 3.805214728908765e-05, "Pretrain/Loss": 2.0957446098327637, "Pretrain/Loss (Raw)": 1.8806447982788086, "Pretrain/Step": 3294, "Pretrain/Step Time": 8.536146545782685} +{"Pretrain/Learning Rate": 3.804490558397922e-05, "Pretrain/Loss": 2.0948715209960938, "Pretrain/Loss (Raw)": 2.007700204849243, "Pretrain/Step": 3295, "Pretrain/Step Time": 8.528682503849268} +{"Pretrain/Learning Rate": 3.803766237447079e-05, "Pretrain/Loss": 2.0928425788879395, "Pretrain/Loss (Raw)": 1.8897947072982788, "Pretrain/Step": 3296, "Pretrain/Step Time": 8.53806359320879} +{"Pretrain/Learning Rate": 3.803041766139771e-05, "Pretrain/Loss": 2.092893600463867, "Pretrain/Loss (Raw)": 2.0514371395111084, "Pretrain/Step": 3297, "Pretrain/Step Time": 8.535050941631198} +{"Pretrain/Learning Rate": 3.8023171445595464e-05, "Pretrain/Loss": 2.0918800830841064, "Pretrain/Loss (Raw)": 2.103372097015381, "Pretrain/Step": 3298, "Pretrain/Step Time": 8.53012134693563} +{"Pretrain/Learning Rate": 3.8015923727899714e-05, "Pretrain/Loss": 2.0907928943634033, "Pretrain/Loss (Raw)": 2.0219030380249023, "Pretrain/Step": 3299, "Pretrain/Step Time": 8.534817254170775} +{"Pretrain/Learning Rate": 3.8008674509146304e-05, "Pretrain/Loss": 2.0908000469207764, "Pretrain/Loss (Raw)": 2.035255193710327, "Pretrain/Step": 3300, "Pretrain/Step Time": 8.538680272176862} +{"Pretrain/Learning Rate": 3.800142379017127e-05, "Pretrain/Loss": 2.088883399963379, "Pretrain/Loss (Raw)": 2.1093575954437256, "Pretrain/Step": 3301, "Pretrain/Step Time": 8.539302673190832} +{"Pretrain/Learning Rate": 3.799417157181076e-05, "Pretrain/Loss": 2.084930181503296, "Pretrain/Loss (Raw)": 1.8303934335708618, "Pretrain/Step": 3302, "Pretrain/Step Time": 8.54179273545742} +{"Pretrain/Learning Rate": 3.798691785490115e-05, "Pretrain/Loss": 2.0844335556030273, "Pretrain/Loss (Raw)": 2.0006301403045654, "Pretrain/Step": 3303, "Pretrain/Step Time": 8.537698501721025} +{"Pretrain/Learning Rate": 3.797966264027899e-05, "Pretrain/Loss": 2.0842320919036865, "Pretrain/Loss (Raw)": 2.175060272216797, "Pretrain/Step": 3304, "Pretrain/Step Time": 8.53895914182067} +{"Pretrain/Learning Rate": 3.7972405928780974e-05, "Pretrain/Loss": 2.0846569538116455, "Pretrain/Loss (Raw)": 2.0766184329986572, "Pretrain/Step": 3305, "Pretrain/Step Time": 8.540749475359917} +{"Pretrain/Learning Rate": 3.796514772124396e-05, "Pretrain/Loss": 2.086923599243164, "Pretrain/Loss (Raw)": 2.153714895248413, "Pretrain/Step": 3306, "Pretrain/Step Time": 8.542132107540965} +{"Pretrain/Learning Rate": 3.795788801850504e-05, "Pretrain/Loss": 2.0887272357940674, "Pretrain/Loss (Raw)": 2.425553321838379, "Pretrain/Step": 3307, "Pretrain/Step Time": 8.545088108628988} +{"Pretrain/Learning Rate": 3.7950626821401405e-05, "Pretrain/Loss": 2.0878584384918213, "Pretrain/Loss (Raw)": 2.1925761699676514, "Pretrain/Step": 3308, "Pretrain/Step Time": 8.53984185680747} +{"Pretrain/Learning Rate": 3.794336413077045e-05, "Pretrain/Loss": 2.090470790863037, "Pretrain/Loss (Raw)": 2.2879927158355713, "Pretrain/Step": 3309, "Pretrain/Step Time": 8.536535328254104} +{"Pretrain/Learning Rate": 3.793609994744977e-05, "Pretrain/Loss": 2.0897135734558105, "Pretrain/Loss (Raw)": 2.0338313579559326, "Pretrain/Step": 3310, "Pretrain/Step Time": 8.538084143772721} +{"Pretrain/Learning Rate": 3.792883427227707e-05, "Pretrain/Loss": 2.0902466773986816, "Pretrain/Loss (Raw)": 1.9418915510177612, "Pretrain/Step": 3311, "Pretrain/Step Time": 8.53682461194694} +{"Pretrain/Learning Rate": 3.7921567106090297e-05, "Pretrain/Loss": 2.0900180339813232, "Pretrain/Loss (Raw)": 2.0715184211730957, "Pretrain/Step": 3312, "Pretrain/Step Time": 8.541764181107283} +{"Pretrain/Learning Rate": 3.79142984497275e-05, "Pretrain/Loss": 2.0893335342407227, "Pretrain/Loss (Raw)": 2.0134830474853516, "Pretrain/Step": 3313, "Pretrain/Step Time": 8.546357594430447} +{"Pretrain/Learning Rate": 3.790702830402696e-05, "Pretrain/Loss": 2.0876150131225586, "Pretrain/Loss (Raw)": 2.0394277572631836, "Pretrain/Step": 3314, "Pretrain/Step Time": 8.545161431655288} +{"Pretrain/Learning Rate": 3.7899756669827094e-05, "Pretrain/Loss": 2.087705612182617, "Pretrain/Loss (Raw)": 2.1994428634643555, "Pretrain/Step": 3315, "Pretrain/Step Time": 8.540658576413989} +{"Pretrain/Learning Rate": 3.789248354796651e-05, "Pretrain/Loss": 2.087963581085205, "Pretrain/Loss (Raw)": 2.1912035942077637, "Pretrain/Step": 3316, "Pretrain/Step Time": 8.542748387902975} +{"Pretrain/Learning Rate": 3.788520893928396e-05, "Pretrain/Loss": 2.085944890975952, "Pretrain/Loss (Raw)": 1.9753841161727905, "Pretrain/Step": 3317, "Pretrain/Step Time": 8.544912829995155} +{"Pretrain/Learning Rate": 3.78779328446184e-05, "Pretrain/Loss": 2.08866286277771, "Pretrain/Loss (Raw)": 2.2744014263153076, "Pretrain/Step": 3318, "Pretrain/Step Time": 8.540292432531714} +{"Pretrain/Learning Rate": 3.7870655264808954e-05, "Pretrain/Loss": 2.086660623550415, "Pretrain/Loss (Raw)": 1.9943057298660278, "Pretrain/Step": 3319, "Pretrain/Step Time": 8.53859886340797} +{"Pretrain/Learning Rate": 3.786337620069488e-05, "Pretrain/Loss": 2.0859084129333496, "Pretrain/Loss (Raw)": 2.0475900173187256, "Pretrain/Step": 3320, "Pretrain/Step Time": 8.542190697044134} +{"Pretrain/Learning Rate": 3.7856095653115655e-05, "Pretrain/Loss": 2.084752082824707, "Pretrain/Loss (Raw)": 2.120316982269287, "Pretrain/Step": 3321, "Pretrain/Step Time": 8.53669873997569} +{"Pretrain/Learning Rate": 3.7848813622910894e-05, "Pretrain/Loss": 2.0840134620666504, "Pretrain/Loss (Raw)": 2.0263545513153076, "Pretrain/Step": 3322, "Pretrain/Step Time": 8.534960344433784} +{"Pretrain/Learning Rate": 3.784153011092041e-05, "Pretrain/Loss": 2.0837132930755615, "Pretrain/Loss (Raw)": 2.075343370437622, "Pretrain/Step": 3323, "Pretrain/Step Time": 8.533890921622515} +{"Pretrain/Learning Rate": 3.7834245117984155e-05, "Pretrain/Loss": 2.0885119438171387, "Pretrain/Loss (Raw)": 2.4217703342437744, "Pretrain/Step": 3324, "Pretrain/Step Time": 8.529877802357078} +{"Pretrain/Learning Rate": 3.782695864494228e-05, "Pretrain/Loss": 2.090843439102173, "Pretrain/Loss (Raw)": 2.262214422225952, "Pretrain/Step": 3325, "Pretrain/Step Time": 8.530881240963936} +{"Pretrain/Learning Rate": 3.781967069263509e-05, "Pretrain/Loss": 2.0947978496551514, "Pretrain/Loss (Raw)": 2.308742046356201, "Pretrain/Step": 3326, "Pretrain/Step Time": 8.53929309733212} +{"Pretrain/Learning Rate": 3.781238126190306e-05, "Pretrain/Loss": 2.091663360595703, "Pretrain/Loss (Raw)": 1.8137717247009277, "Pretrain/Step": 3327, "Pretrain/Step Time": 8.536350566893816} +{"Pretrain/Learning Rate": 3.780509035358686e-05, "Pretrain/Loss": 2.091392755508423, "Pretrain/Loss (Raw)": 2.0129575729370117, "Pretrain/Step": 3328, "Pretrain/Step Time": 8.53952218964696} +{"Pretrain/Learning Rate": 3.77977979685273e-05, "Pretrain/Loss": 2.0903518199920654, "Pretrain/Loss (Raw)": 2.050455093383789, "Pretrain/Step": 3329, "Pretrain/Step Time": 8.527535811066628} +{"Pretrain/Learning Rate": 3.7790504107565366e-05, "Pretrain/Loss": 2.0896334648132324, "Pretrain/Loss (Raw)": 1.9998924732208252, "Pretrain/Step": 3330, "Pretrain/Step Time": 8.52728951908648} +{"Pretrain/Learning Rate": 3.7783208771542237e-05, "Pretrain/Loss": 2.0888237953186035, "Pretrain/Loss (Raw)": 2.0599794387817383, "Pretrain/Step": 3331, "Pretrain/Step Time": 8.537906328216195} +{"Pretrain/Learning Rate": 3.7775911961299225e-05, "Pretrain/Loss": 2.089662551879883, "Pretrain/Loss (Raw)": 2.23551869392395, "Pretrain/Step": 3332, "Pretrain/Step Time": 8.54180040769279} +{"Pretrain/Learning Rate": 3.776861367767785e-05, "Pretrain/Loss": 2.089813470840454, "Pretrain/Loss (Raw)": 2.193913221359253, "Pretrain/Step": 3333, "Pretrain/Step Time": 8.538469383493066} +{"Pretrain/Learning Rate": 3.776131392151978e-05, "Pretrain/Loss": 2.091134548187256, "Pretrain/Loss (Raw)": 2.257888078689575, "Pretrain/Step": 3334, "Pretrain/Step Time": 8.544114461168647} +{"Pretrain/Learning Rate": 3.775401269366685e-05, "Pretrain/Loss": 2.0933351516723633, "Pretrain/Loss (Raw)": 2.3617260456085205, "Pretrain/Step": 3335, "Pretrain/Step Time": 8.533344965428114} +{"Pretrain/Learning Rate": 3.7746709994961085e-05, "Pretrain/Loss": 2.0915026664733887, "Pretrain/Loss (Raw)": 2.0359928607940674, "Pretrain/Step": 3336, "Pretrain/Step Time": 8.534990884363651} +{"Pretrain/Learning Rate": 3.7739405826244645e-05, "Pretrain/Loss": 2.0921425819396973, "Pretrain/Loss (Raw)": 2.0492613315582275, "Pretrain/Step": 3337, "Pretrain/Step Time": 8.538976347073913} +{"Pretrain/Learning Rate": 3.773210018835991e-05, "Pretrain/Loss": 2.091923952102661, "Pretrain/Loss (Raw)": 2.1254138946533203, "Pretrain/Step": 3338, "Pretrain/Step Time": 8.541080549359322} +{"Pretrain/Learning Rate": 3.772479308214937e-05, "Pretrain/Loss": 2.0939745903015137, "Pretrain/Loss (Raw)": 2.2897140979766846, "Pretrain/Step": 3339, "Pretrain/Step Time": 8.537276254966855} +{"Pretrain/Learning Rate": 3.771748450845575e-05, "Pretrain/Loss": 2.0949044227600098, "Pretrain/Loss (Raw)": 2.109823703765869, "Pretrain/Step": 3340, "Pretrain/Step Time": 8.531098317354918} +{"Pretrain/Learning Rate": 3.771017446812187e-05, "Pretrain/Loss": 2.0949578285217285, "Pretrain/Loss (Raw)": 2.1550114154815674, "Pretrain/Step": 3341, "Pretrain/Step Time": 8.532780844718218} +{"Pretrain/Learning Rate": 3.770286296199079e-05, "Pretrain/Loss": 2.0958569049835205, "Pretrain/Loss (Raw)": 2.111846446990967, "Pretrain/Step": 3342, "Pretrain/Step Time": 8.531739097088575} +{"Pretrain/Learning Rate": 3.7695549990905694e-05, "Pretrain/Loss": 2.0958428382873535, "Pretrain/Loss (Raw)": 2.1696412563323975, "Pretrain/Step": 3343, "Pretrain/Step Time": 8.52992288209498} +{"Pretrain/Learning Rate": 3.768823555570995e-05, "Pretrain/Loss": 2.0975077152252197, "Pretrain/Loss (Raw)": 2.127711057662964, "Pretrain/Step": 3344, "Pretrain/Step Time": 8.543270163238049} +{"Pretrain/Learning Rate": 3.768091965724709e-05, "Pretrain/Loss": 2.096010684967041, "Pretrain/Loss (Raw)": 2.06998872756958, "Pretrain/Step": 3345, "Pretrain/Step Time": 8.538066735491157} +{"Pretrain/Learning Rate": 3.767360229636082e-05, "Pretrain/Loss": 2.0937585830688477, "Pretrain/Loss (Raw)": 1.9793168306350708, "Pretrain/Step": 3346, "Pretrain/Step Time": 8.534944619983435} +{"Pretrain/Learning Rate": 3.7666283473895014e-05, "Pretrain/Loss": 2.095992088317871, "Pretrain/Loss (Raw)": 2.2872464656829834, "Pretrain/Step": 3347, "Pretrain/Step Time": 8.533212075009942} +{"Pretrain/Learning Rate": 3.765896319069372e-05, "Pretrain/Loss": 2.0929970741271973, "Pretrain/Loss (Raw)": 1.8732961416244507, "Pretrain/Step": 3348, "Pretrain/Step Time": 8.532772045582533} +{"Pretrain/Learning Rate": 3.7651641447601126e-05, "Pretrain/Loss": 2.0938258171081543, "Pretrain/Loss (Raw)": 2.1646432876586914, "Pretrain/Step": 3349, "Pretrain/Step Time": 8.533259216696024} +{"Pretrain/Learning Rate": 3.764431824546163e-05, "Pretrain/Loss": 2.0931122303009033, "Pretrain/Loss (Raw)": 1.9047040939331055, "Pretrain/Step": 3350, "Pretrain/Step Time": 8.535183912143111} +{"Pretrain/Learning Rate": 3.7636993585119775e-05, "Pretrain/Loss": 2.091428756713867, "Pretrain/Loss (Raw)": 1.9064500331878662, "Pretrain/Step": 3351, "Pretrain/Step Time": 8.537654796615243} +{"Pretrain/Learning Rate": 3.762966746742027e-05, "Pretrain/Loss": 2.088510036468506, "Pretrain/Loss (Raw)": 1.929827094078064, "Pretrain/Step": 3352, "Pretrain/Step Time": 8.539585510268807} +{"Pretrain/Learning Rate": 3.7622339893208e-05, "Pretrain/Loss": 2.0907840728759766, "Pretrain/Loss (Raw)": 2.266914129257202, "Pretrain/Step": 3353, "Pretrain/Step Time": 8.535526789724827} +{"Pretrain/Learning Rate": 3.761501086332802e-05, "Pretrain/Loss": 2.0912506580352783, "Pretrain/Loss (Raw)": 1.9773451089859009, "Pretrain/Step": 3354, "Pretrain/Step Time": 8.539822060614824} +{"Pretrain/Learning Rate": 3.760768037862553e-05, "Pretrain/Loss": 2.090181589126587, "Pretrain/Loss (Raw)": 1.9741551876068115, "Pretrain/Step": 3355, "Pretrain/Step Time": 8.53945392370224} +{"Pretrain/Learning Rate": 3.760034843994594e-05, "Pretrain/Loss": 2.0886921882629395, "Pretrain/Loss (Raw)": 2.0991599559783936, "Pretrain/Step": 3356, "Pretrain/Step Time": 8.54597002826631} +{"Pretrain/Learning Rate": 3.7593015048134794e-05, "Pretrain/Loss": 2.091463327407837, "Pretrain/Loss (Raw)": 2.3011600971221924, "Pretrain/Step": 3357, "Pretrain/Step Time": 8.542153369635344} +{"Pretrain/Learning Rate": 3.758568020403781e-05, "Pretrain/Loss": 2.091171979904175, "Pretrain/Loss (Raw)": 2.0507984161376953, "Pretrain/Step": 3358, "Pretrain/Step Time": 8.54773380793631} +{"Pretrain/Learning Rate": 3.757834390850088e-05, "Pretrain/Loss": 2.091942310333252, "Pretrain/Loss (Raw)": 2.0257840156555176, "Pretrain/Step": 3359, "Pretrain/Step Time": 8.54299983754754} +{"Pretrain/Learning Rate": 3.7571006162370056e-05, "Pretrain/Loss": 2.091155767440796, "Pretrain/Loss (Raw)": 2.0316128730773926, "Pretrain/Step": 3360, "Pretrain/Step Time": 8.541514741256833} +{"Pretrain/Learning Rate": 3.7563666966491564e-05, "Pretrain/Loss": 2.093736171722412, "Pretrain/Loss (Raw)": 2.268542766571045, "Pretrain/Step": 3361, "Pretrain/Step Time": 8.544297089800239} +{"Pretrain/Learning Rate": 3.7556326321711796e-05, "Pretrain/Loss": 2.095381498336792, "Pretrain/Loss (Raw)": 2.2177109718322754, "Pretrain/Step": 3362, "Pretrain/Step Time": 8.553583413362503} +{"Pretrain/Learning Rate": 3.7548984228877313e-05, "Pretrain/Loss": 2.091222047805786, "Pretrain/Loss (Raw)": 2.092251777648926, "Pretrain/Step": 3363, "Pretrain/Step Time": 8.553085703402758} +{"Pretrain/Learning Rate": 3.754164068883484e-05, "Pretrain/Loss": 2.091484308242798, "Pretrain/Loss (Raw)": 2.0449893474578857, "Pretrain/Step": 3364, "Pretrain/Step Time": 8.545526795089245} +{"Pretrain/Learning Rate": 3.7534295702431254e-05, "Pretrain/Loss": 2.0916318893432617, "Pretrain/Loss (Raw)": 2.129056692123413, "Pretrain/Step": 3365, "Pretrain/Step Time": 8.543997436761856} +{"Pretrain/Learning Rate": 3.7526949270513635e-05, "Pretrain/Loss": 2.091397285461426, "Pretrain/Loss (Raw)": 2.099493980407715, "Pretrain/Step": 3366, "Pretrain/Step Time": 8.54429230093956} +{"Pretrain/Learning Rate": 3.751960139392919e-05, "Pretrain/Loss": 2.0900917053222656, "Pretrain/Loss (Raw)": 1.9360463619232178, "Pretrain/Step": 3367, "Pretrain/Step Time": 8.541540889069438} +{"Pretrain/Learning Rate": 3.7512252073525325e-05, "Pretrain/Loss": 2.091325521469116, "Pretrain/Loss (Raw)": 2.27091908454895, "Pretrain/Step": 3368, "Pretrain/Step Time": 8.553883472457528} +{"Pretrain/Learning Rate": 3.7504901310149574e-05, "Pretrain/Loss": 2.091122627258301, "Pretrain/Loss (Raw)": 2.2536158561706543, "Pretrain/Step": 3369, "Pretrain/Step Time": 8.553953407332301} +{"Pretrain/Learning Rate": 3.74975491046497e-05, "Pretrain/Loss": 2.0896403789520264, "Pretrain/Loss (Raw)": 1.9928315877914429, "Pretrain/Step": 3370, "Pretrain/Step Time": 8.547785058617592} +{"Pretrain/Learning Rate": 3.7490195457873555e-05, "Pretrain/Loss": 2.093433141708374, "Pretrain/Loss (Raw)": 2.215059518814087, "Pretrain/Step": 3371, "Pretrain/Step Time": 8.545010637491941} +{"Pretrain/Learning Rate": 3.748284037066922e-05, "Pretrain/Loss": 2.0939528942108154, "Pretrain/Loss (Raw)": 2.231201648712158, "Pretrain/Step": 3372, "Pretrain/Step Time": 8.552649836987257} +{"Pretrain/Learning Rate": 3.7475483843884916e-05, "Pretrain/Loss": 2.0970263481140137, "Pretrain/Loss (Raw)": 2.361708641052246, "Pretrain/Step": 3373, "Pretrain/Step Time": 8.553397208452225} +{"Pretrain/Learning Rate": 3.746812587836903e-05, "Pretrain/Loss": 2.096769332885742, "Pretrain/Loss (Raw)": 1.992965579032898, "Pretrain/Step": 3374, "Pretrain/Step Time": 8.55494531057775} +{"Pretrain/Learning Rate": 3.746076647497011e-05, "Pretrain/Loss": 2.0980467796325684, "Pretrain/Loss (Raw)": 2.227222204208374, "Pretrain/Step": 3375, "Pretrain/Step Time": 8.555353503674269} +{"Pretrain/Learning Rate": 3.7453405634536894e-05, "Pretrain/Loss": 2.0984950065612793, "Pretrain/Loss (Raw)": 2.213874340057373, "Pretrain/Step": 3376, "Pretrain/Step Time": 8.54712763428688} +{"Pretrain/Learning Rate": 3.744604335791825e-05, "Pretrain/Loss": 2.1016197204589844, "Pretrain/Loss (Raw)": 2.473116397857666, "Pretrain/Step": 3377, "Pretrain/Step Time": 8.547590970993042} +{"Pretrain/Learning Rate": 3.743867964596324e-05, "Pretrain/Loss": 2.100996255874634, "Pretrain/Loss (Raw)": 1.9744945764541626, "Pretrain/Step": 3378, "Pretrain/Step Time": 8.54472696594894} +{"Pretrain/Learning Rate": 3.743131449952107e-05, "Pretrain/Loss": 2.099585771560669, "Pretrain/Loss (Raw)": 2.1217429637908936, "Pretrain/Step": 3379, "Pretrain/Step Time": 8.549066636711359} +{"Pretrain/Learning Rate": 3.7423947919441147e-05, "Pretrain/Loss": 2.0992376804351807, "Pretrain/Loss (Raw)": 1.9671553373336792, "Pretrain/Step": 3380, "Pretrain/Step Time": 8.55432952940464} +{"Pretrain/Learning Rate": 3.7416579906573e-05, "Pretrain/Loss": 2.0977931022644043, "Pretrain/Loss (Raw)": 1.7634434700012207, "Pretrain/Step": 3381, "Pretrain/Step Time": 8.549711376428604} +{"Pretrain/Learning Rate": 3.7409210461766355e-05, "Pretrain/Loss": 2.099743366241455, "Pretrain/Loss (Raw)": 2.3183982372283936, "Pretrain/Step": 3382, "Pretrain/Step Time": 8.55247257836163} +{"Pretrain/Learning Rate": 3.740183958587108e-05, "Pretrain/Loss": 2.0986008644104004, "Pretrain/Loss (Raw)": 1.92830228805542, "Pretrain/Step": 3383, "Pretrain/Step Time": 8.546802571043372} +{"Pretrain/Learning Rate": 3.7394467279737224e-05, "Pretrain/Loss": 2.0972349643707275, "Pretrain/Loss (Raw)": 1.9068645238876343, "Pretrain/Step": 3384, "Pretrain/Step Time": 8.542493429034948} +{"Pretrain/Learning Rate": 3.7387093544215003e-05, "Pretrain/Loss": 2.0999722480773926, "Pretrain/Loss (Raw)": 2.2122673988342285, "Pretrain/Step": 3385, "Pretrain/Step Time": 8.549040634185076} +{"Pretrain/Learning Rate": 3.7379718380154777e-05, "Pretrain/Loss": 2.1006855964660645, "Pretrain/Loss (Raw)": 1.9590567350387573, "Pretrain/Step": 3386, "Pretrain/Step Time": 8.552780695259571} +{"Pretrain/Learning Rate": 3.737234178840709e-05, "Pretrain/Loss": 2.1003313064575195, "Pretrain/Loss (Raw)": 1.9418343305587769, "Pretrain/Step": 3387, "Pretrain/Step Time": 8.550286179408431} +{"Pretrain/Learning Rate": 3.736496376982266e-05, "Pretrain/Loss": 2.1021931171417236, "Pretrain/Loss (Raw)": 2.221998691558838, "Pretrain/Step": 3388, "Pretrain/Step Time": 8.554211327806115} +{"Pretrain/Learning Rate": 3.7357584325252336e-05, "Pretrain/Loss": 2.1022214889526367, "Pretrain/Loss (Raw)": 2.097869396209717, "Pretrain/Step": 3389, "Pretrain/Step Time": 8.550986958667636} +{"Pretrain/Learning Rate": 3.7350203455547155e-05, "Pretrain/Loss": 2.102323293685913, "Pretrain/Loss (Raw)": 1.9343451261520386, "Pretrain/Step": 3390, "Pretrain/Step Time": 8.550721820443869} +{"Pretrain/Learning Rate": 3.7342821161558316e-05, "Pretrain/Loss": 2.104166030883789, "Pretrain/Loss (Raw)": 2.1046030521392822, "Pretrain/Step": 3391, "Pretrain/Step Time": 8.546293614432216} +{"Pretrain/Learning Rate": 3.7335437444137175e-05, "Pretrain/Loss": 2.10494327545166, "Pretrain/Loss (Raw)": 2.2073590755462646, "Pretrain/Step": 3392, "Pretrain/Step Time": 8.551637196913362} +{"Pretrain/Learning Rate": 3.732805230413527e-05, "Pretrain/Loss": 2.103639602661133, "Pretrain/Loss (Raw)": 2.1709282398223877, "Pretrain/Step": 3393, "Pretrain/Step Time": 8.55107306316495} +{"Pretrain/Learning Rate": 3.732066574240428e-05, "Pretrain/Loss": 2.1048057079315186, "Pretrain/Loss (Raw)": 2.1764302253723145, "Pretrain/Step": 3394, "Pretrain/Step Time": 8.548563105985522} +{"Pretrain/Learning Rate": 3.731327775979605e-05, "Pretrain/Loss": 2.1042582988739014, "Pretrain/Loss (Raw)": 2.1362040042877197, "Pretrain/Step": 3395, "Pretrain/Step Time": 8.546026507392526} +{"Pretrain/Learning Rate": 3.730588835716262e-05, "Pretrain/Loss": 2.103405475616455, "Pretrain/Loss (Raw)": 2.09602427482605, "Pretrain/Step": 3396, "Pretrain/Step Time": 8.546463672071695} +{"Pretrain/Learning Rate": 3.729849753535615e-05, "Pretrain/Loss": 2.106991767883301, "Pretrain/Loss (Raw)": 2.5547196865081787, "Pretrain/Step": 3397, "Pretrain/Step Time": 8.543208179995418} +{"Pretrain/Learning Rate": 3.7291105295229004e-05, "Pretrain/Loss": 2.107173442840576, "Pretrain/Loss (Raw)": 2.0588953495025635, "Pretrain/Step": 3398, "Pretrain/Step Time": 8.543844897300005} +{"Pretrain/Learning Rate": 3.728371163763366e-05, "Pretrain/Loss": 2.1062936782836914, "Pretrain/Loss (Raw)": 2.0494742393493652, "Pretrain/Step": 3399, "Pretrain/Step Time": 8.546174500137568} +{"Pretrain/Learning Rate": 3.727631656342282e-05, "Pretrain/Loss": 2.1108438968658447, "Pretrain/Loss (Raw)": 2.7018191814422607, "Pretrain/Step": 3400, "Pretrain/Step Time": 8.54207006469369} +{"Pretrain/Learning Rate": 3.7268920073449296e-05, "Pretrain/Loss": 2.1118836402893066, "Pretrain/Loss (Raw)": 2.0054972171783447, "Pretrain/Step": 3401, "Pretrain/Step Time": 8.532936790958047} +{"Pretrain/Learning Rate": 3.72615221685661e-05, "Pretrain/Loss": 2.113341808319092, "Pretrain/Loss (Raw)": 2.260385274887085, "Pretrain/Step": 3402, "Pretrain/Step Time": 8.539731839671731} +{"Pretrain/Learning Rate": 3.725412284962639e-05, "Pretrain/Loss": 2.1131887435913086, "Pretrain/Loss (Raw)": 2.0690765380859375, "Pretrain/Step": 3403, "Pretrain/Step Time": 8.53983529470861} +{"Pretrain/Learning Rate": 3.724672211748349e-05, "Pretrain/Loss": 2.1140644550323486, "Pretrain/Loss (Raw)": 2.0387136936187744, "Pretrain/Step": 3404, "Pretrain/Step Time": 8.549175711348653} +{"Pretrain/Learning Rate": 3.723931997299089e-05, "Pretrain/Loss": 2.1135873794555664, "Pretrain/Loss (Raw)": 2.187206745147705, "Pretrain/Step": 3405, "Pretrain/Step Time": 8.55112386122346} +{"Pretrain/Learning Rate": 3.723191641700223e-05, "Pretrain/Loss": 2.112391710281372, "Pretrain/Loss (Raw)": 1.996139645576477, "Pretrain/Step": 3406, "Pretrain/Step Time": 8.543906703591347} +{"Pretrain/Learning Rate": 3.7224511450371334e-05, "Pretrain/Loss": 2.1108460426330566, "Pretrain/Loss (Raw)": 1.794203281402588, "Pretrain/Step": 3407, "Pretrain/Step Time": 8.547065230086446} +{"Pretrain/Learning Rate": 3.721710507395218e-05, "Pretrain/Loss": 2.108452796936035, "Pretrain/Loss (Raw)": 1.9757241010665894, "Pretrain/Step": 3408, "Pretrain/Step Time": 8.539816735312343} +{"Pretrain/Learning Rate": 3.720969728859889e-05, "Pretrain/Loss": 2.108027696609497, "Pretrain/Loss (Raw)": 2.1283249855041504, "Pretrain/Step": 3409, "Pretrain/Step Time": 8.540171433240175} +{"Pretrain/Learning Rate": 3.720228809516578e-05, "Pretrain/Loss": 2.110227108001709, "Pretrain/Loss (Raw)": 2.259580135345459, "Pretrain/Step": 3410, "Pretrain/Step Time": 8.554100757464767} +{"Pretrain/Learning Rate": 3.719487749450731e-05, "Pretrain/Loss": 2.1094326972961426, "Pretrain/Loss (Raw)": 2.1079628467559814, "Pretrain/Step": 3411, "Pretrain/Step Time": 8.554234806448221} +{"Pretrain/Learning Rate": 3.718746548747809e-05, "Pretrain/Loss": 2.1064021587371826, "Pretrain/Loss (Raw)": 1.9944002628326416, "Pretrain/Step": 3412, "Pretrain/Step Time": 8.542631840333343} +{"Pretrain/Learning Rate": 3.7180052074932934e-05, "Pretrain/Loss": 2.106825351715088, "Pretrain/Loss (Raw)": 2.226508617401123, "Pretrain/Step": 3413, "Pretrain/Step Time": 8.544432818889618} +{"Pretrain/Learning Rate": 3.7172637257726774e-05, "Pretrain/Loss": 2.1071786880493164, "Pretrain/Loss (Raw)": 2.0409183502197266, "Pretrain/Step": 3414, "Pretrain/Step Time": 8.542665272951126} +{"Pretrain/Learning Rate": 3.716522103671473e-05, "Pretrain/Loss": 2.1084418296813965, "Pretrain/Loss (Raw)": 2.048259735107422, "Pretrain/Step": 3415, "Pretrain/Step Time": 8.542416239157319} +{"Pretrain/Learning Rate": 3.715780341275207e-05, "Pretrain/Loss": 2.105555295944214, "Pretrain/Loss (Raw)": 1.8518435955047607, "Pretrain/Step": 3416, "Pretrain/Step Time": 8.546025764197111} +{"Pretrain/Learning Rate": 3.715038438669423e-05, "Pretrain/Loss": 2.1052064895629883, "Pretrain/Loss (Raw)": 2.069228172302246, "Pretrain/Step": 3417, "Pretrain/Step Time": 8.546563828364015} +{"Pretrain/Learning Rate": 3.7142963959396806e-05, "Pretrain/Loss": 2.1061108112335205, "Pretrain/Loss (Raw)": 2.2243504524230957, "Pretrain/Step": 3418, "Pretrain/Step Time": 8.543774671852589} +{"Pretrain/Learning Rate": 3.713554213171556e-05, "Pretrain/Loss": 2.105722427368164, "Pretrain/Loss (Raw)": 1.9810068607330322, "Pretrain/Step": 3419, "Pretrain/Step Time": 8.546073129400611} +{"Pretrain/Learning Rate": 3.712811890450641e-05, "Pretrain/Loss": 2.1063904762268066, "Pretrain/Loss (Raw)": 2.2048373222351074, "Pretrain/Step": 3420, "Pretrain/Step Time": 8.542430082336068} +{"Pretrain/Learning Rate": 3.712069427862544e-05, "Pretrain/Loss": 2.1053900718688965, "Pretrain/Loss (Raw)": 2.1588010787963867, "Pretrain/Step": 3421, "Pretrain/Step Time": 8.546331560239196} +{"Pretrain/Learning Rate": 3.711326825492889e-05, "Pretrain/Loss": 2.1062228679656982, "Pretrain/Loss (Raw)": 1.987216830253601, "Pretrain/Step": 3422, "Pretrain/Step Time": 8.544913195073605} +{"Pretrain/Learning Rate": 3.7105840834273164e-05, "Pretrain/Loss": 2.107956886291504, "Pretrain/Loss (Raw)": 2.2296581268310547, "Pretrain/Step": 3423, "Pretrain/Step Time": 8.549037653952837} +{"Pretrain/Learning Rate": 3.7098412017514835e-05, "Pretrain/Loss": 2.1100590229034424, "Pretrain/Loss (Raw)": 2.158871650695801, "Pretrain/Step": 3424, "Pretrain/Step Time": 8.540081588551402} +{"Pretrain/Learning Rate": 3.7090981805510615e-05, "Pretrain/Loss": 2.1095123291015625, "Pretrain/Loss (Raw)": 1.9814674854278564, "Pretrain/Step": 3425, "Pretrain/Step Time": 8.5418017283082} +{"Pretrain/Learning Rate": 3.7083550199117403e-05, "Pretrain/Loss": 2.111518383026123, "Pretrain/Loss (Raw)": 2.36013126373291, "Pretrain/Step": 3426, "Pretrain/Step Time": 8.544565198943019} +{"Pretrain/Learning Rate": 3.707611719919224e-05, "Pretrain/Loss": 2.1112537384033203, "Pretrain/Loss (Raw)": 1.9880160093307495, "Pretrain/Step": 3427, "Pretrain/Step Time": 8.544553063809872} +{"Pretrain/Learning Rate": 3.706868280659234e-05, "Pretrain/Loss": 2.1120710372924805, "Pretrain/Loss (Raw)": 2.13985276222229, "Pretrain/Step": 3428, "Pretrain/Step Time": 8.546535829082131} +{"Pretrain/Learning Rate": 3.7061247022175064e-05, "Pretrain/Loss": 2.1112771034240723, "Pretrain/Loss (Raw)": 2.0077736377716064, "Pretrain/Step": 3429, "Pretrain/Step Time": 8.542869521304965} +{"Pretrain/Learning Rate": 3.705380984679795e-05, "Pretrain/Loss": 2.1129205226898193, "Pretrain/Loss (Raw)": 2.0407536029815674, "Pretrain/Step": 3430, "Pretrain/Step Time": 8.542010396718979} +{"Pretrain/Learning Rate": 3.704637128131868e-05, "Pretrain/Loss": 2.113675355911255, "Pretrain/Loss (Raw)": 2.0972421169281006, "Pretrain/Step": 3431, "Pretrain/Step Time": 8.541777258738875} +{"Pretrain/Learning Rate": 3.7038931326595115e-05, "Pretrain/Loss": 2.112992525100708, "Pretrain/Loss (Raw)": 2.0876474380493164, "Pretrain/Step": 3432, "Pretrain/Step Time": 8.542188676074147} +{"Pretrain/Learning Rate": 3.703148998348526e-05, "Pretrain/Loss": 2.1139698028564453, "Pretrain/Loss (Raw)": 2.201711893081665, "Pretrain/Step": 3433, "Pretrain/Step Time": 8.538772055879235} +{"Pretrain/Learning Rate": 3.702404725284728e-05, "Pretrain/Loss": 2.1160874366760254, "Pretrain/Loss (Raw)": 2.4247970581054688, "Pretrain/Step": 3434, "Pretrain/Step Time": 8.546152167022228} +{"Pretrain/Learning Rate": 3.7016603135539524e-05, "Pretrain/Loss": 2.113029956817627, "Pretrain/Loss (Raw)": 2.0341579914093018, "Pretrain/Step": 3435, "Pretrain/Step Time": 8.545077821239829} +{"Pretrain/Learning Rate": 3.700915763242046e-05, "Pretrain/Loss": 2.1120247840881348, "Pretrain/Loss (Raw)": 2.063950538635254, "Pretrain/Step": 3436, "Pretrain/Step Time": 8.548713892698288} +{"Pretrain/Learning Rate": 3.700171074434876e-05, "Pretrain/Loss": 2.1103267669677734, "Pretrain/Loss (Raw)": 2.0706264972686768, "Pretrain/Step": 3437, "Pretrain/Step Time": 8.550133844837546} +{"Pretrain/Learning Rate": 3.699426247218321e-05, "Pretrain/Loss": 2.1114072799682617, "Pretrain/Loss (Raw)": 2.172126054763794, "Pretrain/Step": 3438, "Pretrain/Step Time": 8.55114253796637} +{"Pretrain/Learning Rate": 3.69868128167828e-05, "Pretrain/Loss": 2.1142754554748535, "Pretrain/Loss (Raw)": 2.3090388774871826, "Pretrain/Step": 3439, "Pretrain/Step Time": 8.548419455066323} +{"Pretrain/Learning Rate": 3.697936177900665e-05, "Pretrain/Loss": 2.11456036567688, "Pretrain/Loss (Raw)": 2.1079769134521484, "Pretrain/Step": 3440, "Pretrain/Step Time": 8.542244059965014} +{"Pretrain/Learning Rate": 3.697190935971405e-05, "Pretrain/Loss": 2.1172537803649902, "Pretrain/Loss (Raw)": 2.3582239151000977, "Pretrain/Step": 3441, "Pretrain/Step Time": 8.536740120500326} +{"Pretrain/Learning Rate": 3.696445555976445e-05, "Pretrain/Loss": 2.117271900177002, "Pretrain/Loss (Raw)": 2.041764259338379, "Pretrain/Step": 3442, "Pretrain/Step Time": 8.541492469608784} +{"Pretrain/Learning Rate": 3.695700038001746e-05, "Pretrain/Loss": 2.117818832397461, "Pretrain/Loss (Raw)": 2.269440174102783, "Pretrain/Step": 3443, "Pretrain/Step Time": 8.544816074892879} +{"Pretrain/Learning Rate": 3.694954382133284e-05, "Pretrain/Loss": 2.116581439971924, "Pretrain/Loss (Raw)": 2.032843589782715, "Pretrain/Step": 3444, "Pretrain/Step Time": 8.545770205557346} +{"Pretrain/Learning Rate": 3.694208588457051e-05, "Pretrain/Loss": 2.1170144081115723, "Pretrain/Loss (Raw)": 2.0307936668395996, "Pretrain/Step": 3445, "Pretrain/Step Time": 8.539099076762795} +{"Pretrain/Learning Rate": 3.693462657059058e-05, "Pretrain/Loss": 2.1148428916931152, "Pretrain/Loss (Raw)": 1.996443748474121, "Pretrain/Step": 3446, "Pretrain/Step Time": 8.539163146167994} +{"Pretrain/Learning Rate": 3.6927165880253266e-05, "Pretrain/Loss": 2.11726713180542, "Pretrain/Loss (Raw)": 2.3046138286590576, "Pretrain/Step": 3447, "Pretrain/Step Time": 8.552126141265035} +{"Pretrain/Learning Rate": 3.691970381441898e-05, "Pretrain/Loss": 2.118335723876953, "Pretrain/Loss (Raw)": 2.184353828430176, "Pretrain/Step": 3448, "Pretrain/Step Time": 8.546609301120043} +{"Pretrain/Learning Rate": 3.691224037394828e-05, "Pretrain/Loss": 2.117887020111084, "Pretrain/Loss (Raw)": 2.0628979206085205, "Pretrain/Step": 3449, "Pretrain/Step Time": 8.546860186383128} +{"Pretrain/Learning Rate": 3.69047755597019e-05, "Pretrain/Loss": 2.118011951446533, "Pretrain/Loss (Raw)": 2.042341709136963, "Pretrain/Step": 3450, "Pretrain/Step Time": 8.55025740712881} +{"Pretrain/Learning Rate": 3.68973093725407e-05, "Pretrain/Loss": 2.1157450675964355, "Pretrain/Loss (Raw)": 1.7851732969284058, "Pretrain/Step": 3451, "Pretrain/Step Time": 8.550747895613313} +{"Pretrain/Learning Rate": 3.688984181332572e-05, "Pretrain/Loss": 2.1130993366241455, "Pretrain/Loss (Raw)": 2.083132028579712, "Pretrain/Step": 3452, "Pretrain/Step Time": 8.553725011646748} +{"Pretrain/Learning Rate": 3.688237288291815e-05, "Pretrain/Loss": 2.110591173171997, "Pretrain/Loss (Raw)": 1.9411574602127075, "Pretrain/Step": 3453, "Pretrain/Step Time": 8.558029429987073} +{"Pretrain/Learning Rate": 3.687490258217935e-05, "Pretrain/Loss": 2.108149528503418, "Pretrain/Loss (Raw)": 1.9961931705474854, "Pretrain/Step": 3454, "Pretrain/Step Time": 8.553663980215788} +{"Pretrain/Learning Rate": 3.6867430911970824e-05, "Pretrain/Loss": 2.11057186126709, "Pretrain/Loss (Raw)": 2.123870372772217, "Pretrain/Step": 3455, "Pretrain/Step Time": 8.552054138854146} +{"Pretrain/Learning Rate": 3.6859957873154256e-05, "Pretrain/Loss": 2.110592842102051, "Pretrain/Loss (Raw)": 2.015638828277588, "Pretrain/Step": 3456, "Pretrain/Step Time": 8.551518429070711} +{"Pretrain/Learning Rate": 3.6852483466591447e-05, "Pretrain/Loss": 2.1106009483337402, "Pretrain/Loss (Raw)": 2.051501750946045, "Pretrain/Step": 3457, "Pretrain/Step Time": 8.554382992908359} +{"Pretrain/Learning Rate": 3.6845007693144404e-05, "Pretrain/Loss": 2.110457181930542, "Pretrain/Loss (Raw)": 1.9814718961715698, "Pretrain/Step": 3458, "Pretrain/Step Time": 8.553989090025425} +{"Pretrain/Learning Rate": 3.683753055367526e-05, "Pretrain/Loss": 2.1115713119506836, "Pretrain/Loss (Raw)": 2.202575922012329, "Pretrain/Step": 3459, "Pretrain/Step Time": 8.5522372238338} +{"Pretrain/Learning Rate": 3.68300520490463e-05, "Pretrain/Loss": 2.1113686561584473, "Pretrain/Loss (Raw)": 2.209589958190918, "Pretrain/Step": 3460, "Pretrain/Step Time": 8.557865396142006} +{"Pretrain/Learning Rate": 3.682257218012e-05, "Pretrain/Loss": 2.110098361968994, "Pretrain/Loss (Raw)": 2.0313079357147217, "Pretrain/Step": 3461, "Pretrain/Step Time": 8.550296681001782} +{"Pretrain/Learning Rate": 3.6815090947758966e-05, "Pretrain/Loss": 2.109715223312378, "Pretrain/Loss (Raw)": 2.208847999572754, "Pretrain/Step": 3462, "Pretrain/Step Time": 8.548576602712274} +{"Pretrain/Learning Rate": 3.6807608352825975e-05, "Pretrain/Loss": 2.1064822673797607, "Pretrain/Loss (Raw)": 1.9479163885116577, "Pretrain/Step": 3463, "Pretrain/Step Time": 8.54941556788981} +{"Pretrain/Learning Rate": 3.680012439618394e-05, "Pretrain/Loss": 2.1068131923675537, "Pretrain/Loss (Raw)": 2.078338861465454, "Pretrain/Step": 3464, "Pretrain/Step Time": 8.552493361756206} +{"Pretrain/Learning Rate": 3.679263907869596e-05, "Pretrain/Loss": 2.107367515563965, "Pretrain/Loss (Raw)": 2.1202147006988525, "Pretrain/Step": 3465, "Pretrain/Step Time": 8.547531830146909} +{"Pretrain/Learning Rate": 3.678515240122527e-05, "Pretrain/Loss": 2.106776237487793, "Pretrain/Loss (Raw)": 2.049757719039917, "Pretrain/Step": 3466, "Pretrain/Step Time": 8.552502086386085} +{"Pretrain/Learning Rate": 3.677766436463527e-05, "Pretrain/Loss": 2.104905843734741, "Pretrain/Loss (Raw)": 2.0502803325653076, "Pretrain/Step": 3467, "Pretrain/Step Time": 8.552580613642931} +{"Pretrain/Learning Rate": 3.677017496978952e-05, "Pretrain/Loss": 2.1052463054656982, "Pretrain/Loss (Raw)": 2.1534054279327393, "Pretrain/Step": 3468, "Pretrain/Step Time": 8.553294319659472} +{"Pretrain/Learning Rate": 3.6762684217551735e-05, "Pretrain/Loss": 2.105536699295044, "Pretrain/Loss (Raw)": 2.1921825408935547, "Pretrain/Step": 3469, "Pretrain/Step Time": 8.549476759508252} +{"Pretrain/Learning Rate": 3.675519210878577e-05, "Pretrain/Loss": 2.1049375534057617, "Pretrain/Loss (Raw)": 2.0351505279541016, "Pretrain/Step": 3470, "Pretrain/Step Time": 8.558044966310263} +{"Pretrain/Learning Rate": 3.6747698644355664e-05, "Pretrain/Loss": 2.1044352054595947, "Pretrain/Loss (Raw)": 2.1053543090820312, "Pretrain/Step": 3471, "Pretrain/Step Time": 8.562447048723698} +{"Pretrain/Learning Rate": 3.674020382512559e-05, "Pretrain/Loss": 2.1041507720947266, "Pretrain/Loss (Raw)": 2.0913069248199463, "Pretrain/Step": 3472, "Pretrain/Step Time": 8.555223213508725} +{"Pretrain/Learning Rate": 3.673270765195989e-05, "Pretrain/Loss": 2.104414463043213, "Pretrain/Loss (Raw)": 2.103721857070923, "Pretrain/Step": 3473, "Pretrain/Step Time": 8.553658038377762} +{"Pretrain/Learning Rate": 3.672521012572307e-05, "Pretrain/Loss": 2.105241298675537, "Pretrain/Loss (Raw)": 2.085177183151245, "Pretrain/Step": 3474, "Pretrain/Step Time": 8.55990283191204} +{"Pretrain/Learning Rate": 3.671771124727975e-05, "Pretrain/Loss": 2.104562282562256, "Pretrain/Loss (Raw)": 2.2003307342529297, "Pretrain/Step": 3475, "Pretrain/Step Time": 8.559457633644342} +{"Pretrain/Learning Rate": 3.671021101749476e-05, "Pretrain/Loss": 2.1073217391967773, "Pretrain/Loss (Raw)": 2.2265055179595947, "Pretrain/Step": 3476, "Pretrain/Step Time": 8.560934755951166} +{"Pretrain/Learning Rate": 3.670270943723305e-05, "Pretrain/Loss": 2.104445457458496, "Pretrain/Loss (Raw)": 1.7964766025543213, "Pretrain/Step": 3477, "Pretrain/Step Time": 8.559975469484925} +{"Pretrain/Learning Rate": 3.669520650735975e-05, "Pretrain/Loss": 2.104717254638672, "Pretrain/Loss (Raw)": 1.939476490020752, "Pretrain/Step": 3478, "Pretrain/Step Time": 8.560414984822273} +{"Pretrain/Learning Rate": 3.668770222874012e-05, "Pretrain/Loss": 2.1089963912963867, "Pretrain/Loss (Raw)": 2.4541828632354736, "Pretrain/Step": 3479, "Pretrain/Step Time": 8.553830191493034} +{"Pretrain/Learning Rate": 3.6680196602239596e-05, "Pretrain/Loss": 2.1086857318878174, "Pretrain/Loss (Raw)": 1.8900679349899292, "Pretrain/Step": 3480, "Pretrain/Step Time": 8.55319263599813} +{"Pretrain/Learning Rate": 3.667268962872376e-05, "Pretrain/Loss": 2.105018138885498, "Pretrain/Loss (Raw)": 1.7974746227264404, "Pretrain/Step": 3481, "Pretrain/Step Time": 8.557408656924963} +{"Pretrain/Learning Rate": 3.666518130905836e-05, "Pretrain/Loss": 2.105748176574707, "Pretrain/Loss (Raw)": 2.0707623958587646, "Pretrain/Step": 3482, "Pretrain/Step Time": 8.552610382437706} +{"Pretrain/Learning Rate": 3.665767164410928e-05, "Pretrain/Loss": 2.1083312034606934, "Pretrain/Loss (Raw)": 2.3047778606414795, "Pretrain/Step": 3483, "Pretrain/Step Time": 8.561225784942508} +{"Pretrain/Learning Rate": 3.665016063474257e-05, "Pretrain/Loss": 2.111337661743164, "Pretrain/Loss (Raw)": 2.4839906692504883, "Pretrain/Step": 3484, "Pretrain/Step Time": 8.553181920200586} +{"Pretrain/Learning Rate": 3.664264828182444e-05, "Pretrain/Loss": 2.1093034744262695, "Pretrain/Loss (Raw)": 2.040827989578247, "Pretrain/Step": 3485, "Pretrain/Step Time": 8.551191110163927} +{"Pretrain/Learning Rate": 3.663513458622124e-05, "Pretrain/Loss": 2.108633279800415, "Pretrain/Loss (Raw)": 1.9649955034255981, "Pretrain/Step": 3486, "Pretrain/Step Time": 8.550174402073026} +{"Pretrain/Learning Rate": 3.662761954879951e-05, "Pretrain/Loss": 2.108351230621338, "Pretrain/Loss (Raw)": 1.989674687385559, "Pretrain/Step": 3487, "Pretrain/Step Time": 8.553550334647298} +{"Pretrain/Learning Rate": 3.662010317042589e-05, "Pretrain/Loss": 2.1079232692718506, "Pretrain/Loss (Raw)": 1.9768364429473877, "Pretrain/Step": 3488, "Pretrain/Step Time": 8.55600618943572} +{"Pretrain/Learning Rate": 3.661258545196722e-05, "Pretrain/Loss": 2.1072773933410645, "Pretrain/Loss (Raw)": 2.1858859062194824, "Pretrain/Step": 3489, "Pretrain/Step Time": 8.566655606031418} +{"Pretrain/Learning Rate": 3.6605066394290476e-05, "Pretrain/Loss": 2.1055235862731934, "Pretrain/Loss (Raw)": 1.9932001829147339, "Pretrain/Step": 3490, "Pretrain/Step Time": 8.558010732755065} +{"Pretrain/Learning Rate": 3.659754599826279e-05, "Pretrain/Loss": 2.1061041355133057, "Pretrain/Loss (Raw)": 2.1665632724761963, "Pretrain/Step": 3491, "Pretrain/Step Time": 8.553445467725396} +{"Pretrain/Learning Rate": 3.659002426475145e-05, "Pretrain/Loss": 2.1073503494262695, "Pretrain/Loss (Raw)": 2.2045180797576904, "Pretrain/Step": 3492, "Pretrain/Step Time": 8.558162750676274} +{"Pretrain/Learning Rate": 3.65825011946239e-05, "Pretrain/Loss": 2.1064014434814453, "Pretrain/Loss (Raw)": 2.0076098442077637, "Pretrain/Step": 3493, "Pretrain/Step Time": 8.558091256767511} +{"Pretrain/Learning Rate": 3.6574976788747725e-05, "Pretrain/Loss": 2.1048078536987305, "Pretrain/Loss (Raw)": 1.895484209060669, "Pretrain/Step": 3494, "Pretrain/Step Time": 8.55389546789229} +{"Pretrain/Learning Rate": 3.6567451047990696e-05, "Pretrain/Loss": 2.105046510696411, "Pretrain/Loss (Raw)": 1.9665920734405518, "Pretrain/Step": 3495, "Pretrain/Step Time": 8.555367963388562} +{"Pretrain/Learning Rate": 3.6559923973220695e-05, "Pretrain/Loss": 2.1029698848724365, "Pretrain/Loss (Raw)": 2.005115032196045, "Pretrain/Step": 3496, "Pretrain/Step Time": 8.550405986607075} +{"Pretrain/Learning Rate": 3.65523955653058e-05, "Pretrain/Loss": 2.103182792663574, "Pretrain/Loss (Raw)": 2.2808706760406494, "Pretrain/Step": 3497, "Pretrain/Step Time": 8.548870969563723} +{"Pretrain/Learning Rate": 3.65448658251142e-05, "Pretrain/Loss": 2.1048121452331543, "Pretrain/Loss (Raw)": 2.2013726234436035, "Pretrain/Step": 3498, "Pretrain/Step Time": 8.547719715163112} +{"Pretrain/Learning Rate": 3.653733475351428e-05, "Pretrain/Loss": 2.103090763092041, "Pretrain/Loss (Raw)": 1.994713306427002, "Pretrain/Step": 3499, "Pretrain/Step Time": 8.54629711061716} +{"Pretrain/Learning Rate": 3.6529802351374545e-05, "Pretrain/Loss": 2.102349281311035, "Pretrain/Loss (Raw)": 2.1363346576690674, "Pretrain/Step": 3500, "Pretrain/Step Time": 8.542315699160099} +{"Pretrain/Learning Rate": 3.652226861956368e-05, "Pretrain/Loss": 2.100031614303589, "Pretrain/Loss (Raw)": 2.065028429031372, "Pretrain/Step": 3501, "Pretrain/Step Time": 8.548479171469808} +{"Pretrain/Learning Rate": 3.65147335589505e-05, "Pretrain/Loss": 2.100543975830078, "Pretrain/Loss (Raw)": 2.058544397354126, "Pretrain/Step": 3502, "Pretrain/Step Time": 8.54331861063838} +{"Pretrain/Learning Rate": 3.650719717040398e-05, "Pretrain/Loss": 2.100144863128662, "Pretrain/Loss (Raw)": 2.176135540008545, "Pretrain/Step": 3503, "Pretrain/Step Time": 8.544603014364839} +{"Pretrain/Learning Rate": 3.649965945479326e-05, "Pretrain/Loss": 2.0989723205566406, "Pretrain/Loss (Raw)": 2.063774585723877, "Pretrain/Step": 3504, "Pretrain/Step Time": 8.540776681154966} +{"Pretrain/Learning Rate": 3.649212041298763e-05, "Pretrain/Loss": 2.0966711044311523, "Pretrain/Loss (Raw)": 2.1786038875579834, "Pretrain/Step": 3505, "Pretrain/Step Time": 8.541913928464055} +{"Pretrain/Learning Rate": 3.648458004585652e-05, "Pretrain/Loss": 2.0992276668548584, "Pretrain/Loss (Raw)": 2.3016984462738037, "Pretrain/Step": 3506, "Pretrain/Step Time": 8.54847376793623} +{"Pretrain/Learning Rate": 3.647703835426952e-05, "Pretrain/Loss": 2.1002469062805176, "Pretrain/Loss (Raw)": 2.2522013187408447, "Pretrain/Step": 3507, "Pretrain/Step Time": 8.554420644417405} +{"Pretrain/Learning Rate": 3.646949533909637e-05, "Pretrain/Loss": 2.1017043590545654, "Pretrain/Loss (Raw)": 2.1537063121795654, "Pretrain/Step": 3508, "Pretrain/Step Time": 8.546804640442133} +{"Pretrain/Learning Rate": 3.646195100120698e-05, "Pretrain/Loss": 2.105163812637329, "Pretrain/Loss (Raw)": 2.2062907218933105, "Pretrain/Step": 3509, "Pretrain/Step Time": 8.54747404716909} +{"Pretrain/Learning Rate": 3.645440534147139e-05, "Pretrain/Loss": 2.1032185554504395, "Pretrain/Loss (Raw)": 2.0693838596343994, "Pretrain/Step": 3510, "Pretrain/Step Time": 8.546230928972363} +{"Pretrain/Learning Rate": 3.644685836075979e-05, "Pretrain/Loss": 2.104123592376709, "Pretrain/Loss (Raw)": 2.0441641807556152, "Pretrain/Step": 3511, "Pretrain/Step Time": 8.546940211206675} +{"Pretrain/Learning Rate": 3.643931005994255e-05, "Pretrain/Loss": 2.105816602706909, "Pretrain/Loss (Raw)": 2.123540163040161, "Pretrain/Step": 3512, "Pretrain/Step Time": 8.546269960701466} +{"Pretrain/Learning Rate": 3.643176043989018e-05, "Pretrain/Loss": 2.105579137802124, "Pretrain/Loss (Raw)": 2.181870937347412, "Pretrain/Step": 3513, "Pretrain/Step Time": 8.55514881759882} +{"Pretrain/Learning Rate": 3.6424209501473314e-05, "Pretrain/Loss": 2.107542037963867, "Pretrain/Loss (Raw)": 2.2102866172790527, "Pretrain/Step": 3514, "Pretrain/Step Time": 8.548539550974965} +{"Pretrain/Learning Rate": 3.641665724556278e-05, "Pretrain/Loss": 2.111022472381592, "Pretrain/Loss (Raw)": 2.3873584270477295, "Pretrain/Step": 3515, "Pretrain/Step Time": 8.550604807212949} +{"Pretrain/Learning Rate": 3.6409103673029535e-05, "Pretrain/Loss": 2.1086957454681396, "Pretrain/Loss (Raw)": 1.9241729974746704, "Pretrain/Step": 3516, "Pretrain/Step Time": 8.543767800554633} +{"Pretrain/Learning Rate": 3.64015487847447e-05, "Pretrain/Loss": 2.1092514991760254, "Pretrain/Loss (Raw)": 2.1690001487731934, "Pretrain/Step": 3517, "Pretrain/Step Time": 8.546536713838577} +{"Pretrain/Learning Rate": 3.6393992581579526e-05, "Pretrain/Loss": 2.1098344326019287, "Pretrain/Loss (Raw)": 2.008974075317383, "Pretrain/Step": 3518, "Pretrain/Step Time": 8.544322203844786} +{"Pretrain/Learning Rate": 3.638643506440544e-05, "Pretrain/Loss": 2.1112496852874756, "Pretrain/Loss (Raw)": 2.2857508659362793, "Pretrain/Step": 3519, "Pretrain/Step Time": 8.559402141720057} +{"Pretrain/Learning Rate": 3.6378876234094014e-05, "Pretrain/Loss": 2.108189105987549, "Pretrain/Loss (Raw)": 1.8156123161315918, "Pretrain/Step": 3520, "Pretrain/Step Time": 8.552557609975338} +{"Pretrain/Learning Rate": 3.6371316091516955e-05, "Pretrain/Loss": 2.106205463409424, "Pretrain/Loss (Raw)": 1.9170101881027222, "Pretrain/Step": 3521, "Pretrain/Step Time": 8.556563530117273} +{"Pretrain/Learning Rate": 3.636375463754614e-05, "Pretrain/Loss": 2.1038894653320312, "Pretrain/Loss (Raw)": 1.8799923658370972, "Pretrain/Step": 3522, "Pretrain/Step Time": 8.55472339503467} +{"Pretrain/Learning Rate": 3.6356191873053594e-05, "Pretrain/Loss": 2.1043241024017334, "Pretrain/Loss (Raw)": 2.1918513774871826, "Pretrain/Step": 3523, "Pretrain/Step Time": 8.55832819826901} +{"Pretrain/Learning Rate": 3.634862779891148e-05, "Pretrain/Loss": 2.104942798614502, "Pretrain/Loss (Raw)": 2.1751904487609863, "Pretrain/Step": 3524, "Pretrain/Step Time": 8.554882509633899} +{"Pretrain/Learning Rate": 3.634106241599215e-05, "Pretrain/Loss": 2.1025373935699463, "Pretrain/Loss (Raw)": 2.2468554973602295, "Pretrain/Step": 3525, "Pretrain/Step Time": 8.560271739959717} +{"Pretrain/Learning Rate": 3.633349572516805e-05, "Pretrain/Loss": 2.1029326915740967, "Pretrain/Loss (Raw)": 2.1094703674316406, "Pretrain/Step": 3526, "Pretrain/Step Time": 8.551708538085222} +{"Pretrain/Learning Rate": 3.632592772731182e-05, "Pretrain/Loss": 2.1042966842651367, "Pretrain/Loss (Raw)": 2.224088430404663, "Pretrain/Step": 3527, "Pretrain/Step Time": 8.55505507439375} +{"Pretrain/Learning Rate": 3.631835842329624e-05, "Pretrain/Loss": 2.1004512310028076, "Pretrain/Loss (Raw)": 2.2095820903778076, "Pretrain/Step": 3528, "Pretrain/Step Time": 8.554347407072783} +{"Pretrain/Learning Rate": 3.6310787813994226e-05, "Pretrain/Loss": 2.1016416549682617, "Pretrain/Loss (Raw)": 2.1578547954559326, "Pretrain/Step": 3529, "Pretrain/Step Time": 8.559881219640374} +{"Pretrain/Learning Rate": 3.6303215900278864e-05, "Pretrain/Loss": 2.1002373695373535, "Pretrain/Loss (Raw)": 2.08066463470459, "Pretrain/Step": 3530, "Pretrain/Step Time": 8.552554888650775} +{"Pretrain/Learning Rate": 3.629564268302338e-05, "Pretrain/Loss": 2.100513458251953, "Pretrain/Loss (Raw)": 2.1044094562530518, "Pretrain/Step": 3531, "Pretrain/Step Time": 8.557118564844131} +{"Pretrain/Learning Rate": 3.6288068163101156e-05, "Pretrain/Loss": 2.100374460220337, "Pretrain/Loss (Raw)": 2.0209152698516846, "Pretrain/Step": 3532, "Pretrain/Step Time": 8.554138721898198} +{"Pretrain/Learning Rate": 3.628049234138572e-05, "Pretrain/Loss": 2.1000919342041016, "Pretrain/Loss (Raw)": 2.151057720184326, "Pretrain/Step": 3533, "Pretrain/Step Time": 8.554212499409914} +{"Pretrain/Learning Rate": 3.6272915218750755e-05, "Pretrain/Loss": 2.1019320487976074, "Pretrain/Loss (Raw)": 2.2316410541534424, "Pretrain/Step": 3534, "Pretrain/Step Time": 8.557221418246627} +{"Pretrain/Learning Rate": 3.6265336796070083e-05, "Pretrain/Loss": 2.1051340103149414, "Pretrain/Loss (Raw)": 2.20407772064209, "Pretrain/Step": 3535, "Pretrain/Step Time": 8.555465336889029} +{"Pretrain/Learning Rate": 3.62577570742177e-05, "Pretrain/Loss": 2.104652166366577, "Pretrain/Loss (Raw)": 1.914060115814209, "Pretrain/Step": 3536, "Pretrain/Step Time": 8.557693924754858} +{"Pretrain/Learning Rate": 3.625017605406771e-05, "Pretrain/Loss": 2.1045665740966797, "Pretrain/Loss (Raw)": 2.117345094680786, "Pretrain/Step": 3537, "Pretrain/Step Time": 8.5579201169312} +{"Pretrain/Learning Rate": 3.624259373649441e-05, "Pretrain/Loss": 2.1029787063598633, "Pretrain/Loss (Raw)": 2.0563395023345947, "Pretrain/Step": 3538, "Pretrain/Step Time": 8.548558169975877} +{"Pretrain/Learning Rate": 3.6235010122372214e-05, "Pretrain/Loss": 2.103329658508301, "Pretrain/Loss (Raw)": 2.152902364730835, "Pretrain/Step": 3539, "Pretrain/Step Time": 8.552744131535292} +{"Pretrain/Learning Rate": 3.6227425212575725e-05, "Pretrain/Loss": 2.1047749519348145, "Pretrain/Loss (Raw)": 2.1794021129608154, "Pretrain/Step": 3540, "Pretrain/Step Time": 8.5540916249156} +{"Pretrain/Learning Rate": 3.621983900797964e-05, "Pretrain/Loss": 2.1040854454040527, "Pretrain/Loss (Raw)": 2.138240337371826, "Pretrain/Step": 3541, "Pretrain/Step Time": 8.553305320441723} +{"Pretrain/Learning Rate": 3.621225150945886e-05, "Pretrain/Loss": 2.103559970855713, "Pretrain/Loss (Raw)": 1.9736320972442627, "Pretrain/Step": 3542, "Pretrain/Step Time": 8.552038736641407} +{"Pretrain/Learning Rate": 3.620466271788841e-05, "Pretrain/Loss": 2.1036853790283203, "Pretrain/Loss (Raw)": 2.064317464828491, "Pretrain/Step": 3543, "Pretrain/Step Time": 8.549684697762132} +{"Pretrain/Learning Rate": 3.6197072634143436e-05, "Pretrain/Loss": 2.1058509349823, "Pretrain/Loss (Raw)": 2.129068613052368, "Pretrain/Step": 3544, "Pretrain/Step Time": 8.550414545461535} +{"Pretrain/Learning Rate": 3.61894812590993e-05, "Pretrain/Loss": 2.1069750785827637, "Pretrain/Loss (Raw)": 2.2130982875823975, "Pretrain/Step": 3545, "Pretrain/Step Time": 8.552318194881082} +{"Pretrain/Learning Rate": 3.6181888593631454e-05, "Pretrain/Loss": 2.105517625808716, "Pretrain/Loss (Raw)": 2.0378036499023438, "Pretrain/Step": 3546, "Pretrain/Step Time": 8.546251077204943} +{"Pretrain/Learning Rate": 3.6174294638615524e-05, "Pretrain/Loss": 2.1045949459075928, "Pretrain/Loss (Raw)": 1.8628942966461182, "Pretrain/Step": 3547, "Pretrain/Step Time": 8.54779020510614} +{"Pretrain/Learning Rate": 3.616669939492728e-05, "Pretrain/Loss": 2.101578950881958, "Pretrain/Loss (Raw)": 1.81879723072052, "Pretrain/Step": 3548, "Pretrain/Step Time": 8.551721397787333} +{"Pretrain/Learning Rate": 3.615910286344265e-05, "Pretrain/Loss": 2.1032485961914062, "Pretrain/Loss (Raw)": 2.37252140045166, "Pretrain/Step": 3549, "Pretrain/Step Time": 8.548632739111781} +{"Pretrain/Learning Rate": 3.615150504503768e-05, "Pretrain/Loss": 2.1051247119903564, "Pretrain/Loss (Raw)": 2.227349281311035, "Pretrain/Step": 3550, "Pretrain/Step Time": 8.548012517392635} +{"Pretrain/Learning Rate": 3.6143905940588616e-05, "Pretrain/Loss": 2.103236436843872, "Pretrain/Loss (Raw)": 1.98797607421875, "Pretrain/Step": 3551, "Pretrain/Step Time": 8.54922129958868} +{"Pretrain/Learning Rate": 3.613630555097179e-05, "Pretrain/Loss": 2.103442668914795, "Pretrain/Loss (Raw)": 2.1852939128875732, "Pretrain/Step": 3552, "Pretrain/Step Time": 8.551159279420972} +{"Pretrain/Learning Rate": 3.6128703877063755e-05, "Pretrain/Loss": 2.1071970462799072, "Pretrain/Loss (Raw)": 2.462002754211426, "Pretrain/Step": 3553, "Pretrain/Step Time": 8.55166545510292} +{"Pretrain/Learning Rate": 3.6121100919741126e-05, "Pretrain/Loss": 2.106414318084717, "Pretrain/Loss (Raw)": 2.2599382400512695, "Pretrain/Step": 3554, "Pretrain/Step Time": 8.550649864599109} +{"Pretrain/Learning Rate": 3.611349667988074e-05, "Pretrain/Loss": 2.1083946228027344, "Pretrain/Loss (Raw)": 2.2414798736572266, "Pretrain/Step": 3555, "Pretrain/Step Time": 8.548949310556054} +{"Pretrain/Learning Rate": 3.6105891158359563e-05, "Pretrain/Loss": 2.108274221420288, "Pretrain/Loss (Raw)": 2.1244659423828125, "Pretrain/Step": 3556, "Pretrain/Step Time": 8.547196144238114} +{"Pretrain/Learning Rate": 3.6098284356054666e-05, "Pretrain/Loss": 2.108686923980713, "Pretrain/Loss (Raw)": 2.060600996017456, "Pretrain/Step": 3557, "Pretrain/Step Time": 8.551978712901473} +{"Pretrain/Learning Rate": 3.609067627384333e-05, "Pretrain/Loss": 2.1093649864196777, "Pretrain/Loss (Raw)": 2.1275155544281006, "Pretrain/Step": 3558, "Pretrain/Step Time": 8.548288328573108} +{"Pretrain/Learning Rate": 3.608306691260295e-05, "Pretrain/Loss": 2.107304573059082, "Pretrain/Loss (Raw)": 1.8335440158843994, "Pretrain/Step": 3559, "Pretrain/Step Time": 8.549326365813613} +{"Pretrain/Learning Rate": 3.607545627321106e-05, "Pretrain/Loss": 2.106964111328125, "Pretrain/Loss (Raw)": 2.0440776348114014, "Pretrain/Step": 3560, "Pretrain/Step Time": 8.55027006752789} +{"Pretrain/Learning Rate": 3.606784435654536e-05, "Pretrain/Loss": 2.1046981811523438, "Pretrain/Loss (Raw)": 1.9116166830062866, "Pretrain/Step": 3561, "Pretrain/Step Time": 8.548767518252134} +{"Pretrain/Learning Rate": 3.6060231163483704e-05, "Pretrain/Loss": 2.1019046306610107, "Pretrain/Loss (Raw)": 2.0672430992126465, "Pretrain/Step": 3562, "Pretrain/Step Time": 8.553147055208683} +{"Pretrain/Learning Rate": 3.6052616694904066e-05, "Pretrain/Loss": 2.1028480529785156, "Pretrain/Loss (Raw)": 2.154938220977783, "Pretrain/Step": 3563, "Pretrain/Step Time": 8.549578353762627} +{"Pretrain/Learning Rate": 3.60450009516846e-05, "Pretrain/Loss": 2.103658676147461, "Pretrain/Loss (Raw)": 2.1676807403564453, "Pretrain/Step": 3564, "Pretrain/Step Time": 8.550238965079188} +{"Pretrain/Learning Rate": 3.603738393470357e-05, "Pretrain/Loss": 2.1032841205596924, "Pretrain/Loss (Raw)": 2.0226879119873047, "Pretrain/Step": 3565, "Pretrain/Step Time": 8.553507780656219} +{"Pretrain/Learning Rate": 3.6029765644839416e-05, "Pretrain/Loss": 2.102818727493286, "Pretrain/Loss (Raw)": 2.112572193145752, "Pretrain/Step": 3566, "Pretrain/Step Time": 8.549020353704691} +{"Pretrain/Learning Rate": 3.602214608297071e-05, "Pretrain/Loss": 2.1004910469055176, "Pretrain/Loss (Raw)": 2.0111210346221924, "Pretrain/Step": 3567, "Pretrain/Step Time": 8.557190073654056} +{"Pretrain/Learning Rate": 3.601452524997619e-05, "Pretrain/Loss": 2.0994536876678467, "Pretrain/Loss (Raw)": 1.9751718044281006, "Pretrain/Step": 3568, "Pretrain/Step Time": 8.556322284042835} +{"Pretrain/Learning Rate": 3.600690314673471e-05, "Pretrain/Loss": 2.0972671508789062, "Pretrain/Loss (Raw)": 2.078357696533203, "Pretrain/Step": 3569, "Pretrain/Step Time": 8.564800921827555} +{"Pretrain/Learning Rate": 3.599927977412529e-05, "Pretrain/Loss": 2.0989203453063965, "Pretrain/Loss (Raw)": 2.2533388137817383, "Pretrain/Step": 3570, "Pretrain/Step Time": 8.557056305930018} +{"Pretrain/Learning Rate": 3.59916551330271e-05, "Pretrain/Loss": 2.098170042037964, "Pretrain/Loss (Raw)": 2.1734323501586914, "Pretrain/Step": 3571, "Pretrain/Step Time": 8.554473008960485} +{"Pretrain/Learning Rate": 3.598402922431944e-05, "Pretrain/Loss": 2.098111867904663, "Pretrain/Loss (Raw)": 2.025395631790161, "Pretrain/Step": 3572, "Pretrain/Step Time": 8.554694637656212} +{"Pretrain/Learning Rate": 3.5976402048881786e-05, "Pretrain/Loss": 2.098081111907959, "Pretrain/Loss (Raw)": 2.0268163681030273, "Pretrain/Step": 3573, "Pretrain/Step Time": 8.555341299623251} +{"Pretrain/Learning Rate": 3.596877360759371e-05, "Pretrain/Loss": 2.0978026390075684, "Pretrain/Loss (Raw)": 1.9608242511749268, "Pretrain/Step": 3574, "Pretrain/Step Time": 8.556890398263931} +{"Pretrain/Learning Rate": 3.5961143901334984e-05, "Pretrain/Loss": 2.0974316596984863, "Pretrain/Loss (Raw)": 2.2571463584899902, "Pretrain/Step": 3575, "Pretrain/Step Time": 8.54647139646113} +{"Pretrain/Learning Rate": 3.5953512930985486e-05, "Pretrain/Loss": 2.0964102745056152, "Pretrain/Loss (Raw)": 2.0536019802093506, "Pretrain/Step": 3576, "Pretrain/Step Time": 8.546151990070939} +{"Pretrain/Learning Rate": 3.594588069742527e-05, "Pretrain/Loss": 2.094931125640869, "Pretrain/Loss (Raw)": 1.8735554218292236, "Pretrain/Step": 3577, "Pretrain/Step Time": 8.547904031351209} +{"Pretrain/Learning Rate": 3.5938247201534505e-05, "Pretrain/Loss": 2.095332622528076, "Pretrain/Loss (Raw)": 2.093748092651367, "Pretrain/Step": 3578, "Pretrain/Step Time": 8.54314941354096} +{"Pretrain/Learning Rate": 3.5930612444193535e-05, "Pretrain/Loss": 2.09588885307312, "Pretrain/Loss (Raw)": 1.8563716411590576, "Pretrain/Step": 3579, "Pretrain/Step Time": 8.541213804855943} +{"Pretrain/Learning Rate": 3.592297642628283e-05, "Pretrain/Loss": 2.097137928009033, "Pretrain/Loss (Raw)": 2.242985486984253, "Pretrain/Step": 3580, "Pretrain/Step Time": 8.546558057889342} +{"Pretrain/Learning Rate": 3.5915339148683005e-05, "Pretrain/Loss": 2.0984129905700684, "Pretrain/Loss (Raw)": 2.104400157928467, "Pretrain/Step": 3581, "Pretrain/Step Time": 8.541036538779736} +{"Pretrain/Learning Rate": 3.590770061227484e-05, "Pretrain/Loss": 2.0987319946289062, "Pretrain/Loss (Raw)": 2.0370101928710938, "Pretrain/Step": 3582, "Pretrain/Step Time": 8.53644984960556} +{"Pretrain/Learning Rate": 3.590006081793925e-05, "Pretrain/Loss": 2.097646713256836, "Pretrain/Loss (Raw)": 1.9849555492401123, "Pretrain/Step": 3583, "Pretrain/Step Time": 8.538816412910819} +{"Pretrain/Learning Rate": 3.589241976655727e-05, "Pretrain/Loss": 2.0966720581054688, "Pretrain/Loss (Raw)": 1.8908724784851074, "Pretrain/Step": 3584, "Pretrain/Step Time": 8.540186442434788} +{"Pretrain/Learning Rate": 3.588477745901013e-05, "Pretrain/Loss": 2.0968704223632812, "Pretrain/Loss (Raw)": 2.0769009590148926, "Pretrain/Step": 3585, "Pretrain/Step Time": 8.53967659175396} +{"Pretrain/Learning Rate": 3.587713389617916e-05, "Pretrain/Loss": 2.0973052978515625, "Pretrain/Loss (Raw)": 2.037122964859009, "Pretrain/Step": 3586, "Pretrain/Step Time": 8.553701812401414} +{"Pretrain/Learning Rate": 3.5869489078945845e-05, "Pretrain/Loss": 2.095432758331299, "Pretrain/Loss (Raw)": 1.9629210233688354, "Pretrain/Step": 3587, "Pretrain/Step Time": 8.544964008033276} +{"Pretrain/Learning Rate": 3.586184300819184e-05, "Pretrain/Loss": 2.0932774543762207, "Pretrain/Loss (Raw)": 1.9337064027786255, "Pretrain/Step": 3588, "Pretrain/Step Time": 8.534899301826954} +{"Pretrain/Learning Rate": 3.585419568479891e-05, "Pretrain/Loss": 2.094165563583374, "Pretrain/Loss (Raw)": 2.1449625492095947, "Pretrain/Step": 3589, "Pretrain/Step Time": 8.53896138817072} +{"Pretrain/Learning Rate": 3.584654710964899e-05, "Pretrain/Loss": 2.094329833984375, "Pretrain/Loss (Raw)": 2.229874849319458, "Pretrain/Step": 3590, "Pretrain/Step Time": 8.53939026221633} +{"Pretrain/Learning Rate": 3.583889728362414e-05, "Pretrain/Loss": 2.095716714859009, "Pretrain/Loss (Raw)": 2.125462055206299, "Pretrain/Step": 3591, "Pretrain/Step Time": 8.539690094068646} +{"Pretrain/Learning Rate": 3.583124620760659e-05, "Pretrain/Loss": 2.0965628623962402, "Pretrain/Loss (Raw)": 2.1866302490234375, "Pretrain/Step": 3592, "Pretrain/Step Time": 8.544519567862153} +{"Pretrain/Learning Rate": 3.582359388247869e-05, "Pretrain/Loss": 2.0938456058502197, "Pretrain/Loss (Raw)": 1.7723989486694336, "Pretrain/Step": 3593, "Pretrain/Step Time": 8.540679413825274} +{"Pretrain/Learning Rate": 3.581594030912294e-05, "Pretrain/Loss": 2.0943660736083984, "Pretrain/Loss (Raw)": 2.116368532180786, "Pretrain/Step": 3594, "Pretrain/Step Time": 8.540990836918354} +{"Pretrain/Learning Rate": 3.580828548842198e-05, "Pretrain/Loss": 2.0964255332946777, "Pretrain/Loss (Raw)": 2.3139123916625977, "Pretrain/Step": 3595, "Pretrain/Step Time": 8.53737141750753} +{"Pretrain/Learning Rate": 3.5800629421258606e-05, "Pretrain/Loss": 2.0952234268188477, "Pretrain/Loss (Raw)": 1.9995172023773193, "Pretrain/Step": 3596, "Pretrain/Step Time": 8.535246396437287} +{"Pretrain/Learning Rate": 3.579297210851576e-05, "Pretrain/Loss": 2.094008207321167, "Pretrain/Loss (Raw)": 2.0366501808166504, "Pretrain/Step": 3597, "Pretrain/Step Time": 8.539122216403484} +{"Pretrain/Learning Rate": 3.5785313551076505e-05, "Pretrain/Loss": 2.0925798416137695, "Pretrain/Loss (Raw)": 1.8523393869400024, "Pretrain/Step": 3598, "Pretrain/Step Time": 8.540213584899902} +{"Pretrain/Learning Rate": 3.577765374982408e-05, "Pretrain/Loss": 2.093308448791504, "Pretrain/Loss (Raw)": 2.198596715927124, "Pretrain/Step": 3599, "Pretrain/Step Time": 8.535844763740897} +{"Pretrain/Learning Rate": 3.576999270564183e-05, "Pretrain/Loss": 2.0933339595794678, "Pretrain/Loss (Raw)": 2.094583034515381, "Pretrain/Step": 3600, "Pretrain/Step Time": 8.53938670270145} +{"Pretrain/Learning Rate": 3.5762330419413273e-05, "Pretrain/Loss": 2.095524787902832, "Pretrain/Loss (Raw)": 2.384138345718384, "Pretrain/Step": 3601, "Pretrain/Step Time": 8.537959581241012} +{"Pretrain/Learning Rate": 3.575466689202206e-05, "Pretrain/Loss": 2.0965588092803955, "Pretrain/Loss (Raw)": 2.2175185680389404, "Pretrain/Step": 3602, "Pretrain/Step Time": 8.53752469830215} +{"Pretrain/Learning Rate": 3.5747002124351986e-05, "Pretrain/Loss": 2.0948312282562256, "Pretrain/Loss (Raw)": 1.9792240858078003, "Pretrain/Step": 3603, "Pretrain/Step Time": 8.533789558336139} +{"Pretrain/Learning Rate": 3.573933611728698e-05, "Pretrain/Loss": 2.092670440673828, "Pretrain/Loss (Raw)": 1.9499013423919678, "Pretrain/Step": 3604, "Pretrain/Step Time": 8.537792762741446} +{"Pretrain/Learning Rate": 3.573166887171113e-05, "Pretrain/Loss": 2.0947885513305664, "Pretrain/Loss (Raw)": 2.0675952434539795, "Pretrain/Step": 3605, "Pretrain/Step Time": 8.531727587804198} +{"Pretrain/Learning Rate": 3.5724000388508655e-05, "Pretrain/Loss": 2.0965380668640137, "Pretrain/Loss (Raw)": 2.163424253463745, "Pretrain/Step": 3606, "Pretrain/Step Time": 8.538268111646175} +{"Pretrain/Learning Rate": 3.571633066856392e-05, "Pretrain/Loss": 2.0924222469329834, "Pretrain/Loss (Raw)": 1.9273616075515747, "Pretrain/Step": 3607, "Pretrain/Step Time": 8.539489256218076} +{"Pretrain/Learning Rate": 3.570865971276144e-05, "Pretrain/Loss": 2.0944652557373047, "Pretrain/Loss (Raw)": 2.1515467166900635, "Pretrain/Step": 3608, "Pretrain/Step Time": 8.540370233356953} +{"Pretrain/Learning Rate": 3.570098752198586e-05, "Pretrain/Loss": 2.09653377532959, "Pretrain/Loss (Raw)": 2.062265157699585, "Pretrain/Step": 3609, "Pretrain/Step Time": 8.538153316825628} +{"Pretrain/Learning Rate": 3.569331409712198e-05, "Pretrain/Loss": 2.096343755722046, "Pretrain/Loss (Raw)": 2.046431541442871, "Pretrain/Step": 3610, "Pretrain/Step Time": 8.545936826616526} +{"Pretrain/Learning Rate": 3.568563943905472e-05, "Pretrain/Loss": 2.0953030586242676, "Pretrain/Loss (Raw)": 2.171566963195801, "Pretrain/Step": 3611, "Pretrain/Step Time": 8.536924647167325} +{"Pretrain/Learning Rate": 3.5677963548669175e-05, "Pretrain/Loss": 2.091388463973999, "Pretrain/Loss (Raw)": 1.9829329252243042, "Pretrain/Step": 3612, "Pretrain/Step Time": 8.537550872191787} +{"Pretrain/Learning Rate": 3.567028642685055e-05, "Pretrain/Loss": 2.0948896408081055, "Pretrain/Loss (Raw)": 2.4889824390411377, "Pretrain/Step": 3613, "Pretrain/Step Time": 8.54139257594943} +{"Pretrain/Learning Rate": 3.566260807448422e-05, "Pretrain/Loss": 2.096296548843384, "Pretrain/Loss (Raw)": 2.145071029663086, "Pretrain/Step": 3614, "Pretrain/Step Time": 8.53710082359612} +{"Pretrain/Learning Rate": 3.565492849245568e-05, "Pretrain/Loss": 2.0962042808532715, "Pretrain/Loss (Raw)": 1.9778547286987305, "Pretrain/Step": 3615, "Pretrain/Step Time": 8.534997817128897} +{"Pretrain/Learning Rate": 3.564724768165058e-05, "Pretrain/Loss": 2.0964550971984863, "Pretrain/Loss (Raw)": 2.0089616775512695, "Pretrain/Step": 3616, "Pretrain/Step Time": 8.547913528978825} +{"Pretrain/Learning Rate": 3.5639565642954705e-05, "Pretrain/Loss": 2.09598445892334, "Pretrain/Loss (Raw)": 2.125624656677246, "Pretrain/Step": 3617, "Pretrain/Step Time": 8.536947390064597} +{"Pretrain/Learning Rate": 3.563188237725399e-05, "Pretrain/Loss": 2.097054958343506, "Pretrain/Loss (Raw)": 2.13022780418396, "Pretrain/Step": 3618, "Pretrain/Step Time": 8.537484861910343} +{"Pretrain/Learning Rate": 3.562419788543449e-05, "Pretrain/Loss": 2.0948140621185303, "Pretrain/Loss (Raw)": 1.879753589630127, "Pretrain/Step": 3619, "Pretrain/Step Time": 8.538314424455166} +{"Pretrain/Learning Rate": 3.561651216838243e-05, "Pretrain/Loss": 2.09330415725708, "Pretrain/Loss (Raw)": 2.0112357139587402, "Pretrain/Step": 3620, "Pretrain/Step Time": 8.538150697946548} +{"Pretrain/Learning Rate": 3.560882522698417e-05, "Pretrain/Loss": 2.0935916900634766, "Pretrain/Loss (Raw)": 2.044438600540161, "Pretrain/Step": 3621, "Pretrain/Step Time": 8.538428166881204} +{"Pretrain/Learning Rate": 3.560113706212618e-05, "Pretrain/Loss": 2.09413480758667, "Pretrain/Loss (Raw)": 1.964980125427246, "Pretrain/Step": 3622, "Pretrain/Step Time": 8.547122253105044} +{"Pretrain/Learning Rate": 3.559344767469512e-05, "Pretrain/Loss": 2.0953598022460938, "Pretrain/Loss (Raw)": 2.123379707336426, "Pretrain/Step": 3623, "Pretrain/Step Time": 8.543570440262556} +{"Pretrain/Learning Rate": 3.5585757065577755e-05, "Pretrain/Loss": 2.0959339141845703, "Pretrain/Loss (Raw)": 2.0786259174346924, "Pretrain/Step": 3624, "Pretrain/Step Time": 8.541231678798795} +{"Pretrain/Learning Rate": 3.557806523566099e-05, "Pretrain/Loss": 2.0951929092407227, "Pretrain/Loss (Raw)": 2.1860179901123047, "Pretrain/Step": 3625, "Pretrain/Step Time": 8.545040301978588} +{"Pretrain/Learning Rate": 3.557037218583191e-05, "Pretrain/Loss": 2.09397292137146, "Pretrain/Loss (Raw)": 2.0451858043670654, "Pretrain/Step": 3626, "Pretrain/Step Time": 8.541174739599228} +{"Pretrain/Learning Rate": 3.5562677916977704e-05, "Pretrain/Loss": 2.0938515663146973, "Pretrain/Loss (Raw)": 1.9791841506958008, "Pretrain/Step": 3627, "Pretrain/Step Time": 8.547079935669899} +{"Pretrain/Learning Rate": 3.55549824299857e-05, "Pretrain/Loss": 2.093275547027588, "Pretrain/Loss (Raw)": 2.0626285076141357, "Pretrain/Step": 3628, "Pretrain/Step Time": 8.55217281728983} +{"Pretrain/Learning Rate": 3.554728572574339e-05, "Pretrain/Loss": 2.0931053161621094, "Pretrain/Loss (Raw)": 2.04325795173645, "Pretrain/Step": 3629, "Pretrain/Step Time": 8.54700804874301} +{"Pretrain/Learning Rate": 3.5539587805138385e-05, "Pretrain/Loss": 2.093392848968506, "Pretrain/Loss (Raw)": 2.095315933227539, "Pretrain/Step": 3630, "Pretrain/Step Time": 8.551172584295273} +{"Pretrain/Learning Rate": 3.5531888669058455e-05, "Pretrain/Loss": 2.0913209915161133, "Pretrain/Loss (Raw)": 1.9109410047531128, "Pretrain/Step": 3631, "Pretrain/Step Time": 8.547666106373072} +{"Pretrain/Learning Rate": 3.552418831839149e-05, "Pretrain/Loss": 2.0913608074188232, "Pretrain/Loss (Raw)": 2.068861246109009, "Pretrain/Step": 3632, "Pretrain/Step Time": 8.546058496460319} +{"Pretrain/Learning Rate": 3.551648675402554e-05, "Pretrain/Loss": 2.0915093421936035, "Pretrain/Loss (Raw)": 2.197641372680664, "Pretrain/Step": 3633, "Pretrain/Step Time": 8.547783801332116} +{"Pretrain/Learning Rate": 3.550878397684878e-05, "Pretrain/Loss": 2.0897932052612305, "Pretrain/Loss (Raw)": 2.0819971561431885, "Pretrain/Step": 3634, "Pretrain/Step Time": 8.550704926252365} +{"Pretrain/Learning Rate": 3.5501079987749535e-05, "Pretrain/Loss": 2.0881221294403076, "Pretrain/Loss (Raw)": 2.0383284091949463, "Pretrain/Step": 3635, "Pretrain/Step Time": 8.54339044354856} +{"Pretrain/Learning Rate": 3.549337478761626e-05, "Pretrain/Loss": 2.087306261062622, "Pretrain/Loss (Raw)": 2.049290180206299, "Pretrain/Step": 3636, "Pretrain/Step Time": 8.548010163009167} +{"Pretrain/Learning Rate": 3.548566837733756e-05, "Pretrain/Loss": 2.0891103744506836, "Pretrain/Loss (Raw)": 2.4371910095214844, "Pretrain/Step": 3637, "Pretrain/Step Time": 8.544472798705101} +{"Pretrain/Learning Rate": 3.547796075780218e-05, "Pretrain/Loss": 2.0878407955169678, "Pretrain/Loss (Raw)": 1.9068838357925415, "Pretrain/Step": 3638, "Pretrain/Step Time": 8.546679649502039} +{"Pretrain/Learning Rate": 3.547025192989898e-05, "Pretrain/Loss": 2.0887210369110107, "Pretrain/Loss (Raw)": 2.1568403244018555, "Pretrain/Step": 3639, "Pretrain/Step Time": 8.543753793463111} +{"Pretrain/Learning Rate": 3.546254189451699e-05, "Pretrain/Loss": 2.088292121887207, "Pretrain/Loss (Raw)": 2.0686333179473877, "Pretrain/Step": 3640, "Pretrain/Step Time": 8.549272565171123} +{"Pretrain/Learning Rate": 3.5454830652545374e-05, "Pretrain/Loss": 2.0889315605163574, "Pretrain/Loss (Raw)": 2.2637157440185547, "Pretrain/Step": 3641, "Pretrain/Step Time": 8.535849830135703} +{"Pretrain/Learning Rate": 3.544711820487343e-05, "Pretrain/Loss": 2.0880837440490723, "Pretrain/Loss (Raw)": 2.1017823219299316, "Pretrain/Step": 3642, "Pretrain/Step Time": 8.540893893688917} +{"Pretrain/Learning Rate": 3.543940455239057e-05, "Pretrain/Loss": 2.0870261192321777, "Pretrain/Loss (Raw)": 2.251967191696167, "Pretrain/Step": 3643, "Pretrain/Step Time": 8.542726581916213} +{"Pretrain/Learning Rate": 3.543168969598639e-05, "Pretrain/Loss": 2.0882186889648438, "Pretrain/Loss (Raw)": 2.0768258571624756, "Pretrain/Step": 3644, "Pretrain/Step Time": 8.544896673411131} +{"Pretrain/Learning Rate": 3.54239736365506e-05, "Pretrain/Loss": 2.086144208908081, "Pretrain/Loss (Raw)": 1.9034849405288696, "Pretrain/Step": 3645, "Pretrain/Step Time": 8.543294301256537} +{"Pretrain/Learning Rate": 3.541625637497306e-05, "Pretrain/Loss": 2.0857787132263184, "Pretrain/Loss (Raw)": 1.9621801376342773, "Pretrain/Step": 3646, "Pretrain/Step Time": 8.553977413102984} +{"Pretrain/Learning Rate": 3.540853791214373e-05, "Pretrain/Loss": 2.0844907760620117, "Pretrain/Loss (Raw)": 2.120896339416504, "Pretrain/Step": 3647, "Pretrain/Step Time": 8.538454450666904} +{"Pretrain/Learning Rate": 3.5400818248952786e-05, "Pretrain/Loss": 2.087346315383911, "Pretrain/Loss (Raw)": 2.181097984313965, "Pretrain/Step": 3648, "Pretrain/Step Time": 8.54381917975843} +{"Pretrain/Learning Rate": 3.539309738629045e-05, "Pretrain/Loss": 2.0894837379455566, "Pretrain/Loss (Raw)": 2.1906087398529053, "Pretrain/Step": 3649, "Pretrain/Step Time": 8.5461800750345} +{"Pretrain/Learning Rate": 3.5385375325047166e-05, "Pretrain/Loss": 2.095048427581787, "Pretrain/Loss (Raw)": 2.5922787189483643, "Pretrain/Step": 3650, "Pretrain/Step Time": 8.543818002566695} +{"Pretrain/Learning Rate": 3.537765206611345e-05, "Pretrain/Loss": 2.0929012298583984, "Pretrain/Loss (Raw)": 1.9169955253601074, "Pretrain/Step": 3651, "Pretrain/Step Time": 8.542576104402542} +{"Pretrain/Learning Rate": 3.536992761038001e-05, "Pretrain/Loss": 2.093231678009033, "Pretrain/Loss (Raw)": 2.2175045013427734, "Pretrain/Step": 3652, "Pretrain/Step Time": 8.552044900134206} +{"Pretrain/Learning Rate": 3.536220195873764e-05, "Pretrain/Loss": 2.0926103591918945, "Pretrain/Loss (Raw)": 2.1673479080200195, "Pretrain/Step": 3653, "Pretrain/Step Time": 8.54232258722186} +{"Pretrain/Learning Rate": 3.535447511207731e-05, "Pretrain/Loss": 2.0915164947509766, "Pretrain/Loss (Raw)": 1.9694379568099976, "Pretrain/Step": 3654, "Pretrain/Step Time": 8.547632865607738} +{"Pretrain/Learning Rate": 3.534674707129013e-05, "Pretrain/Loss": 2.090825319290161, "Pretrain/Loss (Raw)": 2.1356093883514404, "Pretrain/Step": 3655, "Pretrain/Step Time": 8.545956766232848} +{"Pretrain/Learning Rate": 3.5339017837267316e-05, "Pretrain/Loss": 2.0897433757781982, "Pretrain/Loss (Raw)": 2.071101188659668, "Pretrain/Step": 3656, "Pretrain/Step Time": 8.542883541435003} +{"Pretrain/Learning Rate": 3.5331287410900246e-05, "Pretrain/Loss": 2.0877022743225098, "Pretrain/Loss (Raw)": 1.8965801000595093, "Pretrain/Step": 3657, "Pretrain/Step Time": 8.54377082362771} +{"Pretrain/Learning Rate": 3.532355579308043e-05, "Pretrain/Loss": 2.0862364768981934, "Pretrain/Loss (Raw)": 1.8930625915527344, "Pretrain/Step": 3658, "Pretrain/Step Time": 8.554650830104947} +{"Pretrain/Learning Rate": 3.531582298469952e-05, "Pretrain/Loss": 2.0868096351623535, "Pretrain/Loss (Raw)": 2.1777589321136475, "Pretrain/Step": 3659, "Pretrain/Step Time": 8.553287545219064} +{"Pretrain/Learning Rate": 3.530808898664928e-05, "Pretrain/Loss": 2.0873827934265137, "Pretrain/Loss (Raw)": 2.0942797660827637, "Pretrain/Step": 3660, "Pretrain/Step Time": 8.549852289259434} +{"Pretrain/Learning Rate": 3.530035379982166e-05, "Pretrain/Loss": 2.086735248565674, "Pretrain/Loss (Raw)": 2.068169593811035, "Pretrain/Step": 3661, "Pretrain/Step Time": 8.549288617447019} +{"Pretrain/Learning Rate": 3.5292617425108694e-05, "Pretrain/Loss": 2.0860445499420166, "Pretrain/Loss (Raw)": 2.1432371139526367, "Pretrain/Step": 3662, "Pretrain/Step Time": 8.546090997755527} +{"Pretrain/Learning Rate": 3.5284879863402585e-05, "Pretrain/Loss": 2.0853092670440674, "Pretrain/Loss (Raw)": 2.1099743843078613, "Pretrain/Step": 3663, "Pretrain/Step Time": 8.545266222208738} +{"Pretrain/Learning Rate": 3.527714111559567e-05, "Pretrain/Loss": 2.0869412422180176, "Pretrain/Loss (Raw)": 2.1229565143585205, "Pretrain/Step": 3664, "Pretrain/Step Time": 8.55342773348093} +{"Pretrain/Learning Rate": 3.526940118258041e-05, "Pretrain/Loss": 2.086724281311035, "Pretrain/Loss (Raw)": 2.0895724296569824, "Pretrain/Step": 3665, "Pretrain/Step Time": 8.554606406018138} +{"Pretrain/Learning Rate": 3.526166006524942e-05, "Pretrain/Loss": 2.0869264602661133, "Pretrain/Loss (Raw)": 2.082200288772583, "Pretrain/Step": 3666, "Pretrain/Step Time": 8.548214504495263} +{"Pretrain/Learning Rate": 3.525391776449544e-05, "Pretrain/Loss": 2.087113857269287, "Pretrain/Loss (Raw)": 2.1768689155578613, "Pretrain/Step": 3667, "Pretrain/Step Time": 8.542585356160998} +{"Pretrain/Learning Rate": 3.5246174281211344e-05, "Pretrain/Loss": 2.0861077308654785, "Pretrain/Loss (Raw)": 2.050644874572754, "Pretrain/Step": 3668, "Pretrain/Step Time": 8.540705662220716} +{"Pretrain/Learning Rate": 3.523842961629014e-05, "Pretrain/Loss": 2.0867631435394287, "Pretrain/Loss (Raw)": 2.2221474647521973, "Pretrain/Step": 3669, "Pretrain/Step Time": 8.540710495784879} +{"Pretrain/Learning Rate": 3.5230683770624987e-05, "Pretrain/Loss": 2.0854711532592773, "Pretrain/Loss (Raw)": 1.8082376718521118, "Pretrain/Step": 3670, "Pretrain/Step Time": 8.545688975602388} +{"Pretrain/Learning Rate": 3.522293674510918e-05, "Pretrain/Loss": 2.0867691040039062, "Pretrain/Loss (Raw)": 2.2304797172546387, "Pretrain/Step": 3671, "Pretrain/Step Time": 8.550755748525262} +{"Pretrain/Learning Rate": 3.5215188540636134e-05, "Pretrain/Loss": 2.0883278846740723, "Pretrain/Loss (Raw)": 2.328561544418335, "Pretrain/Step": 3672, "Pretrain/Step Time": 8.542829044163227} +{"Pretrain/Learning Rate": 3.520743915809941e-05, "Pretrain/Loss": 2.0875515937805176, "Pretrain/Loss (Raw)": 2.1137306690216064, "Pretrain/Step": 3673, "Pretrain/Step Time": 8.545588290318847} +{"Pretrain/Learning Rate": 3.51996885983927e-05, "Pretrain/Loss": 2.0886030197143555, "Pretrain/Loss (Raw)": 2.1724042892456055, "Pretrain/Step": 3674, "Pretrain/Step Time": 8.544343976303935} +{"Pretrain/Learning Rate": 3.519193686240984e-05, "Pretrain/Loss": 2.0907649993896484, "Pretrain/Loss (Raw)": 2.1395998001098633, "Pretrain/Step": 3675, "Pretrain/Step Time": 8.548887431621552} +{"Pretrain/Learning Rate": 3.51841839510448e-05, "Pretrain/Loss": 2.0921101570129395, "Pretrain/Loss (Raw)": 1.9909981489181519, "Pretrain/Step": 3676, "Pretrain/Step Time": 8.551274402067065} +{"Pretrain/Learning Rate": 3.517642986519167e-05, "Pretrain/Loss": 2.090451240539551, "Pretrain/Loss (Raw)": 2.1601645946502686, "Pretrain/Step": 3677, "Pretrain/Step Time": 8.548981724306941} +{"Pretrain/Learning Rate": 3.51686746057447e-05, "Pretrain/Loss": 2.0907676219940186, "Pretrain/Loss (Raw)": 2.267853021621704, "Pretrain/Step": 3678, "Pretrain/Step Time": 8.54710066691041} +{"Pretrain/Learning Rate": 3.516091817359825e-05, "Pretrain/Loss": 2.0897414684295654, "Pretrain/Loss (Raw)": 1.8566440343856812, "Pretrain/Step": 3679, "Pretrain/Step Time": 8.551453735679388} +{"Pretrain/Learning Rate": 3.515316056964684e-05, "Pretrain/Loss": 2.089262008666992, "Pretrain/Loss (Raw)": 2.123927593231201, "Pretrain/Step": 3680, "Pretrain/Step Time": 8.553421281278133} +{"Pretrain/Learning Rate": 3.5145401794785116e-05, "Pretrain/Loss": 2.086095094680786, "Pretrain/Loss (Raw)": 2.0566351413726807, "Pretrain/Step": 3681, "Pretrain/Step Time": 8.54824012517929} +{"Pretrain/Learning Rate": 3.5137641849907844e-05, "Pretrain/Loss": 2.0829176902770996, "Pretrain/Loss (Raw)": 1.8532257080078125, "Pretrain/Step": 3682, "Pretrain/Step Time": 8.55417275428772} +{"Pretrain/Learning Rate": 3.5129880735909945e-05, "Pretrain/Loss": 2.081531524658203, "Pretrain/Loss (Raw)": 2.0640358924865723, "Pretrain/Step": 3683, "Pretrain/Step Time": 8.553119149059057} +{"Pretrain/Learning Rate": 3.512211845368647e-05, "Pretrain/Loss": 2.0822958946228027, "Pretrain/Loss (Raw)": 2.222296714782715, "Pretrain/Step": 3684, "Pretrain/Step Time": 8.553456578403711} +{"Pretrain/Learning Rate": 3.511435500413259e-05, "Pretrain/Loss": 2.082818031311035, "Pretrain/Loss (Raw)": 2.1274898052215576, "Pretrain/Step": 3685, "Pretrain/Step Time": 8.545438764616847} +{"Pretrain/Learning Rate": 3.510659038814364e-05, "Pretrain/Loss": 2.0817439556121826, "Pretrain/Loss (Raw)": 1.9900007247924805, "Pretrain/Step": 3686, "Pretrain/Step Time": 8.549216059967875} +{"Pretrain/Learning Rate": 3.509882460661506e-05, "Pretrain/Loss": 2.0807008743286133, "Pretrain/Loss (Raw)": 1.7000471353530884, "Pretrain/Step": 3687, "Pretrain/Step Time": 8.550865730270743} +{"Pretrain/Learning Rate": 3.5091057660442434e-05, "Pretrain/Loss": 2.079813241958618, "Pretrain/Loss (Raw)": 1.9304577112197876, "Pretrain/Step": 3688, "Pretrain/Step Time": 8.552074940875173} +{"Pretrain/Learning Rate": 3.5083289550521495e-05, "Pretrain/Loss": 2.0812225341796875, "Pretrain/Loss (Raw)": 2.0919699668884277, "Pretrain/Step": 3689, "Pretrain/Step Time": 8.554452888667583} +{"Pretrain/Learning Rate": 3.507552027774809e-05, "Pretrain/Loss": 2.081050157546997, "Pretrain/Loss (Raw)": 2.0452239513397217, "Pretrain/Step": 3690, "Pretrain/Step Time": 8.544491097331047} +{"Pretrain/Learning Rate": 3.5067749843018205e-05, "Pretrain/Loss": 2.080639362335205, "Pretrain/Loss (Raw)": 2.102349281311035, "Pretrain/Step": 3691, "Pretrain/Step Time": 8.548943240195513} +{"Pretrain/Learning Rate": 3.5059978247227965e-05, "Pretrain/Loss": 2.080808162689209, "Pretrain/Loss (Raw)": 2.1892824172973633, "Pretrain/Step": 3692, "Pretrain/Step Time": 8.550334598869085} +{"Pretrain/Learning Rate": 3.505220549127364e-05, "Pretrain/Loss": 2.081455707550049, "Pretrain/Loss (Raw)": 2.1055588722229004, "Pretrain/Step": 3693, "Pretrain/Step Time": 8.543282555416226} +{"Pretrain/Learning Rate": 3.50444315760516e-05, "Pretrain/Loss": 2.0821125507354736, "Pretrain/Loss (Raw)": 2.196659803390503, "Pretrain/Step": 3694, "Pretrain/Step Time": 8.553199985995889} +{"Pretrain/Learning Rate": 3.503665650245838e-05, "Pretrain/Loss": 2.083817958831787, "Pretrain/Loss (Raw)": 2.22940993309021, "Pretrain/Step": 3695, "Pretrain/Step Time": 8.54509181343019} +{"Pretrain/Learning Rate": 3.502888027139065e-05, "Pretrain/Loss": 2.0864248275756836, "Pretrain/Loss (Raw)": 2.308872699737549, "Pretrain/Step": 3696, "Pretrain/Step Time": 8.554974522441626} +{"Pretrain/Learning Rate": 3.502110288374517e-05, "Pretrain/Loss": 2.086461067199707, "Pretrain/Loss (Raw)": 2.0829856395721436, "Pretrain/Step": 3697, "Pretrain/Step Time": 8.544477682560682} +{"Pretrain/Learning Rate": 3.50133243404189e-05, "Pretrain/Loss": 2.0852577686309814, "Pretrain/Loss (Raw)": 2.099318742752075, "Pretrain/Step": 3698, "Pretrain/Step Time": 8.546189157292247} +{"Pretrain/Learning Rate": 3.5005544642308874e-05, "Pretrain/Loss": 2.0846283435821533, "Pretrain/Loss (Raw)": 2.092843532562256, "Pretrain/Step": 3699, "Pretrain/Step Time": 8.548082828521729} +{"Pretrain/Learning Rate": 3.49977637903123e-05, "Pretrain/Loss": 2.085669755935669, "Pretrain/Loss (Raw)": 2.1586928367614746, "Pretrain/Step": 3700, "Pretrain/Step Time": 8.551277458667755} +{"Pretrain/Learning Rate": 3.4989981785326485e-05, "Pretrain/Loss": 2.0871996879577637, "Pretrain/Loss (Raw)": 2.2226316928863525, "Pretrain/Step": 3701, "Pretrain/Step Time": 8.553174521774054} +{"Pretrain/Learning Rate": 3.498219862824891e-05, "Pretrain/Loss": 2.0876619815826416, "Pretrain/Loss (Raw)": 2.0200321674346924, "Pretrain/Step": 3702, "Pretrain/Step Time": 8.552466984838247} +{"Pretrain/Learning Rate": 3.497441431997714e-05, "Pretrain/Loss": 2.088495969772339, "Pretrain/Loss (Raw)": 2.3638875484466553, "Pretrain/Step": 3703, "Pretrain/Step Time": 8.55060569010675} +{"Pretrain/Learning Rate": 3.4966628861408914e-05, "Pretrain/Loss": 2.089137077331543, "Pretrain/Loss (Raw)": 2.1356546878814697, "Pretrain/Step": 3704, "Pretrain/Step Time": 8.55080877430737} +{"Pretrain/Learning Rate": 3.495884225344208e-05, "Pretrain/Loss": 2.091456413269043, "Pretrain/Loss (Raw)": 2.1704211235046387, "Pretrain/Step": 3705, "Pretrain/Step Time": 8.548916898667812} +{"Pretrain/Learning Rate": 3.495105449697463e-05, "Pretrain/Loss": 2.0908336639404297, "Pretrain/Loss (Raw)": 2.014045238494873, "Pretrain/Step": 3706, "Pretrain/Step Time": 8.553656248375773} +{"Pretrain/Learning Rate": 3.494326559290469e-05, "Pretrain/Loss": 2.0921554565429688, "Pretrain/Loss (Raw)": 2.025554656982422, "Pretrain/Step": 3707, "Pretrain/Step Time": 8.560398621484637} +{"Pretrain/Learning Rate": 3.4935475542130505e-05, "Pretrain/Loss": 2.090773344039917, "Pretrain/Loss (Raw)": 2.0660836696624756, "Pretrain/Step": 3708, "Pretrain/Step Time": 8.552734062075615} +{"Pretrain/Learning Rate": 3.492768434555046e-05, "Pretrain/Loss": 2.09152889251709, "Pretrain/Loss (Raw)": 2.201124668121338, "Pretrain/Step": 3709, "Pretrain/Step Time": 8.554590176790953} +{"Pretrain/Learning Rate": 3.4919892004063084e-05, "Pretrain/Loss": 2.091407299041748, "Pretrain/Loss (Raw)": 2.021439552307129, "Pretrain/Step": 3710, "Pretrain/Step Time": 8.560840297490358} +{"Pretrain/Learning Rate": 3.491209851856701e-05, "Pretrain/Loss": 2.091404914855957, "Pretrain/Loss (Raw)": 1.9846588373184204, "Pretrain/Step": 3711, "Pretrain/Step Time": 8.56194400601089} +{"Pretrain/Learning Rate": 3.490430388996103e-05, "Pretrain/Loss": 2.0931577682495117, "Pretrain/Loss (Raw)": 2.115246534347534, "Pretrain/Step": 3712, "Pretrain/Step Time": 8.565316867083311} +{"Pretrain/Learning Rate": 3.4896508119144056e-05, "Pretrain/Loss": 2.093405246734619, "Pretrain/Loss (Raw)": 2.1085519790649414, "Pretrain/Step": 3713, "Pretrain/Step Time": 8.564051637426019} +{"Pretrain/Learning Rate": 3.4888711207015124e-05, "Pretrain/Loss": 2.094552516937256, "Pretrain/Loss (Raw)": 2.183971881866455, "Pretrain/Step": 3714, "Pretrain/Step Time": 8.555260078981519} +{"Pretrain/Learning Rate": 3.488091315447343e-05, "Pretrain/Loss": 2.0958924293518066, "Pretrain/Loss (Raw)": 2.1344411373138428, "Pretrain/Step": 3715, "Pretrain/Step Time": 8.556792987510562} +{"Pretrain/Learning Rate": 3.487311396241826e-05, "Pretrain/Loss": 2.096309185028076, "Pretrain/Loss (Raw)": 1.987047553062439, "Pretrain/Step": 3716, "Pretrain/Step Time": 8.560968074947596} +{"Pretrain/Learning Rate": 3.486531363174908e-05, "Pretrain/Loss": 2.0960991382598877, "Pretrain/Loss (Raw)": 2.1180686950683594, "Pretrain/Step": 3717, "Pretrain/Step Time": 8.560104487463832} +{"Pretrain/Learning Rate": 3.4857512163365424e-05, "Pretrain/Loss": 2.0954174995422363, "Pretrain/Loss (Raw)": 2.1426427364349365, "Pretrain/Step": 3718, "Pretrain/Step Time": 8.556923035532236} +{"Pretrain/Learning Rate": 3.484970955816703e-05, "Pretrain/Loss": 2.0925047397613525, "Pretrain/Loss (Raw)": 1.7526065111160278, "Pretrain/Step": 3719, "Pretrain/Step Time": 8.56436470337212} +{"Pretrain/Learning Rate": 3.484190581705371e-05, "Pretrain/Loss": 2.091001510620117, "Pretrain/Loss (Raw)": 1.9942480325698853, "Pretrain/Step": 3720, "Pretrain/Step Time": 8.551478022709489} +{"Pretrain/Learning Rate": 3.483410094092543e-05, "Pretrain/Loss": 2.094642400741577, "Pretrain/Loss (Raw)": 2.2384026050567627, "Pretrain/Step": 3721, "Pretrain/Step Time": 8.55476738512516} +{"Pretrain/Learning Rate": 3.48262949306823e-05, "Pretrain/Loss": 2.094320297241211, "Pretrain/Loss (Raw)": 2.075136661529541, "Pretrain/Step": 3722, "Pretrain/Step Time": 8.552908955141902} +{"Pretrain/Learning Rate": 3.481848778722453e-05, "Pretrain/Loss": 2.0920469760894775, "Pretrain/Loss (Raw)": 2.022946357727051, "Pretrain/Step": 3723, "Pretrain/Step Time": 8.552521336823702} +{"Pretrain/Learning Rate": 3.4810679511452484e-05, "Pretrain/Loss": 2.0936660766601562, "Pretrain/Loss (Raw)": 2.20676851272583, "Pretrain/Step": 3724, "Pretrain/Step Time": 8.552142774686217} +{"Pretrain/Learning Rate": 3.480287010426664e-05, "Pretrain/Loss": 2.0973901748657227, "Pretrain/Loss (Raw)": 2.513331413269043, "Pretrain/Step": 3725, "Pretrain/Step Time": 8.557583386078477} +{"Pretrain/Learning Rate": 3.479505956656764e-05, "Pretrain/Loss": 2.099571943283081, "Pretrain/Loss (Raw)": 2.1315906047821045, "Pretrain/Step": 3726, "Pretrain/Step Time": 8.549843616783619} +{"Pretrain/Learning Rate": 3.47872478992562e-05, "Pretrain/Loss": 2.0983166694641113, "Pretrain/Loss (Raw)": 2.0379037857055664, "Pretrain/Step": 3727, "Pretrain/Step Time": 8.553660677745938} +{"Pretrain/Learning Rate": 3.477943510323322e-05, "Pretrain/Loss": 2.098806858062744, "Pretrain/Loss (Raw)": 2.1573362350463867, "Pretrain/Step": 3728, "Pretrain/Step Time": 8.548640353605151} +{"Pretrain/Learning Rate": 3.4771621179399696e-05, "Pretrain/Loss": 2.097602367401123, "Pretrain/Loss (Raw)": 2.2300021648406982, "Pretrain/Step": 3729, "Pretrain/Step Time": 8.553723145276308} +{"Pretrain/Learning Rate": 3.476380612865679e-05, "Pretrain/Loss": 2.0960333347320557, "Pretrain/Loss (Raw)": 2.0166375637054443, "Pretrain/Step": 3730, "Pretrain/Step Time": 8.549397695809603} +{"Pretrain/Learning Rate": 3.475598995190572e-05, "Pretrain/Loss": 2.096294403076172, "Pretrain/Loss (Raw)": 2.0126824378967285, "Pretrain/Step": 3731, "Pretrain/Step Time": 8.560018088668585} +{"Pretrain/Learning Rate": 3.4748172650047945e-05, "Pretrain/Loss": 2.095888137817383, "Pretrain/Loss (Raw)": 1.8978713750839233, "Pretrain/Step": 3732, "Pretrain/Step Time": 8.553961277008057} +{"Pretrain/Learning Rate": 3.474035422398496e-05, "Pretrain/Loss": 2.0959630012512207, "Pretrain/Loss (Raw)": 2.077202320098877, "Pretrain/Step": 3733, "Pretrain/Step Time": 8.563062705099583} +{"Pretrain/Learning Rate": 3.473253467461842e-05, "Pretrain/Loss": 2.094731330871582, "Pretrain/Loss (Raw)": 2.0057692527770996, "Pretrain/Step": 3734, "Pretrain/Step Time": 8.555137898772955} +{"Pretrain/Learning Rate": 3.4724714002850125e-05, "Pretrain/Loss": 2.09602427482605, "Pretrain/Loss (Raw)": 2.092838764190674, "Pretrain/Step": 3735, "Pretrain/Step Time": 8.556358499452472} +{"Pretrain/Learning Rate": 3.471689220958198e-05, "Pretrain/Loss": 2.0959768295288086, "Pretrain/Loss (Raw)": 2.145490884780884, "Pretrain/Step": 3736, "Pretrain/Step Time": 8.554932793602347} +{"Pretrain/Learning Rate": 3.470906929571605e-05, "Pretrain/Loss": 2.095834970474243, "Pretrain/Loss (Raw)": 2.04409122467041, "Pretrain/Step": 3737, "Pretrain/Step Time": 8.55959371291101} +{"Pretrain/Learning Rate": 3.470124526215449e-05, "Pretrain/Loss": 2.097536563873291, "Pretrain/Loss (Raw)": 2.2642481327056885, "Pretrain/Step": 3738, "Pretrain/Step Time": 8.55210023932159} +{"Pretrain/Learning Rate": 3.469342010979962e-05, "Pretrain/Loss": 2.096261978149414, "Pretrain/Loss (Raw)": 2.0084311962127686, "Pretrain/Step": 3739, "Pretrain/Step Time": 8.556064071133733} +{"Pretrain/Learning Rate": 3.4685593839553856e-05, "Pretrain/Loss": 2.097609281539917, "Pretrain/Loss (Raw)": 2.1553688049316406, "Pretrain/Step": 3740, "Pretrain/Step Time": 8.553476000204682} +{"Pretrain/Learning Rate": 3.467776645231978e-05, "Pretrain/Loss": 2.096045970916748, "Pretrain/Loss (Raw)": 2.2888808250427246, "Pretrain/Step": 3741, "Pretrain/Step Time": 8.556090898811817} +{"Pretrain/Learning Rate": 3.466993794900007e-05, "Pretrain/Loss": 2.097846508026123, "Pretrain/Loss (Raw)": 2.375540018081665, "Pretrain/Step": 3742, "Pretrain/Step Time": 8.5580815076828} +{"Pretrain/Learning Rate": 3.466210833049755e-05, "Pretrain/Loss": 2.0963401794433594, "Pretrain/Loss (Raw)": 1.7850391864776611, "Pretrain/Step": 3743, "Pretrain/Step Time": 8.563693437725306} +{"Pretrain/Learning Rate": 3.465427759771516e-05, "Pretrain/Loss": 2.098202705383301, "Pretrain/Loss (Raw)": 2.24733567237854, "Pretrain/Step": 3744, "Pretrain/Step Time": 8.55202634446323} +{"Pretrain/Learning Rate": 3.464644575155599e-05, "Pretrain/Loss": 2.097252368927002, "Pretrain/Loss (Raw)": 2.0040149688720703, "Pretrain/Step": 3745, "Pretrain/Step Time": 8.551445409655571} +{"Pretrain/Learning Rate": 3.463861279292324e-05, "Pretrain/Loss": 2.096681594848633, "Pretrain/Loss (Raw)": 2.0571329593658447, "Pretrain/Step": 3746, "Pretrain/Step Time": 8.553226893767715} +{"Pretrain/Learning Rate": 3.4630778722720244e-05, "Pretrain/Loss": 2.098147392272949, "Pretrain/Loss (Raw)": 2.067420482635498, "Pretrain/Step": 3747, "Pretrain/Step Time": 8.556300206109881} +{"Pretrain/Learning Rate": 3.462294354185046e-05, "Pretrain/Loss": 2.097750186920166, "Pretrain/Loss (Raw)": 1.9603859186172485, "Pretrain/Step": 3748, "Pretrain/Step Time": 8.5541882365942} +{"Pretrain/Learning Rate": 3.4615107251217496e-05, "Pretrain/Loss": 2.0979208946228027, "Pretrain/Loss (Raw)": 2.0662968158721924, "Pretrain/Step": 3749, "Pretrain/Step Time": 8.559029063209891} +{"Pretrain/Learning Rate": 3.460726985172504e-05, "Pretrain/Loss": 2.0982699394226074, "Pretrain/Loss (Raw)": 2.009636640548706, "Pretrain/Step": 3750, "Pretrain/Step Time": 8.54728084243834} +{"Pretrain/Learning Rate": 3.4599431344276966e-05, "Pretrain/Loss": 2.0986366271972656, "Pretrain/Loss (Raw)": 2.1703433990478516, "Pretrain/Step": 3751, "Pretrain/Step Time": 8.556305466219783} +{"Pretrain/Learning Rate": 3.459159172977723e-05, "Pretrain/Loss": 2.101802110671997, "Pretrain/Loss (Raw)": 2.4837875366210938, "Pretrain/Step": 3752, "Pretrain/Step Time": 8.55350386351347} +{"Pretrain/Learning Rate": 3.4583751009129936e-05, "Pretrain/Loss": 2.101095676422119, "Pretrain/Loss (Raw)": 2.0956082344055176, "Pretrain/Step": 3753, "Pretrain/Step Time": 8.552869528532028} +{"Pretrain/Learning Rate": 3.457590918323932e-05, "Pretrain/Loss": 2.1001811027526855, "Pretrain/Loss (Raw)": 1.9281258583068848, "Pretrain/Step": 3754, "Pretrain/Step Time": 8.555324485525489} +{"Pretrain/Learning Rate": 3.4568066253009736e-05, "Pretrain/Loss": 2.100191116333008, "Pretrain/Loss (Raw)": 1.9804507493972778, "Pretrain/Step": 3755, "Pretrain/Step Time": 8.55465010739863} +{"Pretrain/Learning Rate": 3.456022221934566e-05, "Pretrain/Loss": 2.0998706817626953, "Pretrain/Loss (Raw)": 2.021618604660034, "Pretrain/Step": 3756, "Pretrain/Step Time": 8.546203672885895} +{"Pretrain/Learning Rate": 3.455237708315171e-05, "Pretrain/Loss": 2.1002137660980225, "Pretrain/Loss (Raw)": 2.087155818939209, "Pretrain/Step": 3757, "Pretrain/Step Time": 8.55290836840868} +{"Pretrain/Learning Rate": 3.454453084533262e-05, "Pretrain/Loss": 2.1008801460266113, "Pretrain/Loss (Raw)": 2.1806230545043945, "Pretrain/Step": 3758, "Pretrain/Step Time": 8.553435569629073} +{"Pretrain/Learning Rate": 3.453668350679327e-05, "Pretrain/Loss": 2.101029872894287, "Pretrain/Loss (Raw)": 1.9301058053970337, "Pretrain/Step": 3759, "Pretrain/Step Time": 8.552520273253322} +{"Pretrain/Learning Rate": 3.4528835068438625e-05, "Pretrain/Loss": 2.099874496459961, "Pretrain/Loss (Raw)": 1.9209481477737427, "Pretrain/Step": 3760, "Pretrain/Step Time": 8.558006161823869} +{"Pretrain/Learning Rate": 3.452098553117382e-05, "Pretrain/Loss": 2.098257064819336, "Pretrain/Loss (Raw)": 1.9906079769134521, "Pretrain/Step": 3761, "Pretrain/Step Time": 8.563683176413178} +{"Pretrain/Learning Rate": 3.4513134895904105e-05, "Pretrain/Loss": 2.097667694091797, "Pretrain/Loss (Raw)": 2.0065646171569824, "Pretrain/Step": 3762, "Pretrain/Step Time": 8.553131349384785} +{"Pretrain/Learning Rate": 3.450528316353484e-05, "Pretrain/Loss": 2.0978784561157227, "Pretrain/Loss (Raw)": 2.0653023719787598, "Pretrain/Step": 3763, "Pretrain/Step Time": 8.552580954506993} +{"Pretrain/Learning Rate": 3.4497430334971534e-05, "Pretrain/Loss": 2.0983803272247314, "Pretrain/Loss (Raw)": 2.1135332584381104, "Pretrain/Step": 3764, "Pretrain/Step Time": 8.551653925329447} +{"Pretrain/Learning Rate": 3.448957641111981e-05, "Pretrain/Loss": 2.0938568115234375, "Pretrain/Loss (Raw)": 1.8582196235656738, "Pretrain/Step": 3765, "Pretrain/Step Time": 8.549572836607695} +{"Pretrain/Learning Rate": 3.4481721392885414e-05, "Pretrain/Loss": 2.0955018997192383, "Pretrain/Loss (Raw)": 2.117462158203125, "Pretrain/Step": 3766, "Pretrain/Step Time": 8.552165571600199} +{"Pretrain/Learning Rate": 3.447386528117423e-05, "Pretrain/Loss": 2.092916488647461, "Pretrain/Loss (Raw)": 1.8258897066116333, "Pretrain/Step": 3767, "Pretrain/Step Time": 8.555779319256544} +{"Pretrain/Learning Rate": 3.446600807689226e-05, "Pretrain/Loss": 2.09452223777771, "Pretrain/Loss (Raw)": 2.274160146713257, "Pretrain/Step": 3768, "Pretrain/Step Time": 8.55784902535379} +{"Pretrain/Learning Rate": 3.4458149780945636e-05, "Pretrain/Loss": 2.0942859649658203, "Pretrain/Loss (Raw)": 2.233471393585205, "Pretrain/Step": 3769, "Pretrain/Step Time": 8.561659630388021} +{"Pretrain/Learning Rate": 3.4450290394240606e-05, "Pretrain/Loss": 2.0947961807250977, "Pretrain/Loss (Raw)": 2.1670849323272705, "Pretrain/Step": 3770, "Pretrain/Step Time": 8.558272214606404} +{"Pretrain/Learning Rate": 3.444242991768356e-05, "Pretrain/Loss": 2.092427968978882, "Pretrain/Loss (Raw)": 1.9488420486450195, "Pretrain/Step": 3771, "Pretrain/Step Time": 8.554705752059817} +{"Pretrain/Learning Rate": 3.4434568352181e-05, "Pretrain/Loss": 2.0912911891937256, "Pretrain/Loss (Raw)": 1.931320309638977, "Pretrain/Step": 3772, "Pretrain/Step Time": 8.555432202294469} +{"Pretrain/Learning Rate": 3.442670569863956e-05, "Pretrain/Loss": 2.0946013927459717, "Pretrain/Loss (Raw)": 2.327188014984131, "Pretrain/Step": 3773, "Pretrain/Step Time": 8.557782707735896} +{"Pretrain/Learning Rate": 3.4418841957965995e-05, "Pretrain/Loss": 2.095654010772705, "Pretrain/Loss (Raw)": 2.096914052963257, "Pretrain/Step": 3774, "Pretrain/Step Time": 8.554779101163149} +{"Pretrain/Learning Rate": 3.44109771310672e-05, "Pretrain/Loss": 2.095897674560547, "Pretrain/Loss (Raw)": 2.1521084308624268, "Pretrain/Step": 3775, "Pretrain/Step Time": 8.563731694594026} +{"Pretrain/Learning Rate": 3.440311121885018e-05, "Pretrain/Loss": 2.0961477756500244, "Pretrain/Loss (Raw)": 2.213073492050171, "Pretrain/Step": 3776, "Pretrain/Step Time": 8.557846248149872} +{"Pretrain/Learning Rate": 3.4395244222222054e-05, "Pretrain/Loss": 2.095226287841797, "Pretrain/Loss (Raw)": 2.072662353515625, "Pretrain/Step": 3777, "Pretrain/Step Time": 8.558759897947311} +{"Pretrain/Learning Rate": 3.43873761420901e-05, "Pretrain/Loss": 2.09222412109375, "Pretrain/Loss (Raw)": 2.2080063819885254, "Pretrain/Step": 3778, "Pretrain/Step Time": 8.559313725680113} +{"Pretrain/Learning Rate": 3.4379506979361694e-05, "Pretrain/Loss": 2.0944080352783203, "Pretrain/Loss (Raw)": 2.1965560913085938, "Pretrain/Step": 3779, "Pretrain/Step Time": 8.560719029977918} +{"Pretrain/Learning Rate": 3.437163673494434e-05, "Pretrain/Loss": 2.0947153568267822, "Pretrain/Loss (Raw)": 2.2568211555480957, "Pretrain/Step": 3780, "Pretrain/Step Time": 8.553162982687354} +{"Pretrain/Learning Rate": 3.436376540974568e-05, "Pretrain/Loss": 2.0939836502075195, "Pretrain/Loss (Raw)": 2.073687791824341, "Pretrain/Step": 3781, "Pretrain/Step Time": 8.56088967807591} +{"Pretrain/Learning Rate": 3.4355893004673476e-05, "Pretrain/Loss": 2.0953330993652344, "Pretrain/Loss (Raw)": 2.142178535461426, "Pretrain/Step": 3782, "Pretrain/Step Time": 8.559697629883885} +{"Pretrain/Learning Rate": 3.4348019520635587e-05, "Pretrain/Loss": 2.0936145782470703, "Pretrain/Loss (Raw)": 1.915635585784912, "Pretrain/Step": 3783, "Pretrain/Step Time": 8.556356005370617} +{"Pretrain/Learning Rate": 3.434014495854006e-05, "Pretrain/Loss": 2.093628168106079, "Pretrain/Loss (Raw)": 2.0728330612182617, "Pretrain/Step": 3784, "Pretrain/Step Time": 8.562090523540974} +{"Pretrain/Learning Rate": 3.4332269319294984e-05, "Pretrain/Loss": 2.0939080715179443, "Pretrain/Loss (Raw)": 1.9324183464050293, "Pretrain/Step": 3785, "Pretrain/Step Time": 8.561096519231796} +{"Pretrain/Learning Rate": 3.432439260380865e-05, "Pretrain/Loss": 2.094820976257324, "Pretrain/Loss (Raw)": 2.0099053382873535, "Pretrain/Step": 3786, "Pretrain/Step Time": 8.556176604703069} +{"Pretrain/Learning Rate": 3.4316514812989406e-05, "Pretrain/Loss": 2.094193458557129, "Pretrain/Loss (Raw)": 2.0974671840667725, "Pretrain/Step": 3787, "Pretrain/Step Time": 8.553833119571209} +{"Pretrain/Learning Rate": 3.4308635947745796e-05, "Pretrain/Loss": 2.0934619903564453, "Pretrain/Loss (Raw)": 2.0006327629089355, "Pretrain/Step": 3788, "Pretrain/Step Time": 8.551550513133407} +{"Pretrain/Learning Rate": 3.43007560089864e-05, "Pretrain/Loss": 2.094489097595215, "Pretrain/Loss (Raw)": 2.199624538421631, "Pretrain/Step": 3789, "Pretrain/Step Time": 8.555312914773822} +{"Pretrain/Learning Rate": 3.429287499762001e-05, "Pretrain/Loss": 2.09335994720459, "Pretrain/Loss (Raw)": 1.9987372159957886, "Pretrain/Step": 3790, "Pretrain/Step Time": 8.558016572147608} +{"Pretrain/Learning Rate": 3.428499291455548e-05, "Pretrain/Loss": 2.092583417892456, "Pretrain/Loss (Raw)": 2.010577440261841, "Pretrain/Step": 3791, "Pretrain/Step Time": 8.562556372955441} +{"Pretrain/Learning Rate": 3.427710976070182e-05, "Pretrain/Loss": 2.0920395851135254, "Pretrain/Loss (Raw)": 2.0533390045166016, "Pretrain/Step": 3792, "Pretrain/Step Time": 8.553898595273495} +{"Pretrain/Learning Rate": 3.426922553696814e-05, "Pretrain/Loss": 2.0914502143859863, "Pretrain/Loss (Raw)": 2.0141303539276123, "Pretrain/Step": 3793, "Pretrain/Step Time": 8.553192012012005} +{"Pretrain/Learning Rate": 3.426134024426371e-05, "Pretrain/Loss": 2.0903103351593018, "Pretrain/Loss (Raw)": 1.9362715482711792, "Pretrain/Step": 3794, "Pretrain/Step Time": 8.552207116037607} +{"Pretrain/Learning Rate": 3.425345388349786e-05, "Pretrain/Loss": 2.091069459915161, "Pretrain/Loss (Raw)": 2.2740654945373535, "Pretrain/Step": 3795, "Pretrain/Step Time": 8.554607942700386} +{"Pretrain/Learning Rate": 3.4245566455580116e-05, "Pretrain/Loss": 2.0937561988830566, "Pretrain/Loss (Raw)": 2.394540309906006, "Pretrain/Step": 3796, "Pretrain/Step Time": 8.559933800250292} +{"Pretrain/Learning Rate": 3.423767796142008e-05, "Pretrain/Loss": 2.0928006172180176, "Pretrain/Loss (Raw)": 2.099808692932129, "Pretrain/Step": 3797, "Pretrain/Step Time": 8.562509952113032} +{"Pretrain/Learning Rate": 3.422978840192749e-05, "Pretrain/Loss": 2.094168186187744, "Pretrain/Loss (Raw)": 1.983311414718628, "Pretrain/Step": 3798, "Pretrain/Step Time": 8.554547114297748} +{"Pretrain/Learning Rate": 3.4221897778012214e-05, "Pretrain/Loss": 2.0927047729492188, "Pretrain/Loss (Raw)": 2.043174982070923, "Pretrain/Step": 3799, "Pretrain/Step Time": 8.555393820628524} +{"Pretrain/Learning Rate": 3.421400609058423e-05, "Pretrain/Loss": 2.0916008949279785, "Pretrain/Loss (Raw)": 2.1872408390045166, "Pretrain/Step": 3800, "Pretrain/Step Time": 8.555532243102789} +{"Pretrain/Learning Rate": 3.420611334055365e-05, "Pretrain/Loss": 2.09196138381958, "Pretrain/Loss (Raw)": 2.159869432449341, "Pretrain/Step": 3801, "Pretrain/Step Time": 8.555437540635467} +{"Pretrain/Learning Rate": 3.4198219528830675e-05, "Pretrain/Loss": 2.0909135341644287, "Pretrain/Loss (Raw)": 2.0383100509643555, "Pretrain/Step": 3802, "Pretrain/Step Time": 8.55459700897336} +{"Pretrain/Learning Rate": 3.4190324656325704e-05, "Pretrain/Loss": 2.09175968170166, "Pretrain/Loss (Raw)": 2.2479147911071777, "Pretrain/Step": 3803, "Pretrain/Step Time": 8.54722017236054} +{"Pretrain/Learning Rate": 3.418242872394919e-05, "Pretrain/Loss": 2.093564748764038, "Pretrain/Loss (Raw)": 2.2220146656036377, "Pretrain/Step": 3804, "Pretrain/Step Time": 8.549742752686143} +{"Pretrain/Learning Rate": 3.417453173261171e-05, "Pretrain/Loss": 2.093535900115967, "Pretrain/Loss (Raw)": 2.156487464904785, "Pretrain/Step": 3805, "Pretrain/Step Time": 8.553364273160696} +{"Pretrain/Learning Rate": 3.4166633683224015e-05, "Pretrain/Loss": 2.091146945953369, "Pretrain/Loss (Raw)": 1.9620792865753174, "Pretrain/Step": 3806, "Pretrain/Step Time": 8.554892405867577} +{"Pretrain/Learning Rate": 3.4158734576696915e-05, "Pretrain/Loss": 2.0928432941436768, "Pretrain/Loss (Raw)": 2.0737624168395996, "Pretrain/Step": 3807, "Pretrain/Step Time": 8.548921331763268} +{"Pretrain/Learning Rate": 3.4150834413941394e-05, "Pretrain/Loss": 2.0919852256774902, "Pretrain/Loss (Raw)": 2.014068126678467, "Pretrain/Step": 3808, "Pretrain/Step Time": 8.54993873089552} +{"Pretrain/Learning Rate": 3.414293319586853e-05, "Pretrain/Loss": 2.092057704925537, "Pretrain/Loss (Raw)": 2.065943479537964, "Pretrain/Step": 3809, "Pretrain/Step Time": 8.550502762198448} +{"Pretrain/Learning Rate": 3.4135030923389525e-05, "Pretrain/Loss": 2.093428134918213, "Pretrain/Loss (Raw)": 2.0286240577697754, "Pretrain/Step": 3810, "Pretrain/Step Time": 8.55298594944179} +{"Pretrain/Learning Rate": 3.412712759741571e-05, "Pretrain/Loss": 2.0929064750671387, "Pretrain/Loss (Raw)": 1.9972652196884155, "Pretrain/Step": 3811, "Pretrain/Step Time": 8.55405849404633} +{"Pretrain/Learning Rate": 3.411922321885853e-05, "Pretrain/Loss": 2.0916810035705566, "Pretrain/Loss (Raw)": 2.0654163360595703, "Pretrain/Step": 3812, "Pretrain/Step Time": 8.550786891952157} +{"Pretrain/Learning Rate": 3.411131778862955e-05, "Pretrain/Loss": 2.0924463272094727, "Pretrain/Loss (Raw)": 2.225480079650879, "Pretrain/Step": 3813, "Pretrain/Step Time": 8.552263170480728} +{"Pretrain/Learning Rate": 3.4103411307640475e-05, "Pretrain/Loss": 2.0944983959198, "Pretrain/Loss (Raw)": 2.2526662349700928, "Pretrain/Step": 3814, "Pretrain/Step Time": 8.550780741497874} +{"Pretrain/Learning Rate": 3.409550377680311e-05, "Pretrain/Loss": 2.097595691680908, "Pretrain/Loss (Raw)": 2.0965018272399902, "Pretrain/Step": 3815, "Pretrain/Step Time": 8.549695203080773} +{"Pretrain/Learning Rate": 3.408759519702939e-05, "Pretrain/Loss": 2.099198341369629, "Pretrain/Loss (Raw)": 2.135601282119751, "Pretrain/Step": 3816, "Pretrain/Step Time": 8.553072540089488} +{"Pretrain/Learning Rate": 3.407968556923137e-05, "Pretrain/Loss": 2.098475456237793, "Pretrain/Loss (Raw)": 1.9994271993637085, "Pretrain/Step": 3817, "Pretrain/Step Time": 8.552862318232656} +{"Pretrain/Learning Rate": 3.407177489432123e-05, "Pretrain/Loss": 2.098844051361084, "Pretrain/Loss (Raw)": 2.0924222469329834, "Pretrain/Step": 3818, "Pretrain/Step Time": 8.55103613436222} +{"Pretrain/Learning Rate": 3.406386317321126e-05, "Pretrain/Loss": 2.098712921142578, "Pretrain/Loss (Raw)": 2.085535764694214, "Pretrain/Step": 3819, "Pretrain/Step Time": 8.548033503815532} +{"Pretrain/Learning Rate": 3.4055950406813875e-05, "Pretrain/Loss": 2.098879337310791, "Pretrain/Loss (Raw)": 2.2105984687805176, "Pretrain/Step": 3820, "Pretrain/Step Time": 8.548841705545783} +{"Pretrain/Learning Rate": 3.404803659604162e-05, "Pretrain/Loss": 2.10034441947937, "Pretrain/Loss (Raw)": 2.293086290359497, "Pretrain/Step": 3821, "Pretrain/Step Time": 8.549692383036017} +{"Pretrain/Learning Rate": 3.4040121741807146e-05, "Pretrain/Loss": 2.0990865230560303, "Pretrain/Loss (Raw)": 2.035633087158203, "Pretrain/Step": 3822, "Pretrain/Step Time": 8.549281956627965} +{"Pretrain/Learning Rate": 3.403220584502323e-05, "Pretrain/Loss": 2.0983052253723145, "Pretrain/Loss (Raw)": 2.1294331550598145, "Pretrain/Step": 3823, "Pretrain/Step Time": 8.549039017409086} +{"Pretrain/Learning Rate": 3.402428890660279e-05, "Pretrain/Loss": 2.097612142562866, "Pretrain/Loss (Raw)": 2.22013258934021, "Pretrain/Step": 3824, "Pretrain/Step Time": 8.547657385468483} +{"Pretrain/Learning Rate": 3.401637092745882e-05, "Pretrain/Loss": 2.0964486598968506, "Pretrain/Loss (Raw)": 1.9340814352035522, "Pretrain/Step": 3825, "Pretrain/Step Time": 8.551144529134035} +{"Pretrain/Learning Rate": 3.4008451908504457e-05, "Pretrain/Loss": 2.096486806869507, "Pretrain/Loss (Raw)": 2.1041882038116455, "Pretrain/Step": 3826, "Pretrain/Step Time": 8.549580989405513} +{"Pretrain/Learning Rate": 3.400053185065298e-05, "Pretrain/Loss": 2.0966076850891113, "Pretrain/Loss (Raw)": 2.108327627182007, "Pretrain/Step": 3827, "Pretrain/Step Time": 8.553560910746455} +{"Pretrain/Learning Rate": 3.399261075481776e-05, "Pretrain/Loss": 2.095755100250244, "Pretrain/Loss (Raw)": 2.0495564937591553, "Pretrain/Step": 3828, "Pretrain/Step Time": 8.551731444895267} +{"Pretrain/Learning Rate": 3.39846886219123e-05, "Pretrain/Loss": 2.0930142402648926, "Pretrain/Loss (Raw)": 1.8718067407608032, "Pretrain/Step": 3829, "Pretrain/Step Time": 8.550830129534006} +{"Pretrain/Learning Rate": 3.3976765452850194e-05, "Pretrain/Loss": 2.0923826694488525, "Pretrain/Loss (Raw)": 1.9391816854476929, "Pretrain/Step": 3830, "Pretrain/Step Time": 8.553493566811085} +{"Pretrain/Learning Rate": 3.3968841248545214e-05, "Pretrain/Loss": 2.0895121097564697, "Pretrain/Loss (Raw)": 1.9964544773101807, "Pretrain/Step": 3831, "Pretrain/Step Time": 8.553242355585098} +{"Pretrain/Learning Rate": 3.396091600991118e-05, "Pretrain/Loss": 2.0888848304748535, "Pretrain/Loss (Raw)": 2.055340528488159, "Pretrain/Step": 3832, "Pretrain/Step Time": 8.555376762524247} +{"Pretrain/Learning Rate": 3.39529897378621e-05, "Pretrain/Loss": 2.0873312950134277, "Pretrain/Loss (Raw)": 1.9715687036514282, "Pretrain/Step": 3833, "Pretrain/Step Time": 8.552470659837127} +{"Pretrain/Learning Rate": 3.3945062433312055e-05, "Pretrain/Loss": 2.0852737426757812, "Pretrain/Loss (Raw)": 1.7507174015045166, "Pretrain/Step": 3834, "Pretrain/Step Time": 8.557870907709002} +{"Pretrain/Learning Rate": 3.3937134097175256e-05, "Pretrain/Loss": 2.084815502166748, "Pretrain/Loss (Raw)": 1.966858983039856, "Pretrain/Step": 3835, "Pretrain/Step Time": 8.550735093653202} +{"Pretrain/Learning Rate": 3.392920473036604e-05, "Pretrain/Loss": 2.0838122367858887, "Pretrain/Loss (Raw)": 1.9376729726791382, "Pretrain/Step": 3836, "Pretrain/Step Time": 8.559923697263002} +{"Pretrain/Learning Rate": 3.392127433379886e-05, "Pretrain/Loss": 2.082031488418579, "Pretrain/Loss (Raw)": 1.9732152223587036, "Pretrain/Step": 3837, "Pretrain/Step Time": 8.55748731829226} +{"Pretrain/Learning Rate": 3.391334290838829e-05, "Pretrain/Loss": 2.082268476486206, "Pretrain/Loss (Raw)": 2.051765203475952, "Pretrain/Step": 3838, "Pretrain/Step Time": 8.555771131068468} +{"Pretrain/Learning Rate": 3.3905410455049e-05, "Pretrain/Loss": 2.0838136672973633, "Pretrain/Loss (Raw)": 2.1824235916137695, "Pretrain/Step": 3839, "Pretrain/Step Time": 8.552002614364028} +{"Pretrain/Learning Rate": 3.389747697469583e-05, "Pretrain/Loss": 2.083500385284424, "Pretrain/Loss (Raw)": 2.075157642364502, "Pretrain/Step": 3840, "Pretrain/Step Time": 8.556454265490174} +{"Pretrain/Learning Rate": 3.388954246824367e-05, "Pretrain/Loss": 2.084040880203247, "Pretrain/Loss (Raw)": 2.177739381790161, "Pretrain/Step": 3841, "Pretrain/Step Time": 8.558274859562516} +{"Pretrain/Learning Rate": 3.3881606936607604e-05, "Pretrain/Loss": 2.0838704109191895, "Pretrain/Loss (Raw)": 2.162168264389038, "Pretrain/Step": 3842, "Pretrain/Step Time": 8.556879768148065} +{"Pretrain/Learning Rate": 3.387367038070275e-05, "Pretrain/Loss": 2.082202434539795, "Pretrain/Loss (Raw)": 1.9209263324737549, "Pretrain/Step": 3843, "Pretrain/Step Time": 8.556360118091106} +{"Pretrain/Learning Rate": 3.386573280144444e-05, "Pretrain/Loss": 2.0824713706970215, "Pretrain/Loss (Raw)": 2.0214734077453613, "Pretrain/Step": 3844, "Pretrain/Step Time": 8.553467217832804} +{"Pretrain/Learning Rate": 3.385779419974803e-05, "Pretrain/Loss": 2.0824790000915527, "Pretrain/Loss (Raw)": 2.119033098220825, "Pretrain/Step": 3845, "Pretrain/Step Time": 8.553634587675333} +{"Pretrain/Learning Rate": 3.384985457652906e-05, "Pretrain/Loss": 2.0818254947662354, "Pretrain/Loss (Raw)": 2.0590109825134277, "Pretrain/Step": 3846, "Pretrain/Step Time": 8.555157406255603} +{"Pretrain/Learning Rate": 3.384191393270316e-05, "Pretrain/Loss": 2.086064338684082, "Pretrain/Loss (Raw)": 2.295166015625, "Pretrain/Step": 3847, "Pretrain/Step Time": 8.559729669243097} +{"Pretrain/Learning Rate": 3.383397226918607e-05, "Pretrain/Loss": 2.0883967876434326, "Pretrain/Loss (Raw)": 2.292804718017578, "Pretrain/Step": 3848, "Pretrain/Step Time": 8.561576001346111} +{"Pretrain/Learning Rate": 3.382602958689369e-05, "Pretrain/Loss": 2.087775230407715, "Pretrain/Loss (Raw)": 2.1588587760925293, "Pretrain/Step": 3849, "Pretrain/Step Time": 8.562663732096553} +{"Pretrain/Learning Rate": 3.381808588674197e-05, "Pretrain/Loss": 2.085846185684204, "Pretrain/Loss (Raw)": 1.8282119035720825, "Pretrain/Step": 3850, "Pretrain/Step Time": 8.559917600825429} +{"Pretrain/Learning Rate": 3.381014116964705e-05, "Pretrain/Loss": 2.085467576980591, "Pretrain/Loss (Raw)": 1.9744805097579956, "Pretrain/Step": 3851, "Pretrain/Step Time": 8.565326023846865} +{"Pretrain/Learning Rate": 3.380219543652512e-05, "Pretrain/Loss": 2.0828216075897217, "Pretrain/Loss (Raw)": 1.8680795431137085, "Pretrain/Step": 3852, "Pretrain/Step Time": 8.565367994830012} +{"Pretrain/Learning Rate": 3.379424868829254e-05, "Pretrain/Loss": 2.0810132026672363, "Pretrain/Loss (Raw)": 2.2818825244903564, "Pretrain/Step": 3853, "Pretrain/Step Time": 8.564543889835477} +{"Pretrain/Learning Rate": 3.378630092586576e-05, "Pretrain/Loss": 2.080434560775757, "Pretrain/Loss (Raw)": 2.0575170516967773, "Pretrain/Step": 3854, "Pretrain/Step Time": 8.565777622163296} +{"Pretrain/Learning Rate": 3.377835215016136e-05, "Pretrain/Loss": 2.0803823471069336, "Pretrain/Loss (Raw)": 2.031195640563965, "Pretrain/Step": 3855, "Pretrain/Step Time": 8.561368502676487} +{"Pretrain/Learning Rate": 3.3770402362096024e-05, "Pretrain/Loss": 2.0805511474609375, "Pretrain/Loss (Raw)": 2.1789543628692627, "Pretrain/Step": 3856, "Pretrain/Step Time": 8.561380041763186} +{"Pretrain/Learning Rate": 3.3762451562586565e-05, "Pretrain/Loss": 2.0801944732666016, "Pretrain/Loss (Raw)": 2.1843433380126953, "Pretrain/Step": 3857, "Pretrain/Step Time": 8.559876089915633} +{"Pretrain/Learning Rate": 3.3754499752549885e-05, "Pretrain/Loss": 2.081587314605713, "Pretrain/Loss (Raw)": 2.1949291229248047, "Pretrain/Step": 3858, "Pretrain/Step Time": 8.56415320187807} +{"Pretrain/Learning Rate": 3.374654693290306e-05, "Pretrain/Loss": 2.08127498626709, "Pretrain/Loss (Raw)": 1.9727189540863037, "Pretrain/Step": 3859, "Pretrain/Step Time": 8.565068680793047} +{"Pretrain/Learning Rate": 3.373859310456321e-05, "Pretrain/Loss": 2.083019256591797, "Pretrain/Loss (Raw)": 2.1211087703704834, "Pretrain/Step": 3860, "Pretrain/Step Time": 8.564530353993177} +{"Pretrain/Learning Rate": 3.373063826844764e-05, "Pretrain/Loss": 2.083085060119629, "Pretrain/Loss (Raw)": 2.0856401920318604, "Pretrain/Step": 3861, "Pretrain/Step Time": 8.563079597428441} +{"Pretrain/Learning Rate": 3.3722682425473715e-05, "Pretrain/Loss": 2.0828590393066406, "Pretrain/Loss (Raw)": 1.9768297672271729, "Pretrain/Step": 3862, "Pretrain/Step Time": 8.559725182130933} +{"Pretrain/Learning Rate": 3.371472557655896e-05, "Pretrain/Loss": 2.0827465057373047, "Pretrain/Loss (Raw)": 2.0784265995025635, "Pretrain/Step": 3863, "Pretrain/Step Time": 8.562494011595845} +{"Pretrain/Learning Rate": 3.370676772262098e-05, "Pretrain/Loss": 2.082447052001953, "Pretrain/Loss (Raw)": 2.107164144515991, "Pretrain/Step": 3864, "Pretrain/Step Time": 8.565632769837976} +{"Pretrain/Learning Rate": 3.369880886457751e-05, "Pretrain/Loss": 2.0829546451568604, "Pretrain/Loss (Raw)": 2.109076738357544, "Pretrain/Step": 3865, "Pretrain/Step Time": 8.563897108659148} +{"Pretrain/Learning Rate": 3.369084900334643e-05, "Pretrain/Loss": 2.0818734169006348, "Pretrain/Loss (Raw)": 2.125838041305542, "Pretrain/Step": 3866, "Pretrain/Step Time": 8.567070756107569} +{"Pretrain/Learning Rate": 3.368288813984568e-05, "Pretrain/Loss": 2.0825071334838867, "Pretrain/Loss (Raw)": 2.0895485877990723, "Pretrain/Step": 3867, "Pretrain/Step Time": 8.562236443161964} +{"Pretrain/Learning Rate": 3.3674926274993356e-05, "Pretrain/Loss": 2.0819571018218994, "Pretrain/Loss (Raw)": 2.0849838256835938, "Pretrain/Step": 3868, "Pretrain/Step Time": 8.567284811288118} +{"Pretrain/Learning Rate": 3.3666963409707655e-05, "Pretrain/Loss": 2.0777502059936523, "Pretrain/Loss (Raw)": 1.7503679990768433, "Pretrain/Step": 3869, "Pretrain/Step Time": 8.565480066463351} +{"Pretrain/Learning Rate": 3.36589995449069e-05, "Pretrain/Loss": 2.075286388397217, "Pretrain/Loss (Raw)": 2.0601766109466553, "Pretrain/Step": 3870, "Pretrain/Step Time": 8.568055260926485} +{"Pretrain/Learning Rate": 3.36510346815095e-05, "Pretrain/Loss": 2.077967643737793, "Pretrain/Loss (Raw)": 2.1282410621643066, "Pretrain/Step": 3871, "Pretrain/Step Time": 8.56573342345655} +{"Pretrain/Learning Rate": 3.3643068820434035e-05, "Pretrain/Loss": 2.076486110687256, "Pretrain/Loss (Raw)": 2.0577285289764404, "Pretrain/Step": 3872, "Pretrain/Step Time": 8.56492999382317} +{"Pretrain/Learning Rate": 3.363510196259913e-05, "Pretrain/Loss": 2.0774288177490234, "Pretrain/Loss (Raw)": 2.124671697616577, "Pretrain/Step": 3873, "Pretrain/Step Time": 8.56140099465847} +{"Pretrain/Learning Rate": 3.362713410892359e-05, "Pretrain/Loss": 2.0766797065734863, "Pretrain/Loss (Raw)": 1.961235523223877, "Pretrain/Step": 3874, "Pretrain/Step Time": 8.562423627823591} +{"Pretrain/Learning Rate": 3.361916526032628e-05, "Pretrain/Loss": 2.077064037322998, "Pretrain/Loss (Raw)": 2.116637945175171, "Pretrain/Step": 3875, "Pretrain/Step Time": 8.56176389567554} +{"Pretrain/Learning Rate": 3.361119541772622e-05, "Pretrain/Loss": 2.077930450439453, "Pretrain/Loss (Raw)": 2.071258068084717, "Pretrain/Step": 3876, "Pretrain/Step Time": 8.561362555250525} +{"Pretrain/Learning Rate": 3.360322458204253e-05, "Pretrain/Loss": 2.0773558616638184, "Pretrain/Loss (Raw)": 1.9927548170089722, "Pretrain/Step": 3877, "Pretrain/Step Time": 8.561474492773414} +{"Pretrain/Learning Rate": 3.3595252754194445e-05, "Pretrain/Loss": 2.07869291305542, "Pretrain/Loss (Raw)": 2.1807968616485596, "Pretrain/Step": 3878, "Pretrain/Step Time": 8.56534082815051} +{"Pretrain/Learning Rate": 3.3587279935101306e-05, "Pretrain/Loss": 2.078415870666504, "Pretrain/Loss (Raw)": 2.1348559856414795, "Pretrain/Step": 3879, "Pretrain/Step Time": 8.5589743796736} +{"Pretrain/Learning Rate": 3.357930612568258e-05, "Pretrain/Loss": 2.0739223957061768, "Pretrain/Loss (Raw)": 1.9086247682571411, "Pretrain/Step": 3880, "Pretrain/Step Time": 8.554971912875772} +{"Pretrain/Learning Rate": 3.3571331326857844e-05, "Pretrain/Loss": 2.07352352142334, "Pretrain/Loss (Raw)": 2.044557809829712, "Pretrain/Step": 3881, "Pretrain/Step Time": 8.557843934744596} +{"Pretrain/Learning Rate": 3.3563355539546795e-05, "Pretrain/Loss": 2.074202537536621, "Pretrain/Loss (Raw)": 2.015043258666992, "Pretrain/Step": 3882, "Pretrain/Step Time": 8.554861258715391} +{"Pretrain/Learning Rate": 3.355537876466923e-05, "Pretrain/Loss": 2.075509548187256, "Pretrain/Loss (Raw)": 2.1477506160736084, "Pretrain/Step": 3883, "Pretrain/Step Time": 8.559270206838846} +{"Pretrain/Learning Rate": 3.354740100314506e-05, "Pretrain/Loss": 2.0764729976654053, "Pretrain/Loss (Raw)": 2.144935369491577, "Pretrain/Step": 3884, "Pretrain/Step Time": 8.558909332379699} +{"Pretrain/Learning Rate": 3.3539422255894345e-05, "Pretrain/Loss": 2.075160264968872, "Pretrain/Loss (Raw)": 1.9191323518753052, "Pretrain/Step": 3885, "Pretrain/Step Time": 8.55245996452868} +{"Pretrain/Learning Rate": 3.353144252383721e-05, "Pretrain/Loss": 2.0745415687561035, "Pretrain/Loss (Raw)": 2.1014420986175537, "Pretrain/Step": 3886, "Pretrain/Step Time": 8.550228206440806} +{"Pretrain/Learning Rate": 3.3523461807893925e-05, "Pretrain/Loss": 2.074777364730835, "Pretrain/Loss (Raw)": 1.9602726697921753, "Pretrain/Step": 3887, "Pretrain/Step Time": 8.553283091634512} +{"Pretrain/Learning Rate": 3.351548010898486e-05, "Pretrain/Loss": 2.077366828918457, "Pretrain/Loss (Raw)": 2.252418041229248, "Pretrain/Step": 3888, "Pretrain/Step Time": 8.547995986416936} +{"Pretrain/Learning Rate": 3.35074974280305e-05, "Pretrain/Loss": 2.077882766723633, "Pretrain/Loss (Raw)": 2.0566372871398926, "Pretrain/Step": 3889, "Pretrain/Step Time": 8.549599206075072} +{"Pretrain/Learning Rate": 3.349951376595145e-05, "Pretrain/Loss": 2.0787596702575684, "Pretrain/Loss (Raw)": 2.1188082695007324, "Pretrain/Step": 3890, "Pretrain/Step Time": 8.549775110557675} +{"Pretrain/Learning Rate": 3.3491529123668425e-05, "Pretrain/Loss": 2.0780141353607178, "Pretrain/Loss (Raw)": 1.9698760509490967, "Pretrain/Step": 3891, "Pretrain/Step Time": 8.547237202525139} +{"Pretrain/Learning Rate": 3.348354350210224e-05, "Pretrain/Loss": 2.07338285446167, "Pretrain/Loss (Raw)": 1.5207358598709106, "Pretrain/Step": 3892, "Pretrain/Step Time": 8.547051770612597} +{"Pretrain/Learning Rate": 3.347555690217385e-05, "Pretrain/Loss": 2.076173782348633, "Pretrain/Loss (Raw)": 2.2154548168182373, "Pretrain/Step": 3893, "Pretrain/Step Time": 8.549533842131495} +{"Pretrain/Learning Rate": 3.34675693248043e-05, "Pretrain/Loss": 2.075321912765503, "Pretrain/Loss (Raw)": 2.008404493331909, "Pretrain/Step": 3894, "Pretrain/Step Time": 8.54734698869288} +{"Pretrain/Learning Rate": 3.3459580770914744e-05, "Pretrain/Loss": 2.0796456336975098, "Pretrain/Loss (Raw)": 2.379362106323242, "Pretrain/Step": 3895, "Pretrain/Step Time": 8.554395351558924} +{"Pretrain/Learning Rate": 3.3451591241426486e-05, "Pretrain/Loss": 2.077955722808838, "Pretrain/Loss (Raw)": 2.05781626701355, "Pretrain/Step": 3896, "Pretrain/Step Time": 8.550522269681096} +{"Pretrain/Learning Rate": 3.3443600737260885e-05, "Pretrain/Loss": 2.075137138366699, "Pretrain/Loss (Raw)": 1.8726847171783447, "Pretrain/Step": 3897, "Pretrain/Step Time": 8.546754289418459} +{"Pretrain/Learning Rate": 3.343560925933947e-05, "Pretrain/Loss": 2.07545804977417, "Pretrain/Loss (Raw)": 2.2081804275512695, "Pretrain/Step": 3898, "Pretrain/Step Time": 8.547487052157521} +{"Pretrain/Learning Rate": 3.342761680858385e-05, "Pretrain/Loss": 2.0761170387268066, "Pretrain/Loss (Raw)": 2.0331900119781494, "Pretrain/Step": 3899, "Pretrain/Step Time": 8.546764086931944} +{"Pretrain/Learning Rate": 3.3419623385915736e-05, "Pretrain/Loss": 2.0771803855895996, "Pretrain/Loss (Raw)": 2.0674121379852295, "Pretrain/Step": 3900, "Pretrain/Step Time": 8.547945633530617} +{"Pretrain/Learning Rate": 3.3411628992256984e-05, "Pretrain/Loss": 2.0762217044830322, "Pretrain/Loss (Raw)": 2.2045013904571533, "Pretrain/Step": 3901, "Pretrain/Step Time": 8.557643920183182} +{"Pretrain/Learning Rate": 3.340363362852954e-05, "Pretrain/Loss": 2.0763707160949707, "Pretrain/Loss (Raw)": 2.1159486770629883, "Pretrain/Step": 3902, "Pretrain/Step Time": 8.55058335699141} +{"Pretrain/Learning Rate": 3.339563729565547e-05, "Pretrain/Loss": 2.0762088298797607, "Pretrain/Loss (Raw)": 2.1314079761505127, "Pretrain/Step": 3903, "Pretrain/Step Time": 8.549499908462167} +{"Pretrain/Learning Rate": 3.3387639994556934e-05, "Pretrain/Loss": 2.0735838413238525, "Pretrain/Loss (Raw)": 1.8770856857299805, "Pretrain/Step": 3904, "Pretrain/Step Time": 8.54800820723176} +{"Pretrain/Learning Rate": 3.337964172615624e-05, "Pretrain/Loss": 2.071773052215576, "Pretrain/Loss (Raw)": 1.8408806324005127, "Pretrain/Step": 3905, "Pretrain/Step Time": 8.543931275606155} +{"Pretrain/Learning Rate": 3.337164249137577e-05, "Pretrain/Loss": 2.07055926322937, "Pretrain/Loss (Raw)": 2.052635908126831, "Pretrain/Step": 3906, "Pretrain/Step Time": 8.544565666466951} +{"Pretrain/Learning Rate": 3.3363642291138046e-05, "Pretrain/Loss": 2.0691452026367188, "Pretrain/Loss (Raw)": 2.0155491828918457, "Pretrain/Step": 3907, "Pretrain/Step Time": 8.543024834245443} +{"Pretrain/Learning Rate": 3.3355641126365676e-05, "Pretrain/Loss": 2.0670366287231445, "Pretrain/Loss (Raw)": 1.9869228601455688, "Pretrain/Step": 3908, "Pretrain/Step Time": 8.542559610679746} +{"Pretrain/Learning Rate": 3.33476389979814e-05, "Pretrain/Loss": 2.0654659271240234, "Pretrain/Loss (Raw)": 1.8726540803909302, "Pretrain/Step": 3909, "Pretrain/Step Time": 8.542517736554146} +{"Pretrain/Learning Rate": 3.3339635906908064e-05, "Pretrain/Loss": 2.065687417984009, "Pretrain/Loss (Raw)": 2.1705057621002197, "Pretrain/Step": 3910, "Pretrain/Step Time": 8.542172087356448} +{"Pretrain/Learning Rate": 3.3331631854068616e-05, "Pretrain/Loss": 2.0675337314605713, "Pretrain/Loss (Raw)": 2.1519722938537598, "Pretrain/Step": 3911, "Pretrain/Step Time": 8.545676335692406} +{"Pretrain/Learning Rate": 3.3323626840386115e-05, "Pretrain/Loss": 2.066046714782715, "Pretrain/Loss (Raw)": 1.882521629333496, "Pretrain/Step": 3912, "Pretrain/Step Time": 8.540767772123218} +{"Pretrain/Learning Rate": 3.3315620866783755e-05, "Pretrain/Loss": 2.0670576095581055, "Pretrain/Loss (Raw)": 2.0617871284484863, "Pretrain/Step": 3913, "Pretrain/Step Time": 8.539627885445952} +{"Pretrain/Learning Rate": 3.33076139341848e-05, "Pretrain/Loss": 2.066225528717041, "Pretrain/Loss (Raw)": 1.9034217596054077, "Pretrain/Step": 3914, "Pretrain/Step Time": 8.542652087286115} +{"Pretrain/Learning Rate": 3.329960604351267e-05, "Pretrain/Loss": 2.068084478378296, "Pretrain/Loss (Raw)": 2.3353826999664307, "Pretrain/Step": 3915, "Pretrain/Step Time": 8.543076889589429} +{"Pretrain/Learning Rate": 3.329159719569085e-05, "Pretrain/Loss": 2.070006847381592, "Pretrain/Loss (Raw)": 2.2467236518859863, "Pretrain/Step": 3916, "Pretrain/Step Time": 8.543646100908518} +{"Pretrain/Learning Rate": 3.328358739164299e-05, "Pretrain/Loss": 2.0687742233276367, "Pretrain/Loss (Raw)": 2.041851043701172, "Pretrain/Step": 3917, "Pretrain/Step Time": 8.542138818651438} +{"Pretrain/Learning Rate": 3.327557663229278e-05, "Pretrain/Loss": 2.070770740509033, "Pretrain/Loss (Raw)": 2.2542495727539062, "Pretrain/Step": 3918, "Pretrain/Step Time": 8.542574746534228} +{"Pretrain/Learning Rate": 3.326756491856409e-05, "Pretrain/Loss": 2.0705103874206543, "Pretrain/Loss (Raw)": 1.9772716760635376, "Pretrain/Step": 3919, "Pretrain/Step Time": 8.539093093946576} +{"Pretrain/Learning Rate": 3.325955225138085e-05, "Pretrain/Loss": 2.0691754817962646, "Pretrain/Loss (Raw)": 1.8824880123138428, "Pretrain/Step": 3920, "Pretrain/Step Time": 8.541736342012882} +{"Pretrain/Learning Rate": 3.3251538631667125e-05, "Pretrain/Loss": 2.070720672607422, "Pretrain/Loss (Raw)": 2.211904764175415, "Pretrain/Step": 3921, "Pretrain/Step Time": 8.543375233188272} +{"Pretrain/Learning Rate": 3.324352406034707e-05, "Pretrain/Loss": 2.070894241333008, "Pretrain/Loss (Raw)": 1.9584819078445435, "Pretrain/Step": 3922, "Pretrain/Step Time": 8.547954335808754} +{"Pretrain/Learning Rate": 3.3235508538344996e-05, "Pretrain/Loss": 2.068286418914795, "Pretrain/Loss (Raw)": 1.940259575843811, "Pretrain/Step": 3923, "Pretrain/Step Time": 8.544578427448869} +{"Pretrain/Learning Rate": 3.322749206658526e-05, "Pretrain/Loss": 2.0656299591064453, "Pretrain/Loss (Raw)": 2.05454683303833, "Pretrain/Step": 3924, "Pretrain/Step Time": 8.541552904993296} +{"Pretrain/Learning Rate": 3.3219474645992366e-05, "Pretrain/Loss": 2.0653910636901855, "Pretrain/Loss (Raw)": 2.069192886352539, "Pretrain/Step": 3925, "Pretrain/Step Time": 8.543685177341104} +{"Pretrain/Learning Rate": 3.3211456277490926e-05, "Pretrain/Loss": 2.0659103393554688, "Pretrain/Loss (Raw)": 2.0497982501983643, "Pretrain/Step": 3926, "Pretrain/Step Time": 8.549835415557027} +{"Pretrain/Learning Rate": 3.3203436962005655e-05, "Pretrain/Loss": 2.067026376724243, "Pretrain/Loss (Raw)": 2.1860098838806152, "Pretrain/Step": 3927, "Pretrain/Step Time": 8.550657045096159} +{"Pretrain/Learning Rate": 3.3195416700461385e-05, "Pretrain/Loss": 2.066080093383789, "Pretrain/Loss (Raw)": 2.0661323070526123, "Pretrain/Step": 3928, "Pretrain/Step Time": 8.550570588558912} +{"Pretrain/Learning Rate": 3.318739549378304e-05, "Pretrain/Loss": 2.0653417110443115, "Pretrain/Loss (Raw)": 2.065342426300049, "Pretrain/Step": 3929, "Pretrain/Step Time": 8.550025360658765} +{"Pretrain/Learning Rate": 3.317937334289566e-05, "Pretrain/Loss": 2.064528465270996, "Pretrain/Loss (Raw)": 1.9342139959335327, "Pretrain/Step": 3930, "Pretrain/Step Time": 8.551816185936332} +{"Pretrain/Learning Rate": 3.317135024872442e-05, "Pretrain/Loss": 2.06180477142334, "Pretrain/Loss (Raw)": 1.8992795944213867, "Pretrain/Step": 3931, "Pretrain/Step Time": 8.55633352138102} +{"Pretrain/Learning Rate": 3.3163326212194546e-05, "Pretrain/Loss": 2.0612711906433105, "Pretrain/Loss (Raw)": 2.153717041015625, "Pretrain/Step": 3932, "Pretrain/Step Time": 8.553106701001525} +{"Pretrain/Learning Rate": 3.315530123423143e-05, "Pretrain/Loss": 2.060502529144287, "Pretrain/Loss (Raw)": 2.0581166744232178, "Pretrain/Step": 3933, "Pretrain/Step Time": 8.549440674483776} +{"Pretrain/Learning Rate": 3.314727531576055e-05, "Pretrain/Loss": 2.061267852783203, "Pretrain/Loss (Raw)": 2.060053825378418, "Pretrain/Step": 3934, "Pretrain/Step Time": 8.552060797810555} +{"Pretrain/Learning Rate": 3.3139248457707495e-05, "Pretrain/Loss": 2.060525894165039, "Pretrain/Loss (Raw)": 1.9787875413894653, "Pretrain/Step": 3935, "Pretrain/Step Time": 8.551391428336501} +{"Pretrain/Learning Rate": 3.313122066099794e-05, "Pretrain/Loss": 2.061023712158203, "Pretrain/Loss (Raw)": 2.0777955055236816, "Pretrain/Step": 3936, "Pretrain/Step Time": 8.548417132347822} +{"Pretrain/Learning Rate": 3.312319192655772e-05, "Pretrain/Loss": 2.0612475872039795, "Pretrain/Loss (Raw)": 2.094588279724121, "Pretrain/Step": 3937, "Pretrain/Step Time": 8.555149095132947} +{"Pretrain/Learning Rate": 3.311516225531271e-05, "Pretrain/Loss": 2.0604019165039062, "Pretrain/Loss (Raw)": 1.92034113407135, "Pretrain/Step": 3938, "Pretrain/Step Time": 8.547100687399507} +{"Pretrain/Learning Rate": 3.3107131648188966e-05, "Pretrain/Loss": 2.062113046646118, "Pretrain/Loss (Raw)": 2.2163124084472656, "Pretrain/Step": 3939, "Pretrain/Step Time": 8.54675137065351} +{"Pretrain/Learning Rate": 3.309910010611259e-05, "Pretrain/Loss": 2.062102794647217, "Pretrain/Loss (Raw)": 2.0641138553619385, "Pretrain/Step": 3940, "Pretrain/Step Time": 8.547799482941628} +{"Pretrain/Learning Rate": 3.3091067630009834e-05, "Pretrain/Loss": 2.061612844467163, "Pretrain/Loss (Raw)": 2.1627495288848877, "Pretrain/Step": 3941, "Pretrain/Step Time": 8.549219649285078} +{"Pretrain/Learning Rate": 3.3083034220807016e-05, "Pretrain/Loss": 2.0598702430725098, "Pretrain/Loss (Raw)": 2.0296525955200195, "Pretrain/Step": 3942, "Pretrain/Step Time": 8.547876708209515} +{"Pretrain/Learning Rate": 3.307499987943062e-05, "Pretrain/Loss": 2.060431718826294, "Pretrain/Loss (Raw)": 2.1683571338653564, "Pretrain/Step": 3943, "Pretrain/Step Time": 8.545251345261931} +{"Pretrain/Learning Rate": 3.3066964606807175e-05, "Pretrain/Loss": 2.059798240661621, "Pretrain/Loss (Raw)": 2.054515838623047, "Pretrain/Step": 3944, "Pretrain/Step Time": 8.54646554403007} +{"Pretrain/Learning Rate": 3.3058928403863364e-05, "Pretrain/Loss": 2.06111741065979, "Pretrain/Loss (Raw)": 2.168268918991089, "Pretrain/Step": 3945, "Pretrain/Step Time": 8.550395209342241} +{"Pretrain/Learning Rate": 3.305089127152596e-05, "Pretrain/Loss": 2.061431884765625, "Pretrain/Loss (Raw)": 2.132688522338867, "Pretrain/Step": 3946, "Pretrain/Step Time": 8.55449570901692} +{"Pretrain/Learning Rate": 3.304285321072183e-05, "Pretrain/Loss": 2.0594756603240967, "Pretrain/Loss (Raw)": 1.8351194858551025, "Pretrain/Step": 3947, "Pretrain/Step Time": 8.557491967454553} +{"Pretrain/Learning Rate": 3.303481422237797e-05, "Pretrain/Loss": 2.056300640106201, "Pretrain/Loss (Raw)": 1.8042060136795044, "Pretrain/Step": 3948, "Pretrain/Step Time": 8.552542835474014} +{"Pretrain/Learning Rate": 3.3026774307421476e-05, "Pretrain/Loss": 2.0539937019348145, "Pretrain/Loss (Raw)": 1.9977891445159912, "Pretrain/Step": 3949, "Pretrain/Step Time": 8.555777641013265} +{"Pretrain/Learning Rate": 3.301873346677954e-05, "Pretrain/Loss": 2.054882526397705, "Pretrain/Loss (Raw)": 2.1494204998016357, "Pretrain/Step": 3950, "Pretrain/Step Time": 8.5572219658643} +{"Pretrain/Learning Rate": 3.301069170137948e-05, "Pretrain/Loss": 2.054683208465576, "Pretrain/Loss (Raw)": 2.103888988494873, "Pretrain/Step": 3951, "Pretrain/Step Time": 8.5566445607692} +{"Pretrain/Learning Rate": 3.3002649012148704e-05, "Pretrain/Loss": 2.052661418914795, "Pretrain/Loss (Raw)": 1.9613653421401978, "Pretrain/Step": 3952, "Pretrain/Step Time": 8.55269487760961} +{"Pretrain/Learning Rate": 3.2994605400014736e-05, "Pretrain/Loss": 2.053755283355713, "Pretrain/Loss (Raw)": 2.0740880966186523, "Pretrain/Step": 3953, "Pretrain/Step Time": 8.55356420762837} +{"Pretrain/Learning Rate": 3.29865608659052e-05, "Pretrain/Loss": 2.0531415939331055, "Pretrain/Loss (Raw)": 2.0256524085998535, "Pretrain/Step": 3954, "Pretrain/Step Time": 8.552875027060509} +{"Pretrain/Learning Rate": 3.297851541074782e-05, "Pretrain/Loss": 2.052633762359619, "Pretrain/Loss (Raw)": 2.043321132659912, "Pretrain/Step": 3955, "Pretrain/Step Time": 8.54519428126514} +{"Pretrain/Learning Rate": 3.297046903547046e-05, "Pretrain/Loss": 2.0528082847595215, "Pretrain/Loss (Raw)": 2.071885824203491, "Pretrain/Step": 3956, "Pretrain/Step Time": 8.54970046132803} +{"Pretrain/Learning Rate": 3.296242174100105e-05, "Pretrain/Loss": 2.055729389190674, "Pretrain/Loss (Raw)": 2.2456893920898438, "Pretrain/Step": 3957, "Pretrain/Step Time": 8.550198931246996} +{"Pretrain/Learning Rate": 3.2954373528267646e-05, "Pretrain/Loss": 2.0533528327941895, "Pretrain/Loss (Raw)": 1.6350029706954956, "Pretrain/Step": 3958, "Pretrain/Step Time": 8.545844053849578} +{"Pretrain/Learning Rate": 3.29463243981984e-05, "Pretrain/Loss": 2.0540201663970947, "Pretrain/Loss (Raw)": 2.081885576248169, "Pretrain/Step": 3959, "Pretrain/Step Time": 8.545439975336194} +{"Pretrain/Learning Rate": 3.2938274351721587e-05, "Pretrain/Loss": 2.0547075271606445, "Pretrain/Loss (Raw)": 2.143317222595215, "Pretrain/Step": 3960, "Pretrain/Step Time": 8.542239570990205} +{"Pretrain/Learning Rate": 3.2930223389765566e-05, "Pretrain/Loss": 2.054901123046875, "Pretrain/Loss (Raw)": 1.996344804763794, "Pretrain/Step": 3961, "Pretrain/Step Time": 8.5543452501297} +{"Pretrain/Learning Rate": 3.292217151325882e-05, "Pretrain/Loss": 2.0574440956115723, "Pretrain/Loss (Raw)": 2.07621169090271, "Pretrain/Step": 3962, "Pretrain/Step Time": 8.547168709337711} +{"Pretrain/Learning Rate": 3.2914118723129916e-05, "Pretrain/Loss": 2.058685064315796, "Pretrain/Loss (Raw)": 2.125702142715454, "Pretrain/Step": 3963, "Pretrain/Step Time": 8.547834826633334} +{"Pretrain/Learning Rate": 3.2906065020307545e-05, "Pretrain/Loss": 2.0605227947235107, "Pretrain/Loss (Raw)": 2.1729214191436768, "Pretrain/Step": 3964, "Pretrain/Step Time": 8.541239276528358} +{"Pretrain/Learning Rate": 3.289801040572051e-05, "Pretrain/Loss": 2.06160306930542, "Pretrain/Loss (Raw)": 2.1114838123321533, "Pretrain/Step": 3965, "Pretrain/Step Time": 8.542351942509413} +{"Pretrain/Learning Rate": 3.288995488029769e-05, "Pretrain/Loss": 2.0616044998168945, "Pretrain/Loss (Raw)": 2.051941394805908, "Pretrain/Step": 3966, "Pretrain/Step Time": 8.540785705670714} +{"Pretrain/Learning Rate": 3.288189844496811e-05, "Pretrain/Loss": 2.06026554107666, "Pretrain/Loss (Raw)": 2.0110340118408203, "Pretrain/Step": 3967, "Pretrain/Step Time": 8.54832155816257} +{"Pretrain/Learning Rate": 3.287384110066084e-05, "Pretrain/Loss": 2.0611419677734375, "Pretrain/Loss (Raw)": 2.187338352203369, "Pretrain/Step": 3968, "Pretrain/Step Time": 8.536211321130395} +{"Pretrain/Learning Rate": 3.286578284830513e-05, "Pretrain/Loss": 2.0594005584716797, "Pretrain/Loss (Raw)": 1.9548735618591309, "Pretrain/Step": 3969, "Pretrain/Step Time": 8.539176605641842} +{"Pretrain/Learning Rate": 3.2857723688830264e-05, "Pretrain/Loss": 2.05940580368042, "Pretrain/Loss (Raw)": 2.1628174781799316, "Pretrain/Step": 3970, "Pretrain/Step Time": 8.538246724754572} +{"Pretrain/Learning Rate": 3.284966362316568e-05, "Pretrain/Loss": 2.0598061084747314, "Pretrain/Loss (Raw)": 1.9721797704696655, "Pretrain/Step": 3971, "Pretrain/Step Time": 8.537232372909784} +{"Pretrain/Learning Rate": 3.28416026522409e-05, "Pretrain/Loss": 2.0611162185668945, "Pretrain/Loss (Raw)": 2.1891512870788574, "Pretrain/Step": 3972, "Pretrain/Step Time": 8.53708759509027} +{"Pretrain/Learning Rate": 3.283354077698555e-05, "Pretrain/Loss": 2.058969497680664, "Pretrain/Loss (Raw)": 1.8442384004592896, "Pretrain/Step": 3973, "Pretrain/Step Time": 8.535666408017278} +{"Pretrain/Learning Rate": 3.2825477998329366e-05, "Pretrain/Loss": 2.058825969696045, "Pretrain/Loss (Raw)": 2.0406618118286133, "Pretrain/Step": 3974, "Pretrain/Step Time": 8.546645937487483} +{"Pretrain/Learning Rate": 3.281741431720219e-05, "Pretrain/Loss": 2.060426712036133, "Pretrain/Loss (Raw)": 2.5000498294830322, "Pretrain/Step": 3975, "Pretrain/Step Time": 8.533509396016598} +{"Pretrain/Learning Rate": 3.280934973453395e-05, "Pretrain/Loss": 2.0588855743408203, "Pretrain/Loss (Raw)": 2.0955307483673096, "Pretrain/Step": 3976, "Pretrain/Step Time": 8.532517367973924} +{"Pretrain/Learning Rate": 3.28012842512547e-05, "Pretrain/Loss": 2.057969093322754, "Pretrain/Loss (Raw)": 2.041565179824829, "Pretrain/Step": 3977, "Pretrain/Step Time": 8.53959135338664} +{"Pretrain/Learning Rate": 3.279321786829459e-05, "Pretrain/Loss": 2.058635711669922, "Pretrain/Loss (Raw)": 1.9135384559631348, "Pretrain/Step": 3978, "Pretrain/Step Time": 8.537561558187008} +{"Pretrain/Learning Rate": 3.278515058658387e-05, "Pretrain/Loss": 2.0623297691345215, "Pretrain/Loss (Raw)": 2.447317361831665, "Pretrain/Step": 3979, "Pretrain/Step Time": 8.537304263561964} +{"Pretrain/Learning Rate": 3.27770824070529e-05, "Pretrain/Loss": 2.065739870071411, "Pretrain/Loss (Raw)": 2.3045859336853027, "Pretrain/Step": 3980, "Pretrain/Step Time": 8.54401677660644} +{"Pretrain/Learning Rate": 3.276901333063215e-05, "Pretrain/Loss": 2.0662307739257812, "Pretrain/Loss (Raw)": 2.344700336456299, "Pretrain/Step": 3981, "Pretrain/Step Time": 8.539643302559853} +{"Pretrain/Learning Rate": 3.276094335825217e-05, "Pretrain/Loss": 2.064976215362549, "Pretrain/Loss (Raw)": 1.896953821182251, "Pretrain/Step": 3982, "Pretrain/Step Time": 8.53988685272634} +{"Pretrain/Learning Rate": 3.2752872490843626e-05, "Pretrain/Loss": 2.0654897689819336, "Pretrain/Loss (Raw)": 2.0969078540802, "Pretrain/Step": 3983, "Pretrain/Step Time": 8.541125601157546} +{"Pretrain/Learning Rate": 3.274480072933729e-05, "Pretrain/Loss": 2.067227840423584, "Pretrain/Loss (Raw)": 2.401437282562256, "Pretrain/Step": 3984, "Pretrain/Step Time": 8.537119310349226} +{"Pretrain/Learning Rate": 3.273672807466405e-05, "Pretrain/Loss": 2.0666608810424805, "Pretrain/Loss (Raw)": 2.111759662628174, "Pretrain/Step": 3985, "Pretrain/Step Time": 8.540577951818705} +{"Pretrain/Learning Rate": 3.272865452775487e-05, "Pretrain/Loss": 2.0650217533111572, "Pretrain/Loss (Raw)": 1.9851356744766235, "Pretrain/Step": 3986, "Pretrain/Step Time": 8.538945263251662} +{"Pretrain/Learning Rate": 3.272058008954083e-05, "Pretrain/Loss": 2.0660037994384766, "Pretrain/Loss (Raw)": 2.0984113216400146, "Pretrain/Step": 3987, "Pretrain/Step Time": 8.53306969255209} +{"Pretrain/Learning Rate": 3.271250476095311e-05, "Pretrain/Loss": 2.0655460357666016, "Pretrain/Loss (Raw)": 2.0624892711639404, "Pretrain/Step": 3988, "Pretrain/Step Time": 8.535935746505857} +{"Pretrain/Learning Rate": 3.2704428542923e-05, "Pretrain/Loss": 2.0687808990478516, "Pretrain/Loss (Raw)": 2.4997332096099854, "Pretrain/Step": 3989, "Pretrain/Step Time": 8.530782097950578} +{"Pretrain/Learning Rate": 3.269635143638188e-05, "Pretrain/Loss": 2.069319725036621, "Pretrain/Loss (Raw)": 2.0458028316497803, "Pretrain/Step": 3990, "Pretrain/Step Time": 8.533189246430993} +{"Pretrain/Learning Rate": 3.2688273442261255e-05, "Pretrain/Loss": 2.067678928375244, "Pretrain/Loss (Raw)": 1.8684247732162476, "Pretrain/Step": 3991, "Pretrain/Step Time": 8.529184060171247} +{"Pretrain/Learning Rate": 3.26801945614927e-05, "Pretrain/Loss": 2.0672826766967773, "Pretrain/Loss (Raw)": 2.0564088821411133, "Pretrain/Step": 3992, "Pretrain/Step Time": 8.532794043421745} +{"Pretrain/Learning Rate": 3.2672114795007926e-05, "Pretrain/Loss": 2.0665225982666016, "Pretrain/Loss (Raw)": 2.01177716255188, "Pretrain/Step": 3993, "Pretrain/Step Time": 8.52860190719366} +{"Pretrain/Learning Rate": 3.266403414373872e-05, "Pretrain/Loss": 2.0680806636810303, "Pretrain/Loss (Raw)": 2.3252644538879395, "Pretrain/Step": 3994, "Pretrain/Step Time": 8.526289463043213} +{"Pretrain/Learning Rate": 3.265595260861698e-05, "Pretrain/Loss": 2.0676093101501465, "Pretrain/Loss (Raw)": 2.0292418003082275, "Pretrain/Step": 3995, "Pretrain/Step Time": 8.529532216489315} +{"Pretrain/Learning Rate": 3.264787019057471e-05, "Pretrain/Loss": 2.0682780742645264, "Pretrain/Loss (Raw)": 2.1705799102783203, "Pretrain/Step": 3996, "Pretrain/Step Time": 8.526451079174876} +{"Pretrain/Learning Rate": 3.2639786890544014e-05, "Pretrain/Loss": 2.07114577293396, "Pretrain/Loss (Raw)": 2.1174206733703613, "Pretrain/Step": 3997, "Pretrain/Step Time": 8.5273760240525} +{"Pretrain/Learning Rate": 3.263170270945709e-05, "Pretrain/Loss": 2.0723774433135986, "Pretrain/Loss (Raw)": 2.2178432941436768, "Pretrain/Step": 3998, "Pretrain/Step Time": 8.52883342653513} +{"Pretrain/Learning Rate": 3.262361764824625e-05, "Pretrain/Loss": 2.07234263420105, "Pretrain/Loss (Raw)": 2.1237905025482178, "Pretrain/Step": 3999, "Pretrain/Step Time": 8.527041474357247} +{"Pretrain/Learning Rate": 3.26155317078439e-05, "Pretrain/Loss": 2.0705177783966064, "Pretrain/Loss (Raw)": 1.8241299390792847, "Pretrain/Step": 4000, "Pretrain/Step Time": 8.524866752326488} +{"Pretrain/Learning Rate": 3.260744488918254e-05, "Pretrain/Loss": 2.0701589584350586, "Pretrain/Loss (Raw)": 2.0787343978881836, "Pretrain/Step": 4001, "Pretrain/Step Time": 8.530394906178117} +{"Pretrain/Learning Rate": 3.25993571931948e-05, "Pretrain/Loss": 2.0707831382751465, "Pretrain/Loss (Raw)": 2.0411558151245117, "Pretrain/Step": 4002, "Pretrain/Step Time": 8.528355333954096} +{"Pretrain/Learning Rate": 3.259126862081337e-05, "Pretrain/Loss": 2.0701465606689453, "Pretrain/Loss (Raw)": 2.035162925720215, "Pretrain/Step": 4003, "Pretrain/Step Time": 8.526012184098363} +{"Pretrain/Learning Rate": 3.258317917297108e-05, "Pretrain/Loss": 2.0703585147857666, "Pretrain/Loss (Raw)": 2.0983684062957764, "Pretrain/Step": 4004, "Pretrain/Step Time": 8.533721357584} +{"Pretrain/Learning Rate": 3.2575088850600826e-05, "Pretrain/Loss": 2.07185697555542, "Pretrain/Loss (Raw)": 2.1845602989196777, "Pretrain/Step": 4005, "Pretrain/Step Time": 8.53110016696155} +{"Pretrain/Learning Rate": 3.2566997654635634e-05, "Pretrain/Loss": 2.07170033454895, "Pretrain/Loss (Raw)": 2.1607589721679688, "Pretrain/Step": 4006, "Pretrain/Step Time": 8.532989041879773} +{"Pretrain/Learning Rate": 3.2558905586008616e-05, "Pretrain/Loss": 2.0698964595794678, "Pretrain/Loss (Raw)": 1.9039568901062012, "Pretrain/Step": 4007, "Pretrain/Step Time": 8.531907677650452} +{"Pretrain/Learning Rate": 3.2550812645652985e-05, "Pretrain/Loss": 2.0718483924865723, "Pretrain/Loss (Raw)": 2.1584420204162598, "Pretrain/Step": 4008, "Pretrain/Step Time": 8.539309343323112} +{"Pretrain/Learning Rate": 3.2542718834502056e-05, "Pretrain/Loss": 2.0719962120056152, "Pretrain/Loss (Raw)": 2.063481330871582, "Pretrain/Step": 4009, "Pretrain/Step Time": 8.53688932955265} +{"Pretrain/Learning Rate": 3.253462415348926e-05, "Pretrain/Loss": 2.070359945297241, "Pretrain/Loss (Raw)": 1.805611491203308, "Pretrain/Step": 4010, "Pretrain/Step Time": 8.547179969027638} +{"Pretrain/Learning Rate": 3.252652860354809e-05, "Pretrain/Loss": 2.0699002742767334, "Pretrain/Loss (Raw)": 2.0889320373535156, "Pretrain/Step": 4011, "Pretrain/Step Time": 8.54059862345457} +{"Pretrain/Learning Rate": 3.2518432185612184e-05, "Pretrain/Loss": 2.0710368156433105, "Pretrain/Loss (Raw)": 2.2904093265533447, "Pretrain/Step": 4012, "Pretrain/Step Time": 8.545722711831331} +{"Pretrain/Learning Rate": 3.2510334900615254e-05, "Pretrain/Loss": 2.069817543029785, "Pretrain/Loss (Raw)": 1.7630345821380615, "Pretrain/Step": 4013, "Pretrain/Step Time": 8.545181790366769} +{"Pretrain/Learning Rate": 3.25022367494911e-05, "Pretrain/Loss": 2.070101261138916, "Pretrain/Loss (Raw)": 2.137765407562256, "Pretrain/Step": 4014, "Pretrain/Step Time": 8.545447658747435} +{"Pretrain/Learning Rate": 3.2494137733173666e-05, "Pretrain/Loss": 2.0704054832458496, "Pretrain/Loss (Raw)": 1.9992400407791138, "Pretrain/Step": 4015, "Pretrain/Step Time": 8.544230481609702} +{"Pretrain/Learning Rate": 3.2486037852596946e-05, "Pretrain/Loss": 2.0693697929382324, "Pretrain/Loss (Raw)": 2.119826316833496, "Pretrain/Step": 4016, "Pretrain/Step Time": 8.553664397448301} +{"Pretrain/Learning Rate": 3.247793710869507e-05, "Pretrain/Loss": 2.069552421569824, "Pretrain/Loss (Raw)": 2.080019474029541, "Pretrain/Step": 4017, "Pretrain/Step Time": 8.550364522263408} +{"Pretrain/Learning Rate": 3.2469835502402246e-05, "Pretrain/Loss": 2.067960262298584, "Pretrain/Loss (Raw)": 1.9150198698043823, "Pretrain/Step": 4018, "Pretrain/Step Time": 8.552586572244763} +{"Pretrain/Learning Rate": 3.2461733034652794e-05, "Pretrain/Loss": 2.069272041320801, "Pretrain/Loss (Raw)": 2.137786865234375, "Pretrain/Step": 4019, "Pretrain/Step Time": 8.55296828970313} +{"Pretrain/Learning Rate": 3.245362970638113e-05, "Pretrain/Loss": 2.075099468231201, "Pretrain/Loss (Raw)": 2.266653060913086, "Pretrain/Step": 4020, "Pretrain/Step Time": 8.555589409545064} +{"Pretrain/Learning Rate": 3.244552551852176e-05, "Pretrain/Loss": 2.0742204189300537, "Pretrain/Loss (Raw)": 2.1029067039489746, "Pretrain/Step": 4021, "Pretrain/Step Time": 8.553447594866157} +{"Pretrain/Learning Rate": 3.24374204720093e-05, "Pretrain/Loss": 2.074049234390259, "Pretrain/Loss (Raw)": 1.9865093231201172, "Pretrain/Step": 4022, "Pretrain/Step Time": 8.55625480785966} +{"Pretrain/Learning Rate": 3.242931456777848e-05, "Pretrain/Loss": 2.075342893600464, "Pretrain/Loss (Raw)": 2.5449612140655518, "Pretrain/Step": 4023, "Pretrain/Step Time": 8.544617606326938} +{"Pretrain/Learning Rate": 3.242120780676408e-05, "Pretrain/Loss": 2.0748558044433594, "Pretrain/Loss (Raw)": 1.995447039604187, "Pretrain/Step": 4024, "Pretrain/Step Time": 8.550995497033} +{"Pretrain/Learning Rate": 3.2413100189901036e-05, "Pretrain/Loss": 2.07759165763855, "Pretrain/Loss (Raw)": 2.22287917137146, "Pretrain/Step": 4025, "Pretrain/Step Time": 8.553561361506581} +{"Pretrain/Learning Rate": 3.2404991718124346e-05, "Pretrain/Loss": 2.074918508529663, "Pretrain/Loss (Raw)": 1.8660304546356201, "Pretrain/Step": 4026, "Pretrain/Step Time": 8.554009553045034} +{"Pretrain/Learning Rate": 3.239688239236911e-05, "Pretrain/Loss": 2.075568199157715, "Pretrain/Loss (Raw)": 2.1163623332977295, "Pretrain/Step": 4027, "Pretrain/Step Time": 8.557372944429517} +{"Pretrain/Learning Rate": 3.238877221357054e-05, "Pretrain/Loss": 2.074648380279541, "Pretrain/Loss (Raw)": 1.9496595859527588, "Pretrain/Step": 4028, "Pretrain/Step Time": 8.564200541004539} +{"Pretrain/Learning Rate": 3.2380661182663956e-05, "Pretrain/Loss": 2.0756518840789795, "Pretrain/Loss (Raw)": 2.332930564880371, "Pretrain/Step": 4029, "Pretrain/Step Time": 8.550222005695105} +{"Pretrain/Learning Rate": 3.237254930058474e-05, "Pretrain/Loss": 2.0750842094421387, "Pretrain/Loss (Raw)": 2.0432863235473633, "Pretrain/Step": 4030, "Pretrain/Step Time": 8.548885125666857} +{"Pretrain/Learning Rate": 3.236443656826839e-05, "Pretrain/Loss": 2.0755279064178467, "Pretrain/Loss (Raw)": 2.188239574432373, "Pretrain/Step": 4031, "Pretrain/Step Time": 8.542475113645196} +{"Pretrain/Learning Rate": 3.235632298665052e-05, "Pretrain/Loss": 2.076249599456787, "Pretrain/Loss (Raw)": 1.9694544076919556, "Pretrain/Step": 4032, "Pretrain/Step Time": 8.549202525988221} +{"Pretrain/Learning Rate": 3.234820855666681e-05, "Pretrain/Loss": 2.076992988586426, "Pretrain/Loss (Raw)": 1.936020016670227, "Pretrain/Step": 4033, "Pretrain/Step Time": 8.55149139650166} +{"Pretrain/Learning Rate": 3.234009327925308e-05, "Pretrain/Loss": 2.0759079456329346, "Pretrain/Loss (Raw)": 1.9137457609176636, "Pretrain/Step": 4034, "Pretrain/Step Time": 8.554527534171939} +{"Pretrain/Learning Rate": 3.23319771553452e-05, "Pretrain/Loss": 2.076479434967041, "Pretrain/Loss (Raw)": 2.088705539703369, "Pretrain/Step": 4035, "Pretrain/Step Time": 8.550263419747353} +{"Pretrain/Learning Rate": 3.232386018587916e-05, "Pretrain/Loss": 2.0764591693878174, "Pretrain/Loss (Raw)": 1.9843330383300781, "Pretrain/Step": 4036, "Pretrain/Step Time": 8.557507360354066} +{"Pretrain/Learning Rate": 3.2315742371791046e-05, "Pretrain/Loss": 2.078000068664551, "Pretrain/Loss (Raw)": 2.069854974746704, "Pretrain/Step": 4037, "Pretrain/Step Time": 8.551235953345895} +{"Pretrain/Learning Rate": 3.230762371401705e-05, "Pretrain/Loss": 2.079069137573242, "Pretrain/Loss (Raw)": 2.3073925971984863, "Pretrain/Step": 4038, "Pretrain/Step Time": 8.549894999712706} +{"Pretrain/Learning Rate": 3.2299504213493464e-05, "Pretrain/Loss": 2.079204797744751, "Pretrain/Loss (Raw)": 2.169332504272461, "Pretrain/Step": 4039, "Pretrain/Step Time": 8.550133876502514} +{"Pretrain/Learning Rate": 3.229138387115665e-05, "Pretrain/Loss": 2.0807642936706543, "Pretrain/Loss (Raw)": 2.0821192264556885, "Pretrain/Step": 4040, "Pretrain/Step Time": 8.556133925914764} +{"Pretrain/Learning Rate": 3.228326268794309e-05, "Pretrain/Loss": 2.081045627593994, "Pretrain/Loss (Raw)": 2.097788095474243, "Pretrain/Step": 4041, "Pretrain/Step Time": 8.557340921834111} +{"Pretrain/Learning Rate": 3.227514066478936e-05, "Pretrain/Loss": 2.082486391067505, "Pretrain/Loss (Raw)": 2.0878677368164062, "Pretrain/Step": 4042, "Pretrain/Step Time": 8.551337134093046} +{"Pretrain/Learning Rate": 3.226701780263212e-05, "Pretrain/Loss": 2.0832443237304688, "Pretrain/Loss (Raw)": 2.4323933124542236, "Pretrain/Step": 4043, "Pretrain/Step Time": 8.549339612945914} +{"Pretrain/Learning Rate": 3.225889410240815e-05, "Pretrain/Loss": 2.0826292037963867, "Pretrain/Loss (Raw)": 2.167954444885254, "Pretrain/Step": 4044, "Pretrain/Step Time": 8.550091231241822} +{"Pretrain/Learning Rate": 3.2250769565054305e-05, "Pretrain/Loss": 2.0821075439453125, "Pretrain/Loss (Raw)": 1.9750988483428955, "Pretrain/Step": 4045, "Pretrain/Step Time": 8.547415936365724} +{"Pretrain/Learning Rate": 3.2242644191507545e-05, "Pretrain/Loss": 2.0798110961914062, "Pretrain/Loss (Raw)": 1.9603042602539062, "Pretrain/Step": 4046, "Pretrain/Step Time": 8.5496321991086} +{"Pretrain/Learning Rate": 3.223451798270493e-05, "Pretrain/Loss": 2.0798182487487793, "Pretrain/Loss (Raw)": 1.9781912565231323, "Pretrain/Step": 4047, "Pretrain/Step Time": 8.547273548319936} +{"Pretrain/Learning Rate": 3.222639093958361e-05, "Pretrain/Loss": 2.082061767578125, "Pretrain/Loss (Raw)": 2.169672727584839, "Pretrain/Step": 4048, "Pretrain/Step Time": 8.548443678766489} +{"Pretrain/Learning Rate": 3.2218263063080836e-05, "Pretrain/Loss": 2.082202434539795, "Pretrain/Loss (Raw)": 2.229901075363159, "Pretrain/Step": 4049, "Pretrain/Step Time": 8.545473514124751} +{"Pretrain/Learning Rate": 3.221013435413395e-05, "Pretrain/Loss": 2.085392475128174, "Pretrain/Loss (Raw)": 2.3667891025543213, "Pretrain/Step": 4050, "Pretrain/Step Time": 8.547061692923307} +{"Pretrain/Learning Rate": 3.220200481368039e-05, "Pretrain/Loss": 2.0874691009521484, "Pretrain/Loss (Raw)": 2.2060718536376953, "Pretrain/Step": 4051, "Pretrain/Step Time": 8.547030935063958} +{"Pretrain/Learning Rate": 3.219387444265771e-05, "Pretrain/Loss": 2.0863735675811768, "Pretrain/Loss (Raw)": 1.9143309593200684, "Pretrain/Step": 4052, "Pretrain/Step Time": 8.553795415908098} +{"Pretrain/Learning Rate": 3.2185743242003524e-05, "Pretrain/Loss": 2.086308479309082, "Pretrain/Loss (Raw)": 2.060847043991089, "Pretrain/Step": 4053, "Pretrain/Step Time": 8.549904063344002} +{"Pretrain/Learning Rate": 3.217761121265557e-05, "Pretrain/Loss": 2.085880756378174, "Pretrain/Loss (Raw)": 1.9950854778289795, "Pretrain/Step": 4054, "Pretrain/Step Time": 8.546838015317917} +{"Pretrain/Learning Rate": 3.2169478355551665e-05, "Pretrain/Loss": 2.0850048065185547, "Pretrain/Loss (Raw)": 2.0738766193389893, "Pretrain/Step": 4055, "Pretrain/Step Time": 8.54320677369833} +{"Pretrain/Learning Rate": 3.216134467162973e-05, "Pretrain/Loss": 2.084404468536377, "Pretrain/Loss (Raw)": 1.989288568496704, "Pretrain/Step": 4056, "Pretrain/Step Time": 8.543803691864014} +{"Pretrain/Learning Rate": 3.215321016182779e-05, "Pretrain/Loss": 2.0848047733306885, "Pretrain/Loss (Raw)": 2.1165781021118164, "Pretrain/Step": 4057, "Pretrain/Step Time": 8.545816119760275} +{"Pretrain/Learning Rate": 3.2145074827083946e-05, "Pretrain/Loss": 2.0844969749450684, "Pretrain/Loss (Raw)": 1.8948330879211426, "Pretrain/Step": 4058, "Pretrain/Step Time": 8.550621649250388} +{"Pretrain/Learning Rate": 3.21369386683364e-05, "Pretrain/Loss": 2.0852413177490234, "Pretrain/Loss (Raw)": 1.9945484399795532, "Pretrain/Step": 4059, "Pretrain/Step Time": 8.5480318069458} +{"Pretrain/Learning Rate": 3.212880168652346e-05, "Pretrain/Loss": 2.08493709564209, "Pretrain/Loss (Raw)": 2.114772081375122, "Pretrain/Step": 4060, "Pretrain/Step Time": 8.546208249405026} +{"Pretrain/Learning Rate": 3.2120663882583514e-05, "Pretrain/Loss": 2.085160970687866, "Pretrain/Loss (Raw)": 2.086761236190796, "Pretrain/Step": 4061, "Pretrain/Step Time": 8.54353922791779} +{"Pretrain/Learning Rate": 3.2112525257455064e-05, "Pretrain/Loss": 2.085501194000244, "Pretrain/Loss (Raw)": 2.103614568710327, "Pretrain/Step": 4062, "Pretrain/Step Time": 8.545668506994843} +{"Pretrain/Learning Rate": 3.210438581207667e-05, "Pretrain/Loss": 2.085684299468994, "Pretrain/Loss (Raw)": 2.002192974090576, "Pretrain/Step": 4063, "Pretrain/Step Time": 8.546445360407233} +{"Pretrain/Learning Rate": 3.209624554738704e-05, "Pretrain/Loss": 2.0862231254577637, "Pretrain/Loss (Raw)": 2.1467721462249756, "Pretrain/Step": 4064, "Pretrain/Step Time": 8.548443332314491} +{"Pretrain/Learning Rate": 3.208810446432493e-05, "Pretrain/Loss": 2.084752082824707, "Pretrain/Loss (Raw)": 1.9062941074371338, "Pretrain/Step": 4065, "Pretrain/Step Time": 8.546720255166292} +{"Pretrain/Learning Rate": 3.207996256382922e-05, "Pretrain/Loss": 2.0850346088409424, "Pretrain/Loss (Raw)": 1.9565088748931885, "Pretrain/Step": 4066, "Pretrain/Step Time": 8.543627550825477} +{"Pretrain/Learning Rate": 3.207181984683886e-05, "Pretrain/Loss": 2.082935333251953, "Pretrain/Loss (Raw)": 1.9476052522659302, "Pretrain/Step": 4067, "Pretrain/Step Time": 8.541522320359945} +{"Pretrain/Learning Rate": 3.2063676314292914e-05, "Pretrain/Loss": 2.0844480991363525, "Pretrain/Loss (Raw)": 2.257744073867798, "Pretrain/Step": 4068, "Pretrain/Step Time": 8.542950658127666} +{"Pretrain/Learning Rate": 3.205553196713052e-05, "Pretrain/Loss": 2.08339524269104, "Pretrain/Loss (Raw)": 2.0279886722564697, "Pretrain/Step": 4069, "Pretrain/Step Time": 8.540248317644} +{"Pretrain/Learning Rate": 3.204738680629094e-05, "Pretrain/Loss": 2.084021806716919, "Pretrain/Loss (Raw)": 2.109863758087158, "Pretrain/Step": 4070, "Pretrain/Step Time": 8.54521245509386} +{"Pretrain/Learning Rate": 3.2039240832713516e-05, "Pretrain/Loss": 2.082352638244629, "Pretrain/Loss (Raw)": 1.9547256231307983, "Pretrain/Step": 4071, "Pretrain/Step Time": 8.547438044101} +{"Pretrain/Learning Rate": 3.203109404733765e-05, "Pretrain/Loss": 2.0816614627838135, "Pretrain/Loss (Raw)": 1.9660277366638184, "Pretrain/Step": 4072, "Pretrain/Step Time": 8.540226379409432} +{"Pretrain/Learning Rate": 3.20229464511029e-05, "Pretrain/Loss": 2.0794808864593506, "Pretrain/Loss (Raw)": 1.889155626296997, "Pretrain/Step": 4073, "Pretrain/Step Time": 8.539197003468871} +{"Pretrain/Learning Rate": 3.2014798044948866e-05, "Pretrain/Loss": 2.079402446746826, "Pretrain/Loss (Raw)": 2.1226489543914795, "Pretrain/Step": 4074, "Pretrain/Step Time": 8.536374665796757} +{"Pretrain/Learning Rate": 3.2006648829815265e-05, "Pretrain/Loss": 2.0808663368225098, "Pretrain/Loss (Raw)": 2.022488832473755, "Pretrain/Step": 4075, "Pretrain/Step Time": 8.5323123075068} +{"Pretrain/Learning Rate": 3.1998498806641907e-05, "Pretrain/Loss": 2.0826354026794434, "Pretrain/Loss (Raw)": 2.030651330947876, "Pretrain/Step": 4076, "Pretrain/Step Time": 8.546078447252512} +{"Pretrain/Learning Rate": 3.19903479763687e-05, "Pretrain/Loss": 2.084306478500366, "Pretrain/Loss (Raw)": 2.21169376373291, "Pretrain/Step": 4077, "Pretrain/Step Time": 8.541109895333648} +{"Pretrain/Learning Rate": 3.19821963399356e-05, "Pretrain/Loss": 2.0823428630828857, "Pretrain/Loss (Raw)": 1.8980579376220703, "Pretrain/Step": 4078, "Pretrain/Step Time": 8.539070706814528} +{"Pretrain/Learning Rate": 3.1974043898282744e-05, "Pretrain/Loss": 2.0824778079986572, "Pretrain/Loss (Raw)": 2.1211817264556885, "Pretrain/Step": 4079, "Pretrain/Step Time": 8.543081130832434} +{"Pretrain/Learning Rate": 3.196589065235026e-05, "Pretrain/Loss": 2.0852208137512207, "Pretrain/Loss (Raw)": 2.3124818801879883, "Pretrain/Step": 4080, "Pretrain/Step Time": 8.54015889018774} +{"Pretrain/Learning Rate": 3.195773660307846e-05, "Pretrain/Loss": 2.085594654083252, "Pretrain/Loss (Raw)": 2.1219210624694824, "Pretrain/Step": 4081, "Pretrain/Step Time": 8.53952530771494} +{"Pretrain/Learning Rate": 3.1949581751407676e-05, "Pretrain/Loss": 2.0869083404541016, "Pretrain/Loss (Raw)": 2.1938085556030273, "Pretrain/Step": 4082, "Pretrain/Step Time": 8.542232379317284} +{"Pretrain/Learning Rate": 3.1941426098278383e-05, "Pretrain/Loss": 2.0861752033233643, "Pretrain/Loss (Raw)": 1.9494781494140625, "Pretrain/Step": 4083, "Pretrain/Step Time": 8.541579814627767} +{"Pretrain/Learning Rate": 3.193326964463112e-05, "Pretrain/Loss": 2.0852956771850586, "Pretrain/Loss (Raw)": 1.9592771530151367, "Pretrain/Step": 4084, "Pretrain/Step Time": 8.539658242836595} +{"Pretrain/Learning Rate": 3.192511239140653e-05, "Pretrain/Loss": 2.084397792816162, "Pretrain/Loss (Raw)": 2.130784273147583, "Pretrain/Step": 4085, "Pretrain/Step Time": 8.537724930793047} +{"Pretrain/Learning Rate": 3.1916954339545355e-05, "Pretrain/Loss": 2.0872368812561035, "Pretrain/Loss (Raw)": 1.9984076023101807, "Pretrain/Step": 4086, "Pretrain/Step Time": 8.537611795589328} +{"Pretrain/Learning Rate": 3.19087954899884e-05, "Pretrain/Loss": 2.087547540664673, "Pretrain/Loss (Raw)": 2.1216511726379395, "Pretrain/Step": 4087, "Pretrain/Step Time": 8.535177234560251} +{"Pretrain/Learning Rate": 3.190063584367661e-05, "Pretrain/Loss": 2.0857229232788086, "Pretrain/Loss (Raw)": 1.909779667854309, "Pretrain/Step": 4088, "Pretrain/Step Time": 8.540887018665671} +{"Pretrain/Learning Rate": 3.1892475401550956e-05, "Pretrain/Loss": 2.0841403007507324, "Pretrain/Loss (Raw)": 1.7937533855438232, "Pretrain/Step": 4089, "Pretrain/Step Time": 8.544410331174731} +{"Pretrain/Learning Rate": 3.1884314164552576e-05, "Pretrain/Loss": 2.08392071723938, "Pretrain/Loss (Raw)": 2.0481131076812744, "Pretrain/Step": 4090, "Pretrain/Step Time": 8.538434507325292} +{"Pretrain/Learning Rate": 3.187615213362264e-05, "Pretrain/Loss": 2.0853195190429688, "Pretrain/Loss (Raw)": 2.3047406673431396, "Pretrain/Step": 4091, "Pretrain/Step Time": 8.538610491901636} +{"Pretrain/Learning Rate": 3.186798930970244e-05, "Pretrain/Loss": 2.0877771377563477, "Pretrain/Loss (Raw)": 2.487492322921753, "Pretrain/Step": 4092, "Pretrain/Step Time": 8.541736045852304} +{"Pretrain/Learning Rate": 3.185982569373335e-05, "Pretrain/Loss": 2.0885872840881348, "Pretrain/Loss (Raw)": 2.2151966094970703, "Pretrain/Step": 4093, "Pretrain/Step Time": 8.541055858135223} +{"Pretrain/Learning Rate": 3.185166128665684e-05, "Pretrain/Loss": 2.0880162715911865, "Pretrain/Loss (Raw)": 1.9788388013839722, "Pretrain/Step": 4094, "Pretrain/Step Time": 8.538111831992865} +{"Pretrain/Learning Rate": 3.184349608941446e-05, "Pretrain/Loss": 2.090116500854492, "Pretrain/Loss (Raw)": 2.2798616886138916, "Pretrain/Step": 4095, "Pretrain/Step Time": 8.54383423551917} +{"Pretrain/Learning Rate": 3.183533010294787e-05, "Pretrain/Loss": 2.0896759033203125, "Pretrain/Loss (Raw)": 2.130953550338745, "Pretrain/Step": 4096, "Pretrain/Step Time": 8.546702448278666} +{"Pretrain/Learning Rate": 3.18271633281988e-05, "Pretrain/Loss": 2.0905327796936035, "Pretrain/Loss (Raw)": 2.064537525177002, "Pretrain/Step": 4097, "Pretrain/Step Time": 8.543712679296732} +{"Pretrain/Learning Rate": 3.181899576610908e-05, "Pretrain/Loss": 2.088855743408203, "Pretrain/Loss (Raw)": 1.9481841325759888, "Pretrain/Step": 4098, "Pretrain/Step Time": 8.541954902932048} +{"Pretrain/Learning Rate": 3.1810827417620634e-05, "Pretrain/Loss": 2.0897531509399414, "Pretrain/Loss (Raw)": 2.087050437927246, "Pretrain/Step": 4099, "Pretrain/Step Time": 8.540443131700158} +{"Pretrain/Learning Rate": 3.1802658283675486e-05, "Pretrain/Loss": 2.0862598419189453, "Pretrain/Loss (Raw)": 1.7419724464416504, "Pretrain/Step": 4100, "Pretrain/Step Time": 8.544927345588803} +{"Pretrain/Learning Rate": 3.179448836521573e-05, "Pretrain/Loss": 2.086869716644287, "Pretrain/Loss (Raw)": 1.9223473072052002, "Pretrain/Step": 4101, "Pretrain/Step Time": 8.552688926458359} +{"Pretrain/Learning Rate": 3.178631766318355e-05, "Pretrain/Loss": 2.086388111114502, "Pretrain/Loss (Raw)": 1.9789836406707764, "Pretrain/Step": 4102, "Pretrain/Step Time": 8.539394875988364} +{"Pretrain/Learning Rate": 3.177814617852124e-05, "Pretrain/Loss": 2.083129405975342, "Pretrain/Loss (Raw)": 2.082963466644287, "Pretrain/Step": 4103, "Pretrain/Step Time": 8.546198807656765} +{"Pretrain/Learning Rate": 3.176997391217117e-05, "Pretrain/Loss": 2.085415840148926, "Pretrain/Loss (Raw)": 2.3881659507751465, "Pretrain/Step": 4104, "Pretrain/Step Time": 8.549516702070832} +{"Pretrain/Learning Rate": 3.176180086507582e-05, "Pretrain/Loss": 2.084719181060791, "Pretrain/Loss (Raw)": 1.9524004459381104, "Pretrain/Step": 4105, "Pretrain/Step Time": 8.54510959982872} +{"Pretrain/Learning Rate": 3.175362703817773e-05, "Pretrain/Loss": 2.085484027862549, "Pretrain/Loss (Raw)": 2.0114312171936035, "Pretrain/Step": 4106, "Pretrain/Step Time": 8.547979582101107} +{"Pretrain/Learning Rate": 3.1745452432419534e-05, "Pretrain/Loss": 2.0821914672851562, "Pretrain/Loss (Raw)": 2.025874137878418, "Pretrain/Step": 4107, "Pretrain/Step Time": 8.551704067736864} +{"Pretrain/Learning Rate": 3.1737277048743984e-05, "Pretrain/Loss": 2.080227851867676, "Pretrain/Loss (Raw)": 2.0532400608062744, "Pretrain/Step": 4108, "Pretrain/Step Time": 8.54417266882956} +{"Pretrain/Learning Rate": 3.17291008880939e-05, "Pretrain/Loss": 2.076739549636841, "Pretrain/Loss (Raw)": 1.8982025384902954, "Pretrain/Step": 4109, "Pretrain/Step Time": 8.539419438689947} +{"Pretrain/Learning Rate": 3.172092395141219e-05, "Pretrain/Loss": 2.0778796672821045, "Pretrain/Loss (Raw)": 2.0429039001464844, "Pretrain/Step": 4110, "Pretrain/Step Time": 8.542773822322488} +{"Pretrain/Learning Rate": 3.171274623964186e-05, "Pretrain/Loss": 2.07780122756958, "Pretrain/Loss (Raw)": 2.0868401527404785, "Pretrain/Step": 4111, "Pretrain/Step Time": 8.541122982278466} +{"Pretrain/Learning Rate": 3.170456775372601e-05, "Pretrain/Loss": 2.0761282444000244, "Pretrain/Loss (Raw)": 2.1873035430908203, "Pretrain/Step": 4112, "Pretrain/Step Time": 8.545419748872519} +{"Pretrain/Learning Rate": 3.1696388494607804e-05, "Pretrain/Loss": 2.075775384902954, "Pretrain/Loss (Raw)": 2.066593647003174, "Pretrain/Step": 4113, "Pretrain/Step Time": 8.552963024005294} +{"Pretrain/Learning Rate": 3.168820846323053e-05, "Pretrain/Loss": 2.076355218887329, "Pretrain/Loss (Raw)": 2.05936336517334, "Pretrain/Step": 4114, "Pretrain/Step Time": 8.549437893554568} +{"Pretrain/Learning Rate": 3.1680027660537524e-05, "Pretrain/Loss": 2.075336456298828, "Pretrain/Loss (Raw)": 1.9679906368255615, "Pretrain/Step": 4115, "Pretrain/Step Time": 8.54643133096397} +{"Pretrain/Learning Rate": 3.167184608747227e-05, "Pretrain/Loss": 2.0754709243774414, "Pretrain/Loss (Raw)": 2.079702615737915, "Pretrain/Step": 4116, "Pretrain/Step Time": 8.544918132945895} +{"Pretrain/Learning Rate": 3.1663663744978276e-05, "Pretrain/Loss": 2.0727288722991943, "Pretrain/Loss (Raw)": 2.148761034011841, "Pretrain/Step": 4117, "Pretrain/Step Time": 8.54808102734387} +{"Pretrain/Learning Rate": 3.165548063399919e-05, "Pretrain/Loss": 2.073263645172119, "Pretrain/Loss (Raw)": 2.1142539978027344, "Pretrain/Step": 4118, "Pretrain/Step Time": 8.549730388447642} +{"Pretrain/Learning Rate": 3.1647296755478694e-05, "Pretrain/Loss": 2.0753870010375977, "Pretrain/Loss (Raw)": 2.140214681625366, "Pretrain/Step": 4119, "Pretrain/Step Time": 8.557771291583776} +{"Pretrain/Learning Rate": 3.163911211036063e-05, "Pretrain/Loss": 2.074251651763916, "Pretrain/Loss (Raw)": 1.9110790491104126, "Pretrain/Step": 4120, "Pretrain/Step Time": 8.548128854483366} +{"Pretrain/Learning Rate": 3.163092669958887e-05, "Pretrain/Loss": 2.0746288299560547, "Pretrain/Loss (Raw)": 2.0600671768188477, "Pretrain/Step": 4121, "Pretrain/Step Time": 8.550057377666235} +{"Pretrain/Learning Rate": 3.16227405241074e-05, "Pretrain/Loss": 2.07185697555542, "Pretrain/Loss (Raw)": 1.9704771041870117, "Pretrain/Step": 4122, "Pretrain/Step Time": 8.552759744226933} +{"Pretrain/Learning Rate": 3.161455358486028e-05, "Pretrain/Loss": 2.073489189147949, "Pretrain/Loss (Raw)": 2.2381274700164795, "Pretrain/Step": 4123, "Pretrain/Step Time": 8.552490891888738} +{"Pretrain/Learning Rate": 3.160636588279167e-05, "Pretrain/Loss": 2.0717172622680664, "Pretrain/Loss (Raw)": 1.9437819719314575, "Pretrain/Step": 4124, "Pretrain/Step Time": 8.549982212483883} +{"Pretrain/Learning Rate": 3.159817741884582e-05, "Pretrain/Loss": 2.074324131011963, "Pretrain/Loss (Raw)": 2.451090097427368, "Pretrain/Step": 4125, "Pretrain/Step Time": 8.555049637332559} +{"Pretrain/Learning Rate": 3.1589988193967056e-05, "Pretrain/Loss": 2.074882984161377, "Pretrain/Loss (Raw)": 2.2893972396850586, "Pretrain/Step": 4126, "Pretrain/Step Time": 8.551706111058593} +{"Pretrain/Learning Rate": 3.15817982090998e-05, "Pretrain/Loss": 2.075671672821045, "Pretrain/Loss (Raw)": 2.2247354984283447, "Pretrain/Step": 4127, "Pretrain/Step Time": 8.551530851051211} +{"Pretrain/Learning Rate": 3.157360746518857e-05, "Pretrain/Loss": 2.081594705581665, "Pretrain/Loss (Raw)": 2.5822713375091553, "Pretrain/Step": 4128, "Pretrain/Step Time": 8.553571239113808} +{"Pretrain/Learning Rate": 3.1565415963177944e-05, "Pretrain/Loss": 2.081373453140259, "Pretrain/Loss (Raw)": 2.0504202842712402, "Pretrain/Step": 4129, "Pretrain/Step Time": 8.548431992530823} +{"Pretrain/Learning Rate": 3.1557223704012606e-05, "Pretrain/Loss": 2.0795698165893555, "Pretrain/Loss (Raw)": 1.8102773427963257, "Pretrain/Step": 4130, "Pretrain/Step Time": 8.54859789274633} +{"Pretrain/Learning Rate": 3.154903068863734e-05, "Pretrain/Loss": 2.079624891281128, "Pretrain/Loss (Raw)": 2.0422253608703613, "Pretrain/Step": 4131, "Pretrain/Step Time": 8.56039821729064} +{"Pretrain/Learning Rate": 3.154083691799699e-05, "Pretrain/Loss": 2.0789575576782227, "Pretrain/Loss (Raw)": 2.0129330158233643, "Pretrain/Step": 4132, "Pretrain/Step Time": 8.553176190704107} +{"Pretrain/Learning Rate": 3.1532642393036506e-05, "Pretrain/Loss": 2.0822393894195557, "Pretrain/Loss (Raw)": 2.6046581268310547, "Pretrain/Step": 4133, "Pretrain/Step Time": 8.549576880410314} +{"Pretrain/Learning Rate": 3.1524447114700914e-05, "Pretrain/Loss": 2.0825088024139404, "Pretrain/Loss (Raw)": 2.195233106613159, "Pretrain/Step": 4134, "Pretrain/Step Time": 8.544881461188197} +{"Pretrain/Learning Rate": 3.151625108393534e-05, "Pretrain/Loss": 2.0860705375671387, "Pretrain/Loss (Raw)": 2.3598592281341553, "Pretrain/Step": 4135, "Pretrain/Step Time": 8.545578813180327} +{"Pretrain/Learning Rate": 3.150805430168499e-05, "Pretrain/Loss": 2.0849475860595703, "Pretrain/Loss (Raw)": 2.0147340297698975, "Pretrain/Step": 4136, "Pretrain/Step Time": 8.543044839054346} +{"Pretrain/Learning Rate": 3.149985676889515e-05, "Pretrain/Loss": 2.085193634033203, "Pretrain/Loss (Raw)": 2.0949513912200928, "Pretrain/Step": 4137, "Pretrain/Step Time": 8.552828883752227} +{"Pretrain/Learning Rate": 3.14916584865112e-05, "Pretrain/Loss": 2.0872550010681152, "Pretrain/Loss (Raw)": 2.069483757019043, "Pretrain/Step": 4138, "Pretrain/Step Time": 8.541867163032293} +{"Pretrain/Learning Rate": 3.1483459455478603e-05, "Pretrain/Loss": 2.0848684310913086, "Pretrain/Loss (Raw)": 1.7834171056747437, "Pretrain/Step": 4139, "Pretrain/Step Time": 8.542323561385274} +{"Pretrain/Learning Rate": 3.147525967674291e-05, "Pretrain/Loss": 2.0835771560668945, "Pretrain/Loss (Raw)": 2.125141143798828, "Pretrain/Step": 4140, "Pretrain/Step Time": 8.53808799572289} +{"Pretrain/Learning Rate": 3.146705915124976e-05, "Pretrain/Loss": 2.0890073776245117, "Pretrain/Loss (Raw)": 2.4581074714660645, "Pretrain/Step": 4141, "Pretrain/Step Time": 8.538513071835041} +{"Pretrain/Learning Rate": 3.145885787994487e-05, "Pretrain/Loss": 2.0872955322265625, "Pretrain/Loss (Raw)": 1.918643593788147, "Pretrain/Step": 4142, "Pretrain/Step Time": 8.53667319379747} +{"Pretrain/Learning Rate": 3.1450655863774056e-05, "Pretrain/Loss": 2.0869979858398438, "Pretrain/Loss (Raw)": 1.9611612558364868, "Pretrain/Step": 4143, "Pretrain/Step Time": 8.54626096971333} +{"Pretrain/Learning Rate": 3.144245310368321e-05, "Pretrain/Loss": 2.08492374420166, "Pretrain/Loss (Raw)": 1.854304552078247, "Pretrain/Step": 4144, "Pretrain/Step Time": 8.537037182599306} +{"Pretrain/Learning Rate": 3.1434249600618315e-05, "Pretrain/Loss": 2.085294246673584, "Pretrain/Loss (Raw)": 2.127481460571289, "Pretrain/Step": 4145, "Pretrain/Step Time": 8.530678160488605} +{"Pretrain/Learning Rate": 3.142604535552544e-05, "Pretrain/Loss": 2.086583137512207, "Pretrain/Loss (Raw)": 2.079993724822998, "Pretrain/Step": 4146, "Pretrain/Step Time": 8.533274032175541} +{"Pretrain/Learning Rate": 3.1417840369350735e-05, "Pretrain/Loss": 2.087554693222046, "Pretrain/Loss (Raw)": 2.2621304988861084, "Pretrain/Step": 4147, "Pretrain/Step Time": 8.534921310842037} +{"Pretrain/Learning Rate": 3.140963464304043e-05, "Pretrain/Loss": 2.0868124961853027, "Pretrain/Loss (Raw)": 2.171644449234009, "Pretrain/Step": 4148, "Pretrain/Step Time": 8.530699903145432} +{"Pretrain/Learning Rate": 3.140142817754086e-05, "Pretrain/Loss": 2.086104393005371, "Pretrain/Loss (Raw)": 2.012263536453247, "Pretrain/Step": 4149, "Pretrain/Step Time": 8.538562677800655} +{"Pretrain/Learning Rate": 3.1393220973798425e-05, "Pretrain/Loss": 2.08809757232666, "Pretrain/Loss (Raw)": 2.2416322231292725, "Pretrain/Step": 4150, "Pretrain/Step Time": 8.535300510004163} +{"Pretrain/Learning Rate": 3.1385013032759623e-05, "Pretrain/Loss": 2.0834662914276123, "Pretrain/Loss (Raw)": 1.9521762132644653, "Pretrain/Step": 4151, "Pretrain/Step Time": 8.538927903398871} +{"Pretrain/Learning Rate": 3.137680435537104e-05, "Pretrain/Loss": 2.08457612991333, "Pretrain/Loss (Raw)": 2.137498617172241, "Pretrain/Step": 4152, "Pretrain/Step Time": 8.534267127513885} +{"Pretrain/Learning Rate": 3.136859494257931e-05, "Pretrain/Loss": 2.0832531452178955, "Pretrain/Loss (Raw)": 2.053546667098999, "Pretrain/Step": 4153, "Pretrain/Step Time": 8.537359589710832} +{"Pretrain/Learning Rate": 3.136038479533122e-05, "Pretrain/Loss": 2.085341453552246, "Pretrain/Loss (Raw)": 2.1333415508270264, "Pretrain/Step": 4154, "Pretrain/Step Time": 8.533362708985806} +{"Pretrain/Learning Rate": 3.135217391457358e-05, "Pretrain/Loss": 2.08359956741333, "Pretrain/Loss (Raw)": 1.8933930397033691, "Pretrain/Step": 4155, "Pretrain/Step Time": 8.538938330486417} +{"Pretrain/Learning Rate": 3.1343962301253305e-05, "Pretrain/Loss": 2.086536407470703, "Pretrain/Loss (Raw)": 2.3255562782287598, "Pretrain/Step": 4156, "Pretrain/Step Time": 8.528687899932265} +{"Pretrain/Learning Rate": 3.133574995631741e-05, "Pretrain/Loss": 2.0832855701446533, "Pretrain/Loss (Raw)": 1.916830062866211, "Pretrain/Step": 4157, "Pretrain/Step Time": 8.531774217262864} +{"Pretrain/Learning Rate": 3.132753688071297e-05, "Pretrain/Loss": 2.084040641784668, "Pretrain/Loss (Raw)": 2.1399319171905518, "Pretrain/Step": 4158, "Pretrain/Step Time": 8.537165440618992} +{"Pretrain/Learning Rate": 3.1319323075387165e-05, "Pretrain/Loss": 2.0833687782287598, "Pretrain/Loss (Raw)": 2.1022801399230957, "Pretrain/Step": 4159, "Pretrain/Step Time": 8.537445213645697} +{"Pretrain/Learning Rate": 3.131110854128724e-05, "Pretrain/Loss": 2.0833499431610107, "Pretrain/Loss (Raw)": 1.9670140743255615, "Pretrain/Step": 4160, "Pretrain/Step Time": 8.53856654651463} +{"Pretrain/Learning Rate": 3.130289327936055e-05, "Pretrain/Loss": 2.0852396488189697, "Pretrain/Loss (Raw)": 2.177910327911377, "Pretrain/Step": 4161, "Pretrain/Step Time": 8.545562950894237} +{"Pretrain/Learning Rate": 3.1294677290554494e-05, "Pretrain/Loss": 2.0870003700256348, "Pretrain/Loss (Raw)": 2.1391069889068604, "Pretrain/Step": 4162, "Pretrain/Step Time": 8.540826523676515} +{"Pretrain/Learning Rate": 3.128646057581659e-05, "Pretrain/Loss": 2.085833787918091, "Pretrain/Loss (Raw)": 1.9393939971923828, "Pretrain/Step": 4163, "Pretrain/Step Time": 8.543528409674764} +{"Pretrain/Learning Rate": 3.1278243136094436e-05, "Pretrain/Loss": 2.0879650115966797, "Pretrain/Loss (Raw)": 2.257140874862671, "Pretrain/Step": 4164, "Pretrain/Step Time": 8.534255746752024} +{"Pretrain/Learning Rate": 3.1270024972335706e-05, "Pretrain/Loss": 2.0890462398529053, "Pretrain/Loss (Raw)": 2.2082438468933105, "Pretrain/Step": 4165, "Pretrain/Step Time": 8.537080585956573} +{"Pretrain/Learning Rate": 3.1261806085488144e-05, "Pretrain/Loss": 2.0882136821746826, "Pretrain/Loss (Raw)": 2.2008206844329834, "Pretrain/Step": 4166, "Pretrain/Step Time": 8.537586817517877} +{"Pretrain/Learning Rate": 3.1253586476499594e-05, "Pretrain/Loss": 2.0879039764404297, "Pretrain/Loss (Raw)": 2.12968373298645, "Pretrain/Step": 4167, "Pretrain/Step Time": 8.539569117128849} +{"Pretrain/Learning Rate": 3.124536614631799e-05, "Pretrain/Loss": 2.0887248516082764, "Pretrain/Loss (Raw)": 2.187204122543335, "Pretrain/Step": 4168, "Pretrain/Step Time": 8.532074950635433} +{"Pretrain/Learning Rate": 3.123714509589133e-05, "Pretrain/Loss": 2.0882208347320557, "Pretrain/Loss (Raw)": 2.0332632064819336, "Pretrain/Step": 4169, "Pretrain/Step Time": 8.532012714073062} +{"Pretrain/Learning Rate": 3.122892332616771e-05, "Pretrain/Loss": 2.0877106189727783, "Pretrain/Loss (Raw)": 2.0225772857666016, "Pretrain/Step": 4170, "Pretrain/Step Time": 8.534355832263827} +{"Pretrain/Learning Rate": 3.12207008380953e-05, "Pretrain/Loss": 2.0858230590820312, "Pretrain/Loss (Raw)": 2.190775156021118, "Pretrain/Step": 4171, "Pretrain/Step Time": 8.53705638460815} +{"Pretrain/Learning Rate": 3.121247763262235e-05, "Pretrain/Loss": 2.084878444671631, "Pretrain/Loss (Raw)": 2.047034740447998, "Pretrain/Step": 4172, "Pretrain/Step Time": 8.53779031150043} +{"Pretrain/Learning Rate": 3.120425371069721e-05, "Pretrain/Loss": 2.0893936157226562, "Pretrain/Loss (Raw)": 2.5530526638031006, "Pretrain/Step": 4173, "Pretrain/Step Time": 8.547869097441435} +{"Pretrain/Learning Rate": 3.119602907326829e-05, "Pretrain/Loss": 2.0908703804016113, "Pretrain/Loss (Raw)": 2.149355411529541, "Pretrain/Step": 4174, "Pretrain/Step Time": 8.542627111077309} +{"Pretrain/Learning Rate": 3.118780372128411e-05, "Pretrain/Loss": 2.0907957553863525, "Pretrain/Loss (Raw)": 1.9686055183410645, "Pretrain/Step": 4175, "Pretrain/Step Time": 8.545080041512847} +{"Pretrain/Learning Rate": 3.1179577655693245e-05, "Pretrain/Loss": 2.092362642288208, "Pretrain/Loss (Raw)": 2.370237350463867, "Pretrain/Step": 4176, "Pretrain/Step Time": 8.53945709578693} +{"Pretrain/Learning Rate": 3.1171350877444365e-05, "Pretrain/Loss": 2.0902905464172363, "Pretrain/Loss (Raw)": 1.9646714925765991, "Pretrain/Step": 4177, "Pretrain/Step Time": 8.542116664350033} +{"Pretrain/Learning Rate": 3.116312338748623e-05, "Pretrain/Loss": 2.088364601135254, "Pretrain/Loss (Raw)": 2.120258331298828, "Pretrain/Step": 4178, "Pretrain/Step Time": 8.5386753808707} +{"Pretrain/Learning Rate": 3.115489518676765e-05, "Pretrain/Loss": 2.08674955368042, "Pretrain/Loss (Raw)": 1.9993809461593628, "Pretrain/Step": 4179, "Pretrain/Step Time": 8.5490813665092} +{"Pretrain/Learning Rate": 3.1146666276237554e-05, "Pretrain/Loss": 2.0863380432128906, "Pretrain/Loss (Raw)": 1.8616340160369873, "Pretrain/Step": 4180, "Pretrain/Step Time": 8.542154690250754} +{"Pretrain/Learning Rate": 3.113843665684495e-05, "Pretrain/Loss": 2.08646297454834, "Pretrain/Loss (Raw)": 2.0768556594848633, "Pretrain/Step": 4181, "Pretrain/Step Time": 8.540297316387296} +{"Pretrain/Learning Rate": 3.1130206329538905e-05, "Pretrain/Loss": 2.0869064331054688, "Pretrain/Loss (Raw)": 2.0518534183502197, "Pretrain/Step": 4182, "Pretrain/Step Time": 8.53931549936533} +{"Pretrain/Learning Rate": 3.112197529526857e-05, "Pretrain/Loss": 2.085428476333618, "Pretrain/Loss (Raw)": 1.884680151939392, "Pretrain/Step": 4183, "Pretrain/Step Time": 8.538795882835984} +{"Pretrain/Learning Rate": 3.11137435549832e-05, "Pretrain/Loss": 2.0884718894958496, "Pretrain/Loss (Raw)": 2.3788442611694336, "Pretrain/Step": 4184, "Pretrain/Step Time": 8.537863725796342} +{"Pretrain/Learning Rate": 3.110551110963212e-05, "Pretrain/Loss": 2.089595079421997, "Pretrain/Loss (Raw)": 2.2603416442871094, "Pretrain/Step": 4185, "Pretrain/Step Time": 8.539241114631295} +{"Pretrain/Learning Rate": 3.109727796016472e-05, "Pretrain/Loss": 2.0907950401306152, "Pretrain/Loss (Raw)": 2.048454523086548, "Pretrain/Step": 4186, "Pretrain/Step Time": 8.536284174770117} +{"Pretrain/Learning Rate": 3.10890441075305e-05, "Pretrain/Loss": 2.0905959606170654, "Pretrain/Loss (Raw)": 1.9690274000167847, "Pretrain/Step": 4187, "Pretrain/Step Time": 8.542963052168489} +{"Pretrain/Learning Rate": 3.108080955267902e-05, "Pretrain/Loss": 2.090911388397217, "Pretrain/Loss (Raw)": 2.1551871299743652, "Pretrain/Step": 4188, "Pretrain/Step Time": 8.538849756121635} +{"Pretrain/Learning Rate": 3.107257429655993e-05, "Pretrain/Loss": 2.0901646614074707, "Pretrain/Loss (Raw)": 1.9911563396453857, "Pretrain/Step": 4189, "Pretrain/Step Time": 8.540247512981296} +{"Pretrain/Learning Rate": 3.1064338340122953e-05, "Pretrain/Loss": 2.08939528465271, "Pretrain/Loss (Raw)": 2.0051496028900146, "Pretrain/Step": 4190, "Pretrain/Step Time": 8.537023335695267} +{"Pretrain/Learning Rate": 3.105610168431791e-05, "Pretrain/Loss": 2.0912399291992188, "Pretrain/Loss (Raw)": 2.238283157348633, "Pretrain/Step": 4191, "Pretrain/Step Time": 8.545512109994888} +{"Pretrain/Learning Rate": 3.1047864330094675e-05, "Pretrain/Loss": 2.089812755584717, "Pretrain/Loss (Raw)": 1.9641001224517822, "Pretrain/Step": 4192, "Pretrain/Step Time": 8.542845154181123} +{"Pretrain/Learning Rate": 3.1039626278403234e-05, "Pretrain/Loss": 2.091585159301758, "Pretrain/Loss (Raw)": 2.1331632137298584, "Pretrain/Step": 4193, "Pretrain/Step Time": 8.54388146288693} +{"Pretrain/Learning Rate": 3.1031387530193626e-05, "Pretrain/Loss": 2.0936381816864014, "Pretrain/Loss (Raw)": 2.219292640686035, "Pretrain/Step": 4194, "Pretrain/Step Time": 8.541646722704172} +{"Pretrain/Learning Rate": 3.1023148086415984e-05, "Pretrain/Loss": 2.0948410034179688, "Pretrain/Loss (Raw)": 2.1015639305114746, "Pretrain/Step": 4195, "Pretrain/Step Time": 8.542864181101322} +{"Pretrain/Learning Rate": 3.101490794802053e-05, "Pretrain/Loss": 2.0956320762634277, "Pretrain/Loss (Raw)": 2.3590352535247803, "Pretrain/Step": 4196, "Pretrain/Step Time": 8.53807515092194} +{"Pretrain/Learning Rate": 3.100666711595754e-05, "Pretrain/Loss": 2.096393585205078, "Pretrain/Loss (Raw)": 2.1254522800445557, "Pretrain/Step": 4197, "Pretrain/Step Time": 8.550205335021019} +{"Pretrain/Learning Rate": 3.09984255911774e-05, "Pretrain/Loss": 2.096579074859619, "Pretrain/Loss (Raw)": 2.133573532104492, "Pretrain/Step": 4198, "Pretrain/Step Time": 8.541507538408041} +{"Pretrain/Learning Rate": 3.099018337463056e-05, "Pretrain/Loss": 2.096412181854248, "Pretrain/Loss (Raw)": 1.933389663696289, "Pretrain/Step": 4199, "Pretrain/Step Time": 8.54083814099431} +{"Pretrain/Learning Rate": 3.0981940467267547e-05, "Pretrain/Loss": 2.0961596965789795, "Pretrain/Loss (Raw)": 1.9337092638015747, "Pretrain/Step": 4200, "Pretrain/Step Time": 8.541686518117785} +{"Pretrain/Learning Rate": 3.097369687003896e-05, "Pretrain/Loss": 2.0980420112609863, "Pretrain/Loss (Raw)": 2.130103588104248, "Pretrain/Step": 4201, "Pretrain/Step Time": 8.539001315832138} +{"Pretrain/Learning Rate": 3.096545258389551e-05, "Pretrain/Loss": 2.0976717472076416, "Pretrain/Loss (Raw)": 2.075237274169922, "Pretrain/Step": 4202, "Pretrain/Step Time": 8.539500813931227} +{"Pretrain/Learning Rate": 3.0957207609787945e-05, "Pretrain/Loss": 2.0969510078430176, "Pretrain/Loss (Raw)": 1.9302124977111816, "Pretrain/Step": 4203, "Pretrain/Step Time": 8.553229192271829} +{"Pretrain/Learning Rate": 3.094896194866714e-05, "Pretrain/Loss": 2.09873104095459, "Pretrain/Loss (Raw)": 2.2585363388061523, "Pretrain/Step": 4204, "Pretrain/Step Time": 8.538897179067135} +{"Pretrain/Learning Rate": 3.094071560148401e-05, "Pretrain/Loss": 2.0963377952575684, "Pretrain/Loss (Raw)": 1.9053457975387573, "Pretrain/Step": 4205, "Pretrain/Step Time": 8.544025449082255} +{"Pretrain/Learning Rate": 3.093246856918956e-05, "Pretrain/Loss": 2.097813606262207, "Pretrain/Loss (Raw)": 2.0869274139404297, "Pretrain/Step": 4206, "Pretrain/Step Time": 8.541208418086171} +{"Pretrain/Learning Rate": 3.092422085273488e-05, "Pretrain/Loss": 2.0974984169006348, "Pretrain/Loss (Raw)": 2.080850601196289, "Pretrain/Step": 4207, "Pretrain/Step Time": 8.53847336024046} +{"Pretrain/Learning Rate": 3.091597245307114e-05, "Pretrain/Loss": 2.097165822982788, "Pretrain/Loss (Raw)": 2.2699224948883057, "Pretrain/Step": 4208, "Pretrain/Step Time": 8.542715391144156} +{"Pretrain/Learning Rate": 3.0907723371149575e-05, "Pretrain/Loss": 2.096315860748291, "Pretrain/Loss (Raw)": 2.0131003856658936, "Pretrain/Step": 4209, "Pretrain/Step Time": 8.543547734618187} +{"Pretrain/Learning Rate": 3.0899473607921513e-05, "Pretrain/Loss": 2.09568452835083, "Pretrain/Loss (Raw)": 2.113027572631836, "Pretrain/Step": 4210, "Pretrain/Step Time": 8.539632180705667} +{"Pretrain/Learning Rate": 3.0891223164338354e-05, "Pretrain/Loss": 2.095519542694092, "Pretrain/Loss (Raw)": 1.9283615350723267, "Pretrain/Step": 4211, "Pretrain/Step Time": 8.548383180052042} +{"Pretrain/Learning Rate": 3.0882972041351585e-05, "Pretrain/Loss": 2.0968780517578125, "Pretrain/Loss (Raw)": 2.1331517696380615, "Pretrain/Step": 4212, "Pretrain/Step Time": 8.544879892840981} +{"Pretrain/Learning Rate": 3.0874720239912744e-05, "Pretrain/Loss": 2.0963151454925537, "Pretrain/Loss (Raw)": 2.058746337890625, "Pretrain/Step": 4213, "Pretrain/Step Time": 8.544187927618623} +{"Pretrain/Learning Rate": 3.0866467760973495e-05, "Pretrain/Loss": 2.096501111984253, "Pretrain/Loss (Raw)": 2.022193193435669, "Pretrain/Step": 4214, "Pretrain/Step Time": 8.545554207637906} +{"Pretrain/Learning Rate": 3.0858214605485545e-05, "Pretrain/Loss": 2.095102548599243, "Pretrain/Loss (Raw)": 1.9426478147506714, "Pretrain/Step": 4215, "Pretrain/Step Time": 8.553101485595107} +{"Pretrain/Learning Rate": 3.0849960774400667e-05, "Pretrain/Loss": 2.0954995155334473, "Pretrain/Loss (Raw)": 1.9605752229690552, "Pretrain/Step": 4216, "Pretrain/Step Time": 8.553284449502826} +{"Pretrain/Learning Rate": 3.0841706268670756e-05, "Pretrain/Loss": 2.09804105758667, "Pretrain/Loss (Raw)": 2.1190781593322754, "Pretrain/Step": 4217, "Pretrain/Step Time": 8.542849626392126} +{"Pretrain/Learning Rate": 3.083345108924775e-05, "Pretrain/Loss": 2.098498582839966, "Pretrain/Loss (Raw)": 2.106673002243042, "Pretrain/Step": 4218, "Pretrain/Step Time": 8.550842382013798} +{"Pretrain/Learning Rate": 3.082519523708368e-05, "Pretrain/Loss": 2.0962636470794678, "Pretrain/Loss (Raw)": 2.0186779499053955, "Pretrain/Step": 4219, "Pretrain/Step Time": 8.549303371459246} +{"Pretrain/Learning Rate": 3.081693871313064e-05, "Pretrain/Loss": 2.0941262245178223, "Pretrain/Loss (Raw)": 2.213913917541504, "Pretrain/Step": 4220, "Pretrain/Step Time": 8.54694447107613} +{"Pretrain/Learning Rate": 3.080868151834082e-05, "Pretrain/Loss": 2.095341682434082, "Pretrain/Loss (Raw)": 2.3707737922668457, "Pretrain/Step": 4221, "Pretrain/Step Time": 8.55659207329154} +{"Pretrain/Learning Rate": 3.080042365366648e-05, "Pretrain/Loss": 2.0947418212890625, "Pretrain/Loss (Raw)": 1.9020254611968994, "Pretrain/Step": 4222, "Pretrain/Step Time": 8.56160718202591} +{"Pretrain/Learning Rate": 3.079216512005994e-05, "Pretrain/Loss": 2.0939385890960693, "Pretrain/Loss (Raw)": 2.177062511444092, "Pretrain/Step": 4223, "Pretrain/Step Time": 8.549499625340104} +{"Pretrain/Learning Rate": 3.078390591847363e-05, "Pretrain/Loss": 2.0941672325134277, "Pretrain/Loss (Raw)": 2.160215139389038, "Pretrain/Step": 4224, "Pretrain/Step Time": 8.55232266522944} +{"Pretrain/Learning Rate": 3.077564604986004e-05, "Pretrain/Loss": 2.0922439098358154, "Pretrain/Loss (Raw)": 1.818365454673767, "Pretrain/Step": 4225, "Pretrain/Step Time": 8.550101563334465} +{"Pretrain/Learning Rate": 3.076738551517173e-05, "Pretrain/Loss": 2.0910840034484863, "Pretrain/Loss (Raw)": 1.7997336387634277, "Pretrain/Step": 4226, "Pretrain/Step Time": 8.548357171937823} +{"Pretrain/Learning Rate": 3.0759124315361344e-05, "Pretrain/Loss": 2.0922372341156006, "Pretrain/Loss (Raw)": 2.2346508502960205, "Pretrain/Step": 4227, "Pretrain/Step Time": 8.553270440548658} +{"Pretrain/Learning Rate": 3.07508624513816e-05, "Pretrain/Loss": 2.093717575073242, "Pretrain/Loss (Raw)": 1.9314595460891724, "Pretrain/Step": 4228, "Pretrain/Step Time": 8.553534096106887} +{"Pretrain/Learning Rate": 3.0742599924185306e-05, "Pretrain/Loss": 2.094688892364502, "Pretrain/Loss (Raw)": 2.0466668605804443, "Pretrain/Step": 4229, "Pretrain/Step Time": 8.547425225377083} +{"Pretrain/Learning Rate": 3.073433673472533e-05, "Pretrain/Loss": 2.096233606338501, "Pretrain/Loss (Raw)": 2.1766960620880127, "Pretrain/Step": 4230, "Pretrain/Step Time": 8.550360135734081} +{"Pretrain/Learning Rate": 3.072607288395461e-05, "Pretrain/Loss": 2.0967884063720703, "Pretrain/Loss (Raw)": 2.153968334197998, "Pretrain/Step": 4231, "Pretrain/Step Time": 8.547515835613012} +{"Pretrain/Learning Rate": 3.071780837282619e-05, "Pretrain/Loss": 2.094524621963501, "Pretrain/Loss (Raw)": 2.0984232425689697, "Pretrain/Step": 4232, "Pretrain/Step Time": 8.54185469634831} +{"Pretrain/Learning Rate": 3.0709543202293164e-05, "Pretrain/Loss": 2.095660448074341, "Pretrain/Loss (Raw)": 2.0977792739868164, "Pretrain/Step": 4233, "Pretrain/Step Time": 8.546757876873016} +{"Pretrain/Learning Rate": 3.070127737330871e-05, "Pretrain/Loss": 2.094377040863037, "Pretrain/Loss (Raw)": 1.847165822982788, "Pretrain/Step": 4234, "Pretrain/Step Time": 8.545862801373005} +{"Pretrain/Learning Rate": 3.069301088682609e-05, "Pretrain/Loss": 2.0954599380493164, "Pretrain/Loss (Raw)": 2.1644821166992188, "Pretrain/Step": 4235, "Pretrain/Step Time": 8.542593389749527} +{"Pretrain/Learning Rate": 3.068474374379863e-05, "Pretrain/Loss": 2.095970392227173, "Pretrain/Loss (Raw)": 2.1185760498046875, "Pretrain/Step": 4236, "Pretrain/Step Time": 8.543749589473009} +{"Pretrain/Learning Rate": 3.067647594517972e-05, "Pretrain/Loss": 2.094914436340332, "Pretrain/Loss (Raw)": 1.7630189657211304, "Pretrain/Step": 4237, "Pretrain/Step Time": 8.548394991084933} +{"Pretrain/Learning Rate": 3.0668207491922866e-05, "Pretrain/Loss": 2.095360040664673, "Pretrain/Loss (Raw)": 2.099965810775757, "Pretrain/Step": 4238, "Pretrain/Step Time": 8.544194402173162} +{"Pretrain/Learning Rate": 3.0659938384981616e-05, "Pretrain/Loss": 2.0967369079589844, "Pretrain/Loss (Raw)": 2.2630491256713867, "Pretrain/Step": 4239, "Pretrain/Step Time": 8.55546037107706} +{"Pretrain/Learning Rate": 3.0651668625309594e-05, "Pretrain/Loss": 2.09645938873291, "Pretrain/Loss (Raw)": 2.151806116104126, "Pretrain/Step": 4240, "Pretrain/Step Time": 8.554697632789612} +{"Pretrain/Learning Rate": 3.0643398213860525e-05, "Pretrain/Loss": 2.098194122314453, "Pretrain/Loss (Raw)": 2.288628578186035, "Pretrain/Step": 4241, "Pretrain/Step Time": 8.54125626012683} +{"Pretrain/Learning Rate": 3.0635127151588175e-05, "Pretrain/Loss": 2.097848415374756, "Pretrain/Loss (Raw)": 2.0151469707489014, "Pretrain/Step": 4242, "Pretrain/Step Time": 8.542329398915172} +{"Pretrain/Learning Rate": 3.0626855439446405e-05, "Pretrain/Loss": 2.097524642944336, "Pretrain/Loss (Raw)": 1.9265246391296387, "Pretrain/Step": 4243, "Pretrain/Step Time": 8.541711697354913} +{"Pretrain/Learning Rate": 3.061858307838915e-05, "Pretrain/Loss": 2.096621036529541, "Pretrain/Loss (Raw)": 1.9640320539474487, "Pretrain/Step": 4244, "Pretrain/Step Time": 8.54075000807643} +{"Pretrain/Learning Rate": 3.061031006937043e-05, "Pretrain/Loss": 2.0951099395751953, "Pretrain/Loss (Raw)": 1.9553381204605103, "Pretrain/Step": 4245, "Pretrain/Step Time": 8.539746144786477} +{"Pretrain/Learning Rate": 3.060203641334431e-05, "Pretrain/Loss": 2.095156192779541, "Pretrain/Loss (Raw)": 2.1201539039611816, "Pretrain/Step": 4246, "Pretrain/Step Time": 8.540641350671649} +{"Pretrain/Learning Rate": 3.059376211126495e-05, "Pretrain/Loss": 2.094634532928467, "Pretrain/Loss (Raw)": 2.0734803676605225, "Pretrain/Step": 4247, "Pretrain/Step Time": 8.535382745787501} +{"Pretrain/Learning Rate": 3.058548716408658e-05, "Pretrain/Loss": 2.095435619354248, "Pretrain/Loss (Raw)": 2.0135867595672607, "Pretrain/Step": 4248, "Pretrain/Step Time": 8.538984213024378} +{"Pretrain/Learning Rate": 3.057721157276352e-05, "Pretrain/Loss": 2.0965046882629395, "Pretrain/Loss (Raw)": 2.1969523429870605, "Pretrain/Step": 4249, "Pretrain/Step Time": 8.539622522890568} +{"Pretrain/Learning Rate": 3.056893533825014e-05, "Pretrain/Loss": 2.095461845397949, "Pretrain/Loss (Raw)": 1.836977481842041, "Pretrain/Step": 4250, "Pretrain/Step Time": 8.53768377006054} +{"Pretrain/Learning Rate": 3.056065846150089e-05, "Pretrain/Loss": 2.0931715965270996, "Pretrain/Loss (Raw)": 1.944952130317688, "Pretrain/Step": 4251, "Pretrain/Step Time": 8.536290690302849} +{"Pretrain/Learning Rate": 3.0552380943470306e-05, "Pretrain/Loss": 2.0939650535583496, "Pretrain/Loss (Raw)": 2.0453717708587646, "Pretrain/Step": 4252, "Pretrain/Step Time": 8.542546892538667} +{"Pretrain/Learning Rate": 3.054410278511299e-05, "Pretrain/Loss": 2.0901575088500977, "Pretrain/Loss (Raw)": 1.963728904724121, "Pretrain/Step": 4253, "Pretrain/Step Time": 8.536928750574589} +{"Pretrain/Learning Rate": 3.053582398738362e-05, "Pretrain/Loss": 2.088644027709961, "Pretrain/Loss (Raw)": 2.0956592559814453, "Pretrain/Step": 4254, "Pretrain/Step Time": 8.537731017917395} +{"Pretrain/Learning Rate": 3.052754455123693e-05, "Pretrain/Loss": 2.0894150733947754, "Pretrain/Loss (Raw)": 2.3234357833862305, "Pretrain/Step": 4255, "Pretrain/Step Time": 8.538746029138565} +{"Pretrain/Learning Rate": 3.051926447762776e-05, "Pretrain/Loss": 2.0847201347351074, "Pretrain/Loss (Raw)": 1.9813292026519775, "Pretrain/Step": 4256, "Pretrain/Step Time": 8.542603785172105} +{"Pretrain/Learning Rate": 3.0510983767511007e-05, "Pretrain/Loss": 2.0862278938293457, "Pretrain/Loss (Raw)": 2.243396520614624, "Pretrain/Step": 4257, "Pretrain/Step Time": 8.547594889998436} +{"Pretrain/Learning Rate": 3.050270242184164e-05, "Pretrain/Loss": 2.090090751647949, "Pretrain/Loss (Raw)": 2.3047080039978027, "Pretrain/Step": 4258, "Pretrain/Step Time": 8.542556464672089} +{"Pretrain/Learning Rate": 3.049442044157469e-05, "Pretrain/Loss": 2.0872974395751953, "Pretrain/Loss (Raw)": 1.6846989393234253, "Pretrain/Step": 4259, "Pretrain/Step Time": 8.540750861167908} +{"Pretrain/Learning Rate": 3.0486137827665296e-05, "Pretrain/Loss": 2.088327169418335, "Pretrain/Loss (Raw)": 2.1447434425354004, "Pretrain/Step": 4260, "Pretrain/Step Time": 8.537572419270873} +{"Pretrain/Learning Rate": 3.0477854581068626e-05, "Pretrain/Loss": 2.084505319595337, "Pretrain/Loss (Raw)": 2.1154544353485107, "Pretrain/Step": 4261, "Pretrain/Step Time": 8.53919075243175} +{"Pretrain/Learning Rate": 3.0469570702739958e-05, "Pretrain/Loss": 2.084874153137207, "Pretrain/Loss (Raw)": 2.2424349784851074, "Pretrain/Step": 4262, "Pretrain/Step Time": 8.545342164114118} +{"Pretrain/Learning Rate": 3.0461286193634626e-05, "Pretrain/Loss": 2.081540584564209, "Pretrain/Loss (Raw)": 1.933161735534668, "Pretrain/Step": 4263, "Pretrain/Step Time": 8.540576193481684} +{"Pretrain/Learning Rate": 3.045300105470803e-05, "Pretrain/Loss": 2.080766201019287, "Pretrain/Loss (Raw)": 1.9156150817871094, "Pretrain/Step": 4264, "Pretrain/Step Time": 8.552374633029103} +{"Pretrain/Learning Rate": 3.0444715286915658e-05, "Pretrain/Loss": 2.0802760124206543, "Pretrain/Loss (Raw)": 2.0322299003601074, "Pretrain/Step": 4265, "Pretrain/Step Time": 8.543892905116081} +{"Pretrain/Learning Rate": 3.0436428891213063e-05, "Pretrain/Loss": 2.0815279483795166, "Pretrain/Loss (Raw)": 2.229715585708618, "Pretrain/Step": 4266, "Pretrain/Step Time": 8.545914966613054} +{"Pretrain/Learning Rate": 3.0428141868555875e-05, "Pretrain/Loss": 2.0841355323791504, "Pretrain/Loss (Raw)": 2.117173671722412, "Pretrain/Step": 4267, "Pretrain/Step Time": 8.544914443045855} +{"Pretrain/Learning Rate": 3.0419854219899786e-05, "Pretrain/Loss": 2.0838003158569336, "Pretrain/Loss (Raw)": 2.082242727279663, "Pretrain/Step": 4268, "Pretrain/Step Time": 8.546513248234987} +{"Pretrain/Learning Rate": 3.041156594620057e-05, "Pretrain/Loss": 2.0814645290374756, "Pretrain/Loss (Raw)": 2.159149408340454, "Pretrain/Step": 4269, "Pretrain/Step Time": 8.550237851217389} +{"Pretrain/Learning Rate": 3.0403277048414063e-05, "Pretrain/Loss": 2.082087993621826, "Pretrain/Loss (Raw)": 1.9984142780303955, "Pretrain/Step": 4270, "Pretrain/Step Time": 8.553535560145974} +{"Pretrain/Learning Rate": 3.0394987527496192e-05, "Pretrain/Loss": 2.0800726413726807, "Pretrain/Loss (Raw)": 1.7032071352005005, "Pretrain/Step": 4271, "Pretrain/Step Time": 8.54460751824081} +{"Pretrain/Learning Rate": 3.0386697384402935e-05, "Pretrain/Loss": 2.0826730728149414, "Pretrain/Loss (Raw)": 2.1871707439422607, "Pretrain/Step": 4272, "Pretrain/Step Time": 8.544322993606329} +{"Pretrain/Learning Rate": 3.0378406620090354e-05, "Pretrain/Loss": 2.081157684326172, "Pretrain/Loss (Raw)": 1.9335142374038696, "Pretrain/Step": 4273, "Pretrain/Step Time": 8.54825566150248} +{"Pretrain/Learning Rate": 3.0370115235514574e-05, "Pretrain/Loss": 2.0807957649230957, "Pretrain/Loss (Raw)": 2.03364634513855, "Pretrain/Step": 4274, "Pretrain/Step Time": 8.543478041887283} +{"Pretrain/Learning Rate": 3.036182323163181e-05, "Pretrain/Loss": 2.0787057876586914, "Pretrain/Loss (Raw)": 1.9946246147155762, "Pretrain/Step": 4275, "Pretrain/Step Time": 8.54573886655271} +{"Pretrain/Learning Rate": 3.0353530609398313e-05, "Pretrain/Loss": 2.07761287689209, "Pretrain/Loss (Raw)": 2.0317509174346924, "Pretrain/Step": 4276, "Pretrain/Step Time": 8.553588872775435} +{"Pretrain/Learning Rate": 3.0345237369770448e-05, "Pretrain/Loss": 2.078179359436035, "Pretrain/Loss (Raw)": 2.0848095417022705, "Pretrain/Step": 4277, "Pretrain/Step Time": 8.542120650410652} +{"Pretrain/Learning Rate": 3.0336943513704613e-05, "Pretrain/Loss": 2.076551914215088, "Pretrain/Loss (Raw)": 2.033263921737671, "Pretrain/Step": 4278, "Pretrain/Step Time": 8.543840359896421} +{"Pretrain/Learning Rate": 3.0328649042157315e-05, "Pretrain/Loss": 2.0769944190979004, "Pretrain/Loss (Raw)": 2.0088446140289307, "Pretrain/Step": 4279, "Pretrain/Step Time": 8.542960757389665} +{"Pretrain/Learning Rate": 3.0320353956085095e-05, "Pretrain/Loss": 2.0770304203033447, "Pretrain/Loss (Raw)": 2.1421010494232178, "Pretrain/Step": 4280, "Pretrain/Step Time": 8.541620744392276} +{"Pretrain/Learning Rate": 3.0312058256444587e-05, "Pretrain/Loss": 2.077096700668335, "Pretrain/Loss (Raw)": 2.0620357990264893, "Pretrain/Step": 4281, "Pretrain/Step Time": 8.545755891129375} +{"Pretrain/Learning Rate": 3.0303761944192488e-05, "Pretrain/Loss": 2.0748791694641113, "Pretrain/Loss (Raw)": 1.849475622177124, "Pretrain/Step": 4282, "Pretrain/Step Time": 8.548636751249433} +{"Pretrain/Learning Rate": 3.0295465020285567e-05, "Pretrain/Loss": 2.0766549110412598, "Pretrain/Loss (Raw)": 2.1206986904144287, "Pretrain/Step": 4283, "Pretrain/Step Time": 8.542237045243382} +{"Pretrain/Learning Rate": 3.0287167485680672e-05, "Pretrain/Loss": 2.074211359024048, "Pretrain/Loss (Raw)": 2.01278018951416, "Pretrain/Step": 4284, "Pretrain/Step Time": 8.54406094737351} +{"Pretrain/Learning Rate": 3.0278869341334702e-05, "Pretrain/Loss": 2.07572078704834, "Pretrain/Loss (Raw)": 2.1100451946258545, "Pretrain/Step": 4285, "Pretrain/Step Time": 8.54351869598031} +{"Pretrain/Learning Rate": 3.0270570588204655e-05, "Pretrain/Loss": 2.0756092071533203, "Pretrain/Loss (Raw)": 2.1256370544433594, "Pretrain/Step": 4286, "Pretrain/Step Time": 8.53866447135806} +{"Pretrain/Learning Rate": 3.0262271227247563e-05, "Pretrain/Loss": 2.076539993286133, "Pretrain/Loss (Raw)": 2.2214584350585938, "Pretrain/Step": 4287, "Pretrain/Step Time": 8.545049557462335} +{"Pretrain/Learning Rate": 3.025397125942056e-05, "Pretrain/Loss": 2.0773048400878906, "Pretrain/Loss (Raw)": 2.0648984909057617, "Pretrain/Step": 4288, "Pretrain/Step Time": 8.549904204905033} +{"Pretrain/Learning Rate": 3.0245670685680833e-05, "Pretrain/Loss": 2.076658010482788, "Pretrain/Loss (Raw)": 2.0951225757598877, "Pretrain/Step": 4289, "Pretrain/Step Time": 8.53994795680046} +{"Pretrain/Learning Rate": 3.0237369506985646e-05, "Pretrain/Loss": 2.0760374069213867, "Pretrain/Loss (Raw)": 2.0596470832824707, "Pretrain/Step": 4290, "Pretrain/Step Time": 8.542533963918686} +{"Pretrain/Learning Rate": 3.022906772429232e-05, "Pretrain/Loss": 2.0778255462646484, "Pretrain/Loss (Raw)": 2.1682546138763428, "Pretrain/Step": 4291, "Pretrain/Step Time": 8.540492596104741} +{"Pretrain/Learning Rate": 3.0220765338558278e-05, "Pretrain/Loss": 2.0760998725891113, "Pretrain/Loss (Raw)": 2.0362799167633057, "Pretrain/Step": 4292, "Pretrain/Step Time": 8.541554877534509} +{"Pretrain/Learning Rate": 3.021246235074096e-05, "Pretrain/Loss": 2.0748181343078613, "Pretrain/Loss (Raw)": 2.0441761016845703, "Pretrain/Step": 4293, "Pretrain/Step Time": 8.539045913144946} +{"Pretrain/Learning Rate": 3.0204158761797936e-05, "Pretrain/Loss": 2.072985887527466, "Pretrain/Loss (Raw)": 1.966300368309021, "Pretrain/Step": 4294, "Pretrain/Step Time": 8.542297713458538} +{"Pretrain/Learning Rate": 3.0195854572686793e-05, "Pretrain/Loss": 2.0725698471069336, "Pretrain/Loss (Raw)": 2.076442241668701, "Pretrain/Step": 4295, "Pretrain/Step Time": 8.538541158661246} +{"Pretrain/Learning Rate": 3.0187549784365214e-05, "Pretrain/Loss": 2.070993661880493, "Pretrain/Loss (Raw)": 1.9854512214660645, "Pretrain/Step": 4296, "Pretrain/Step Time": 8.547492621466517} +{"Pretrain/Learning Rate": 3.0179244397790956e-05, "Pretrain/Loss": 2.07157039642334, "Pretrain/Loss (Raw)": 2.1070852279663086, "Pretrain/Step": 4297, "Pretrain/Step Time": 8.548942308872938} +{"Pretrain/Learning Rate": 3.017093841392183e-05, "Pretrain/Loss": 2.0726544857025146, "Pretrain/Loss (Raw)": 2.1613285541534424, "Pretrain/Step": 4298, "Pretrain/Step Time": 8.546454211696982} +{"Pretrain/Learning Rate": 3.0162631833715715e-05, "Pretrain/Loss": 2.0707409381866455, "Pretrain/Loss (Raw)": 1.9458328485488892, "Pretrain/Step": 4299, "Pretrain/Step Time": 8.546456968411803} +{"Pretrain/Learning Rate": 3.0154324658130572e-05, "Pretrain/Loss": 2.0712666511535645, "Pretrain/Loss (Raw)": 2.1143527030944824, "Pretrain/Step": 4300, "Pretrain/Step Time": 8.551923125982285} +{"Pretrain/Learning Rate": 3.0146016888124423e-05, "Pretrain/Loss": 2.066314697265625, "Pretrain/Loss (Raw)": 1.91917884349823, "Pretrain/Step": 4301, "Pretrain/Step Time": 8.543709801509976} +{"Pretrain/Learning Rate": 3.013770852465535e-05, "Pretrain/Loss": 2.064863920211792, "Pretrain/Loss (Raw)": 1.9636592864990234, "Pretrain/Step": 4302, "Pretrain/Step Time": 8.544756351038814} +{"Pretrain/Learning Rate": 3.0129399568681533e-05, "Pretrain/Loss": 2.0648927688598633, "Pretrain/Loss (Raw)": 1.9723180532455444, "Pretrain/Step": 4303, "Pretrain/Step Time": 8.546148549765348} +{"Pretrain/Learning Rate": 3.0121090021161175e-05, "Pretrain/Loss": 2.06259822845459, "Pretrain/Loss (Raw)": 2.0764994621276855, "Pretrain/Step": 4304, "Pretrain/Step Time": 8.547930708155036} +{"Pretrain/Learning Rate": 3.0112779883052593e-05, "Pretrain/Loss": 2.0623116493225098, "Pretrain/Loss (Raw)": 1.928039789199829, "Pretrain/Step": 4305, "Pretrain/Step Time": 8.544163633137941} +{"Pretrain/Learning Rate": 3.010446915531414e-05, "Pretrain/Loss": 2.062817335128784, "Pretrain/Loss (Raw)": 2.1849520206451416, "Pretrain/Step": 4306, "Pretrain/Step Time": 8.55335247516632} +{"Pretrain/Learning Rate": 3.0096157838904247e-05, "Pretrain/Loss": 2.0628910064697266, "Pretrain/Loss (Raw)": 2.0087854862213135, "Pretrain/Step": 4307, "Pretrain/Step Time": 8.541998274624348} +{"Pretrain/Learning Rate": 3.0087845934781424e-05, "Pretrain/Loss": 2.06611967086792, "Pretrain/Loss (Raw)": 2.2749550342559814, "Pretrain/Step": 4308, "Pretrain/Step Time": 8.5460553355515} +{"Pretrain/Learning Rate": 3.0079533443904227e-05, "Pretrain/Loss": 2.066767930984497, "Pretrain/Loss (Raw)": 2.1598031520843506, "Pretrain/Step": 4309, "Pretrain/Step Time": 8.548425937071443} +{"Pretrain/Learning Rate": 3.0071220367231306e-05, "Pretrain/Loss": 2.066723346710205, "Pretrain/Loss (Raw)": 2.0461575984954834, "Pretrain/Step": 4310, "Pretrain/Step Time": 8.547117363661528} +{"Pretrain/Learning Rate": 3.006290670572135e-05, "Pretrain/Loss": 2.0673491954803467, "Pretrain/Loss (Raw)": 1.9647867679595947, "Pretrain/Step": 4311, "Pretrain/Step Time": 8.549673857167363} +{"Pretrain/Learning Rate": 3.0054592460333137e-05, "Pretrain/Loss": 2.065906047821045, "Pretrain/Loss (Raw)": 2.194141387939453, "Pretrain/Step": 4312, "Pretrain/Step Time": 8.558440275490284} +{"Pretrain/Learning Rate": 3.00462776320255e-05, "Pretrain/Loss": 2.0639796257019043, "Pretrain/Loss (Raw)": 2.013747453689575, "Pretrain/Step": 4313, "Pretrain/Step Time": 8.554326422512531} +{"Pretrain/Learning Rate": 3.0037962221757354e-05, "Pretrain/Loss": 2.064507484436035, "Pretrain/Loss (Raw)": 2.116001605987549, "Pretrain/Step": 4314, "Pretrain/Step Time": 8.551639696583152} +{"Pretrain/Learning Rate": 3.0029646230487657e-05, "Pretrain/Loss": 2.066795825958252, "Pretrain/Loss (Raw)": 2.261936664581299, "Pretrain/Step": 4315, "Pretrain/Step Time": 8.545709375292063} +{"Pretrain/Learning Rate": 3.002132965917547e-05, "Pretrain/Loss": 2.065587043762207, "Pretrain/Loss (Raw)": 2.0004827976226807, "Pretrain/Step": 4316, "Pretrain/Step Time": 8.549652431160212} +{"Pretrain/Learning Rate": 3.001301250877987e-05, "Pretrain/Loss": 2.0695624351501465, "Pretrain/Loss (Raw)": 2.4999701976776123, "Pretrain/Step": 4317, "Pretrain/Step Time": 8.551355376839638} +{"Pretrain/Learning Rate": 3.000469478026005e-05, "Pretrain/Loss": 2.069972515106201, "Pretrain/Loss (Raw)": 2.057661294937134, "Pretrain/Step": 4318, "Pretrain/Step Time": 8.55029721558094} +{"Pretrain/Learning Rate": 2.9996376474575244e-05, "Pretrain/Loss": 2.069911479949951, "Pretrain/Loss (Raw)": 2.23046875, "Pretrain/Step": 4319, "Pretrain/Step Time": 8.541370807215571} +{"Pretrain/Learning Rate": 2.9988057592684766e-05, "Pretrain/Loss": 2.0714502334594727, "Pretrain/Loss (Raw)": 2.1610608100891113, "Pretrain/Step": 4320, "Pretrain/Step Time": 8.545315224677324} +{"Pretrain/Learning Rate": 2.9979738135547973e-05, "Pretrain/Loss": 2.071397066116333, "Pretrain/Loss (Raw)": 2.1263654232025146, "Pretrain/Step": 4321, "Pretrain/Step Time": 8.538102572783828} +{"Pretrain/Learning Rate": 2.9971418104124322e-05, "Pretrain/Loss": 2.0710930824279785, "Pretrain/Loss (Raw)": 2.1803677082061768, "Pretrain/Step": 4322, "Pretrain/Step Time": 8.541982429102063} +{"Pretrain/Learning Rate": 2.9963097499373312e-05, "Pretrain/Loss": 2.069518566131592, "Pretrain/Loss (Raw)": 1.9000625610351562, "Pretrain/Step": 4323, "Pretrain/Step Time": 8.54481934197247} +{"Pretrain/Learning Rate": 2.9954776322254495e-05, "Pretrain/Loss": 2.067420482635498, "Pretrain/Loss (Raw)": 2.0904879570007324, "Pretrain/Step": 4324, "Pretrain/Step Time": 8.549016514793038} +{"Pretrain/Learning Rate": 2.994645457372754e-05, "Pretrain/Loss": 2.0667223930358887, "Pretrain/Loss (Raw)": 2.0360658168792725, "Pretrain/Step": 4325, "Pretrain/Step Time": 8.540517842397094} +{"Pretrain/Learning Rate": 2.9938132254752126e-05, "Pretrain/Loss": 2.064601421356201, "Pretrain/Loss (Raw)": 1.8620821237564087, "Pretrain/Step": 4326, "Pretrain/Step Time": 8.539261613041162} +{"Pretrain/Learning Rate": 2.9929809366288035e-05, "Pretrain/Loss": 2.0665602684020996, "Pretrain/Loss (Raw)": 2.1841061115264893, "Pretrain/Step": 4327, "Pretrain/Step Time": 8.545490954071283} +{"Pretrain/Learning Rate": 2.99214859092951e-05, "Pretrain/Loss": 2.0685267448425293, "Pretrain/Loss (Raw)": 2.185462236404419, "Pretrain/Step": 4328, "Pretrain/Step Time": 8.53864124789834} +{"Pretrain/Learning Rate": 2.9913161884733215e-05, "Pretrain/Loss": 2.0718698501586914, "Pretrain/Loss (Raw)": 2.5579779148101807, "Pretrain/Step": 4329, "Pretrain/Step Time": 8.549718283116817} +{"Pretrain/Learning Rate": 2.9904837293562348e-05, "Pretrain/Loss": 2.070099115371704, "Pretrain/Loss (Raw)": 1.8485982418060303, "Pretrain/Step": 4330, "Pretrain/Step Time": 8.557039799168706} +{"Pretrain/Learning Rate": 2.989651213674254e-05, "Pretrain/Loss": 2.071636199951172, "Pretrain/Loss (Raw)": 2.126972198486328, "Pretrain/Step": 4331, "Pretrain/Step Time": 8.542917914688587} +{"Pretrain/Learning Rate": 2.988818641523387e-05, "Pretrain/Loss": 2.070556640625, "Pretrain/Loss (Raw)": 2.120349645614624, "Pretrain/Step": 4332, "Pretrain/Step Time": 8.545964969322085} +{"Pretrain/Learning Rate": 2.9879860129996517e-05, "Pretrain/Loss": 2.0719122886657715, "Pretrain/Loss (Raw)": 2.0788414478302, "Pretrain/Step": 4333, "Pretrain/Step Time": 8.545755580067635} +{"Pretrain/Learning Rate": 2.9871533281990692e-05, "Pretrain/Loss": 2.0725290775299072, "Pretrain/Loss (Raw)": 2.1659018993377686, "Pretrain/Step": 4334, "Pretrain/Step Time": 8.545956045389175} +{"Pretrain/Learning Rate": 2.9863205872176703e-05, "Pretrain/Loss": 2.0729012489318848, "Pretrain/Loss (Raw)": 2.128469467163086, "Pretrain/Step": 4335, "Pretrain/Step Time": 8.546775413677096} +{"Pretrain/Learning Rate": 2.9854877901514884e-05, "Pretrain/Loss": 2.0717973709106445, "Pretrain/Loss (Raw)": 2.1286303997039795, "Pretrain/Step": 4336, "Pretrain/Step Time": 8.546889524906874} +{"Pretrain/Learning Rate": 2.9846549370965672e-05, "Pretrain/Loss": 2.0716958045959473, "Pretrain/Loss (Raw)": 2.0001301765441895, "Pretrain/Step": 4337, "Pretrain/Step Time": 8.544081721454859} +{"Pretrain/Learning Rate": 2.9838220281489553e-05, "Pretrain/Loss": 2.0715112686157227, "Pretrain/Loss (Raw)": 2.089409351348877, "Pretrain/Step": 4338, "Pretrain/Step Time": 8.550264155492187} +{"Pretrain/Learning Rate": 2.9829890634047068e-05, "Pretrain/Loss": 2.0734987258911133, "Pretrain/Loss (Raw)": 2.1827335357666016, "Pretrain/Step": 4339, "Pretrain/Step Time": 8.54641748778522} +{"Pretrain/Learning Rate": 2.9821560429598844e-05, "Pretrain/Loss": 2.0736663341522217, "Pretrain/Loss (Raw)": 2.154623031616211, "Pretrain/Step": 4340, "Pretrain/Step Time": 8.543357225134969} +{"Pretrain/Learning Rate": 2.9813229669105546e-05, "Pretrain/Loss": 2.074120044708252, "Pretrain/Loss (Raw)": 2.116824150085449, "Pretrain/Step": 4341, "Pretrain/Step Time": 8.546867869794369} +{"Pretrain/Learning Rate": 2.9804898353527928e-05, "Pretrain/Loss": 2.074007987976074, "Pretrain/Loss (Raw)": 2.007819175720215, "Pretrain/Step": 4342, "Pretrain/Step Time": 8.554560316726565} +{"Pretrain/Learning Rate": 2.9796566483826777e-05, "Pretrain/Loss": 2.075240135192871, "Pretrain/Loss (Raw)": 2.100358724594116, "Pretrain/Step": 4343, "Pretrain/Step Time": 8.549897395074368} +{"Pretrain/Learning Rate": 2.9788234060962988e-05, "Pretrain/Loss": 2.076922655105591, "Pretrain/Loss (Raw)": 2.1759707927703857, "Pretrain/Step": 4344, "Pretrain/Step Time": 8.54902751185} +{"Pretrain/Learning Rate": 2.9779901085897478e-05, "Pretrain/Loss": 2.0759763717651367, "Pretrain/Loss (Raw)": 1.997916340827942, "Pretrain/Step": 4345, "Pretrain/Step Time": 8.54872558452189} +{"Pretrain/Learning Rate": 2.9771567559591257e-05, "Pretrain/Loss": 2.0750601291656494, "Pretrain/Loss (Raw)": 1.9894105195999146, "Pretrain/Step": 4346, "Pretrain/Step Time": 8.544934812933207} +{"Pretrain/Learning Rate": 2.9763233483005383e-05, "Pretrain/Loss": 2.075045585632324, "Pretrain/Loss (Raw)": 2.016843318939209, "Pretrain/Step": 4347, "Pretrain/Step Time": 8.550046745687723} +{"Pretrain/Learning Rate": 2.975489885710097e-05, "Pretrain/Loss": 2.0739431381225586, "Pretrain/Loss (Raw)": 2.0727880001068115, "Pretrain/Step": 4348, "Pretrain/Step Time": 8.558642281219363} +{"Pretrain/Learning Rate": 2.9746563682839225e-05, "Pretrain/Loss": 2.0711913108825684, "Pretrain/Loss (Raw)": 2.0185561180114746, "Pretrain/Step": 4349, "Pretrain/Step Time": 8.549461143091321} +{"Pretrain/Learning Rate": 2.9738227961181374e-05, "Pretrain/Loss": 2.0726773738861084, "Pretrain/Loss (Raw)": 2.0922152996063232, "Pretrain/Step": 4350, "Pretrain/Step Time": 8.547967106103897} +{"Pretrain/Learning Rate": 2.972989169308876e-05, "Pretrain/Loss": 2.0720221996307373, "Pretrain/Loss (Raw)": 2.0931973457336426, "Pretrain/Step": 4351, "Pretrain/Step Time": 8.548005560413003} +{"Pretrain/Learning Rate": 2.9721554879522743e-05, "Pretrain/Loss": 2.07084321975708, "Pretrain/Loss (Raw)": 2.009284734725952, "Pretrain/Step": 4352, "Pretrain/Step Time": 8.54266550205648} +{"Pretrain/Learning Rate": 2.9713217521444774e-05, "Pretrain/Loss": 2.073517084121704, "Pretrain/Loss (Raw)": 2.1606431007385254, "Pretrain/Step": 4353, "Pretrain/Step Time": 8.547628967091441} +{"Pretrain/Learning Rate": 2.9704879619816346e-05, "Pretrain/Loss": 2.076829433441162, "Pretrain/Loss (Raw)": 2.2237331867218018, "Pretrain/Step": 4354, "Pretrain/Step Time": 8.555449401959777} +{"Pretrain/Learning Rate": 2.969654117559903e-05, "Pretrain/Loss": 2.076261520385742, "Pretrain/Loss (Raw)": 2.1619107723236084, "Pretrain/Step": 4355, "Pretrain/Step Time": 8.550919409841299} +{"Pretrain/Learning Rate": 2.9688202189754456e-05, "Pretrain/Loss": 2.0777266025543213, "Pretrain/Loss (Raw)": 2.1190102100372314, "Pretrain/Step": 4356, "Pretrain/Step Time": 8.548718037083745} +{"Pretrain/Learning Rate": 2.9679862663244317e-05, "Pretrain/Loss": 2.0783634185791016, "Pretrain/Loss (Raw)": 2.1281914710998535, "Pretrain/Step": 4357, "Pretrain/Step Time": 8.548603678122163} +{"Pretrain/Learning Rate": 2.9671522597030355e-05, "Pretrain/Loss": 2.0770444869995117, "Pretrain/Loss (Raw)": 2.0078423023223877, "Pretrain/Step": 4358, "Pretrain/Step Time": 8.547201609238982} +{"Pretrain/Learning Rate": 2.9663181992074402e-05, "Pretrain/Loss": 2.0755300521850586, "Pretrain/Loss (Raw)": 1.9601637125015259, "Pretrain/Step": 4359, "Pretrain/Step Time": 8.54578741826117} +{"Pretrain/Learning Rate": 2.9654840849338322e-05, "Pretrain/Loss": 2.076155185699463, "Pretrain/Loss (Raw)": 2.178426504135132, "Pretrain/Step": 4360, "Pretrain/Step Time": 8.557225074619055} +{"Pretrain/Learning Rate": 2.964649916978407e-05, "Pretrain/Loss": 2.075592279434204, "Pretrain/Loss (Raw)": 2.0257318019866943, "Pretrain/Step": 4361, "Pretrain/Step Time": 8.551699977368116} +{"Pretrain/Learning Rate": 2.963815695437363e-05, "Pretrain/Loss": 2.076596260070801, "Pretrain/Loss (Raw)": 1.9756861925125122, "Pretrain/Step": 4362, "Pretrain/Step Time": 8.552932130172849} +{"Pretrain/Learning Rate": 2.962981420406908e-05, "Pretrain/Loss": 2.0748536586761475, "Pretrain/Loss (Raw)": 1.9414116144180298, "Pretrain/Step": 4363, "Pretrain/Step Time": 8.550519717857242} +{"Pretrain/Learning Rate": 2.9621470919832538e-05, "Pretrain/Loss": 2.073336601257324, "Pretrain/Loss (Raw)": 1.9243779182434082, "Pretrain/Step": 4364, "Pretrain/Step Time": 8.554172044619918} +{"Pretrain/Learning Rate": 2.9613127102626187e-05, "Pretrain/Loss": 2.0746243000030518, "Pretrain/Loss (Raw)": 1.9278576374053955, "Pretrain/Step": 4365, "Pretrain/Step Time": 8.553067523986101} +{"Pretrain/Learning Rate": 2.9604782753412292e-05, "Pretrain/Loss": 2.0718915462493896, "Pretrain/Loss (Raw)": 1.7501634359359741, "Pretrain/Step": 4366, "Pretrain/Step Time": 8.559507220983505} +{"Pretrain/Learning Rate": 2.9596437873153137e-05, "Pretrain/Loss": 2.068881034851074, "Pretrain/Loss (Raw)": 1.8777079582214355, "Pretrain/Step": 4367, "Pretrain/Step Time": 8.549120733514428} +{"Pretrain/Learning Rate": 2.9588092462811122e-05, "Pretrain/Loss": 2.068753719329834, "Pretrain/Loss (Raw)": 2.1354897022247314, "Pretrain/Step": 4368, "Pretrain/Step Time": 8.546755390241742} +{"Pretrain/Learning Rate": 2.957974652334865e-05, "Pretrain/Loss": 2.0666046142578125, "Pretrain/Loss (Raw)": 2.013582229614258, "Pretrain/Step": 4369, "Pretrain/Step Time": 8.547120241448283} +{"Pretrain/Learning Rate": 2.9571400055728242e-05, "Pretrain/Loss": 2.066488265991211, "Pretrain/Loss (Raw)": 2.000255584716797, "Pretrain/Step": 4370, "Pretrain/Step Time": 8.549611734226346} +{"Pretrain/Learning Rate": 2.9563053060912426e-05, "Pretrain/Loss": 2.0686545372009277, "Pretrain/Loss (Raw)": 2.203782081604004, "Pretrain/Step": 4371, "Pretrain/Step Time": 8.546410819515586} +{"Pretrain/Learning Rate": 2.9554705539863842e-05, "Pretrain/Loss": 2.0713000297546387, "Pretrain/Loss (Raw)": 2.3026442527770996, "Pretrain/Step": 4372, "Pretrain/Step Time": 8.54903874732554} +{"Pretrain/Learning Rate": 2.954635749354514e-05, "Pretrain/Loss": 2.0700294971466064, "Pretrain/Loss (Raw)": 1.7927230596542358, "Pretrain/Step": 4373, "Pretrain/Step Time": 8.550421914085746} +{"Pretrain/Learning Rate": 2.953800892291908e-05, "Pretrain/Loss": 2.0682740211486816, "Pretrain/Loss (Raw)": 1.8954569101333618, "Pretrain/Step": 4374, "Pretrain/Step Time": 8.552830001339316} +{"Pretrain/Learning Rate": 2.9529659828948442e-05, "Pretrain/Loss": 2.069880962371826, "Pretrain/Loss (Raw)": 2.279167413711548, "Pretrain/Step": 4375, "Pretrain/Step Time": 8.549942215904593} +{"Pretrain/Learning Rate": 2.9521310212596087e-05, "Pretrain/Loss": 2.0734548568725586, "Pretrain/Loss (Raw)": 2.471052646636963, "Pretrain/Step": 4376, "Pretrain/Step Time": 8.550588531419635} +{"Pretrain/Learning Rate": 2.951296007482493e-05, "Pretrain/Loss": 2.074009418487549, "Pretrain/Loss (Raw)": 2.2679336071014404, "Pretrain/Step": 4377, "Pretrain/Step Time": 8.549855060875416} +{"Pretrain/Learning Rate": 2.9504609416597956e-05, "Pretrain/Loss": 2.07572865486145, "Pretrain/Loss (Raw)": 2.057041883468628, "Pretrain/Step": 4378, "Pretrain/Step Time": 8.550256544724107} +{"Pretrain/Learning Rate": 2.9496258238878198e-05, "Pretrain/Loss": 2.075113296508789, "Pretrain/Loss (Raw)": 1.8661731481552124, "Pretrain/Step": 4379, "Pretrain/Step Time": 8.556293867528439} +{"Pretrain/Learning Rate": 2.9487906542628753e-05, "Pretrain/Loss": 2.0757758617401123, "Pretrain/Loss (Raw)": 2.1301753520965576, "Pretrain/Step": 4380, "Pretrain/Step Time": 8.553755244240165} +{"Pretrain/Learning Rate": 2.9479554328812775e-05, "Pretrain/Loss": 2.0762553215026855, "Pretrain/Loss (Raw)": 2.025110960006714, "Pretrain/Step": 4381, "Pretrain/Step Time": 8.55183531716466} +{"Pretrain/Learning Rate": 2.9471201598393482e-05, "Pretrain/Loss": 2.075453281402588, "Pretrain/Loss (Raw)": 1.9929791688919067, "Pretrain/Step": 4382, "Pretrain/Step Time": 8.551176346838474} +{"Pretrain/Learning Rate": 2.946284835233416e-05, "Pretrain/Loss": 2.072885036468506, "Pretrain/Loss (Raw)": 1.9947261810302734, "Pretrain/Step": 4383, "Pretrain/Step Time": 8.552230479195714} +{"Pretrain/Learning Rate": 2.945449459159813e-05, "Pretrain/Loss": 2.077700614929199, "Pretrain/Loss (Raw)": 2.597696304321289, "Pretrain/Step": 4384, "Pretrain/Step Time": 8.546203842386603} +{"Pretrain/Learning Rate": 2.9446140317148795e-05, "Pretrain/Loss": 2.0770888328552246, "Pretrain/Loss (Raw)": 2.165137529373169, "Pretrain/Step": 4385, "Pretrain/Step Time": 8.549769824370742} +{"Pretrain/Learning Rate": 2.9437785529949606e-05, "Pretrain/Loss": 2.0741348266601562, "Pretrain/Loss (Raw)": 1.9265674352645874, "Pretrain/Step": 4386, "Pretrain/Step Time": 8.556241085752845} +{"Pretrain/Learning Rate": 2.9429430230964084e-05, "Pretrain/Loss": 2.0783371925354004, "Pretrain/Loss (Raw)": 2.22259783744812, "Pretrain/Step": 4387, "Pretrain/Step Time": 8.547229429706931} +{"Pretrain/Learning Rate": 2.9421074421155787e-05, "Pretrain/Loss": 2.0780029296875, "Pretrain/Loss (Raw)": 2.1019387245178223, "Pretrain/Step": 4388, "Pretrain/Step Time": 8.550018522888422} +{"Pretrain/Learning Rate": 2.9412718101488364e-05, "Pretrain/Loss": 2.081712484359741, "Pretrain/Loss (Raw)": 2.5902998447418213, "Pretrain/Step": 4389, "Pretrain/Step Time": 8.550416009500623} +{"Pretrain/Learning Rate": 2.9404361272925497e-05, "Pretrain/Loss": 2.0776829719543457, "Pretrain/Loss (Raw)": 1.7266546487808228, "Pretrain/Step": 4390, "Pretrain/Step Time": 8.54574759490788} +{"Pretrain/Learning Rate": 2.939600393643092e-05, "Pretrain/Loss": 2.0778732299804688, "Pretrain/Loss (Raw)": 1.9575445652008057, "Pretrain/Step": 4391, "Pretrain/Step Time": 8.557178450748324} +{"Pretrain/Learning Rate": 2.9387646092968468e-05, "Pretrain/Loss": 2.0796988010406494, "Pretrain/Loss (Raw)": 2.149259328842163, "Pretrain/Step": 4392, "Pretrain/Step Time": 8.546117244288325} +{"Pretrain/Learning Rate": 2.9379287743501983e-05, "Pretrain/Loss": 2.080742359161377, "Pretrain/Loss (Raw)": 2.1658031940460205, "Pretrain/Step": 4393, "Pretrain/Step Time": 8.544662414118648} +{"Pretrain/Learning Rate": 2.9370928888995407e-05, "Pretrain/Loss": 2.0784077644348145, "Pretrain/Loss (Raw)": 1.930885910987854, "Pretrain/Step": 4394, "Pretrain/Step Time": 8.546710966154933} +{"Pretrain/Learning Rate": 2.936256953041271e-05, "Pretrain/Loss": 2.0773332118988037, "Pretrain/Loss (Raw)": 1.9796518087387085, "Pretrain/Step": 4395, "Pretrain/Step Time": 8.546811955049634} +{"Pretrain/Learning Rate": 2.935420966871795e-05, "Pretrain/Loss": 2.076608896255493, "Pretrain/Loss (Raw)": 1.9895105361938477, "Pretrain/Step": 4396, "Pretrain/Step Time": 8.552384309470654} +{"Pretrain/Learning Rate": 2.9345849304875195e-05, "Pretrain/Loss": 2.0768661499023438, "Pretrain/Loss (Raw)": 2.192103624343872, "Pretrain/Step": 4397, "Pretrain/Step Time": 8.549742659553885} +{"Pretrain/Learning Rate": 2.9337488439848633e-05, "Pretrain/Loss": 2.075282096862793, "Pretrain/Loss (Raw)": 1.795654535293579, "Pretrain/Step": 4398, "Pretrain/Step Time": 8.545941703021526} +{"Pretrain/Learning Rate": 2.9329127074602458e-05, "Pretrain/Loss": 2.0775623321533203, "Pretrain/Loss (Raw)": 1.9950698614120483, "Pretrain/Step": 4399, "Pretrain/Step Time": 8.550202399492264} +{"Pretrain/Learning Rate": 2.9320765210100952e-05, "Pretrain/Loss": 2.075838565826416, "Pretrain/Loss (Raw)": 1.9664970636367798, "Pretrain/Step": 4400, "Pretrain/Step Time": 8.550988165661693} +{"Pretrain/Learning Rate": 2.931240284730844e-05, "Pretrain/Loss": 2.076261520385742, "Pretrain/Loss (Raw)": 1.9876948595046997, "Pretrain/Step": 4401, "Pretrain/Step Time": 8.547260550782084} +{"Pretrain/Learning Rate": 2.9304039987189313e-05, "Pretrain/Loss": 2.07747220993042, "Pretrain/Loss (Raw)": 2.188589096069336, "Pretrain/Step": 4402, "Pretrain/Step Time": 8.54785137809813} +{"Pretrain/Learning Rate": 2.9295676630708013e-05, "Pretrain/Loss": 2.0784542560577393, "Pretrain/Loss (Raw)": 2.1203360557556152, "Pretrain/Step": 4403, "Pretrain/Step Time": 8.548711890354753} +{"Pretrain/Learning Rate": 2.9287312778829047e-05, "Pretrain/Loss": 2.0797972679138184, "Pretrain/Loss (Raw)": 2.2036468982696533, "Pretrain/Step": 4404, "Pretrain/Step Time": 8.54803261719644} +{"Pretrain/Learning Rate": 2.9278948432516968e-05, "Pretrain/Loss": 2.0799546241760254, "Pretrain/Loss (Raw)": 2.104940176010132, "Pretrain/Step": 4405, "Pretrain/Step Time": 8.552576903253794} +{"Pretrain/Learning Rate": 2.9270583592736385e-05, "Pretrain/Loss": 2.079928398132324, "Pretrain/Loss (Raw)": 2.0299196243286133, "Pretrain/Step": 4406, "Pretrain/Step Time": 8.54804727807641} +{"Pretrain/Learning Rate": 2.9262218260451984e-05, "Pretrain/Loss": 2.0801947116851807, "Pretrain/Loss (Raw)": 2.042959451675415, "Pretrain/Step": 4407, "Pretrain/Step Time": 8.553528049960732} +{"Pretrain/Learning Rate": 2.9253852436628483e-05, "Pretrain/Loss": 2.079854965209961, "Pretrain/Loss (Raw)": 2.098595142364502, "Pretrain/Step": 4408, "Pretrain/Step Time": 8.55376604013145} +{"Pretrain/Learning Rate": 2.924548612223068e-05, "Pretrain/Loss": 2.079427719116211, "Pretrain/Loss (Raw)": 2.007354259490967, "Pretrain/Step": 4409, "Pretrain/Step Time": 8.55761898867786} +{"Pretrain/Learning Rate": 2.923711931822341e-05, "Pretrain/Loss": 2.08147931098938, "Pretrain/Loss (Raw)": 2.1120810508728027, "Pretrain/Step": 4410, "Pretrain/Step Time": 8.553189070895314} +{"Pretrain/Learning Rate": 2.9228752025571575e-05, "Pretrain/Loss": 2.0819191932678223, "Pretrain/Loss (Raw)": 2.17699933052063, "Pretrain/Step": 4411, "Pretrain/Step Time": 8.555372698232532} +{"Pretrain/Learning Rate": 2.922038424524013e-05, "Pretrain/Loss": 2.0823605060577393, "Pretrain/Loss (Raw)": 2.069270610809326, "Pretrain/Step": 4412, "Pretrain/Step Time": 8.557530328631401} +{"Pretrain/Learning Rate": 2.9212015978194083e-05, "Pretrain/Loss": 2.0806596279144287, "Pretrain/Loss (Raw)": 1.8923122882843018, "Pretrain/Step": 4413, "Pretrain/Step Time": 8.555796401575208} +{"Pretrain/Learning Rate": 2.920364722539851e-05, "Pretrain/Loss": 2.078212261199951, "Pretrain/Loss (Raw)": 1.8123869895935059, "Pretrain/Step": 4414, "Pretrain/Step Time": 8.560118168592453} +{"Pretrain/Learning Rate": 2.9195277987818533e-05, "Pretrain/Loss": 2.0757129192352295, "Pretrain/Loss (Raw)": 1.901537299156189, "Pretrain/Step": 4415, "Pretrain/Step Time": 8.562887677922845} +{"Pretrain/Learning Rate": 2.918690826641932e-05, "Pretrain/Loss": 2.075566530227661, "Pretrain/Loss (Raw)": 2.046170473098755, "Pretrain/Step": 4416, "Pretrain/Step Time": 8.549596197903156} +{"Pretrain/Learning Rate": 2.917853806216613e-05, "Pretrain/Loss": 2.0754904747009277, "Pretrain/Loss (Raw)": 2.0853934288024902, "Pretrain/Step": 4417, "Pretrain/Step Time": 8.554372793063521} +{"Pretrain/Learning Rate": 2.9170167376024228e-05, "Pretrain/Loss": 2.076545238494873, "Pretrain/Loss (Raw)": 2.19466495513916, "Pretrain/Step": 4418, "Pretrain/Step Time": 8.555784249678254} +{"Pretrain/Learning Rate": 2.9161796208958974e-05, "Pretrain/Loss": 2.075911521911621, "Pretrain/Loss (Raw)": 2.0871331691741943, "Pretrain/Step": 4419, "Pretrain/Step Time": 8.557558696717024} +{"Pretrain/Learning Rate": 2.9153424561935782e-05, "Pretrain/Loss": 2.076596736907959, "Pretrain/Loss (Raw)": 2.1239988803863525, "Pretrain/Step": 4420, "Pretrain/Step Time": 8.556713255122304} +{"Pretrain/Learning Rate": 2.914505243592009e-05, "Pretrain/Loss": 2.076838731765747, "Pretrain/Loss (Raw)": 2.0751068592071533, "Pretrain/Step": 4421, "Pretrain/Step Time": 8.559302331879735} +{"Pretrain/Learning Rate": 2.913667983187742e-05, "Pretrain/Loss": 2.0778698921203613, "Pretrain/Loss (Raw)": 2.0982935428619385, "Pretrain/Step": 4422, "Pretrain/Step Time": 8.556365344673395} +{"Pretrain/Learning Rate": 2.9128306750773338e-05, "Pretrain/Loss": 2.0773158073425293, "Pretrain/Loss (Raw)": 2.005566358566284, "Pretrain/Step": 4423, "Pretrain/Step Time": 8.558839214965701} +{"Pretrain/Learning Rate": 2.911993319357347e-05, "Pretrain/Loss": 2.0791897773742676, "Pretrain/Loss (Raw)": 2.225308418273926, "Pretrain/Step": 4424, "Pretrain/Step Time": 8.553127260878682} +{"Pretrain/Learning Rate": 2.911155916124349e-05, "Pretrain/Loss": 2.0790257453918457, "Pretrain/Loss (Raw)": 2.0860347747802734, "Pretrain/Step": 4425, "Pretrain/Step Time": 8.547956503927708} +{"Pretrain/Learning Rate": 2.910318465474914e-05, "Pretrain/Loss": 2.077338695526123, "Pretrain/Loss (Raw)": 1.945414662361145, "Pretrain/Step": 4426, "Pretrain/Step Time": 8.548729015514255} +{"Pretrain/Learning Rate": 2.9094809675056188e-05, "Pretrain/Loss": 2.0773744583129883, "Pretrain/Loss (Raw)": 1.9504015445709229, "Pretrain/Step": 4427, "Pretrain/Step Time": 8.55649345740676} +{"Pretrain/Learning Rate": 2.9086434223130504e-05, "Pretrain/Loss": 2.0777502059936523, "Pretrain/Loss (Raw)": 2.1624796390533447, "Pretrain/Step": 4428, "Pretrain/Step Time": 8.547542788088322} +{"Pretrain/Learning Rate": 2.9078058299937962e-05, "Pretrain/Loss": 2.0779173374176025, "Pretrain/Loss (Raw)": 1.940544605255127, "Pretrain/Step": 4429, "Pretrain/Step Time": 8.546180248260498} +{"Pretrain/Learning Rate": 2.9069681906444518e-05, "Pretrain/Loss": 2.0779194831848145, "Pretrain/Loss (Raw)": 1.9639217853546143, "Pretrain/Step": 4430, "Pretrain/Step Time": 8.54830170981586} +{"Pretrain/Learning Rate": 2.906130504361619e-05, "Pretrain/Loss": 2.078835964202881, "Pretrain/Loss (Raw)": 2.0896620750427246, "Pretrain/Step": 4431, "Pretrain/Step Time": 8.544234953820705} +{"Pretrain/Learning Rate": 2.9052927712419013e-05, "Pretrain/Loss": 2.078216075897217, "Pretrain/Loss (Raw)": 1.9971716403961182, "Pretrain/Step": 4432, "Pretrain/Step Time": 8.544272236526012} +{"Pretrain/Learning Rate": 2.9044549913819124e-05, "Pretrain/Loss": 2.0792346000671387, "Pretrain/Loss (Raw)": 2.0583653450012207, "Pretrain/Step": 4433, "Pretrain/Step Time": 8.55161384679377} +{"Pretrain/Learning Rate": 2.9036171648782672e-05, "Pretrain/Loss": 2.0781471729278564, "Pretrain/Loss (Raw)": 2.0457870960235596, "Pretrain/Step": 4434, "Pretrain/Step Time": 8.544850764796138} +{"Pretrain/Learning Rate": 2.9027792918275894e-05, "Pretrain/Loss": 2.079155206680298, "Pretrain/Loss (Raw)": 2.1378064155578613, "Pretrain/Step": 4435, "Pretrain/Step Time": 8.549820287153125} +{"Pretrain/Learning Rate": 2.9019413723265053e-05, "Pretrain/Loss": 2.076951503753662, "Pretrain/Loss (Raw)": 1.992864966392517, "Pretrain/Step": 4436, "Pretrain/Step Time": 8.546680841594934} +{"Pretrain/Learning Rate": 2.9011034064716485e-05, "Pretrain/Loss": 2.0780978202819824, "Pretrain/Loss (Raw)": 2.3065450191497803, "Pretrain/Step": 4437, "Pretrain/Step Time": 8.544951563701034} +{"Pretrain/Learning Rate": 2.9002653943596564e-05, "Pretrain/Loss": 2.0780394077301025, "Pretrain/Loss (Raw)": 2.0386760234832764, "Pretrain/Step": 4438, "Pretrain/Step Time": 8.54643645696342} +{"Pretrain/Learning Rate": 2.8994273360871734e-05, "Pretrain/Loss": 2.079080104827881, "Pretrain/Loss (Raw)": 2.097982883453369, "Pretrain/Step": 4439, "Pretrain/Step Time": 8.552447404712439} +{"Pretrain/Learning Rate": 2.898589231750847e-05, "Pretrain/Loss": 2.0788612365722656, "Pretrain/Loss (Raw)": 2.166163444519043, "Pretrain/Step": 4440, "Pretrain/Step Time": 8.542191632091999} +{"Pretrain/Learning Rate": 2.897751081447333e-05, "Pretrain/Loss": 2.0792903900146484, "Pretrain/Loss (Raw)": 2.0686631202697754, "Pretrain/Step": 4441, "Pretrain/Step Time": 8.547638285905123} +{"Pretrain/Learning Rate": 2.8969128852732896e-05, "Pretrain/Loss": 2.0775723457336426, "Pretrain/Loss (Raw)": 1.8960868120193481, "Pretrain/Step": 4442, "Pretrain/Step Time": 8.550068411976099} +{"Pretrain/Learning Rate": 2.896074643325382e-05, "Pretrain/Loss": 2.074551582336426, "Pretrain/Loss (Raw)": 1.875279188156128, "Pretrain/Step": 4443, "Pretrain/Step Time": 8.551569683477283} +{"Pretrain/Learning Rate": 2.8952363557002798e-05, "Pretrain/Loss": 2.075265407562256, "Pretrain/Loss (Raw)": 2.091872453689575, "Pretrain/Step": 4444, "Pretrain/Step Time": 8.547311753034592} +{"Pretrain/Learning Rate": 2.89439802249466e-05, "Pretrain/Loss": 2.072282314300537, "Pretrain/Loss (Raw)": 2.1180992126464844, "Pretrain/Step": 4445, "Pretrain/Step Time": 8.552283823490143} +{"Pretrain/Learning Rate": 2.8935596438052003e-05, "Pretrain/Loss": 2.072017192840576, "Pretrain/Loss (Raw)": 2.0237128734588623, "Pretrain/Step": 4446, "Pretrain/Step Time": 8.550320375710726} +{"Pretrain/Learning Rate": 2.8927212197285885e-05, "Pretrain/Loss": 2.0701985359191895, "Pretrain/Loss (Raw)": 1.9977126121520996, "Pretrain/Step": 4447, "Pretrain/Step Time": 8.549954311922193} +{"Pretrain/Learning Rate": 2.8918827503615154e-05, "Pretrain/Loss": 2.069375991821289, "Pretrain/Loss (Raw)": 2.055760622024536, "Pretrain/Step": 4448, "Pretrain/Step Time": 8.54832229949534} +{"Pretrain/Learning Rate": 2.891044235800676e-05, "Pretrain/Loss": 2.0696303844451904, "Pretrain/Loss (Raw)": 2.1589391231536865, "Pretrain/Step": 4449, "Pretrain/Step Time": 8.553619720041752} +{"Pretrain/Learning Rate": 2.8902056761427744e-05, "Pretrain/Loss": 2.068333864212036, "Pretrain/Loss (Raw)": 2.0144240856170654, "Pretrain/Step": 4450, "Pretrain/Step Time": 8.553889015689492} +{"Pretrain/Learning Rate": 2.889367071484514e-05, "Pretrain/Loss": 2.069655656814575, "Pretrain/Loss (Raw)": 2.0692484378814697, "Pretrain/Step": 4451, "Pretrain/Step Time": 8.556778950616717} +{"Pretrain/Learning Rate": 2.888528421922608e-05, "Pretrain/Loss": 2.0688066482543945, "Pretrain/Loss (Raw)": 1.981812834739685, "Pretrain/Step": 4452, "Pretrain/Step Time": 8.553710797801614} +{"Pretrain/Learning Rate": 2.8876897275537744e-05, "Pretrain/Loss": 2.0699429512023926, "Pretrain/Loss (Raw)": 2.1815145015716553, "Pretrain/Step": 4453, "Pretrain/Step Time": 8.554931106045842} +{"Pretrain/Learning Rate": 2.8868509884747348e-05, "Pretrain/Loss": 2.0719711780548096, "Pretrain/Loss (Raw)": 2.1216886043548584, "Pretrain/Step": 4454, "Pretrain/Step Time": 8.556328807026148} +{"Pretrain/Learning Rate": 2.8860122047822154e-05, "Pretrain/Loss": 2.0709803104400635, "Pretrain/Loss (Raw)": 2.0572638511657715, "Pretrain/Step": 4455, "Pretrain/Step Time": 8.554269714280963} +{"Pretrain/Learning Rate": 2.88517337657295e-05, "Pretrain/Loss": 2.070220470428467, "Pretrain/Loss (Raw)": 2.088229179382324, "Pretrain/Step": 4456, "Pretrain/Step Time": 8.558191578835249} +{"Pretrain/Learning Rate": 2.8843345039436758e-05, "Pretrain/Loss": 2.066910743713379, "Pretrain/Loss (Raw)": 2.134293794631958, "Pretrain/Step": 4457, "Pretrain/Step Time": 8.557365335524082} +{"Pretrain/Learning Rate": 2.8834955869911356e-05, "Pretrain/Loss": 2.0690793991088867, "Pretrain/Loss (Raw)": 2.1261982917785645, "Pretrain/Step": 4458, "Pretrain/Step Time": 8.545635273680091} +{"Pretrain/Learning Rate": 2.8826566258120768e-05, "Pretrain/Loss": 2.068021774291992, "Pretrain/Loss (Raw)": 1.9916102886199951, "Pretrain/Step": 4459, "Pretrain/Step Time": 8.549196338281035} +{"Pretrain/Learning Rate": 2.8818176205032533e-05, "Pretrain/Loss": 2.0680861473083496, "Pretrain/Loss (Raw)": 2.128558874130249, "Pretrain/Step": 4460, "Pretrain/Step Time": 8.552660781890154} +{"Pretrain/Learning Rate": 2.8809785711614228e-05, "Pretrain/Loss": 2.0662763118743896, "Pretrain/Loss (Raw)": 1.8472082614898682, "Pretrain/Step": 4461, "Pretrain/Step Time": 8.549700230360031} +{"Pretrain/Learning Rate": 2.8801394778833475e-05, "Pretrain/Loss": 2.0643022060394287, "Pretrain/Loss (Raw)": 1.913215160369873, "Pretrain/Step": 4462, "Pretrain/Step Time": 8.546359654515982} +{"Pretrain/Learning Rate": 2.879300340765797e-05, "Pretrain/Loss": 2.063232660293579, "Pretrain/Loss (Raw)": 1.9915575981140137, "Pretrain/Step": 4463, "Pretrain/Step Time": 8.549619974568486} +{"Pretrain/Learning Rate": 2.8784611599055435e-05, "Pretrain/Loss": 2.0627193450927734, "Pretrain/Loss (Raw)": 2.0629425048828125, "Pretrain/Step": 4464, "Pretrain/Step Time": 8.546562565490603} +{"Pretrain/Learning Rate": 2.8776219353993662e-05, "Pretrain/Loss": 2.0631561279296875, "Pretrain/Loss (Raw)": 2.056020736694336, "Pretrain/Step": 4465, "Pretrain/Step Time": 8.552128294482827} +{"Pretrain/Learning Rate": 2.8767826673440467e-05, "Pretrain/Loss": 2.0632376670837402, "Pretrain/Loss (Raw)": 2.099874258041382, "Pretrain/Step": 4466, "Pretrain/Step Time": 8.548101479187608} +{"Pretrain/Learning Rate": 2.8759433558363758e-05, "Pretrain/Loss": 2.062268018722534, "Pretrain/Loss (Raw)": 2.0585997104644775, "Pretrain/Step": 4467, "Pretrain/Step Time": 8.54922354593873} +{"Pretrain/Learning Rate": 2.875104000973145e-05, "Pretrain/Loss": 2.0623550415039062, "Pretrain/Loss (Raw)": 2.1657614707946777, "Pretrain/Step": 4468, "Pretrain/Step Time": 8.549599749967456} +{"Pretrain/Learning Rate": 2.874264602851154e-05, "Pretrain/Loss": 2.061551570892334, "Pretrain/Loss (Raw)": 2.014004707336426, "Pretrain/Step": 4469, "Pretrain/Step Time": 8.55527738854289} +{"Pretrain/Learning Rate": 2.8734251615672043e-05, "Pretrain/Loss": 2.0619537830352783, "Pretrain/Loss (Raw)": 2.059298276901245, "Pretrain/Step": 4470, "Pretrain/Step Time": 8.546045668423176} +{"Pretrain/Learning Rate": 2.8725856772181058e-05, "Pretrain/Loss": 2.061800479888916, "Pretrain/Loss (Raw)": 2.080705165863037, "Pretrain/Step": 4471, "Pretrain/Step Time": 8.54803299345076} +{"Pretrain/Learning Rate": 2.8717461499006714e-05, "Pretrain/Loss": 2.0605757236480713, "Pretrain/Loss (Raw)": 2.019216537475586, "Pretrain/Step": 4472, "Pretrain/Step Time": 8.546567671000957} +{"Pretrain/Learning Rate": 2.8709065797117198e-05, "Pretrain/Loss": 2.0602498054504395, "Pretrain/Loss (Raw)": 1.9561827182769775, "Pretrain/Step": 4473, "Pretrain/Step Time": 8.545978743582964} +{"Pretrain/Learning Rate": 2.8700669667480732e-05, "Pretrain/Loss": 2.0610122680664062, "Pretrain/Loss (Raw)": 2.087031602859497, "Pretrain/Step": 4474, "Pretrain/Step Time": 8.54806405119598} +{"Pretrain/Learning Rate": 2.86922731110656e-05, "Pretrain/Loss": 2.0621304512023926, "Pretrain/Loss (Raw)": 2.159958600997925, "Pretrain/Step": 4475, "Pretrain/Step Time": 8.551406292244792} +{"Pretrain/Learning Rate": 2.8683876128840138e-05, "Pretrain/Loss": 2.0627715587615967, "Pretrain/Loss (Raw)": 2.154843330383301, "Pretrain/Step": 4476, "Pretrain/Step Time": 8.537015292793512} +{"Pretrain/Learning Rate": 2.8675478721772715e-05, "Pretrain/Loss": 2.0649776458740234, "Pretrain/Loss (Raw)": 2.3009769916534424, "Pretrain/Step": 4477, "Pretrain/Step Time": 8.540259467437863} +{"Pretrain/Learning Rate": 2.866708089083177e-05, "Pretrain/Loss": 2.065577983856201, "Pretrain/Loss (Raw)": 2.169027805328369, "Pretrain/Step": 4478, "Pretrain/Step Time": 8.535128310322762} +{"Pretrain/Learning Rate": 2.865868263698578e-05, "Pretrain/Loss": 2.0636584758758545, "Pretrain/Loss (Raw)": 1.84750497341156, "Pretrain/Step": 4479, "Pretrain/Step Time": 8.538611246272922} +{"Pretrain/Learning Rate": 2.8650283961203267e-05, "Pretrain/Loss": 2.065361499786377, "Pretrain/Loss (Raw)": 2.2272796630859375, "Pretrain/Step": 4480, "Pretrain/Step Time": 8.538520235568285} +{"Pretrain/Learning Rate": 2.86418848644528e-05, "Pretrain/Loss": 2.0648975372314453, "Pretrain/Loss (Raw)": 2.10125470161438, "Pretrain/Step": 4481, "Pretrain/Step Time": 8.533958058804274} +{"Pretrain/Learning Rate": 2.8633485347703015e-05, "Pretrain/Loss": 2.0627927780151367, "Pretrain/Loss (Raw)": 1.9543086290359497, "Pretrain/Step": 4482, "Pretrain/Step Time": 8.533880999311805} +{"Pretrain/Learning Rate": 2.8625085411922575e-05, "Pretrain/Loss": 2.0614285469055176, "Pretrain/Loss (Raw)": 1.9872790575027466, "Pretrain/Step": 4483, "Pretrain/Step Time": 8.536956291645765} +{"Pretrain/Learning Rate": 2.861668505808021e-05, "Pretrain/Loss": 2.060850143432617, "Pretrain/Loss (Raw)": 2.0449979305267334, "Pretrain/Step": 4484, "Pretrain/Step Time": 8.538504427298903} +{"Pretrain/Learning Rate": 2.8608284287144675e-05, "Pretrain/Loss": 2.0601696968078613, "Pretrain/Loss (Raw)": 2.0410830974578857, "Pretrain/Step": 4485, "Pretrain/Step Time": 8.540505055338144} +{"Pretrain/Learning Rate": 2.85998831000848e-05, "Pretrain/Loss": 2.0594544410705566, "Pretrain/Loss (Raw)": 1.9163061380386353, "Pretrain/Step": 4486, "Pretrain/Step Time": 8.541724096983671} +{"Pretrain/Learning Rate": 2.8591481497869433e-05, "Pretrain/Loss": 2.0599279403686523, "Pretrain/Loss (Raw)": 2.0207595825195312, "Pretrain/Step": 4487, "Pretrain/Step Time": 8.539978228509426} +{"Pretrain/Learning Rate": 2.8583079481467507e-05, "Pretrain/Loss": 2.0590171813964844, "Pretrain/Loss (Raw)": 2.0618629455566406, "Pretrain/Step": 4488, "Pretrain/Step Time": 8.539033252745867} +{"Pretrain/Learning Rate": 2.857467705184797e-05, "Pretrain/Loss": 2.0584912300109863, "Pretrain/Loss (Raw)": 1.9584065675735474, "Pretrain/Step": 4489, "Pretrain/Step Time": 8.53971852734685} +{"Pretrain/Learning Rate": 2.856627420997982e-05, "Pretrain/Loss": 2.058022975921631, "Pretrain/Loss (Raw)": 1.9157108068466187, "Pretrain/Step": 4490, "Pretrain/Step Time": 8.54110293649137} +{"Pretrain/Learning Rate": 2.8557870956832132e-05, "Pretrain/Loss": 2.058934211730957, "Pretrain/Loss (Raw)": 2.0580861568450928, "Pretrain/Step": 4491, "Pretrain/Step Time": 8.541226357221603} +{"Pretrain/Learning Rate": 2.8549467293374e-05, "Pretrain/Loss": 2.059779644012451, "Pretrain/Loss (Raw)": 2.0325927734375, "Pretrain/Step": 4492, "Pretrain/Step Time": 8.537364585325122} +{"Pretrain/Learning Rate": 2.854106322057457e-05, "Pretrain/Loss": 2.060961961746216, "Pretrain/Loss (Raw)": 2.0792031288146973, "Pretrain/Step": 4493, "Pretrain/Step Time": 8.53895416110754} +{"Pretrain/Learning Rate": 2.8532658739403046e-05, "Pretrain/Loss": 2.063284397125244, "Pretrain/Loss (Raw)": 2.0473945140838623, "Pretrain/Step": 4494, "Pretrain/Step Time": 8.537811808288097} +{"Pretrain/Learning Rate": 2.852425385082867e-05, "Pretrain/Loss": 2.0662107467651367, "Pretrain/Loss (Raw)": 2.2523252964019775, "Pretrain/Step": 4495, "Pretrain/Step Time": 8.542659608647227} +{"Pretrain/Learning Rate": 2.851584855582073e-05, "Pretrain/Loss": 2.0661425590515137, "Pretrain/Loss (Raw)": 2.1267130374908447, "Pretrain/Step": 4496, "Pretrain/Step Time": 8.544794229790568} +{"Pretrain/Learning Rate": 2.8507442855348577e-05, "Pretrain/Loss": 2.067288398742676, "Pretrain/Loss (Raw)": 2.160269260406494, "Pretrain/Step": 4497, "Pretrain/Step Time": 8.54385850764811} +{"Pretrain/Learning Rate": 2.8499036750381576e-05, "Pretrain/Loss": 2.0654804706573486, "Pretrain/Loss (Raw)": 1.7688249349594116, "Pretrain/Step": 4498, "Pretrain/Step Time": 8.541833760216832} +{"Pretrain/Learning Rate": 2.849063024188917e-05, "Pretrain/Loss": 2.064072608947754, "Pretrain/Loss (Raw)": 2.0236287117004395, "Pretrain/Step": 4499, "Pretrain/Step Time": 8.548029286786914} +{"Pretrain/Learning Rate": 2.8482223330840836e-05, "Pretrain/Loss": 2.0616748332977295, "Pretrain/Loss (Raw)": 1.9957048892974854, "Pretrain/Step": 4500, "Pretrain/Step Time": 8.546165620908141} +{"Pretrain/Learning Rate": 2.84738160182061e-05, "Pretrain/Loss": 2.0635786056518555, "Pretrain/Loss (Raw)": 2.0363998413085938, "Pretrain/Step": 4501, "Pretrain/Step Time": 8.547728478908539} +{"Pretrain/Learning Rate": 2.8465408304954533e-05, "Pretrain/Loss": 2.0641913414001465, "Pretrain/Loss (Raw)": 1.97389554977417, "Pretrain/Step": 4502, "Pretrain/Step Time": 8.542389869689941} +{"Pretrain/Learning Rate": 2.8457000192055748e-05, "Pretrain/Loss": 2.0624423027038574, "Pretrain/Loss (Raw)": 2.055290937423706, "Pretrain/Step": 4503, "Pretrain/Step Time": 8.543513748794794} +{"Pretrain/Learning Rate": 2.8448591680479415e-05, "Pretrain/Loss": 2.060182571411133, "Pretrain/Loss (Raw)": 2.1817991733551025, "Pretrain/Step": 4504, "Pretrain/Step Time": 8.54102136567235} +{"Pretrain/Learning Rate": 2.8440182771195235e-05, "Pretrain/Loss": 2.0601558685302734, "Pretrain/Loss (Raw)": 2.264525890350342, "Pretrain/Step": 4505, "Pretrain/Step Time": 8.540005031973124} +{"Pretrain/Learning Rate": 2.8431773465172972e-05, "Pretrain/Loss": 2.061223030090332, "Pretrain/Loss (Raw)": 2.1936330795288086, "Pretrain/Step": 4506, "Pretrain/Step Time": 8.54521545022726} +{"Pretrain/Learning Rate": 2.8423363763382415e-05, "Pretrain/Loss": 2.0628507137298584, "Pretrain/Loss (Raw)": 2.0745081901550293, "Pretrain/Step": 4507, "Pretrain/Step Time": 8.542572446167469} +{"Pretrain/Learning Rate": 2.8414953666793426e-05, "Pretrain/Loss": 2.0630812644958496, "Pretrain/Loss (Raw)": 2.1596858501434326, "Pretrain/Step": 4508, "Pretrain/Step Time": 8.540866829454899} +{"Pretrain/Learning Rate": 2.8406543176375882e-05, "Pretrain/Loss": 2.062392473220825, "Pretrain/Loss (Raw)": 1.9369438886642456, "Pretrain/Step": 4509, "Pretrain/Step Time": 8.542813904583454} +{"Pretrain/Learning Rate": 2.839813229309973e-05, "Pretrain/Loss": 2.0625948905944824, "Pretrain/Loss (Raw)": 2.018894910812378, "Pretrain/Step": 4510, "Pretrain/Step Time": 8.541768707334995} +{"Pretrain/Learning Rate": 2.8389721017934945e-05, "Pretrain/Loss": 2.0633058547973633, "Pretrain/Loss (Raw)": 2.0857179164886475, "Pretrain/Step": 4511, "Pretrain/Step Time": 8.539584150537848} +{"Pretrain/Learning Rate": 2.8381309351851564e-05, "Pretrain/Loss": 2.0593600273132324, "Pretrain/Loss (Raw)": 2.0926475524902344, "Pretrain/Step": 4512, "Pretrain/Step Time": 8.544262442737818} +{"Pretrain/Learning Rate": 2.837289729581965e-05, "Pretrain/Loss": 2.059314727783203, "Pretrain/Loss (Raw)": 2.159311056137085, "Pretrain/Step": 4513, "Pretrain/Step Time": 8.538154309615493} +{"Pretrain/Learning Rate": 2.8364484850809337e-05, "Pretrain/Loss": 2.059051752090454, "Pretrain/Loss (Raw)": 1.8929204940795898, "Pretrain/Step": 4514, "Pretrain/Step Time": 8.534424351528287} +{"Pretrain/Learning Rate": 2.835607201779077e-05, "Pretrain/Loss": 2.057812213897705, "Pretrain/Loss (Raw)": 2.0639591217041016, "Pretrain/Step": 4515, "Pretrain/Step Time": 8.537445396184921} +{"Pretrain/Learning Rate": 2.834765879773416e-05, "Pretrain/Loss": 2.0564403533935547, "Pretrain/Loss (Raw)": 1.9263302087783813, "Pretrain/Step": 4516, "Pretrain/Step Time": 8.535789458081126} +{"Pretrain/Learning Rate": 2.833924519160977e-05, "Pretrain/Loss": 2.0524277687072754, "Pretrain/Loss (Raw)": 2.076669692993164, "Pretrain/Step": 4517, "Pretrain/Step Time": 8.538051640614867} +{"Pretrain/Learning Rate": 2.8330831200387885e-05, "Pretrain/Loss": 2.0547733306884766, "Pretrain/Loss (Raw)": 2.026900053024292, "Pretrain/Step": 4518, "Pretrain/Step Time": 8.549509657546878} +{"Pretrain/Learning Rate": 2.8322416825038855e-05, "Pretrain/Loss": 2.056530475616455, "Pretrain/Loss (Raw)": 2.1824615001678467, "Pretrain/Step": 4519, "Pretrain/Step Time": 8.542038176208735} +{"Pretrain/Learning Rate": 2.831400206653305e-05, "Pretrain/Loss": 2.056696653366089, "Pretrain/Loss (Raw)": 2.1705331802368164, "Pretrain/Step": 4520, "Pretrain/Step Time": 8.543224927037954} +{"Pretrain/Learning Rate": 2.830558692584092e-05, "Pretrain/Loss": 2.0557260513305664, "Pretrain/Loss (Raw)": 2.0415494441986084, "Pretrain/Step": 4521, "Pretrain/Step Time": 8.544052636250854} +{"Pretrain/Learning Rate": 2.8297171403932928e-05, "Pretrain/Loss": 2.057033061981201, "Pretrain/Loss (Raw)": 2.0981996059417725, "Pretrain/Step": 4522, "Pretrain/Step Time": 8.537771502509713} +{"Pretrain/Learning Rate": 2.8288755501779597e-05, "Pretrain/Loss": 2.057269811630249, "Pretrain/Loss (Raw)": 2.0099480152130127, "Pretrain/Step": 4523, "Pretrain/Step Time": 8.543699169531465} +{"Pretrain/Learning Rate": 2.8280339220351475e-05, "Pretrain/Loss": 2.057248115539551, "Pretrain/Loss (Raw)": 1.9867310523986816, "Pretrain/Step": 4524, "Pretrain/Step Time": 8.545701151713729} +{"Pretrain/Learning Rate": 2.8271922560619184e-05, "Pretrain/Loss": 2.056507110595703, "Pretrain/Loss (Raw)": 2.097254753112793, "Pretrain/Step": 4525, "Pretrain/Step Time": 8.546399861574173} +{"Pretrain/Learning Rate": 2.8263505523553357e-05, "Pretrain/Loss": 2.0583128929138184, "Pretrain/Loss (Raw)": 2.0268077850341797, "Pretrain/Step": 4526, "Pretrain/Step Time": 8.548699514940381} +{"Pretrain/Learning Rate": 2.8255088110124705e-05, "Pretrain/Loss": 2.0579237937927246, "Pretrain/Loss (Raw)": 1.945237636566162, "Pretrain/Step": 4527, "Pretrain/Step Time": 8.543574944138527} +{"Pretrain/Learning Rate": 2.8246670321303947e-05, "Pretrain/Loss": 2.057924270629883, "Pretrain/Loss (Raw)": 1.9666000604629517, "Pretrain/Step": 4528, "Pretrain/Step Time": 8.543039917945862} +{"Pretrain/Learning Rate": 2.8238252158061873e-05, "Pretrain/Loss": 2.0583393573760986, "Pretrain/Loss (Raw)": 2.040802478790283, "Pretrain/Step": 4529, "Pretrain/Step Time": 8.543572360649705} +{"Pretrain/Learning Rate": 2.8229833621369295e-05, "Pretrain/Loss": 2.0569546222686768, "Pretrain/Loss (Raw)": 2.0113589763641357, "Pretrain/Step": 4530, "Pretrain/Step Time": 8.553596841171384} +{"Pretrain/Learning Rate": 2.822141471219709e-05, "Pretrain/Loss": 2.056002140045166, "Pretrain/Loss (Raw)": 1.9984163045883179, "Pretrain/Step": 4531, "Pretrain/Step Time": 8.54834994673729} +{"Pretrain/Learning Rate": 2.8212995431516163e-05, "Pretrain/Loss": 2.0544466972351074, "Pretrain/Loss (Raw)": 2.0045266151428223, "Pretrain/Step": 4532, "Pretrain/Step Time": 8.544448859989643} +{"Pretrain/Learning Rate": 2.820457578029746e-05, "Pretrain/Loss": 2.0537610054016113, "Pretrain/Loss (Raw)": 2.0172014236450195, "Pretrain/Step": 4533, "Pretrain/Step Time": 8.54478264413774} +{"Pretrain/Learning Rate": 2.8196155759511977e-05, "Pretrain/Loss": 2.0536410808563232, "Pretrain/Loss (Raw)": 2.0145576000213623, "Pretrain/Step": 4534, "Pretrain/Step Time": 8.546367282047868} +{"Pretrain/Learning Rate": 2.8187735370130745e-05, "Pretrain/Loss": 2.0559823513031006, "Pretrain/Loss (Raw)": 2.342632293701172, "Pretrain/Step": 4535, "Pretrain/Step Time": 8.54197963513434} +{"Pretrain/Learning Rate": 2.8179314613124858e-05, "Pretrain/Loss": 2.055424928665161, "Pretrain/Loss (Raw)": 2.027252674102783, "Pretrain/Step": 4536, "Pretrain/Step Time": 8.550692668184638} +{"Pretrain/Learning Rate": 2.817089348946542e-05, "Pretrain/Loss": 2.0578200817108154, "Pretrain/Loss (Raw)": 2.3139376640319824, "Pretrain/Step": 4537, "Pretrain/Step Time": 8.54133078828454} +{"Pretrain/Learning Rate": 2.8162472000123613e-05, "Pretrain/Loss": 2.0567972660064697, "Pretrain/Loss (Raw)": 1.9811573028564453, "Pretrain/Step": 4538, "Pretrain/Step Time": 8.542357955127954} +{"Pretrain/Learning Rate": 2.8154050146070627e-05, "Pretrain/Loss": 2.054898738861084, "Pretrain/Loss (Raw)": 1.9339905977249146, "Pretrain/Step": 4539, "Pretrain/Step Time": 8.54320145957172} +{"Pretrain/Learning Rate": 2.814562792827772e-05, "Pretrain/Loss": 2.053436279296875, "Pretrain/Loss (Raw)": 1.8820573091506958, "Pretrain/Step": 4540, "Pretrain/Step Time": 8.542922595515847} +{"Pretrain/Learning Rate": 2.8137205347716165e-05, "Pretrain/Loss": 2.0555531978607178, "Pretrain/Loss (Raw)": 2.163297653198242, "Pretrain/Step": 4541, "Pretrain/Step Time": 8.542985625565052} +{"Pretrain/Learning Rate": 2.8128782405357312e-05, "Pretrain/Loss": 2.0583596229553223, "Pretrain/Loss (Raw)": 2.171630859375, "Pretrain/Step": 4542, "Pretrain/Step Time": 8.552946822717786} +{"Pretrain/Learning Rate": 2.812035910217254e-05, "Pretrain/Loss": 2.059859275817871, "Pretrain/Loss (Raw)": 2.093471050262451, "Pretrain/Step": 4543, "Pretrain/Step Time": 8.543976996093988} +{"Pretrain/Learning Rate": 2.811193543913324e-05, "Pretrain/Loss": 2.059624671936035, "Pretrain/Loss (Raw)": 2.0161216259002686, "Pretrain/Step": 4544, "Pretrain/Step Time": 8.545173091813922} +{"Pretrain/Learning Rate": 2.8103511417210886e-05, "Pretrain/Loss": 2.061610221862793, "Pretrain/Loss (Raw)": 2.339576482772827, "Pretrain/Step": 4545, "Pretrain/Step Time": 8.54132353886962} +{"Pretrain/Learning Rate": 2.809508703737697e-05, "Pretrain/Loss": 2.0628440380096436, "Pretrain/Loss (Raw)": 2.352592706680298, "Pretrain/Step": 4546, "Pretrain/Step Time": 8.535883463919163} +{"Pretrain/Learning Rate": 2.808666230060304e-05, "Pretrain/Loss": 2.062699317932129, "Pretrain/Loss (Raw)": 2.0685877799987793, "Pretrain/Step": 4547, "Pretrain/Step Time": 8.537331795319915} +{"Pretrain/Learning Rate": 2.8078237207860658e-05, "Pretrain/Loss": 2.061800956726074, "Pretrain/Loss (Raw)": 2.008997917175293, "Pretrain/Step": 4548, "Pretrain/Step Time": 8.54843701981008} +{"Pretrain/Learning Rate": 2.806981176012146e-05, "Pretrain/Loss": 2.0621142387390137, "Pretrain/Loss (Raw)": 2.1152360439300537, "Pretrain/Step": 4549, "Pretrain/Step Time": 8.54867828451097} +{"Pretrain/Learning Rate": 2.80613859583571e-05, "Pretrain/Loss": 2.0629076957702637, "Pretrain/Loss (Raw)": 2.1998348236083984, "Pretrain/Step": 4550, "Pretrain/Step Time": 8.548020845279098} +{"Pretrain/Learning Rate": 2.8052959803539298e-05, "Pretrain/Loss": 2.064988374710083, "Pretrain/Loss (Raw)": 2.2719035148620605, "Pretrain/Step": 4551, "Pretrain/Step Time": 8.546506628394127} +{"Pretrain/Learning Rate": 2.8044533296639774e-05, "Pretrain/Loss": 2.063814163208008, "Pretrain/Loss (Raw)": 2.0749921798706055, "Pretrain/Step": 4552, "Pretrain/Step Time": 8.545942470431328} +{"Pretrain/Learning Rate": 2.8036106438630327e-05, "Pretrain/Loss": 2.063795804977417, "Pretrain/Loss (Raw)": 2.083716869354248, "Pretrain/Step": 4553, "Pretrain/Step Time": 8.548281997442245} +{"Pretrain/Learning Rate": 2.802767923048278e-05, "Pretrain/Loss": 2.064049005508423, "Pretrain/Loss (Raw)": 1.9778081178665161, "Pretrain/Step": 4554, "Pretrain/Step Time": 8.551819771528244} +{"Pretrain/Learning Rate": 2.8019251673168993e-05, "Pretrain/Loss": 2.065871000289917, "Pretrain/Loss (Raw)": 2.1836159229278564, "Pretrain/Step": 4555, "Pretrain/Step Time": 8.540310064330697} +{"Pretrain/Learning Rate": 2.8010823767660887e-05, "Pretrain/Loss": 2.0655629634857178, "Pretrain/Loss (Raw)": 2.1230392456054688, "Pretrain/Step": 4556, "Pretrain/Step Time": 8.542735792696476} +{"Pretrain/Learning Rate": 2.8002395514930385e-05, "Pretrain/Loss": 2.065746545791626, "Pretrain/Loss (Raw)": 1.9640511274337769, "Pretrain/Step": 4557, "Pretrain/Step Time": 8.543329810723662} +{"Pretrain/Learning Rate": 2.7993966915949493e-05, "Pretrain/Loss": 2.068985939025879, "Pretrain/Loss (Raw)": 2.3785946369171143, "Pretrain/Step": 4558, "Pretrain/Step Time": 8.540208790451288} +{"Pretrain/Learning Rate": 2.7985537971690216e-05, "Pretrain/Loss": 2.069526195526123, "Pretrain/Loss (Raw)": 2.1587908267974854, "Pretrain/Step": 4559, "Pretrain/Step Time": 8.53914812579751} +{"Pretrain/Learning Rate": 2.7977108683124647e-05, "Pretrain/Loss": 2.071187973022461, "Pretrain/Loss (Raw)": 2.2098889350891113, "Pretrain/Step": 4560, "Pretrain/Step Time": 8.553834836930037} +{"Pretrain/Learning Rate": 2.7968679051224868e-05, "Pretrain/Loss": 2.070462942123413, "Pretrain/Loss (Raw)": 1.9655570983886719, "Pretrain/Step": 4561, "Pretrain/Step Time": 8.545517407357693} +{"Pretrain/Learning Rate": 2.796024907696303e-05, "Pretrain/Loss": 2.0708250999450684, "Pretrain/Loss (Raw)": 2.092139482498169, "Pretrain/Step": 4562, "Pretrain/Step Time": 8.53976846113801} +{"Pretrain/Learning Rate": 2.795181876131132e-05, "Pretrain/Loss": 2.0692636966705322, "Pretrain/Loss (Raw)": 1.9379369020462036, "Pretrain/Step": 4563, "Pretrain/Step Time": 8.54128303565085} +{"Pretrain/Learning Rate": 2.7943388105241968e-05, "Pretrain/Loss": 2.069671630859375, "Pretrain/Loss (Raw)": 2.045065402984619, "Pretrain/Step": 4564, "Pretrain/Step Time": 8.541304973885417} +{"Pretrain/Learning Rate": 2.793495710972722e-05, "Pretrain/Loss": 2.066908836364746, "Pretrain/Loss (Raw)": 1.9529293775558472, "Pretrain/Step": 4565, "Pretrain/Step Time": 8.54113743826747} +{"Pretrain/Learning Rate": 2.79265257757394e-05, "Pretrain/Loss": 2.066251754760742, "Pretrain/Loss (Raw)": 1.9545409679412842, "Pretrain/Step": 4566, "Pretrain/Step Time": 8.546954739838839} +{"Pretrain/Learning Rate": 2.7918094104250826e-05, "Pretrain/Loss": 2.066042900085449, "Pretrain/Loss (Raw)": 2.071276903152466, "Pretrain/Step": 4567, "Pretrain/Step Time": 8.540135392919183} +{"Pretrain/Learning Rate": 2.7909662096233897e-05, "Pretrain/Loss": 2.0668697357177734, "Pretrain/Loss (Raw)": 2.2719614505767822, "Pretrain/Step": 4568, "Pretrain/Step Time": 8.539703983813524} +{"Pretrain/Learning Rate": 2.7901229752661018e-05, "Pretrain/Loss": 2.068863868713379, "Pretrain/Loss (Raw)": 2.3239517211914062, "Pretrain/Step": 4569, "Pretrain/Step Time": 8.533751895651221} +{"Pretrain/Learning Rate": 2.7892797074504656e-05, "Pretrain/Loss": 2.069478988647461, "Pretrain/Loss (Raw)": 1.9747971296310425, "Pretrain/Step": 4570, "Pretrain/Step Time": 8.530580289661884} +{"Pretrain/Learning Rate": 2.78843640627373e-05, "Pretrain/Loss": 2.0709853172302246, "Pretrain/Loss (Raw)": 2.0680837631225586, "Pretrain/Step": 4571, "Pretrain/Step Time": 8.528836162760854} +{"Pretrain/Learning Rate": 2.7875930718331496e-05, "Pretrain/Loss": 2.0702943801879883, "Pretrain/Loss (Raw)": 2.0034232139587402, "Pretrain/Step": 4572, "Pretrain/Step Time": 8.55174327455461} +{"Pretrain/Learning Rate": 2.786749704225981e-05, "Pretrain/Loss": 2.068918228149414, "Pretrain/Loss (Raw)": 1.9419790506362915, "Pretrain/Step": 4573, "Pretrain/Step Time": 8.544868554919958} +{"Pretrain/Learning Rate": 2.785906303549485e-05, "Pretrain/Loss": 2.0691041946411133, "Pretrain/Loss (Raw)": 2.0475306510925293, "Pretrain/Step": 4574, "Pretrain/Step Time": 8.546516560018063} +{"Pretrain/Learning Rate": 2.7850628699009268e-05, "Pretrain/Loss": 2.0709288120269775, "Pretrain/Loss (Raw)": 2.2312445640563965, "Pretrain/Step": 4575, "Pretrain/Step Time": 8.545569784939289} +{"Pretrain/Learning Rate": 2.7842194033775747e-05, "Pretrain/Loss": 2.0706379413604736, "Pretrain/Loss (Raw)": 2.01853084564209, "Pretrain/Step": 4576, "Pretrain/Step Time": 8.54148655757308} +{"Pretrain/Learning Rate": 2.7833759040767027e-05, "Pretrain/Loss": 2.0706229209899902, "Pretrain/Loss (Raw)": 2.1570231914520264, "Pretrain/Step": 4577, "Pretrain/Step Time": 8.537128746509552} +{"Pretrain/Learning Rate": 2.7825323720955853e-05, "Pretrain/Loss": 2.0710818767547607, "Pretrain/Loss (Raw)": 2.073164463043213, "Pretrain/Step": 4578, "Pretrain/Step Time": 8.540920032188296} +{"Pretrain/Learning Rate": 2.781688807531504e-05, "Pretrain/Loss": 2.069972276687622, "Pretrain/Loss (Raw)": 1.9272186756134033, "Pretrain/Step": 4579, "Pretrain/Step Time": 8.537795219570398} +{"Pretrain/Learning Rate": 2.7808452104817412e-05, "Pretrain/Loss": 2.0688257217407227, "Pretrain/Loss (Raw)": 1.8350536823272705, "Pretrain/Step": 4580, "Pretrain/Step Time": 8.540915004909039} +{"Pretrain/Learning Rate": 2.7800015810435865e-05, "Pretrain/Loss": 2.0688440799713135, "Pretrain/Loss (Raw)": 2.183892011642456, "Pretrain/Step": 4581, "Pretrain/Step Time": 8.53756226412952} +{"Pretrain/Learning Rate": 2.779157919314329e-05, "Pretrain/Loss": 2.0676159858703613, "Pretrain/Loss (Raw)": 1.964472770690918, "Pretrain/Step": 4582, "Pretrain/Step Time": 8.541878351941705} +{"Pretrain/Learning Rate": 2.7783142253912647e-05, "Pretrain/Loss": 2.065784454345703, "Pretrain/Loss (Raw)": 1.822821021080017, "Pretrain/Step": 4583, "Pretrain/Step Time": 8.544509299099445} +{"Pretrain/Learning Rate": 2.7774704993716937e-05, "Pretrain/Loss": 2.066598415374756, "Pretrain/Loss (Raw)": 2.192417860031128, "Pretrain/Step": 4584, "Pretrain/Step Time": 8.545634677633643} +{"Pretrain/Learning Rate": 2.776626741352916e-05, "Pretrain/Loss": 2.0631251335144043, "Pretrain/Loss (Raw)": 1.6897130012512207, "Pretrain/Step": 4585, "Pretrain/Step Time": 8.533657759428024} +{"Pretrain/Learning Rate": 2.7757829514322397e-05, "Pretrain/Loss": 2.0612053871154785, "Pretrain/Loss (Raw)": 1.8804458379745483, "Pretrain/Step": 4586, "Pretrain/Step Time": 8.538547618314624} +{"Pretrain/Learning Rate": 2.774939129706974e-05, "Pretrain/Loss": 2.0669970512390137, "Pretrain/Loss (Raw)": 2.732966423034668, "Pretrain/Step": 4587, "Pretrain/Step Time": 8.53772471472621} +{"Pretrain/Learning Rate": 2.7740952762744322e-05, "Pretrain/Loss": 2.0637080669403076, "Pretrain/Loss (Raw)": 1.7075480222702026, "Pretrain/Step": 4588, "Pretrain/Step Time": 8.54110161960125} +{"Pretrain/Learning Rate": 2.7732513912319314e-05, "Pretrain/Loss": 2.0631299018859863, "Pretrain/Loss (Raw)": 1.7732549905776978, "Pretrain/Step": 4589, "Pretrain/Step Time": 8.542214853689075} +{"Pretrain/Learning Rate": 2.7724074746767926e-05, "Pretrain/Loss": 2.0632388591766357, "Pretrain/Loss (Raw)": 1.9271334409713745, "Pretrain/Step": 4590, "Pretrain/Step Time": 8.549464970827103} +{"Pretrain/Learning Rate": 2.77156352670634e-05, "Pretrain/Loss": 2.0646097660064697, "Pretrain/Loss (Raw)": 2.167017936706543, "Pretrain/Step": 4591, "Pretrain/Step Time": 8.545327117666602} +{"Pretrain/Learning Rate": 2.770719547417902e-05, "Pretrain/Loss": 2.0658011436462402, "Pretrain/Loss (Raw)": 2.2154438495635986, "Pretrain/Step": 4592, "Pretrain/Step Time": 8.547347566112876} +{"Pretrain/Learning Rate": 2.76987553690881e-05, "Pretrain/Loss": 2.066087245941162, "Pretrain/Loss (Raw)": 2.092654228210449, "Pretrain/Step": 4593, "Pretrain/Step Time": 8.542094079777598} +{"Pretrain/Learning Rate": 2.7690314952764e-05, "Pretrain/Loss": 2.066218137741089, "Pretrain/Loss (Raw)": 2.1166181564331055, "Pretrain/Step": 4594, "Pretrain/Step Time": 8.546526385471225} +{"Pretrain/Learning Rate": 2.7681874226180093e-05, "Pretrain/Loss": 2.0668468475341797, "Pretrain/Loss (Raw)": 2.139087200164795, "Pretrain/Step": 4595, "Pretrain/Step Time": 8.545819900929928} +{"Pretrain/Learning Rate": 2.7673433190309823e-05, "Pretrain/Loss": 2.0667688846588135, "Pretrain/Loss (Raw)": 2.155773878097534, "Pretrain/Step": 4596, "Pretrain/Step Time": 8.54979189299047} +{"Pretrain/Learning Rate": 2.766499184612663e-05, "Pretrain/Loss": 2.068166732788086, "Pretrain/Loss (Raw)": 2.1929633617401123, "Pretrain/Step": 4597, "Pretrain/Step Time": 8.543042041361332} +{"Pretrain/Learning Rate": 2.7656550194604026e-05, "Pretrain/Loss": 2.0686028003692627, "Pretrain/Loss (Raw)": 2.1151018142700195, "Pretrain/Step": 4598, "Pretrain/Step Time": 8.547792851924896} +{"Pretrain/Learning Rate": 2.7648108236715536e-05, "Pretrain/Loss": 2.0685667991638184, "Pretrain/Loss (Raw)": 2.07606840133667, "Pretrain/Step": 4599, "Pretrain/Step Time": 8.55100922100246} +{"Pretrain/Learning Rate": 2.7639665973434725e-05, "Pretrain/Loss": 2.068753719329834, "Pretrain/Loss (Raw)": 2.0431501865386963, "Pretrain/Step": 4600, "Pretrain/Step Time": 8.547596601769328} +{"Pretrain/Learning Rate": 2.7631223405735196e-05, "Pretrain/Loss": 2.071634292602539, "Pretrain/Loss (Raw)": 2.3249006271362305, "Pretrain/Step": 4601, "Pretrain/Step Time": 8.548527469858527} +{"Pretrain/Learning Rate": 2.7622780534590582e-05, "Pretrain/Loss": 2.071371078491211, "Pretrain/Loss (Raw)": 2.053349733352661, "Pretrain/Step": 4602, "Pretrain/Step Time": 8.554140446707606} +{"Pretrain/Learning Rate": 2.7614337360974558e-05, "Pretrain/Loss": 2.0708065032958984, "Pretrain/Loss (Raw)": 2.0876998901367188, "Pretrain/Step": 4603, "Pretrain/Step Time": 8.547985028475523} +{"Pretrain/Learning Rate": 2.760589388586083e-05, "Pretrain/Loss": 2.0707602500915527, "Pretrain/Loss (Raw)": 2.148883819580078, "Pretrain/Step": 4604, "Pretrain/Step Time": 8.552551509812474} +{"Pretrain/Learning Rate": 2.7597450110223145e-05, "Pretrain/Loss": 2.069523334503174, "Pretrain/Loss (Raw)": 2.1426892280578613, "Pretrain/Step": 4605, "Pretrain/Step Time": 8.54845660738647} +{"Pretrain/Learning Rate": 2.7589006035035264e-05, "Pretrain/Loss": 2.069334030151367, "Pretrain/Loss (Raw)": 2.1447901725769043, "Pretrain/Step": 4606, "Pretrain/Step Time": 8.550923390313983} +{"Pretrain/Learning Rate": 2.7580561661271014e-05, "Pretrain/Loss": 2.071500301361084, "Pretrain/Loss (Raw)": 2.1247599124908447, "Pretrain/Step": 4607, "Pretrain/Step Time": 8.547339925542474} +{"Pretrain/Learning Rate": 2.7572116989904228e-05, "Pretrain/Loss": 2.0709800720214844, "Pretrain/Loss (Raw)": 2.160727024078369, "Pretrain/Step": 4608, "Pretrain/Step Time": 8.55736119300127} +{"Pretrain/Learning Rate": 2.7563672021908797e-05, "Pretrain/Loss": 2.0704586505889893, "Pretrain/Loss (Raw)": 2.0345072746276855, "Pretrain/Step": 4609, "Pretrain/Step Time": 8.555902570486069} +{"Pretrain/Learning Rate": 2.7555226758258624e-05, "Pretrain/Loss": 2.070512056350708, "Pretrain/Loss (Raw)": 1.9611274003982544, "Pretrain/Step": 4610, "Pretrain/Step Time": 8.559067422524095} +{"Pretrain/Learning Rate": 2.7546781199927667e-05, "Pretrain/Loss": 2.0719456672668457, "Pretrain/Loss (Raw)": 2.170804262161255, "Pretrain/Step": 4611, "Pretrain/Step Time": 8.554495979100466} +{"Pretrain/Learning Rate": 2.7538335347889892e-05, "Pretrain/Loss": 2.0726988315582275, "Pretrain/Loss (Raw)": 2.1413919925689697, "Pretrain/Step": 4612, "Pretrain/Step Time": 8.551755608990788} +{"Pretrain/Learning Rate": 2.752988920311933e-05, "Pretrain/Loss": 2.071959972381592, "Pretrain/Loss (Raw)": 1.9465042352676392, "Pretrain/Step": 4613, "Pretrain/Step Time": 8.553187768906355} +{"Pretrain/Learning Rate": 2.7521442766590027e-05, "Pretrain/Loss": 2.074178695678711, "Pretrain/Loss (Raw)": 2.200326681137085, "Pretrain/Step": 4614, "Pretrain/Step Time": 8.550746640190482} +{"Pretrain/Learning Rate": 2.7512996039276055e-05, "Pretrain/Loss": 2.0740342140197754, "Pretrain/Loss (Raw)": 2.0022504329681396, "Pretrain/Step": 4615, "Pretrain/Step Time": 8.558522986248136} +{"Pretrain/Learning Rate": 2.7504549022151543e-05, "Pretrain/Loss": 2.074000835418701, "Pretrain/Loss (Raw)": 2.0575637817382812, "Pretrain/Step": 4616, "Pretrain/Step Time": 8.548733364790678} +{"Pretrain/Learning Rate": 2.749610171619063e-05, "Pretrain/Loss": 2.0760269165039062, "Pretrain/Loss (Raw)": 2.217747449874878, "Pretrain/Step": 4617, "Pretrain/Step Time": 8.545908767729998} +{"Pretrain/Learning Rate": 2.748765412236751e-05, "Pretrain/Loss": 2.07712984085083, "Pretrain/Loss (Raw)": 2.0568976402282715, "Pretrain/Step": 4618, "Pretrain/Step Time": 8.54606638662517} +{"Pretrain/Learning Rate": 2.747920624165639e-05, "Pretrain/Loss": 2.0781564712524414, "Pretrain/Loss (Raw)": 2.1894822120666504, "Pretrain/Step": 4619, "Pretrain/Step Time": 8.542943082749844} +{"Pretrain/Learning Rate": 2.7470758075031533e-05, "Pretrain/Loss": 2.07858943939209, "Pretrain/Loss (Raw)": 2.0880231857299805, "Pretrain/Step": 4620, "Pretrain/Step Time": 8.555115768685937} +{"Pretrain/Learning Rate": 2.7462309623467204e-05, "Pretrain/Loss": 2.0773391723632812, "Pretrain/Loss (Raw)": 1.9191880226135254, "Pretrain/Step": 4621, "Pretrain/Step Time": 8.55064007639885} +{"Pretrain/Learning Rate": 2.7453860887937732e-05, "Pretrain/Loss": 2.078461170196533, "Pretrain/Loss (Raw)": 2.191013813018799, "Pretrain/Step": 4622, "Pretrain/Step Time": 8.549807356670499} +{"Pretrain/Learning Rate": 2.7445411869417453e-05, "Pretrain/Loss": 2.0785555839538574, "Pretrain/Loss (Raw)": 2.264407157897949, "Pretrain/Step": 4623, "Pretrain/Step Time": 8.542921425774693} +{"Pretrain/Learning Rate": 2.7436962568880752e-05, "Pretrain/Loss": 2.0787220001220703, "Pretrain/Loss (Raw)": 2.147984743118286, "Pretrain/Step": 4624, "Pretrain/Step Time": 8.542182372882962} +{"Pretrain/Learning Rate": 2.7428512987302053e-05, "Pretrain/Loss": 2.079469919204712, "Pretrain/Loss (Raw)": 2.2560174465179443, "Pretrain/Step": 4625, "Pretrain/Step Time": 8.542656350880861} +{"Pretrain/Learning Rate": 2.7420063125655787e-05, "Pretrain/Loss": 2.0819125175476074, "Pretrain/Loss (Raw)": 2.0814993381500244, "Pretrain/Step": 4626, "Pretrain/Step Time": 8.549297150224447} +{"Pretrain/Learning Rate": 2.741161298491644e-05, "Pretrain/Loss": 2.081541061401367, "Pretrain/Loss (Raw)": 1.9760648012161255, "Pretrain/Step": 4627, "Pretrain/Step Time": 8.547496516257524} +{"Pretrain/Learning Rate": 2.7403162566058517e-05, "Pretrain/Loss": 2.081711769104004, "Pretrain/Loss (Raw)": 2.0175702571868896, "Pretrain/Step": 4628, "Pretrain/Step Time": 8.54583140835166} +{"Pretrain/Learning Rate": 2.7394711870056567e-05, "Pretrain/Loss": 2.082277536392212, "Pretrain/Loss (Raw)": 2.108804225921631, "Pretrain/Step": 4629, "Pretrain/Step Time": 8.544417472556233} +{"Pretrain/Learning Rate": 2.7386260897885156e-05, "Pretrain/Loss": 2.083566188812256, "Pretrain/Loss (Raw)": 2.1388556957244873, "Pretrain/Step": 4630, "Pretrain/Step Time": 8.547898199409246} +{"Pretrain/Learning Rate": 2.73778096505189e-05, "Pretrain/Loss": 2.083906650543213, "Pretrain/Loss (Raw)": 2.098863124847412, "Pretrain/Step": 4631, "Pretrain/Step Time": 8.546507146209478} +{"Pretrain/Learning Rate": 2.7369358128932422e-05, "Pretrain/Loss": 2.083820104598999, "Pretrain/Loss (Raw)": 2.170703411102295, "Pretrain/Step": 4632, "Pretrain/Step Time": 8.555023092776537} +{"Pretrain/Learning Rate": 2.7360906334100407e-05, "Pretrain/Loss": 2.081357479095459, "Pretrain/Loss (Raw)": 1.9493229389190674, "Pretrain/Step": 4633, "Pretrain/Step Time": 8.551321636885405} +{"Pretrain/Learning Rate": 2.7352454266997545e-05, "Pretrain/Loss": 2.0801634788513184, "Pretrain/Loss (Raw)": 2.0407931804656982, "Pretrain/Step": 4634, "Pretrain/Step Time": 8.553713085129857} +{"Pretrain/Learning Rate": 2.734400192859857e-05, "Pretrain/Loss": 2.0801239013671875, "Pretrain/Loss (Raw)": 2.069424867630005, "Pretrain/Step": 4635, "Pretrain/Step Time": 8.55350330658257} +{"Pretrain/Learning Rate": 2.7335549319878252e-05, "Pretrain/Loss": 2.078521251678467, "Pretrain/Loss (Raw)": 1.9545700550079346, "Pretrain/Step": 4636, "Pretrain/Step Time": 8.552835907787085} +{"Pretrain/Learning Rate": 2.7327096441811383e-05, "Pretrain/Loss": 2.078455686569214, "Pretrain/Loss (Raw)": 1.9285470247268677, "Pretrain/Step": 4637, "Pretrain/Step Time": 8.550351152196527} +{"Pretrain/Learning Rate": 2.7318643295372776e-05, "Pretrain/Loss": 2.079636335372925, "Pretrain/Loss (Raw)": 2.17004132270813, "Pretrain/Step": 4638, "Pretrain/Step Time": 8.55809048563242} +{"Pretrain/Learning Rate": 2.7310189881537307e-05, "Pretrain/Loss": 2.0800938606262207, "Pretrain/Loss (Raw)": 2.1442713737487793, "Pretrain/Step": 4639, "Pretrain/Step Time": 8.55903915502131} +{"Pretrain/Learning Rate": 2.7301736201279858e-05, "Pretrain/Loss": 2.079725742340088, "Pretrain/Loss (Raw)": 2.045511484146118, "Pretrain/Step": 4640, "Pretrain/Step Time": 8.566682325676084} +{"Pretrain/Learning Rate": 2.7293282255575335e-05, "Pretrain/Loss": 2.0808632373809814, "Pretrain/Loss (Raw)": 2.3049185276031494, "Pretrain/Step": 4641, "Pretrain/Step Time": 8.567679727450013} +{"Pretrain/Learning Rate": 2.7284828045398703e-05, "Pretrain/Loss": 2.081686019897461, "Pretrain/Loss (Raw)": 1.9982407093048096, "Pretrain/Step": 4642, "Pretrain/Step Time": 8.565772688016295} +{"Pretrain/Learning Rate": 2.7276373571724927e-05, "Pretrain/Loss": 2.080214738845825, "Pretrain/Loss (Raw)": 1.87563157081604, "Pretrain/Step": 4643, "Pretrain/Step Time": 8.567314950749278} +{"Pretrain/Learning Rate": 2.7267918835529033e-05, "Pretrain/Loss": 2.080813407897949, "Pretrain/Loss (Raw)": 2.0029685497283936, "Pretrain/Step": 4644, "Pretrain/Step Time": 8.56823444366455} +{"Pretrain/Learning Rate": 2.725946383778605e-05, "Pretrain/Loss": 2.081547975540161, "Pretrain/Loss (Raw)": 2.170694351196289, "Pretrain/Step": 4645, "Pretrain/Step Time": 8.571739511564374} +{"Pretrain/Learning Rate": 2.7251008579471044e-05, "Pretrain/Loss": 2.0826034545898438, "Pretrain/Loss (Raw)": 2.1619949340820312, "Pretrain/Step": 4646, "Pretrain/Step Time": 8.558754660189152} +{"Pretrain/Learning Rate": 2.7242553061559123e-05, "Pretrain/Loss": 2.080061912536621, "Pretrain/Loss (Raw)": 1.85715913772583, "Pretrain/Step": 4647, "Pretrain/Step Time": 8.561138585209846} +{"Pretrain/Learning Rate": 2.7234097285025424e-05, "Pretrain/Loss": 2.080000877380371, "Pretrain/Loss (Raw)": 2.1626877784729004, "Pretrain/Step": 4648, "Pretrain/Step Time": 8.558675739914179} +{"Pretrain/Learning Rate": 2.7225641250845085e-05, "Pretrain/Loss": 2.079603672027588, "Pretrain/Loss (Raw)": 1.9907310009002686, "Pretrain/Step": 4649, "Pretrain/Step Time": 8.561760753393173} +{"Pretrain/Learning Rate": 2.7217184959993326e-05, "Pretrain/Loss": 2.0798497200012207, "Pretrain/Loss (Raw)": 2.129713296890259, "Pretrain/Step": 4650, "Pretrain/Step Time": 8.57295422628522} +{"Pretrain/Learning Rate": 2.7208728413445332e-05, "Pretrain/Loss": 2.080815315246582, "Pretrain/Loss (Raw)": 2.1335041522979736, "Pretrain/Step": 4651, "Pretrain/Step Time": 8.568536780774593} +{"Pretrain/Learning Rate": 2.720027161217638e-05, "Pretrain/Loss": 2.081986427307129, "Pretrain/Loss (Raw)": 2.1366350650787354, "Pretrain/Step": 4652, "Pretrain/Step Time": 8.55738396756351} +{"Pretrain/Learning Rate": 2.7191814557161736e-05, "Pretrain/Loss": 2.083242416381836, "Pretrain/Loss (Raw)": 2.2580294609069824, "Pretrain/Step": 4653, "Pretrain/Step Time": 8.554715778678656} +{"Pretrain/Learning Rate": 2.7183357249376712e-05, "Pretrain/Loss": 2.0837836265563965, "Pretrain/Loss (Raw)": 2.0961108207702637, "Pretrain/Step": 4654, "Pretrain/Step Time": 8.553909197449684} +{"Pretrain/Learning Rate": 2.7174899689796636e-05, "Pretrain/Loss": 2.0844240188598633, "Pretrain/Loss (Raw)": 2.027200937271118, "Pretrain/Step": 4655, "Pretrain/Step Time": 8.553796844556928} +{"Pretrain/Learning Rate": 2.7166441879396887e-05, "Pretrain/Loss": 2.0872080326080322, "Pretrain/Loss (Raw)": 2.322936773300171, "Pretrain/Step": 4656, "Pretrain/Step Time": 8.562492126598954} +{"Pretrain/Learning Rate": 2.7157983819152848e-05, "Pretrain/Loss": 2.087073564529419, "Pretrain/Loss (Raw)": 2.023599624633789, "Pretrain/Step": 4657, "Pretrain/Step Time": 8.565057948231697} +{"Pretrain/Learning Rate": 2.714952551003994e-05, "Pretrain/Loss": 2.0877673625946045, "Pretrain/Loss (Raw)": 2.100155830383301, "Pretrain/Step": 4658, "Pretrain/Step Time": 8.560156226158142} +{"Pretrain/Learning Rate": 2.714106695303363e-05, "Pretrain/Loss": 2.088364362716675, "Pretrain/Loss (Raw)": 2.0748255252838135, "Pretrain/Step": 4659, "Pretrain/Step Time": 8.56460084207356} +{"Pretrain/Learning Rate": 2.7132608149109383e-05, "Pretrain/Loss": 2.0898334980010986, "Pretrain/Loss (Raw)": 2.1925787925720215, "Pretrain/Step": 4660, "Pretrain/Step Time": 8.559219244867563} +{"Pretrain/Learning Rate": 2.7124149099242724e-05, "Pretrain/Loss": 2.0918383598327637, "Pretrain/Loss (Raw)": 2.2738194465637207, "Pretrain/Step": 4661, "Pretrain/Step Time": 8.55988317169249} +{"Pretrain/Learning Rate": 2.7115689804409174e-05, "Pretrain/Loss": 2.0930609703063965, "Pretrain/Loss (Raw)": 2.171076536178589, "Pretrain/Step": 4662, "Pretrain/Step Time": 8.564779506996274} +{"Pretrain/Learning Rate": 2.710723026558431e-05, "Pretrain/Loss": 2.091108560562134, "Pretrain/Loss (Raw)": 2.092709541320801, "Pretrain/Step": 4663, "Pretrain/Step Time": 8.562403747811913} +{"Pretrain/Learning Rate": 2.709877048374371e-05, "Pretrain/Loss": 2.090808868408203, "Pretrain/Loss (Raw)": 1.9888641834259033, "Pretrain/Step": 4664, "Pretrain/Step Time": 8.556163381785154} +{"Pretrain/Learning Rate": 2.709031045986302e-05, "Pretrain/Loss": 2.0887928009033203, "Pretrain/Loss (Raw)": 2.055927276611328, "Pretrain/Step": 4665, "Pretrain/Step Time": 8.55470971390605} +{"Pretrain/Learning Rate": 2.708185019491788e-05, "Pretrain/Loss": 2.088230609893799, "Pretrain/Loss (Raw)": 1.9091945886611938, "Pretrain/Step": 4666, "Pretrain/Step Time": 8.56174618192017} +{"Pretrain/Learning Rate": 2.707338968988396e-05, "Pretrain/Loss": 2.0915160179138184, "Pretrain/Loss (Raw)": 2.354510545730591, "Pretrain/Step": 4667, "Pretrain/Step Time": 8.554471438750625} +{"Pretrain/Learning Rate": 2.7064928945736974e-05, "Pretrain/Loss": 2.0941321849823, "Pretrain/Loss (Raw)": 2.216899871826172, "Pretrain/Step": 4668, "Pretrain/Step Time": 8.557099167257547} +{"Pretrain/Learning Rate": 2.7056467963452646e-05, "Pretrain/Loss": 2.0937509536743164, "Pretrain/Loss (Raw)": 2.1145265102386475, "Pretrain/Step": 4669, "Pretrain/Step Time": 8.561590569093823} +{"Pretrain/Learning Rate": 2.704800674400675e-05, "Pretrain/Loss": 2.0894837379455566, "Pretrain/Loss (Raw)": 1.6254197359085083, "Pretrain/Step": 4670, "Pretrain/Step Time": 8.550971066579223} +{"Pretrain/Learning Rate": 2.703954528837506e-05, "Pretrain/Loss": 2.0870981216430664, "Pretrain/Loss (Raw)": 1.788108229637146, "Pretrain/Step": 4671, "Pretrain/Step Time": 8.55396201647818} +{"Pretrain/Learning Rate": 2.7031083597533402e-05, "Pretrain/Loss": 2.085827112197876, "Pretrain/Loss (Raw)": 1.8534425497055054, "Pretrain/Step": 4672, "Pretrain/Step Time": 8.552233686670661} +{"Pretrain/Learning Rate": 2.702262167245761e-05, "Pretrain/Loss": 2.0840671062469482, "Pretrain/Loss (Raw)": 2.114306688308716, "Pretrain/Step": 4673, "Pretrain/Step Time": 8.552963275462389} +{"Pretrain/Learning Rate": 2.7014159514123555e-05, "Pretrain/Loss": 2.082066059112549, "Pretrain/Loss (Raw)": 2.0964415073394775, "Pretrain/Step": 4674, "Pretrain/Step Time": 8.555207777768373} +{"Pretrain/Learning Rate": 2.7005697123507134e-05, "Pretrain/Loss": 2.082855224609375, "Pretrain/Loss (Raw)": 2.1696107387542725, "Pretrain/Step": 4675, "Pretrain/Step Time": 8.55579517222941} +{"Pretrain/Learning Rate": 2.6997234501584267e-05, "Pretrain/Loss": 2.084188461303711, "Pretrain/Loss (Raw)": 2.1796350479125977, "Pretrain/Step": 4676, "Pretrain/Step Time": 8.547066373750567} +{"Pretrain/Learning Rate": 2.6988771649330906e-05, "Pretrain/Loss": 2.0840868949890137, "Pretrain/Loss (Raw)": 2.102248191833496, "Pretrain/Step": 4677, "Pretrain/Step Time": 8.548388563096523} +{"Pretrain/Learning Rate": 2.6980308567723035e-05, "Pretrain/Loss": 2.083233594894409, "Pretrain/Loss (Raw)": 2.0906057357788086, "Pretrain/Step": 4678, "Pretrain/Step Time": 8.548523258417845} +{"Pretrain/Learning Rate": 2.697184525773664e-05, "Pretrain/Loss": 2.0795376300811768, "Pretrain/Loss (Raw)": 1.7988083362579346, "Pretrain/Step": 4679, "Pretrain/Step Time": 8.547767071053386} +{"Pretrain/Learning Rate": 2.6963381720347764e-05, "Pretrain/Loss": 2.0792083740234375, "Pretrain/Loss (Raw)": 2.0328407287597656, "Pretrain/Step": 4680, "Pretrain/Step Time": 8.548524031415582} +{"Pretrain/Learning Rate": 2.6954917956532455e-05, "Pretrain/Loss": 2.079246997833252, "Pretrain/Loss (Raw)": 2.088660955429077, "Pretrain/Step": 4681, "Pretrain/Step Time": 8.553162656724453} +{"Pretrain/Learning Rate": 2.6946453967266792e-05, "Pretrain/Loss": 2.0798213481903076, "Pretrain/Loss (Raw)": 2.0513346195220947, "Pretrain/Step": 4682, "Pretrain/Step Time": 8.544236911460757} +{"Pretrain/Learning Rate": 2.693798975352689e-05, "Pretrain/Loss": 2.0826187133789062, "Pretrain/Loss (Raw)": 2.541680335998535, "Pretrain/Step": 4683, "Pretrain/Step Time": 8.554796332493424} +{"Pretrain/Learning Rate": 2.6929525316288874e-05, "Pretrain/Loss": 2.0824129581451416, "Pretrain/Loss (Raw)": 2.096686601638794, "Pretrain/Step": 4684, "Pretrain/Step Time": 8.55227368697524} +{"Pretrain/Learning Rate": 2.692106065652891e-05, "Pretrain/Loss": 2.0840907096862793, "Pretrain/Loss (Raw)": 2.17883563041687, "Pretrain/Step": 4685, "Pretrain/Step Time": 8.552776426076889} +{"Pretrain/Learning Rate": 2.6912595775223175e-05, "Pretrain/Loss": 2.0828375816345215, "Pretrain/Loss (Raw)": 2.21817684173584, "Pretrain/Step": 4686, "Pretrain/Step Time": 8.550770826637745} +{"Pretrain/Learning Rate": 2.6904130673347887e-05, "Pretrain/Loss": 2.0819954872131348, "Pretrain/Loss (Raw)": 2.050978422164917, "Pretrain/Step": 4687, "Pretrain/Step Time": 8.561101995408535} +{"Pretrain/Learning Rate": 2.6895665351879274e-05, "Pretrain/Loss": 2.0802407264709473, "Pretrain/Loss (Raw)": 1.9852935075759888, "Pretrain/Step": 4688, "Pretrain/Step Time": 8.545914001762867} +{"Pretrain/Learning Rate": 2.68871998117936e-05, "Pretrain/Loss": 2.0800724029541016, "Pretrain/Loss (Raw)": 1.9440244436264038, "Pretrain/Step": 4689, "Pretrain/Step Time": 8.55353725515306} +{"Pretrain/Learning Rate": 2.687873405406715e-05, "Pretrain/Loss": 2.0818283557891846, "Pretrain/Loss (Raw)": 2.3169007301330566, "Pretrain/Step": 4690, "Pretrain/Step Time": 8.558326467871666} +{"Pretrain/Learning Rate": 2.6870268079676237e-05, "Pretrain/Loss": 2.082258701324463, "Pretrain/Loss (Raw)": 1.9930009841918945, "Pretrain/Step": 4691, "Pretrain/Step Time": 8.552916711196303} +{"Pretrain/Learning Rate": 2.6861801889597193e-05, "Pretrain/Loss": 2.0807933807373047, "Pretrain/Loss (Raw)": 1.857539415359497, "Pretrain/Step": 4692, "Pretrain/Step Time": 8.554158568382263} +{"Pretrain/Learning Rate": 2.685333548480639e-05, "Pretrain/Loss": 2.080631732940674, "Pretrain/Loss (Raw)": 1.9322336912155151, "Pretrain/Step": 4693, "Pretrain/Step Time": 8.55959516018629} +{"Pretrain/Learning Rate": 2.68448688662802e-05, "Pretrain/Loss": 2.080777406692505, "Pretrain/Loss (Raw)": 1.9731686115264893, "Pretrain/Step": 4694, "Pretrain/Step Time": 8.551563451066613} +{"Pretrain/Learning Rate": 2.683640203499504e-05, "Pretrain/Loss": 2.080941915512085, "Pretrain/Loss (Raw)": 2.0923469066619873, "Pretrain/Step": 4695, "Pretrain/Step Time": 8.554995192214847} +{"Pretrain/Learning Rate": 2.682793499192734e-05, "Pretrain/Loss": 2.0792832374572754, "Pretrain/Loss (Raw)": 2.059645891189575, "Pretrain/Step": 4696, "Pretrain/Step Time": 8.556333873420954} +{"Pretrain/Learning Rate": 2.6819467738053572e-05, "Pretrain/Loss": 2.078256607055664, "Pretrain/Loss (Raw)": 2.1925721168518066, "Pretrain/Step": 4697, "Pretrain/Step Time": 8.55994351580739} +{"Pretrain/Learning Rate": 2.6811000274350205e-05, "Pretrain/Loss": 2.079052448272705, "Pretrain/Loss (Raw)": 2.076634168624878, "Pretrain/Step": 4698, "Pretrain/Step Time": 8.566812727600336} +{"Pretrain/Learning Rate": 2.680253260179375e-05, "Pretrain/Loss": 2.079134464263916, "Pretrain/Loss (Raw)": 2.0786170959472656, "Pretrain/Step": 4699, "Pretrain/Step Time": 8.573790738359094} +{"Pretrain/Learning Rate": 2.6794064721360752e-05, "Pretrain/Loss": 2.0801198482513428, "Pretrain/Loss (Raw)": 2.1295177936553955, "Pretrain/Step": 4700, "Pretrain/Step Time": 8.551847327500582} +{"Pretrain/Learning Rate": 2.6785596634027745e-05, "Pretrain/Loss": 2.080397367477417, "Pretrain/Loss (Raw)": 1.9775155782699585, "Pretrain/Step": 4701, "Pretrain/Step Time": 8.55240143276751} +{"Pretrain/Learning Rate": 2.677712834077133e-05, "Pretrain/Loss": 2.0808358192443848, "Pretrain/Loss (Raw)": 2.103672504425049, "Pretrain/Step": 4702, "Pretrain/Step Time": 8.550016963854432} +{"Pretrain/Learning Rate": 2.676865984256809e-05, "Pretrain/Loss": 2.0792298316955566, "Pretrain/Loss (Raw)": 2.0256357192993164, "Pretrain/Step": 4703, "Pretrain/Step Time": 8.549476390704513} +{"Pretrain/Learning Rate": 2.6760191140394668e-05, "Pretrain/Loss": 2.080322265625, "Pretrain/Loss (Raw)": 2.158355951309204, "Pretrain/Step": 4704, "Pretrain/Step Time": 8.555286774411798} +{"Pretrain/Learning Rate": 2.675172223522771e-05, "Pretrain/Loss": 2.07983660697937, "Pretrain/Loss (Raw)": 2.0948851108551025, "Pretrain/Step": 4705, "Pretrain/Step Time": 8.561585703864694} +{"Pretrain/Learning Rate": 2.6743253128043887e-05, "Pretrain/Loss": 2.080146312713623, "Pretrain/Loss (Raw)": 2.1128082275390625, "Pretrain/Step": 4706, "Pretrain/Step Time": 8.556424845010042} +{"Pretrain/Learning Rate": 2.6734783819819903e-05, "Pretrain/Loss": 2.082242965698242, "Pretrain/Loss (Raw)": 2.195570230484009, "Pretrain/Step": 4707, "Pretrain/Step Time": 8.558641413226724} +{"Pretrain/Learning Rate": 2.6726314311532467e-05, "Pretrain/Loss": 2.083515167236328, "Pretrain/Loss (Raw)": 1.9979140758514404, "Pretrain/Step": 4708, "Pretrain/Step Time": 8.55724391900003} +{"Pretrain/Learning Rate": 2.671784460415834e-05, "Pretrain/Loss": 2.0830931663513184, "Pretrain/Loss (Raw)": 2.129859209060669, "Pretrain/Step": 4709, "Pretrain/Step Time": 8.557767232879996} +{"Pretrain/Learning Rate": 2.6709374698674267e-05, "Pretrain/Loss": 2.084825038909912, "Pretrain/Loss (Raw)": 2.186161756515503, "Pretrain/Step": 4710, "Pretrain/Step Time": 8.5531873870641} +{"Pretrain/Learning Rate": 2.670090459605706e-05, "Pretrain/Loss": 2.086738109588623, "Pretrain/Loss (Raw)": 2.0677084922790527, "Pretrain/Step": 4711, "Pretrain/Step Time": 8.549211744219065} +{"Pretrain/Learning Rate": 2.6692434297283514e-05, "Pretrain/Loss": 2.0840234756469727, "Pretrain/Loss (Raw)": 1.8449163436889648, "Pretrain/Step": 4712, "Pretrain/Step Time": 8.559690587222576} +{"Pretrain/Learning Rate": 2.6683963803330468e-05, "Pretrain/Loss": 2.0870301723480225, "Pretrain/Loss (Raw)": 2.0746068954467773, "Pretrain/Step": 4713, "Pretrain/Step Time": 8.56149503774941} +{"Pretrain/Learning Rate": 2.6675493115174786e-05, "Pretrain/Loss": 2.0881705284118652, "Pretrain/Loss (Raw)": 2.026412010192871, "Pretrain/Step": 4714, "Pretrain/Step Time": 8.559688655659556} +{"Pretrain/Learning Rate": 2.6667022233793342e-05, "Pretrain/Loss": 2.084575653076172, "Pretrain/Loss (Raw)": 2.2727761268615723, "Pretrain/Step": 4715, "Pretrain/Step Time": 8.562619833275676} +{"Pretrain/Learning Rate": 2.6658551160163036e-05, "Pretrain/Loss": 2.085327625274658, "Pretrain/Loss (Raw)": 1.8038151264190674, "Pretrain/Step": 4716, "Pretrain/Step Time": 8.555090095847845} +{"Pretrain/Learning Rate": 2.6650079895260798e-05, "Pretrain/Loss": 2.0899760723114014, "Pretrain/Loss (Raw)": 2.3682827949523926, "Pretrain/Step": 4717, "Pretrain/Step Time": 8.553832650184631} +{"Pretrain/Learning Rate": 2.664160844006357e-05, "Pretrain/Loss": 2.090367317199707, "Pretrain/Loss (Raw)": 1.977189540863037, "Pretrain/Step": 4718, "Pretrain/Step Time": 8.555032724514604} +{"Pretrain/Learning Rate": 2.6633136795548326e-05, "Pretrain/Loss": 2.0884320735931396, "Pretrain/Loss (Raw)": 1.9193177223205566, "Pretrain/Step": 4719, "Pretrain/Step Time": 8.556458484381437} +{"Pretrain/Learning Rate": 2.662466496269204e-05, "Pretrain/Loss": 2.0866992473602295, "Pretrain/Loss (Raw)": 1.9936312437057495, "Pretrain/Step": 4720, "Pretrain/Step Time": 8.554837122559547} +{"Pretrain/Learning Rate": 2.661619294247174e-05, "Pretrain/Loss": 2.0868964195251465, "Pretrain/Loss (Raw)": 2.1178858280181885, "Pretrain/Step": 4721, "Pretrain/Step Time": 8.556330485269427} +{"Pretrain/Learning Rate": 2.6607720735864454e-05, "Pretrain/Loss": 2.086751699447632, "Pretrain/Loss (Raw)": 2.098104238510132, "Pretrain/Step": 4722, "Pretrain/Step Time": 8.552331786602736} +{"Pretrain/Learning Rate": 2.6599248343847244e-05, "Pretrain/Loss": 2.086869239807129, "Pretrain/Loss (Raw)": 2.1541101932525635, "Pretrain/Step": 4723, "Pretrain/Step Time": 8.550594417378306} +{"Pretrain/Learning Rate": 2.6590775767397174e-05, "Pretrain/Loss": 2.0854663848876953, "Pretrain/Loss (Raw)": 1.9762266874313354, "Pretrain/Step": 4724, "Pretrain/Step Time": 8.556944565847516} +{"Pretrain/Learning Rate": 2.6582303007491345e-05, "Pretrain/Loss": 2.0837440490722656, "Pretrain/Loss (Raw)": 1.9724996089935303, "Pretrain/Step": 4725, "Pretrain/Step Time": 8.55607569590211} +{"Pretrain/Learning Rate": 2.6573830065106874e-05, "Pretrain/Loss": 2.083237648010254, "Pretrain/Loss (Raw)": 2.050294876098633, "Pretrain/Step": 4726, "Pretrain/Step Time": 8.554093865677714} +{"Pretrain/Learning Rate": 2.6565356941220908e-05, "Pretrain/Loss": 2.082955837249756, "Pretrain/Loss (Raw)": 2.0400006771087646, "Pretrain/Step": 4727, "Pretrain/Step Time": 8.549114730209112} +{"Pretrain/Learning Rate": 2.6556883636810605e-05, "Pretrain/Loss": 2.0839109420776367, "Pretrain/Loss (Raw)": 2.1653835773468018, "Pretrain/Step": 4728, "Pretrain/Step Time": 8.553117401897907} +{"Pretrain/Learning Rate": 2.6548410152853142e-05, "Pretrain/Loss": 2.083192825317383, "Pretrain/Loss (Raw)": 2.232988119125366, "Pretrain/Step": 4729, "Pretrain/Step Time": 8.553819803521037} +{"Pretrain/Learning Rate": 2.6539936490325725e-05, "Pretrain/Loss": 2.0825376510620117, "Pretrain/Loss (Raw)": 1.9695123434066772, "Pretrain/Step": 4730, "Pretrain/Step Time": 8.550106164067984} +{"Pretrain/Learning Rate": 2.6531462650205575e-05, "Pretrain/Loss": 2.0820975303649902, "Pretrain/Loss (Raw)": 2.0313167572021484, "Pretrain/Step": 4731, "Pretrain/Step Time": 8.5518371257931} +{"Pretrain/Learning Rate": 2.6522988633469938e-05, "Pretrain/Loss": 2.082960605621338, "Pretrain/Loss (Raw)": 2.2593657970428467, "Pretrain/Step": 4732, "Pretrain/Step Time": 8.552724659442902} +{"Pretrain/Learning Rate": 2.6514514441096066e-05, "Pretrain/Loss": 2.0813422203063965, "Pretrain/Loss (Raw)": 1.935571551322937, "Pretrain/Step": 4733, "Pretrain/Step Time": 8.552785428240895} +{"Pretrain/Learning Rate": 2.650604007406126e-05, "Pretrain/Loss": 2.0797977447509766, "Pretrain/Loss (Raw)": 1.9470678567886353, "Pretrain/Step": 4734, "Pretrain/Step Time": 8.55287210084498} +{"Pretrain/Learning Rate": 2.6497565533342816e-05, "Pretrain/Loss": 2.0805788040161133, "Pretrain/Loss (Raw)": 2.2247321605682373, "Pretrain/Step": 4735, "Pretrain/Step Time": 8.551094457507133} +{"Pretrain/Learning Rate": 2.6489090819918057e-05, "Pretrain/Loss": 2.080127000808716, "Pretrain/Loss (Raw)": 2.102923631668091, "Pretrain/Step": 4736, "Pretrain/Step Time": 8.553014138713479} +{"Pretrain/Learning Rate": 2.6480615934764323e-05, "Pretrain/Loss": 2.0806643962860107, "Pretrain/Loss (Raw)": 2.1032750606536865, "Pretrain/Step": 4737, "Pretrain/Step Time": 8.553492138162255} +{"Pretrain/Learning Rate": 2.6472140878858994e-05, "Pretrain/Loss": 2.0798254013061523, "Pretrain/Loss (Raw)": 1.853763222694397, "Pretrain/Step": 4738, "Pretrain/Step Time": 8.552216041833162} +{"Pretrain/Learning Rate": 2.646366565317943e-05, "Pretrain/Loss": 2.078103542327881, "Pretrain/Loss (Raw)": 1.9503902196884155, "Pretrain/Step": 4739, "Pretrain/Step Time": 8.557528091594577} +{"Pretrain/Learning Rate": 2.6455190258703056e-05, "Pretrain/Loss": 2.0785295963287354, "Pretrain/Loss (Raw)": 2.1959235668182373, "Pretrain/Step": 4740, "Pretrain/Step Time": 8.560299875214696} +{"Pretrain/Learning Rate": 2.644671469640728e-05, "Pretrain/Loss": 2.080045223236084, "Pretrain/Loss (Raw)": 2.1404874324798584, "Pretrain/Step": 4741, "Pretrain/Step Time": 8.557366689667106} +{"Pretrain/Learning Rate": 2.6438238967269546e-05, "Pretrain/Loss": 2.0800914764404297, "Pretrain/Loss (Raw)": 2.2062771320343018, "Pretrain/Step": 4742, "Pretrain/Step Time": 8.563707668334246} +{"Pretrain/Learning Rate": 2.6429763072267317e-05, "Pretrain/Loss": 2.0813956260681152, "Pretrain/Loss (Raw)": 2.1691577434539795, "Pretrain/Step": 4743, "Pretrain/Step Time": 8.556829415261745} +{"Pretrain/Learning Rate": 2.642128701237807e-05, "Pretrain/Loss": 2.080686330795288, "Pretrain/Loss (Raw)": 1.9668004512786865, "Pretrain/Step": 4744, "Pretrain/Step Time": 8.561299204826355} +{"Pretrain/Learning Rate": 2.641281078857932e-05, "Pretrain/Loss": 2.079111337661743, "Pretrain/Loss (Raw)": 2.0161304473876953, "Pretrain/Step": 4745, "Pretrain/Step Time": 8.562199141830206} +{"Pretrain/Learning Rate": 2.6404334401848558e-05, "Pretrain/Loss": 2.079117774963379, "Pretrain/Loss (Raw)": 2.0577492713928223, "Pretrain/Step": 4746, "Pretrain/Step Time": 8.561067009344697} +{"Pretrain/Learning Rate": 2.6395857853163346e-05, "Pretrain/Loss": 2.079054355621338, "Pretrain/Loss (Raw)": 2.181321620941162, "Pretrain/Step": 4747, "Pretrain/Step Time": 8.563880929723382} +{"Pretrain/Learning Rate": 2.6387381143501217e-05, "Pretrain/Loss": 2.0792112350463867, "Pretrain/Loss (Raw)": 2.1081204414367676, "Pretrain/Step": 4748, "Pretrain/Step Time": 8.563617642968893} +{"Pretrain/Learning Rate": 2.6378904273839765e-05, "Pretrain/Loss": 2.0811824798583984, "Pretrain/Loss (Raw)": 2.171508312225342, "Pretrain/Step": 4749, "Pretrain/Step Time": 8.567011358216405} +{"Pretrain/Learning Rate": 2.6370427245156574e-05, "Pretrain/Loss": 2.0812783241271973, "Pretrain/Loss (Raw)": 2.203306198120117, "Pretrain/Step": 4750, "Pretrain/Step Time": 8.563632948324084} +{"Pretrain/Learning Rate": 2.6361950058429257e-05, "Pretrain/Loss": 2.0794317722320557, "Pretrain/Loss (Raw)": 2.0280258655548096, "Pretrain/Step": 4751, "Pretrain/Step Time": 8.56510265916586} +{"Pretrain/Learning Rate": 2.635347271463544e-05, "Pretrain/Loss": 2.0788416862487793, "Pretrain/Loss (Raw)": 2.0724849700927734, "Pretrain/Step": 4752, "Pretrain/Step Time": 8.564213631674647} +{"Pretrain/Learning Rate": 2.6344995214752772e-05, "Pretrain/Loss": 2.078329563140869, "Pretrain/Loss (Raw)": 2.190441370010376, "Pretrain/Step": 4753, "Pretrain/Step Time": 8.567316882312298} +{"Pretrain/Learning Rate": 2.6336517559758915e-05, "Pretrain/Loss": 2.0775742530822754, "Pretrain/Loss (Raw)": 1.9847933053970337, "Pretrain/Step": 4754, "Pretrain/Step Time": 8.564021805301309} +{"Pretrain/Learning Rate": 2.632803975063156e-05, "Pretrain/Loss": 2.0780985355377197, "Pretrain/Loss (Raw)": 2.0431947708129883, "Pretrain/Step": 4755, "Pretrain/Step Time": 8.562854267656803} +{"Pretrain/Learning Rate": 2.6319561788348402e-05, "Pretrain/Loss": 2.0786080360412598, "Pretrain/Loss (Raw)": 2.0828123092651367, "Pretrain/Step": 4756, "Pretrain/Step Time": 8.568304225802422} +{"Pretrain/Learning Rate": 2.6311083673887154e-05, "Pretrain/Loss": 2.0791006088256836, "Pretrain/Loss (Raw)": 2.171837329864502, "Pretrain/Step": 4757, "Pretrain/Step Time": 8.566528076305985} +{"Pretrain/Learning Rate": 2.6302605408225572e-05, "Pretrain/Loss": 2.07792592048645, "Pretrain/Loss (Raw)": 1.9885075092315674, "Pretrain/Step": 4758, "Pretrain/Step Time": 8.563833681866527} +{"Pretrain/Learning Rate": 2.6294126992341382e-05, "Pretrain/Loss": 2.077420711517334, "Pretrain/Loss (Raw)": 2.0341598987579346, "Pretrain/Step": 4759, "Pretrain/Step Time": 8.567545086145401} +{"Pretrain/Learning Rate": 2.628564842721238e-05, "Pretrain/Loss": 2.0762038230895996, "Pretrain/Loss (Raw)": 2.0149810314178467, "Pretrain/Step": 4760, "Pretrain/Step Time": 8.565818350762129} +{"Pretrain/Learning Rate": 2.6277169713816337e-05, "Pretrain/Loss": 2.07724666595459, "Pretrain/Loss (Raw)": 2.082773208618164, "Pretrain/Step": 4761, "Pretrain/Step Time": 8.565944412723184} +{"Pretrain/Learning Rate": 2.6268690853131067e-05, "Pretrain/Loss": 2.075901985168457, "Pretrain/Loss (Raw)": 1.8687217235565186, "Pretrain/Step": 4762, "Pretrain/Step Time": 8.559622768312693} +{"Pretrain/Learning Rate": 2.6260211846134387e-05, "Pretrain/Loss": 2.076439380645752, "Pretrain/Loss (Raw)": 2.1381783485412598, "Pretrain/Step": 4763, "Pretrain/Step Time": 8.55831291899085} +{"Pretrain/Learning Rate": 2.6251732693804144e-05, "Pretrain/Loss": 2.078892946243286, "Pretrain/Loss (Raw)": 2.2686290740966797, "Pretrain/Step": 4764, "Pretrain/Step Time": 8.556822521612048} +{"Pretrain/Learning Rate": 2.6243253397118178e-05, "Pretrain/Loss": 2.080918550491333, "Pretrain/Loss (Raw)": 2.187807083129883, "Pretrain/Step": 4765, "Pretrain/Step Time": 8.55718140117824} +{"Pretrain/Learning Rate": 2.6234773957054383e-05, "Pretrain/Loss": 2.0802745819091797, "Pretrain/Loss (Raw)": 2.087663173675537, "Pretrain/Step": 4766, "Pretrain/Step Time": 8.556413389742374} +{"Pretrain/Learning Rate": 2.6226294374590638e-05, "Pretrain/Loss": 2.078747272491455, "Pretrain/Loss (Raw)": 1.9487383365631104, "Pretrain/Step": 4767, "Pretrain/Step Time": 8.556365698575974} +{"Pretrain/Learning Rate": 2.6217814650704835e-05, "Pretrain/Loss": 2.0790762901306152, "Pretrain/Loss (Raw)": 2.087649345397949, "Pretrain/Step": 4768, "Pretrain/Step Time": 8.543000726029277} +{"Pretrain/Learning Rate": 2.620933478637492e-05, "Pretrain/Loss": 2.079030990600586, "Pretrain/Loss (Raw)": 2.2991139888763428, "Pretrain/Step": 4769, "Pretrain/Step Time": 8.540897686034441} +{"Pretrain/Learning Rate": 2.620085478257881e-05, "Pretrain/Loss": 2.080141067504883, "Pretrain/Loss (Raw)": 2.140302896499634, "Pretrain/Step": 4770, "Pretrain/Step Time": 8.543433926999569} +{"Pretrain/Learning Rate": 2.6192374640294477e-05, "Pretrain/Loss": 2.082387924194336, "Pretrain/Loss (Raw)": 2.163259744644165, "Pretrain/Step": 4771, "Pretrain/Step Time": 8.539183361455798} +{"Pretrain/Learning Rate": 2.618389436049987e-05, "Pretrain/Loss": 2.0826802253723145, "Pretrain/Loss (Raw)": 2.040383815765381, "Pretrain/Step": 4772, "Pretrain/Step Time": 8.547848476096988} +{"Pretrain/Learning Rate": 2.6175413944172995e-05, "Pretrain/Loss": 2.0817415714263916, "Pretrain/Loss (Raw)": 2.0505316257476807, "Pretrain/Step": 4773, "Pretrain/Step Time": 8.541093651205301} +{"Pretrain/Learning Rate": 2.6166933392291843e-05, "Pretrain/Loss": 2.080936908721924, "Pretrain/Loss (Raw)": 2.059002637863159, "Pretrain/Step": 4774, "Pretrain/Step Time": 8.550120487809181} +{"Pretrain/Learning Rate": 2.6158452705834434e-05, "Pretrain/Loss": 2.0821104049682617, "Pretrain/Loss (Raw)": 2.0073726177215576, "Pretrain/Step": 4775, "Pretrain/Step Time": 8.550361257046461} +{"Pretrain/Learning Rate": 2.6149971885778795e-05, "Pretrain/Loss": 2.0799736976623535, "Pretrain/Loss (Raw)": 1.8891814947128296, "Pretrain/Step": 4776, "Pretrain/Step Time": 8.549276266247034} +{"Pretrain/Learning Rate": 2.6141490933102987e-05, "Pretrain/Loss": 2.079103946685791, "Pretrain/Loss (Raw)": 1.8793973922729492, "Pretrain/Step": 4777, "Pretrain/Step Time": 8.548333574086428} +{"Pretrain/Learning Rate": 2.6133009848785062e-05, "Pretrain/Loss": 2.078817844390869, "Pretrain/Loss (Raw)": 2.093111038208008, "Pretrain/Step": 4778, "Pretrain/Step Time": 8.544559888541698} +{"Pretrain/Learning Rate": 2.6124528633803103e-05, "Pretrain/Loss": 2.078105926513672, "Pretrain/Loss (Raw)": 2.0423755645751953, "Pretrain/Step": 4779, "Pretrain/Step Time": 8.542550878599286} +{"Pretrain/Learning Rate": 2.61160472891352e-05, "Pretrain/Loss": 2.077993869781494, "Pretrain/Loss (Raw)": 2.1222963333129883, "Pretrain/Step": 4780, "Pretrain/Step Time": 8.548946674913168} +{"Pretrain/Learning Rate": 2.6107565815759473e-05, "Pretrain/Loss": 2.0758936405181885, "Pretrain/Loss (Raw)": 1.989180088043213, "Pretrain/Step": 4781, "Pretrain/Step Time": 8.546363160014153} +{"Pretrain/Learning Rate": 2.6099084214654034e-05, "Pretrain/Loss": 2.0754570960998535, "Pretrain/Loss (Raw)": 2.040259599685669, "Pretrain/Step": 4782, "Pretrain/Step Time": 8.548699639737606} +{"Pretrain/Learning Rate": 2.6090602486797017e-05, "Pretrain/Loss": 2.0756983757019043, "Pretrain/Loss (Raw)": 2.0580556392669678, "Pretrain/Step": 4783, "Pretrain/Step Time": 8.546622816473246} +{"Pretrain/Learning Rate": 2.608212063316659e-05, "Pretrain/Loss": 2.0737392902374268, "Pretrain/Loss (Raw)": 2.0721781253814697, "Pretrain/Step": 4784, "Pretrain/Step Time": 8.544871224090457} +{"Pretrain/Learning Rate": 2.6073638654740908e-05, "Pretrain/Loss": 2.0741899013519287, "Pretrain/Loss (Raw)": 2.081275701522827, "Pretrain/Step": 4785, "Pretrain/Step Time": 8.544374698773026} +{"Pretrain/Learning Rate": 2.606515655249816e-05, "Pretrain/Loss": 2.0764000415802, "Pretrain/Loss (Raw)": 2.3830602169036865, "Pretrain/Step": 4786, "Pretrain/Step Time": 8.542986063286662} +{"Pretrain/Learning Rate": 2.6056674327416537e-05, "Pretrain/Loss": 2.0737853050231934, "Pretrain/Loss (Raw)": 1.7401156425476074, "Pretrain/Step": 4787, "Pretrain/Step Time": 8.538094175979495} +{"Pretrain/Learning Rate": 2.604819198047425e-05, "Pretrain/Loss": 2.070340871810913, "Pretrain/Loss (Raw)": 1.7516969442367554, "Pretrain/Step": 4788, "Pretrain/Step Time": 8.543385650962591} +{"Pretrain/Learning Rate": 2.6039709512649522e-05, "Pretrain/Loss": 2.06898832321167, "Pretrain/Loss (Raw)": 2.1006946563720703, "Pretrain/Step": 4789, "Pretrain/Step Time": 8.543325141072273} +{"Pretrain/Learning Rate": 2.60312269249206e-05, "Pretrain/Loss": 2.0696756839752197, "Pretrain/Loss (Raw)": 2.259054660797119, "Pretrain/Step": 4790, "Pretrain/Step Time": 8.54466194100678} +{"Pretrain/Learning Rate": 2.602274421826573e-05, "Pretrain/Loss": 2.0683093070983887, "Pretrain/Loss (Raw)": 1.9178117513656616, "Pretrain/Step": 4791, "Pretrain/Step Time": 8.544449286535382} +{"Pretrain/Learning Rate": 2.6014261393663176e-05, "Pretrain/Loss": 2.0698435306549072, "Pretrain/Loss (Raw)": 2.1852664947509766, "Pretrain/Step": 4792, "Pretrain/Step Time": 8.543388510122895} +{"Pretrain/Learning Rate": 2.600577845209122e-05, "Pretrain/Loss": 2.07100772857666, "Pretrain/Loss (Raw)": 2.204925060272217, "Pretrain/Step": 4793, "Pretrain/Step Time": 8.547441694885492} +{"Pretrain/Learning Rate": 2.599729539452815e-05, "Pretrain/Loss": 2.07175874710083, "Pretrain/Loss (Raw)": 2.0053205490112305, "Pretrain/Step": 4794, "Pretrain/Step Time": 8.54327442869544} +{"Pretrain/Learning Rate": 2.598881222195228e-05, "Pretrain/Loss": 2.0691871643066406, "Pretrain/Loss (Raw)": 2.0253422260284424, "Pretrain/Step": 4795, "Pretrain/Step Time": 8.546589251607656} +{"Pretrain/Learning Rate": 2.5980328935341918e-05, "Pretrain/Loss": 2.0672898292541504, "Pretrain/Loss (Raw)": 1.9740787744522095, "Pretrain/Step": 4796, "Pretrain/Step Time": 8.543524466454983} +{"Pretrain/Learning Rate": 2.597184553567541e-05, "Pretrain/Loss": 2.0677454471588135, "Pretrain/Loss (Raw)": 2.172823429107666, "Pretrain/Step": 4797, "Pretrain/Step Time": 8.546016082167625} +{"Pretrain/Learning Rate": 2.5963362023931092e-05, "Pretrain/Loss": 2.0716216564178467, "Pretrain/Loss (Raw)": 2.1215763092041016, "Pretrain/Step": 4798, "Pretrain/Step Time": 8.54643220640719} +{"Pretrain/Learning Rate": 2.595487840108733e-05, "Pretrain/Loss": 2.073228597640991, "Pretrain/Loss (Raw)": 1.9937771558761597, "Pretrain/Step": 4799, "Pretrain/Step Time": 8.545004295185208} +{"Pretrain/Learning Rate": 2.5946394668122485e-05, "Pretrain/Loss": 2.0748977661132812, "Pretrain/Loss (Raw)": 2.0671253204345703, "Pretrain/Step": 4800, "Pretrain/Step Time": 8.54657526127994} +{"Pretrain/Learning Rate": 2.5937910826014955e-05, "Pretrain/Loss": 2.0746750831604004, "Pretrain/Loss (Raw)": 2.0858089923858643, "Pretrain/Step": 4801, "Pretrain/Step Time": 8.548126010224223} +{"Pretrain/Learning Rate": 2.5929426875743123e-05, "Pretrain/Loss": 2.0756168365478516, "Pretrain/Loss (Raw)": 2.21700119972229, "Pretrain/Step": 4802, "Pretrain/Step Time": 8.550323862582445} +{"Pretrain/Learning Rate": 2.592094281828541e-05, "Pretrain/Loss": 2.0748913288116455, "Pretrain/Loss (Raw)": 2.0767154693603516, "Pretrain/Step": 4803, "Pretrain/Step Time": 8.55093564465642} +{"Pretrain/Learning Rate": 2.5912458654620226e-05, "Pretrain/Loss": 2.0717015266418457, "Pretrain/Loss (Raw)": 1.7713394165039062, "Pretrain/Step": 4804, "Pretrain/Step Time": 8.558075020089746} +{"Pretrain/Learning Rate": 2.5903974385726014e-05, "Pretrain/Loss": 2.069802761077881, "Pretrain/Loss (Raw)": 1.8592246770858765, "Pretrain/Step": 4805, "Pretrain/Step Time": 8.558422850444913} +{"Pretrain/Learning Rate": 2.589549001258121e-05, "Pretrain/Loss": 2.070554256439209, "Pretrain/Loss (Raw)": 2.1867527961730957, "Pretrain/Step": 4806, "Pretrain/Step Time": 8.559953385964036} +{"Pretrain/Learning Rate": 2.5887005536164288e-05, "Pretrain/Loss": 2.0721821784973145, "Pretrain/Loss (Raw)": 2.007199764251709, "Pretrain/Step": 4807, "Pretrain/Step Time": 8.559635616838932} +{"Pretrain/Learning Rate": 2.58785209574537e-05, "Pretrain/Loss": 2.071979284286499, "Pretrain/Loss (Raw)": 2.0069000720977783, "Pretrain/Step": 4808, "Pretrain/Step Time": 8.560562564060092} +{"Pretrain/Learning Rate": 2.587003627742794e-05, "Pretrain/Loss": 2.074002742767334, "Pretrain/Loss (Raw)": 2.347646474838257, "Pretrain/Step": 4809, "Pretrain/Step Time": 8.562932973727584} +{"Pretrain/Learning Rate": 2.5861551497065496e-05, "Pretrain/Loss": 2.073868989944458, "Pretrain/Loss (Raw)": 2.034223794937134, "Pretrain/Step": 4810, "Pretrain/Step Time": 8.567057060077786} +{"Pretrain/Learning Rate": 2.5853066617344868e-05, "Pretrain/Loss": 2.069347381591797, "Pretrain/Loss (Raw)": 1.9629082679748535, "Pretrain/Step": 4811, "Pretrain/Step Time": 8.556871915236115} +{"Pretrain/Learning Rate": 2.5844581639244586e-05, "Pretrain/Loss": 2.0708205699920654, "Pretrain/Loss (Raw)": 2.28525447845459, "Pretrain/Step": 4812, "Pretrain/Step Time": 8.558096688240767} +{"Pretrain/Learning Rate": 2.583609656374316e-05, "Pretrain/Loss": 2.070220708847046, "Pretrain/Loss (Raw)": 2.1020407676696777, "Pretrain/Step": 4813, "Pretrain/Step Time": 8.55667277611792} +{"Pretrain/Learning Rate": 2.5827611391819152e-05, "Pretrain/Loss": 2.068037748336792, "Pretrain/Loss (Raw)": 1.9387518167495728, "Pretrain/Step": 4814, "Pretrain/Step Time": 8.55788137204945} +{"Pretrain/Learning Rate": 2.581912612445108e-05, "Pretrain/Loss": 2.0669476985931396, "Pretrain/Loss (Raw)": 1.9114519357681274, "Pretrain/Step": 4815, "Pretrain/Step Time": 8.559987612068653} +{"Pretrain/Learning Rate": 2.5810640762617538e-05, "Pretrain/Loss": 2.0678205490112305, "Pretrain/Loss (Raw)": 2.097041368484497, "Pretrain/Step": 4816, "Pretrain/Step Time": 8.56090765632689} +{"Pretrain/Learning Rate": 2.5802155307297077e-05, "Pretrain/Loss": 2.0683813095092773, "Pretrain/Loss (Raw)": 2.0157933235168457, "Pretrain/Step": 4817, "Pretrain/Step Time": 8.556326387450099} +{"Pretrain/Learning Rate": 2.5793669759468292e-05, "Pretrain/Loss": 2.064695119857788, "Pretrain/Loss (Raw)": 1.8450736999511719, "Pretrain/Step": 4818, "Pretrain/Step Time": 8.556998245418072} +{"Pretrain/Learning Rate": 2.578518412010976e-05, "Pretrain/Loss": 2.064983367919922, "Pretrain/Loss (Raw)": 2.0298707485198975, "Pretrain/Step": 4819, "Pretrain/Step Time": 8.559550231322646} +{"Pretrain/Learning Rate": 2.577669839020011e-05, "Pretrain/Loss": 2.06619930267334, "Pretrain/Loss (Raw)": 2.0132195949554443, "Pretrain/Step": 4820, "Pretrain/Step Time": 8.55875414609909} +{"Pretrain/Learning Rate": 2.576821257071793e-05, "Pretrain/Loss": 2.066655158996582, "Pretrain/Loss (Raw)": 1.9905738830566406, "Pretrain/Step": 4821, "Pretrain/Step Time": 8.559721915051341} +{"Pretrain/Learning Rate": 2.5759726662641865e-05, "Pretrain/Loss": 2.0651230812072754, "Pretrain/Loss (Raw)": 1.7770359516143799, "Pretrain/Step": 4822, "Pretrain/Step Time": 8.5622184202075} +{"Pretrain/Learning Rate": 2.5751240666950532e-05, "Pretrain/Loss": 2.065715789794922, "Pretrain/Loss (Raw)": 2.1682522296905518, "Pretrain/Step": 4823, "Pretrain/Step Time": 8.560797672718763} +{"Pretrain/Learning Rate": 2.5742754584622592e-05, "Pretrain/Loss": 2.067608594894409, "Pretrain/Loss (Raw)": 2.3019063472747803, "Pretrain/Step": 4824, "Pretrain/Step Time": 8.561995208263397} +{"Pretrain/Learning Rate": 2.5734268416636697e-05, "Pretrain/Loss": 2.0665791034698486, "Pretrain/Loss (Raw)": 2.0608057975769043, "Pretrain/Step": 4825, "Pretrain/Step Time": 8.55791986361146} +{"Pretrain/Learning Rate": 2.5725782163971495e-05, "Pretrain/Loss": 2.0674760341644287, "Pretrain/Loss (Raw)": 2.191436529159546, "Pretrain/Step": 4826, "Pretrain/Step Time": 8.553151153028011} +{"Pretrain/Learning Rate": 2.5717295827605686e-05, "Pretrain/Loss": 2.0676822662353516, "Pretrain/Loss (Raw)": 2.1050217151641846, "Pretrain/Step": 4827, "Pretrain/Step Time": 8.554240237921476} +{"Pretrain/Learning Rate": 2.5708809408517937e-05, "Pretrain/Loss": 2.067683696746826, "Pretrain/Loss (Raw)": 2.1297049522399902, "Pretrain/Step": 4828, "Pretrain/Step Time": 8.552694413810968} +{"Pretrain/Learning Rate": 2.5700322907686946e-05, "Pretrain/Loss": 2.070042848587036, "Pretrain/Loss (Raw)": 2.2794644832611084, "Pretrain/Step": 4829, "Pretrain/Step Time": 8.559376997873187} +{"Pretrain/Learning Rate": 2.5691836326091414e-05, "Pretrain/Loss": 2.066596031188965, "Pretrain/Loss (Raw)": 1.6624598503112793, "Pretrain/Step": 4830, "Pretrain/Step Time": 8.55940710939467} +{"Pretrain/Learning Rate": 2.5683349664710067e-05, "Pretrain/Loss": 2.0715126991271973, "Pretrain/Loss (Raw)": 2.6550066471099854, "Pretrain/Step": 4831, "Pretrain/Step Time": 8.561740269884467} +{"Pretrain/Learning Rate": 2.5674862924521605e-05, "Pretrain/Loss": 2.0716466903686523, "Pretrain/Loss (Raw)": 2.175475597381592, "Pretrain/Step": 4832, "Pretrain/Step Time": 8.56067550741136} +{"Pretrain/Learning Rate": 2.566637610650478e-05, "Pretrain/Loss": 2.0717153549194336, "Pretrain/Loss (Raw)": 2.1036715507507324, "Pretrain/Step": 4833, "Pretrain/Step Time": 8.559755604714155} +{"Pretrain/Learning Rate": 2.565788921163832e-05, "Pretrain/Loss": 2.070465564727783, "Pretrain/Loss (Raw)": 1.952833890914917, "Pretrain/Step": 4834, "Pretrain/Step Time": 8.557422310113907} +{"Pretrain/Learning Rate": 2.5649402240900972e-05, "Pretrain/Loss": 2.069371223449707, "Pretrain/Loss (Raw)": 2.0555243492126465, "Pretrain/Step": 4835, "Pretrain/Step Time": 8.55778531730175} +{"Pretrain/Learning Rate": 2.5640915195271504e-05, "Pretrain/Loss": 2.0699820518493652, "Pretrain/Loss (Raw)": 2.076115608215332, "Pretrain/Step": 4836, "Pretrain/Step Time": 8.553975231945515} +{"Pretrain/Learning Rate": 2.563242807572867e-05, "Pretrain/Loss": 2.0695321559906006, "Pretrain/Loss (Raw)": 2.0722410678863525, "Pretrain/Step": 4837, "Pretrain/Step Time": 8.559924138709903} +{"Pretrain/Learning Rate": 2.5623940883251256e-05, "Pretrain/Loss": 2.067753314971924, "Pretrain/Loss (Raw)": 1.9584912061691284, "Pretrain/Step": 4838, "Pretrain/Step Time": 8.564196398481727} +{"Pretrain/Learning Rate": 2.561545361881803e-05, "Pretrain/Loss": 2.068410873413086, "Pretrain/Loss (Raw)": 2.151869297027588, "Pretrain/Step": 4839, "Pretrain/Step Time": 8.56706322915852} +{"Pretrain/Learning Rate": 2.5606966283407803e-05, "Pretrain/Loss": 2.069939136505127, "Pretrain/Loss (Raw)": 2.0405280590057373, "Pretrain/Step": 4840, "Pretrain/Step Time": 8.553866673260927} +{"Pretrain/Learning Rate": 2.5598478877999356e-05, "Pretrain/Loss": 2.068690776824951, "Pretrain/Loss (Raw)": 1.9148167371749878, "Pretrain/Step": 4841, "Pretrain/Step Time": 8.554396525025368} +{"Pretrain/Learning Rate": 2.558999140357151e-05, "Pretrain/Loss": 2.069188356399536, "Pretrain/Loss (Raw)": 2.090097665786743, "Pretrain/Step": 4842, "Pretrain/Step Time": 8.549644758924842} +{"Pretrain/Learning Rate": 2.5581503861103073e-05, "Pretrain/Loss": 2.066984176635742, "Pretrain/Loss (Raw)": 1.9906601905822754, "Pretrain/Step": 4843, "Pretrain/Step Time": 8.54577231220901} +{"Pretrain/Learning Rate": 2.5573016251572872e-05, "Pretrain/Loss": 2.067046642303467, "Pretrain/Loss (Raw)": 1.8118208646774292, "Pretrain/Step": 4844, "Pretrain/Step Time": 8.546834444627166} +{"Pretrain/Learning Rate": 2.5564528575959733e-05, "Pretrain/Loss": 2.0662078857421875, "Pretrain/Loss (Raw)": 2.260890483856201, "Pretrain/Step": 4845, "Pretrain/Step Time": 8.552583780139685} +{"Pretrain/Learning Rate": 2.55560408352425e-05, "Pretrain/Loss": 2.066807746887207, "Pretrain/Loss (Raw)": 2.0540010929107666, "Pretrain/Step": 4846, "Pretrain/Step Time": 8.546139942482114} +{"Pretrain/Learning Rate": 2.5547553030400016e-05, "Pretrain/Loss": 2.068136215209961, "Pretrain/Loss (Raw)": 2.0893380641937256, "Pretrain/Step": 4847, "Pretrain/Step Time": 8.549295354634523} +{"Pretrain/Learning Rate": 2.5539065162411143e-05, "Pretrain/Loss": 2.06980562210083, "Pretrain/Loss (Raw)": 2.2073144912719727, "Pretrain/Step": 4848, "Pretrain/Step Time": 8.550199285149574} +{"Pretrain/Learning Rate": 2.5530577232254733e-05, "Pretrain/Loss": 2.0690860748291016, "Pretrain/Loss (Raw)": 2.0257763862609863, "Pretrain/Step": 4849, "Pretrain/Step Time": 8.5491230096668} +{"Pretrain/Learning Rate": 2.5522089240909652e-05, "Pretrain/Loss": 2.0689809322357178, "Pretrain/Loss (Raw)": 2.084651470184326, "Pretrain/Step": 4850, "Pretrain/Step Time": 8.548174928873777} +{"Pretrain/Learning Rate": 2.5513601189354786e-05, "Pretrain/Loss": 2.0705370903015137, "Pretrain/Loss (Raw)": 2.3533265590667725, "Pretrain/Step": 4851, "Pretrain/Step Time": 8.556358901783824} +{"Pretrain/Learning Rate": 2.5505113078569004e-05, "Pretrain/Loss": 2.07334566116333, "Pretrain/Loss (Raw)": 2.3356852531433105, "Pretrain/Step": 4852, "Pretrain/Step Time": 8.542782573029399} +{"Pretrain/Learning Rate": 2.5496624909531207e-05, "Pretrain/Loss": 2.0725231170654297, "Pretrain/Loss (Raw)": 1.8672301769256592, "Pretrain/Step": 4853, "Pretrain/Step Time": 8.550333920866251} +{"Pretrain/Learning Rate": 2.548813668322028e-05, "Pretrain/Loss": 2.0738306045532227, "Pretrain/Loss (Raw)": 2.2176520824432373, "Pretrain/Step": 4854, "Pretrain/Step Time": 8.549244785681367} +{"Pretrain/Learning Rate": 2.5479648400615136e-05, "Pretrain/Loss": 2.073948621749878, "Pretrain/Loss (Raw)": 2.055108070373535, "Pretrain/Step": 4855, "Pretrain/Step Time": 8.552486948668957} +{"Pretrain/Learning Rate": 2.547116006269467e-05, "Pretrain/Loss": 2.072777271270752, "Pretrain/Loss (Raw)": 2.0154483318328857, "Pretrain/Step": 4856, "Pretrain/Step Time": 8.549642413854599} +{"Pretrain/Learning Rate": 2.5462671670437816e-05, "Pretrain/Loss": 2.072113513946533, "Pretrain/Loss (Raw)": 2.148005723953247, "Pretrain/Step": 4857, "Pretrain/Step Time": 8.555183567106724} +{"Pretrain/Learning Rate": 2.545418322482348e-05, "Pretrain/Loss": 2.0724306106567383, "Pretrain/Loss (Raw)": 2.010101079940796, "Pretrain/Step": 4858, "Pretrain/Step Time": 8.551738373935223} +{"Pretrain/Learning Rate": 2.5445694726830593e-05, "Pretrain/Loss": 2.0725045204162598, "Pretrain/Loss (Raw)": 2.040794849395752, "Pretrain/Step": 4859, "Pretrain/Step Time": 8.54801381379366} +{"Pretrain/Learning Rate": 2.543720617743809e-05, "Pretrain/Loss": 2.071406841278076, "Pretrain/Loss (Raw)": 2.11883544921875, "Pretrain/Step": 4860, "Pretrain/Step Time": 8.545804049819708} +{"Pretrain/Learning Rate": 2.5428717577624915e-05, "Pretrain/Loss": 2.075137138366699, "Pretrain/Loss (Raw)": 2.4130630493164062, "Pretrain/Step": 4861, "Pretrain/Step Time": 8.551033910363913} +{"Pretrain/Learning Rate": 2.5420228928370005e-05, "Pretrain/Loss": 2.0766122341156006, "Pretrain/Loss (Raw)": 2.1359012126922607, "Pretrain/Step": 4862, "Pretrain/Step Time": 8.5516941472888} +{"Pretrain/Learning Rate": 2.5411740230652315e-05, "Pretrain/Loss": 2.0731871128082275, "Pretrain/Loss (Raw)": 1.786310076713562, "Pretrain/Step": 4863, "Pretrain/Step Time": 8.556556971743703} +{"Pretrain/Learning Rate": 2.5403251485450795e-05, "Pretrain/Loss": 2.071340560913086, "Pretrain/Loss (Raw)": 1.8665777444839478, "Pretrain/Step": 4864, "Pretrain/Step Time": 8.544237798079848} +{"Pretrain/Learning Rate": 2.5394762693744428e-05, "Pretrain/Loss": 2.0709760189056396, "Pretrain/Loss (Raw)": 2.056591510772705, "Pretrain/Step": 4865, "Pretrain/Step Time": 8.553644713014364} +{"Pretrain/Learning Rate": 2.538627385651216e-05, "Pretrain/Loss": 2.073028802871704, "Pretrain/Loss (Raw)": 2.11653995513916, "Pretrain/Step": 4866, "Pretrain/Step Time": 8.545396314933896} +{"Pretrain/Learning Rate": 2.5377784974732965e-05, "Pretrain/Loss": 2.073071002960205, "Pretrain/Loss (Raw)": 1.9557538032531738, "Pretrain/Step": 4867, "Pretrain/Step Time": 8.54399242438376} +{"Pretrain/Learning Rate": 2.536929604938584e-05, "Pretrain/Loss": 2.074190139770508, "Pretrain/Loss (Raw)": 2.3391740322113037, "Pretrain/Step": 4868, "Pretrain/Step Time": 8.540842497721314} +{"Pretrain/Learning Rate": 2.5360807081449738e-05, "Pretrain/Loss": 2.0712828636169434, "Pretrain/Loss (Raw)": 1.7683824300765991, "Pretrain/Step": 4869, "Pretrain/Step Time": 8.545034486800432} +{"Pretrain/Learning Rate": 2.5352318071903675e-05, "Pretrain/Loss": 2.0704972743988037, "Pretrain/Loss (Raw)": 2.1057305335998535, "Pretrain/Step": 4870, "Pretrain/Step Time": 8.54837166890502} +{"Pretrain/Learning Rate": 2.5343829021726618e-05, "Pretrain/Loss": 2.0710554122924805, "Pretrain/Loss (Raw)": 2.2406036853790283, "Pretrain/Step": 4871, "Pretrain/Step Time": 8.552664250135422} +{"Pretrain/Learning Rate": 2.533533993189759e-05, "Pretrain/Loss": 2.073965549468994, "Pretrain/Loss (Raw)": 2.3392632007598877, "Pretrain/Step": 4872, "Pretrain/Step Time": 8.548977172002196} +{"Pretrain/Learning Rate": 2.5326850803395575e-05, "Pretrain/Loss": 2.073613166809082, "Pretrain/Loss (Raw)": 1.9710222482681274, "Pretrain/Step": 4873, "Pretrain/Step Time": 8.55189260840416} +{"Pretrain/Learning Rate": 2.5318361637199594e-05, "Pretrain/Loss": 2.072531223297119, "Pretrain/Loss (Raw)": 1.9192931652069092, "Pretrain/Step": 4874, "Pretrain/Step Time": 8.552045434713364} +{"Pretrain/Learning Rate": 2.5309872434288645e-05, "Pretrain/Loss": 2.069761037826538, "Pretrain/Loss (Raw)": 1.8267195224761963, "Pretrain/Step": 4875, "Pretrain/Step Time": 8.550851676613092} +{"Pretrain/Learning Rate": 2.5301383195641742e-05, "Pretrain/Loss": 2.0680482387542725, "Pretrain/Loss (Raw)": 1.8888919353485107, "Pretrain/Step": 4876, "Pretrain/Step Time": 8.54335193708539} +{"Pretrain/Learning Rate": 2.5292893922237913e-05, "Pretrain/Loss": 2.066549301147461, "Pretrain/Loss (Raw)": 1.9796416759490967, "Pretrain/Step": 4877, "Pretrain/Step Time": 8.543810727074742} +{"Pretrain/Learning Rate": 2.5284404615056172e-05, "Pretrain/Loss": 2.065798282623291, "Pretrain/Loss (Raw)": 2.107192277908325, "Pretrain/Step": 4878, "Pretrain/Step Time": 8.541489023715258} +{"Pretrain/Learning Rate": 2.5275915275075556e-05, "Pretrain/Loss": 2.066636085510254, "Pretrain/Loss (Raw)": 2.135228395462036, "Pretrain/Step": 4879, "Pretrain/Step Time": 8.54488861374557} +{"Pretrain/Learning Rate": 2.5267425903275088e-05, "Pretrain/Loss": 2.06648325920105, "Pretrain/Loss (Raw)": 2.052940845489502, "Pretrain/Step": 4880, "Pretrain/Step Time": 8.547402035444975} +{"Pretrain/Learning Rate": 2.5258936500633807e-05, "Pretrain/Loss": 2.0652074813842773, "Pretrain/Loss (Raw)": 2.027157783508301, "Pretrain/Step": 4881, "Pretrain/Step Time": 8.548328323289752} +{"Pretrain/Learning Rate": 2.5250447068130746e-05, "Pretrain/Loss": 2.067172050476074, "Pretrain/Loss (Raw)": 2.236274242401123, "Pretrain/Step": 4882, "Pretrain/Step Time": 8.549901504069567} +{"Pretrain/Learning Rate": 2.5241957606744952e-05, "Pretrain/Loss": 2.0630273818969727, "Pretrain/Loss (Raw)": 1.5126190185546875, "Pretrain/Step": 4883, "Pretrain/Step Time": 8.55356009490788} +{"Pretrain/Learning Rate": 2.523346811745546e-05, "Pretrain/Loss": 2.0643062591552734, "Pretrain/Loss (Raw)": 2.246532440185547, "Pretrain/Step": 4884, "Pretrain/Step Time": 8.546663725748658} +{"Pretrain/Learning Rate": 2.5224978601241333e-05, "Pretrain/Loss": 2.0624070167541504, "Pretrain/Loss (Raw)": 1.9287340641021729, "Pretrain/Step": 4885, "Pretrain/Step Time": 8.552689565345645} +{"Pretrain/Learning Rate": 2.5216489059081607e-05, "Pretrain/Loss": 2.061674118041992, "Pretrain/Loss (Raw)": 1.89469575881958, "Pretrain/Step": 4886, "Pretrain/Step Time": 8.552444713190198} +{"Pretrain/Learning Rate": 2.5207999491955347e-05, "Pretrain/Loss": 2.0614757537841797, "Pretrain/Loss (Raw)": 2.0087881088256836, "Pretrain/Step": 4887, "Pretrain/Step Time": 8.549157341942191} +{"Pretrain/Learning Rate": 2.51995099008416e-05, "Pretrain/Loss": 2.0612525939941406, "Pretrain/Loss (Raw)": 1.9863756895065308, "Pretrain/Step": 4888, "Pretrain/Step Time": 8.552408933639526} +{"Pretrain/Learning Rate": 2.519102028671944e-05, "Pretrain/Loss": 2.0586819648742676, "Pretrain/Loss (Raw)": 1.7537728548049927, "Pretrain/Step": 4889, "Pretrain/Step Time": 8.555229587480426} +{"Pretrain/Learning Rate": 2.518253065056791e-05, "Pretrain/Loss": 2.0604028701782227, "Pretrain/Loss (Raw)": 2.0890021324157715, "Pretrain/Step": 4890, "Pretrain/Step Time": 8.553527127951384} +{"Pretrain/Learning Rate": 2.5174040993366094e-05, "Pretrain/Loss": 2.0587494373321533, "Pretrain/Loss (Raw)": 1.9265241622924805, "Pretrain/Step": 4891, "Pretrain/Step Time": 8.551443243399262} +{"Pretrain/Learning Rate": 2.516555131609305e-05, "Pretrain/Loss": 2.056364059448242, "Pretrain/Loss (Raw)": 1.9632974863052368, "Pretrain/Step": 4892, "Pretrain/Step Time": 8.553337236866355} +{"Pretrain/Learning Rate": 2.5157061619727844e-05, "Pretrain/Loss": 2.056730270385742, "Pretrain/Loss (Raw)": 2.234666585922241, "Pretrain/Step": 4893, "Pretrain/Step Time": 8.557054169476032} +{"Pretrain/Learning Rate": 2.514857190524955e-05, "Pretrain/Loss": 2.056929349899292, "Pretrain/Loss (Raw)": 2.1131820678710938, "Pretrain/Step": 4894, "Pretrain/Step Time": 8.561610480770469} +{"Pretrain/Learning Rate": 2.514008217363725e-05, "Pretrain/Loss": 2.0575571060180664, "Pretrain/Loss (Raw)": 2.0290918350219727, "Pretrain/Step": 4895, "Pretrain/Step Time": 8.559819223359227} +{"Pretrain/Learning Rate": 2.513159242587001e-05, "Pretrain/Loss": 2.059786319732666, "Pretrain/Loss (Raw)": 2.3729779720306396, "Pretrain/Step": 4896, "Pretrain/Step Time": 8.562060941010714} +{"Pretrain/Learning Rate": 2.5123102662926913e-05, "Pretrain/Loss": 2.058474063873291, "Pretrain/Loss (Raw)": 2.1311521530151367, "Pretrain/Step": 4897, "Pretrain/Step Time": 8.564107334241271} +{"Pretrain/Learning Rate": 2.5114612885787037e-05, "Pretrain/Loss": 2.058302879333496, "Pretrain/Loss (Raw)": 2.118406057357788, "Pretrain/Step": 4898, "Pretrain/Step Time": 8.5651497207582} +{"Pretrain/Learning Rate": 2.5106123095429456e-05, "Pretrain/Loss": 2.0587432384490967, "Pretrain/Loss (Raw)": 2.2195932865142822, "Pretrain/Step": 4899, "Pretrain/Step Time": 8.564908247441053} +{"Pretrain/Learning Rate": 2.5097633292833268e-05, "Pretrain/Loss": 2.0588817596435547, "Pretrain/Loss (Raw)": 2.058105707168579, "Pretrain/Step": 4900, "Pretrain/Step Time": 8.562754519283772} +{"Pretrain/Learning Rate": 2.5089143478977546e-05, "Pretrain/Loss": 2.0594096183776855, "Pretrain/Loss (Raw)": 2.118086576461792, "Pretrain/Step": 4901, "Pretrain/Step Time": 8.559284234419465} +{"Pretrain/Learning Rate": 2.5080653654841378e-05, "Pretrain/Loss": 2.058897018432617, "Pretrain/Loss (Raw)": 1.9934158325195312, "Pretrain/Step": 4902, "Pretrain/Step Time": 8.560487691313028} +{"Pretrain/Learning Rate": 2.507216382140385e-05, "Pretrain/Loss": 2.059648036956787, "Pretrain/Loss (Raw)": 2.1035146713256836, "Pretrain/Step": 4903, "Pretrain/Step Time": 8.556077716872096} +{"Pretrain/Learning Rate": 2.5063673979644054e-05, "Pretrain/Loss": 2.058483839035034, "Pretrain/Loss (Raw)": 1.7401485443115234, "Pretrain/Step": 4904, "Pretrain/Step Time": 8.563356941565871} +{"Pretrain/Learning Rate": 2.5055184130541065e-05, "Pretrain/Loss": 2.060243606567383, "Pretrain/Loss (Raw)": 2.10463547706604, "Pretrain/Step": 4905, "Pretrain/Step Time": 8.561189372092485} +{"Pretrain/Learning Rate": 2.504669427507399e-05, "Pretrain/Loss": 2.0602753162384033, "Pretrain/Loss (Raw)": 2.097186326980591, "Pretrain/Step": 4906, "Pretrain/Step Time": 8.570645650848746} +{"Pretrain/Learning Rate": 2.503820441422191e-05, "Pretrain/Loss": 2.060696840286255, "Pretrain/Loss (Raw)": 2.0963146686553955, "Pretrain/Step": 4907, "Pretrain/Step Time": 8.569284424185753} +{"Pretrain/Learning Rate": 2.5029714548963917e-05, "Pretrain/Loss": 2.0595250129699707, "Pretrain/Loss (Raw)": 1.9723011255264282, "Pretrain/Step": 4908, "Pretrain/Step Time": 8.564700597897172} +{"Pretrain/Learning Rate": 2.5021224680279105e-05, "Pretrain/Loss": 2.059319496154785, "Pretrain/Loss (Raw)": 1.9628822803497314, "Pretrain/Step": 4909, "Pretrain/Step Time": 8.568985952064395} +{"Pretrain/Learning Rate": 2.5012734809146554e-05, "Pretrain/Loss": 2.0620195865631104, "Pretrain/Loss (Raw)": 2.3858702182769775, "Pretrain/Step": 4910, "Pretrain/Step Time": 8.56717018969357} +{"Pretrain/Learning Rate": 2.5004244936545374e-05, "Pretrain/Loss": 2.06231951713562, "Pretrain/Loss (Raw)": 2.096468687057495, "Pretrain/Step": 4911, "Pretrain/Step Time": 8.569486243650317} +{"Pretrain/Learning Rate": 2.499575506345464e-05, "Pretrain/Loss": 2.0650832653045654, "Pretrain/Loss (Raw)": 2.4259397983551025, "Pretrain/Step": 4912, "Pretrain/Step Time": 8.565825764089823} +{"Pretrain/Learning Rate": 2.498726519085345e-05, "Pretrain/Loss": 2.06484317779541, "Pretrain/Loss (Raw)": 2.050518751144409, "Pretrain/Step": 4913, "Pretrain/Step Time": 8.565569069236517} +{"Pretrain/Learning Rate": 2.497877531972091e-05, "Pretrain/Loss": 2.060183525085449, "Pretrain/Loss (Raw)": 1.7866287231445312, "Pretrain/Step": 4914, "Pretrain/Step Time": 8.56417397595942} +{"Pretrain/Learning Rate": 2.497028545103609e-05, "Pretrain/Loss": 2.0613489151000977, "Pretrain/Loss (Raw)": 1.8892827033996582, "Pretrain/Step": 4915, "Pretrain/Step Time": 8.56913821771741} +{"Pretrain/Learning Rate": 2.49617955857781e-05, "Pretrain/Loss": 2.065192699432373, "Pretrain/Loss (Raw)": 2.243725061416626, "Pretrain/Step": 4916, "Pretrain/Step Time": 8.5737060662359} +{"Pretrain/Learning Rate": 2.4953305724926017e-05, "Pretrain/Loss": 2.0648672580718994, "Pretrain/Loss (Raw)": 2.0590178966522217, "Pretrain/Step": 4917, "Pretrain/Step Time": 8.574562449008226} +{"Pretrain/Learning Rate": 2.494481586945894e-05, "Pretrain/Loss": 2.063211441040039, "Pretrain/Loss (Raw)": 2.0471153259277344, "Pretrain/Step": 4918, "Pretrain/Step Time": 8.579183358699083} +{"Pretrain/Learning Rate": 2.4936326020355955e-05, "Pretrain/Loss": 2.065262794494629, "Pretrain/Loss (Raw)": 2.1803970336914062, "Pretrain/Step": 4919, "Pretrain/Step Time": 8.581953544169664} +{"Pretrain/Learning Rate": 2.4927836178596156e-05, "Pretrain/Loss": 2.0637893676757812, "Pretrain/Loss (Raw)": 1.9966744184494019, "Pretrain/Step": 4920, "Pretrain/Step Time": 8.581322949379683} +{"Pretrain/Learning Rate": 2.4919346345158624e-05, "Pretrain/Loss": 2.0620555877685547, "Pretrain/Loss (Raw)": 1.9829661846160889, "Pretrain/Step": 4921, "Pretrain/Step Time": 8.578483616933227} +{"Pretrain/Learning Rate": 2.491085652102246e-05, "Pretrain/Loss": 2.0632431507110596, "Pretrain/Loss (Raw)": 2.157344102859497, "Pretrain/Step": 4922, "Pretrain/Step Time": 8.577615169808269} +{"Pretrain/Learning Rate": 2.4902366707166734e-05, "Pretrain/Loss": 2.0640950202941895, "Pretrain/Loss (Raw)": 2.1343767642974854, "Pretrain/Step": 4923, "Pretrain/Step Time": 8.58276498503983} +{"Pretrain/Learning Rate": 2.4893876904570554e-05, "Pretrain/Loss": 2.0654938220977783, "Pretrain/Loss (Raw)": 2.1531388759613037, "Pretrain/Step": 4924, "Pretrain/Step Time": 8.595019605010748} +{"Pretrain/Learning Rate": 2.488538711421297e-05, "Pretrain/Loss": 2.0661022663116455, "Pretrain/Loss (Raw)": 2.2506892681121826, "Pretrain/Step": 4925, "Pretrain/Step Time": 8.592483764514327} +{"Pretrain/Learning Rate": 2.4876897337073103e-05, "Pretrain/Loss": 2.066227436065674, "Pretrain/Loss (Raw)": 2.1376187801361084, "Pretrain/Step": 4926, "Pretrain/Step Time": 8.58948945812881} +{"Pretrain/Learning Rate": 2.4868407574129994e-05, "Pretrain/Loss": 2.0662646293640137, "Pretrain/Loss (Raw)": 1.9985504150390625, "Pretrain/Step": 4927, "Pretrain/Step Time": 8.58972697891295} +{"Pretrain/Learning Rate": 2.4859917826362764e-05, "Pretrain/Loss": 2.0680489540100098, "Pretrain/Loss (Raw)": 2.295480489730835, "Pretrain/Step": 4928, "Pretrain/Step Time": 8.589315377175808} +{"Pretrain/Learning Rate": 2.485142809475045e-05, "Pretrain/Loss": 2.0684876441955566, "Pretrain/Loss (Raw)": 2.141958236694336, "Pretrain/Step": 4929, "Pretrain/Step Time": 8.596565486863256} +{"Pretrain/Learning Rate": 2.4842938380272168e-05, "Pretrain/Loss": 2.066284656524658, "Pretrain/Loss (Raw)": 1.9350299835205078, "Pretrain/Step": 4930, "Pretrain/Step Time": 8.600362678989768} +{"Pretrain/Learning Rate": 2.4834448683906957e-05, "Pretrain/Loss": 2.064962387084961, "Pretrain/Loss (Raw)": 1.9074496030807495, "Pretrain/Step": 4931, "Pretrain/Step Time": 8.598184363916516} +{"Pretrain/Learning Rate": 2.482595900663392e-05, "Pretrain/Loss": 2.067509889602661, "Pretrain/Loss (Raw)": 2.0974371433258057, "Pretrain/Step": 4932, "Pretrain/Step Time": 8.58919159322977} +{"Pretrain/Learning Rate": 2.481746934943209e-05, "Pretrain/Loss": 2.0678229331970215, "Pretrain/Loss (Raw)": 1.8992830514907837, "Pretrain/Step": 4933, "Pretrain/Step Time": 8.586726164445281} +{"Pretrain/Learning Rate": 2.480897971328056e-05, "Pretrain/Loss": 2.068857431411743, "Pretrain/Loss (Raw)": 2.3191897869110107, "Pretrain/Step": 4934, "Pretrain/Step Time": 8.586098363623023} +{"Pretrain/Learning Rate": 2.4800490099158403e-05, "Pretrain/Loss": 2.0700838565826416, "Pretrain/Loss (Raw)": 2.1641690731048584, "Pretrain/Step": 4935, "Pretrain/Step Time": 8.590532405301929} +{"Pretrain/Learning Rate": 2.4792000508044652e-05, "Pretrain/Loss": 2.070127010345459, "Pretrain/Loss (Raw)": 2.012406587600708, "Pretrain/Step": 4936, "Pretrain/Step Time": 8.595273688435555} +{"Pretrain/Learning Rate": 2.4783510940918396e-05, "Pretrain/Loss": 2.0662288665771484, "Pretrain/Loss (Raw)": 1.8486943244934082, "Pretrain/Step": 4937, "Pretrain/Step Time": 8.587825259193778} +{"Pretrain/Learning Rate": 2.4775021398758666e-05, "Pretrain/Loss": 2.0669374465942383, "Pretrain/Loss (Raw)": 2.1249239444732666, "Pretrain/Step": 4938, "Pretrain/Step Time": 8.591117769479752} +{"Pretrain/Learning Rate": 2.4766531882544545e-05, "Pretrain/Loss": 2.0707316398620605, "Pretrain/Loss (Raw)": 2.4485533237457275, "Pretrain/Step": 4939, "Pretrain/Step Time": 8.592110393568873} +{"Pretrain/Learning Rate": 2.475804239325505e-05, "Pretrain/Loss": 2.0717625617980957, "Pretrain/Loss (Raw)": 2.4172544479370117, "Pretrain/Step": 4940, "Pretrain/Step Time": 8.59015847556293} +{"Pretrain/Learning Rate": 2.474955293186926e-05, "Pretrain/Loss": 2.0711820125579834, "Pretrain/Loss (Raw)": 2.0277211666107178, "Pretrain/Step": 4941, "Pretrain/Step Time": 8.592067815363407} +{"Pretrain/Learning Rate": 2.4741063499366195e-05, "Pretrain/Loss": 2.072847366333008, "Pretrain/Loss (Raw)": 2.151893377304077, "Pretrain/Step": 4942, "Pretrain/Step Time": 8.600642457604408} +{"Pretrain/Learning Rate": 2.4732574096724918e-05, "Pretrain/Loss": 2.074965476989746, "Pretrain/Loss (Raw)": 2.1826059818267822, "Pretrain/Step": 4943, "Pretrain/Step Time": 8.593777809292078} +{"Pretrain/Learning Rate": 2.4724084724924446e-05, "Pretrain/Loss": 2.0740160942077637, "Pretrain/Loss (Raw)": 1.975465178489685, "Pretrain/Step": 4944, "Pretrain/Step Time": 8.596830939874053} +{"Pretrain/Learning Rate": 2.471559538494383e-05, "Pretrain/Loss": 2.0753488540649414, "Pretrain/Loss (Raw)": 2.18642520904541, "Pretrain/Step": 4945, "Pretrain/Step Time": 8.597205765545368} +{"Pretrain/Learning Rate": 2.470710607776209e-05, "Pretrain/Loss": 2.0770015716552734, "Pretrain/Loss (Raw)": 2.0566039085388184, "Pretrain/Step": 4946, "Pretrain/Step Time": 8.593735840171576} +{"Pretrain/Learning Rate": 2.4698616804358263e-05, "Pretrain/Loss": 2.078427314758301, "Pretrain/Loss (Raw)": 2.2123682498931885, "Pretrain/Step": 4947, "Pretrain/Step Time": 8.602746227756143} +{"Pretrain/Learning Rate": 2.469012756571136e-05, "Pretrain/Loss": 2.0794448852539062, "Pretrain/Loss (Raw)": 2.1434707641601562, "Pretrain/Step": 4948, "Pretrain/Step Time": 8.600048433989286} +{"Pretrain/Learning Rate": 2.4681638362800415e-05, "Pretrain/Loss": 2.0791077613830566, "Pretrain/Loss (Raw)": 1.9474390745162964, "Pretrain/Step": 4949, "Pretrain/Step Time": 8.601120570674539} +{"Pretrain/Learning Rate": 2.4673149196604424e-05, "Pretrain/Loss": 2.0816991329193115, "Pretrain/Loss (Raw)": 2.1087207794189453, "Pretrain/Step": 4950, "Pretrain/Step Time": 8.5988384578377} +{"Pretrain/Learning Rate": 2.4664660068102416e-05, "Pretrain/Loss": 2.0804061889648438, "Pretrain/Loss (Raw)": 2.0027623176574707, "Pretrain/Step": 4951, "Pretrain/Step Time": 8.597363602370024} +{"Pretrain/Learning Rate": 2.465617097827338e-05, "Pretrain/Loss": 2.0781004428863525, "Pretrain/Loss (Raw)": 2.0067596435546875, "Pretrain/Step": 4952, "Pretrain/Step Time": 8.596211267635226} +{"Pretrain/Learning Rate": 2.4647681928096337e-05, "Pretrain/Loss": 2.077542781829834, "Pretrain/Loss (Raw)": 1.9894376993179321, "Pretrain/Step": 4953, "Pretrain/Step Time": 8.604356603696942} +{"Pretrain/Learning Rate": 2.4639192918550268e-05, "Pretrain/Loss": 2.0763158798217773, "Pretrain/Loss (Raw)": 2.0344088077545166, "Pretrain/Step": 4954, "Pretrain/Step Time": 8.601864928379655} +{"Pretrain/Learning Rate": 2.4630703950614176e-05, "Pretrain/Loss": 2.076847791671753, "Pretrain/Loss (Raw)": 2.1730918884277344, "Pretrain/Step": 4955, "Pretrain/Step Time": 8.59810228832066} +{"Pretrain/Learning Rate": 2.462221502526704e-05, "Pretrain/Loss": 2.07778000831604, "Pretrain/Loss (Raw)": 2.2490296363830566, "Pretrain/Step": 4956, "Pretrain/Step Time": 8.597587099298835} +{"Pretrain/Learning Rate": 2.461372614348785e-05, "Pretrain/Loss": 2.0752391815185547, "Pretrain/Loss (Raw)": 1.9542226791381836, "Pretrain/Step": 4957, "Pretrain/Step Time": 8.595084235072136} +{"Pretrain/Learning Rate": 2.460523730625558e-05, "Pretrain/Loss": 2.0784711837768555, "Pretrain/Loss (Raw)": 2.0761454105377197, "Pretrain/Step": 4958, "Pretrain/Step Time": 8.595403088256717} +{"Pretrain/Learning Rate": 2.4596748514549208e-05, "Pretrain/Loss": 2.0761473178863525, "Pretrain/Loss (Raw)": 2.357581853866577, "Pretrain/Step": 4959, "Pretrain/Step Time": 8.59302930533886} +{"Pretrain/Learning Rate": 2.458825976934769e-05, "Pretrain/Loss": 2.074584722518921, "Pretrain/Loss (Raw)": 1.97542405128479, "Pretrain/Step": 4960, "Pretrain/Step Time": 8.599599676206708} +{"Pretrain/Learning Rate": 2.4579771071630004e-05, "Pretrain/Loss": 2.071110248565674, "Pretrain/Loss (Raw)": 1.6589720249176025, "Pretrain/Step": 4961, "Pretrain/Step Time": 8.59857883863151} +{"Pretrain/Learning Rate": 2.457128242237509e-05, "Pretrain/Loss": 2.070556163787842, "Pretrain/Loss (Raw)": 1.8818845748901367, "Pretrain/Step": 4962, "Pretrain/Step Time": 8.599646430462599} +{"Pretrain/Learning Rate": 2.4562793822561914e-05, "Pretrain/Loss": 2.069722890853882, "Pretrain/Loss (Raw)": 1.948878526687622, "Pretrain/Step": 4963, "Pretrain/Step Time": 8.596560657024384} +{"Pretrain/Learning Rate": 2.455430527316941e-05, "Pretrain/Loss": 2.070664405822754, "Pretrain/Loss (Raw)": 2.1966326236724854, "Pretrain/Step": 4964, "Pretrain/Step Time": 8.59878634661436} +{"Pretrain/Learning Rate": 2.4545816775176532e-05, "Pretrain/Loss": 2.069689989089966, "Pretrain/Loss (Raw)": 1.947502851486206, "Pretrain/Step": 4965, "Pretrain/Step Time": 8.597020691260695} +{"Pretrain/Learning Rate": 2.4537328329562186e-05, "Pretrain/Loss": 2.0701239109039307, "Pretrain/Loss (Raw)": 2.014040231704712, "Pretrain/Step": 4966, "Pretrain/Step Time": 8.598838651552796} +{"Pretrain/Learning Rate": 2.4528839937305336e-05, "Pretrain/Loss": 2.0689563751220703, "Pretrain/Loss (Raw)": 2.002436399459839, "Pretrain/Step": 4967, "Pretrain/Step Time": 8.596134938299656} +{"Pretrain/Learning Rate": 2.452035159938487e-05, "Pretrain/Loss": 2.0694355964660645, "Pretrain/Loss (Raw)": 2.101841449737549, "Pretrain/Step": 4968, "Pretrain/Step Time": 8.606644416227937} +{"Pretrain/Learning Rate": 2.4511863316779728e-05, "Pretrain/Loss": 2.070824384689331, "Pretrain/Loss (Raw)": 2.092621326446533, "Pretrain/Step": 4969, "Pretrain/Step Time": 8.608907846733928} +{"Pretrain/Learning Rate": 2.4503375090468795e-05, "Pretrain/Loss": 2.070582866668701, "Pretrain/Loss (Raw)": 2.059159755706787, "Pretrain/Step": 4970, "Pretrain/Step Time": 8.611836111173034} +{"Pretrain/Learning Rate": 2.4494886921431005e-05, "Pretrain/Loss": 2.0722107887268066, "Pretrain/Loss (Raw)": 2.1990301609039307, "Pretrain/Step": 4971, "Pretrain/Step Time": 8.610433971509337} +{"Pretrain/Learning Rate": 2.448639881064522e-05, "Pretrain/Loss": 2.0736711025238037, "Pretrain/Loss (Raw)": 1.998750925064087, "Pretrain/Step": 4972, "Pretrain/Step Time": 8.617424435913563} +{"Pretrain/Learning Rate": 2.4477910759090357e-05, "Pretrain/Loss": 2.0721888542175293, "Pretrain/Loss (Raw)": 2.0711724758148193, "Pretrain/Step": 4973, "Pretrain/Step Time": 8.611412279307842} +{"Pretrain/Learning Rate": 2.446942276774527e-05, "Pretrain/Loss": 2.0723133087158203, "Pretrain/Loss (Raw)": 2.0699310302734375, "Pretrain/Step": 4974, "Pretrain/Step Time": 8.614300826564431} +{"Pretrain/Learning Rate": 2.4460934837588856e-05, "Pretrain/Loss": 2.0728695392608643, "Pretrain/Loss (Raw)": 2.1605377197265625, "Pretrain/Step": 4975, "Pretrain/Step Time": 8.613860754296184} +{"Pretrain/Learning Rate": 2.4452446969599986e-05, "Pretrain/Loss": 2.073878526687622, "Pretrain/Loss (Raw)": 2.336446762084961, "Pretrain/Step": 4976, "Pretrain/Step Time": 8.610056046396494} +{"Pretrain/Learning Rate": 2.44439591647575e-05, "Pretrain/Loss": 2.0735244750976562, "Pretrain/Loss (Raw)": 1.9804840087890625, "Pretrain/Step": 4977, "Pretrain/Step Time": 8.612491993233562} +{"Pretrain/Learning Rate": 2.4435471424040273e-05, "Pretrain/Loss": 2.0735726356506348, "Pretrain/Loss (Raw)": 2.09077525138855, "Pretrain/Step": 4978, "Pretrain/Step Time": 8.616902155801654} +{"Pretrain/Learning Rate": 2.442698374842713e-05, "Pretrain/Loss": 2.071533679962158, "Pretrain/Loss (Raw)": 2.092359781265259, "Pretrain/Step": 4979, "Pretrain/Step Time": 8.610385781154037} +{"Pretrain/Learning Rate": 2.4418496138896936e-05, "Pretrain/Loss": 2.070310115814209, "Pretrain/Loss (Raw)": 2.179081678390503, "Pretrain/Step": 4980, "Pretrain/Step Time": 8.62060622498393} +{"Pretrain/Learning Rate": 2.4410008596428492e-05, "Pretrain/Loss": 2.071619987487793, "Pretrain/Loss (Raw)": 2.034877061843872, "Pretrain/Step": 4981, "Pretrain/Step Time": 8.612173452973366} +{"Pretrain/Learning Rate": 2.440152112200065e-05, "Pretrain/Loss": 2.070502519607544, "Pretrain/Loss (Raw)": 2.0746102333068848, "Pretrain/Step": 4982, "Pretrain/Step Time": 8.612603200599551} +{"Pretrain/Learning Rate": 2.4393033716592196e-05, "Pretrain/Loss": 2.0698800086975098, "Pretrain/Loss (Raw)": 1.9754304885864258, "Pretrain/Step": 4983, "Pretrain/Step Time": 8.60791771300137} +{"Pretrain/Learning Rate": 2.4384546381181976e-05, "Pretrain/Loss": 2.06929874420166, "Pretrain/Loss (Raw)": 1.9410420656204224, "Pretrain/Step": 4984, "Pretrain/Step Time": 8.618583243340254} +{"Pretrain/Learning Rate": 2.437605911674875e-05, "Pretrain/Loss": 2.068821907043457, "Pretrain/Loss (Raw)": 2.0869944095611572, "Pretrain/Step": 4985, "Pretrain/Step Time": 8.609337268397212} +{"Pretrain/Learning Rate": 2.4367571924271335e-05, "Pretrain/Loss": 2.068375587463379, "Pretrain/Loss (Raw)": 1.952959418296814, "Pretrain/Step": 4986, "Pretrain/Step Time": 8.613219294697046} +{"Pretrain/Learning Rate": 2.43590848047285e-05, "Pretrain/Loss": 2.0676000118255615, "Pretrain/Loss (Raw)": 1.9415260553359985, "Pretrain/Step": 4987, "Pretrain/Step Time": 8.61461872048676} +{"Pretrain/Learning Rate": 2.4350597759099034e-05, "Pretrain/Loss": 2.0656137466430664, "Pretrain/Loss (Raw)": 1.864605188369751, "Pretrain/Step": 4988, "Pretrain/Step Time": 8.615914152935147} +{"Pretrain/Learning Rate": 2.4342110788361685e-05, "Pretrain/Loss": 2.062288284301758, "Pretrain/Loss (Raw)": 1.9873685836791992, "Pretrain/Step": 4989, "Pretrain/Step Time": 8.610729170963168} +{"Pretrain/Learning Rate": 2.433362389349523e-05, "Pretrain/Loss": 2.060974597930908, "Pretrain/Loss (Raw)": 1.9677437543869019, "Pretrain/Step": 4990, "Pretrain/Step Time": 8.613357527181506} +{"Pretrain/Learning Rate": 2.4325137075478398e-05, "Pretrain/Loss": 2.0635480880737305, "Pretrain/Loss (Raw)": 2.115743398666382, "Pretrain/Step": 4991, "Pretrain/Step Time": 8.612925536930561} +{"Pretrain/Learning Rate": 2.4316650335289942e-05, "Pretrain/Loss": 2.062283992767334, "Pretrain/Loss (Raw)": 1.7047728300094604, "Pretrain/Step": 4992, "Pretrain/Step Time": 8.622063087299466} +{"Pretrain/Learning Rate": 2.430816367390859e-05, "Pretrain/Loss": 2.0627903938293457, "Pretrain/Loss (Raw)": 2.1213934421539307, "Pretrain/Step": 4993, "Pretrain/Step Time": 8.618190692737699} +{"Pretrain/Learning Rate": 2.429967709231306e-05, "Pretrain/Loss": 2.0628914833068848, "Pretrain/Loss (Raw)": 2.1295032501220703, "Pretrain/Step": 4994, "Pretrain/Step Time": 8.62065639719367} +{"Pretrain/Learning Rate": 2.429119059148207e-05, "Pretrain/Loss": 2.065586566925049, "Pretrain/Loss (Raw)": 2.300739288330078, "Pretrain/Step": 4995, "Pretrain/Step Time": 8.618096156045794} +{"Pretrain/Learning Rate": 2.4282704172394323e-05, "Pretrain/Loss": 2.063465118408203, "Pretrain/Loss (Raw)": 2.0676164627075195, "Pretrain/Step": 4996, "Pretrain/Step Time": 8.618176626041532} +{"Pretrain/Learning Rate": 2.4274217836028507e-05, "Pretrain/Loss": 2.065922737121582, "Pretrain/Loss (Raw)": 2.082939624786377, "Pretrain/Step": 4997, "Pretrain/Step Time": 8.6129533033818} +{"Pretrain/Learning Rate": 2.4265731583363316e-05, "Pretrain/Loss": 2.068171262741089, "Pretrain/Loss (Raw)": 2.3935341835021973, "Pretrain/Step": 4998, "Pretrain/Step Time": 8.608546508476138} +{"Pretrain/Learning Rate": 2.425724541537741e-05, "Pretrain/Loss": 2.070084571838379, "Pretrain/Loss (Raw)": 2.4855384826660156, "Pretrain/Step": 4999, "Pretrain/Step Time": 8.608171992003918} +{"Pretrain/Learning Rate": 2.4248759333049474e-05, "Pretrain/Loss": 2.066924571990967, "Pretrain/Loss (Raw)": 1.9347864389419556, "Pretrain/Step": 5000, "Pretrain/Step Time": 8.616699986159801} +{"Pretrain/Learning Rate": 2.424027333735814e-05, "Pretrain/Loss": 2.066939353942871, "Pretrain/Loss (Raw)": 1.9729136228561401, "Pretrain/Step": 5001, "Pretrain/Step Time": 9.09689961746335} +{"Pretrain/Learning Rate": 2.4231787429282073e-05, "Pretrain/Loss": 2.0702614784240723, "Pretrain/Loss (Raw)": 2.344515323638916, "Pretrain/Step": 5002, "Pretrain/Step Time": 9.09994831494987} +{"Pretrain/Learning Rate": 2.4223301609799895e-05, "Pretrain/Loss": 2.0734317302703857, "Pretrain/Loss (Raw)": 2.2325100898742676, "Pretrain/Step": 5003, "Pretrain/Step Time": 9.101618999615312} +{"Pretrain/Learning Rate": 2.421481587989024e-05, "Pretrain/Loss": 2.0719733238220215, "Pretrain/Loss (Raw)": 1.7022364139556885, "Pretrain/Step": 5004, "Pretrain/Step Time": 9.099994163960218} +{"Pretrain/Learning Rate": 2.4206330240531713e-05, "Pretrain/Loss": 2.0726799964904785, "Pretrain/Loss (Raw)": 2.0700652599334717, "Pretrain/Step": 5005, "Pretrain/Step Time": 9.097758272662759} +{"Pretrain/Learning Rate": 2.4197844692702925e-05, "Pretrain/Loss": 2.072421073913574, "Pretrain/Loss (Raw)": 2.0740458965301514, "Pretrain/Step": 5006, "Pretrain/Step Time": 9.106265446171165} +{"Pretrain/Learning Rate": 2.4189359237382464e-05, "Pretrain/Loss": 2.069575548171997, "Pretrain/Loss (Raw)": 1.7710119485855103, "Pretrain/Step": 5007, "Pretrain/Step Time": 9.101553477346897} +{"Pretrain/Learning Rate": 2.4180873875548925e-05, "Pretrain/Loss": 2.068718910217285, "Pretrain/Loss (Raw)": 1.9432734251022339, "Pretrain/Step": 5008, "Pretrain/Step Time": 9.098213009536266} +{"Pretrain/Learning Rate": 2.4172388608180857e-05, "Pretrain/Loss": 2.068821907043457, "Pretrain/Loss (Raw)": 2.0403575897216797, "Pretrain/Step": 5009, "Pretrain/Step Time": 9.096335824579} +{"Pretrain/Learning Rate": 2.4163903436256848e-05, "Pretrain/Loss": 2.068392753601074, "Pretrain/Loss (Raw)": 2.1813364028930664, "Pretrain/Step": 5010, "Pretrain/Step Time": 9.099485719576478} +{"Pretrain/Learning Rate": 2.4155418360755423e-05, "Pretrain/Loss": 2.0723466873168945, "Pretrain/Loss (Raw)": 2.018742084503174, "Pretrain/Step": 5011, "Pretrain/Step Time": 9.094001157209277} +{"Pretrain/Learning Rate": 2.4146933382655145e-05, "Pretrain/Loss": 2.069582939147949, "Pretrain/Loss (Raw)": 1.8927669525146484, "Pretrain/Step": 5012, "Pretrain/Step Time": 9.10226310417056} +{"Pretrain/Learning Rate": 2.413844850293451e-05, "Pretrain/Loss": 2.0717830657958984, "Pretrain/Loss (Raw)": 2.210355043411255, "Pretrain/Step": 5013, "Pretrain/Step Time": 9.100076049566269} +{"Pretrain/Learning Rate": 2.4129963722572074e-05, "Pretrain/Loss": 2.0731863975524902, "Pretrain/Loss (Raw)": 2.0743212699890137, "Pretrain/Step": 5014, "Pretrain/Step Time": 9.104163710027933} +{"Pretrain/Learning Rate": 2.41214790425463e-05, "Pretrain/Loss": 2.073805809020996, "Pretrain/Loss (Raw)": 2.0880610942840576, "Pretrain/Step": 5015, "Pretrain/Step Time": 9.10304045677185} +{"Pretrain/Learning Rate": 2.4112994463835714e-05, "Pretrain/Loss": 2.0746400356292725, "Pretrain/Loss (Raw)": 2.0931525230407715, "Pretrain/Step": 5016, "Pretrain/Step Time": 9.09138329140842} +{"Pretrain/Learning Rate": 2.4104509987418793e-05, "Pretrain/Loss": 2.077643871307373, "Pretrain/Loss (Raw)": 2.1382622718811035, "Pretrain/Step": 5017, "Pretrain/Step Time": 9.098108038306236} +{"Pretrain/Learning Rate": 2.4096025614273988e-05, "Pretrain/Loss": 2.0769195556640625, "Pretrain/Loss (Raw)": 1.9962944984436035, "Pretrain/Step": 5018, "Pretrain/Step Time": 9.104074934497476} +{"Pretrain/Learning Rate": 2.408754134537978e-05, "Pretrain/Loss": 2.0778656005859375, "Pretrain/Loss (Raw)": 2.0475893020629883, "Pretrain/Step": 5019, "Pretrain/Step Time": 9.108866220340133} +{"Pretrain/Learning Rate": 2.407905718171459e-05, "Pretrain/Loss": 2.077840805053711, "Pretrain/Loss (Raw)": 1.9601770639419556, "Pretrain/Step": 5020, "Pretrain/Step Time": 9.107997443526983} +{"Pretrain/Learning Rate": 2.4070573124256883e-05, "Pretrain/Loss": 2.076598644256592, "Pretrain/Loss (Raw)": 2.0756397247314453, "Pretrain/Step": 5021, "Pretrain/Step Time": 9.106698788702488} +{"Pretrain/Learning Rate": 2.4062089173985044e-05, "Pretrain/Loss": 2.0779531002044678, "Pretrain/Loss (Raw)": 2.2865676879882812, "Pretrain/Step": 5022, "Pretrain/Step Time": 9.095756359398365} +{"Pretrain/Learning Rate": 2.4053605331877517e-05, "Pretrain/Loss": 2.0781936645507812, "Pretrain/Loss (Raw)": 2.0598504543304443, "Pretrain/Step": 5023, "Pretrain/Step Time": 9.103493753820658} +{"Pretrain/Learning Rate": 2.404512159891267e-05, "Pretrain/Loss": 2.0748496055603027, "Pretrain/Loss (Raw)": 1.9449694156646729, "Pretrain/Step": 5024, "Pretrain/Step Time": 9.1032096426934} +{"Pretrain/Learning Rate": 2.4036637976068914e-05, "Pretrain/Loss": 2.0752310752868652, "Pretrain/Loss (Raw)": 2.179957389831543, "Pretrain/Step": 5025, "Pretrain/Step Time": 9.106658332049847} +{"Pretrain/Learning Rate": 2.4028154464324592e-05, "Pretrain/Loss": 2.0750081539154053, "Pretrain/Loss (Raw)": 2.089881658554077, "Pretrain/Step": 5026, "Pretrain/Step Time": 9.105737697333097} +{"Pretrain/Learning Rate": 2.4019671064658088e-05, "Pretrain/Loss": 2.0763070583343506, "Pretrain/Loss (Raw)": 2.3858642578125, "Pretrain/Step": 5027, "Pretrain/Step Time": 9.107149535790086} +{"Pretrain/Learning Rate": 2.4011187778047727e-05, "Pretrain/Loss": 2.0762243270874023, "Pretrain/Loss (Raw)": 2.04750394821167, "Pretrain/Step": 5028, "Pretrain/Step Time": 9.100613038986921} +{"Pretrain/Learning Rate": 2.4002704605471857e-05, "Pretrain/Loss": 2.074282169342041, "Pretrain/Loss (Raw)": 1.8695132732391357, "Pretrain/Step": 5029, "Pretrain/Step Time": 9.108925223350525} +{"Pretrain/Learning Rate": 2.3994221547908783e-05, "Pretrain/Loss": 2.0755558013916016, "Pretrain/Loss (Raw)": 2.1564550399780273, "Pretrain/Step": 5030, "Pretrain/Step Time": 9.103807909414172} +{"Pretrain/Learning Rate": 2.398573860633683e-05, "Pretrain/Loss": 2.075913429260254, "Pretrain/Loss (Raw)": 2.1492486000061035, "Pretrain/Step": 5031, "Pretrain/Step Time": 9.107778456062078} +{"Pretrain/Learning Rate": 2.3977255781734275e-05, "Pretrain/Loss": 2.0778770446777344, "Pretrain/Loss (Raw)": 1.9914913177490234, "Pretrain/Step": 5032, "Pretrain/Step Time": 9.102735102176666} +{"Pretrain/Learning Rate": 2.3968773075079404e-05, "Pretrain/Loss": 2.0770511627197266, "Pretrain/Loss (Raw)": 1.9989562034606934, "Pretrain/Step": 5033, "Pretrain/Step Time": 9.101142199710011} +{"Pretrain/Learning Rate": 2.396029048735048e-05, "Pretrain/Loss": 2.076855421066284, "Pretrain/Loss (Raw)": 2.072117328643799, "Pretrain/Step": 5034, "Pretrain/Step Time": 9.088289046660066} +{"Pretrain/Learning Rate": 2.3951808019525758e-05, "Pretrain/Loss": 2.0749964714050293, "Pretrain/Loss (Raw)": 1.858347773551941, "Pretrain/Step": 5035, "Pretrain/Step Time": 9.096165562048554} +{"Pretrain/Learning Rate": 2.394332567258347e-05, "Pretrain/Loss": 2.0754880905151367, "Pretrain/Loss (Raw)": 2.035262107849121, "Pretrain/Step": 5036, "Pretrain/Step Time": 9.09567529335618} +{"Pretrain/Learning Rate": 2.3934843447501852e-05, "Pretrain/Loss": 2.076730251312256, "Pretrain/Loss (Raw)": 2.1218879222869873, "Pretrain/Step": 5037, "Pretrain/Step Time": 9.10470468364656} +{"Pretrain/Learning Rate": 2.3926361345259098e-05, "Pretrain/Loss": 2.0767629146575928, "Pretrain/Loss (Raw)": 2.3900187015533447, "Pretrain/Step": 5038, "Pretrain/Step Time": 9.104914460331202} +{"Pretrain/Learning Rate": 2.391787936683342e-05, "Pretrain/Loss": 2.076634407043457, "Pretrain/Loss (Raw)": 2.080014705657959, "Pretrain/Step": 5039, "Pretrain/Step Time": 9.104406459257007} +{"Pretrain/Learning Rate": 2.390939751320299e-05, "Pretrain/Loss": 2.0736162662506104, "Pretrain/Loss (Raw)": 2.03962779045105, "Pretrain/Step": 5040, "Pretrain/Step Time": 9.10001626983285} +{"Pretrain/Learning Rate": 2.390091578534598e-05, "Pretrain/Loss": 2.0720577239990234, "Pretrain/Loss (Raw)": 1.851032018661499, "Pretrain/Step": 5041, "Pretrain/Step Time": 9.107518846169114} +{"Pretrain/Learning Rate": 2.3892434184240533e-05, "Pretrain/Loss": 2.0766687393188477, "Pretrain/Loss (Raw)": 2.376842498779297, "Pretrain/Step": 5042, "Pretrain/Step Time": 9.106905844062567} +{"Pretrain/Learning Rate": 2.3883952710864804e-05, "Pretrain/Loss": 2.078795909881592, "Pretrain/Loss (Raw)": 2.1615569591522217, "Pretrain/Step": 5043, "Pretrain/Step Time": 9.106994099915028} +{"Pretrain/Learning Rate": 2.3875471366196903e-05, "Pretrain/Loss": 2.077609062194824, "Pretrain/Loss (Raw)": 2.091794490814209, "Pretrain/Step": 5044, "Pretrain/Step Time": 9.106756556779146} +{"Pretrain/Learning Rate": 2.3866990151214947e-05, "Pretrain/Loss": 2.0771937370300293, "Pretrain/Loss (Raw)": 2.0058653354644775, "Pretrain/Step": 5045, "Pretrain/Step Time": 9.104042794555426} +{"Pretrain/Learning Rate": 2.3858509066897016e-05, "Pretrain/Loss": 2.0743408203125, "Pretrain/Loss (Raw)": 1.681944727897644, "Pretrain/Step": 5046, "Pretrain/Step Time": 9.092850344255567} +{"Pretrain/Learning Rate": 2.385002811422121e-05, "Pretrain/Loss": 2.073509693145752, "Pretrain/Loss (Raw)": 2.074003219604492, "Pretrain/Step": 5047, "Pretrain/Step Time": 9.091327019035816} +{"Pretrain/Learning Rate": 2.384154729416557e-05, "Pretrain/Loss": 2.0729928016662598, "Pretrain/Loss (Raw)": 1.930509090423584, "Pretrain/Step": 5048, "Pretrain/Step Time": 9.09812892973423} +{"Pretrain/Learning Rate": 2.383306660770817e-05, "Pretrain/Loss": 2.0736618041992188, "Pretrain/Loss (Raw)": 2.068631649017334, "Pretrain/Step": 5049, "Pretrain/Step Time": 9.094965767115355} +{"Pretrain/Learning Rate": 2.382458605582701e-05, "Pretrain/Loss": 2.0726871490478516, "Pretrain/Loss (Raw)": 2.032557249069214, "Pretrain/Step": 5050, "Pretrain/Step Time": 9.101552346721292} +{"Pretrain/Learning Rate": 2.3816105639500142e-05, "Pretrain/Loss": 2.0728697776794434, "Pretrain/Loss (Raw)": 2.1577723026275635, "Pretrain/Step": 5051, "Pretrain/Step Time": 9.095096033066511} +{"Pretrain/Learning Rate": 2.3807625359705532e-05, "Pretrain/Loss": 2.0708324909210205, "Pretrain/Loss (Raw)": 1.8923653364181519, "Pretrain/Step": 5052, "Pretrain/Step Time": 9.081066386774182} +{"Pretrain/Learning Rate": 2.37991452174212e-05, "Pretrain/Loss": 2.069915294647217, "Pretrain/Loss (Raw)": 2.1332919597625732, "Pretrain/Step": 5053, "Pretrain/Step Time": 9.078056430444121} +{"Pretrain/Learning Rate": 2.3790665213625087e-05, "Pretrain/Loss": 2.0697669982910156, "Pretrain/Loss (Raw)": 2.118623733520508, "Pretrain/Step": 5054, "Pretrain/Step Time": 9.088535975664854} +{"Pretrain/Learning Rate": 2.3782185349295174e-05, "Pretrain/Loss": 2.0703532695770264, "Pretrain/Loss (Raw)": 2.073582172393799, "Pretrain/Step": 5055, "Pretrain/Step Time": 9.085700940340757} +{"Pretrain/Learning Rate": 2.377370562540937e-05, "Pretrain/Loss": 2.0690784454345703, "Pretrain/Loss (Raw)": 2.132293462753296, "Pretrain/Step": 5056, "Pretrain/Step Time": 9.094560453668237} +{"Pretrain/Learning Rate": 2.3765226042945616e-05, "Pretrain/Loss": 2.0683391094207764, "Pretrain/Loss (Raw)": 2.0473475456237793, "Pretrain/Step": 5057, "Pretrain/Step Time": 9.083983546122909} +{"Pretrain/Learning Rate": 2.3756746602881824e-05, "Pretrain/Loss": 2.068655014038086, "Pretrain/Loss (Raw)": 1.975448727607727, "Pretrain/Step": 5058, "Pretrain/Step Time": 9.075694562867284} +{"Pretrain/Learning Rate": 2.3748267306195855e-05, "Pretrain/Loss": 2.068164110183716, "Pretrain/Loss (Raw)": 1.844638466835022, "Pretrain/Step": 5059, "Pretrain/Step Time": 9.077777354046702} +{"Pretrain/Learning Rate": 2.373978815386562e-05, "Pretrain/Loss": 2.0688302516937256, "Pretrain/Loss (Raw)": 2.18269944190979, "Pretrain/Step": 5060, "Pretrain/Step Time": 9.087392296642065} +{"Pretrain/Learning Rate": 2.3731309146868932e-05, "Pretrain/Loss": 2.0705912113189697, "Pretrain/Loss (Raw)": 2.12469220161438, "Pretrain/Step": 5061, "Pretrain/Step Time": 9.0872171074152} +{"Pretrain/Learning Rate": 2.372283028618367e-05, "Pretrain/Loss": 2.0688681602478027, "Pretrain/Loss (Raw)": 2.098628044128418, "Pretrain/Step": 5062, "Pretrain/Step Time": 9.093905618414283} +{"Pretrain/Learning Rate": 2.371435157278762e-05, "Pretrain/Loss": 2.067577362060547, "Pretrain/Loss (Raw)": 1.998928189277649, "Pretrain/Step": 5063, "Pretrain/Step Time": 9.091992631554604} +{"Pretrain/Learning Rate": 2.370587300765862e-05, "Pretrain/Loss": 2.0688462257385254, "Pretrain/Loss (Raw)": 2.1748127937316895, "Pretrain/Step": 5064, "Pretrain/Step Time": 9.083787586539984} +{"Pretrain/Learning Rate": 2.369739459177443e-05, "Pretrain/Loss": 2.069424629211426, "Pretrain/Loss (Raw)": 1.9227735996246338, "Pretrain/Step": 5065, "Pretrain/Step Time": 9.08387184329331} +{"Pretrain/Learning Rate": 2.3688916326112848e-05, "Pretrain/Loss": 2.0698790550231934, "Pretrain/Loss (Raw)": 2.183088541030884, "Pretrain/Step": 5066, "Pretrain/Step Time": 9.080508520826697} +{"Pretrain/Learning Rate": 2.3680438211651597e-05, "Pretrain/Loss": 2.0675787925720215, "Pretrain/Loss (Raw)": 2.1541004180908203, "Pretrain/Step": 5067, "Pretrain/Step Time": 9.081373142078519} +{"Pretrain/Learning Rate": 2.3671960249368448e-05, "Pretrain/Loss": 2.0647711753845215, "Pretrain/Loss (Raw)": 2.057887315750122, "Pretrain/Step": 5068, "Pretrain/Step Time": 9.08174416795373} +{"Pretrain/Learning Rate": 2.3663482440241087e-05, "Pretrain/Loss": 2.0652174949645996, "Pretrain/Loss (Raw)": 2.0848300457000732, "Pretrain/Step": 5069, "Pretrain/Step Time": 9.080852696672082} +{"Pretrain/Learning Rate": 2.3655004785247234e-05, "Pretrain/Loss": 2.065563678741455, "Pretrain/Loss (Raw)": 2.196192741394043, "Pretrain/Step": 5070, "Pretrain/Step Time": 9.071532741189003} +{"Pretrain/Learning Rate": 2.3646527285364565e-05, "Pretrain/Loss": 2.064972400665283, "Pretrain/Loss (Raw)": 2.1069483757019043, "Pretrain/Step": 5071, "Pretrain/Step Time": 9.071834595873952} +{"Pretrain/Learning Rate": 2.363804994157075e-05, "Pretrain/Loss": 2.0658605098724365, "Pretrain/Loss (Raw)": 2.089144706726074, "Pretrain/Step": 5072, "Pretrain/Step Time": 9.068441711366177} +{"Pretrain/Learning Rate": 2.3629572754843428e-05, "Pretrain/Loss": 2.0638999938964844, "Pretrain/Loss (Raw)": 1.9354596138000488, "Pretrain/Step": 5073, "Pretrain/Step Time": 9.064724128693342} +{"Pretrain/Learning Rate": 2.3621095726160237e-05, "Pretrain/Loss": 2.063875198364258, "Pretrain/Loss (Raw)": 2.0534324645996094, "Pretrain/Step": 5074, "Pretrain/Step Time": 9.068281028419733} +{"Pretrain/Learning Rate": 2.3612618856498785e-05, "Pretrain/Loss": 2.0628552436828613, "Pretrain/Loss (Raw)": 2.081834077835083, "Pretrain/Step": 5075, "Pretrain/Step Time": 9.060938593000174} +{"Pretrain/Learning Rate": 2.3604142146836666e-05, "Pretrain/Loss": 2.0622739791870117, "Pretrain/Loss (Raw)": 2.0690808296203613, "Pretrain/Step": 5076, "Pretrain/Step Time": 9.063257560133934} +{"Pretrain/Learning Rate": 2.3595665598151444e-05, "Pretrain/Loss": 2.062500476837158, "Pretrain/Loss (Raw)": 1.976415753364563, "Pretrain/Step": 5077, "Pretrain/Step Time": 9.05647830851376} +{"Pretrain/Learning Rate": 2.3587189211420694e-05, "Pretrain/Loss": 2.0627870559692383, "Pretrain/Loss (Raw)": 2.1454050540924072, "Pretrain/Step": 5078, "Pretrain/Step Time": 9.060590449720621} +{"Pretrain/Learning Rate": 2.3578712987621932e-05, "Pretrain/Loss": 2.062027931213379, "Pretrain/Loss (Raw)": 1.9055713415145874, "Pretrain/Step": 5079, "Pretrain/Step Time": 9.058467358350754} +{"Pretrain/Learning Rate": 2.3570236927732692e-05, "Pretrain/Loss": 2.0626578330993652, "Pretrain/Loss (Raw)": 2.0874009132385254, "Pretrain/Step": 5080, "Pretrain/Step Time": 9.058784820139408} +{"Pretrain/Learning Rate": 2.3561761032730463e-05, "Pretrain/Loss": 2.065587282180786, "Pretrain/Loss (Raw)": 2.364420175552368, "Pretrain/Step": 5081, "Pretrain/Step Time": 9.054897589609027} +{"Pretrain/Learning Rate": 2.355328530359273e-05, "Pretrain/Loss": 2.06638240814209, "Pretrain/Loss (Raw)": 2.1361727714538574, "Pretrain/Step": 5082, "Pretrain/Step Time": 9.055874494835734} +{"Pretrain/Learning Rate": 2.3544809741296954e-05, "Pretrain/Loss": 2.0653114318847656, "Pretrain/Loss (Raw)": 2.0360379219055176, "Pretrain/Step": 5083, "Pretrain/Step Time": 9.05101278796792} +{"Pretrain/Learning Rate": 2.3536334346820578e-05, "Pretrain/Loss": 2.0636191368103027, "Pretrain/Loss (Raw)": 2.0324065685272217, "Pretrain/Step": 5084, "Pretrain/Step Time": 9.05287242680788} +{"Pretrain/Learning Rate": 2.3527859121141012e-05, "Pretrain/Loss": 2.064584255218506, "Pretrain/Loss (Raw)": 2.0777130126953125, "Pretrain/Step": 5085, "Pretrain/Step Time": 9.052370244637132} +{"Pretrain/Learning Rate": 2.351938406523568e-05, "Pretrain/Loss": 2.064908027648926, "Pretrain/Loss (Raw)": 2.117621660232544, "Pretrain/Step": 5086, "Pretrain/Step Time": 9.052245538681746} +{"Pretrain/Learning Rate": 2.3510909180081946e-05, "Pretrain/Loss": 2.061135768890381, "Pretrain/Loss (Raw)": 1.8747212886810303, "Pretrain/Step": 5087, "Pretrain/Step Time": 9.05783485621214} +{"Pretrain/Learning Rate": 2.350243446665719e-05, "Pretrain/Loss": 2.05985164642334, "Pretrain/Loss (Raw)": 1.8110629320144653, "Pretrain/Step": 5088, "Pretrain/Step Time": 9.05340563505888} +{"Pretrain/Learning Rate": 2.3493959925938746e-05, "Pretrain/Loss": 2.063382625579834, "Pretrain/Loss (Raw)": 2.1109113693237305, "Pretrain/Step": 5089, "Pretrain/Step Time": 9.052907168865204} +{"Pretrain/Learning Rate": 2.348548555890394e-05, "Pretrain/Loss": 2.065291404724121, "Pretrain/Loss (Raw)": 2.1262283325195312, "Pretrain/Step": 5090, "Pretrain/Step Time": 9.05581740476191} +{"Pretrain/Learning Rate": 2.3477011366530068e-05, "Pretrain/Loss": 2.0658228397369385, "Pretrain/Loss (Raw)": 2.016904830932617, "Pretrain/Step": 5091, "Pretrain/Step Time": 9.055837385356426} +{"Pretrain/Learning Rate": 2.3468537349794438e-05, "Pretrain/Loss": 2.0649681091308594, "Pretrain/Loss (Raw)": 2.0872039794921875, "Pretrain/Step": 5092, "Pretrain/Step Time": 9.053644433617592} +{"Pretrain/Learning Rate": 2.3460063509674278e-05, "Pretrain/Loss": 2.065408706665039, "Pretrain/Loss (Raw)": 2.003927230834961, "Pretrain/Step": 5093, "Pretrain/Step Time": 9.053730623796582} +{"Pretrain/Learning Rate": 2.345158984714687e-05, "Pretrain/Loss": 2.066373825073242, "Pretrain/Loss (Raw)": 2.1375768184661865, "Pretrain/Step": 5094, "Pretrain/Step Time": 9.053859077394009} +{"Pretrain/Learning Rate": 2.3443116363189398e-05, "Pretrain/Loss": 2.0680956840515137, "Pretrain/Loss (Raw)": 2.2228381633758545, "Pretrain/Step": 5095, "Pretrain/Step Time": 9.052854720503092} +{"Pretrain/Learning Rate": 2.3434643058779104e-05, "Pretrain/Loss": 2.068140983581543, "Pretrain/Loss (Raw)": 2.1076178550720215, "Pretrain/Step": 5096, "Pretrain/Step Time": 9.044570077210665} +{"Pretrain/Learning Rate": 2.342616993489313e-05, "Pretrain/Loss": 2.068622589111328, "Pretrain/Loss (Raw)": 2.154298782348633, "Pretrain/Step": 5097, "Pretrain/Step Time": 9.042680710554123} +{"Pretrain/Learning Rate": 2.3417696992508657e-05, "Pretrain/Loss": 2.0727975368499756, "Pretrain/Loss (Raw)": 2.593526840209961, "Pretrain/Step": 5098, "Pretrain/Step Time": 9.044332668185234} +{"Pretrain/Learning Rate": 2.3409224232602832e-05, "Pretrain/Loss": 2.071742534637451, "Pretrain/Loss (Raw)": 2.0640218257904053, "Pretrain/Step": 5099, "Pretrain/Step Time": 9.050284016877413} +{"Pretrain/Learning Rate": 2.340075165615276e-05, "Pretrain/Loss": 2.0722641944885254, "Pretrain/Loss (Raw)": 2.0654735565185547, "Pretrain/Step": 5100, "Pretrain/Step Time": 9.046404715627432} +{"Pretrain/Learning Rate": 2.339227926413555e-05, "Pretrain/Loss": 2.0720295906066895, "Pretrain/Loss (Raw)": 2.041165828704834, "Pretrain/Step": 5101, "Pretrain/Step Time": 9.04853118956089} +{"Pretrain/Learning Rate": 2.3383807057528256e-05, "Pretrain/Loss": 2.0705642700195312, "Pretrain/Loss (Raw)": 1.882384181022644, "Pretrain/Step": 5102, "Pretrain/Step Time": 9.04251548834145} +{"Pretrain/Learning Rate": 2.3375335037307965e-05, "Pretrain/Loss": 2.0694384574890137, "Pretrain/Loss (Raw)": 2.016400098800659, "Pretrain/Step": 5103, "Pretrain/Step Time": 9.037932800129056} +{"Pretrain/Learning Rate": 2.3366863204451677e-05, "Pretrain/Loss": 2.067885398864746, "Pretrain/Loss (Raw)": 2.137667417526245, "Pretrain/Step": 5104, "Pretrain/Step Time": 9.043332017958164} +{"Pretrain/Learning Rate": 2.3358391559936438e-05, "Pretrain/Loss": 2.068521499633789, "Pretrain/Loss (Raw)": 2.0619266033172607, "Pretrain/Step": 5105, "Pretrain/Step Time": 9.038916340097785} +{"Pretrain/Learning Rate": 2.33499201047392e-05, "Pretrain/Loss": 2.0678281784057617, "Pretrain/Loss (Raw)": 2.0019943714141846, "Pretrain/Step": 5106, "Pretrain/Step Time": 9.045786606147885} +{"Pretrain/Learning Rate": 2.334144883983697e-05, "Pretrain/Loss": 2.0670506954193115, "Pretrain/Loss (Raw)": 1.9928802251815796, "Pretrain/Step": 5107, "Pretrain/Step Time": 9.040930047631264} +{"Pretrain/Learning Rate": 2.3332977766206657e-05, "Pretrain/Loss": 2.0700950622558594, "Pretrain/Loss (Raw)": 2.5687339305877686, "Pretrain/Step": 5108, "Pretrain/Step Time": 9.036173555999994} +{"Pretrain/Learning Rate": 2.332450688482522e-05, "Pretrain/Loss": 2.0710196495056152, "Pretrain/Loss (Raw)": 2.153254270553589, "Pretrain/Step": 5109, "Pretrain/Step Time": 9.039147330448031} +{"Pretrain/Learning Rate": 2.3316036196669534e-05, "Pretrain/Loss": 2.0701677799224854, "Pretrain/Loss (Raw)": 1.9655460119247437, "Pretrain/Step": 5110, "Pretrain/Step Time": 9.037523835897446} +{"Pretrain/Learning Rate": 2.3307565702716495e-05, "Pretrain/Loss": 2.068284273147583, "Pretrain/Loss (Raw)": 1.7343499660491943, "Pretrain/Step": 5111, "Pretrain/Step Time": 9.037344889715314} +{"Pretrain/Learning Rate": 2.3299095403942943e-05, "Pretrain/Loss": 2.0690579414367676, "Pretrain/Loss (Raw)": 2.0400686264038086, "Pretrain/Step": 5112, "Pretrain/Step Time": 9.038918796926737} +{"Pretrain/Learning Rate": 2.3290625301325735e-05, "Pretrain/Loss": 2.0709500312805176, "Pretrain/Loss (Raw)": 2.329204797744751, "Pretrain/Step": 5113, "Pretrain/Step Time": 9.038426660001278} +{"Pretrain/Learning Rate": 2.3282155395841667e-05, "Pretrain/Loss": 2.0712368488311768, "Pretrain/Loss (Raw)": 1.9896421432495117, "Pretrain/Step": 5114, "Pretrain/Step Time": 9.04157393425703} +{"Pretrain/Learning Rate": 2.327368568846754e-05, "Pretrain/Loss": 2.0708515644073486, "Pretrain/Loss (Raw)": 1.8922239542007446, "Pretrain/Step": 5115, "Pretrain/Step Time": 9.045380152761936} +{"Pretrain/Learning Rate": 2.3265216180180106e-05, "Pretrain/Loss": 2.0741348266601562, "Pretrain/Loss (Raw)": 2.2848525047302246, "Pretrain/Step": 5116, "Pretrain/Step Time": 9.045490061864257} +{"Pretrain/Learning Rate": 2.325674687195612e-05, "Pretrain/Loss": 2.07595157623291, "Pretrain/Loss (Raw)": 2.2199158668518066, "Pretrain/Step": 5117, "Pretrain/Step Time": 9.044440660625696} +{"Pretrain/Learning Rate": 2.32482777647723e-05, "Pretrain/Loss": 2.0740718841552734, "Pretrain/Loss (Raw)": 1.7271287441253662, "Pretrain/Step": 5118, "Pretrain/Step Time": 9.050893038511276} +{"Pretrain/Learning Rate": 2.323980885960534e-05, "Pretrain/Loss": 2.0734477043151855, "Pretrain/Loss (Raw)": 2.035860538482666, "Pretrain/Step": 5119, "Pretrain/Step Time": 9.04841360077262} +{"Pretrain/Learning Rate": 2.3231340157431917e-05, "Pretrain/Loss": 2.07654070854187, "Pretrain/Loss (Raw)": 2.1006853580474854, "Pretrain/Step": 5120, "Pretrain/Step Time": 9.041371451690793} +{"Pretrain/Learning Rate": 2.3222871659228685e-05, "Pretrain/Loss": 2.076603412628174, "Pretrain/Loss (Raw)": 2.1293957233428955, "Pretrain/Step": 5121, "Pretrain/Step Time": 9.035179750993848} +{"Pretrain/Learning Rate": 2.3214403365972258e-05, "Pretrain/Loss": 2.075956344604492, "Pretrain/Loss (Raw)": 2.0467042922973633, "Pretrain/Step": 5122, "Pretrain/Step Time": 9.03618305362761} +{"Pretrain/Learning Rate": 2.320593527863926e-05, "Pretrain/Loss": 2.072840690612793, "Pretrain/Loss (Raw)": 1.901944875717163, "Pretrain/Step": 5123, "Pretrain/Step Time": 9.036244535818696} +{"Pretrain/Learning Rate": 2.319746739820625e-05, "Pretrain/Loss": 2.071443796157837, "Pretrain/Loss (Raw)": 1.8887908458709717, "Pretrain/Step": 5124, "Pretrain/Step Time": 9.040647476911545} +{"Pretrain/Learning Rate": 2.3188999725649804e-05, "Pretrain/Loss": 2.070378303527832, "Pretrain/Loss (Raw)": 1.946567416191101, "Pretrain/Step": 5125, "Pretrain/Step Time": 9.04377856105566} +{"Pretrain/Learning Rate": 2.3180532261946437e-05, "Pretrain/Loss": 2.068600654602051, "Pretrain/Loss (Raw)": 2.1660053730010986, "Pretrain/Step": 5126, "Pretrain/Step Time": 9.04322149604559} +{"Pretrain/Learning Rate": 2.3172065008072663e-05, "Pretrain/Loss": 2.0655555725097656, "Pretrain/Loss (Raw)": 2.0957746505737305, "Pretrain/Step": 5127, "Pretrain/Step Time": 9.040755726397038} +{"Pretrain/Learning Rate": 2.3163597965004967e-05, "Pretrain/Loss": 2.06607723236084, "Pretrain/Loss (Raw)": 2.0015556812286377, "Pretrain/Step": 5128, "Pretrain/Step Time": 9.033378167077899} +{"Pretrain/Learning Rate": 2.315513113371981e-05, "Pretrain/Loss": 2.065638542175293, "Pretrain/Loss (Raw)": 1.9167311191558838, "Pretrain/Step": 5129, "Pretrain/Step Time": 8.548179047182202} +{"Pretrain/Learning Rate": 2.3146664515193616e-05, "Pretrain/Loss": 2.0632870197296143, "Pretrain/Loss (Raw)": 2.0435307025909424, "Pretrain/Step": 5130, "Pretrain/Step Time": 8.546458642929792} +{"Pretrain/Learning Rate": 2.3138198110402812e-05, "Pretrain/Loss": 2.0610833168029785, "Pretrain/Loss (Raw)": 1.9504361152648926, "Pretrain/Step": 5131, "Pretrain/Step Time": 8.555479317903519} +{"Pretrain/Learning Rate": 2.3129731920323765e-05, "Pretrain/Loss": 2.0656304359436035, "Pretrain/Loss (Raw)": 2.2843017578125, "Pretrain/Step": 5132, "Pretrain/Step Time": 8.55294968560338} +{"Pretrain/Learning Rate": 2.3121265945932862e-05, "Pretrain/Loss": 2.0662271976470947, "Pretrain/Loss (Raw)": 2.146397829055786, "Pretrain/Step": 5133, "Pretrain/Step Time": 8.559207417070866} +{"Pretrain/Learning Rate": 2.3112800188206404e-05, "Pretrain/Loss": 2.0661263465881348, "Pretrain/Loss (Raw)": 2.061152219772339, "Pretrain/Step": 5134, "Pretrain/Step Time": 8.555428368970752} +{"Pretrain/Learning Rate": 2.310433464812074e-05, "Pretrain/Loss": 2.0675201416015625, "Pretrain/Loss (Raw)": 1.9494372606277466, "Pretrain/Step": 5135, "Pretrain/Step Time": 8.556557606905699} +{"Pretrain/Learning Rate": 2.309586932665212e-05, "Pretrain/Loss": 2.069298267364502, "Pretrain/Loss (Raw)": 2.1708738803863525, "Pretrain/Step": 5136, "Pretrain/Step Time": 8.559226021170616} +{"Pretrain/Learning Rate": 2.3087404224776835e-05, "Pretrain/Loss": 2.068437099456787, "Pretrain/Loss (Raw)": 1.9301106929779053, "Pretrain/Step": 5137, "Pretrain/Step Time": 8.563737595453858} +{"Pretrain/Learning Rate": 2.307893934347109e-05, "Pretrain/Loss": 2.070249319076538, "Pretrain/Loss (Raw)": 2.4133031368255615, "Pretrain/Step": 5138, "Pretrain/Step Time": 8.553909808397293} +{"Pretrain/Learning Rate": 2.3070474683711125e-05, "Pretrain/Loss": 2.0702004432678223, "Pretrain/Loss (Raw)": 2.0124833583831787, "Pretrain/Step": 5139, "Pretrain/Step Time": 8.560916025191545} +{"Pretrain/Learning Rate": 2.306201024647311e-05, "Pretrain/Loss": 2.0716137886047363, "Pretrain/Loss (Raw)": 2.0736944675445557, "Pretrain/Step": 5140, "Pretrain/Step Time": 8.556713312864304} +{"Pretrain/Learning Rate": 2.3053546032733207e-05, "Pretrain/Loss": 2.0702672004699707, "Pretrain/Loss (Raw)": 2.0379669666290283, "Pretrain/Step": 5141, "Pretrain/Step Time": 8.55260269343853} +{"Pretrain/Learning Rate": 2.3045082043467554e-05, "Pretrain/Loss": 2.07010817527771, "Pretrain/Loss (Raw)": 2.0539751052856445, "Pretrain/Step": 5142, "Pretrain/Step Time": 8.55052706040442} +{"Pretrain/Learning Rate": 2.3036618279652232e-05, "Pretrain/Loss": 2.074047565460205, "Pretrain/Loss (Raw)": 2.5923101902008057, "Pretrain/Step": 5143, "Pretrain/Step Time": 8.558752983808517} +{"Pretrain/Learning Rate": 2.3028154742263362e-05, "Pretrain/Loss": 2.0733931064605713, "Pretrain/Loss (Raw)": 2.0093624591827393, "Pretrain/Step": 5144, "Pretrain/Step Time": 8.562104616314173} +{"Pretrain/Learning Rate": 2.3019691432276964e-05, "Pretrain/Loss": 2.0736019611358643, "Pretrain/Loss (Raw)": 2.1650054454803467, "Pretrain/Step": 5145, "Pretrain/Step Time": 8.555674666538835} +{"Pretrain/Learning Rate": 2.3011228350669096e-05, "Pretrain/Loss": 2.0742111206054688, "Pretrain/Loss (Raw)": 2.074260950088501, "Pretrain/Step": 5146, "Pretrain/Step Time": 8.551475282758474} +{"Pretrain/Learning Rate": 2.3002765498415728e-05, "Pretrain/Loss": 2.0762856006622314, "Pretrain/Loss (Raw)": 2.3131332397460938, "Pretrain/Step": 5147, "Pretrain/Step Time": 8.547903360798955} +{"Pretrain/Learning Rate": 2.2994302876492875e-05, "Pretrain/Loss": 2.0785129070281982, "Pretrain/Loss (Raw)": 2.2452731132507324, "Pretrain/Step": 5148, "Pretrain/Step Time": 8.555505312979221} +{"Pretrain/Learning Rate": 2.2985840485876444e-05, "Pretrain/Loss": 2.0780045986175537, "Pretrain/Loss (Raw)": 2.0105578899383545, "Pretrain/Step": 5149, "Pretrain/Step Time": 8.552138812839985} +{"Pretrain/Learning Rate": 2.2977378327542397e-05, "Pretrain/Loss": 2.0750770568847656, "Pretrain/Loss (Raw)": 1.9118776321411133, "Pretrain/Step": 5150, "Pretrain/Step Time": 8.555303128436208} +{"Pretrain/Learning Rate": 2.2968916402466604e-05, "Pretrain/Loss": 2.076622486114502, "Pretrain/Loss (Raw)": 2.2576706409454346, "Pretrain/Step": 5151, "Pretrain/Step Time": 8.546160725876689} +{"Pretrain/Learning Rate": 2.2960454711624945e-05, "Pretrain/Loss": 2.077868938446045, "Pretrain/Loss (Raw)": 2.104501247406006, "Pretrain/Step": 5152, "Pretrain/Step Time": 8.54992157407105} +{"Pretrain/Learning Rate": 2.2951993255993252e-05, "Pretrain/Loss": 2.077280282974243, "Pretrain/Loss (Raw)": 2.104609489440918, "Pretrain/Step": 5153, "Pretrain/Step Time": 8.543154709041119} +{"Pretrain/Learning Rate": 2.2943532036547356e-05, "Pretrain/Loss": 2.0772933959960938, "Pretrain/Loss (Raw)": 2.091531753540039, "Pretrain/Step": 5154, "Pretrain/Step Time": 8.550883879885077} +{"Pretrain/Learning Rate": 2.293507105426303e-05, "Pretrain/Loss": 2.076280117034912, "Pretrain/Loss (Raw)": 2.2561705112457275, "Pretrain/Step": 5155, "Pretrain/Step Time": 8.547668289393187} +{"Pretrain/Learning Rate": 2.2926610310116047e-05, "Pretrain/Loss": 2.0796761512756348, "Pretrain/Loss (Raw)": 2.4822282791137695, "Pretrain/Step": 5156, "Pretrain/Step Time": 8.552101707085967} +{"Pretrain/Learning Rate": 2.2918149805082127e-05, "Pretrain/Loss": 2.080420970916748, "Pretrain/Loss (Raw)": 1.964850664138794, "Pretrain/Step": 5157, "Pretrain/Step Time": 8.54672321304679} +{"Pretrain/Learning Rate": 2.2909689540136985e-05, "Pretrain/Loss": 2.078115463256836, "Pretrain/Loss (Raw)": 1.8613251447677612, "Pretrain/Step": 5158, "Pretrain/Step Time": 8.543383760377765} +{"Pretrain/Learning Rate": 2.290122951625629e-05, "Pretrain/Loss": 2.0758402347564697, "Pretrain/Loss (Raw)": 1.8580222129821777, "Pretrain/Step": 5159, "Pretrain/Step Time": 8.538772089406848} +{"Pretrain/Learning Rate": 2.2892769734415703e-05, "Pretrain/Loss": 2.078484058380127, "Pretrain/Loss (Raw)": 2.3298704624176025, "Pretrain/Step": 5160, "Pretrain/Step Time": 8.550080619752407} +{"Pretrain/Learning Rate": 2.2884310195590835e-05, "Pretrain/Loss": 2.077314853668213, "Pretrain/Loss (Raw)": 1.8493596315383911, "Pretrain/Step": 5161, "Pretrain/Step Time": 8.548139370977879} +{"Pretrain/Learning Rate": 2.2875850900757288e-05, "Pretrain/Loss": 2.0770344734191895, "Pretrain/Loss (Raw)": 2.03620982170105, "Pretrain/Step": 5162, "Pretrain/Step Time": 8.548979591578245} +{"Pretrain/Learning Rate": 2.2867391850890623e-05, "Pretrain/Loss": 2.077263593673706, "Pretrain/Loss (Raw)": 1.887660264968872, "Pretrain/Step": 5163, "Pretrain/Step Time": 8.544481799006462} +{"Pretrain/Learning Rate": 2.285893304696638e-05, "Pretrain/Loss": 2.0769004821777344, "Pretrain/Loss (Raw)": 1.9887765645980835, "Pretrain/Step": 5164, "Pretrain/Step Time": 8.545722551643848} +{"Pretrain/Learning Rate": 2.2850474489960065e-05, "Pretrain/Loss": 2.0758938789367676, "Pretrain/Loss (Raw)": 1.9930634498596191, "Pretrain/Step": 5165, "Pretrain/Step Time": 8.536633739247918} +{"Pretrain/Learning Rate": 2.2842016180847165e-05, "Pretrain/Loss": 2.0735626220703125, "Pretrain/Loss (Raw)": 2.0915935039520264, "Pretrain/Step": 5166, "Pretrain/Step Time": 8.540414247661829} +{"Pretrain/Learning Rate": 2.2833558120603122e-05, "Pretrain/Loss": 2.0718369483947754, "Pretrain/Loss (Raw)": 1.8591686487197876, "Pretrain/Step": 5167, "Pretrain/Step Time": 8.541643222793937} +{"Pretrain/Learning Rate": 2.282510031020337e-05, "Pretrain/Loss": 2.0701045989990234, "Pretrain/Loss (Raw)": 1.8178577423095703, "Pretrain/Step": 5168, "Pretrain/Step Time": 8.543840870261192} +{"Pretrain/Learning Rate": 2.2816642750623294e-05, "Pretrain/Loss": 2.071500062942505, "Pretrain/Loss (Raw)": 2.0296735763549805, "Pretrain/Step": 5169, "Pretrain/Step Time": 8.535168748348951} +{"Pretrain/Learning Rate": 2.280818544283827e-05, "Pretrain/Loss": 2.0692524909973145, "Pretrain/Loss (Raw)": 2.0891177654266357, "Pretrain/Step": 5170, "Pretrain/Step Time": 8.532589981332421} +{"Pretrain/Learning Rate": 2.279972838782362e-05, "Pretrain/Loss": 2.069831371307373, "Pretrain/Loss (Raw)": 2.2356550693511963, "Pretrain/Step": 5171, "Pretrain/Step Time": 8.532395297661424} +{"Pretrain/Learning Rate": 2.279127158655467e-05, "Pretrain/Loss": 2.070035696029663, "Pretrain/Loss (Raw)": 2.117973566055298, "Pretrain/Step": 5172, "Pretrain/Step Time": 8.532900005578995} +{"Pretrain/Learning Rate": 2.2782815040006683e-05, "Pretrain/Loss": 2.071382522583008, "Pretrain/Loss (Raw)": 2.1782562732696533, "Pretrain/Step": 5173, "Pretrain/Step Time": 8.533268854022026} +{"Pretrain/Learning Rate": 2.2774358749154917e-05, "Pretrain/Loss": 2.075345516204834, "Pretrain/Loss (Raw)": 2.1892058849334717, "Pretrain/Step": 5174, "Pretrain/Step Time": 8.5355604570359} +{"Pretrain/Learning Rate": 2.2765902714974585e-05, "Pretrain/Loss": 2.07497501373291, "Pretrain/Loss (Raw)": 2.0265655517578125, "Pretrain/Step": 5175, "Pretrain/Step Time": 8.536042772233486} +{"Pretrain/Learning Rate": 2.2757446938440886e-05, "Pretrain/Loss": 2.0757336616516113, "Pretrain/Loss (Raw)": 2.0276083946228027, "Pretrain/Step": 5176, "Pretrain/Step Time": 8.527408452704549} +{"Pretrain/Learning Rate": 2.274899142052896e-05, "Pretrain/Loss": 2.076340675354004, "Pretrain/Loss (Raw)": 2.1463565826416016, "Pretrain/Step": 5177, "Pretrain/Step Time": 8.526058267802} +{"Pretrain/Learning Rate": 2.2740536162213967e-05, "Pretrain/Loss": 2.0762546062469482, "Pretrain/Loss (Raw)": 2.0215389728546143, "Pretrain/Step": 5178, "Pretrain/Step Time": 8.53072864562273} +{"Pretrain/Learning Rate": 2.2732081164470973e-05, "Pretrain/Loss": 2.0741541385650635, "Pretrain/Loss (Raw)": 1.8888977766036987, "Pretrain/Step": 5179, "Pretrain/Step Time": 8.5320288464427} +{"Pretrain/Learning Rate": 2.2723626428275072e-05, "Pretrain/Loss": 2.0746920108795166, "Pretrain/Loss (Raw)": 1.961227536201477, "Pretrain/Step": 5180, "Pretrain/Step Time": 8.531319424510002} +{"Pretrain/Learning Rate": 2.2715171954601303e-05, "Pretrain/Loss": 2.07314395904541, "Pretrain/Loss (Raw)": 1.9351643323898315, "Pretrain/Step": 5181, "Pretrain/Step Time": 8.534791506826878} +{"Pretrain/Learning Rate": 2.2706717744424664e-05, "Pretrain/Loss": 2.0738446712493896, "Pretrain/Loss (Raw)": 2.20829176902771, "Pretrain/Step": 5182, "Pretrain/Step Time": 8.525946777313948} +{"Pretrain/Learning Rate": 2.2698263798720148e-05, "Pretrain/Loss": 2.0744376182556152, "Pretrain/Loss (Raw)": 2.149495840072632, "Pretrain/Step": 5183, "Pretrain/Step Time": 8.531295873224735} +{"Pretrain/Learning Rate": 2.268981011846269e-05, "Pretrain/Loss": 2.074751138687134, "Pretrain/Loss (Raw)": 2.172379493713379, "Pretrain/Step": 5184, "Pretrain/Step Time": 8.525777800008655} +{"Pretrain/Learning Rate": 2.2681356704627226e-05, "Pretrain/Loss": 2.075819969177246, "Pretrain/Loss (Raw)": 2.1841933727264404, "Pretrain/Step": 5185, "Pretrain/Step Time": 8.523892257362604} +{"Pretrain/Learning Rate": 2.267290355818862e-05, "Pretrain/Loss": 2.0768494606018066, "Pretrain/Loss (Raw)": 2.107217788696289, "Pretrain/Step": 5186, "Pretrain/Step Time": 8.529786758124828} +{"Pretrain/Learning Rate": 2.2664450680121754e-05, "Pretrain/Loss": 2.0778565406799316, "Pretrain/Loss (Raw)": 1.973523497581482, "Pretrain/Step": 5187, "Pretrain/Step Time": 8.526633273810148} +{"Pretrain/Learning Rate": 2.2655998071401424e-05, "Pretrain/Loss": 2.077454090118408, "Pretrain/Loss (Raw)": 2.131226062774658, "Pretrain/Step": 5188, "Pretrain/Step Time": 8.518363820388913} +{"Pretrain/Learning Rate": 2.264754573300246e-05, "Pretrain/Loss": 2.076019287109375, "Pretrain/Loss (Raw)": 1.9409871101379395, "Pretrain/Step": 5189, "Pretrain/Step Time": 8.519374774768949} +{"Pretrain/Learning Rate": 2.2639093665899592e-05, "Pretrain/Loss": 2.074519157409668, "Pretrain/Loss (Raw)": 1.9066470861434937, "Pretrain/Step": 5190, "Pretrain/Step Time": 8.520037084817886} +{"Pretrain/Learning Rate": 2.263064187106758e-05, "Pretrain/Loss": 2.0737781524658203, "Pretrain/Loss (Raw)": 1.9040980339050293, "Pretrain/Step": 5191, "Pretrain/Step Time": 8.516558399423957} +{"Pretrain/Learning Rate": 2.2622190349481102e-05, "Pretrain/Loss": 2.0733768939971924, "Pretrain/Loss (Raw)": 2.123430013656616, "Pretrain/Step": 5192, "Pretrain/Step Time": 8.524639142677188} +{"Pretrain/Learning Rate": 2.2613739102114846e-05, "Pretrain/Loss": 2.073638439178467, "Pretrain/Loss (Raw)": 1.956235408782959, "Pretrain/Step": 5193, "Pretrain/Step Time": 8.523288549855351} +{"Pretrain/Learning Rate": 2.2605288129943435e-05, "Pretrain/Loss": 2.072679042816162, "Pretrain/Loss (Raw)": 2.060277223587036, "Pretrain/Step": 5194, "Pretrain/Step Time": 8.52353742532432} +{"Pretrain/Learning Rate": 2.2596837433941486e-05, "Pretrain/Loss": 2.0716352462768555, "Pretrain/Loss (Raw)": 2.0204999446868896, "Pretrain/Step": 5195, "Pretrain/Step Time": 8.522218884900212} +{"Pretrain/Learning Rate": 2.2588387015083566e-05, "Pretrain/Loss": 2.0715713500976562, "Pretrain/Loss (Raw)": 2.0497214794158936, "Pretrain/Step": 5196, "Pretrain/Step Time": 8.533652311190963} +{"Pretrain/Learning Rate": 2.257993687434422e-05, "Pretrain/Loss": 2.0719196796417236, "Pretrain/Loss (Raw)": 2.1294169425964355, "Pretrain/Step": 5197, "Pretrain/Step Time": 8.532396217808127} +{"Pretrain/Learning Rate": 2.2571487012697952e-05, "Pretrain/Loss": 2.067868232727051, "Pretrain/Loss (Raw)": 1.6776031255722046, "Pretrain/Step": 5198, "Pretrain/Step Time": 8.539347575977445} +{"Pretrain/Learning Rate": 2.2563037431119254e-05, "Pretrain/Loss": 2.066873073577881, "Pretrain/Loss (Raw)": 1.9795904159545898, "Pretrain/Step": 5199, "Pretrain/Step Time": 8.533564424142241} +{"Pretrain/Learning Rate": 2.2554588130582556e-05, "Pretrain/Loss": 2.0675253868103027, "Pretrain/Loss (Raw)": 2.172605276107788, "Pretrain/Step": 5200, "Pretrain/Step Time": 8.534501168876886} +{"Pretrain/Learning Rate": 2.254613911206228e-05, "Pretrain/Loss": 2.066587209701538, "Pretrain/Loss (Raw)": 1.8154020309448242, "Pretrain/Step": 5201, "Pretrain/Step Time": 8.535934964194894} +{"Pretrain/Learning Rate": 2.25376903765328e-05, "Pretrain/Loss": 2.0658977031707764, "Pretrain/Loss (Raw)": 1.9651395082473755, "Pretrain/Step": 5202, "Pretrain/Step Time": 8.539907298982143} +{"Pretrain/Learning Rate": 2.252924192496848e-05, "Pretrain/Loss": 2.0656232833862305, "Pretrain/Loss (Raw)": 2.0467445850372314, "Pretrain/Step": 5203, "Pretrain/Step Time": 8.534108012914658} +{"Pretrain/Learning Rate": 2.2520793758343614e-05, "Pretrain/Loss": 2.0637855529785156, "Pretrain/Loss (Raw)": 1.8338593244552612, "Pretrain/Step": 5204, "Pretrain/Step Time": 8.537062108516693} +{"Pretrain/Learning Rate": 2.2512345877632498e-05, "Pretrain/Loss": 2.0635874271392822, "Pretrain/Loss (Raw)": 1.9510302543640137, "Pretrain/Step": 5205, "Pretrain/Step Time": 8.53781489469111} +{"Pretrain/Learning Rate": 2.2503898283809374e-05, "Pretrain/Loss": 2.0629522800445557, "Pretrain/Loss (Raw)": 2.0640954971313477, "Pretrain/Step": 5206, "Pretrain/Step Time": 8.542214788496494} +{"Pretrain/Learning Rate": 2.2495450977848467e-05, "Pretrain/Loss": 2.063504695892334, "Pretrain/Loss (Raw)": 1.9762951135635376, "Pretrain/Step": 5207, "Pretrain/Step Time": 8.541233386844397} +{"Pretrain/Learning Rate": 2.248700396072395e-05, "Pretrain/Loss": 2.0636751651763916, "Pretrain/Loss (Raw)": 2.109221935272217, "Pretrain/Step": 5208, "Pretrain/Step Time": 8.543578490614891} +{"Pretrain/Learning Rate": 2.2478557233409986e-05, "Pretrain/Loss": 2.061466932296753, "Pretrain/Loss (Raw)": 2.0817620754241943, "Pretrain/Step": 5209, "Pretrain/Step Time": 8.53951065801084} +{"Pretrain/Learning Rate": 2.2470110796880673e-05, "Pretrain/Loss": 2.0594992637634277, "Pretrain/Loss (Raw)": 1.8842850923538208, "Pretrain/Step": 5210, "Pretrain/Step Time": 8.545884354040027} +{"Pretrain/Learning Rate": 2.246166465211011e-05, "Pretrain/Loss": 2.0605783462524414, "Pretrain/Loss (Raw)": 2.17417049407959, "Pretrain/Step": 5211, "Pretrain/Step Time": 8.548167359083891} +{"Pretrain/Learning Rate": 2.245321880007234e-05, "Pretrain/Loss": 2.0600199699401855, "Pretrain/Loss (Raw)": 1.9609686136245728, "Pretrain/Step": 5212, "Pretrain/Step Time": 8.549035562202334} +{"Pretrain/Learning Rate": 2.244477324174138e-05, "Pretrain/Loss": 2.061239242553711, "Pretrain/Loss (Raw)": 2.233794927597046, "Pretrain/Step": 5213, "Pretrain/Step Time": 8.546580767259002} +{"Pretrain/Learning Rate": 2.2436327978091205e-05, "Pretrain/Loss": 2.0603084564208984, "Pretrain/Loss (Raw)": 1.9984586238861084, "Pretrain/Step": 5214, "Pretrain/Step Time": 8.548880496993661} +{"Pretrain/Learning Rate": 2.2427883010095775e-05, "Pretrain/Loss": 2.0615015029907227, "Pretrain/Loss (Raw)": 2.0274078845977783, "Pretrain/Step": 5215, "Pretrain/Step Time": 8.551659420132637} +{"Pretrain/Learning Rate": 2.241943833872899e-05, "Pretrain/Loss": 2.0623536109924316, "Pretrain/Loss (Raw)": 1.9201278686523438, "Pretrain/Step": 5216, "Pretrain/Step Time": 8.545723369345069} +{"Pretrain/Learning Rate": 2.2410993964964745e-05, "Pretrain/Loss": 2.061377763748169, "Pretrain/Loss (Raw)": 1.986038327217102, "Pretrain/Step": 5217, "Pretrain/Step Time": 8.546197354793549} +{"Pretrain/Learning Rate": 2.2402549889776864e-05, "Pretrain/Loss": 2.060504913330078, "Pretrain/Loss (Raw)": 2.0144693851470947, "Pretrain/Step": 5218, "Pretrain/Step Time": 8.543522221967578} +{"Pretrain/Learning Rate": 2.2394106114139183e-05, "Pretrain/Loss": 2.0607080459594727, "Pretrain/Loss (Raw)": 2.0429141521453857, "Pretrain/Step": 5219, "Pretrain/Step Time": 8.542287869378924} +{"Pretrain/Learning Rate": 2.2385662639025448e-05, "Pretrain/Loss": 2.060152530670166, "Pretrain/Loss (Raw)": 2.016098976135254, "Pretrain/Step": 5220, "Pretrain/Step Time": 8.545018756762147} +{"Pretrain/Learning Rate": 2.237721946540942e-05, "Pretrain/Loss": 2.0606141090393066, "Pretrain/Loss (Raw)": 2.0630292892456055, "Pretrain/Step": 5221, "Pretrain/Step Time": 8.549612862989306} +{"Pretrain/Learning Rate": 2.2368776594264813e-05, "Pretrain/Loss": 2.062514066696167, "Pretrain/Loss (Raw)": 2.3807411193847656, "Pretrain/Step": 5222, "Pretrain/Step Time": 8.545097393915057} +{"Pretrain/Learning Rate": 2.2360334026565277e-05, "Pretrain/Loss": 2.0631189346313477, "Pretrain/Loss (Raw)": 2.3002660274505615, "Pretrain/Step": 5223, "Pretrain/Step Time": 8.54505143687129} +{"Pretrain/Learning Rate": 2.2351891763284466e-05, "Pretrain/Loss": 2.063584089279175, "Pretrain/Loss (Raw)": 2.167177677154541, "Pretrain/Step": 5224, "Pretrain/Step Time": 8.545437356457114} +{"Pretrain/Learning Rate": 2.2343449805395973e-05, "Pretrain/Loss": 2.062573194503784, "Pretrain/Loss (Raw)": 2.0249111652374268, "Pretrain/Step": 5225, "Pretrain/Step Time": 8.54489147476852} +{"Pretrain/Learning Rate": 2.2335008153873375e-05, "Pretrain/Loss": 2.058699131011963, "Pretrain/Loss (Raw)": 2.09763765335083, "Pretrain/Step": 5226, "Pretrain/Step Time": 8.545254278928041} +{"Pretrain/Learning Rate": 2.2326566809690176e-05, "Pretrain/Loss": 2.0581252574920654, "Pretrain/Loss (Raw)": 1.990552544593811, "Pretrain/Step": 5227, "Pretrain/Step Time": 8.546321291476488} +{"Pretrain/Learning Rate": 2.2318125773819913e-05, "Pretrain/Loss": 2.0590689182281494, "Pretrain/Loss (Raw)": 2.1862611770629883, "Pretrain/Step": 5228, "Pretrain/Step Time": 8.543209919705987} +{"Pretrain/Learning Rate": 2.2309685047236002e-05, "Pretrain/Loss": 2.05849027633667, "Pretrain/Loss (Raw)": 1.967118740081787, "Pretrain/Step": 5229, "Pretrain/Step Time": 8.543197352439165} +{"Pretrain/Learning Rate": 2.2301244630911904e-05, "Pretrain/Loss": 2.0600509643554688, "Pretrain/Loss (Raw)": 2.0821194648742676, "Pretrain/Step": 5230, "Pretrain/Step Time": 8.546101668849587} +{"Pretrain/Learning Rate": 2.229280452582098e-05, "Pretrain/Loss": 2.0592753887176514, "Pretrain/Loss (Raw)": 1.9171332120895386, "Pretrain/Step": 5231, "Pretrain/Step Time": 8.548208925873041} +{"Pretrain/Learning Rate": 2.2284364732936608e-05, "Pretrain/Loss": 2.059574604034424, "Pretrain/Loss (Raw)": 2.1759774684906006, "Pretrain/Step": 5232, "Pretrain/Step Time": 8.544931441545486} +{"Pretrain/Learning Rate": 2.2275925253232073e-05, "Pretrain/Loss": 2.0585992336273193, "Pretrain/Loss (Raw)": 1.937082290649414, "Pretrain/Step": 5233, "Pretrain/Step Time": 8.554653082042933} +{"Pretrain/Learning Rate": 2.2267486087680695e-05, "Pretrain/Loss": 2.059579849243164, "Pretrain/Loss (Raw)": 2.127509593963623, "Pretrain/Step": 5234, "Pretrain/Step Time": 8.543256897479296} +{"Pretrain/Learning Rate": 2.2259047237255684e-05, "Pretrain/Loss": 2.0602662563323975, "Pretrain/Loss (Raw)": 2.080754280090332, "Pretrain/Step": 5235, "Pretrain/Step Time": 8.546376653015614} +{"Pretrain/Learning Rate": 2.2250608702930266e-05, "Pretrain/Loss": 2.0562641620635986, "Pretrain/Loss (Raw)": 2.0564355850219727, "Pretrain/Step": 5236, "Pretrain/Step Time": 8.548525389283895} +{"Pretrain/Learning Rate": 2.2242170485677606e-05, "Pretrain/Loss": 2.056333541870117, "Pretrain/Loss (Raw)": 2.162161350250244, "Pretrain/Step": 5237, "Pretrain/Step Time": 8.546091545373201} +{"Pretrain/Learning Rate": 2.223373258647084e-05, "Pretrain/Loss": 2.057682991027832, "Pretrain/Loss (Raw)": 2.138270378112793, "Pretrain/Step": 5238, "Pretrain/Step Time": 8.545515732839704} +{"Pretrain/Learning Rate": 2.222529500628307e-05, "Pretrain/Loss": 2.0591888427734375, "Pretrain/Loss (Raw)": 1.9270999431610107, "Pretrain/Step": 5239, "Pretrain/Step Time": 8.557034887373447} +{"Pretrain/Learning Rate": 2.2216857746087355e-05, "Pretrain/Loss": 2.058446168899536, "Pretrain/Loss (Raw)": 1.9450074434280396, "Pretrain/Step": 5240, "Pretrain/Step Time": 8.545936090871692} +{"Pretrain/Learning Rate": 2.2208420806856718e-05, "Pretrain/Loss": 2.057844400405884, "Pretrain/Loss (Raw)": 2.252201557159424, "Pretrain/Step": 5241, "Pretrain/Step Time": 8.54596402309835} +{"Pretrain/Learning Rate": 2.2199984189564148e-05, "Pretrain/Loss": 2.0578203201293945, "Pretrain/Loss (Raw)": 1.9865206480026245, "Pretrain/Step": 5242, "Pretrain/Step Time": 8.542791781947017} +{"Pretrain/Learning Rate": 2.2191547895182594e-05, "Pretrain/Loss": 2.059720516204834, "Pretrain/Loss (Raw)": 2.135467290878296, "Pretrain/Step": 5243, "Pretrain/Step Time": 8.541343307122588} +{"Pretrain/Learning Rate": 2.2183111924684975e-05, "Pretrain/Loss": 2.056504249572754, "Pretrain/Loss (Raw)": 1.873184084892273, "Pretrain/Step": 5244, "Pretrain/Step Time": 8.543711787089705} +{"Pretrain/Learning Rate": 2.2174676279044153e-05, "Pretrain/Loss": 2.0566492080688477, "Pretrain/Loss (Raw)": 2.2384302616119385, "Pretrain/Step": 5245, "Pretrain/Step Time": 8.54347651079297} +{"Pretrain/Learning Rate": 2.2166240959232985e-05, "Pretrain/Loss": 2.0589311122894287, "Pretrain/Loss (Raw)": 2.0192344188690186, "Pretrain/Step": 5246, "Pretrain/Step Time": 8.538081021979451} +{"Pretrain/Learning Rate": 2.215780596622426e-05, "Pretrain/Loss": 2.060945987701416, "Pretrain/Loss (Raw)": 2.293745279312134, "Pretrain/Step": 5247, "Pretrain/Step Time": 8.538337146863341} +{"Pretrain/Learning Rate": 2.2149371300990745e-05, "Pretrain/Loss": 2.0610551834106445, "Pretrain/Loss (Raw)": 2.1146786212921143, "Pretrain/Step": 5248, "Pretrain/Step Time": 8.536776630207896} +{"Pretrain/Learning Rate": 2.214093696450516e-05, "Pretrain/Loss": 2.0608201026916504, "Pretrain/Loss (Raw)": 2.0993216037750244, "Pretrain/Step": 5249, "Pretrain/Step Time": 8.539627522230148} +{"Pretrain/Learning Rate": 2.21325029577402e-05, "Pretrain/Loss": 2.059464454650879, "Pretrain/Loss (Raw)": 1.8731575012207031, "Pretrain/Step": 5250, "Pretrain/Step Time": 8.539425427094102} +{"Pretrain/Learning Rate": 2.2124069281668507e-05, "Pretrain/Loss": 2.0613205432891846, "Pretrain/Loss (Raw)": 2.139540433883667, "Pretrain/Step": 5251, "Pretrain/Step Time": 8.538477951660752} +{"Pretrain/Learning Rate": 2.2115635937262706e-05, "Pretrain/Loss": 2.062791347503662, "Pretrain/Loss (Raw)": 2.0770187377929688, "Pretrain/Step": 5252, "Pretrain/Step Time": 8.542614243924618} +{"Pretrain/Learning Rate": 2.210720292549535e-05, "Pretrain/Loss": 2.065222978591919, "Pretrain/Loss (Raw)": 2.2578442096710205, "Pretrain/Step": 5253, "Pretrain/Step Time": 8.539376830682158} +{"Pretrain/Learning Rate": 2.209877024733899e-05, "Pretrain/Loss": 2.0665602684020996, "Pretrain/Loss (Raw)": 2.3371756076812744, "Pretrain/Step": 5254, "Pretrain/Step Time": 8.54234953597188} +{"Pretrain/Learning Rate": 2.209033790376611e-05, "Pretrain/Loss": 2.0657262802124023, "Pretrain/Loss (Raw)": 1.989050030708313, "Pretrain/Step": 5255, "Pretrain/Step Time": 8.539808427914977} +{"Pretrain/Learning Rate": 2.2081905895749183e-05, "Pretrain/Loss": 2.0670180320739746, "Pretrain/Loss (Raw)": 2.166863203048706, "Pretrain/Step": 5256, "Pretrain/Step Time": 8.544523891061544} +{"Pretrain/Learning Rate": 2.207347422426061e-05, "Pretrain/Loss": 2.067563056945801, "Pretrain/Loss (Raw)": 1.986517071723938, "Pretrain/Step": 5257, "Pretrain/Step Time": 8.544615345075727} +{"Pretrain/Learning Rate": 2.206504289027279e-05, "Pretrain/Loss": 2.068460464477539, "Pretrain/Loss (Raw)": 2.1584043502807617, "Pretrain/Step": 5258, "Pretrain/Step Time": 8.548413589596748} +{"Pretrain/Learning Rate": 2.2056611894758038e-05, "Pretrain/Loss": 2.069174289703369, "Pretrain/Loss (Raw)": 2.041808605194092, "Pretrain/Step": 5259, "Pretrain/Step Time": 8.535513481125236} +{"Pretrain/Learning Rate": 2.204818123868869e-05, "Pretrain/Loss": 2.067725896835327, "Pretrain/Loss (Raw)": 2.0989067554473877, "Pretrain/Step": 5260, "Pretrain/Step Time": 8.541828585788608} +{"Pretrain/Learning Rate": 2.203975092303697e-05, "Pretrain/Loss": 2.0665388107299805, "Pretrain/Loss (Raw)": 1.9944273233413696, "Pretrain/Step": 5261, "Pretrain/Step Time": 8.535059031099081} +{"Pretrain/Learning Rate": 2.2031320948775135e-05, "Pretrain/Loss": 2.0676183700561523, "Pretrain/Loss (Raw)": 2.199371099472046, "Pretrain/Step": 5262, "Pretrain/Step Time": 8.53116456978023} +{"Pretrain/Learning Rate": 2.2022891316875362e-05, "Pretrain/Loss": 2.0680384635925293, "Pretrain/Loss (Raw)": 2.0031893253326416, "Pretrain/Step": 5263, "Pretrain/Step Time": 8.53764925710857} +{"Pretrain/Learning Rate": 2.201446202830978e-05, "Pretrain/Loss": 2.067272424697876, "Pretrain/Loss (Raw)": 2.072798490524292, "Pretrain/Step": 5264, "Pretrain/Step Time": 8.535797769203782} +{"Pretrain/Learning Rate": 2.2006033084050516e-05, "Pretrain/Loss": 2.0701074600219727, "Pretrain/Loss (Raw)": 2.2930331230163574, "Pretrain/Step": 5265, "Pretrain/Step Time": 8.530517041683197} +{"Pretrain/Learning Rate": 2.1997604485069614e-05, "Pretrain/Loss": 2.0668444633483887, "Pretrain/Loss (Raw)": 1.9956177473068237, "Pretrain/Step": 5266, "Pretrain/Step Time": 8.534403508529067} +{"Pretrain/Learning Rate": 2.1989176232339122e-05, "Pretrain/Loss": 2.0677497386932373, "Pretrain/Loss (Raw)": 2.1283674240112305, "Pretrain/Step": 5267, "Pretrain/Step Time": 8.530613493174314} +{"Pretrain/Learning Rate": 2.1980748326831002e-05, "Pretrain/Loss": 2.066452980041504, "Pretrain/Loss (Raw)": 1.907701015472412, "Pretrain/Step": 5268, "Pretrain/Step Time": 8.529976453632116} +{"Pretrain/Learning Rate": 2.1972320769517226e-05, "Pretrain/Loss": 2.0667552947998047, "Pretrain/Loss (Raw)": 2.076655387878418, "Pretrain/Step": 5269, "Pretrain/Step Time": 8.540504537522793} +{"Pretrain/Learning Rate": 2.1963893561369672e-05, "Pretrain/Loss": 2.066868782043457, "Pretrain/Loss (Raw)": 2.068525552749634, "Pretrain/Step": 5270, "Pretrain/Step Time": 8.539315644651651} +{"Pretrain/Learning Rate": 2.1955466703360232e-05, "Pretrain/Loss": 2.0634818077087402, "Pretrain/Loss (Raw)": 2.1587560176849365, "Pretrain/Step": 5271, "Pretrain/Step Time": 8.530951702967286} +{"Pretrain/Learning Rate": 2.1947040196460704e-05, "Pretrain/Loss": 2.0634357929229736, "Pretrain/Loss (Raw)": 2.0034778118133545, "Pretrain/Step": 5272, "Pretrain/Step Time": 8.529892805963755} +{"Pretrain/Learning Rate": 2.1938614041642903e-05, "Pretrain/Loss": 2.063469409942627, "Pretrain/Loss (Raw)": 2.169329881668091, "Pretrain/Step": 5273, "Pretrain/Step Time": 8.530491031706333} +{"Pretrain/Learning Rate": 2.1930188239878537e-05, "Pretrain/Loss": 2.0628674030303955, "Pretrain/Loss (Raw)": 1.9971734285354614, "Pretrain/Step": 5274, "Pretrain/Step Time": 8.528370764106512} +{"Pretrain/Learning Rate": 2.192176279213935e-05, "Pretrain/Loss": 2.060037612915039, "Pretrain/Loss (Raw)": 1.9509207010269165, "Pretrain/Step": 5275, "Pretrain/Step Time": 8.536368122324347} +{"Pretrain/Learning Rate": 2.191333769939696e-05, "Pretrain/Loss": 2.0573360919952393, "Pretrain/Loss (Raw)": 1.8995052576065063, "Pretrain/Step": 5276, "Pretrain/Step Time": 8.53026138804853} +{"Pretrain/Learning Rate": 2.1904912962623035e-05, "Pretrain/Loss": 2.055079460144043, "Pretrain/Loss (Raw)": 1.7216867208480835, "Pretrain/Step": 5277, "Pretrain/Step Time": 8.535012412816286} +{"Pretrain/Learning Rate": 2.1896488582789117e-05, "Pretrain/Loss": 2.054652214050293, "Pretrain/Loss (Raw)": 1.8572193384170532, "Pretrain/Step": 5278, "Pretrain/Step Time": 8.53188001550734} +{"Pretrain/Learning Rate": 2.1888064560866765e-05, "Pretrain/Loss": 2.054316759109497, "Pretrain/Loss (Raw)": 2.2146990299224854, "Pretrain/Step": 5279, "Pretrain/Step Time": 8.53210056759417} +{"Pretrain/Learning Rate": 2.187964089782747e-05, "Pretrain/Loss": 2.054638385772705, "Pretrain/Loss (Raw)": 2.145674467086792, "Pretrain/Step": 5280, "Pretrain/Step Time": 8.531085165217519} +{"Pretrain/Learning Rate": 2.187121759464269e-05, "Pretrain/Loss": 2.055429458618164, "Pretrain/Loss (Raw)": 2.2058892250061035, "Pretrain/Step": 5281, "Pretrain/Step Time": 8.538606537505984} +{"Pretrain/Learning Rate": 2.1862794652283837e-05, "Pretrain/Loss": 2.0545859336853027, "Pretrain/Loss (Raw)": 1.9835244417190552, "Pretrain/Step": 5282, "Pretrain/Step Time": 8.529354831203818} +{"Pretrain/Learning Rate": 2.1854372071722297e-05, "Pretrain/Loss": 2.052849531173706, "Pretrain/Loss (Raw)": 2.0339202880859375, "Pretrain/Step": 5283, "Pretrain/Step Time": 8.535475295037031} +{"Pretrain/Learning Rate": 2.1845949853929382e-05, "Pretrain/Loss": 2.0497937202453613, "Pretrain/Loss (Raw)": 2.091094732284546, "Pretrain/Step": 5284, "Pretrain/Step Time": 8.53080214932561} +{"Pretrain/Learning Rate": 2.1837527999876396e-05, "Pretrain/Loss": 2.054293632507324, "Pretrain/Loss (Raw)": 2.5408146381378174, "Pretrain/Step": 5285, "Pretrain/Step Time": 8.531578429043293} +{"Pretrain/Learning Rate": 2.1829106510534585e-05, "Pretrain/Loss": 2.055799961090088, "Pretrain/Loss (Raw)": 2.054164409637451, "Pretrain/Step": 5286, "Pretrain/Step Time": 8.537222065031528} +{"Pretrain/Learning Rate": 2.1820685386875155e-05, "Pretrain/Loss": 2.0577659606933594, "Pretrain/Loss (Raw)": 2.109663486480713, "Pretrain/Step": 5287, "Pretrain/Step Time": 8.543336171656847} +{"Pretrain/Learning Rate": 2.1812264629869257e-05, "Pretrain/Loss": 2.054464340209961, "Pretrain/Loss (Raw)": 1.907270908355713, "Pretrain/Step": 5288, "Pretrain/Step Time": 8.532897874712944} +{"Pretrain/Learning Rate": 2.1803844240488036e-05, "Pretrain/Loss": 2.0566487312316895, "Pretrain/Loss (Raw)": 2.128933906555176, "Pretrain/Step": 5289, "Pretrain/Step Time": 8.541406612843275} +{"Pretrain/Learning Rate": 2.179542421970255e-05, "Pretrain/Loss": 2.0560507774353027, "Pretrain/Loss (Raw)": 1.9597039222717285, "Pretrain/Step": 5290, "Pretrain/Step Time": 8.540968807414174} +{"Pretrain/Learning Rate": 2.1787004568483846e-05, "Pretrain/Loss": 2.059157133102417, "Pretrain/Loss (Raw)": 2.2852602005004883, "Pretrain/Step": 5291, "Pretrain/Step Time": 8.539123624563217} +{"Pretrain/Learning Rate": 2.1778585287802914e-05, "Pretrain/Loss": 2.060645580291748, "Pretrain/Loss (Raw)": 2.1792984008789062, "Pretrain/Step": 5292, "Pretrain/Step Time": 8.536753568798304} +{"Pretrain/Learning Rate": 2.1770166378630708e-05, "Pretrain/Loss": 2.061340808868408, "Pretrain/Loss (Raw)": 2.082031011581421, "Pretrain/Step": 5293, "Pretrain/Step Time": 8.546957064419985} +{"Pretrain/Learning Rate": 2.1761747841938133e-05, "Pretrain/Loss": 2.0606675148010254, "Pretrain/Loss (Raw)": 2.005430221557617, "Pretrain/Step": 5294, "Pretrain/Step Time": 8.541042385622859} +{"Pretrain/Learning Rate": 2.175332967869606e-05, "Pretrain/Loss": 2.062190532684326, "Pretrain/Loss (Raw)": 2.054115056991577, "Pretrain/Step": 5295, "Pretrain/Step Time": 8.544613698497415} +{"Pretrain/Learning Rate": 2.17449118898753e-05, "Pretrain/Loss": 2.0636510848999023, "Pretrain/Loss (Raw)": 2.0048344135284424, "Pretrain/Step": 5296, "Pretrain/Step Time": 8.54486239515245} +{"Pretrain/Learning Rate": 2.1736494476446646e-05, "Pretrain/Loss": 2.065103054046631, "Pretrain/Loss (Raw)": 2.215512752532959, "Pretrain/Step": 5297, "Pretrain/Step Time": 8.544973783195019} +{"Pretrain/Learning Rate": 2.172807743938082e-05, "Pretrain/Loss": 2.0648727416992188, "Pretrain/Loss (Raw)": 2.059617280960083, "Pretrain/Step": 5298, "Pretrain/Step Time": 8.546233491972089} +{"Pretrain/Learning Rate": 2.171966077964853e-05, "Pretrain/Loss": 2.0651636123657227, "Pretrain/Loss (Raw)": 2.272887706756592, "Pretrain/Step": 5299, "Pretrain/Step Time": 8.548683606088161} +{"Pretrain/Learning Rate": 2.1711244498220412e-05, "Pretrain/Loss": 2.0631675720214844, "Pretrain/Loss (Raw)": 1.8625062704086304, "Pretrain/Step": 5300, "Pretrain/Step Time": 8.54203829728067} +{"Pretrain/Learning Rate": 2.170282859606708e-05, "Pretrain/Loss": 2.062032699584961, "Pretrain/Loss (Raw)": 2.0330002307891846, "Pretrain/Step": 5301, "Pretrain/Step Time": 8.539916483685374} +{"Pretrain/Learning Rate": 2.1694413074159082e-05, "Pretrain/Loss": 2.0609426498413086, "Pretrain/Loss (Raw)": 2.0496294498443604, "Pretrain/Step": 5302, "Pretrain/Step Time": 8.542309921234846} +{"Pretrain/Learning Rate": 2.1685997933466948e-05, "Pretrain/Loss": 2.064347743988037, "Pretrain/Loss (Raw)": 2.4624316692352295, "Pretrain/Step": 5303, "Pretrain/Step Time": 8.541097212582827} +{"Pretrain/Learning Rate": 2.167758317496115e-05, "Pretrain/Loss": 2.0649921894073486, "Pretrain/Loss (Raw)": 2.110109806060791, "Pretrain/Step": 5304, "Pretrain/Step Time": 8.53803576529026} +{"Pretrain/Learning Rate": 2.1669168799612118e-05, "Pretrain/Loss": 2.061962127685547, "Pretrain/Loss (Raw)": 1.758488416671753, "Pretrain/Step": 5305, "Pretrain/Step Time": 8.54456514492631} +{"Pretrain/Learning Rate": 2.1660754808390235e-05, "Pretrain/Loss": 2.0644094944000244, "Pretrain/Loss (Raw)": 2.334824562072754, "Pretrain/Step": 5306, "Pretrain/Step Time": 8.53948337957263} +{"Pretrain/Learning Rate": 2.1652341202265838e-05, "Pretrain/Loss": 2.0654091835021973, "Pretrain/Loss (Raw)": 2.0168299674987793, "Pretrain/Step": 5307, "Pretrain/Step Time": 8.539675695821643} +{"Pretrain/Learning Rate": 2.1643927982209233e-05, "Pretrain/Loss": 2.0658345222473145, "Pretrain/Loss (Raw)": 2.01570463180542, "Pretrain/Step": 5308, "Pretrain/Step Time": 8.539334850385785} +{"Pretrain/Learning Rate": 2.1635515149190665e-05, "Pretrain/Loss": 2.0677309036254883, "Pretrain/Loss (Raw)": 2.177870988845825, "Pretrain/Step": 5309, "Pretrain/Step Time": 8.535683669149876} +{"Pretrain/Learning Rate": 2.1627102704180353e-05, "Pretrain/Loss": 2.0669474601745605, "Pretrain/Loss (Raw)": 2.108036518096924, "Pretrain/Step": 5310, "Pretrain/Step Time": 8.533907746896148} +{"Pretrain/Learning Rate": 2.1618690648148435e-05, "Pretrain/Loss": 2.0666537284851074, "Pretrain/Loss (Raw)": 2.1119019985198975, "Pretrain/Step": 5311, "Pretrain/Step Time": 8.540004456415772} +{"Pretrain/Learning Rate": 2.161027898206506e-05, "Pretrain/Loss": 2.0648610591888428, "Pretrain/Loss (Raw)": 1.9429230690002441, "Pretrain/Step": 5312, "Pretrain/Step Time": 8.537552274763584} +{"Pretrain/Learning Rate": 2.160186770690027e-05, "Pretrain/Loss": 2.063920736312866, "Pretrain/Loss (Raw)": 2.063822031021118, "Pretrain/Step": 5313, "Pretrain/Step Time": 8.539453711360693} +{"Pretrain/Learning Rate": 2.1593456823624127e-05, "Pretrain/Loss": 2.0632829666137695, "Pretrain/Loss (Raw)": 2.0255773067474365, "Pretrain/Step": 5314, "Pretrain/Step Time": 8.539820836856961} +{"Pretrain/Learning Rate": 2.1585046333206573e-05, "Pretrain/Loss": 2.0641493797302246, "Pretrain/Loss (Raw)": 2.084429979324341, "Pretrain/Step": 5315, "Pretrain/Step Time": 8.539925580844283} +{"Pretrain/Learning Rate": 2.157663623661759e-05, "Pretrain/Loss": 2.0617852210998535, "Pretrain/Loss (Raw)": 1.8286054134368896, "Pretrain/Step": 5316, "Pretrain/Step Time": 8.539152584969997} +{"Pretrain/Learning Rate": 2.156822653482703e-05, "Pretrain/Loss": 2.0610203742980957, "Pretrain/Loss (Raw)": 1.843126654624939, "Pretrain/Step": 5317, "Pretrain/Step Time": 8.547697484493256} +{"Pretrain/Learning Rate": 2.155981722880477e-05, "Pretrain/Loss": 2.0630831718444824, "Pretrain/Loss (Raw)": 2.1706206798553467, "Pretrain/Step": 5318, "Pretrain/Step Time": 8.541952980682254} +{"Pretrain/Learning Rate": 2.1551408319520588e-05, "Pretrain/Loss": 2.0639567375183105, "Pretrain/Loss (Raw)": 2.0159544944763184, "Pretrain/Step": 5319, "Pretrain/Step Time": 8.5458153616637} +{"Pretrain/Learning Rate": 2.1542999807944258e-05, "Pretrain/Loss": 2.062837600708008, "Pretrain/Loss (Raw)": 1.980191707611084, "Pretrain/Step": 5320, "Pretrain/Step Time": 8.539052555337548} +{"Pretrain/Learning Rate": 2.1534591695045473e-05, "Pretrain/Loss": 2.063610076904297, "Pretrain/Loss (Raw)": 2.05509614944458, "Pretrain/Step": 5321, "Pretrain/Step Time": 8.53895009867847} +{"Pretrain/Learning Rate": 2.1526183981793908e-05, "Pretrain/Loss": 2.066138744354248, "Pretrain/Loss (Raw)": 2.3839685916900635, "Pretrain/Step": 5322, "Pretrain/Step Time": 8.542465658858418} +{"Pretrain/Learning Rate": 2.1517776669159166e-05, "Pretrain/Loss": 2.0672075748443604, "Pretrain/Loss (Raw)": 2.1572842597961426, "Pretrain/Step": 5323, "Pretrain/Step Time": 8.550357749685645} +{"Pretrain/Learning Rate": 2.150936975811084e-05, "Pretrain/Loss": 2.0679593086242676, "Pretrain/Loss (Raw)": 2.1459572315216064, "Pretrain/Step": 5324, "Pretrain/Step Time": 8.538513291627169} +{"Pretrain/Learning Rate": 2.1500963249618433e-05, "Pretrain/Loss": 2.066897392272949, "Pretrain/Loss (Raw)": 1.9934724569320679, "Pretrain/Step": 5325, "Pretrain/Step Time": 8.539410565048456} +{"Pretrain/Learning Rate": 2.149255714465144e-05, "Pretrain/Loss": 2.069841146469116, "Pretrain/Loss (Raw)": 2.054422378540039, "Pretrain/Step": 5326, "Pretrain/Step Time": 8.534066781401634} +{"Pretrain/Learning Rate": 2.1484151444179273e-05, "Pretrain/Loss": 2.0686144828796387, "Pretrain/Loss (Raw)": 1.8225743770599365, "Pretrain/Step": 5327, "Pretrain/Step Time": 8.535195957869291} +{"Pretrain/Learning Rate": 2.147574614917134e-05, "Pretrain/Loss": 2.0672998428344727, "Pretrain/Loss (Raw)": 2.004352569580078, "Pretrain/Step": 5328, "Pretrain/Step Time": 8.532677406445146} +{"Pretrain/Learning Rate": 2.146734126059696e-05, "Pretrain/Loss": 2.0697474479675293, "Pretrain/Loss (Raw)": 2.1286752223968506, "Pretrain/Step": 5329, "Pretrain/Step Time": 8.54428586922586} +{"Pretrain/Learning Rate": 2.1458936779425438e-05, "Pretrain/Loss": 2.070544719696045, "Pretrain/Loss (Raw)": 2.067190647125244, "Pretrain/Step": 5330, "Pretrain/Step Time": 8.54119699075818} +{"Pretrain/Learning Rate": 2.145053270662601e-05, "Pretrain/Loss": 2.072307825088501, "Pretrain/Loss (Raw)": 2.2724215984344482, "Pretrain/Step": 5331, "Pretrain/Step Time": 8.539845066145062} +{"Pretrain/Learning Rate": 2.1442129043167874e-05, "Pretrain/Loss": 2.0736775398254395, "Pretrain/Loss (Raw)": 2.009162425994873, "Pretrain/Step": 5332, "Pretrain/Step Time": 8.540452705696225} +{"Pretrain/Learning Rate": 2.1433725790020186e-05, "Pretrain/Loss": 2.0756168365478516, "Pretrain/Loss (Raw)": 2.19929575920105, "Pretrain/Step": 5333, "Pretrain/Step Time": 8.543861709535122} +{"Pretrain/Learning Rate": 2.1425322948152042e-05, "Pretrain/Loss": 2.076263904571533, "Pretrain/Loss (Raw)": 2.1469132900238037, "Pretrain/Step": 5334, "Pretrain/Step Time": 8.53765319287777} +{"Pretrain/Learning Rate": 2.14169205185325e-05, "Pretrain/Loss": 2.077472448348999, "Pretrain/Loss (Raw)": 2.130971908569336, "Pretrain/Step": 5335, "Pretrain/Step Time": 8.544973082840443} +{"Pretrain/Learning Rate": 2.140851850213057e-05, "Pretrain/Loss": 2.0783705711364746, "Pretrain/Loss (Raw)": 2.2241714000701904, "Pretrain/Step": 5336, "Pretrain/Step Time": 8.543425494804978} +{"Pretrain/Learning Rate": 2.1400116899915205e-05, "Pretrain/Loss": 2.077441453933716, "Pretrain/Loss (Raw)": 1.9628535509109497, "Pretrain/Step": 5337, "Pretrain/Step Time": 8.542718220502138} +{"Pretrain/Learning Rate": 2.1391715712855327e-05, "Pretrain/Loss": 2.076634168624878, "Pretrain/Loss (Raw)": 1.7809501886367798, "Pretrain/Step": 5338, "Pretrain/Step Time": 8.535364648327231} +{"Pretrain/Learning Rate": 2.1383314941919795e-05, "Pretrain/Loss": 2.0752382278442383, "Pretrain/Loss (Raw)": 1.9955081939697266, "Pretrain/Step": 5339, "Pretrain/Step Time": 8.534379305317998} +{"Pretrain/Learning Rate": 2.1374914588077427e-05, "Pretrain/Loss": 2.074662923812866, "Pretrain/Loss (Raw)": 1.887303113937378, "Pretrain/Step": 5340, "Pretrain/Step Time": 8.53654782101512} +{"Pretrain/Learning Rate": 2.1366514652296987e-05, "Pretrain/Loss": 2.0722177028656006, "Pretrain/Loss (Raw)": 1.9208184480667114, "Pretrain/Step": 5341, "Pretrain/Step Time": 8.543194765225053} +{"Pretrain/Learning Rate": 2.135811513554721e-05, "Pretrain/Loss": 2.071542739868164, "Pretrain/Loss (Raw)": 1.9120509624481201, "Pretrain/Step": 5342, "Pretrain/Step Time": 8.539584148675203} +{"Pretrain/Learning Rate": 2.1349716038796742e-05, "Pretrain/Loss": 2.0709102153778076, "Pretrain/Loss (Raw)": 1.9464432001113892, "Pretrain/Step": 5343, "Pretrain/Step Time": 8.532708678394556} +{"Pretrain/Learning Rate": 2.1341317363014223e-05, "Pretrain/Loss": 2.0697569847106934, "Pretrain/Loss (Raw)": 1.7725200653076172, "Pretrain/Step": 5344, "Pretrain/Step Time": 8.534517887979746} +{"Pretrain/Learning Rate": 2.133291910916823e-05, "Pretrain/Loss": 2.070937395095825, "Pretrain/Loss (Raw)": 2.137131452560425, "Pretrain/Step": 5345, "Pretrain/Step Time": 8.531435161828995} +{"Pretrain/Learning Rate": 2.1324521278227287e-05, "Pretrain/Loss": 2.0706539154052734, "Pretrain/Loss (Raw)": 1.9781790971755981, "Pretrain/Step": 5346, "Pretrain/Step Time": 8.532467063516378} +{"Pretrain/Learning Rate": 2.131612387115987e-05, "Pretrain/Loss": 2.070158004760742, "Pretrain/Loss (Raw)": 1.9794694185256958, "Pretrain/Step": 5347, "Pretrain/Step Time": 8.548197392374277} +{"Pretrain/Learning Rate": 2.13077268889344e-05, "Pretrain/Loss": 2.0694832801818848, "Pretrain/Loss (Raw)": 1.9297019243240356, "Pretrain/Step": 5348, "Pretrain/Step Time": 8.545850494876504} +{"Pretrain/Learning Rate": 2.1299330332519273e-05, "Pretrain/Loss": 2.0694236755371094, "Pretrain/Loss (Raw)": 2.0553839206695557, "Pretrain/Step": 5349, "Pretrain/Step Time": 8.538826007395983} +{"Pretrain/Learning Rate": 2.1290934202882805e-05, "Pretrain/Loss": 2.0674333572387695, "Pretrain/Loss (Raw)": 2.1259868144989014, "Pretrain/Step": 5350, "Pretrain/Step Time": 8.53877635858953} +{"Pretrain/Learning Rate": 2.128253850099329e-05, "Pretrain/Loss": 2.0667223930358887, "Pretrain/Loss (Raw)": 2.2092785835266113, "Pretrain/Step": 5351, "Pretrain/Step Time": 8.539971506223083} +{"Pretrain/Learning Rate": 2.1274143227818938e-05, "Pretrain/Loss": 2.0676186084747314, "Pretrain/Loss (Raw)": 2.2818875312805176, "Pretrain/Step": 5352, "Pretrain/Step Time": 8.537244884297252} +{"Pretrain/Learning Rate": 2.126574838432796e-05, "Pretrain/Loss": 2.0676755905151367, "Pretrain/Loss (Raw)": 2.0322206020355225, "Pretrain/Step": 5353, "Pretrain/Step Time": 8.54706197604537} +{"Pretrain/Learning Rate": 2.1257353971488463e-05, "Pretrain/Loss": 2.068293333053589, "Pretrain/Loss (Raw)": 2.1766936779022217, "Pretrain/Step": 5354, "Pretrain/Step Time": 8.54440912604332} +{"Pretrain/Learning Rate": 2.1248959990268554e-05, "Pretrain/Loss": 2.068612575531006, "Pretrain/Loss (Raw)": 2.031440019607544, "Pretrain/Step": 5355, "Pretrain/Step Time": 8.540752470493317} +{"Pretrain/Learning Rate": 2.1240566441636238e-05, "Pretrain/Loss": 2.0665102005004883, "Pretrain/Loss (Raw)": 1.9171324968338013, "Pretrain/Step": 5356, "Pretrain/Step Time": 8.541455872356892} +{"Pretrain/Learning Rate": 2.1232173326559535e-05, "Pretrain/Loss": 2.0663866996765137, "Pretrain/Loss (Raw)": 1.9513241052627563, "Pretrain/Step": 5357, "Pretrain/Step Time": 8.540590349584818} +{"Pretrain/Learning Rate": 2.122378064600634e-05, "Pretrain/Loss": 2.066227912902832, "Pretrain/Loss (Raw)": 2.0617942810058594, "Pretrain/Step": 5358, "Pretrain/Step Time": 8.536663573235273} +{"Pretrain/Learning Rate": 2.121538840094457e-05, "Pretrain/Loss": 2.0688412189483643, "Pretrain/Loss (Raw)": 2.251631498336792, "Pretrain/Step": 5359, "Pretrain/Step Time": 8.541725784540176} +{"Pretrain/Learning Rate": 2.120699659234203e-05, "Pretrain/Loss": 2.067960739135742, "Pretrain/Loss (Raw)": 2.063260555267334, "Pretrain/Step": 5360, "Pretrain/Step Time": 8.541988205164671} +{"Pretrain/Learning Rate": 2.1198605221166528e-05, "Pretrain/Loss": 2.069772243499756, "Pretrain/Loss (Raw)": 2.1689670085906982, "Pretrain/Step": 5361, "Pretrain/Step Time": 8.54156923852861} +{"Pretrain/Learning Rate": 2.1190214288385778e-05, "Pretrain/Loss": 2.0697288513183594, "Pretrain/Loss (Raw)": 2.1219704151153564, "Pretrain/Step": 5362, "Pretrain/Step Time": 8.545836454257369} +{"Pretrain/Learning Rate": 2.1181823794967472e-05, "Pretrain/Loss": 2.0705413818359375, "Pretrain/Loss (Raw)": 2.184720516204834, "Pretrain/Step": 5363, "Pretrain/Step Time": 8.54529276676476} +{"Pretrain/Learning Rate": 2.1173433741879234e-05, "Pretrain/Loss": 2.068838119506836, "Pretrain/Loss (Raw)": 1.8384190797805786, "Pretrain/Step": 5364, "Pretrain/Step Time": 8.541313331574202} +{"Pretrain/Learning Rate": 2.116504413008865e-05, "Pretrain/Loss": 2.068681001663208, "Pretrain/Loss (Raw)": 2.1420676708221436, "Pretrain/Step": 5365, "Pretrain/Step Time": 8.544868368655443} +{"Pretrain/Learning Rate": 2.1156654960563248e-05, "Pretrain/Loss": 2.067535400390625, "Pretrain/Loss (Raw)": 1.9916515350341797, "Pretrain/Step": 5366, "Pretrain/Step Time": 8.546033566817641} +{"Pretrain/Learning Rate": 2.1148266234270508e-05, "Pretrain/Loss": 2.068849563598633, "Pretrain/Loss (Raw)": 2.095276355743408, "Pretrain/Step": 5367, "Pretrain/Step Time": 8.539059469476342} +{"Pretrain/Learning Rate": 2.1139877952177852e-05, "Pretrain/Loss": 2.0694499015808105, "Pretrain/Loss (Raw)": 2.021871328353882, "Pretrain/Step": 5368, "Pretrain/Step Time": 8.542134651914239} +{"Pretrain/Learning Rate": 2.1131490115252668e-05, "Pretrain/Loss": 2.068452835083008, "Pretrain/Loss (Raw)": 2.1245501041412354, "Pretrain/Step": 5369, "Pretrain/Step Time": 8.543289577588439} +{"Pretrain/Learning Rate": 2.1123102724462262e-05, "Pretrain/Loss": 2.068084239959717, "Pretrain/Loss (Raw)": 1.9393810033798218, "Pretrain/Step": 5370, "Pretrain/Step Time": 8.537420753389597} +{"Pretrain/Learning Rate": 2.1114715780773924e-05, "Pretrain/Loss": 2.0668511390686035, "Pretrain/Loss (Raw)": 1.9776405096054077, "Pretrain/Step": 5371, "Pretrain/Step Time": 8.54041668586433} +{"Pretrain/Learning Rate": 2.110632928515487e-05, "Pretrain/Loss": 2.0668234825134277, "Pretrain/Loss (Raw)": 1.8696073293685913, "Pretrain/Step": 5372, "Pretrain/Step Time": 8.534676695242524} +{"Pretrain/Learning Rate": 2.1097943238572272e-05, "Pretrain/Loss": 2.0649282932281494, "Pretrain/Loss (Raw)": 1.9958561658859253, "Pretrain/Step": 5373, "Pretrain/Step Time": 8.54261970333755} +{"Pretrain/Learning Rate": 2.108955764199324e-05, "Pretrain/Loss": 2.0654473304748535, "Pretrain/Loss (Raw)": 2.0857009887695312, "Pretrain/Step": 5374, "Pretrain/Step Time": 8.53933390416205} +{"Pretrain/Learning Rate": 2.1081172496384855e-05, "Pretrain/Loss": 2.0653533935546875, "Pretrain/Loss (Raw)": 2.281686782836914, "Pretrain/Step": 5375, "Pretrain/Step Time": 8.539474727585912} +{"Pretrain/Learning Rate": 2.107278780271412e-05, "Pretrain/Loss": 2.0652074813842773, "Pretrain/Loss (Raw)": 2.096015453338623, "Pretrain/Step": 5376, "Pretrain/Step Time": 8.540772825479507} +{"Pretrain/Learning Rate": 2.1064403561948003e-05, "Pretrain/Loss": 2.0656023025512695, "Pretrain/Loss (Raw)": 2.1498465538024902, "Pretrain/Step": 5377, "Pretrain/Step Time": 8.55024446733296} +{"Pretrain/Learning Rate": 2.105601977505341e-05, "Pretrain/Loss": 2.0666818618774414, "Pretrain/Loss (Raw)": 2.0113472938537598, "Pretrain/Step": 5378, "Pretrain/Step Time": 8.54830820672214} +{"Pretrain/Learning Rate": 2.1047636442997205e-05, "Pretrain/Loss": 2.066270351409912, "Pretrain/Loss (Raw)": 2.0868725776672363, "Pretrain/Step": 5379, "Pretrain/Step Time": 8.553468082100153} +{"Pretrain/Learning Rate": 2.1039253566746182e-05, "Pretrain/Loss": 2.065800666809082, "Pretrain/Loss (Raw)": 2.016879081726074, "Pretrain/Step": 5380, "Pretrain/Step Time": 8.545226952061057} +{"Pretrain/Learning Rate": 2.1030871147267113e-05, "Pretrain/Loss": 2.063082218170166, "Pretrain/Loss (Raw)": 1.9099071025848389, "Pretrain/Step": 5381, "Pretrain/Step Time": 8.550902083516121} +{"Pretrain/Learning Rate": 2.1022489185526674e-05, "Pretrain/Loss": 2.060847282409668, "Pretrain/Loss (Raw)": 2.051102876663208, "Pretrain/Step": 5382, "Pretrain/Step Time": 8.544292848557234} +{"Pretrain/Learning Rate": 2.1014107682491534e-05, "Pretrain/Loss": 2.062389373779297, "Pretrain/Loss (Raw)": 2.18642258644104, "Pretrain/Step": 5383, "Pretrain/Step Time": 8.55104023963213} +{"Pretrain/Learning Rate": 2.1005726639128276e-05, "Pretrain/Loss": 2.062264919281006, "Pretrain/Loss (Raw)": 2.1509275436401367, "Pretrain/Step": 5384, "Pretrain/Step Time": 8.548781832680106} +{"Pretrain/Learning Rate": 2.0997346056403438e-05, "Pretrain/Loss": 2.062603712081909, "Pretrain/Loss (Raw)": 2.0298781394958496, "Pretrain/Step": 5385, "Pretrain/Step Time": 8.547872357070446} +{"Pretrain/Learning Rate": 2.0988965935283524e-05, "Pretrain/Loss": 2.0627503395080566, "Pretrain/Loss (Raw)": 2.1771981716156006, "Pretrain/Step": 5386, "Pretrain/Step Time": 8.544849881902337} +{"Pretrain/Learning Rate": 2.098058627673495e-05, "Pretrain/Loss": 2.060450315475464, "Pretrain/Loss (Raw)": 1.7473890781402588, "Pretrain/Step": 5387, "Pretrain/Step Time": 8.548334799706936} +{"Pretrain/Learning Rate": 2.097220708172411e-05, "Pretrain/Loss": 2.0604782104492188, "Pretrain/Loss (Raw)": 2.1024858951568604, "Pretrain/Step": 5388, "Pretrain/Step Time": 8.54100021161139} +{"Pretrain/Learning Rate": 2.0963828351217327e-05, "Pretrain/Loss": 2.061393976211548, "Pretrain/Loss (Raw)": 2.111616373062134, "Pretrain/Step": 5389, "Pretrain/Step Time": 8.548518501222134} +{"Pretrain/Learning Rate": 2.0955450086180882e-05, "Pretrain/Loss": 2.0587453842163086, "Pretrain/Loss (Raw)": 1.8603782653808594, "Pretrain/Step": 5390, "Pretrain/Step Time": 8.549857685342431} +{"Pretrain/Learning Rate": 2.094707228758099e-05, "Pretrain/Loss": 2.0576353073120117, "Pretrain/Loss (Raw)": 1.8610762357711792, "Pretrain/Step": 5391, "Pretrain/Step Time": 8.548048363998532} +{"Pretrain/Learning Rate": 2.093869495638382e-05, "Pretrain/Loss": 2.056877374649048, "Pretrain/Loss (Raw)": 1.9758014678955078, "Pretrain/Step": 5392, "Pretrain/Step Time": 8.549628414213657} +{"Pretrain/Learning Rate": 2.093031809355548e-05, "Pretrain/Loss": 2.055227041244507, "Pretrain/Loss (Raw)": 2.0817813873291016, "Pretrain/Step": 5393, "Pretrain/Step Time": 8.549770621582866} +{"Pretrain/Learning Rate": 2.0921941700062047e-05, "Pretrain/Loss": 2.0544309616088867, "Pretrain/Loss (Raw)": 1.893750548362732, "Pretrain/Step": 5394, "Pretrain/Step Time": 8.548569023609161} +{"Pretrain/Learning Rate": 2.0913565776869498e-05, "Pretrain/Loss": 2.053065776824951, "Pretrain/Loss (Raw)": 1.9536091089248657, "Pretrain/Step": 5395, "Pretrain/Step Time": 8.551760284230113} +{"Pretrain/Learning Rate": 2.0905190324943814e-05, "Pretrain/Loss": 2.054814577102661, "Pretrain/Loss (Raw)": 2.131542444229126, "Pretrain/Step": 5396, "Pretrain/Step Time": 8.549312064424157} +{"Pretrain/Learning Rate": 2.089681534525086e-05, "Pretrain/Loss": 2.053363084793091, "Pretrain/Loss (Raw)": 1.8908616304397583, "Pretrain/Step": 5397, "Pretrain/Step Time": 8.547369826585054} +{"Pretrain/Learning Rate": 2.0888440838756515e-05, "Pretrain/Loss": 2.0529732704162598, "Pretrain/Loss (Raw)": 2.018620491027832, "Pretrain/Step": 5398, "Pretrain/Step Time": 8.547668376937509} +{"Pretrain/Learning Rate": 2.088006680642653e-05, "Pretrain/Loss": 2.052393913269043, "Pretrain/Loss (Raw)": 2.0846097469329834, "Pretrain/Step": 5399, "Pretrain/Step Time": 8.549875352531672} +{"Pretrain/Learning Rate": 2.087169324922667e-05, "Pretrain/Loss": 2.051926612854004, "Pretrain/Loss (Raw)": 1.9436432123184204, "Pretrain/Step": 5400, "Pretrain/Step Time": 8.548308113589883} +{"Pretrain/Learning Rate": 2.086332016812258e-05, "Pretrain/Loss": 2.0509157180786133, "Pretrain/Loss (Raw)": 2.039949417114258, "Pretrain/Step": 5401, "Pretrain/Step Time": 8.551663851365447} +{"Pretrain/Learning Rate": 2.085494756407992e-05, "Pretrain/Loss": 2.050955295562744, "Pretrain/Loss (Raw)": 2.00225830078125, "Pretrain/Step": 5402, "Pretrain/Step Time": 8.550180118530989} +{"Pretrain/Learning Rate": 2.0846575438064227e-05, "Pretrain/Loss": 2.0508809089660645, "Pretrain/Loss (Raw)": 1.9413844347000122, "Pretrain/Step": 5403, "Pretrain/Step Time": 8.544353256002069} +{"Pretrain/Learning Rate": 2.0838203791041028e-05, "Pretrain/Loss": 2.0518441200256348, "Pretrain/Loss (Raw)": 2.0228004455566406, "Pretrain/Step": 5404, "Pretrain/Step Time": 8.544663477689028} +{"Pretrain/Learning Rate": 2.0829832623975775e-05, "Pretrain/Loss": 2.0550665855407715, "Pretrain/Loss (Raw)": 2.1341583728790283, "Pretrain/Step": 5405, "Pretrain/Step Time": 8.540782792493701} +{"Pretrain/Learning Rate": 2.0821461937833884e-05, "Pretrain/Loss": 2.0583322048187256, "Pretrain/Loss (Raw)": 2.275193929672241, "Pretrain/Step": 5406, "Pretrain/Step Time": 8.544039186090231} +{"Pretrain/Learning Rate": 2.0813091733580685e-05, "Pretrain/Loss": 2.058555841445923, "Pretrain/Loss (Raw)": 2.2433571815490723, "Pretrain/Step": 5407, "Pretrain/Step Time": 8.551146186888218} +{"Pretrain/Learning Rate": 2.080472201218148e-05, "Pretrain/Loss": 2.057648181915283, "Pretrain/Loss (Raw)": 2.029481887817383, "Pretrain/Step": 5408, "Pretrain/Step Time": 8.547447448596358} +{"Pretrain/Learning Rate": 2.0796352774601495e-05, "Pretrain/Loss": 2.0565953254699707, "Pretrain/Loss (Raw)": 2.071122646331787, "Pretrain/Step": 5409, "Pretrain/Step Time": 8.54551039263606} +{"Pretrain/Learning Rate": 2.0787984021805922e-05, "Pretrain/Loss": 2.0561892986297607, "Pretrain/Loss (Raw)": 1.9315506219863892, "Pretrain/Step": 5410, "Pretrain/Step Time": 8.547137051820755} +{"Pretrain/Learning Rate": 2.077961575475988e-05, "Pretrain/Loss": 2.0564324855804443, "Pretrain/Loss (Raw)": 2.0650546550750732, "Pretrain/Step": 5411, "Pretrain/Step Time": 8.548621265217662} +{"Pretrain/Learning Rate": 2.0771247974428434e-05, "Pretrain/Loss": 2.056453227996826, "Pretrain/Loss (Raw)": 2.093742609024048, "Pretrain/Step": 5412, "Pretrain/Step Time": 8.553033381700516} +{"Pretrain/Learning Rate": 2.07628806817766e-05, "Pretrain/Loss": 2.0532007217407227, "Pretrain/Loss (Raw)": 2.124507427215576, "Pretrain/Step": 5413, "Pretrain/Step Time": 8.554015226662159} +{"Pretrain/Learning Rate": 2.0754513877769328e-05, "Pretrain/Loss": 2.054196834564209, "Pretrain/Loss (Raw)": 2.181636095046997, "Pretrain/Step": 5414, "Pretrain/Step Time": 8.547011833637953} +{"Pretrain/Learning Rate": 2.074614756337152e-05, "Pretrain/Loss": 2.0518388748168945, "Pretrain/Loss (Raw)": 1.8078783750534058, "Pretrain/Step": 5415, "Pretrain/Step Time": 8.547131607308984} +{"Pretrain/Learning Rate": 2.073778173954803e-05, "Pretrain/Loss": 2.0529632568359375, "Pretrain/Loss (Raw)": 2.05116868019104, "Pretrain/Step": 5416, "Pretrain/Step Time": 8.544924391433597} +{"Pretrain/Learning Rate": 2.072941640726362e-05, "Pretrain/Loss": 2.052745819091797, "Pretrain/Loss (Raw)": 2.1011037826538086, "Pretrain/Step": 5417, "Pretrain/Step Time": 8.538672832772136} +{"Pretrain/Learning Rate": 2.0721051567483045e-05, "Pretrain/Loss": 2.0542492866516113, "Pretrain/Loss (Raw)": 2.1521499156951904, "Pretrain/Step": 5418, "Pretrain/Step Time": 8.539690474048257} +{"Pretrain/Learning Rate": 2.071268722117096e-05, "Pretrain/Loss": 2.051909923553467, "Pretrain/Loss (Raw)": 1.9858298301696777, "Pretrain/Step": 5419, "Pretrain/Step Time": 8.542135044932365} +{"Pretrain/Learning Rate": 2.0704323369291993e-05, "Pretrain/Loss": 2.050612449645996, "Pretrain/Loss (Raw)": 2.0132033824920654, "Pretrain/Step": 5420, "Pretrain/Step Time": 8.548372779041529} +{"Pretrain/Learning Rate": 2.069596001281069e-05, "Pretrain/Loss": 2.0507493019104004, "Pretrain/Loss (Raw)": 2.0995771884918213, "Pretrain/Step": 5421, "Pretrain/Step Time": 8.540869530290365} +{"Pretrain/Learning Rate": 2.0687597152691567e-05, "Pretrain/Loss": 2.0509402751922607, "Pretrain/Loss (Raw)": 2.029834270477295, "Pretrain/Step": 5422, "Pretrain/Step Time": 8.543200954794884} +{"Pretrain/Learning Rate": 2.0679234789899054e-05, "Pretrain/Loss": 2.0515055656433105, "Pretrain/Loss (Raw)": 2.126495361328125, "Pretrain/Step": 5423, "Pretrain/Step Time": 8.536795068532228} +{"Pretrain/Learning Rate": 2.067087292539755e-05, "Pretrain/Loss": 2.052353858947754, "Pretrain/Loss (Raw)": 2.1134238243103027, "Pretrain/Step": 5424, "Pretrain/Step Time": 8.539038373157382} +{"Pretrain/Learning Rate": 2.0662511560151373e-05, "Pretrain/Loss": 2.0504183769226074, "Pretrain/Loss (Raw)": 1.967761516571045, "Pretrain/Step": 5425, "Pretrain/Step Time": 8.54088269919157} +{"Pretrain/Learning Rate": 2.0654150695124804e-05, "Pretrain/Loss": 2.051077365875244, "Pretrain/Loss (Raw)": 2.1439669132232666, "Pretrain/Step": 5426, "Pretrain/Step Time": 8.541689302772284} +{"Pretrain/Learning Rate": 2.064579033128206e-05, "Pretrain/Loss": 2.049692153930664, "Pretrain/Loss (Raw)": 2.09560489654541, "Pretrain/Step": 5427, "Pretrain/Step Time": 8.544215355068445} +{"Pretrain/Learning Rate": 2.063743046958729e-05, "Pretrain/Loss": 2.0512847900390625, "Pretrain/Loss (Raw)": 2.0663392543792725, "Pretrain/Step": 5428, "Pretrain/Step Time": 8.54526405222714} +{"Pretrain/Learning Rate": 2.0629071111004595e-05, "Pretrain/Loss": 2.0512545108795166, "Pretrain/Loss (Raw)": 2.029132843017578, "Pretrain/Step": 5429, "Pretrain/Step Time": 8.547472957521677} +{"Pretrain/Learning Rate": 2.0620712256498016e-05, "Pretrain/Loss": 2.050314426422119, "Pretrain/Loss (Raw)": 1.929300308227539, "Pretrain/Step": 5430, "Pretrain/Step Time": 8.541946019977331} +{"Pretrain/Learning Rate": 2.061235390703154e-05, "Pretrain/Loss": 2.0464489459991455, "Pretrain/Loss (Raw)": 1.967658281326294, "Pretrain/Step": 5431, "Pretrain/Step Time": 8.547896130010486} +{"Pretrain/Learning Rate": 2.0603996063569078e-05, "Pretrain/Loss": 2.046657085418701, "Pretrain/Loss (Raw)": 2.1367385387420654, "Pretrain/Step": 5432, "Pretrain/Step Time": 8.548618229106069} +{"Pretrain/Learning Rate": 2.0595638727074512e-05, "Pretrain/Loss": 2.048935890197754, "Pretrain/Loss (Raw)": 2.0501627922058105, "Pretrain/Step": 5433, "Pretrain/Step Time": 8.54842840321362} +{"Pretrain/Learning Rate": 2.058728189851164e-05, "Pretrain/Loss": 2.0465896129608154, "Pretrain/Loss (Raw)": 2.0345065593719482, "Pretrain/Step": 5434, "Pretrain/Step Time": 8.544673506170511} +{"Pretrain/Learning Rate": 2.0578925578844216e-05, "Pretrain/Loss": 2.0468878746032715, "Pretrain/Loss (Raw)": 2.055004358291626, "Pretrain/Step": 5435, "Pretrain/Step Time": 8.54307733103633} +{"Pretrain/Learning Rate": 2.0570569769035915e-05, "Pretrain/Loss": 2.0463314056396484, "Pretrain/Loss (Raw)": 1.9444953203201294, "Pretrain/Step": 5436, "Pretrain/Step Time": 8.54372115060687} +{"Pretrain/Learning Rate": 2.0562214470050396e-05, "Pretrain/Loss": 2.0439701080322266, "Pretrain/Loss (Raw)": 1.8756153583526611, "Pretrain/Step": 5437, "Pretrain/Step Time": 8.545169094577432} +{"Pretrain/Learning Rate": 2.0553859682851204e-05, "Pretrain/Loss": 2.0448553562164307, "Pretrain/Loss (Raw)": 2.2213382720947266, "Pretrain/Step": 5438, "Pretrain/Step Time": 8.54574890807271} +{"Pretrain/Learning Rate": 2.0545505408401878e-05, "Pretrain/Loss": 2.044102191925049, "Pretrain/Loss (Raw)": 2.015500545501709, "Pretrain/Step": 5439, "Pretrain/Step Time": 8.543608779087663} +{"Pretrain/Learning Rate": 2.053715164766584e-05, "Pretrain/Loss": 2.0451364517211914, "Pretrain/Loss (Raw)": 2.075305223464966, "Pretrain/Step": 5440, "Pretrain/Step Time": 8.54333020746708} +{"Pretrain/Learning Rate": 2.052879840160652e-05, "Pretrain/Loss": 2.04494047164917, "Pretrain/Loss (Raw)": 2.0387320518493652, "Pretrain/Step": 5441, "Pretrain/Step Time": 8.544733829796314} +{"Pretrain/Learning Rate": 2.052044567118722e-05, "Pretrain/Loss": 2.043823003768921, "Pretrain/Loss (Raw)": 1.8825706243515015, "Pretrain/Step": 5442, "Pretrain/Step Time": 8.543151704594493} +{"Pretrain/Learning Rate": 2.0512093457371253e-05, "Pretrain/Loss": 2.0436649322509766, "Pretrain/Loss (Raw)": 2.0641798973083496, "Pretrain/Step": 5443, "Pretrain/Step Time": 8.548079622909427} +{"Pretrain/Learning Rate": 2.0503741761121804e-05, "Pretrain/Loss": 2.0444695949554443, "Pretrain/Loss (Raw)": 1.9316045045852661, "Pretrain/Step": 5444, "Pretrain/Step Time": 8.552156979218125} +{"Pretrain/Learning Rate": 2.049539058340205e-05, "Pretrain/Loss": 2.045463800430298, "Pretrain/Loss (Raw)": 1.9703863859176636, "Pretrain/Step": 5445, "Pretrain/Step Time": 8.547169720754027} +{"Pretrain/Learning Rate": 2.0487039925175073e-05, "Pretrain/Loss": 2.046113967895508, "Pretrain/Loss (Raw)": 2.2538673877716064, "Pretrain/Step": 5446, "Pretrain/Step Time": 8.544309934601188} +{"Pretrain/Learning Rate": 2.0478689787403923e-05, "Pretrain/Loss": 2.0473451614379883, "Pretrain/Loss (Raw)": 2.173517942428589, "Pretrain/Step": 5447, "Pretrain/Step Time": 8.541587261483073} +{"Pretrain/Learning Rate": 2.0470340171051567e-05, "Pretrain/Loss": 2.0480270385742188, "Pretrain/Loss (Raw)": 2.0674800872802734, "Pretrain/Step": 5448, "Pretrain/Step Time": 8.54381214082241} +{"Pretrain/Learning Rate": 2.046199107708093e-05, "Pretrain/Loss": 2.045867919921875, "Pretrain/Loss (Raw)": 1.7787095308303833, "Pretrain/Step": 5449, "Pretrain/Step Time": 8.544736795127392} +{"Pretrain/Learning Rate": 2.0453642506454862e-05, "Pretrain/Loss": 2.0408754348754883, "Pretrain/Loss (Raw)": 1.7449374198913574, "Pretrain/Step": 5450, "Pretrain/Step Time": 8.54539910890162} +{"Pretrain/Learning Rate": 2.044529446013617e-05, "Pretrain/Loss": 2.0406415462493896, "Pretrain/Loss (Raw)": 2.127363681793213, "Pretrain/Step": 5451, "Pretrain/Step Time": 8.54042412340641} +{"Pretrain/Learning Rate": 2.0436946939087576e-05, "Pretrain/Loss": 2.0392351150512695, "Pretrain/Loss (Raw)": 1.9659391641616821, "Pretrain/Step": 5452, "Pretrain/Step Time": 8.539390033110976} +{"Pretrain/Learning Rate": 2.042859994427177e-05, "Pretrain/Loss": 2.038029432296753, "Pretrain/Loss (Raw)": 1.8391358852386475, "Pretrain/Step": 5453, "Pretrain/Step Time": 8.540621917694807} +{"Pretrain/Learning Rate": 2.042025347665135e-05, "Pretrain/Loss": 2.0393190383911133, "Pretrain/Loss (Raw)": 2.219485282897949, "Pretrain/Step": 5454, "Pretrain/Step Time": 8.540857929736376} +{"Pretrain/Learning Rate": 2.041190753718889e-05, "Pretrain/Loss": 2.0418591499328613, "Pretrain/Loss (Raw)": 2.1477017402648926, "Pretrain/Step": 5455, "Pretrain/Step Time": 8.544008253142238} +{"Pretrain/Learning Rate": 2.0403562126846865e-05, "Pretrain/Loss": 2.041224479675293, "Pretrain/Loss (Raw)": 1.9231197834014893, "Pretrain/Step": 5456, "Pretrain/Step Time": 8.553803946822882} +{"Pretrain/Learning Rate": 2.039521724658772e-05, "Pretrain/Loss": 2.0404810905456543, "Pretrain/Loss (Raw)": 2.0335445404052734, "Pretrain/Step": 5457, "Pretrain/Step Time": 8.545570140704513} +{"Pretrain/Learning Rate": 2.0386872897373816e-05, "Pretrain/Loss": 2.0398244857788086, "Pretrain/Loss (Raw)": 1.9831421375274658, "Pretrain/Step": 5458, "Pretrain/Step Time": 8.5445227753371} +{"Pretrain/Learning Rate": 2.037852908016747e-05, "Pretrain/Loss": 2.037550449371338, "Pretrain/Loss (Raw)": 1.9813300371170044, "Pretrain/Step": 5459, "Pretrain/Step Time": 8.547598008066416} +{"Pretrain/Learning Rate": 2.0370185795930927e-05, "Pretrain/Loss": 2.03873348236084, "Pretrain/Loss (Raw)": 2.1606006622314453, "Pretrain/Step": 5460, "Pretrain/Step Time": 8.544240184128284} +{"Pretrain/Learning Rate": 2.0361843045626378e-05, "Pretrain/Loss": 2.039102554321289, "Pretrain/Loss (Raw)": 2.246518611907959, "Pretrain/Step": 5461, "Pretrain/Step Time": 8.540939012542367} +{"Pretrain/Learning Rate": 2.035350083021594e-05, "Pretrain/Loss": 2.039146900177002, "Pretrain/Loss (Raw)": 2.152611494064331, "Pretrain/Step": 5462, "Pretrain/Step Time": 8.550121508538723} +{"Pretrain/Learning Rate": 2.0345159150661683e-05, "Pretrain/Loss": 2.037959337234497, "Pretrain/Loss (Raw)": 1.9789427518844604, "Pretrain/Step": 5463, "Pretrain/Step Time": 8.542382948100567} +{"Pretrain/Learning Rate": 2.0336818007925603e-05, "Pretrain/Loss": 2.0377440452575684, "Pretrain/Loss (Raw)": 2.196632146835327, "Pretrain/Step": 5464, "Pretrain/Step Time": 8.539020819589496} +{"Pretrain/Learning Rate": 2.032847740296965e-05, "Pretrain/Loss": 2.039468765258789, "Pretrain/Loss (Raw)": 2.1836066246032715, "Pretrain/Step": 5465, "Pretrain/Step Time": 8.540338518097997} +{"Pretrain/Learning Rate": 2.0320137336755692e-05, "Pretrain/Loss": 2.0418262481689453, "Pretrain/Loss (Raw)": 2.082728862762451, "Pretrain/Step": 5466, "Pretrain/Step Time": 8.540439443662763} +{"Pretrain/Learning Rate": 2.0311797810245543e-05, "Pretrain/Loss": 2.0416057109832764, "Pretrain/Loss (Raw)": 1.9672672748565674, "Pretrain/Step": 5467, "Pretrain/Step Time": 8.540095819160342} +{"Pretrain/Learning Rate": 2.0303458824400974e-05, "Pretrain/Loss": 2.040764570236206, "Pretrain/Loss (Raw)": 1.7796216011047363, "Pretrain/Step": 5468, "Pretrain/Step Time": 8.547203086316586} +{"Pretrain/Learning Rate": 2.0295120380183657e-05, "Pretrain/Loss": 2.042949676513672, "Pretrain/Loss (Raw)": 2.2005300521850586, "Pretrain/Step": 5469, "Pretrain/Step Time": 8.537142558023334} +{"Pretrain/Learning Rate": 2.0286782478555232e-05, "Pretrain/Loss": 2.043534994125366, "Pretrain/Loss (Raw)": 1.986969232559204, "Pretrain/Step": 5470, "Pretrain/Step Time": 8.53981657139957} +{"Pretrain/Learning Rate": 2.027844512047726e-05, "Pretrain/Loss": 2.0451674461364746, "Pretrain/Loss (Raw)": 2.1554009914398193, "Pretrain/Step": 5471, "Pretrain/Step Time": 8.542442422360182} +{"Pretrain/Learning Rate": 2.027010830691124e-05, "Pretrain/Loss": 2.0464088916778564, "Pretrain/Loss (Raw)": 1.9314169883728027, "Pretrain/Step": 5472, "Pretrain/Step Time": 8.540340995416045} +{"Pretrain/Learning Rate": 2.0261772038818622e-05, "Pretrain/Loss": 2.045362949371338, "Pretrain/Loss (Raw)": 2.0032546520233154, "Pretrain/Step": 5473, "Pretrain/Step Time": 8.545746386051178} +{"Pretrain/Learning Rate": 2.0253436317160784e-05, "Pretrain/Loss": 2.046229124069214, "Pretrain/Loss (Raw)": 2.0890395641326904, "Pretrain/Step": 5474, "Pretrain/Step Time": 8.553621483966708} +{"Pretrain/Learning Rate": 2.0245101142899032e-05, "Pretrain/Loss": 2.0443115234375, "Pretrain/Loss (Raw)": 1.7340210676193237, "Pretrain/Step": 5475, "Pretrain/Step Time": 8.541286304593086} +{"Pretrain/Learning Rate": 2.0236766516994623e-05, "Pretrain/Loss": 2.047236204147339, "Pretrain/Loss (Raw)": 2.3040568828582764, "Pretrain/Step": 5476, "Pretrain/Step Time": 8.541952323168516} +{"Pretrain/Learning Rate": 2.022843244040874e-05, "Pretrain/Loss": 2.0483222007751465, "Pretrain/Loss (Raw)": 2.1943860054016113, "Pretrain/Step": 5477, "Pretrain/Step Time": 8.539115836843848} +{"Pretrain/Learning Rate": 2.0220098914102525e-05, "Pretrain/Loss": 2.046607255935669, "Pretrain/Loss (Raw)": 1.9064817428588867, "Pretrain/Step": 5478, "Pretrain/Step Time": 8.544451579451561} +{"Pretrain/Learning Rate": 2.021176593903701e-05, "Pretrain/Loss": 2.044848918914795, "Pretrain/Loss (Raw)": 1.9842102527618408, "Pretrain/Step": 5479, "Pretrain/Step Time": 8.544762190431356} +{"Pretrain/Learning Rate": 2.0203433516173225e-05, "Pretrain/Loss": 2.041452407836914, "Pretrain/Loss (Raw)": 1.8471516370773315, "Pretrain/Step": 5480, "Pretrain/Step Time": 8.553180579096079} +{"Pretrain/Learning Rate": 2.0195101646472075e-05, "Pretrain/Loss": 2.0431065559387207, "Pretrain/Loss (Raw)": 2.2439398765563965, "Pretrain/Step": 5481, "Pretrain/Step Time": 8.542618706822395} +{"Pretrain/Learning Rate": 2.018677033089446e-05, "Pretrain/Loss": 2.041419267654419, "Pretrain/Loss (Raw)": 1.9607182741165161, "Pretrain/Step": 5482, "Pretrain/Step Time": 8.546704871580005} +{"Pretrain/Learning Rate": 2.017843957040115e-05, "Pretrain/Loss": 2.043374538421631, "Pretrain/Loss (Raw)": 2.2817234992980957, "Pretrain/Step": 5483, "Pretrain/Step Time": 8.544680617749691} +{"Pretrain/Learning Rate": 2.0170109365952934e-05, "Pretrain/Loss": 2.043653726577759, "Pretrain/Loss (Raw)": 1.9528560638427734, "Pretrain/Step": 5484, "Pretrain/Step Time": 8.543003793805838} +{"Pretrain/Learning Rate": 2.0161779718510443e-05, "Pretrain/Loss": 2.0445327758789062, "Pretrain/Loss (Raw)": 2.0638561248779297, "Pretrain/Step": 5485, "Pretrain/Step Time": 8.544015914201736} +{"Pretrain/Learning Rate": 2.015345062903433e-05, "Pretrain/Loss": 2.0448315143585205, "Pretrain/Loss (Raw)": 2.100039005279541, "Pretrain/Step": 5486, "Pretrain/Step Time": 8.549987381324172} +{"Pretrain/Learning Rate": 2.014512209848512e-05, "Pretrain/Loss": 2.0415098667144775, "Pretrain/Loss (Raw)": 1.8264436721801758, "Pretrain/Step": 5487, "Pretrain/Step Time": 8.54533558897674} +{"Pretrain/Learning Rate": 2.013679412782331e-05, "Pretrain/Loss": 2.044438123703003, "Pretrain/Loss (Raw)": 2.43807315826416, "Pretrain/Step": 5488, "Pretrain/Step Time": 8.549847861751914} +{"Pretrain/Learning Rate": 2.0128466718009313e-05, "Pretrain/Loss": 2.043370246887207, "Pretrain/Loss (Raw)": 2.032282829284668, "Pretrain/Step": 5489, "Pretrain/Step Time": 8.546230221167207} +{"Pretrain/Learning Rate": 2.0120139870003492e-05, "Pretrain/Loss": 2.0424747467041016, "Pretrain/Loss (Raw)": 2.0073537826538086, "Pretrain/Step": 5490, "Pretrain/Step Time": 8.54083058796823} +{"Pretrain/Learning Rate": 2.0111813584766134e-05, "Pretrain/Loss": 2.0410919189453125, "Pretrain/Loss (Raw)": 2.0077426433563232, "Pretrain/Step": 5491, "Pretrain/Step Time": 8.543697949498892} +{"Pretrain/Learning Rate": 2.010348786325747e-05, "Pretrain/Loss": 2.041393280029297, "Pretrain/Loss (Raw)": 1.8769582509994507, "Pretrain/Step": 5492, "Pretrain/Step Time": 8.54964186437428} +{"Pretrain/Learning Rate": 2.0095162706437655e-05, "Pretrain/Loss": 2.040055990219116, "Pretrain/Loss (Raw)": 1.9709057807922363, "Pretrain/Step": 5493, "Pretrain/Step Time": 8.54526505433023} +{"Pretrain/Learning Rate": 2.0086838115266794e-05, "Pretrain/Loss": 2.0399341583251953, "Pretrain/Loss (Raw)": 1.9760557413101196, "Pretrain/Step": 5494, "Pretrain/Step Time": 8.54870517924428} +{"Pretrain/Learning Rate": 2.007851409070491e-05, "Pretrain/Loss": 2.0386714935302734, "Pretrain/Loss (Raw)": 1.9336540699005127, "Pretrain/Step": 5495, "Pretrain/Step Time": 8.546449907124043} +{"Pretrain/Learning Rate": 2.007019063371197e-05, "Pretrain/Loss": 2.0389113426208496, "Pretrain/Loss (Raw)": 2.05256724357605, "Pretrain/Step": 5496, "Pretrain/Step Time": 8.544102244079113} +{"Pretrain/Learning Rate": 2.006186774524788e-05, "Pretrain/Loss": 2.038705825805664, "Pretrain/Loss (Raw)": 2.098254919052124, "Pretrain/Step": 5497, "Pretrain/Step Time": 8.543230870738626} +{"Pretrain/Learning Rate": 2.005354542627247e-05, "Pretrain/Loss": 2.0388174057006836, "Pretrain/Loss (Raw)": 1.9536759853363037, "Pretrain/Step": 5498, "Pretrain/Step Time": 8.556024802848697} +{"Pretrain/Learning Rate": 2.0045223677745507e-05, "Pretrain/Loss": 2.0381102561950684, "Pretrain/Loss (Raw)": 1.887118935585022, "Pretrain/Step": 5499, "Pretrain/Step Time": 8.548612346872687} +{"Pretrain/Learning Rate": 2.0036902500626704e-05, "Pretrain/Loss": 2.0397281646728516, "Pretrain/Loss (Raw)": 2.076688289642334, "Pretrain/Step": 5500, "Pretrain/Step Time": 8.553479826077819} +{"Pretrain/Learning Rate": 2.002858189587568e-05, "Pretrain/Loss": 2.040297508239746, "Pretrain/Loss (Raw)": 2.068727731704712, "Pretrain/Step": 5501, "Pretrain/Step Time": 8.547734271734953} +{"Pretrain/Learning Rate": 2.002026186445203e-05, "Pretrain/Loss": 2.0401265621185303, "Pretrain/Loss (Raw)": 2.063830614089966, "Pretrain/Step": 5502, "Pretrain/Step Time": 8.546554716303945} +{"Pretrain/Learning Rate": 2.0011942407315236e-05, "Pretrain/Loss": 2.0382251739501953, "Pretrain/Loss (Raw)": 2.038323402404785, "Pretrain/Step": 5503, "Pretrain/Step Time": 8.543704025447369} +{"Pretrain/Learning Rate": 2.0003623525424758e-05, "Pretrain/Loss": 2.0378684997558594, "Pretrain/Loss (Raw)": 2.0503299236297607, "Pretrain/Step": 5504, "Pretrain/Step Time": 8.557178994640708} +{"Pretrain/Learning Rate": 1.9995305219739952e-05, "Pretrain/Loss": 2.037921667098999, "Pretrain/Loss (Raw)": 2.1566598415374756, "Pretrain/Step": 5505, "Pretrain/Step Time": 8.544453177601099} +{"Pretrain/Learning Rate": 1.9986987491220137e-05, "Pretrain/Loss": 2.0374951362609863, "Pretrain/Loss (Raw)": 1.9567898511886597, "Pretrain/Step": 5506, "Pretrain/Step Time": 8.550506044179201} +{"Pretrain/Learning Rate": 1.997867034082454e-05, "Pretrain/Loss": 2.0380167961120605, "Pretrain/Loss (Raw)": 2.153597116470337, "Pretrain/Step": 5507, "Pretrain/Step Time": 8.54852956533432} +{"Pretrain/Learning Rate": 1.997035376951234e-05, "Pretrain/Loss": 2.037642002105713, "Pretrain/Loss (Raw)": 1.968931794166565, "Pretrain/Step": 5508, "Pretrain/Step Time": 8.54884173348546} +{"Pretrain/Learning Rate": 1.996203777824265e-05, "Pretrain/Loss": 2.0396502017974854, "Pretrain/Loss (Raw)": 2.1669511795043945, "Pretrain/Step": 5509, "Pretrain/Step Time": 8.545832553878427} +{"Pretrain/Learning Rate": 1.99537223679745e-05, "Pretrain/Loss": 2.0417964458465576, "Pretrain/Loss (Raw)": 2.3258280754089355, "Pretrain/Step": 5510, "Pretrain/Step Time": 8.550183491781354} +{"Pretrain/Learning Rate": 1.994540753966687e-05, "Pretrain/Loss": 2.0414249897003174, "Pretrain/Loss (Raw)": 2.1388742923736572, "Pretrain/Step": 5511, "Pretrain/Step Time": 8.5419015660882} +{"Pretrain/Learning Rate": 1.9937093294278653e-05, "Pretrain/Loss": 2.0433244705200195, "Pretrain/Loss (Raw)": 2.394029140472412, "Pretrain/Step": 5512, "Pretrain/Step Time": 8.540348393842578} +{"Pretrain/Learning Rate": 1.99287796327687e-05, "Pretrain/Loss": 2.043227195739746, "Pretrain/Loss (Raw)": 2.0174286365509033, "Pretrain/Step": 5513, "Pretrain/Step Time": 8.543098233640194} +{"Pretrain/Learning Rate": 1.9920466556095772e-05, "Pretrain/Loss": 2.0413317680358887, "Pretrain/Loss (Raw)": 1.934601902961731, "Pretrain/Step": 5514, "Pretrain/Step Time": 8.543115083128214} +{"Pretrain/Learning Rate": 1.991215406521858e-05, "Pretrain/Loss": 2.045624256134033, "Pretrain/Loss (Raw)": 2.2968363761901855, "Pretrain/Step": 5515, "Pretrain/Step Time": 8.539609337225556} +{"Pretrain/Learning Rate": 1.9903842161095752e-05, "Pretrain/Loss": 2.0464560985565186, "Pretrain/Loss (Raw)": 2.208958148956299, "Pretrain/Step": 5516, "Pretrain/Step Time": 8.548546429723501} +{"Pretrain/Learning Rate": 1.9895530844685865e-05, "Pretrain/Loss": 2.0446345806121826, "Pretrain/Loss (Raw)": 1.8784425258636475, "Pretrain/Step": 5517, "Pretrain/Step Time": 8.544289836660028} +{"Pretrain/Learning Rate": 1.988722011694741e-05, "Pretrain/Loss": 2.0448241233825684, "Pretrain/Loss (Raw)": 1.884671926498413, "Pretrain/Step": 5518, "Pretrain/Step Time": 8.544310668483377} +{"Pretrain/Learning Rate": 1.987890997883883e-05, "Pretrain/Loss": 2.0470032691955566, "Pretrain/Loss (Raw)": 2.140000581741333, "Pretrain/Step": 5519, "Pretrain/Step Time": 8.543361410498619} +{"Pretrain/Learning Rate": 1.987060043131847e-05, "Pretrain/Loss": 2.047795057296753, "Pretrain/Loss (Raw)": 2.0771381855010986, "Pretrain/Step": 5520, "Pretrain/Step Time": 8.54638928733766} +{"Pretrain/Learning Rate": 1.9862291475344654e-05, "Pretrain/Loss": 2.047239303588867, "Pretrain/Loss (Raw)": 2.0106678009033203, "Pretrain/Step": 5521, "Pretrain/Step Time": 8.543110923841596} +{"Pretrain/Learning Rate": 1.985398311187558e-05, "Pretrain/Loss": 2.048552989959717, "Pretrain/Loss (Raw)": 2.061898946762085, "Pretrain/Step": 5522, "Pretrain/Step Time": 8.548737715929747} +{"Pretrain/Learning Rate": 1.9845675341869437e-05, "Pretrain/Loss": 2.048952102661133, "Pretrain/Loss (Raw)": 2.004645347595215, "Pretrain/Step": 5523, "Pretrain/Step Time": 8.542067812755704} +{"Pretrain/Learning Rate": 1.9837368166284284e-05, "Pretrain/Loss": 2.0469939708709717, "Pretrain/Loss (Raw)": 1.8809454441070557, "Pretrain/Step": 5524, "Pretrain/Step Time": 8.544538993388414} +{"Pretrain/Learning Rate": 1.982906158607818e-05, "Pretrain/Loss": 2.0489706993103027, "Pretrain/Loss (Raw)": 2.143864154815674, "Pretrain/Step": 5525, "Pretrain/Step Time": 8.536335047334433} +{"Pretrain/Learning Rate": 1.982075560220904e-05, "Pretrain/Loss": 2.0521483421325684, "Pretrain/Loss (Raw)": 2.4253814220428467, "Pretrain/Step": 5526, "Pretrain/Step Time": 8.533593500033021} +{"Pretrain/Learning Rate": 1.981245021563479e-05, "Pretrain/Loss": 2.0494728088378906, "Pretrain/Loss (Raw)": 1.7421329021453857, "Pretrain/Step": 5527, "Pretrain/Step Time": 8.533843392506242} +{"Pretrain/Learning Rate": 1.9804145427313213e-05, "Pretrain/Loss": 2.0502514839172363, "Pretrain/Loss (Raw)": 2.043318510055542, "Pretrain/Step": 5528, "Pretrain/Step Time": 8.544137356802821} +{"Pretrain/Learning Rate": 1.9795841238202077e-05, "Pretrain/Loss": 2.0493855476379395, "Pretrain/Loss (Raw)": 1.9290823936462402, "Pretrain/Step": 5529, "Pretrain/Step Time": 8.538920495659113} +{"Pretrain/Learning Rate": 1.9787537649259043e-05, "Pretrain/Loss": 2.050389528274536, "Pretrain/Loss (Raw)": 2.1307876110076904, "Pretrain/Step": 5530, "Pretrain/Step Time": 8.544165823608637} +{"Pretrain/Learning Rate": 1.977923466144174e-05, "Pretrain/Loss": 2.051034688949585, "Pretrain/Loss (Raw)": 2.0239624977111816, "Pretrain/Step": 5531, "Pretrain/Step Time": 8.541974885389209} +{"Pretrain/Learning Rate": 1.977093227570768e-05, "Pretrain/Loss": 2.051194667816162, "Pretrain/Loss (Raw)": 2.043272018432617, "Pretrain/Step": 5532, "Pretrain/Step Time": 8.540111703798175} +{"Pretrain/Learning Rate": 1.9762630493014366e-05, "Pretrain/Loss": 2.049020290374756, "Pretrain/Loss (Raw)": 1.8558279275894165, "Pretrain/Step": 5533, "Pretrain/Step Time": 8.544019922614098} +{"Pretrain/Learning Rate": 1.9754329314319176e-05, "Pretrain/Loss": 2.048243999481201, "Pretrain/Loss (Raw)": 2.175819158554077, "Pretrain/Step": 5534, "Pretrain/Step Time": 8.54734294116497} +{"Pretrain/Learning Rate": 1.974602874057945e-05, "Pretrain/Loss": 2.047125816345215, "Pretrain/Loss (Raw)": 2.1002278327941895, "Pretrain/Step": 5535, "Pretrain/Step Time": 8.537568129599094} +{"Pretrain/Learning Rate": 1.9737728772752446e-05, "Pretrain/Loss": 2.0479702949523926, "Pretrain/Loss (Raw)": 2.137611150741577, "Pretrain/Step": 5536, "Pretrain/Step Time": 8.546912532299757} +{"Pretrain/Learning Rate": 1.9729429411795358e-05, "Pretrain/Loss": 2.0478904247283936, "Pretrain/Loss (Raw)": 2.060887336730957, "Pretrain/Step": 5537, "Pretrain/Step Time": 8.54094916768372} +{"Pretrain/Learning Rate": 1.97211306586653e-05, "Pretrain/Loss": 2.0502986907958984, "Pretrain/Loss (Raw)": 2.239823341369629, "Pretrain/Step": 5538, "Pretrain/Step Time": 8.539773503318429} +{"Pretrain/Learning Rate": 1.971283251431934e-05, "Pretrain/Loss": 2.0510756969451904, "Pretrain/Loss (Raw)": 2.1644885540008545, "Pretrain/Step": 5539, "Pretrain/Step Time": 8.53306962735951} +{"Pretrain/Learning Rate": 1.970453497971444e-05, "Pretrain/Loss": 2.0506744384765625, "Pretrain/Loss (Raw)": 2.0423855781555176, "Pretrain/Step": 5540, "Pretrain/Step Time": 8.545193502679467} +{"Pretrain/Learning Rate": 1.969623805580752e-05, "Pretrain/Loss": 2.0490591526031494, "Pretrain/Loss (Raw)": 1.917755126953125, "Pretrain/Step": 5541, "Pretrain/Step Time": 8.542166290804744} +{"Pretrain/Learning Rate": 1.9687941743555422e-05, "Pretrain/Loss": 2.047062635421753, "Pretrain/Loss (Raw)": 1.926084280014038, "Pretrain/Step": 5542, "Pretrain/Step Time": 8.542252536863089} +{"Pretrain/Learning Rate": 1.9679646043914914e-05, "Pretrain/Loss": 2.051483154296875, "Pretrain/Loss (Raw)": 2.37370228767395, "Pretrain/Step": 5543, "Pretrain/Step Time": 8.540156191214919} +{"Pretrain/Learning Rate": 1.967135095784269e-05, "Pretrain/Loss": 2.051222801208496, "Pretrain/Loss (Raw)": 2.017848253250122, "Pretrain/Step": 5544, "Pretrain/Step Time": 8.54027739353478} +{"Pretrain/Learning Rate": 1.966305648629539e-05, "Pretrain/Loss": 2.0511350631713867, "Pretrain/Loss (Raw)": 2.089852809906006, "Pretrain/Step": 5545, "Pretrain/Step Time": 8.540367729961872} +{"Pretrain/Learning Rate": 1.9654762630229558e-05, "Pretrain/Loss": 2.0514607429504395, "Pretrain/Loss (Raw)": 2.193869113922119, "Pretrain/Step": 5546, "Pretrain/Step Time": 8.548162430524826} +{"Pretrain/Learning Rate": 1.9646469390601692e-05, "Pretrain/Loss": 2.053121566772461, "Pretrain/Loss (Raw)": 2.1983768939971924, "Pretrain/Step": 5547, "Pretrain/Step Time": 8.544884711503983} +{"Pretrain/Learning Rate": 1.96381767683682e-05, "Pretrain/Loss": 2.0492875576019287, "Pretrain/Loss (Raw)": 1.5224716663360596, "Pretrain/Step": 5548, "Pretrain/Step Time": 8.54316021874547} +{"Pretrain/Learning Rate": 1.9629884764485422e-05, "Pretrain/Loss": 2.047729253768921, "Pretrain/Loss (Raw)": 1.900119423866272, "Pretrain/Step": 5549, "Pretrain/Step Time": 8.537950545549393} +{"Pretrain/Learning Rate": 1.962159337990965e-05, "Pretrain/Loss": 2.049800395965576, "Pretrain/Loss (Raw)": 2.294917106628418, "Pretrain/Step": 5550, "Pretrain/Step Time": 8.538433130830526} +{"Pretrain/Learning Rate": 1.9613302615597064e-05, "Pretrain/Loss": 2.0481748580932617, "Pretrain/Loss (Raw)": 1.9184361696243286, "Pretrain/Step": 5551, "Pretrain/Step Time": 8.537865126505494} +{"Pretrain/Learning Rate": 1.960501247250381e-05, "Pretrain/Loss": 2.048699378967285, "Pretrain/Loss (Raw)": 2.180593967437744, "Pretrain/Step": 5552, "Pretrain/Step Time": 8.543452005833387} +{"Pretrain/Learning Rate": 1.9596722951585936e-05, "Pretrain/Loss": 2.048511028289795, "Pretrain/Loss (Raw)": 1.9436252117156982, "Pretrain/Step": 5553, "Pretrain/Step Time": 8.541812635958195} +{"Pretrain/Learning Rate": 1.9588434053799437e-05, "Pretrain/Loss": 2.0468106269836426, "Pretrain/Loss (Raw)": 1.926310658454895, "Pretrain/Step": 5554, "Pretrain/Step Time": 8.542320065200329} +{"Pretrain/Learning Rate": 1.9580145780100216e-05, "Pretrain/Loss": 2.045442581176758, "Pretrain/Loss (Raw)": 1.9205044507980347, "Pretrain/Step": 5555, "Pretrain/Step Time": 8.538914181292057} +{"Pretrain/Learning Rate": 1.9571858131444128e-05, "Pretrain/Loss": 2.0445003509521484, "Pretrain/Loss (Raw)": 1.9457120895385742, "Pretrain/Step": 5556, "Pretrain/Step Time": 8.538940029218793} +{"Pretrain/Learning Rate": 1.9563571108786936e-05, "Pretrain/Loss": 2.045996904373169, "Pretrain/Loss (Raw)": 2.220731496810913, "Pretrain/Step": 5557, "Pretrain/Step Time": 8.539361292496324} +{"Pretrain/Learning Rate": 1.9555284713084345e-05, "Pretrain/Loss": 2.045809507369995, "Pretrain/Loss (Raw)": 1.9052928686141968, "Pretrain/Step": 5558, "Pretrain/Step Time": 8.541702881455421} +{"Pretrain/Learning Rate": 1.954699894529197e-05, "Pretrain/Loss": 2.0462093353271484, "Pretrain/Loss (Raw)": 2.018834352493286, "Pretrain/Step": 5559, "Pretrain/Step Time": 8.540138704702258} +{"Pretrain/Learning Rate": 1.953871380636538e-05, "Pretrain/Loss": 2.0453524589538574, "Pretrain/Loss (Raw)": 2.027066469192505, "Pretrain/Step": 5560, "Pretrain/Step Time": 8.55044425651431} +{"Pretrain/Learning Rate": 1.953042929726004e-05, "Pretrain/Loss": 2.044140100479126, "Pretrain/Loss (Raw)": 1.8949717283248901, "Pretrain/Step": 5561, "Pretrain/Step Time": 8.546544905751944} +{"Pretrain/Learning Rate": 1.952214541893138e-05, "Pretrain/Loss": 2.0438342094421387, "Pretrain/Loss (Raw)": 1.9953491687774658, "Pretrain/Step": 5562, "Pretrain/Step Time": 8.546933779492974} +{"Pretrain/Learning Rate": 1.9513862172334707e-05, "Pretrain/Loss": 2.043595790863037, "Pretrain/Loss (Raw)": 2.0244696140289307, "Pretrain/Step": 5563, "Pretrain/Step Time": 8.548000987619162} +{"Pretrain/Learning Rate": 1.9505579558425313e-05, "Pretrain/Loss": 2.0467443466186523, "Pretrain/Loss (Raw)": 2.347562551498413, "Pretrain/Step": 5564, "Pretrain/Step Time": 8.55294337309897} +{"Pretrain/Learning Rate": 1.9497297578158363e-05, "Pretrain/Loss": 2.047929525375366, "Pretrain/Loss (Raw)": 2.027311086654663, "Pretrain/Step": 5565, "Pretrain/Step Time": 8.551845472306013} +{"Pretrain/Learning Rate": 1.9489016232489e-05, "Pretrain/Loss": 2.045994281768799, "Pretrain/Loss (Raw)": 1.9736263751983643, "Pretrain/Step": 5566, "Pretrain/Step Time": 8.557344034314156} +{"Pretrain/Learning Rate": 1.9480735522372236e-05, "Pretrain/Loss": 2.0471127033233643, "Pretrain/Loss (Raw)": 2.1586356163024902, "Pretrain/Step": 5567, "Pretrain/Step Time": 8.545848546549678} +{"Pretrain/Learning Rate": 1.9472455448763077e-05, "Pretrain/Loss": 2.0490987300872803, "Pretrain/Loss (Raw)": 2.329542636871338, "Pretrain/Step": 5568, "Pretrain/Step Time": 8.549753993749619} +{"Pretrain/Learning Rate": 1.9464176012616386e-05, "Pretrain/Loss": 2.048595428466797, "Pretrain/Loss (Raw)": 1.9742748737335205, "Pretrain/Step": 5569, "Pretrain/Step Time": 8.552298679947853} +{"Pretrain/Learning Rate": 1.945589721488702e-05, "Pretrain/Loss": 2.0499048233032227, "Pretrain/Loss (Raw)": 2.050191640853882, "Pretrain/Step": 5570, "Pretrain/Step Time": 8.549563435837626} +{"Pretrain/Learning Rate": 1.9447619056529697e-05, "Pretrain/Loss": 2.0507781505584717, "Pretrain/Loss (Raw)": 2.175945997238159, "Pretrain/Step": 5571, "Pretrain/Step Time": 8.55252050049603} +{"Pretrain/Learning Rate": 1.9439341538499117e-05, "Pretrain/Loss": 2.0524957180023193, "Pretrain/Loss (Raw)": 2.151474714279175, "Pretrain/Step": 5572, "Pretrain/Step Time": 8.54925544001162} +{"Pretrain/Learning Rate": 1.9431064661749866e-05, "Pretrain/Loss": 2.051570415496826, "Pretrain/Loss (Raw)": 1.851946234703064, "Pretrain/Step": 5573, "Pretrain/Step Time": 8.543580519035459} +{"Pretrain/Learning Rate": 1.9422788427236487e-05, "Pretrain/Loss": 2.0510194301605225, "Pretrain/Loss (Raw)": 2.183335304260254, "Pretrain/Step": 5574, "Pretrain/Step Time": 8.541877821087837} +{"Pretrain/Learning Rate": 1.9414512835913422e-05, "Pretrain/Loss": 2.047621488571167, "Pretrain/Loss (Raw)": 1.7385872602462769, "Pretrain/Step": 5575, "Pretrain/Step Time": 8.54300882294774} +{"Pretrain/Learning Rate": 1.940623788873506e-05, "Pretrain/Loss": 2.0485386848449707, "Pretrain/Loss (Raw)": 2.1848747730255127, "Pretrain/Step": 5576, "Pretrain/Step Time": 8.541404463350773} +{"Pretrain/Learning Rate": 1.9397963586655702e-05, "Pretrain/Loss": 2.051520824432373, "Pretrain/Loss (Raw)": 2.160433530807495, "Pretrain/Step": 5577, "Pretrain/Step Time": 8.549201196059585} +{"Pretrain/Learning Rate": 1.9389689930629585e-05, "Pretrain/Loss": 2.0545334815979004, "Pretrain/Loss (Raw)": 2.130537271499634, "Pretrain/Step": 5578, "Pretrain/Step Time": 8.549089627340436} +{"Pretrain/Learning Rate": 1.9381416921610855e-05, "Pretrain/Loss": 2.0534887313842773, "Pretrain/Loss (Raw)": 1.9936379194259644, "Pretrain/Step": 5579, "Pretrain/Step Time": 8.545881312340498} +{"Pretrain/Learning Rate": 1.9373144560553604e-05, "Pretrain/Loss": 2.054445266723633, "Pretrain/Loss (Raw)": 2.088407039642334, "Pretrain/Step": 5580, "Pretrain/Step Time": 8.550214253365993} +{"Pretrain/Learning Rate": 1.9364872848411837e-05, "Pretrain/Loss": 2.0578293800354004, "Pretrain/Loss (Raw)": 2.272287130355835, "Pretrain/Step": 5581, "Pretrain/Step Time": 8.550427427515388} +{"Pretrain/Learning Rate": 1.9356601786139487e-05, "Pretrain/Loss": 2.05733323097229, "Pretrain/Loss (Raw)": 2.1559743881225586, "Pretrain/Step": 5582, "Pretrain/Step Time": 8.550470620393753} +{"Pretrain/Learning Rate": 1.934833137469041e-05, "Pretrain/Loss": 2.056454658508301, "Pretrain/Loss (Raw)": 2.0352442264556885, "Pretrain/Step": 5583, "Pretrain/Step Time": 8.553850434720516} +{"Pretrain/Learning Rate": 1.9340061615018393e-05, "Pretrain/Loss": 2.0584115982055664, "Pretrain/Loss (Raw)": 2.173600435256958, "Pretrain/Step": 5584, "Pretrain/Step Time": 8.547725772485137} +{"Pretrain/Learning Rate": 1.9331792508077136e-05, "Pretrain/Loss": 2.057389259338379, "Pretrain/Loss (Raw)": 1.902677297592163, "Pretrain/Step": 5585, "Pretrain/Step Time": 8.5509336553514} +{"Pretrain/Learning Rate": 1.9323524054820285e-05, "Pretrain/Loss": 2.058488368988037, "Pretrain/Loss (Raw)": 2.123852252960205, "Pretrain/Step": 5586, "Pretrain/Step Time": 8.548144694417715} +{"Pretrain/Learning Rate": 1.9315256256201382e-05, "Pretrain/Loss": 2.0585975646972656, "Pretrain/Loss (Raw)": 1.9952871799468994, "Pretrain/Step": 5587, "Pretrain/Step Time": 8.549752661958337} +{"Pretrain/Learning Rate": 1.930698911317392e-05, "Pretrain/Loss": 2.0589804649353027, "Pretrain/Loss (Raw)": 2.209648370742798, "Pretrain/Step": 5588, "Pretrain/Step Time": 8.54873401671648} +{"Pretrain/Learning Rate": 1.929872262669129e-05, "Pretrain/Loss": 2.0565099716186523, "Pretrain/Loss (Raw)": 1.9302465915679932, "Pretrain/Step": 5589, "Pretrain/Step Time": 8.55622929520905} +{"Pretrain/Learning Rate": 1.9290456797706835e-05, "Pretrain/Loss": 2.05570387840271, "Pretrain/Loss (Raw)": 2.049459934234619, "Pretrain/Step": 5590, "Pretrain/Step Time": 8.546962628141046} +{"Pretrain/Learning Rate": 1.928219162717381e-05, "Pretrain/Loss": 2.0563247203826904, "Pretrain/Loss (Raw)": 2.0584237575531006, "Pretrain/Step": 5591, "Pretrain/Step Time": 8.546139301732183} +{"Pretrain/Learning Rate": 1.927392711604539e-05, "Pretrain/Loss": 2.053722620010376, "Pretrain/Loss (Raw)": 1.8635529279708862, "Pretrain/Step": 5592, "Pretrain/Step Time": 8.548933234065771} +{"Pretrain/Learning Rate": 1.926566326527468e-05, "Pretrain/Loss": 2.052340507507324, "Pretrain/Loss (Raw)": 2.006697177886963, "Pretrain/Step": 5593, "Pretrain/Step Time": 8.549272468313575} +{"Pretrain/Learning Rate": 1.9257400075814697e-05, "Pretrain/Loss": 2.049710273742676, "Pretrain/Loss (Raw)": 1.746052861213684, "Pretrain/Step": 5594, "Pretrain/Step Time": 8.554647851735353} +{"Pretrain/Learning Rate": 1.92491375486184e-05, "Pretrain/Loss": 2.049193859100342, "Pretrain/Loss (Raw)": 1.9011435508728027, "Pretrain/Step": 5595, "Pretrain/Step Time": 8.559753432869911} +{"Pretrain/Learning Rate": 1.9240875684638658e-05, "Pretrain/Loss": 2.0513291358947754, "Pretrain/Loss (Raw)": 2.052949905395508, "Pretrain/Step": 5596, "Pretrain/Step Time": 8.55030425451696} +{"Pretrain/Learning Rate": 1.9232614484828277e-05, "Pretrain/Loss": 2.0498883724212646, "Pretrain/Loss (Raw)": 2.0161025524139404, "Pretrain/Step": 5597, "Pretrain/Step Time": 8.551220884546638} +{"Pretrain/Learning Rate": 1.922435395013996e-05, "Pretrain/Loss": 2.0510292053222656, "Pretrain/Loss (Raw)": 2.1330316066741943, "Pretrain/Step": 5598, "Pretrain/Step Time": 8.550978031009436} +{"Pretrain/Learning Rate": 1.921609408152637e-05, "Pretrain/Loss": 2.0494384765625, "Pretrain/Loss (Raw)": 1.9517900943756104, "Pretrain/Step": 5599, "Pretrain/Step Time": 8.549095038324594} +{"Pretrain/Learning Rate": 1.9207834879940058e-05, "Pretrain/Loss": 2.0517311096191406, "Pretrain/Loss (Raw)": 2.224855899810791, "Pretrain/Step": 5600, "Pretrain/Step Time": 8.552625622600317} +{"Pretrain/Learning Rate": 1.919957634633353e-05, "Pretrain/Loss": 2.0529375076293945, "Pretrain/Loss (Raw)": 2.157654047012329, "Pretrain/Step": 5601, "Pretrain/Step Time": 8.56029325723648} +{"Pretrain/Learning Rate": 1.9191318481659183e-05, "Pretrain/Loss": 2.0534329414367676, "Pretrain/Loss (Raw)": 2.1524853706359863, "Pretrain/Step": 5602, "Pretrain/Step Time": 8.55007316544652} +{"Pretrain/Learning Rate": 1.918306128686937e-05, "Pretrain/Loss": 2.0559914112091064, "Pretrain/Loss (Raw)": 2.0614960193634033, "Pretrain/Step": 5603, "Pretrain/Step Time": 8.545728558674455} +{"Pretrain/Learning Rate": 1.9174804762916324e-05, "Pretrain/Loss": 2.0538923740386963, "Pretrain/Loss (Raw)": 2.0353710651397705, "Pretrain/Step": 5604, "Pretrain/Step Time": 8.548680063337088} +{"Pretrain/Learning Rate": 1.916654891075226e-05, "Pretrain/Loss": 2.050952434539795, "Pretrain/Loss (Raw)": 1.8180652856826782, "Pretrain/Step": 5605, "Pretrain/Step Time": 8.549501106142998} +{"Pretrain/Learning Rate": 1.915829373132924e-05, "Pretrain/Loss": 2.052399158477783, "Pretrain/Loss (Raw)": 2.0916998386383057, "Pretrain/Step": 5606, "Pretrain/Step Time": 8.542834440246224} +{"Pretrain/Learning Rate": 1.9150039225599336e-05, "Pretrain/Loss": 2.053640842437744, "Pretrain/Loss (Raw)": 2.143129587173462, "Pretrain/Step": 5607, "Pretrain/Step Time": 8.548750383779407} +{"Pretrain/Learning Rate": 1.914178539451446e-05, "Pretrain/Loss": 2.0550267696380615, "Pretrain/Loss (Raw)": 2.0245416164398193, "Pretrain/Step": 5608, "Pretrain/Step Time": 8.541965639218688} +{"Pretrain/Learning Rate": 1.913353223902651e-05, "Pretrain/Loss": 2.054525852203369, "Pretrain/Loss (Raw)": 2.1798155307769775, "Pretrain/Step": 5609, "Pretrain/Step Time": 8.54525213316083} +{"Pretrain/Learning Rate": 1.912527976008725e-05, "Pretrain/Loss": 2.0566928386688232, "Pretrain/Loss (Raw)": 2.238086223602295, "Pretrain/Step": 5610, "Pretrain/Step Time": 8.546249529346824} +{"Pretrain/Learning Rate": 1.911702795864843e-05, "Pretrain/Loss": 2.0545544624328613, "Pretrain/Loss (Raw)": 2.008021354675293, "Pretrain/Step": 5611, "Pretrain/Step Time": 8.547142857685685} +{"Pretrain/Learning Rate": 1.9108776835661655e-05, "Pretrain/Loss": 2.055051326751709, "Pretrain/Loss (Raw)": 2.0164475440979004, "Pretrain/Step": 5612, "Pretrain/Step Time": 8.549466801807284} +{"Pretrain/Learning Rate": 1.91005263920785e-05, "Pretrain/Loss": 2.0542612075805664, "Pretrain/Loss (Raw)": 1.962720274925232, "Pretrain/Step": 5613, "Pretrain/Step Time": 8.55475446768105} +{"Pretrain/Learning Rate": 1.9092276628850438e-05, "Pretrain/Loss": 2.053330183029175, "Pretrain/Loss (Raw)": 1.980881929397583, "Pretrain/Step": 5614, "Pretrain/Step Time": 8.549351785331964} +{"Pretrain/Learning Rate": 1.9084027546928872e-05, "Pretrain/Loss": 2.056161403656006, "Pretrain/Loss (Raw)": 2.188847303390503, "Pretrain/Step": 5615, "Pretrain/Step Time": 8.545424977317452} +{"Pretrain/Learning Rate": 1.907577914726513e-05, "Pretrain/Loss": 2.0544676780700684, "Pretrain/Loss (Raw)": 2.2212319374084473, "Pretrain/Step": 5616, "Pretrain/Step Time": 8.543405713513494} +{"Pretrain/Learning Rate": 1.906753143081045e-05, "Pretrain/Loss": 2.0543313026428223, "Pretrain/Loss (Raw)": 2.014859199523926, "Pretrain/Step": 5617, "Pretrain/Step Time": 8.54849941469729} +{"Pretrain/Learning Rate": 1.9059284398515997e-05, "Pretrain/Loss": 2.055729389190674, "Pretrain/Loss (Raw)": 2.1862919330596924, "Pretrain/Step": 5618, "Pretrain/Step Time": 8.549283027648926} +{"Pretrain/Learning Rate": 1.9051038051332868e-05, "Pretrain/Loss": 2.056419849395752, "Pretrain/Loss (Raw)": 2.0961320400238037, "Pretrain/Step": 5619, "Pretrain/Step Time": 8.556406144052744} +{"Pretrain/Learning Rate": 1.9042792390212054e-05, "Pretrain/Loss": 2.060141086578369, "Pretrain/Loss (Raw)": 2.353257179260254, "Pretrain/Step": 5620, "Pretrain/Step Time": 8.54962869733572} +{"Pretrain/Learning Rate": 1.9034547416104502e-05, "Pretrain/Loss": 2.0610270500183105, "Pretrain/Loss (Raw)": 2.084307909011841, "Pretrain/Step": 5621, "Pretrain/Step Time": 8.552917916327715} +{"Pretrain/Learning Rate": 1.9026303129961047e-05, "Pretrain/Loss": 2.061906337738037, "Pretrain/Loss (Raw)": 2.088646650314331, "Pretrain/Step": 5622, "Pretrain/Step Time": 8.547420728951693} +{"Pretrain/Learning Rate": 1.901805953273247e-05, "Pretrain/Loss": 2.0611400604248047, "Pretrain/Loss (Raw)": 1.8355515003204346, "Pretrain/Step": 5623, "Pretrain/Step Time": 8.550420820713043} +{"Pretrain/Learning Rate": 1.900981662536945e-05, "Pretrain/Loss": 2.0600051879882812, "Pretrain/Loss (Raw)": 1.9073108434677124, "Pretrain/Step": 5624, "Pretrain/Step Time": 8.5505623947829} +{"Pretrain/Learning Rate": 1.9001574408822603e-05, "Pretrain/Loss": 2.0588037967681885, "Pretrain/Loss (Raw)": 1.9444630146026611, "Pretrain/Step": 5625, "Pretrain/Step Time": 8.557722814381123} +{"Pretrain/Learning Rate": 1.899333288404246e-05, "Pretrain/Loss": 2.0607309341430664, "Pretrain/Loss (Raw)": 2.200364589691162, "Pretrain/Step": 5626, "Pretrain/Step Time": 8.546140784397721} +{"Pretrain/Learning Rate": 1.8985092051979478e-05, "Pretrain/Loss": 2.063506603240967, "Pretrain/Loss (Raw)": 2.2424192428588867, "Pretrain/Step": 5627, "Pretrain/Step Time": 8.548941181972623} +{"Pretrain/Learning Rate": 1.897685191358402e-05, "Pretrain/Loss": 2.0634965896606445, "Pretrain/Loss (Raw)": 2.0754001140594482, "Pretrain/Step": 5628, "Pretrain/Step Time": 8.544139930978417} +{"Pretrain/Learning Rate": 1.8968612469806387e-05, "Pretrain/Loss": 2.063350200653076, "Pretrain/Loss (Raw)": 2.0499656200408936, "Pretrain/Step": 5629, "Pretrain/Step Time": 8.545183755457401} +{"Pretrain/Learning Rate": 1.8960373721596775e-05, "Pretrain/Loss": 2.061072826385498, "Pretrain/Loss (Raw)": 1.772336721420288, "Pretrain/Step": 5630, "Pretrain/Step Time": 8.542740739881992} +{"Pretrain/Learning Rate": 1.8952135669905334e-05, "Pretrain/Loss": 2.0605554580688477, "Pretrain/Loss (Raw)": 1.9721202850341797, "Pretrain/Step": 5631, "Pretrain/Step Time": 8.553483569994569} +{"Pretrain/Learning Rate": 1.89438983156821e-05, "Pretrain/Loss": 2.061124324798584, "Pretrain/Loss (Raw)": 2.123119831085205, "Pretrain/Step": 5632, "Pretrain/Step Time": 8.540007162839174} +{"Pretrain/Learning Rate": 1.8935661659877046e-05, "Pretrain/Loss": 2.0603652000427246, "Pretrain/Loss (Raw)": 2.059480667114258, "Pretrain/Step": 5633, "Pretrain/Step Time": 8.545924937352538} +{"Pretrain/Learning Rate": 1.8927425703440076e-05, "Pretrain/Loss": 2.0597896575927734, "Pretrain/Loss (Raw)": 1.8831162452697754, "Pretrain/Step": 5634, "Pretrain/Step Time": 8.543820602819324} +{"Pretrain/Learning Rate": 1.8919190447320982e-05, "Pretrain/Loss": 2.0578341484069824, "Pretrain/Loss (Raw)": 1.9033106565475464, "Pretrain/Step": 5635, "Pretrain/Step Time": 8.543595787137747} +{"Pretrain/Learning Rate": 1.8910955892469505e-05, "Pretrain/Loss": 2.059382915496826, "Pretrain/Loss (Raw)": 2.1671793460845947, "Pretrain/Step": 5636, "Pretrain/Step Time": 8.543191438540816} +{"Pretrain/Learning Rate": 1.890272203983528e-05, "Pretrain/Loss": 2.0572028160095215, "Pretrain/Loss (Raw)": 1.8879045248031616, "Pretrain/Step": 5637, "Pretrain/Step Time": 8.548871379345655} +{"Pretrain/Learning Rate": 1.8894488890367885e-05, "Pretrain/Loss": 2.0566353797912598, "Pretrain/Loss (Raw)": 2.2531826496124268, "Pretrain/Step": 5638, "Pretrain/Step Time": 8.543961921706796} +{"Pretrain/Learning Rate": 1.8886256445016798e-05, "Pretrain/Loss": 2.054924964904785, "Pretrain/Loss (Raw)": 1.9199517965316772, "Pretrain/Step": 5639, "Pretrain/Step Time": 8.549060294404626} +{"Pretrain/Learning Rate": 1.8878024704731433e-05, "Pretrain/Loss": 2.053539276123047, "Pretrain/Loss (Raw)": 2.216642141342163, "Pretrain/Step": 5640, "Pretrain/Step Time": 8.549096781760454} +{"Pretrain/Learning Rate": 1.88697936704611e-05, "Pretrain/Loss": 2.053567886352539, "Pretrain/Loss (Raw)": 2.0211029052734375, "Pretrain/Step": 5641, "Pretrain/Step Time": 8.55120049789548} +{"Pretrain/Learning Rate": 1.8861563343155054e-05, "Pretrain/Loss": 2.0552964210510254, "Pretrain/Loss (Raw)": 2.1558377742767334, "Pretrain/Step": 5642, "Pretrain/Step Time": 8.546359162777662} +{"Pretrain/Learning Rate": 1.8853333723762438e-05, "Pretrain/Loss": 2.0564258098602295, "Pretrain/Loss (Raw)": 2.4414353370666504, "Pretrain/Step": 5643, "Pretrain/Step Time": 8.556256486102939} +{"Pretrain/Learning Rate": 1.884510481323236e-05, "Pretrain/Loss": 2.0564866065979004, "Pretrain/Loss (Raw)": 2.216719388961792, "Pretrain/Step": 5644, "Pretrain/Step Time": 8.548604097217321} +{"Pretrain/Learning Rate": 1.8836876612513777e-05, "Pretrain/Loss": 2.058746337890625, "Pretrain/Loss (Raw)": 2.1677119731903076, "Pretrain/Step": 5645, "Pretrain/Step Time": 8.551295539364219} +{"Pretrain/Learning Rate": 1.882864912255564e-05, "Pretrain/Loss": 2.060013771057129, "Pretrain/Loss (Raw)": 2.0468530654907227, "Pretrain/Step": 5646, "Pretrain/Step Time": 8.550815345719457} +{"Pretrain/Learning Rate": 1.882042234430675e-05, "Pretrain/Loss": 2.05903959274292, "Pretrain/Loss (Raw)": 2.015331983566284, "Pretrain/Step": 5647, "Pretrain/Step Time": 8.548879157751799} +{"Pretrain/Learning Rate": 1.8812196278715895e-05, "Pretrain/Loss": 2.057939052581787, "Pretrain/Loss (Raw)": 1.9362562894821167, "Pretrain/Step": 5648, "Pretrain/Step Time": 8.545782871544361} +{"Pretrain/Learning Rate": 1.8803970926731703e-05, "Pretrain/Loss": 2.0588083267211914, "Pretrain/Loss (Raw)": 2.1219732761383057, "Pretrain/Step": 5649, "Pretrain/Step Time": 8.55617974512279} +{"Pretrain/Learning Rate": 1.8795746289302798e-05, "Pretrain/Loss": 2.0595028400421143, "Pretrain/Loss (Raw)": 2.150770425796509, "Pretrain/Step": 5650, "Pretrain/Step Time": 8.550102123990655} +{"Pretrain/Learning Rate": 1.878752236737765e-05, "Pretrain/Loss": 2.0580015182495117, "Pretrain/Loss (Raw)": 1.8124805688858032, "Pretrain/Step": 5651, "Pretrain/Step Time": 8.548641564324498} +{"Pretrain/Learning Rate": 1.8779299161904712e-05, "Pretrain/Loss": 2.060640573501587, "Pretrain/Loss (Raw)": 2.218745708465576, "Pretrain/Step": 5652, "Pretrain/Step Time": 8.549237405881286} +{"Pretrain/Learning Rate": 1.87710766738323e-05, "Pretrain/Loss": 2.059098720550537, "Pretrain/Loss (Raw)": 1.946528434753418, "Pretrain/Step": 5653, "Pretrain/Step Time": 8.548895621672273} +{"Pretrain/Learning Rate": 1.8762854904108677e-05, "Pretrain/Loss": 2.0539379119873047, "Pretrain/Loss (Raw)": 1.764751672744751, "Pretrain/Step": 5654, "Pretrain/Step Time": 8.555308753624558} +{"Pretrain/Learning Rate": 1.8754633853682016e-05, "Pretrain/Loss": 2.0555992126464844, "Pretrain/Loss (Raw)": 1.9548211097717285, "Pretrain/Step": 5655, "Pretrain/Step Time": 8.559921506792307} +{"Pretrain/Learning Rate": 1.874641352350041e-05, "Pretrain/Loss": 2.0540363788604736, "Pretrain/Loss (Raw)": 1.843253254890442, "Pretrain/Step": 5656, "Pretrain/Step Time": 8.547465598210692} +{"Pretrain/Learning Rate": 1.8738193914511865e-05, "Pretrain/Loss": 2.0532262325286865, "Pretrain/Loss (Raw)": 1.825395941734314, "Pretrain/Step": 5657, "Pretrain/Step Time": 8.553751794621348} +{"Pretrain/Learning Rate": 1.8729975027664303e-05, "Pretrain/Loss": 2.0534751415252686, "Pretrain/Loss (Raw)": 2.1626274585723877, "Pretrain/Step": 5658, "Pretrain/Step Time": 8.552678536623716} +{"Pretrain/Learning Rate": 1.8721756863905566e-05, "Pretrain/Loss": 2.0527944564819336, "Pretrain/Loss (Raw)": 1.9368581771850586, "Pretrain/Step": 5659, "Pretrain/Step Time": 8.552305772900581} +{"Pretrain/Learning Rate": 1.8713539424183417e-05, "Pretrain/Loss": 2.0532474517822266, "Pretrain/Loss (Raw)": 2.101250171661377, "Pretrain/Step": 5660, "Pretrain/Step Time": 8.550587141886353} +{"Pretrain/Learning Rate": 1.8705322709445515e-05, "Pretrain/Loss": 2.0536088943481445, "Pretrain/Loss (Raw)": 1.902097225189209, "Pretrain/Step": 5661, "Pretrain/Step Time": 8.555621923878789} +{"Pretrain/Learning Rate": 1.8697106720639467e-05, "Pretrain/Loss": 2.054584503173828, "Pretrain/Loss (Raw)": 2.3006694316864014, "Pretrain/Step": 5662, "Pretrain/Step Time": 8.547107491642237} +{"Pretrain/Learning Rate": 1.8688891458712765e-05, "Pretrain/Loss": 2.053966522216797, "Pretrain/Loss (Raw)": 2.021127223968506, "Pretrain/Step": 5663, "Pretrain/Step Time": 8.557897880673409} +{"Pretrain/Learning Rate": 1.8680676924612847e-05, "Pretrain/Loss": 2.0539724826812744, "Pretrain/Loss (Raw)": 2.138387680053711, "Pretrain/Step": 5664, "Pretrain/Step Time": 8.549414668232203} +{"Pretrain/Learning Rate": 1.8672463119287037e-05, "Pretrain/Loss": 2.0532705783843994, "Pretrain/Loss (Raw)": 1.9710447788238525, "Pretrain/Step": 5665, "Pretrain/Step Time": 8.554251700639725} +{"Pretrain/Learning Rate": 1.86642500436826e-05, "Pretrain/Loss": 2.0532166957855225, "Pretrain/Loss (Raw)": 2.2329249382019043, "Pretrain/Step": 5666, "Pretrain/Step Time": 8.557648118585348} +{"Pretrain/Learning Rate": 1.8656037698746704e-05, "Pretrain/Loss": 2.05159592628479, "Pretrain/Loss (Raw)": 1.9570116996765137, "Pretrain/Step": 5667, "Pretrain/Step Time": 8.564133871346712} +{"Pretrain/Learning Rate": 1.8647826085426433e-05, "Pretrain/Loss": 2.0519227981567383, "Pretrain/Loss (Raw)": 2.084247589111328, "Pretrain/Step": 5668, "Pretrain/Step Time": 8.549341460689902} +{"Pretrain/Learning Rate": 1.8639615204668786e-05, "Pretrain/Loss": 2.052572250366211, "Pretrain/Loss (Raw)": 2.0009145736694336, "Pretrain/Step": 5669, "Pretrain/Step Time": 8.55056381970644} +{"Pretrain/Learning Rate": 1.863140505742069e-05, "Pretrain/Loss": 2.054138660430908, "Pretrain/Loss (Raw)": 2.1265673637390137, "Pretrain/Step": 5670, "Pretrain/Step Time": 8.552559709176421} +{"Pretrain/Learning Rate": 1.862319564462897e-05, "Pretrain/Loss": 2.0517454147338867, "Pretrain/Loss (Raw)": 2.0673410892486572, "Pretrain/Step": 5671, "Pretrain/Step Time": 8.549457002431154} +{"Pretrain/Learning Rate": 1.8614986967240382e-05, "Pretrain/Loss": 2.052706480026245, "Pretrain/Loss (Raw)": 2.1408491134643555, "Pretrain/Step": 5672, "Pretrain/Step Time": 8.551114745438099} +{"Pretrain/Learning Rate": 1.8606779026201577e-05, "Pretrain/Loss": 2.052180767059326, "Pretrain/Loss (Raw)": 2.0225672721862793, "Pretrain/Step": 5673, "Pretrain/Step Time": 8.55560028553009} +{"Pretrain/Learning Rate": 1.859857182245914e-05, "Pretrain/Loss": 2.050205707550049, "Pretrain/Loss (Raw)": 1.9410666227340698, "Pretrain/Step": 5674, "Pretrain/Step Time": 8.5444379709661} +{"Pretrain/Learning Rate": 1.859036535695957e-05, "Pretrain/Loss": 2.04840350151062, "Pretrain/Loss (Raw)": 1.9677002429962158, "Pretrain/Step": 5675, "Pretrain/Step Time": 8.554427821189165} +{"Pretrain/Learning Rate": 1.858215963064927e-05, "Pretrain/Loss": 2.052753448486328, "Pretrain/Loss (Raw)": 2.079256057739258, "Pretrain/Step": 5676, "Pretrain/Step Time": 8.551072316244245} +{"Pretrain/Learning Rate": 1.8573954644474562e-05, "Pretrain/Loss": 2.052962303161621, "Pretrain/Loss (Raw)": 1.9268747568130493, "Pretrain/Step": 5677, "Pretrain/Step Time": 8.551476599648595} +{"Pretrain/Learning Rate": 1.8565750399381684e-05, "Pretrain/Loss": 2.0494446754455566, "Pretrain/Loss (Raw)": 1.844625473022461, "Pretrain/Step": 5678, "Pretrain/Step Time": 8.551521927118301} +{"Pretrain/Learning Rate": 1.8557546896316793e-05, "Pretrain/Loss": 2.0498738288879395, "Pretrain/Loss (Raw)": 1.973374605178833, "Pretrain/Step": 5679, "Pretrain/Step Time": 8.559089301154017} +{"Pretrain/Learning Rate": 1.8549344136225946e-05, "Pretrain/Loss": 2.050663471221924, "Pretrain/Loss (Raw)": 2.281670331954956, "Pretrain/Step": 5680, "Pretrain/Step Time": 8.54883005283773} +{"Pretrain/Learning Rate": 1.8541142120055136e-05, "Pretrain/Loss": 2.050685167312622, "Pretrain/Loss (Raw)": 1.9464077949523926, "Pretrain/Step": 5681, "Pretrain/Step Time": 8.554517770186067} +{"Pretrain/Learning Rate": 1.8532940848750245e-05, "Pretrain/Loss": 2.0510447025299072, "Pretrain/Loss (Raw)": 1.9723387956619263, "Pretrain/Step": 5682, "Pretrain/Step Time": 8.55611346848309} +{"Pretrain/Learning Rate": 1.8524740323257095e-05, "Pretrain/Loss": 2.0541019439697266, "Pretrain/Loss (Raw)": 2.311826467514038, "Pretrain/Step": 5683, "Pretrain/Step Time": 8.553505199030042} +{"Pretrain/Learning Rate": 1.85165405445214e-05, "Pretrain/Loss": 2.0571582317352295, "Pretrain/Loss (Raw)": 2.3369040489196777, "Pretrain/Step": 5684, "Pretrain/Step Time": 8.550168186426163} +{"Pretrain/Learning Rate": 1.8508341513488804e-05, "Pretrain/Loss": 2.056427478790283, "Pretrain/Loss (Raw)": 2.1272220611572266, "Pretrain/Step": 5685, "Pretrain/Step Time": 8.551175137981772} +{"Pretrain/Learning Rate": 1.8500143231104846e-05, "Pretrain/Loss": 2.05794095993042, "Pretrain/Loss (Raw)": 2.0989990234375, "Pretrain/Step": 5686, "Pretrain/Step Time": 8.550393737852573} +{"Pretrain/Learning Rate": 1.8491945698315014e-05, "Pretrain/Loss": 2.0566930770874023, "Pretrain/Loss (Raw)": 1.859128713607788, "Pretrain/Step": 5687, "Pretrain/Step Time": 8.552544886246324} +{"Pretrain/Learning Rate": 1.8483748916064654e-05, "Pretrain/Loss": 2.0586535930633545, "Pretrain/Loss (Raw)": 2.277985095977783, "Pretrain/Step": 5688, "Pretrain/Step Time": 8.544351860880852} +{"Pretrain/Learning Rate": 1.8475552885299092e-05, "Pretrain/Loss": 2.0595955848693848, "Pretrain/Loss (Raw)": 2.0155789852142334, "Pretrain/Step": 5689, "Pretrain/Step Time": 8.54573849402368} +{"Pretrain/Learning Rate": 1.8467357606963496e-05, "Pretrain/Loss": 2.058741807937622, "Pretrain/Loss (Raw)": 1.8860373497009277, "Pretrain/Step": 5690, "Pretrain/Step Time": 8.541187085211277} +{"Pretrain/Learning Rate": 1.845916308200302e-05, "Pretrain/Loss": 2.058424234390259, "Pretrain/Loss (Raw)": 1.98383367061615, "Pretrain/Step": 5691, "Pretrain/Step Time": 8.548157684504986} +{"Pretrain/Learning Rate": 1.8450969311362666e-05, "Pretrain/Loss": 2.0576210021972656, "Pretrain/Loss (Raw)": 2.2447361946105957, "Pretrain/Step": 5692, "Pretrain/Step Time": 8.549387691542506} +{"Pretrain/Learning Rate": 1.8442776295987403e-05, "Pretrain/Loss": 2.059061050415039, "Pretrain/Loss (Raw)": 2.2116732597351074, "Pretrain/Step": 5693, "Pretrain/Step Time": 8.548143217340112} +{"Pretrain/Learning Rate": 1.843458403682206e-05, "Pretrain/Loss": 2.058898448944092, "Pretrain/Loss (Raw)": 1.9527759552001953, "Pretrain/Step": 5694, "Pretrain/Step Time": 8.54206807911396} +{"Pretrain/Learning Rate": 1.8426392534811445e-05, "Pretrain/Loss": 2.059173583984375, "Pretrain/Loss (Raw)": 2.1938636302948, "Pretrain/Step": 5695, "Pretrain/Step Time": 8.547165714204311} +{"Pretrain/Learning Rate": 1.84182017909002e-05, "Pretrain/Loss": 2.057241916656494, "Pretrain/Loss (Raw)": 2.082265615463257, "Pretrain/Step": 5696, "Pretrain/Step Time": 8.546897035092115} +{"Pretrain/Learning Rate": 1.841001180603295e-05, "Pretrain/Loss": 2.05908203125, "Pretrain/Loss (Raw)": 2.209824562072754, "Pretrain/Step": 5697, "Pretrain/Step Time": 8.552539598196745} +{"Pretrain/Learning Rate": 1.8401822581154188e-05, "Pretrain/Loss": 2.0593295097351074, "Pretrain/Loss (Raw)": 2.081862211227417, "Pretrain/Step": 5698, "Pretrain/Step Time": 8.554636327549815} +{"Pretrain/Learning Rate": 1.8393634117208343e-05, "Pretrain/Loss": 2.059452533721924, "Pretrain/Loss (Raw)": 2.19172739982605, "Pretrain/Step": 5699, "Pretrain/Step Time": 8.548578526824713} +{"Pretrain/Learning Rate": 1.838544641513973e-05, "Pretrain/Loss": 2.0597193241119385, "Pretrain/Loss (Raw)": 2.185607433319092, "Pretrain/Step": 5700, "Pretrain/Step Time": 8.547241438180208} +{"Pretrain/Learning Rate": 1.8377259475892612e-05, "Pretrain/Loss": 2.060173511505127, "Pretrain/Loss (Raw)": 1.9100923538208008, "Pretrain/Step": 5701, "Pretrain/Step Time": 8.546946108341217} +{"Pretrain/Learning Rate": 1.8369073300411137e-05, "Pretrain/Loss": 2.0586888790130615, "Pretrain/Loss (Raw)": 1.9932845830917358, "Pretrain/Step": 5702, "Pretrain/Step Time": 8.549970338121057} +{"Pretrain/Learning Rate": 1.836088788963938e-05, "Pretrain/Loss": 2.0613460540771484, "Pretrain/Loss (Raw)": 2.078702926635742, "Pretrain/Step": 5703, "Pretrain/Step Time": 8.548568520694971} +{"Pretrain/Learning Rate": 1.8352703244521308e-05, "Pretrain/Loss": 2.0606300830841064, "Pretrain/Loss (Raw)": 2.0932400226593018, "Pretrain/Step": 5704, "Pretrain/Step Time": 8.552026199176908} +{"Pretrain/Learning Rate": 1.8344519366000828e-05, "Pretrain/Loss": 2.060028314590454, "Pretrain/Loss (Raw)": 2.083420991897583, "Pretrain/Step": 5705, "Pretrain/Step Time": 8.54577505402267} +{"Pretrain/Learning Rate": 1.833633625502173e-05, "Pretrain/Loss": 2.0595591068267822, "Pretrain/Loss (Raw)": 2.070443868637085, "Pretrain/Step": 5706, "Pretrain/Step Time": 8.543302899226546} +{"Pretrain/Learning Rate": 1.832815391252774e-05, "Pretrain/Loss": 2.0598366260528564, "Pretrain/Loss (Raw)": 2.0291898250579834, "Pretrain/Step": 5707, "Pretrain/Step Time": 8.544841280207038} +{"Pretrain/Learning Rate": 1.8319972339462478e-05, "Pretrain/Loss": 2.0602023601531982, "Pretrain/Loss (Raw)": 2.135221004486084, "Pretrain/Step": 5708, "Pretrain/Step Time": 8.544985080137849} +{"Pretrain/Learning Rate": 1.8311791536769483e-05, "Pretrain/Loss": 2.0588784217834473, "Pretrain/Loss (Raw)": 2.1028435230255127, "Pretrain/Step": 5709, "Pretrain/Step Time": 8.549297213554382} +{"Pretrain/Learning Rate": 1.8303611505392205e-05, "Pretrain/Loss": 2.061710834503174, "Pretrain/Loss (Raw)": 2.518494129180908, "Pretrain/Step": 5710, "Pretrain/Step Time": 8.555726751685143} +{"Pretrain/Learning Rate": 1.8295432246274e-05, "Pretrain/Loss": 2.0623741149902344, "Pretrain/Loss (Raw)": 2.1201136112213135, "Pretrain/Step": 5711, "Pretrain/Step Time": 8.548562213778496} +{"Pretrain/Learning Rate": 1.828725376035814e-05, "Pretrain/Loss": 2.0622036457061768, "Pretrain/Loss (Raw)": 2.151811361312866, "Pretrain/Step": 5712, "Pretrain/Step Time": 8.544821508228779} +{"Pretrain/Learning Rate": 1.827907604858782e-05, "Pretrain/Loss": 2.062880039215088, "Pretrain/Loss (Raw)": 1.9892758131027222, "Pretrain/Step": 5713, "Pretrain/Step Time": 8.541417701169848} +{"Pretrain/Learning Rate": 1.8270899111906102e-05, "Pretrain/Loss": 2.060603141784668, "Pretrain/Loss (Raw)": 1.8323596715927124, "Pretrain/Step": 5714, "Pretrain/Step Time": 8.544811578467488} +{"Pretrain/Learning Rate": 1.826272295125602e-05, "Pretrain/Loss": 2.0606908798217773, "Pretrain/Loss (Raw)": 2.0065717697143555, "Pretrain/Step": 5715, "Pretrain/Step Time": 8.540389962494373} +{"Pretrain/Learning Rate": 1.8254547567580472e-05, "Pretrain/Loss": 2.0611772537231445, "Pretrain/Loss (Raw)": 2.2719178199768066, "Pretrain/Step": 5716, "Pretrain/Step Time": 8.548298545181751} +{"Pretrain/Learning Rate": 1.824637296182228e-05, "Pretrain/Loss": 2.0622472763061523, "Pretrain/Loss (Raw)": 2.0671908855438232, "Pretrain/Step": 5717, "Pretrain/Step Time": 8.539233066141605} +{"Pretrain/Learning Rate": 1.8238199134924185e-05, "Pretrain/Loss": 2.0622777938842773, "Pretrain/Loss (Raw)": 2.053349256515503, "Pretrain/Step": 5718, "Pretrain/Step Time": 8.541330510750413} +{"Pretrain/Learning Rate": 1.8230026087828824e-05, "Pretrain/Loss": 2.064053773880005, "Pretrain/Loss (Raw)": 2.285747766494751, "Pretrain/Step": 5719, "Pretrain/Step Time": 8.542201574891806} +{"Pretrain/Learning Rate": 1.8221853821478763e-05, "Pretrain/Loss": 2.0650439262390137, "Pretrain/Loss (Raw)": 1.9902986288070679, "Pretrain/Step": 5720, "Pretrain/Step Time": 8.540886567905545} +{"Pretrain/Learning Rate": 1.821368233681645e-05, "Pretrain/Loss": 2.0640244483947754, "Pretrain/Loss (Raw)": 1.8762134313583374, "Pretrain/Step": 5721, "Pretrain/Step Time": 8.539754746481776} +{"Pretrain/Learning Rate": 1.820551163478428e-05, "Pretrain/Loss": 2.0659096240997314, "Pretrain/Loss (Raw)": 1.9873175621032715, "Pretrain/Step": 5722, "Pretrain/Step Time": 8.542423093691468} +{"Pretrain/Learning Rate": 1.8197341716324516e-05, "Pretrain/Loss": 2.067112684249878, "Pretrain/Loss (Raw)": 2.0551695823669434, "Pretrain/Step": 5723, "Pretrain/Step Time": 8.544408928602934} +{"Pretrain/Learning Rate": 1.8189172582379365e-05, "Pretrain/Loss": 2.067617177963257, "Pretrain/Loss (Raw)": 2.117530345916748, "Pretrain/Step": 5724, "Pretrain/Step Time": 8.546465842053294} +{"Pretrain/Learning Rate": 1.818100423389092e-05, "Pretrain/Loss": 2.065849542617798, "Pretrain/Loss (Raw)": 1.7898492813110352, "Pretrain/Step": 5725, "Pretrain/Step Time": 8.547965018078685} +{"Pretrain/Learning Rate": 1.817283667180121e-05, "Pretrain/Loss": 2.0656607151031494, "Pretrain/Loss (Raw)": 2.1088335514068604, "Pretrain/Step": 5726, "Pretrain/Step Time": 8.547880174592137} +{"Pretrain/Learning Rate": 1.8164669897052134e-05, "Pretrain/Loss": 2.0679702758789062, "Pretrain/Loss (Raw)": 2.2473931312561035, "Pretrain/Step": 5727, "Pretrain/Step Time": 8.54563220590353} +{"Pretrain/Learning Rate": 1.8156503910585544e-05, "Pretrain/Loss": 2.0677525997161865, "Pretrain/Loss (Raw)": 2.1970200538635254, "Pretrain/Step": 5728, "Pretrain/Step Time": 8.553859066218138} +{"Pretrain/Learning Rate": 1.814833871334316e-05, "Pretrain/Loss": 2.0669775009155273, "Pretrain/Loss (Raw)": 2.0584850311279297, "Pretrain/Step": 5729, "Pretrain/Step Time": 8.545344926416874} +{"Pretrain/Learning Rate": 1.8140174306266655e-05, "Pretrain/Loss": 2.0658373832702637, "Pretrain/Loss (Raw)": 2.0065014362335205, "Pretrain/Step": 5730, "Pretrain/Step Time": 8.545169088989496} +{"Pretrain/Learning Rate": 1.8132010690297557e-05, "Pretrain/Loss": 2.0661532878875732, "Pretrain/Loss (Raw)": 2.101964235305786, "Pretrain/Step": 5731, "Pretrain/Step Time": 8.544661991298199} +{"Pretrain/Learning Rate": 1.8123847866377367e-05, "Pretrain/Loss": 2.067741632461548, "Pretrain/Loss (Raw)": 2.2386696338653564, "Pretrain/Step": 5732, "Pretrain/Step Time": 8.544246627017856} +{"Pretrain/Learning Rate": 1.8115685835447423e-05, "Pretrain/Loss": 2.0689949989318848, "Pretrain/Loss (Raw)": 1.978489875793457, "Pretrain/Step": 5733, "Pretrain/Step Time": 8.543948374688625} +{"Pretrain/Learning Rate": 1.810752459844905e-05, "Pretrain/Loss": 2.069035291671753, "Pretrain/Loss (Raw)": 2.0968568325042725, "Pretrain/Step": 5734, "Pretrain/Step Time": 8.55657821148634} +{"Pretrain/Learning Rate": 1.8099364156323396e-05, "Pretrain/Loss": 2.0701725482940674, "Pretrain/Loss (Raw)": 2.288710117340088, "Pretrain/Step": 5735, "Pretrain/Step Time": 8.547135598957539} +{"Pretrain/Learning Rate": 1.8091204510011607e-05, "Pretrain/Loss": 2.069871187210083, "Pretrain/Loss (Raw)": 1.9859589338302612, "Pretrain/Step": 5736, "Pretrain/Step Time": 8.551979878917336} +{"Pretrain/Learning Rate": 1.8083045660454655e-05, "Pretrain/Loss": 2.069708824157715, "Pretrain/Loss (Raw)": 2.159029483795166, "Pretrain/Step": 5737, "Pretrain/Step Time": 8.548794345930219} +{"Pretrain/Learning Rate": 1.8074887608593477e-05, "Pretrain/Loss": 2.0677103996276855, "Pretrain/Loss (Raw)": 1.9822748899459839, "Pretrain/Step": 5738, "Pretrain/Step Time": 8.545200623571873} +{"Pretrain/Learning Rate": 1.8066730355368888e-05, "Pretrain/Loss": 2.0703399181365967, "Pretrain/Loss (Raw)": 2.344616174697876, "Pretrain/Step": 5739, "Pretrain/Step Time": 8.547497330233455} +{"Pretrain/Learning Rate": 1.805857390172163e-05, "Pretrain/Loss": 2.0689187049865723, "Pretrain/Loss (Raw)": 1.8345123529434204, "Pretrain/Step": 5740, "Pretrain/Step Time": 8.550579456612468} +{"Pretrain/Learning Rate": 1.8050418248592334e-05, "Pretrain/Loss": 2.0711007118225098, "Pretrain/Loss (Raw)": 2.2420382499694824, "Pretrain/Step": 5741, "Pretrain/Step Time": 8.543841984122992} +{"Pretrain/Learning Rate": 1.8042263396921554e-05, "Pretrain/Loss": 2.07072114944458, "Pretrain/Loss (Raw)": 1.9322998523712158, "Pretrain/Step": 5742, "Pretrain/Step Time": 8.54898950830102} +{"Pretrain/Learning Rate": 1.803410934764974e-05, "Pretrain/Loss": 2.0695929527282715, "Pretrain/Loss (Raw)": 2.0444202423095703, "Pretrain/Step": 5743, "Pretrain/Step Time": 8.550381124019623} +{"Pretrain/Learning Rate": 1.8025956101717272e-05, "Pretrain/Loss": 2.0677952766418457, "Pretrain/Loss (Raw)": 1.9911165237426758, "Pretrain/Step": 5744, "Pretrain/Step Time": 8.552948825061321} +{"Pretrain/Learning Rate": 1.80178036600644e-05, "Pretrain/Loss": 2.066347599029541, "Pretrain/Loss (Raw)": 1.829575538635254, "Pretrain/Step": 5745, "Pretrain/Step Time": 8.54748197644949} +{"Pretrain/Learning Rate": 1.8009652023631318e-05, "Pretrain/Loss": 2.063145399093628, "Pretrain/Loss (Raw)": 1.7764232158660889, "Pretrain/Step": 5746, "Pretrain/Step Time": 8.552453976124525} +{"Pretrain/Learning Rate": 1.8001501193358096e-05, "Pretrain/Loss": 2.0629677772521973, "Pretrain/Loss (Raw)": 2.0733892917633057, "Pretrain/Step": 5747, "Pretrain/Step Time": 8.541551377624273} +{"Pretrain/Learning Rate": 1.799335117018474e-05, "Pretrain/Loss": 2.0596837997436523, "Pretrain/Loss (Raw)": 1.932908296585083, "Pretrain/Step": 5748, "Pretrain/Step Time": 8.548285830765963} +{"Pretrain/Learning Rate": 1.798520195505114e-05, "Pretrain/Loss": 2.0579891204833984, "Pretrain/Loss (Raw)": 1.8674123287200928, "Pretrain/Step": 5749, "Pretrain/Step Time": 8.547447722405195} +{"Pretrain/Learning Rate": 1.7977053548897112e-05, "Pretrain/Loss": 2.0573978424072266, "Pretrain/Loss (Raw)": 2.012906789779663, "Pretrain/Step": 5750, "Pretrain/Step Time": 8.548997482284904} +{"Pretrain/Learning Rate": 1.7968905952662354e-05, "Pretrain/Loss": 2.0586507320404053, "Pretrain/Loss (Raw)": 1.995959997177124, "Pretrain/Step": 5751, "Pretrain/Step Time": 8.54600234515965} +{"Pretrain/Learning Rate": 1.79607591672865e-05, "Pretrain/Loss": 2.060070514678955, "Pretrain/Loss (Raw)": 2.089027166366577, "Pretrain/Step": 5752, "Pretrain/Step Time": 8.55126591771841} +{"Pretrain/Learning Rate": 1.7952613193709063e-05, "Pretrain/Loss": 2.0609846115112305, "Pretrain/Loss (Raw)": 2.0614876747131348, "Pretrain/Step": 5753, "Pretrain/Step Time": 8.548197768628597} +{"Pretrain/Learning Rate": 1.7944468032869486e-05, "Pretrain/Loss": 2.0605015754699707, "Pretrain/Loss (Raw)": 2.1385114192962646, "Pretrain/Step": 5754, "Pretrain/Step Time": 8.550771495327353} +{"Pretrain/Learning Rate": 1.7936323685707095e-05, "Pretrain/Loss": 2.0588536262512207, "Pretrain/Loss (Raw)": 2.0314888954162598, "Pretrain/Step": 5755, "Pretrain/Step Time": 8.548767231404781} +{"Pretrain/Learning Rate": 1.7928180153161146e-05, "Pretrain/Loss": 2.061244010925293, "Pretrain/Loss (Raw)": 2.381392002105713, "Pretrain/Step": 5756, "Pretrain/Step Time": 8.549917405471206} +{"Pretrain/Learning Rate": 1.792003743617079e-05, "Pretrain/Loss": 2.0606250762939453, "Pretrain/Loss (Raw)": 1.9707064628601074, "Pretrain/Step": 5757, "Pretrain/Step Time": 8.549942353740335} +{"Pretrain/Learning Rate": 1.7911895535675067e-05, "Pretrain/Loss": 2.0623714923858643, "Pretrain/Loss (Raw)": 1.9959053993225098, "Pretrain/Step": 5758, "Pretrain/Step Time": 8.561504308134317} +{"Pretrain/Learning Rate": 1.7903754452612964e-05, "Pretrain/Loss": 2.0626094341278076, "Pretrain/Loss (Raw)": 2.00256085395813, "Pretrain/Step": 5759, "Pretrain/Step Time": 8.55084840208292} +{"Pretrain/Learning Rate": 1.7895614187923326e-05, "Pretrain/Loss": 2.0626392364501953, "Pretrain/Loss (Raw)": 2.12692928314209, "Pretrain/Step": 5760, "Pretrain/Step Time": 8.558268813416362} +{"Pretrain/Learning Rate": 1.7887474742544945e-05, "Pretrain/Loss": 2.0633344650268555, "Pretrain/Loss (Raw)": 2.1484780311584473, "Pretrain/Step": 5761, "Pretrain/Step Time": 8.555347504094243} +{"Pretrain/Learning Rate": 1.7879336117416485e-05, "Pretrain/Loss": 2.0654871463775635, "Pretrain/Loss (Raw)": 2.1586599349975586, "Pretrain/Step": 5762, "Pretrain/Step Time": 8.550869334489107} +{"Pretrain/Learning Rate": 1.7871198313476544e-05, "Pretrain/Loss": 2.0672547817230225, "Pretrain/Loss (Raw)": 2.1295711994171143, "Pretrain/Step": 5763, "Pretrain/Step Time": 8.549563188105822} +{"Pretrain/Learning Rate": 1.78630613316636e-05, "Pretrain/Loss": 2.0673987865448, "Pretrain/Loss (Raw)": 2.1855998039245605, "Pretrain/Step": 5764, "Pretrain/Step Time": 8.554936237633228} +{"Pretrain/Learning Rate": 1.785492517291606e-05, "Pretrain/Loss": 2.0694894790649414, "Pretrain/Loss (Raw)": 2.155545949935913, "Pretrain/Step": 5765, "Pretrain/Step Time": 8.548538906499743} +{"Pretrain/Learning Rate": 1.784678983817221e-05, "Pretrain/Loss": 2.0673625469207764, "Pretrain/Loss (Raw)": 1.980901837348938, "Pretrain/Step": 5766, "Pretrain/Step Time": 8.554721927270293} +{"Pretrain/Learning Rate": 1.783865532837027e-05, "Pretrain/Loss": 2.0695714950561523, "Pretrain/Loss (Raw)": 2.202711343765259, "Pretrain/Step": 5767, "Pretrain/Step Time": 8.55418075621128} +{"Pretrain/Learning Rate": 1.7830521644448334e-05, "Pretrain/Loss": 2.066230535507202, "Pretrain/Loss (Raw)": 1.788992166519165, "Pretrain/Step": 5768, "Pretrain/Step Time": 8.553204042837024} +{"Pretrain/Learning Rate": 1.7822388787344434e-05, "Pretrain/Loss": 2.0659546852111816, "Pretrain/Loss (Raw)": 1.9857844114303589, "Pretrain/Step": 5769, "Pretrain/Step Time": 8.550475282594562} +{"Pretrain/Learning Rate": 1.781425675799648e-05, "Pretrain/Loss": 2.065241813659668, "Pretrain/Loss (Raw)": 2.0646111965179443, "Pretrain/Step": 5770, "Pretrain/Step Time": 8.554994221776724} +{"Pretrain/Learning Rate": 1.7806125557342303e-05, "Pretrain/Loss": 2.062972068786621, "Pretrain/Loss (Raw)": 2.1509218215942383, "Pretrain/Step": 5771, "Pretrain/Step Time": 8.554061630740762} +{"Pretrain/Learning Rate": 1.7797995186319606e-05, "Pretrain/Loss": 2.062319755554199, "Pretrain/Loss (Raw)": 2.133225917816162, "Pretrain/Step": 5772, "Pretrain/Step Time": 8.552788853645325} +{"Pretrain/Learning Rate": 1.778986564586606e-05, "Pretrain/Loss": 2.064206123352051, "Pretrain/Loss (Raw)": 2.409156560897827, "Pretrain/Step": 5773, "Pretrain/Step Time": 8.548020351678133} +{"Pretrain/Learning Rate": 1.778173693691917e-05, "Pretrain/Loss": 2.0669751167297363, "Pretrain/Loss (Raw)": 2.4012725353240967, "Pretrain/Step": 5774, "Pretrain/Step Time": 8.552345596253872} +{"Pretrain/Learning Rate": 1.77736090604164e-05, "Pretrain/Loss": 2.06721830368042, "Pretrain/Loss (Raw)": 2.0464820861816406, "Pretrain/Step": 5775, "Pretrain/Step Time": 8.551784319803119} +{"Pretrain/Learning Rate": 1.7765482017295077e-05, "Pretrain/Loss": 2.069014549255371, "Pretrain/Loss (Raw)": 2.1661343574523926, "Pretrain/Step": 5776, "Pretrain/Step Time": 8.558832427486777} +{"Pretrain/Learning Rate": 1.7757355808492468e-05, "Pretrain/Loss": 2.0674564838409424, "Pretrain/Loss (Raw)": 1.9225513935089111, "Pretrain/Step": 5777, "Pretrain/Step Time": 8.553765878081322} +{"Pretrain/Learning Rate": 1.77492304349457e-05, "Pretrain/Loss": 2.066560745239258, "Pretrain/Loss (Raw)": 2.0361437797546387, "Pretrain/Step": 5778, "Pretrain/Step Time": 8.552438294515014} +{"Pretrain/Learning Rate": 1.7741105897591865e-05, "Pretrain/Loss": 2.068179130554199, "Pretrain/Loss (Raw)": 2.0196220874786377, "Pretrain/Step": 5779, "Pretrain/Step Time": 8.556936329230666} +{"Pretrain/Learning Rate": 1.7732982197367888e-05, "Pretrain/Loss": 2.065046787261963, "Pretrain/Loss (Raw)": 1.8177956342697144, "Pretrain/Step": 5780, "Pretrain/Step Time": 8.556344635784626} +{"Pretrain/Learning Rate": 1.7724859335210654e-05, "Pretrain/Loss": 2.066612720489502, "Pretrain/Loss (Raw)": 2.1469886302948, "Pretrain/Step": 5781, "Pretrain/Step Time": 8.560318501666188} +{"Pretrain/Learning Rate": 1.771673731205692e-05, "Pretrain/Loss": 2.0690388679504395, "Pretrain/Loss (Raw)": 2.075303077697754, "Pretrain/Step": 5782, "Pretrain/Step Time": 8.558738945052028} +{"Pretrain/Learning Rate": 1.770861612884336e-05, "Pretrain/Loss": 2.0709071159362793, "Pretrain/Loss (Raw)": 2.193944215774536, "Pretrain/Step": 5783, "Pretrain/Step Time": 8.551846619695425} +{"Pretrain/Learning Rate": 1.7700495786506545e-05, "Pretrain/Loss": 2.072391986846924, "Pretrain/Loss (Raw)": 2.0332887172698975, "Pretrain/Step": 5784, "Pretrain/Step Time": 8.561606239527464} +{"Pretrain/Learning Rate": 1.7692376285982953e-05, "Pretrain/Loss": 2.073587417602539, "Pretrain/Loss (Raw)": 1.9784342050552368, "Pretrain/Step": 5785, "Pretrain/Step Time": 8.5569997895509} +{"Pretrain/Learning Rate": 1.768425762820896e-05, "Pretrain/Loss": 2.0722198486328125, "Pretrain/Loss (Raw)": 1.987601637840271, "Pretrain/Step": 5786, "Pretrain/Step Time": 8.552783070132136} +{"Pretrain/Learning Rate": 1.7676139814120857e-05, "Pretrain/Loss": 2.072317600250244, "Pretrain/Loss (Raw)": 1.9493434429168701, "Pretrain/Step": 5787, "Pretrain/Step Time": 8.554185468703508} +{"Pretrain/Learning Rate": 1.7668022844654812e-05, "Pretrain/Loss": 2.071774482727051, "Pretrain/Loss (Raw)": 2.0317423343658447, "Pretrain/Step": 5788, "Pretrain/Step Time": 8.56159633025527} +{"Pretrain/Learning Rate": 1.765990672074693e-05, "Pretrain/Loss": 2.071159839630127, "Pretrain/Loss (Raw)": 1.8234009742736816, "Pretrain/Step": 5789, "Pretrain/Step Time": 8.551565360277891} +{"Pretrain/Learning Rate": 1.7651791443333187e-05, "Pretrain/Loss": 2.068136215209961, "Pretrain/Loss (Raw)": 1.913646936416626, "Pretrain/Step": 5790, "Pretrain/Step Time": 8.555440574884415} +{"Pretrain/Learning Rate": 1.764367701334949e-05, "Pretrain/Loss": 2.0682454109191895, "Pretrain/Loss (Raw)": 2.0351243019104004, "Pretrain/Step": 5791, "Pretrain/Step Time": 8.549318784847856} +{"Pretrain/Learning Rate": 1.7635563431731612e-05, "Pretrain/Loss": 2.0685224533081055, "Pretrain/Loss (Raw)": 2.1738526821136475, "Pretrain/Step": 5792, "Pretrain/Step Time": 8.554127022624016} +{"Pretrain/Learning Rate": 1.762745069941527e-05, "Pretrain/Loss": 2.06897234916687, "Pretrain/Loss (Raw)": 2.028613328933716, "Pretrain/Step": 5793, "Pretrain/Step Time": 8.551936984062195} +{"Pretrain/Learning Rate": 1.7619338817336046e-05, "Pretrain/Loss": 2.067859649658203, "Pretrain/Loss (Raw)": 2.0905234813690186, "Pretrain/Step": 5794, "Pretrain/Step Time": 8.551897138357162} +{"Pretrain/Learning Rate": 1.7611227786429457e-05, "Pretrain/Loss": 2.0697765350341797, "Pretrain/Loss (Raw)": 2.202348470687866, "Pretrain/Step": 5795, "Pretrain/Step Time": 8.54548897780478} +{"Pretrain/Learning Rate": 1.7603117607630893e-05, "Pretrain/Loss": 2.0681867599487305, "Pretrain/Loss (Raw)": 1.8807382583618164, "Pretrain/Step": 5796, "Pretrain/Step Time": 8.547430031001568} +{"Pretrain/Learning Rate": 1.7595008281875657e-05, "Pretrain/Loss": 2.068575382232666, "Pretrain/Loss (Raw)": 2.05068039894104, "Pretrain/Step": 5797, "Pretrain/Step Time": 8.546445781365037} +{"Pretrain/Learning Rate": 1.7586899810098967e-05, "Pretrain/Loss": 2.0697338581085205, "Pretrain/Loss (Raw)": 2.274853229522705, "Pretrain/Step": 5798, "Pretrain/Step Time": 8.54810544103384} +{"Pretrain/Learning Rate": 1.757879219323592e-05, "Pretrain/Loss": 2.0678696632385254, "Pretrain/Loss (Raw)": 1.8287312984466553, "Pretrain/Step": 5799, "Pretrain/Step Time": 8.551508665084839} +{"Pretrain/Learning Rate": 1.757068543222153e-05, "Pretrain/Loss": 2.06779146194458, "Pretrain/Loss (Raw)": 2.130835771560669, "Pretrain/Step": 5800, "Pretrain/Step Time": 8.550584308803082} +{"Pretrain/Learning Rate": 1.7562579527990696e-05, "Pretrain/Loss": 2.0676259994506836, "Pretrain/Loss (Raw)": 2.0014123916625977, "Pretrain/Step": 5801, "Pretrain/Step Time": 8.546384846791625} +{"Pretrain/Learning Rate": 1.7554474481478245e-05, "Pretrain/Loss": 2.0659050941467285, "Pretrain/Loss (Raw)": 1.7207598686218262, "Pretrain/Step": 5802, "Pretrain/Step Time": 8.551945650950074} +{"Pretrain/Learning Rate": 1.7546370293618875e-05, "Pretrain/Loss": 2.0661771297454834, "Pretrain/Loss (Raw)": 2.002523899078369, "Pretrain/Step": 5803, "Pretrain/Step Time": 8.54407169483602} +{"Pretrain/Learning Rate": 1.7538266965347212e-05, "Pretrain/Loss": 2.0664658546447754, "Pretrain/Loss (Raw)": 2.116196393966675, "Pretrain/Step": 5804, "Pretrain/Step Time": 8.543625492602587} +{"Pretrain/Learning Rate": 1.7530164497597757e-05, "Pretrain/Loss": 2.067568302154541, "Pretrain/Loss (Raw)": 2.068014144897461, "Pretrain/Step": 5805, "Pretrain/Step Time": 8.541012117639184} +{"Pretrain/Learning Rate": 1.7522062891304936e-05, "Pretrain/Loss": 2.0693821907043457, "Pretrain/Loss (Raw)": 2.0767767429351807, "Pretrain/Step": 5806, "Pretrain/Step Time": 8.549008512869477} +{"Pretrain/Learning Rate": 1.7513962147403057e-05, "Pretrain/Loss": 2.0709385871887207, "Pretrain/Loss (Raw)": 2.1726016998291016, "Pretrain/Step": 5807, "Pretrain/Step Time": 8.541886642575264} +{"Pretrain/Learning Rate": 1.750586226682634e-05, "Pretrain/Loss": 2.0695641040802, "Pretrain/Loss (Raw)": 2.105746030807495, "Pretrain/Step": 5808, "Pretrain/Step Time": 8.548172373324633} +{"Pretrain/Learning Rate": 1.74977632505089e-05, "Pretrain/Loss": 2.0701045989990234, "Pretrain/Loss (Raw)": 2.0155866146087646, "Pretrain/Step": 5809, "Pretrain/Step Time": 8.542004583403468} +{"Pretrain/Learning Rate": 1.7489665099384755e-05, "Pretrain/Loss": 2.068474531173706, "Pretrain/Loss (Raw)": 1.7636977434158325, "Pretrain/Step": 5810, "Pretrain/Step Time": 8.543780004605651} +{"Pretrain/Learning Rate": 1.7481567814387815e-05, "Pretrain/Loss": 2.0652194023132324, "Pretrain/Loss (Raw)": 1.8951411247253418, "Pretrain/Step": 5811, "Pretrain/Step Time": 8.540193082764745} +{"Pretrain/Learning Rate": 1.7473471396451913e-05, "Pretrain/Loss": 2.0623793601989746, "Pretrain/Loss (Raw)": 1.9734100103378296, "Pretrain/Step": 5812, "Pretrain/Step Time": 8.547788893803954} +{"Pretrain/Learning Rate": 1.746537584651074e-05, "Pretrain/Loss": 2.062497138977051, "Pretrain/Loss (Raw)": 2.142277479171753, "Pretrain/Step": 5813, "Pretrain/Step Time": 8.543967453762889} +{"Pretrain/Learning Rate": 1.7457281165497947e-05, "Pretrain/Loss": 2.062286615371704, "Pretrain/Loss (Raw)": 2.072064161300659, "Pretrain/Step": 5814, "Pretrain/Step Time": 8.551482923328876} +{"Pretrain/Learning Rate": 1.7449187354347014e-05, "Pretrain/Loss": 2.063375949859619, "Pretrain/Loss (Raw)": 1.998556137084961, "Pretrain/Step": 5815, "Pretrain/Step Time": 8.5465984698385} +{"Pretrain/Learning Rate": 1.7441094413991393e-05, "Pretrain/Loss": 2.0618348121643066, "Pretrain/Loss (Raw)": 2.080745220184326, "Pretrain/Step": 5816, "Pretrain/Step Time": 8.54518730379641} +{"Pretrain/Learning Rate": 1.7433002345364368e-05, "Pretrain/Loss": 2.0609312057495117, "Pretrain/Loss (Raw)": 1.899915099143982, "Pretrain/Step": 5817, "Pretrain/Step Time": 8.54718872345984} +{"Pretrain/Learning Rate": 1.7424911149399183e-05, "Pretrain/Loss": 2.0627386569976807, "Pretrain/Loss (Raw)": 2.117365598678589, "Pretrain/Step": 5818, "Pretrain/Step Time": 8.549124965444207} +{"Pretrain/Learning Rate": 1.7416820827028926e-05, "Pretrain/Loss": 2.0633492469787598, "Pretrain/Loss (Raw)": 2.061967611312866, "Pretrain/Step": 5819, "Pretrain/Step Time": 8.55187363177538} +{"Pretrain/Learning Rate": 1.7408731379186638e-05, "Pretrain/Loss": 2.062194585800171, "Pretrain/Loss (Raw)": 2.096965789794922, "Pretrain/Step": 5820, "Pretrain/Step Time": 8.545796018093824} +{"Pretrain/Learning Rate": 1.740064280680521e-05, "Pretrain/Loss": 2.0609209537506104, "Pretrain/Loss (Raw)": 2.048644781112671, "Pretrain/Step": 5821, "Pretrain/Step Time": 8.552459072321653} +{"Pretrain/Learning Rate": 1.7392555110817467e-05, "Pretrain/Loss": 2.061145305633545, "Pretrain/Loss (Raw)": 1.9815014600753784, "Pretrain/Step": 5822, "Pretrain/Step Time": 8.552243169397116} +{"Pretrain/Learning Rate": 1.738446829215611e-05, "Pretrain/Loss": 2.060884475708008, "Pretrain/Loss (Raw)": 2.1604855060577393, "Pretrain/Step": 5823, "Pretrain/Step Time": 8.552870888262987} +{"Pretrain/Learning Rate": 1.737638235175376e-05, "Pretrain/Loss": 2.0620079040527344, "Pretrain/Loss (Raw)": 2.22603702545166, "Pretrain/Step": 5824, "Pretrain/Step Time": 8.548550345003605} +{"Pretrain/Learning Rate": 1.736829729054292e-05, "Pretrain/Loss": 2.060070753097534, "Pretrain/Loss (Raw)": 1.9618825912475586, "Pretrain/Step": 5825, "Pretrain/Step Time": 8.553086843341589} +{"Pretrain/Learning Rate": 1.7360213109456e-05, "Pretrain/Loss": 2.0603156089782715, "Pretrain/Loss (Raw)": 2.1132049560546875, "Pretrain/Step": 5826, "Pretrain/Step Time": 8.551338823512197} +{"Pretrain/Learning Rate": 1.73521298094253e-05, "Pretrain/Loss": 2.0600175857543945, "Pretrain/Loss (Raw)": 2.153571128845215, "Pretrain/Step": 5827, "Pretrain/Step Time": 8.548529678955674} +{"Pretrain/Learning Rate": 1.734404739138303e-05, "Pretrain/Loss": 2.0591650009155273, "Pretrain/Loss (Raw)": 2.0764994621276855, "Pretrain/Step": 5828, "Pretrain/Step Time": 8.550973104313016} +{"Pretrain/Learning Rate": 1.733596585626129e-05, "Pretrain/Loss": 2.0609912872314453, "Pretrain/Loss (Raw)": 2.1438417434692383, "Pretrain/Step": 5829, "Pretrain/Step Time": 8.55342360585928} +{"Pretrain/Learning Rate": 1.7327885204992083e-05, "Pretrain/Loss": 2.0611376762390137, "Pretrain/Loss (Raw)": 2.0120105743408203, "Pretrain/Step": 5830, "Pretrain/Step Time": 8.550694186240435} +{"Pretrain/Learning Rate": 1.7319805438507303e-05, "Pretrain/Loss": 2.0628623962402344, "Pretrain/Loss (Raw)": 2.299462080001831, "Pretrain/Step": 5831, "Pretrain/Step Time": 8.562328409403563} +{"Pretrain/Learning Rate": 1.7311726557738754e-05, "Pretrain/Loss": 2.062551498413086, "Pretrain/Loss (Raw)": 2.0534796714782715, "Pretrain/Step": 5832, "Pretrain/Step Time": 8.557927273213863} +{"Pretrain/Learning Rate": 1.7303648563618125e-05, "Pretrain/Loss": 2.063182830810547, "Pretrain/Loss (Raw)": 2.1642305850982666, "Pretrain/Step": 5833, "Pretrain/Step Time": 8.559947419911623} +{"Pretrain/Learning Rate": 1.7295571457077015e-05, "Pretrain/Loss": 2.063469171524048, "Pretrain/Loss (Raw)": 2.107083559036255, "Pretrain/Step": 5834, "Pretrain/Step Time": 8.554407579824328} +{"Pretrain/Learning Rate": 1.72874952390469e-05, "Pretrain/Loss": 2.0646438598632812, "Pretrain/Loss (Raw)": 2.1795620918273926, "Pretrain/Step": 5835, "Pretrain/Step Time": 8.556685037910938} +{"Pretrain/Learning Rate": 1.7279419910459182e-05, "Pretrain/Loss": 2.0626463890075684, "Pretrain/Loss (Raw)": 1.8795260190963745, "Pretrain/Step": 5836, "Pretrain/Step Time": 8.552520629018545} +{"Pretrain/Learning Rate": 1.727134547224514e-05, "Pretrain/Loss": 2.0606465339660645, "Pretrain/Loss (Raw)": 1.846848964691162, "Pretrain/Step": 5837, "Pretrain/Step Time": 8.552490727975965} +{"Pretrain/Learning Rate": 1.726327192533595e-05, "Pretrain/Loss": 2.0562429428100586, "Pretrain/Loss (Raw)": 1.9548664093017578, "Pretrain/Step": 5838, "Pretrain/Step Time": 8.54651140794158} +{"Pretrain/Learning Rate": 1.7255199270662708e-05, "Pretrain/Loss": 2.0550806522369385, "Pretrain/Loss (Raw)": 1.9713276624679565, "Pretrain/Step": 5839, "Pretrain/Step Time": 8.554278004914522} +{"Pretrain/Learning Rate": 1.7247127509156377e-05, "Pretrain/Loss": 2.0551109313964844, "Pretrain/Loss (Raw)": 2.1556649208068848, "Pretrain/Step": 5840, "Pretrain/Step Time": 8.556132152676582} +{"Pretrain/Learning Rate": 1.7239056641747836e-05, "Pretrain/Loss": 2.0542120933532715, "Pretrain/Loss (Raw)": 1.8742560148239136, "Pretrain/Step": 5841, "Pretrain/Step Time": 8.557092368602753} +{"Pretrain/Learning Rate": 1.723098666936785e-05, "Pretrain/Loss": 2.056915044784546, "Pretrain/Loss (Raw)": 2.178321599960327, "Pretrain/Step": 5842, "Pretrain/Step Time": 8.553387269377708} +{"Pretrain/Learning Rate": 1.7222917592947096e-05, "Pretrain/Loss": 2.0562338829040527, "Pretrain/Loss (Raw)": 1.9193874597549438, "Pretrain/Step": 5843, "Pretrain/Step Time": 8.561671908944845} +{"Pretrain/Learning Rate": 1.7214849413416128e-05, "Pretrain/Loss": 2.0549988746643066, "Pretrain/Loss (Raw)": 2.1138434410095215, "Pretrain/Step": 5844, "Pretrain/Step Time": 8.551998741924763} +{"Pretrain/Learning Rate": 1.7206782131705414e-05, "Pretrain/Loss": 2.0546154975891113, "Pretrain/Loss (Raw)": 2.0181307792663574, "Pretrain/Step": 5845, "Pretrain/Step Time": 8.553794477134943} +{"Pretrain/Learning Rate": 1.7198715748745304e-05, "Pretrain/Loss": 2.0541539192199707, "Pretrain/Loss (Raw)": 1.9942445755004883, "Pretrain/Step": 5846, "Pretrain/Step Time": 8.553739489987493} +{"Pretrain/Learning Rate": 1.7190650265466056e-05, "Pretrain/Loss": 2.0511863231658936, "Pretrain/Loss (Raw)": 1.905905842781067, "Pretrain/Step": 5847, "Pretrain/Step Time": 8.55501814931631} +{"Pretrain/Learning Rate": 1.7182585682797815e-05, "Pretrain/Loss": 2.049814462661743, "Pretrain/Loss (Raw)": 1.8146860599517822, "Pretrain/Step": 5848, "Pretrain/Step Time": 8.55730214342475} +{"Pretrain/Learning Rate": 1.7174522001670633e-05, "Pretrain/Loss": 2.0528950691223145, "Pretrain/Loss (Raw)": 2.2705252170562744, "Pretrain/Step": 5849, "Pretrain/Step Time": 8.563745828345418} +{"Pretrain/Learning Rate": 1.7166459223014448e-05, "Pretrain/Loss": 2.0537078380584717, "Pretrain/Loss (Raw)": 2.091374397277832, "Pretrain/Step": 5850, "Pretrain/Step Time": 8.55737211368978} +{"Pretrain/Learning Rate": 1.71583973477591e-05, "Pretrain/Loss": 2.0548810958862305, "Pretrain/Loss (Raw)": 2.2053587436676025, "Pretrain/Step": 5851, "Pretrain/Step Time": 8.554689003154635} +{"Pretrain/Learning Rate": 1.7150336376834315e-05, "Pretrain/Loss": 2.0552897453308105, "Pretrain/Loss (Raw)": 2.169818639755249, "Pretrain/Step": 5852, "Pretrain/Step Time": 8.549433875828981} +{"Pretrain/Learning Rate": 1.714227631116974e-05, "Pretrain/Loss": 2.0581045150756836, "Pretrain/Loss (Raw)": 2.1501624584198, "Pretrain/Step": 5853, "Pretrain/Step Time": 8.555983604863286} +{"Pretrain/Learning Rate": 1.7134217151694872e-05, "Pretrain/Loss": 2.056466579437256, "Pretrain/Loss (Raw)": 1.8991707563400269, "Pretrain/Step": 5854, "Pretrain/Step Time": 8.557233536615968} +{"Pretrain/Learning Rate": 1.7126158899339164e-05, "Pretrain/Loss": 2.051820993423462, "Pretrain/Loss (Raw)": 1.6527395248413086, "Pretrain/Step": 5855, "Pretrain/Step Time": 8.55868355371058} +{"Pretrain/Learning Rate": 1.7118101555031895e-05, "Pretrain/Loss": 2.0512194633483887, "Pretrain/Loss (Raw)": 2.120018243789673, "Pretrain/Step": 5856, "Pretrain/Step Time": 8.558951709419489} +{"Pretrain/Learning Rate": 1.7110045119702314e-05, "Pretrain/Loss": 2.0512804985046387, "Pretrain/Loss (Raw)": 2.066307783126831, "Pretrain/Step": 5857, "Pretrain/Step Time": 8.554464993998408} +{"Pretrain/Learning Rate": 1.7101989594279495e-05, "Pretrain/Loss": 2.052726984024048, "Pretrain/Loss (Raw)": 2.1916394233703613, "Pretrain/Step": 5858, "Pretrain/Step Time": 8.55588778667152} +{"Pretrain/Learning Rate": 1.7093934979692465e-05, "Pretrain/Loss": 2.0533065795898438, "Pretrain/Loss (Raw)": 2.1761693954467773, "Pretrain/Step": 5859, "Pretrain/Step Time": 8.559264734387398} +{"Pretrain/Learning Rate": 1.7085881276870093e-05, "Pretrain/Loss": 2.0550625324249268, "Pretrain/Loss (Raw)": 2.4634311199188232, "Pretrain/Step": 5860, "Pretrain/Step Time": 8.559079004451632} +{"Pretrain/Learning Rate": 1.70778284867412e-05, "Pretrain/Loss": 2.0550448894500732, "Pretrain/Loss (Raw)": 1.9762349128723145, "Pretrain/Step": 5861, "Pretrain/Step Time": 8.561523795127869} +{"Pretrain/Learning Rate": 1.706977661023444e-05, "Pretrain/Loss": 2.0550341606140137, "Pretrain/Loss (Raw)": 2.0954482555389404, "Pretrain/Step": 5862, "Pretrain/Step Time": 8.555826453492045} +{"Pretrain/Learning Rate": 1.7061725648278423e-05, "Pretrain/Loss": 2.0535030364990234, "Pretrain/Loss (Raw)": 2.092752456665039, "Pretrain/Step": 5863, "Pretrain/Step Time": 8.559342417865992} +{"Pretrain/Learning Rate": 1.7053675601801606e-05, "Pretrain/Loss": 2.054063320159912, "Pretrain/Loss (Raw)": 2.0576844215393066, "Pretrain/Step": 5864, "Pretrain/Step Time": 8.555475950241089} +{"Pretrain/Learning Rate": 1.7045626471732363e-05, "Pretrain/Loss": 2.0533342361450195, "Pretrain/Loss (Raw)": 2.0657131671905518, "Pretrain/Step": 5865, "Pretrain/Step Time": 8.555339820683002} +{"Pretrain/Learning Rate": 1.7037578258998956e-05, "Pretrain/Loss": 2.0526366233825684, "Pretrain/Loss (Raw)": 1.8929556608200073, "Pretrain/Step": 5866, "Pretrain/Step Time": 8.555472070351243} +{"Pretrain/Learning Rate": 1.702953096452955e-05, "Pretrain/Loss": 2.050201416015625, "Pretrain/Loss (Raw)": 2.032931089401245, "Pretrain/Step": 5867, "Pretrain/Step Time": 8.557761589065194} +{"Pretrain/Learning Rate": 1.702148458925218e-05, "Pretrain/Loss": 2.052929401397705, "Pretrain/Loss (Raw)": 2.1836917400360107, "Pretrain/Step": 5868, "Pretrain/Step Time": 8.548761488869786} +{"Pretrain/Learning Rate": 1.7013439134094815e-05, "Pretrain/Loss": 2.048715114593506, "Pretrain/Loss (Raw)": 1.70261812210083, "Pretrain/Step": 5869, "Pretrain/Step Time": 8.558893194422126} +{"Pretrain/Learning Rate": 1.7005394599985273e-05, "Pretrain/Loss": 2.0484910011291504, "Pretrain/Loss (Raw)": 1.9035948514938354, "Pretrain/Step": 5870, "Pretrain/Step Time": 8.552671264857054} +{"Pretrain/Learning Rate": 1.6997350987851308e-05, "Pretrain/Loss": 2.049039840698242, "Pretrain/Loss (Raw)": 2.1146633625030518, "Pretrain/Step": 5871, "Pretrain/Step Time": 8.5568408370018} +{"Pretrain/Learning Rate": 1.6989308298620526e-05, "Pretrain/Loss": 2.0509116649627686, "Pretrain/Loss (Raw)": 2.230719566345215, "Pretrain/Step": 5872, "Pretrain/Step Time": 8.553264869377017} +{"Pretrain/Learning Rate": 1.6981266533220467e-05, "Pretrain/Loss": 2.052478790283203, "Pretrain/Loss (Raw)": 2.0301756858825684, "Pretrain/Step": 5873, "Pretrain/Step Time": 8.553385440260172} +{"Pretrain/Learning Rate": 1.6973225692578533e-05, "Pretrain/Loss": 2.0547218322753906, "Pretrain/Loss (Raw)": 2.063502550125122, "Pretrain/Step": 5874, "Pretrain/Step Time": 8.55481513403356} +{"Pretrain/Learning Rate": 1.6965185777622037e-05, "Pretrain/Loss": 2.0535500049591064, "Pretrain/Loss (Raw)": 1.9234156608581543, "Pretrain/Step": 5875, "Pretrain/Step Time": 8.555178448557854} +{"Pretrain/Learning Rate": 1.6957146789278175e-05, "Pretrain/Loss": 2.0535128116607666, "Pretrain/Loss (Raw)": 1.9281424283981323, "Pretrain/Step": 5876, "Pretrain/Step Time": 8.547165164723992} +{"Pretrain/Learning Rate": 1.694910872847405e-05, "Pretrain/Loss": 2.055978536605835, "Pretrain/Loss (Raw)": 2.1830296516418457, "Pretrain/Step": 5877, "Pretrain/Step Time": 8.543593751266599} +{"Pretrain/Learning Rate": 1.694107159613664e-05, "Pretrain/Loss": 2.0576930046081543, "Pretrain/Loss (Raw)": 2.232361316680908, "Pretrain/Step": 5878, "Pretrain/Step Time": 8.543996876105666} +{"Pretrain/Learning Rate": 1.6933035393192824e-05, "Pretrain/Loss": 2.057884454727173, "Pretrain/Loss (Raw)": 2.020482063293457, "Pretrain/Step": 5879, "Pretrain/Step Time": 8.552680226042867} +{"Pretrain/Learning Rate": 1.6925000120569385e-05, "Pretrain/Loss": 2.0591654777526855, "Pretrain/Loss (Raw)": 2.2529854774475098, "Pretrain/Step": 5880, "Pretrain/Step Time": 8.545711245387793} +{"Pretrain/Learning Rate": 1.6916965779192983e-05, "Pretrain/Loss": 2.0580852031707764, "Pretrain/Loss (Raw)": 1.9232057332992554, "Pretrain/Step": 5881, "Pretrain/Step Time": 8.54393570125103} +{"Pretrain/Learning Rate": 1.6908932369990176e-05, "Pretrain/Loss": 2.057742118835449, "Pretrain/Loss (Raw)": 2.094604969024658, "Pretrain/Step": 5882, "Pretrain/Step Time": 8.54358945786953} +{"Pretrain/Learning Rate": 1.6900899893887408e-05, "Pretrain/Loss": 2.0576446056365967, "Pretrain/Loss (Raw)": 2.019002914428711, "Pretrain/Step": 5883, "Pretrain/Step Time": 8.549089312553406} +{"Pretrain/Learning Rate": 1.6892868351811036e-05, "Pretrain/Loss": 2.0544700622558594, "Pretrain/Loss (Raw)": 1.9750237464904785, "Pretrain/Step": 5884, "Pretrain/Step Time": 8.5508799161762} +{"Pretrain/Learning Rate": 1.6884837744687284e-05, "Pretrain/Loss": 2.0550942420959473, "Pretrain/Loss (Raw)": 2.050633430480957, "Pretrain/Step": 5885, "Pretrain/Step Time": 8.552128557115793} +{"Pretrain/Learning Rate": 1.687680807344229e-05, "Pretrain/Loss": 2.055832862854004, "Pretrain/Loss (Raw)": 2.0904297828674316, "Pretrain/Step": 5886, "Pretrain/Step Time": 8.541200339794159} +{"Pretrain/Learning Rate": 1.6868779339002056e-05, "Pretrain/Loss": 2.058964967727661, "Pretrain/Loss (Raw)": 2.403484344482422, "Pretrain/Step": 5887, "Pretrain/Step Time": 8.54957072623074} +{"Pretrain/Learning Rate": 1.6860751542292515e-05, "Pretrain/Loss": 2.05790114402771, "Pretrain/Loss (Raw)": 1.9907526969909668, "Pretrain/Step": 5888, "Pretrain/Step Time": 8.541370315477252} +{"Pretrain/Learning Rate": 1.685272468423945e-05, "Pretrain/Loss": 2.0575051307678223, "Pretrain/Loss (Raw)": 2.097804069519043, "Pretrain/Step": 5889, "Pretrain/Step Time": 8.543449716642499} +{"Pretrain/Learning Rate": 1.6844698765768575e-05, "Pretrain/Loss": 2.056394100189209, "Pretrain/Loss (Raw)": 2.016465187072754, "Pretrain/Step": 5890, "Pretrain/Step Time": 8.543391108512878} +{"Pretrain/Learning Rate": 1.6836673787805456e-05, "Pretrain/Loss": 2.0544662475585938, "Pretrain/Loss (Raw)": 1.8827916383743286, "Pretrain/Step": 5891, "Pretrain/Step Time": 8.541394418105483} +{"Pretrain/Learning Rate": 1.6828649751275592e-05, "Pretrain/Loss": 2.0522308349609375, "Pretrain/Loss (Raw)": 1.8994184732437134, "Pretrain/Step": 5892, "Pretrain/Step Time": 8.536760959774256} +{"Pretrain/Learning Rate": 1.682062665710434e-05, "Pretrain/Loss": 2.05178165435791, "Pretrain/Loss (Raw)": 2.0980725288391113, "Pretrain/Step": 5893, "Pretrain/Step Time": 8.539713006466627} +{"Pretrain/Learning Rate": 1.6812604506216966e-05, "Pretrain/Loss": 2.051410675048828, "Pretrain/Loss (Raw)": 1.9334149360656738, "Pretrain/Step": 5894, "Pretrain/Step Time": 8.534066498279572} +{"Pretrain/Learning Rate": 1.6804583299538614e-05, "Pretrain/Loss": 2.050351858139038, "Pretrain/Loss (Raw)": 2.0672175884246826, "Pretrain/Step": 5895, "Pretrain/Step Time": 8.533638225868344} +{"Pretrain/Learning Rate": 1.6796563037994347e-05, "Pretrain/Loss": 2.0511722564697266, "Pretrain/Loss (Raw)": 1.8939927816390991, "Pretrain/Step": 5896, "Pretrain/Step Time": 8.534961979836226} +{"Pretrain/Learning Rate": 1.678854372250907e-05, "Pretrain/Loss": 2.0517115592956543, "Pretrain/Loss (Raw)": 2.054816246032715, "Pretrain/Step": 5897, "Pretrain/Step Time": 8.533253060653806} +{"Pretrain/Learning Rate": 1.6780525354007644e-05, "Pretrain/Loss": 2.053194046020508, "Pretrain/Loss (Raw)": 2.254343271255493, "Pretrain/Step": 5898, "Pretrain/Step Time": 8.541160456836224} +{"Pretrain/Learning Rate": 1.6772507933414744e-05, "Pretrain/Loss": 2.0532851219177246, "Pretrain/Loss (Raw)": 2.1625988483428955, "Pretrain/Step": 5899, "Pretrain/Step Time": 8.531793197616935} +{"Pretrain/Learning Rate": 1.6764491461655017e-05, "Pretrain/Loss": 2.05206298828125, "Pretrain/Loss (Raw)": 1.97678542137146, "Pretrain/Step": 5900, "Pretrain/Step Time": 8.536975618451834} +{"Pretrain/Learning Rate": 1.6756475939652927e-05, "Pretrain/Loss": 2.0485029220581055, "Pretrain/Loss (Raw)": 1.9534778594970703, "Pretrain/Step": 5901, "Pretrain/Step Time": 8.536876946687698} +{"Pretrain/Learning Rate": 1.674846136833289e-05, "Pretrain/Loss": 2.046416997909546, "Pretrain/Loss (Raw)": 2.1342780590057373, "Pretrain/Step": 5902, "Pretrain/Step Time": 8.53305198252201} +{"Pretrain/Learning Rate": 1.6740447748619156e-05, "Pretrain/Loss": 2.045764207839966, "Pretrain/Loss (Raw)": 1.962930679321289, "Pretrain/Step": 5903, "Pretrain/Step Time": 8.531133316457272} +{"Pretrain/Learning Rate": 1.6732435081435924e-05, "Pretrain/Loss": 2.044340133666992, "Pretrain/Loss (Raw)": 1.9838131666183472, "Pretrain/Step": 5904, "Pretrain/Step Time": 8.532650107517838} +{"Pretrain/Learning Rate": 1.6724423367707226e-05, "Pretrain/Loss": 2.044198513031006, "Pretrain/Loss (Raw)": 1.9044479131698608, "Pretrain/Step": 5905, "Pretrain/Step Time": 8.530155193060637} +{"Pretrain/Learning Rate": 1.6716412608357024e-05, "Pretrain/Loss": 2.0436954498291016, "Pretrain/Loss (Raw)": 1.9717661142349243, "Pretrain/Step": 5906, "Pretrain/Step Time": 8.531539686024189} +{"Pretrain/Learning Rate": 1.670840280430915e-05, "Pretrain/Loss": 2.044053077697754, "Pretrain/Loss (Raw)": 2.0653703212738037, "Pretrain/Step": 5907, "Pretrain/Step Time": 8.53087237663567} +{"Pretrain/Learning Rate": 1.6700393956487342e-05, "Pretrain/Loss": 2.046671152114868, "Pretrain/Loss (Raw)": 2.1529133319854736, "Pretrain/Step": 5908, "Pretrain/Step Time": 8.529415650293231} +{"Pretrain/Learning Rate": 1.6692386065815203e-05, "Pretrain/Loss": 2.045888662338257, "Pretrain/Loss (Raw)": 2.046834707260132, "Pretrain/Step": 5909, "Pretrain/Step Time": 8.52187211252749} +{"Pretrain/Learning Rate": 1.668437913321626e-05, "Pretrain/Loss": 2.0460801124572754, "Pretrain/Loss (Raw)": 2.0997939109802246, "Pretrain/Step": 5910, "Pretrain/Step Time": 8.531976211816072} +{"Pretrain/Learning Rate": 1.667637315961389e-05, "Pretrain/Loss": 2.0449743270874023, "Pretrain/Loss (Raw)": 2.0524168014526367, "Pretrain/Step": 5911, "Pretrain/Step Time": 8.533187340945005} +{"Pretrain/Learning Rate": 1.6668368145931397e-05, "Pretrain/Loss": 2.045927047729492, "Pretrain/Loss (Raw)": 2.1552393436431885, "Pretrain/Step": 5912, "Pretrain/Step Time": 8.530672522261739} +{"Pretrain/Learning Rate": 1.6660364093091945e-05, "Pretrain/Loss": 2.0464797019958496, "Pretrain/Loss (Raw)": 2.049189805984497, "Pretrain/Step": 5913, "Pretrain/Step Time": 8.52845248579979} +{"Pretrain/Learning Rate": 1.6652361002018608e-05, "Pretrain/Loss": 2.0494914054870605, "Pretrain/Loss (Raw)": 2.373093605041504, "Pretrain/Step": 5914, "Pretrain/Step Time": 8.53161857277155} +{"Pretrain/Learning Rate": 1.664435887363433e-05, "Pretrain/Loss": 2.0490665435791016, "Pretrain/Loss (Raw)": 1.8949626684188843, "Pretrain/Step": 5915, "Pretrain/Step Time": 8.530048824846745} +{"Pretrain/Learning Rate": 1.6636357708861966e-05, "Pretrain/Loss": 2.0486087799072266, "Pretrain/Loss (Raw)": 1.9731574058532715, "Pretrain/Step": 5916, "Pretrain/Step Time": 8.53892383724451} +{"Pretrain/Learning Rate": 1.6628357508624234e-05, "Pretrain/Loss": 2.0501291751861572, "Pretrain/Loss (Raw)": 2.0179996490478516, "Pretrain/Step": 5917, "Pretrain/Step Time": 8.537496265023947} +{"Pretrain/Learning Rate": 1.662035827384377e-05, "Pretrain/Loss": 2.0504791736602783, "Pretrain/Loss (Raw)": 1.9584461450576782, "Pretrain/Step": 5918, "Pretrain/Step Time": 8.539451690390706} +{"Pretrain/Learning Rate": 1.661236000544307e-05, "Pretrain/Loss": 2.051943302154541, "Pretrain/Loss (Raw)": 2.2225182056427, "Pretrain/Step": 5919, "Pretrain/Step Time": 8.53851062245667} +{"Pretrain/Learning Rate": 1.660436270434454e-05, "Pretrain/Loss": 2.0535969734191895, "Pretrain/Loss (Raw)": 2.3855321407318115, "Pretrain/Step": 5920, "Pretrain/Step Time": 8.535027042031288} +{"Pretrain/Learning Rate": 1.6596366371470466e-05, "Pretrain/Loss": 2.0534591674804688, "Pretrain/Loss (Raw)": 2.0109519958496094, "Pretrain/Step": 5921, "Pretrain/Step Time": 8.5346912574023} +{"Pretrain/Learning Rate": 1.658837100774302e-05, "Pretrain/Loss": 2.054572820663452, "Pretrain/Loss (Raw)": 2.233105421066284, "Pretrain/Step": 5922, "Pretrain/Step Time": 8.540612060576677} +{"Pretrain/Learning Rate": 1.658037661408427e-05, "Pretrain/Loss": 2.0538530349731445, "Pretrain/Loss (Raw)": 2.1101861000061035, "Pretrain/Step": 5923, "Pretrain/Step Time": 8.540188357234001} +{"Pretrain/Learning Rate": 1.657238319141616e-05, "Pretrain/Loss": 2.053912878036499, "Pretrain/Loss (Raw)": 1.8884221315383911, "Pretrain/Step": 5924, "Pretrain/Step Time": 8.53481014445424} +{"Pretrain/Learning Rate": 1.656439074066053e-05, "Pretrain/Loss": 2.0529870986938477, "Pretrain/Loss (Raw)": 1.9322004318237305, "Pretrain/Step": 5925, "Pretrain/Step Time": 8.534761164337397} +{"Pretrain/Learning Rate": 1.655639926273911e-05, "Pretrain/Loss": 2.048661708831787, "Pretrain/Loss (Raw)": 1.7212003469467163, "Pretrain/Step": 5926, "Pretrain/Step Time": 8.532191975042224} +{"Pretrain/Learning Rate": 1.654840875857352e-05, "Pretrain/Loss": 2.0530762672424316, "Pretrain/Loss (Raw)": 2.3937387466430664, "Pretrain/Step": 5927, "Pretrain/Step Time": 8.528767742216587} +{"Pretrain/Learning Rate": 1.654041922908525e-05, "Pretrain/Loss": 2.051649808883667, "Pretrain/Loss (Raw)": 1.9482824802398682, "Pretrain/Step": 5928, "Pretrain/Step Time": 8.535150155425072} +{"Pretrain/Learning Rate": 1.6532430675195705e-05, "Pretrain/Loss": 2.052337169647217, "Pretrain/Loss (Raw)": 2.0894076824188232, "Pretrain/Step": 5929, "Pretrain/Step Time": 8.537599477916956} +{"Pretrain/Learning Rate": 1.652444309782615e-05, "Pretrain/Loss": 2.05543851852417, "Pretrain/Loss (Raw)": 2.117743730545044, "Pretrain/Step": 5930, "Pretrain/Step Time": 8.541321363300085} +{"Pretrain/Learning Rate": 1.651645649789776e-05, "Pretrain/Loss": 2.054710865020752, "Pretrain/Loss (Raw)": 1.9093466997146606, "Pretrain/Step": 5931, "Pretrain/Step Time": 8.54407973214984} +{"Pretrain/Learning Rate": 1.6508470876331577e-05, "Pretrain/Loss": 2.055452346801758, "Pretrain/Loss (Raw)": 2.211125135421753, "Pretrain/Step": 5932, "Pretrain/Step Time": 8.543019980192184} +{"Pretrain/Learning Rate": 1.650048623404855e-05, "Pretrain/Loss": 2.057314157485962, "Pretrain/Loss (Raw)": 2.3063268661499023, "Pretrain/Step": 5933, "Pretrain/Step Time": 8.548189725726843} +{"Pretrain/Learning Rate": 1.6492502571969498e-05, "Pretrain/Loss": 2.056428909301758, "Pretrain/Loss (Raw)": 1.963467001914978, "Pretrain/Step": 5934, "Pretrain/Step Time": 8.550275661051273} +{"Pretrain/Learning Rate": 1.6484519891015143e-05, "Pretrain/Loss": 2.052537679672241, "Pretrain/Loss (Raw)": 1.6744900941848755, "Pretrain/Step": 5935, "Pretrain/Step Time": 8.547990450635552} +{"Pretrain/Learning Rate": 1.647653819210607e-05, "Pretrain/Loss": 2.0519487857818604, "Pretrain/Loss (Raw)": 2.0303902626037598, "Pretrain/Step": 5936, "Pretrain/Step Time": 8.547494646161795} +{"Pretrain/Learning Rate": 1.6468557476162793e-05, "Pretrain/Loss": 2.0519278049468994, "Pretrain/Loss (Raw)": 2.0129058361053467, "Pretrain/Step": 5937, "Pretrain/Step Time": 8.54865993000567} +{"Pretrain/Learning Rate": 1.6460577744105654e-05, "Pretrain/Loss": 2.0529046058654785, "Pretrain/Loss (Raw)": 1.8887381553649902, "Pretrain/Step": 5938, "Pretrain/Step Time": 8.543003490194678} +{"Pretrain/Learning Rate": 1.6452598996854943e-05, "Pretrain/Loss": 2.052995443344116, "Pretrain/Loss (Raw)": 1.9067656993865967, "Pretrain/Step": 5939, "Pretrain/Step Time": 8.546473680064082} +{"Pretrain/Learning Rate": 1.6444621235330777e-05, "Pretrain/Loss": 2.0550734996795654, "Pretrain/Loss (Raw)": 2.239405870437622, "Pretrain/Step": 5940, "Pretrain/Step Time": 8.550293354317546} +{"Pretrain/Learning Rate": 1.6436644460453217e-05, "Pretrain/Loss": 2.054325580596924, "Pretrain/Loss (Raw)": 2.0465495586395264, "Pretrain/Step": 5941, "Pretrain/Step Time": 8.550502873957157} +{"Pretrain/Learning Rate": 1.642866867314216e-05, "Pretrain/Loss": 2.0546038150787354, "Pretrain/Loss (Raw)": 2.1076643466949463, "Pretrain/Step": 5942, "Pretrain/Step Time": 8.546197015792131} +{"Pretrain/Learning Rate": 1.642069387431743e-05, "Pretrain/Loss": 2.053739070892334, "Pretrain/Loss (Raw)": 1.8878575563430786, "Pretrain/Step": 5943, "Pretrain/Step Time": 8.544526904821396} +{"Pretrain/Learning Rate": 1.64127200648987e-05, "Pretrain/Loss": 2.0532450675964355, "Pretrain/Loss (Raw)": 2.0174977779388428, "Pretrain/Step": 5944, "Pretrain/Step Time": 8.546207206323743} +{"Pretrain/Learning Rate": 1.6404747245805567e-05, "Pretrain/Loss": 2.054309606552124, "Pretrain/Loss (Raw)": 2.036186456680298, "Pretrain/Step": 5945, "Pretrain/Step Time": 8.546712096780539} +{"Pretrain/Learning Rate": 1.6396775417957478e-05, "Pretrain/Loss": 2.055528163909912, "Pretrain/Loss (Raw)": 2.273357391357422, "Pretrain/Step": 5946, "Pretrain/Step Time": 8.554833995178342} +{"Pretrain/Learning Rate": 1.6388804582273788e-05, "Pretrain/Loss": 2.0565907955169678, "Pretrain/Loss (Raw)": 2.197974681854248, "Pretrain/Step": 5947, "Pretrain/Step Time": 8.541973512619734} +{"Pretrain/Learning Rate": 1.6380834739673727e-05, "Pretrain/Loss": 2.056577205657959, "Pretrain/Loss (Raw)": 2.0952513217926025, "Pretrain/Step": 5948, "Pretrain/Step Time": 8.547598725184798} +{"Pretrain/Learning Rate": 1.6372865891076426e-05, "Pretrain/Loss": 2.05668568611145, "Pretrain/Loss (Raw)": 2.0625057220458984, "Pretrain/Step": 5949, "Pretrain/Step Time": 8.545335181057453} +{"Pretrain/Learning Rate": 1.6364898037400876e-05, "Pretrain/Loss": 2.056914806365967, "Pretrain/Loss (Raw)": 2.01082181930542, "Pretrain/Step": 5950, "Pretrain/Step Time": 8.545391449704766} +{"Pretrain/Learning Rate": 1.6356931179565978e-05, "Pretrain/Loss": 2.0561752319335938, "Pretrain/Loss (Raw)": 2.0658364295959473, "Pretrain/Step": 5951, "Pretrain/Step Time": 8.542175451293588} +{"Pretrain/Learning Rate": 1.63489653184905e-05, "Pretrain/Loss": 2.0543503761291504, "Pretrain/Loss (Raw)": 1.9924496412277222, "Pretrain/Step": 5952, "Pretrain/Step Time": 8.557940147817135} +{"Pretrain/Learning Rate": 1.6341000455093115e-05, "Pretrain/Loss": 2.056422472000122, "Pretrain/Loss (Raw)": 2.2271227836608887, "Pretrain/Step": 5953, "Pretrain/Step Time": 8.544700460508466} +{"Pretrain/Learning Rate": 1.633303659029235e-05, "Pretrain/Loss": 2.0562562942504883, "Pretrain/Loss (Raw)": 2.0919063091278076, "Pretrain/Step": 5954, "Pretrain/Step Time": 8.544863441959023} +{"Pretrain/Learning Rate": 1.6325073725006654e-05, "Pretrain/Loss": 2.0550589561462402, "Pretrain/Loss (Raw)": 2.0003280639648438, "Pretrain/Step": 5955, "Pretrain/Step Time": 8.545192327350378} +{"Pretrain/Learning Rate": 1.6317111860154328e-05, "Pretrain/Loss": 2.0545425415039062, "Pretrain/Loss (Raw)": 2.0103890895843506, "Pretrain/Step": 5956, "Pretrain/Step Time": 8.541809624060988} +{"Pretrain/Learning Rate": 1.6309150996653582e-05, "Pretrain/Loss": 2.0529651641845703, "Pretrain/Loss (Raw)": 1.9419463872909546, "Pretrain/Step": 5957, "Pretrain/Step Time": 8.538155123591423} +{"Pretrain/Learning Rate": 1.630119113542249e-05, "Pretrain/Loss": 2.05465030670166, "Pretrain/Loss (Raw)": 2.227689743041992, "Pretrain/Step": 5958, "Pretrain/Step Time": 8.548226561397314} +{"Pretrain/Learning Rate": 1.629323227737903e-05, "Pretrain/Loss": 2.053574323654175, "Pretrain/Loss (Raw)": 2.1617703437805176, "Pretrain/Step": 5959, "Pretrain/Step Time": 8.53448936715722} +{"Pretrain/Learning Rate": 1.628527442344105e-05, "Pretrain/Loss": 2.052323818206787, "Pretrain/Loss (Raw)": 1.893420934677124, "Pretrain/Step": 5960, "Pretrain/Step Time": 8.536649983376265} +{"Pretrain/Learning Rate": 1.6277317574526284e-05, "Pretrain/Loss": 2.050776958465576, "Pretrain/Loss (Raw)": 1.9661809206008911, "Pretrain/Step": 5961, "Pretrain/Step Time": 8.538161626085639} +{"Pretrain/Learning Rate": 1.626936173155237e-05, "Pretrain/Loss": 2.0498411655426025, "Pretrain/Loss (Raw)": 1.9873313903808594, "Pretrain/Step": 5962, "Pretrain/Step Time": 8.54234535433352} +{"Pretrain/Learning Rate": 1.626140689543679e-05, "Pretrain/Loss": 2.049128293991089, "Pretrain/Loss (Raw)": 2.0883162021636963, "Pretrain/Step": 5963, "Pretrain/Step Time": 8.541218727827072} +{"Pretrain/Learning Rate": 1.6253453067096954e-05, "Pretrain/Loss": 2.050811767578125, "Pretrain/Loss (Raw)": 2.095022678375244, "Pretrain/Step": 5964, "Pretrain/Step Time": 8.546726012602448} +{"Pretrain/Learning Rate": 1.6245500247450114e-05, "Pretrain/Loss": 2.0527610778808594, "Pretrain/Loss (Raw)": 2.09633731842041, "Pretrain/Step": 5965, "Pretrain/Step Time": 8.540019109845161} +{"Pretrain/Learning Rate": 1.6237548437413448e-05, "Pretrain/Loss": 2.0526905059814453, "Pretrain/Loss (Raw)": 1.9458166360855103, "Pretrain/Step": 5966, "Pretrain/Step Time": 8.54041730798781} +{"Pretrain/Learning Rate": 1.622959763790398e-05, "Pretrain/Loss": 2.0542707443237305, "Pretrain/Loss (Raw)": 2.1736457347869873, "Pretrain/Step": 5967, "Pretrain/Step Time": 8.534630104899406} +{"Pretrain/Learning Rate": 1.6221647849838645e-05, "Pretrain/Loss": 2.0534415245056152, "Pretrain/Loss (Raw)": 2.049515962600708, "Pretrain/Step": 5968, "Pretrain/Step Time": 8.537647608667612} +{"Pretrain/Learning Rate": 1.621369907413424e-05, "Pretrain/Loss": 2.056349754333496, "Pretrain/Loss (Raw)": 2.24648380279541, "Pretrain/Step": 5969, "Pretrain/Step Time": 8.535477792844176} +{"Pretrain/Learning Rate": 1.6205751311707463e-05, "Pretrain/Loss": 2.055429697036743, "Pretrain/Loss (Raw)": 2.0605709552764893, "Pretrain/Step": 5970, "Pretrain/Step Time": 8.535664893686771} +{"Pretrain/Learning Rate": 1.6197804563474882e-05, "Pretrain/Loss": 2.0550026893615723, "Pretrain/Loss (Raw)": 1.8647377490997314, "Pretrain/Step": 5971, "Pretrain/Step Time": 8.534258747473359} +{"Pretrain/Learning Rate": 1.6189858830352962e-05, "Pretrain/Loss": 2.0550153255462646, "Pretrain/Loss (Raw)": 2.1154496669769287, "Pretrain/Step": 5972, "Pretrain/Step Time": 8.538437779992819} +{"Pretrain/Learning Rate": 1.618191411325803e-05, "Pretrain/Loss": 2.056086778640747, "Pretrain/Loss (Raw)": 2.155272960662842, "Pretrain/Step": 5973, "Pretrain/Step Time": 8.535857196897268} +{"Pretrain/Learning Rate": 1.617397041310632e-05, "Pretrain/Loss": 2.05535888671875, "Pretrain/Loss (Raw)": 1.9010881185531616, "Pretrain/Step": 5974, "Pretrain/Step Time": 8.532711580395699} +{"Pretrain/Learning Rate": 1.6166027730813926e-05, "Pretrain/Loss": 2.060110569000244, "Pretrain/Loss (Raw)": 2.514124870300293, "Pretrain/Step": 5975, "Pretrain/Step Time": 8.5388092584908} +{"Pretrain/Learning Rate": 1.6158086067296844e-05, "Pretrain/Loss": 2.05953311920166, "Pretrain/Loss (Raw)": 1.7407842874526978, "Pretrain/Step": 5976, "Pretrain/Step Time": 8.540139498189092} +{"Pretrain/Learning Rate": 1.615014542347094e-05, "Pretrain/Loss": 2.0583198070526123, "Pretrain/Loss (Raw)": 2.1151907444000244, "Pretrain/Step": 5977, "Pretrain/Step Time": 8.537389930337667} +{"Pretrain/Learning Rate": 1.6142205800251968e-05, "Pretrain/Loss": 2.0572381019592285, "Pretrain/Loss (Raw)": 1.9529266357421875, "Pretrain/Step": 5978, "Pretrain/Step Time": 8.539039799943566} +{"Pretrain/Learning Rate": 1.6134267198555563e-05, "Pretrain/Loss": 2.0552120208740234, "Pretrain/Loss (Raw)": 1.9460183382034302, "Pretrain/Step": 5979, "Pretrain/Step Time": 8.535411296412349} +{"Pretrain/Learning Rate": 1.612632961929725e-05, "Pretrain/Loss": 2.0532336235046387, "Pretrain/Loss (Raw)": 1.916589379310608, "Pretrain/Step": 5980, "Pretrain/Step Time": 8.53836764395237} +{"Pretrain/Learning Rate": 1.6118393063392402e-05, "Pretrain/Loss": 2.0518178939819336, "Pretrain/Loss (Raw)": 1.9689515829086304, "Pretrain/Step": 5981, "Pretrain/Step Time": 8.538979273289442} +{"Pretrain/Learning Rate": 1.6110457531756334e-05, "Pretrain/Loss": 2.0536623001098633, "Pretrain/Loss (Raw)": 2.135225296020508, "Pretrain/Step": 5982, "Pretrain/Step Time": 8.534470099955797} +{"Pretrain/Learning Rate": 1.6102523025304178e-05, "Pretrain/Loss": 2.057054042816162, "Pretrain/Loss (Raw)": 2.086886167526245, "Pretrain/Step": 5983, "Pretrain/Step Time": 8.537025989964604} +{"Pretrain/Learning Rate": 1.6094589544951006e-05, "Pretrain/Loss": 2.0562376976013184, "Pretrain/Loss (Raw)": 2.0155529975891113, "Pretrain/Step": 5984, "Pretrain/Step Time": 8.527288744226098} +{"Pretrain/Learning Rate": 1.6086657091611718e-05, "Pretrain/Loss": 2.0566155910491943, "Pretrain/Loss (Raw)": 2.1146669387817383, "Pretrain/Step": 5985, "Pretrain/Step Time": 8.530313111841679} +{"Pretrain/Learning Rate": 1.607872566620115e-05, "Pretrain/Loss": 2.0551066398620605, "Pretrain/Loss (Raw)": 1.9984902143478394, "Pretrain/Step": 5986, "Pretrain/Step Time": 8.53057624027133} +{"Pretrain/Learning Rate": 1.6070795269633964e-05, "Pretrain/Loss": 2.0533010959625244, "Pretrain/Loss (Raw)": 1.9450639486312866, "Pretrain/Step": 5987, "Pretrain/Step Time": 8.531680285930634} +{"Pretrain/Learning Rate": 1.6062865902824754e-05, "Pretrain/Loss": 2.0524349212646484, "Pretrain/Loss (Raw)": 2.3525712490081787, "Pretrain/Step": 5988, "Pretrain/Step Time": 8.536846423521638} +{"Pretrain/Learning Rate": 1.605493756668795e-05, "Pretrain/Loss": 2.052217960357666, "Pretrain/Loss (Raw)": 1.948468804359436, "Pretrain/Step": 5989, "Pretrain/Step Time": 8.536873389035463} +{"Pretrain/Learning Rate": 1.6047010262137908e-05, "Pretrain/Loss": 2.0515666007995605, "Pretrain/Loss (Raw)": 2.012037515640259, "Pretrain/Step": 5990, "Pretrain/Step Time": 8.532044241204858} +{"Pretrain/Learning Rate": 1.603908399008882e-05, "Pretrain/Loss": 2.0510478019714355, "Pretrain/Loss (Raw)": 2.0263710021972656, "Pretrain/Step": 5991, "Pretrain/Step Time": 8.533660359680653} +{"Pretrain/Learning Rate": 1.60311587514548e-05, "Pretrain/Loss": 2.0525665283203125, "Pretrain/Loss (Raw)": 2.2520787715911865, "Pretrain/Step": 5992, "Pretrain/Step Time": 8.53460842370987} +{"Pretrain/Learning Rate": 1.6023234547149808e-05, "Pretrain/Loss": 2.054473400115967, "Pretrain/Loss (Raw)": 2.3097996711730957, "Pretrain/Step": 5993, "Pretrain/Step Time": 8.533622082322836} +{"Pretrain/Learning Rate": 1.6015311378087714e-05, "Pretrain/Loss": 2.0559613704681396, "Pretrain/Loss (Raw)": 2.0833945274353027, "Pretrain/Step": 5994, "Pretrain/Step Time": 8.54077516682446} +{"Pretrain/Learning Rate": 1.600738924518224e-05, "Pretrain/Loss": 2.054417371749878, "Pretrain/Loss (Raw)": 1.83530592918396, "Pretrain/Step": 5995, "Pretrain/Step Time": 8.540168717503548} +{"Pretrain/Learning Rate": 1.5999468149347024e-05, "Pretrain/Loss": 2.0535969734191895, "Pretrain/Loss (Raw)": 2.0786616802215576, "Pretrain/Step": 5996, "Pretrain/Step Time": 8.54353548772633} +{"Pretrain/Learning Rate": 1.5991548091495546e-05, "Pretrain/Loss": 2.0554611682891846, "Pretrain/Loss (Raw)": 1.9412641525268555, "Pretrain/Step": 5997, "Pretrain/Step Time": 8.532471092417836} +{"Pretrain/Learning Rate": 1.5983629072541196e-05, "Pretrain/Loss": 2.0552618503570557, "Pretrain/Loss (Raw)": 1.8780733346939087, "Pretrain/Step": 5998, "Pretrain/Step Time": 8.536187369376421} +{"Pretrain/Learning Rate": 1.597571109339722e-05, "Pretrain/Loss": 2.054839611053467, "Pretrain/Loss (Raw)": 2.060593605041504, "Pretrain/Step": 5999, "Pretrain/Step Time": 8.538743698969483} +{"Pretrain/Learning Rate": 1.5967794154976773e-05, "Pretrain/Loss": 2.0554308891296387, "Pretrain/Loss (Raw)": 2.306432008743286, "Pretrain/Step": 6000, "Pretrain/Step Time": 8.543052293360233} +{"Pretrain/Learning Rate": 1.5959878258192863e-05, "Pretrain/Loss": 2.052936553955078, "Pretrain/Loss (Raw)": 1.7109264135360718, "Pretrain/Step": 6001, "Pretrain/Step Time": 8.54140667617321} +{"Pretrain/Learning Rate": 1.5951963403958382e-05, "Pretrain/Loss": 2.0542664527893066, "Pretrain/Loss (Raw)": 2.2337145805358887, "Pretrain/Step": 6002, "Pretrain/Step Time": 8.534626830369234} +{"Pretrain/Learning Rate": 1.5944049593186127e-05, "Pretrain/Loss": 2.0535740852355957, "Pretrain/Loss (Raw)": 1.834804654121399, "Pretrain/Step": 6003, "Pretrain/Step Time": 8.536314120516181} +{"Pretrain/Learning Rate": 1.5936136826788745e-05, "Pretrain/Loss": 2.052302598953247, "Pretrain/Loss (Raw)": 1.7653577327728271, "Pretrain/Step": 6004, "Pretrain/Step Time": 8.536424422636628} +{"Pretrain/Learning Rate": 1.5928225105678774e-05, "Pretrain/Loss": 2.052029609680176, "Pretrain/Loss (Raw)": 2.1481072902679443, "Pretrain/Step": 6005, "Pretrain/Step Time": 8.537004698067904} +{"Pretrain/Learning Rate": 1.592031443076863e-05, "Pretrain/Loss": 2.0513181686401367, "Pretrain/Loss (Raw)": 2.1412811279296875, "Pretrain/Step": 6006, "Pretrain/Step Time": 8.547823956236243} +{"Pretrain/Learning Rate": 1.591240480297061e-05, "Pretrain/Loss": 2.055320978164673, "Pretrain/Loss (Raw)": 2.5328633785247803, "Pretrain/Step": 6007, "Pretrain/Step Time": 8.536855136975646} +{"Pretrain/Learning Rate": 1.590449622319689e-05, "Pretrain/Loss": 2.0529966354370117, "Pretrain/Loss (Raw)": 1.9554709196090698, "Pretrain/Step": 6008, "Pretrain/Step Time": 8.542241346091032} +{"Pretrain/Learning Rate": 1.589658869235953e-05, "Pretrain/Loss": 2.0552310943603516, "Pretrain/Loss (Raw)": 2.2092018127441406, "Pretrain/Step": 6009, "Pretrain/Step Time": 8.543370701372623} +{"Pretrain/Learning Rate": 1.588868221137045e-05, "Pretrain/Loss": 2.054349422454834, "Pretrain/Loss (Raw)": 1.98171865940094, "Pretrain/Step": 6010, "Pretrain/Step Time": 8.541061110794544} +{"Pretrain/Learning Rate": 1.588077678114148e-05, "Pretrain/Loss": 2.0540199279785156, "Pretrain/Loss (Raw)": 1.9768668413162231, "Pretrain/Step": 6011, "Pretrain/Step Time": 8.53688252530992} +{"Pretrain/Learning Rate": 1.5872872402584296e-05, "Pretrain/Loss": 2.0544941425323486, "Pretrain/Loss (Raw)": 2.035712242126465, "Pretrain/Step": 6012, "Pretrain/Step Time": 8.544043285772204} +{"Pretrain/Learning Rate": 1.586496907661048e-05, "Pretrain/Loss": 2.05401611328125, "Pretrain/Loss (Raw)": 1.989431381225586, "Pretrain/Step": 6013, "Pretrain/Step Time": 8.541194269433618} +{"Pretrain/Learning Rate": 1.5857066804131472e-05, "Pretrain/Loss": 2.054837703704834, "Pretrain/Loss (Raw)": 2.1956000328063965, "Pretrain/Step": 6014, "Pretrain/Step Time": 8.54969965107739} +{"Pretrain/Learning Rate": 1.5849165586058608e-05, "Pretrain/Loss": 2.05226469039917, "Pretrain/Loss (Raw)": 2.074150562286377, "Pretrain/Step": 6015, "Pretrain/Step Time": 8.541447816416621} +{"Pretrain/Learning Rate": 1.5841265423303084e-05, "Pretrain/Loss": 2.053304672241211, "Pretrain/Loss (Raw)": 2.1238818168640137, "Pretrain/Step": 6016, "Pretrain/Step Time": 8.545336417853832} +{"Pretrain/Learning Rate": 1.5833366316775994e-05, "Pretrain/Loss": 2.0528621673583984, "Pretrain/Loss (Raw)": 2.0411593914031982, "Pretrain/Step": 6017, "Pretrain/Step Time": 8.543145576491952} +{"Pretrain/Learning Rate": 1.582546826738829e-05, "Pretrain/Loss": 2.0519440174102783, "Pretrain/Loss (Raw)": 1.8989325761795044, "Pretrain/Step": 6018, "Pretrain/Step Time": 8.546256495639682} +{"Pretrain/Learning Rate": 1.581757127605082e-05, "Pretrain/Loss": 2.0521159172058105, "Pretrain/Loss (Raw)": 1.9048058986663818, "Pretrain/Step": 6019, "Pretrain/Step Time": 8.548403732478619} +{"Pretrain/Learning Rate": 1.5809675343674295e-05, "Pretrain/Loss": 2.051647186279297, "Pretrain/Loss (Raw)": 1.839408278465271, "Pretrain/Step": 6020, "Pretrain/Step Time": 8.550771865993738} +{"Pretrain/Learning Rate": 1.5801780471169324e-05, "Pretrain/Loss": 2.051342010498047, "Pretrain/Loss (Raw)": 2.0590174198150635, "Pretrain/Step": 6021, "Pretrain/Step Time": 8.547597773373127} +{"Pretrain/Learning Rate": 1.579388665944636e-05, "Pretrain/Loss": 2.0523011684417725, "Pretrain/Loss (Raw)": 2.0561678409576416, "Pretrain/Step": 6022, "Pretrain/Step Time": 8.547886479645967} +{"Pretrain/Learning Rate": 1.578599390941578e-05, "Pretrain/Loss": 2.0524673461914062, "Pretrain/Loss (Raw)": 2.0885329246520996, "Pretrain/Step": 6023, "Pretrain/Step Time": 8.546912424266338} +{"Pretrain/Learning Rate": 1.577810222198779e-05, "Pretrain/Loss": 2.052164077758789, "Pretrain/Loss (Raw)": 1.8551610708236694, "Pretrain/Step": 6024, "Pretrain/Step Time": 8.54684715718031} +{"Pretrain/Learning Rate": 1.577021159807252e-05, "Pretrain/Loss": 2.053889751434326, "Pretrain/Loss (Raw)": 2.2757065296173096, "Pretrain/Step": 6025, "Pretrain/Step Time": 8.55333073809743} +{"Pretrain/Learning Rate": 1.5762322038579925e-05, "Pretrain/Loss": 2.0532679557800293, "Pretrain/Loss (Raw)": 2.174708127975464, "Pretrain/Step": 6026, "Pretrain/Step Time": 8.548118840903044} +{"Pretrain/Learning Rate": 1.5754433544419893e-05, "Pretrain/Loss": 2.0534634590148926, "Pretrain/Loss (Raw)": 2.1876442432403564, "Pretrain/Step": 6027, "Pretrain/Step Time": 8.546668568626046} +{"Pretrain/Learning Rate": 1.574654611650214e-05, "Pretrain/Loss": 2.053750991821289, "Pretrain/Loss (Raw)": 2.0135743618011475, "Pretrain/Step": 6028, "Pretrain/Step Time": 8.54597538895905} +{"Pretrain/Learning Rate": 1.5738659755736308e-05, "Pretrain/Loss": 2.0537209510803223, "Pretrain/Loss (Raw)": 1.949664831161499, "Pretrain/Step": 6029, "Pretrain/Step Time": 8.54782997816801} +{"Pretrain/Learning Rate": 1.5730774463031862e-05, "Pretrain/Loss": 2.0541200637817383, "Pretrain/Loss (Raw)": 2.185336112976074, "Pretrain/Step": 6030, "Pretrain/Step Time": 8.554371168836951} +{"Pretrain/Learning Rate": 1.572289023929819e-05, "Pretrain/Loss": 2.051879644393921, "Pretrain/Loss (Raw)": 1.6761906147003174, "Pretrain/Step": 6031, "Pretrain/Step Time": 8.554382475093007} +{"Pretrain/Learning Rate": 1.5715007085444523e-05, "Pretrain/Loss": 2.054610252380371, "Pretrain/Loss (Raw)": 2.333322286605835, "Pretrain/Step": 6032, "Pretrain/Step Time": 8.547875538468361} +{"Pretrain/Learning Rate": 1.5707125002379996e-05, "Pretrain/Loss": 2.0568957328796387, "Pretrain/Loss (Raw)": 2.1970012187957764, "Pretrain/Step": 6033, "Pretrain/Step Time": 8.549775192514062} +{"Pretrain/Learning Rate": 1.56992439910136e-05, "Pretrain/Loss": 2.0570359230041504, "Pretrain/Loss (Raw)": 1.9896776676177979, "Pretrain/Step": 6034, "Pretrain/Step Time": 8.54882768727839} +{"Pretrain/Learning Rate": 1.569136405225422e-05, "Pretrain/Loss": 2.0576653480529785, "Pretrain/Loss (Raw)": 2.1459414958953857, "Pretrain/Step": 6035, "Pretrain/Step Time": 8.546916184946895} +{"Pretrain/Learning Rate": 1.5683485187010593e-05, "Pretrain/Loss": 2.0564191341400146, "Pretrain/Loss (Raw)": 1.993391752243042, "Pretrain/Step": 6036, "Pretrain/Step Time": 8.55623584613204} +{"Pretrain/Learning Rate": 1.5675607396191366e-05, "Pretrain/Loss": 2.0555715560913086, "Pretrain/Loss (Raw)": 1.9383684396743774, "Pretrain/Step": 6037, "Pretrain/Step Time": 8.557405048981309} +{"Pretrain/Learning Rate": 1.5667730680705022e-05, "Pretrain/Loss": 2.0550713539123535, "Pretrain/Loss (Raw)": 2.0357301235198975, "Pretrain/Step": 6038, "Pretrain/Step Time": 8.552668858319521} +{"Pretrain/Learning Rate": 1.5659855041459955e-05, "Pretrain/Loss": 2.055027961730957, "Pretrain/Loss (Raw)": 2.0468955039978027, "Pretrain/Step": 6039, "Pretrain/Step Time": 8.549454674124718} +{"Pretrain/Learning Rate": 1.5651980479364416e-05, "Pretrain/Loss": 2.050382375717163, "Pretrain/Loss (Raw)": 1.5605905055999756, "Pretrain/Step": 6040, "Pretrain/Step Time": 8.553325483575463} +{"Pretrain/Learning Rate": 1.564410699532654e-05, "Pretrain/Loss": 2.05057954788208, "Pretrain/Loss (Raw)": 2.074437379837036, "Pretrain/Step": 6041, "Pretrain/Step Time": 8.554526614025235} +{"Pretrain/Learning Rate": 1.5636234590254324e-05, "Pretrain/Loss": 2.0478272438049316, "Pretrain/Loss (Raw)": 2.020784854888916, "Pretrain/Step": 6042, "Pretrain/Step Time": 8.555412273854017} +{"Pretrain/Learning Rate": 1.5628363265055664e-05, "Pretrain/Loss": 2.0487060546875, "Pretrain/Loss (Raw)": 2.0074644088745117, "Pretrain/Step": 6043, "Pretrain/Step Time": 8.557010613381863} +{"Pretrain/Learning Rate": 1.5620493020638315e-05, "Pretrain/Loss": 2.050102472305298, "Pretrain/Loss (Raw)": 2.15187931060791, "Pretrain/Step": 6044, "Pretrain/Step Time": 8.545029247179627} +{"Pretrain/Learning Rate": 1.5612623857909904e-05, "Pretrain/Loss": 2.05025315284729, "Pretrain/Loss (Raw)": 2.037302017211914, "Pretrain/Step": 6045, "Pretrain/Step Time": 8.549450566992164} +{"Pretrain/Learning Rate": 1.5604755777777948e-05, "Pretrain/Loss": 2.0503177642822266, "Pretrain/Loss (Raw)": 1.9667019844055176, "Pretrain/Step": 6046, "Pretrain/Step Time": 8.545721961185336} +{"Pretrain/Learning Rate": 1.5596888781149827e-05, "Pretrain/Loss": 2.04740571975708, "Pretrain/Loss (Raw)": 1.8497843742370605, "Pretrain/Step": 6047, "Pretrain/Step Time": 8.547814480960369} +{"Pretrain/Learning Rate": 1.55890228689328e-05, "Pretrain/Loss": 2.045009136199951, "Pretrain/Loss (Raw)": 2.0787668228149414, "Pretrain/Step": 6048, "Pretrain/Step Time": 8.550810780376196} +{"Pretrain/Learning Rate": 1.5581158042034e-05, "Pretrain/Loss": 2.0446090698242188, "Pretrain/Loss (Raw)": 1.959762692451477, "Pretrain/Step": 6049, "Pretrain/Step Time": 8.553068859502673} +{"Pretrain/Learning Rate": 1.557329430136044e-05, "Pretrain/Loss": 2.044041872024536, "Pretrain/Loss (Raw)": 2.160506010055542, "Pretrain/Step": 6050, "Pretrain/Step Time": 8.543269028887153} +{"Pretrain/Learning Rate": 1.5565431647819e-05, "Pretrain/Loss": 2.0430350303649902, "Pretrain/Loss (Raw)": 1.98130464553833, "Pretrain/Step": 6051, "Pretrain/Step Time": 8.54605402238667} +{"Pretrain/Learning Rate": 1.555757008231644e-05, "Pretrain/Loss": 2.0440421104431152, "Pretrain/Loss (Raw)": 2.017287015914917, "Pretrain/Step": 6052, "Pretrain/Step Time": 8.550522023811936} +{"Pretrain/Learning Rate": 1.5549709605759393e-05, "Pretrain/Loss": 2.042511463165283, "Pretrain/Loss (Raw)": 1.7363059520721436, "Pretrain/Step": 6053, "Pretrain/Step Time": 8.549983639270067} +{"Pretrain/Learning Rate": 1.5541850219054366e-05, "Pretrain/Loss": 2.0443594455718994, "Pretrain/Loss (Raw)": 1.9577516317367554, "Pretrain/Step": 6054, "Pretrain/Step Time": 8.5586748868227} +{"Pretrain/Learning Rate": 1.5533991923107737e-05, "Pretrain/Loss": 2.0416998863220215, "Pretrain/Loss (Raw)": 2.0533134937286377, "Pretrain/Step": 6055, "Pretrain/Step Time": 8.556840961799026} +{"Pretrain/Learning Rate": 1.552613471882577e-05, "Pretrain/Loss": 2.0414938926696777, "Pretrain/Loss (Raw)": 1.9219391345977783, "Pretrain/Step": 6056, "Pretrain/Step Time": 8.559915443882346} +{"Pretrain/Learning Rate": 1.5518278607114585e-05, "Pretrain/Loss": 2.0420145988464355, "Pretrain/Loss (Raw)": 2.1560447216033936, "Pretrain/Step": 6057, "Pretrain/Step Time": 8.556753624230623} +{"Pretrain/Learning Rate": 1.5510423588880194e-05, "Pretrain/Loss": 2.041134834289551, "Pretrain/Loss (Raw)": 2.0051019191741943, "Pretrain/Step": 6058, "Pretrain/Step Time": 8.546983970329165} +{"Pretrain/Learning Rate": 1.5502569665028465e-05, "Pretrain/Loss": 2.0424866676330566, "Pretrain/Loss (Raw)": 2.0823898315429688, "Pretrain/Step": 6059, "Pretrain/Step Time": 8.549593191593885} +{"Pretrain/Learning Rate": 1.549471683646516e-05, "Pretrain/Loss": 2.038792133331299, "Pretrain/Loss (Raw)": 1.738226294517517, "Pretrain/Step": 6060, "Pretrain/Step Time": 8.55339372716844} +{"Pretrain/Learning Rate": 1.54868651040959e-05, "Pretrain/Loss": 2.0352983474731445, "Pretrain/Loss (Raw)": 1.8591134548187256, "Pretrain/Step": 6061, "Pretrain/Step Time": 8.550182057544589} +{"Pretrain/Learning Rate": 1.5479014468826184e-05, "Pretrain/Loss": 2.0361690521240234, "Pretrain/Loss (Raw)": 2.0749564170837402, "Pretrain/Step": 6062, "Pretrain/Step Time": 8.541656715795398} +{"Pretrain/Learning Rate": 1.547116493156138e-05, "Pretrain/Loss": 2.03831148147583, "Pretrain/Loss (Raw)": 1.9487066268920898, "Pretrain/Step": 6063, "Pretrain/Step Time": 8.545588366687298} +{"Pretrain/Learning Rate": 1.5463316493206748e-05, "Pretrain/Loss": 2.038118362426758, "Pretrain/Loss (Raw)": 2.0056722164154053, "Pretrain/Step": 6064, "Pretrain/Step Time": 8.541562862694263} +{"Pretrain/Learning Rate": 1.545546915466738e-05, "Pretrain/Loss": 2.0379109382629395, "Pretrain/Loss (Raw)": 1.9863373041152954, "Pretrain/Step": 6065, "Pretrain/Step Time": 8.540003776550293} +{"Pretrain/Learning Rate": 1.54476229168483e-05, "Pretrain/Loss": 2.0426583290100098, "Pretrain/Loss (Raw)": 2.49642276763916, "Pretrain/Step": 6066, "Pretrain/Step Time": 8.546936983242631} +{"Pretrain/Learning Rate": 1.543977778065434e-05, "Pretrain/Loss": 2.0455265045166016, "Pretrain/Loss (Raw)": 2.273895263671875, "Pretrain/Step": 6067, "Pretrain/Step Time": 8.547115748748183} +{"Pretrain/Learning Rate": 1.5431933746990276e-05, "Pretrain/Loss": 2.0437374114990234, "Pretrain/Loss (Raw)": 2.010374069213867, "Pretrain/Step": 6068, "Pretrain/Step Time": 8.545178739354014} +{"Pretrain/Learning Rate": 1.542409081676068e-05, "Pretrain/Loss": 2.043161392211914, "Pretrain/Loss (Raw)": 1.9728288650512695, "Pretrain/Step": 6069, "Pretrain/Step Time": 8.544831994920969} +{"Pretrain/Learning Rate": 1.541624899087007e-05, "Pretrain/Loss": 2.042957305908203, "Pretrain/Loss (Raw)": 2.081563949584961, "Pretrain/Step": 6070, "Pretrain/Step Time": 8.541843747720122} +{"Pretrain/Learning Rate": 1.5408408270222773e-05, "Pretrain/Loss": 2.0425000190734863, "Pretrain/Loss (Raw)": 1.8293263912200928, "Pretrain/Step": 6071, "Pretrain/Step Time": 8.543741451576352} +{"Pretrain/Learning Rate": 1.5400568655723043e-05, "Pretrain/Loss": 2.042553663253784, "Pretrain/Loss (Raw)": 2.0243659019470215, "Pretrain/Step": 6072, "Pretrain/Step Time": 8.545691834762692} +{"Pretrain/Learning Rate": 1.5392730148274965e-05, "Pretrain/Loss": 2.042698860168457, "Pretrain/Loss (Raw)": 2.054734230041504, "Pretrain/Step": 6073, "Pretrain/Step Time": 8.54799772053957} +{"Pretrain/Learning Rate": 1.5384892748782513e-05, "Pretrain/Loss": 2.040687084197998, "Pretrain/Loss (Raw)": 2.0158543586730957, "Pretrain/Step": 6074, "Pretrain/Step Time": 8.546614471822977} +{"Pretrain/Learning Rate": 1.5377056458149542e-05, "Pretrain/Loss": 2.0395889282226562, "Pretrain/Loss (Raw)": 2.057443141937256, "Pretrain/Step": 6075, "Pretrain/Step Time": 8.547538600862026} +{"Pretrain/Learning Rate": 1.5369221277279765e-05, "Pretrain/Loss": 2.0393099784851074, "Pretrain/Loss (Raw)": 2.0595149993896484, "Pretrain/Step": 6076, "Pretrain/Step Time": 8.544451458379626} +{"Pretrain/Learning Rate": 1.5361387207076766e-05, "Pretrain/Loss": 2.037872552871704, "Pretrain/Loss (Raw)": 1.8785284757614136, "Pretrain/Step": 6077, "Pretrain/Step Time": 8.544433252885938} +{"Pretrain/Learning Rate": 1.5353554248444022e-05, "Pretrain/Loss": 2.0388307571411133, "Pretrain/Loss (Raw)": 2.1334831714630127, "Pretrain/Step": 6078, "Pretrain/Step Time": 8.543416196480393} +{"Pretrain/Learning Rate": 1.5345722402284852e-05, "Pretrain/Loss": 2.0377297401428223, "Pretrain/Loss (Raw)": 1.9248957633972168, "Pretrain/Step": 6079, "Pretrain/Step Time": 8.548952026292682} +{"Pretrain/Learning Rate": 1.5337891669502468e-05, "Pretrain/Loss": 2.0389301776885986, "Pretrain/Loss (Raw)": 2.146101951599121, "Pretrain/Step": 6080, "Pretrain/Step Time": 8.538147263228893} +{"Pretrain/Learning Rate": 1.5330062050999945e-05, "Pretrain/Loss": 2.0373873710632324, "Pretrain/Loss (Raw)": 2.029648780822754, "Pretrain/Step": 6081, "Pretrain/Step Time": 8.535820903256536} +{"Pretrain/Learning Rate": 1.5322233547680235e-05, "Pretrain/Loss": 2.0382235050201416, "Pretrain/Loss (Raw)": 2.198932409286499, "Pretrain/Step": 6082, "Pretrain/Step Time": 8.53545143827796} +{"Pretrain/Learning Rate": 1.531440616044615e-05, "Pretrain/Loss": 2.038236141204834, "Pretrain/Loss (Raw)": 2.001945734024048, "Pretrain/Step": 6083, "Pretrain/Step Time": 8.538003969937563} +{"Pretrain/Learning Rate": 1.530657989020039e-05, "Pretrain/Loss": 2.038407802581787, "Pretrain/Loss (Raw)": 2.0323565006256104, "Pretrain/Step": 6084, "Pretrain/Step Time": 8.541102819144726} +{"Pretrain/Learning Rate": 1.5298754737845515e-05, "Pretrain/Loss": 2.0408782958984375, "Pretrain/Loss (Raw)": 2.2581892013549805, "Pretrain/Step": 6085, "Pretrain/Step Time": 8.554443076252937} +{"Pretrain/Learning Rate": 1.5290930704283953e-05, "Pretrain/Loss": 2.0388503074645996, "Pretrain/Loss (Raw)": 1.968076467514038, "Pretrain/Step": 6086, "Pretrain/Step Time": 8.544850561767817} +{"Pretrain/Learning Rate": 1.5283107790418023e-05, "Pretrain/Loss": 2.038790225982666, "Pretrain/Loss (Raw)": 2.1541008949279785, "Pretrain/Step": 6087, "Pretrain/Step Time": 8.545646516606212} +{"Pretrain/Learning Rate": 1.527528599714988e-05, "Pretrain/Loss": 2.040243148803711, "Pretrain/Loss (Raw)": 2.079393148422241, "Pretrain/Step": 6088, "Pretrain/Step Time": 8.544846821576357} +{"Pretrain/Learning Rate": 1.5267465325381584e-05, "Pretrain/Loss": 2.040529727935791, "Pretrain/Loss (Raw)": 2.0028605461120605, "Pretrain/Step": 6089, "Pretrain/Step Time": 8.542038960382342} +{"Pretrain/Learning Rate": 1.5259645776015047e-05, "Pretrain/Loss": 2.0411906242370605, "Pretrain/Loss (Raw)": 2.071920156478882, "Pretrain/Step": 6090, "Pretrain/Step Time": 8.54890133626759} +{"Pretrain/Learning Rate": 1.5251827349952058e-05, "Pretrain/Loss": 2.0419044494628906, "Pretrain/Loss (Raw)": 2.1796774864196777, "Pretrain/Step": 6091, "Pretrain/Step Time": 8.550747610628605} +{"Pretrain/Learning Rate": 1.524401004809427e-05, "Pretrain/Loss": 2.041938304901123, "Pretrain/Loss (Raw)": 2.099358558654785, "Pretrain/Step": 6092, "Pretrain/Step Time": 8.548080964013934} +{"Pretrain/Learning Rate": 1.5236193871343224e-05, "Pretrain/Loss": 2.0420470237731934, "Pretrain/Loss (Raw)": 2.1102638244628906, "Pretrain/Step": 6093, "Pretrain/Step Time": 8.548016985878348} +{"Pretrain/Learning Rate": 1.5228378820600303e-05, "Pretrain/Loss": 2.0411548614501953, "Pretrain/Loss (Raw)": 1.8316192626953125, "Pretrain/Step": 6094, "Pretrain/Step Time": 8.546585753560066} +{"Pretrain/Learning Rate": 1.5220564896766784e-05, "Pretrain/Loss": 2.041144371032715, "Pretrain/Loss (Raw)": 2.172287702560425, "Pretrain/Step": 6095, "Pretrain/Step Time": 8.546206332743168} +{"Pretrain/Learning Rate": 1.52127521007438e-05, "Pretrain/Loss": 2.039142608642578, "Pretrain/Loss (Raw)": 1.7933111190795898, "Pretrain/Step": 6096, "Pretrain/Step Time": 8.544150102883577} +{"Pretrain/Learning Rate": 1.5204940433432368e-05, "Pretrain/Loss": 2.0378856658935547, "Pretrain/Loss (Raw)": 2.0855906009674072, "Pretrain/Step": 6097, "Pretrain/Step Time": 8.548435464501381} +{"Pretrain/Learning Rate": 1.5197129895733354e-05, "Pretrain/Loss": 2.038658857345581, "Pretrain/Loss (Raw)": 2.159546375274658, "Pretrain/Step": 6098, "Pretrain/Step Time": 8.551125910133123} +{"Pretrain/Learning Rate": 1.518932048854752e-05, "Pretrain/Loss": 2.0389013290405273, "Pretrain/Loss (Raw)": 1.8957568407058716, "Pretrain/Step": 6099, "Pretrain/Step Time": 8.547378873452544} +{"Pretrain/Learning Rate": 1.5181512212775472e-05, "Pretrain/Loss": 2.0361530780792236, "Pretrain/Loss (Raw)": 1.7636619806289673, "Pretrain/Step": 6100, "Pretrain/Step Time": 8.551173187792301} +{"Pretrain/Learning Rate": 1.5173705069317706e-05, "Pretrain/Loss": 2.033707857131958, "Pretrain/Loss (Raw)": 1.8423030376434326, "Pretrain/Step": 6101, "Pretrain/Step Time": 8.55082331597805} +{"Pretrain/Learning Rate": 1.5165899059074567e-05, "Pretrain/Loss": 2.033710479736328, "Pretrain/Loss (Raw)": 1.901423692703247, "Pretrain/Step": 6102, "Pretrain/Step Time": 8.549668414518237} +{"Pretrain/Learning Rate": 1.5158094182946298e-05, "Pretrain/Loss": 2.0283377170562744, "Pretrain/Loss (Raw)": 1.8264081478118896, "Pretrain/Step": 6103, "Pretrain/Step Time": 8.554494764655828} +{"Pretrain/Learning Rate": 1.5150290441832976e-05, "Pretrain/Loss": 2.030043125152588, "Pretrain/Loss (Raw)": 1.9590784311294556, "Pretrain/Step": 6104, "Pretrain/Step Time": 8.549734758213162} +{"Pretrain/Learning Rate": 1.5142487836634587e-05, "Pretrain/Loss": 2.0292649269104004, "Pretrain/Loss (Raw)": 2.015585422515869, "Pretrain/Step": 6105, "Pretrain/Step Time": 8.548045391216874} +{"Pretrain/Learning Rate": 1.5134686368250932e-05, "Pretrain/Loss": 2.0285770893096924, "Pretrain/Loss (Raw)": 1.8648793697357178, "Pretrain/Step": 6106, "Pretrain/Step Time": 8.549014709889889} +{"Pretrain/Learning Rate": 1.512688603758175e-05, "Pretrain/Loss": 2.029981851577759, "Pretrain/Loss (Raw)": 2.125823736190796, "Pretrain/Step": 6107, "Pretrain/Step Time": 8.547562342137098} +{"Pretrain/Learning Rate": 1.5119086845526576e-05, "Pretrain/Loss": 2.0306808948516846, "Pretrain/Loss (Raw)": 2.006049394607544, "Pretrain/Step": 6108, "Pretrain/Step Time": 8.546540264040232} +{"Pretrain/Learning Rate": 1.5111288792984884e-05, "Pretrain/Loss": 2.0300679206848145, "Pretrain/Loss (Raw)": 1.8904979228973389, "Pretrain/Step": 6109, "Pretrain/Step Time": 8.5500153824687} +{"Pretrain/Learning Rate": 1.5103491880855953e-05, "Pretrain/Loss": 2.028355360031128, "Pretrain/Loss (Raw)": 1.9160425662994385, "Pretrain/Step": 6110, "Pretrain/Step Time": 8.553097350522876} +{"Pretrain/Learning Rate": 1.5095696110038981e-05, "Pretrain/Loss": 2.027780532836914, "Pretrain/Loss (Raw)": 2.0133216381073, "Pretrain/Step": 6111, "Pretrain/Step Time": 8.552848102524877} +{"Pretrain/Learning Rate": 1.5087901481432993e-05, "Pretrain/Loss": 2.028099775314331, "Pretrain/Loss (Raw)": 2.0563814640045166, "Pretrain/Step": 6112, "Pretrain/Step Time": 8.551976339891553} +{"Pretrain/Learning Rate": 1.5080107995936929e-05, "Pretrain/Loss": 2.0260748863220215, "Pretrain/Loss (Raw)": 1.8555067777633667, "Pretrain/Step": 6113, "Pretrain/Step Time": 8.555724456906319} +{"Pretrain/Learning Rate": 1.5072315654449543e-05, "Pretrain/Loss": 2.0274529457092285, "Pretrain/Loss (Raw)": 2.1748783588409424, "Pretrain/Step": 6114, "Pretrain/Step Time": 8.554435931146145} +{"Pretrain/Learning Rate": 1.5064524457869506e-05, "Pretrain/Loss": 2.025468349456787, "Pretrain/Loss (Raw)": 1.6910330057144165, "Pretrain/Step": 6115, "Pretrain/Step Time": 8.560448372736573} +{"Pretrain/Learning Rate": 1.5056734407095316e-05, "Pretrain/Loss": 2.023077964782715, "Pretrain/Loss (Raw)": 2.0465798377990723, "Pretrain/Step": 6116, "Pretrain/Step Time": 8.551801392808557} +{"Pretrain/Learning Rate": 1.5048945503025375e-05, "Pretrain/Loss": 2.0252459049224854, "Pretrain/Loss (Raw)": 2.22597599029541, "Pretrain/Step": 6117, "Pretrain/Step Time": 8.550094464793801} +{"Pretrain/Learning Rate": 1.5041157746557924e-05, "Pretrain/Loss": 2.0237650871276855, "Pretrain/Loss (Raw)": 1.8224890232086182, "Pretrain/Step": 6118, "Pretrain/Step Time": 8.551216239109635} +{"Pretrain/Learning Rate": 1.5033371138591095e-05, "Pretrain/Loss": 2.023818016052246, "Pretrain/Loss (Raw)": 2.033156394958496, "Pretrain/Step": 6119, "Pretrain/Step Time": 8.549296751618385} +{"Pretrain/Learning Rate": 1.5025585680022866e-05, "Pretrain/Loss": 2.0199928283691406, "Pretrain/Loss (Raw)": 1.762439489364624, "Pretrain/Step": 6120, "Pretrain/Step Time": 8.548330495133996} +{"Pretrain/Learning Rate": 1.50178013717511e-05, "Pretrain/Loss": 2.018509864807129, "Pretrain/Loss (Raw)": 2.119980573654175, "Pretrain/Step": 6121, "Pretrain/Step Time": 8.557683296501637} +{"Pretrain/Learning Rate": 1.5010018214673515e-05, "Pretrain/Loss": 2.01737642288208, "Pretrain/Loss (Raw)": 1.938309669494629, "Pretrain/Step": 6122, "Pretrain/Step Time": 8.546618955209851} +{"Pretrain/Learning Rate": 1.5002236209687709e-05, "Pretrain/Loss": 2.0172877311706543, "Pretrain/Loss (Raw)": 1.8239903450012207, "Pretrain/Step": 6123, "Pretrain/Step Time": 8.546537052839994} +{"Pretrain/Learning Rate": 1.4994455357691128e-05, "Pretrain/Loss": 2.017871141433716, "Pretrain/Loss (Raw)": 2.1533095836639404, "Pretrain/Step": 6124, "Pretrain/Step Time": 8.546761944890022} +{"Pretrain/Learning Rate": 1.4986675659581103e-05, "Pretrain/Loss": 2.0179309844970703, "Pretrain/Loss (Raw)": 1.9489481449127197, "Pretrain/Step": 6125, "Pretrain/Step Time": 8.546039981767535} +{"Pretrain/Learning Rate": 1.4978897116254832e-05, "Pretrain/Loss": 2.0184202194213867, "Pretrain/Loss (Raw)": 1.940689206123352, "Pretrain/Step": 6126, "Pretrain/Step Time": 8.54522622935474} +{"Pretrain/Learning Rate": 1.4971119728609359e-05, "Pretrain/Loss": 2.019371509552002, "Pretrain/Loss (Raw)": 2.1823365688323975, "Pretrain/Step": 6127, "Pretrain/Step Time": 8.547095652669668} +{"Pretrain/Learning Rate": 1.4963343497541621e-05, "Pretrain/Loss": 2.0180110931396484, "Pretrain/Loss (Raw)": 2.1323091983795166, "Pretrain/Step": 6128, "Pretrain/Step Time": 8.544335534796119} +{"Pretrain/Learning Rate": 1.4955568423948402e-05, "Pretrain/Loss": 2.0200107097625732, "Pretrain/Loss (Raw)": 1.966886281967163, "Pretrain/Step": 6129, "Pretrain/Step Time": 8.546212676912546} +{"Pretrain/Learning Rate": 1.494779450872637e-05, "Pretrain/Loss": 2.01838755607605, "Pretrain/Loss (Raw)": 2.025942087173462, "Pretrain/Step": 6130, "Pretrain/Step Time": 8.54630921408534} +{"Pretrain/Learning Rate": 1.4940021752772034e-05, "Pretrain/Loss": 2.0195839405059814, "Pretrain/Loss (Raw)": 1.987939476966858, "Pretrain/Step": 6131, "Pretrain/Step Time": 8.551139488816261} +{"Pretrain/Learning Rate": 1.4932250156981803e-05, "Pretrain/Loss": 2.021592855453491, "Pretrain/Loss (Raw)": 2.022498607635498, "Pretrain/Step": 6132, "Pretrain/Step Time": 8.552993100136518} +{"Pretrain/Learning Rate": 1.4924479722251916e-05, "Pretrain/Loss": 2.020984172821045, "Pretrain/Loss (Raw)": 2.0702080726623535, "Pretrain/Step": 6133, "Pretrain/Step Time": 8.559416139498353} +{"Pretrain/Learning Rate": 1.4916710449478511e-05, "Pretrain/Loss": 2.019096851348877, "Pretrain/Loss (Raw)": 1.8996940851211548, "Pretrain/Step": 6134, "Pretrain/Step Time": 8.54647540487349} +{"Pretrain/Learning Rate": 1.4908942339557564e-05, "Pretrain/Loss": 2.0155189037323, "Pretrain/Loss (Raw)": 2.0749013423919678, "Pretrain/Step": 6135, "Pretrain/Step Time": 8.551885575056076} +{"Pretrain/Learning Rate": 1.4901175393384944e-05, "Pretrain/Loss": 2.017543315887451, "Pretrain/Loss (Raw)": 2.2145755290985107, "Pretrain/Step": 6136, "Pretrain/Step Time": 8.54933337494731} +{"Pretrain/Learning Rate": 1.4893409611856362e-05, "Pretrain/Loss": 2.016751289367676, "Pretrain/Loss (Raw)": 2.107832908630371, "Pretrain/Step": 6137, "Pretrain/Step Time": 8.547846212983131} +{"Pretrain/Learning Rate": 1.488564499586741e-05, "Pretrain/Loss": 2.0153281688690186, "Pretrain/Loss (Raw)": 1.7995507717132568, "Pretrain/Step": 6138, "Pretrain/Step Time": 8.553899317979813} +{"Pretrain/Learning Rate": 1.4877881546313532e-05, "Pretrain/Loss": 2.016378879547119, "Pretrain/Loss (Raw)": 2.1113572120666504, "Pretrain/Step": 6139, "Pretrain/Step Time": 8.556227207183838} +{"Pretrain/Learning Rate": 1.4870119264090057e-05, "Pretrain/Loss": 2.016805648803711, "Pretrain/Loss (Raw)": 2.090348958969116, "Pretrain/Step": 6140, "Pretrain/Step Time": 8.548567861318588} +{"Pretrain/Learning Rate": 1.4862358150092157e-05, "Pretrain/Loss": 2.0176610946655273, "Pretrain/Loss (Raw)": 2.0989205837249756, "Pretrain/Step": 6141, "Pretrain/Step Time": 8.550483768805861} +{"Pretrain/Learning Rate": 1.485459820521489e-05, "Pretrain/Loss": 2.0206267833709717, "Pretrain/Loss (Raw)": 2.5752172470092773, "Pretrain/Step": 6142, "Pretrain/Step Time": 8.542489795014262} +{"Pretrain/Learning Rate": 1.484683943035316e-05, "Pretrain/Loss": 2.020831823348999, "Pretrain/Loss (Raw)": 2.1003940105438232, "Pretrain/Step": 6143, "Pretrain/Step Time": 8.546726278960705} +{"Pretrain/Learning Rate": 1.4839081826401755e-05, "Pretrain/Loss": 2.021419048309326, "Pretrain/Loss (Raw)": 2.1990177631378174, "Pretrain/Step": 6144, "Pretrain/Step Time": 8.543617635965347} +{"Pretrain/Learning Rate": 1.4831325394255307e-05, "Pretrain/Loss": 2.022277355194092, "Pretrain/Loss (Raw)": 2.15102481842041, "Pretrain/Step": 6145, "Pretrain/Step Time": 8.54989785887301} +{"Pretrain/Learning Rate": 1.4823570134808342e-05, "Pretrain/Loss": 2.0224294662475586, "Pretrain/Loss (Raw)": 1.918415904045105, "Pretrain/Step": 6146, "Pretrain/Step Time": 8.546675637364388} +{"Pretrain/Learning Rate": 1.4815816048955208e-05, "Pretrain/Loss": 2.0242748260498047, "Pretrain/Loss (Raw)": 2.1410038471221924, "Pretrain/Step": 6147, "Pretrain/Step Time": 8.554541261866689} +{"Pretrain/Learning Rate": 1.4808063137590172e-05, "Pretrain/Loss": 2.0263783931732178, "Pretrain/Loss (Raw)": 2.108684539794922, "Pretrain/Step": 6148, "Pretrain/Step Time": 8.553575230762362} +{"Pretrain/Learning Rate": 1.4800311401607304e-05, "Pretrain/Loss": 2.027209997177124, "Pretrain/Loss (Raw)": 2.1654646396636963, "Pretrain/Step": 6149, "Pretrain/Step Time": 8.55372628942132} +{"Pretrain/Learning Rate": 1.4792560841900604e-05, "Pretrain/Loss": 2.0274062156677246, "Pretrain/Loss (Raw)": 2.081300973892212, "Pretrain/Step": 6150, "Pretrain/Step Time": 8.555794415995479} +{"Pretrain/Learning Rate": 1.4784811459363873e-05, "Pretrain/Loss": 2.027888536453247, "Pretrain/Loss (Raw)": 2.150259017944336, "Pretrain/Step": 6151, "Pretrain/Step Time": 8.55820375867188} +{"Pretrain/Learning Rate": 1.4777063254890833e-05, "Pretrain/Loss": 2.028355836868286, "Pretrain/Loss (Raw)": 1.9149694442749023, "Pretrain/Step": 6152, "Pretrain/Step Time": 8.558363679796457} +{"Pretrain/Learning Rate": 1.4769316229375012e-05, "Pretrain/Loss": 2.0266242027282715, "Pretrain/Loss (Raw)": 2.054030418395996, "Pretrain/Step": 6153, "Pretrain/Step Time": 8.560987200587988} +{"Pretrain/Learning Rate": 1.4761570383709871e-05, "Pretrain/Loss": 2.025496006011963, "Pretrain/Loss (Raw)": 2.03033185005188, "Pretrain/Step": 6154, "Pretrain/Step Time": 8.56070901080966} +{"Pretrain/Learning Rate": 1.4753825718788667e-05, "Pretrain/Loss": 2.0243139266967773, "Pretrain/Loss (Raw)": 2.036311149597168, "Pretrain/Step": 6155, "Pretrain/Step Time": 8.565050272271037} +{"Pretrain/Learning Rate": 1.4746082235504572e-05, "Pretrain/Loss": 2.023867607116699, "Pretrain/Loss (Raw)": 1.956441044807434, "Pretrain/Step": 6156, "Pretrain/Step Time": 8.56251472979784} +{"Pretrain/Learning Rate": 1.4738339934750584e-05, "Pretrain/Loss": 2.0243642330169678, "Pretrain/Loss (Raw)": 2.013254404067993, "Pretrain/Step": 6157, "Pretrain/Step Time": 8.56898008659482} +{"Pretrain/Learning Rate": 1.4730598817419593e-05, "Pretrain/Loss": 2.0237433910369873, "Pretrain/Loss (Raw)": 2.1058661937713623, "Pretrain/Step": 6158, "Pretrain/Step Time": 8.55917153507471} +{"Pretrain/Learning Rate": 1.4722858884404333e-05, "Pretrain/Loss": 2.029287576675415, "Pretrain/Loss (Raw)": 2.385835886001587, "Pretrain/Step": 6159, "Pretrain/Step Time": 8.565253708511591} +{"Pretrain/Learning Rate": 1.4715120136597421e-05, "Pretrain/Loss": 2.027895450592041, "Pretrain/Loss (Raw)": 2.155144691467285, "Pretrain/Step": 6160, "Pretrain/Step Time": 8.563126400113106} +{"Pretrain/Learning Rate": 1.4707382574891312e-05, "Pretrain/Loss": 2.0272350311279297, "Pretrain/Loss (Raw)": 2.1124722957611084, "Pretrain/Step": 6161, "Pretrain/Step Time": 8.564040768891573} +{"Pretrain/Learning Rate": 1.4699646200178353e-05, "Pretrain/Loss": 2.0275707244873047, "Pretrain/Loss (Raw)": 2.0326521396636963, "Pretrain/Step": 6162, "Pretrain/Step Time": 8.563355602324009} +{"Pretrain/Learning Rate": 1.469191101335072e-05, "Pretrain/Loss": 2.026191473007202, "Pretrain/Loss (Raw)": 1.9693886041641235, "Pretrain/Step": 6163, "Pretrain/Step Time": 8.569831417873502} +{"Pretrain/Learning Rate": 1.4684177015300491e-05, "Pretrain/Loss": 2.028564453125, "Pretrain/Loss (Raw)": 2.2971391677856445, "Pretrain/Step": 6164, "Pretrain/Step Time": 8.558300033211708} +{"Pretrain/Learning Rate": 1.467644420691957e-05, "Pretrain/Loss": 2.0304527282714844, "Pretrain/Loss (Raw)": 2.1800827980041504, "Pretrain/Step": 6165, "Pretrain/Step Time": 8.566139355301857} +{"Pretrain/Learning Rate": 1.4668712589099753e-05, "Pretrain/Loss": 2.02748441696167, "Pretrain/Loss (Raw)": 1.6557912826538086, "Pretrain/Step": 6166, "Pretrain/Step Time": 8.557852052152157} +{"Pretrain/Learning Rate": 1.466098216273269e-05, "Pretrain/Loss": 2.0286197662353516, "Pretrain/Loss (Raw)": 2.1922073364257812, "Pretrain/Step": 6167, "Pretrain/Step Time": 8.560532500967383} +{"Pretrain/Learning Rate": 1.465325292870987e-05, "Pretrain/Loss": 2.0328664779663086, "Pretrain/Loss (Raw)": 2.1041646003723145, "Pretrain/Step": 6168, "Pretrain/Step Time": 8.554601868614554} +{"Pretrain/Learning Rate": 1.464552488792269e-05, "Pretrain/Loss": 2.033998966217041, "Pretrain/Loss (Raw)": 2.2193551063537598, "Pretrain/Step": 6169, "Pretrain/Step Time": 8.565860204398632} +{"Pretrain/Learning Rate": 1.4637798041262363e-05, "Pretrain/Loss": 2.0340170860290527, "Pretrain/Loss (Raw)": 2.023138999938965, "Pretrain/Step": 6170, "Pretrain/Step Time": 8.560387233272195} +{"Pretrain/Learning Rate": 1.4630072389620003e-05, "Pretrain/Loss": 2.0349812507629395, "Pretrain/Loss (Raw)": 2.1308741569519043, "Pretrain/Step": 6171, "Pretrain/Step Time": 8.560201486572623} +{"Pretrain/Learning Rate": 1.462234793388655e-05, "Pretrain/Loss": 2.036630153656006, "Pretrain/Loss (Raw)": 2.3629255294799805, "Pretrain/Step": 6172, "Pretrain/Step Time": 8.557423090562224} +{"Pretrain/Learning Rate": 1.4614624674952842e-05, "Pretrain/Loss": 2.0356364250183105, "Pretrain/Loss (Raw)": 1.9101192951202393, "Pretrain/Step": 6173, "Pretrain/Step Time": 8.555933335795999} +{"Pretrain/Learning Rate": 1.460690261370955e-05, "Pretrain/Loss": 2.0371365547180176, "Pretrain/Loss (Raw)": 2.158701181411743, "Pretrain/Step": 6174, "Pretrain/Step Time": 8.558110293000937} +{"Pretrain/Learning Rate": 1.4599181751047225e-05, "Pretrain/Loss": 2.038954734802246, "Pretrain/Loss (Raw)": 2.082519769668579, "Pretrain/Step": 6175, "Pretrain/Step Time": 8.561293611302972} +{"Pretrain/Learning Rate": 1.4591462087856262e-05, "Pretrain/Loss": 2.040158748626709, "Pretrain/Loss (Raw)": 2.232886552810669, "Pretrain/Step": 6176, "Pretrain/Step Time": 8.554712731391191} +{"Pretrain/Learning Rate": 1.4583743625026958e-05, "Pretrain/Loss": 2.0418624877929688, "Pretrain/Loss (Raw)": 2.1778500080108643, "Pretrain/Step": 6177, "Pretrain/Step Time": 8.555930122733116} +{"Pretrain/Learning Rate": 1.4576026363449402e-05, "Pretrain/Loss": 2.0410194396972656, "Pretrain/Loss (Raw)": 2.0525918006896973, "Pretrain/Step": 6178, "Pretrain/Step Time": 8.559873502701521} +{"Pretrain/Learning Rate": 1.4568310304013613e-05, "Pretrain/Loss": 2.0417754650115967, "Pretrain/Loss (Raw)": 2.0780560970306396, "Pretrain/Step": 6179, "Pretrain/Step Time": 8.557589961215854} +{"Pretrain/Learning Rate": 1.4560595447609427e-05, "Pretrain/Loss": 2.042020559310913, "Pretrain/Loss (Raw)": 2.0486741065979004, "Pretrain/Step": 6180, "Pretrain/Step Time": 8.56263417750597} +{"Pretrain/Learning Rate": 1.4552881795126588e-05, "Pretrain/Loss": 2.043761730194092, "Pretrain/Loss (Raw)": 1.9591797590255737, "Pretrain/Step": 6181, "Pretrain/Step Time": 8.567062763497233} +{"Pretrain/Learning Rate": 1.4545169347454627e-05, "Pretrain/Loss": 2.0446054935455322, "Pretrain/Loss (Raw)": 2.065758466720581, "Pretrain/Step": 6182, "Pretrain/Step Time": 8.557956878095865} +{"Pretrain/Learning Rate": 1.453745810548301e-05, "Pretrain/Loss": 2.04504656791687, "Pretrain/Loss (Raw)": 2.1097590923309326, "Pretrain/Step": 6183, "Pretrain/Step Time": 8.56257962435484} +{"Pretrain/Learning Rate": 1.452974807010103e-05, "Pretrain/Loss": 2.0451066493988037, "Pretrain/Loss (Raw)": 1.9296468496322632, "Pretrain/Step": 6184, "Pretrain/Step Time": 8.555833116173744} +{"Pretrain/Learning Rate": 1.4522039242197835e-05, "Pretrain/Loss": 2.0442354679107666, "Pretrain/Loss (Raw)": 2.044513463973999, "Pretrain/Step": 6185, "Pretrain/Step Time": 8.555507818236947} +{"Pretrain/Learning Rate": 1.4514331622662441e-05, "Pretrain/Loss": 2.0438268184661865, "Pretrain/Loss (Raw)": 1.9528216123580933, "Pretrain/Step": 6186, "Pretrain/Step Time": 8.55849409289658} +{"Pretrain/Learning Rate": 1.4506625212383743e-05, "Pretrain/Loss": 2.044283390045166, "Pretrain/Loss (Raw)": 2.1407973766326904, "Pretrain/Step": 6187, "Pretrain/Step Time": 8.553967325016856} +{"Pretrain/Learning Rate": 1.4498920012250472e-05, "Pretrain/Loss": 2.0471556186676025, "Pretrain/Loss (Raw)": 2.1058833599090576, "Pretrain/Step": 6188, "Pretrain/Step Time": 8.55606634542346} +{"Pretrain/Learning Rate": 1.449121602315123e-05, "Pretrain/Loss": 2.0490071773529053, "Pretrain/Loss (Raw)": 2.0961215496063232, "Pretrain/Step": 6189, "Pretrain/Step Time": 8.55893912166357} +{"Pretrain/Learning Rate": 1.4483513245974461e-05, "Pretrain/Loss": 2.0468225479125977, "Pretrain/Loss (Raw)": 1.795317530632019, "Pretrain/Step": 6190, "Pretrain/Step Time": 8.554402912035584} +{"Pretrain/Learning Rate": 1.4475811681608515e-05, "Pretrain/Loss": 2.048650026321411, "Pretrain/Loss (Raw)": 2.1826272010803223, "Pretrain/Step": 6191, "Pretrain/Step Time": 8.554668996483088} +{"Pretrain/Learning Rate": 1.4468111330941556e-05, "Pretrain/Loss": 2.0492501258850098, "Pretrain/Loss (Raw)": 2.0825042724609375, "Pretrain/Step": 6192, "Pretrain/Step Time": 8.558596644550562} +{"Pretrain/Learning Rate": 1.4460412194861624e-05, "Pretrain/Loss": 2.0506114959716797, "Pretrain/Loss (Raw)": 2.1605470180511475, "Pretrain/Step": 6193, "Pretrain/Step Time": 8.556672658771276} +{"Pretrain/Learning Rate": 1.4452714274256612e-05, "Pretrain/Loss": 2.0461068153381348, "Pretrain/Loss (Raw)": 1.9198386669158936, "Pretrain/Step": 6194, "Pretrain/Step Time": 8.55445908382535} +{"Pretrain/Learning Rate": 1.4445017570014303e-05, "Pretrain/Loss": 2.0428192615509033, "Pretrain/Loss (Raw)": 1.8530806303024292, "Pretrain/Step": 6195, "Pretrain/Step Time": 8.558579931035638} +{"Pretrain/Learning Rate": 1.4437322083022304e-05, "Pretrain/Loss": 2.0425281524658203, "Pretrain/Loss (Raw)": 1.9731208086013794, "Pretrain/Step": 6196, "Pretrain/Step Time": 8.550198327749968} +{"Pretrain/Learning Rate": 1.4429627814168095e-05, "Pretrain/Loss": 2.0415406227111816, "Pretrain/Loss (Raw)": 1.846445083618164, "Pretrain/Step": 6197, "Pretrain/Step Time": 8.55550867319107} +{"Pretrain/Learning Rate": 1.4421934764339004e-05, "Pretrain/Loss": 2.0403833389282227, "Pretrain/Loss (Raw)": 1.9334293603897095, "Pretrain/Step": 6198, "Pretrain/Step Time": 8.557722937315702} +{"Pretrain/Learning Rate": 1.4414242934422251e-05, "Pretrain/Loss": 2.0406956672668457, "Pretrain/Loss (Raw)": 1.8692882061004639, "Pretrain/Step": 6199, "Pretrain/Step Time": 8.554120905697346} +{"Pretrain/Learning Rate": 1.440655232530489e-05, "Pretrain/Loss": 2.040879726409912, "Pretrain/Loss (Raw)": 2.0479230880737305, "Pretrain/Step": 6200, "Pretrain/Step Time": 8.560162140056491} +{"Pretrain/Learning Rate": 1.4398862937873825e-05, "Pretrain/Loss": 2.040463924407959, "Pretrain/Loss (Raw)": 2.001530170440674, "Pretrain/Step": 6201, "Pretrain/Step Time": 8.556547734886408} +{"Pretrain/Learning Rate": 1.4391174773015836e-05, "Pretrain/Loss": 2.0400588512420654, "Pretrain/Loss (Raw)": 1.964002251625061, "Pretrain/Step": 6202, "Pretrain/Step Time": 8.550125880166888} +{"Pretrain/Learning Rate": 1.4383487831617571e-05, "Pretrain/Loss": 2.04217529296875, "Pretrain/Loss (Raw)": 2.3283331394195557, "Pretrain/Step": 6203, "Pretrain/Step Time": 8.551685651764274} +{"Pretrain/Learning Rate": 1.4375802114565515e-05, "Pretrain/Loss": 2.042907953262329, "Pretrain/Loss (Raw)": 2.153292179107666, "Pretrain/Step": 6204, "Pretrain/Step Time": 8.552077086642385} +{"Pretrain/Learning Rate": 1.4368117622746025e-05, "Pretrain/Loss": 2.0448453426361084, "Pretrain/Loss (Raw)": 2.1265430450439453, "Pretrain/Step": 6205, "Pretrain/Step Time": 8.547678666189313} +{"Pretrain/Learning Rate": 1.4360434357045294e-05, "Pretrain/Loss": 2.0435705184936523, "Pretrain/Loss (Raw)": 1.9702820777893066, "Pretrain/Step": 6206, "Pretrain/Step Time": 8.554919593036175} +{"Pretrain/Learning Rate": 1.4352752318349421e-05, "Pretrain/Loss": 2.0453248023986816, "Pretrain/Loss (Raw)": 2.1494297981262207, "Pretrain/Step": 6207, "Pretrain/Step Time": 8.555337781086564} +{"Pretrain/Learning Rate": 1.4345071507544326e-05, "Pretrain/Loss": 2.044126033782959, "Pretrain/Loss (Raw)": 1.9926789999008179, "Pretrain/Step": 6208, "Pretrain/Step Time": 8.554892571642995} +{"Pretrain/Learning Rate": 1.4337391925515777e-05, "Pretrain/Loss": 2.042611837387085, "Pretrain/Loss (Raw)": 1.8358228206634521, "Pretrain/Step": 6209, "Pretrain/Step Time": 8.557794956490397} +{"Pretrain/Learning Rate": 1.432971357314945e-05, "Pretrain/Loss": 2.041444778442383, "Pretrain/Loss (Raw)": 2.049544334411621, "Pretrain/Step": 6210, "Pretrain/Step Time": 8.56102418154478} +{"Pretrain/Learning Rate": 1.4322036451330828e-05, "Pretrain/Loss": 2.040242910385132, "Pretrain/Loss (Raw)": 1.8481260538101196, "Pretrain/Step": 6211, "Pretrain/Step Time": 8.558152904734015} +{"Pretrain/Learning Rate": 1.4314360560945284e-05, "Pretrain/Loss": 2.039912223815918, "Pretrain/Loss (Raw)": 1.9900091886520386, "Pretrain/Step": 6212, "Pretrain/Step Time": 8.567669274285436} +{"Pretrain/Learning Rate": 1.430668590287802e-05, "Pretrain/Loss": 2.0377368927001953, "Pretrain/Loss (Raw)": 1.9797732830047607, "Pretrain/Step": 6213, "Pretrain/Step Time": 8.55898816511035} +{"Pretrain/Learning Rate": 1.4299012478014146e-05, "Pretrain/Loss": 2.0395760536193848, "Pretrain/Loss (Raw)": 2.203476905822754, "Pretrain/Step": 6214, "Pretrain/Step Time": 8.556486424058676} +{"Pretrain/Learning Rate": 1.4291340287238558e-05, "Pretrain/Loss": 2.037592887878418, "Pretrain/Loss (Raw)": 1.9002490043640137, "Pretrain/Step": 6215, "Pretrain/Step Time": 8.558267610147595} +{"Pretrain/Learning Rate": 1.4283669331436078e-05, "Pretrain/Loss": 2.0367865562438965, "Pretrain/Loss (Raw)": 1.9761872291564941, "Pretrain/Step": 6216, "Pretrain/Step Time": 8.56080793403089} +{"Pretrain/Learning Rate": 1.4275999611491342e-05, "Pretrain/Loss": 2.0365123748779297, "Pretrain/Loss (Raw)": 1.9677822589874268, "Pretrain/Step": 6217, "Pretrain/Step Time": 8.56066737510264} +{"Pretrain/Learning Rate": 1.4268331128288881e-05, "Pretrain/Loss": 2.0366621017456055, "Pretrain/Loss (Raw)": 2.0910451412200928, "Pretrain/Step": 6218, "Pretrain/Step Time": 8.559059316292405} +{"Pretrain/Learning Rate": 1.4260663882713022e-05, "Pretrain/Loss": 2.034359931945801, "Pretrain/Loss (Raw)": 1.8850129842758179, "Pretrain/Step": 6219, "Pretrain/Step Time": 8.554995881393552} +{"Pretrain/Learning Rate": 1.4252997875648021e-05, "Pretrain/Loss": 2.0344247817993164, "Pretrain/Loss (Raw)": 2.107663869857788, "Pretrain/Step": 6220, "Pretrain/Step Time": 8.55529166944325} +{"Pretrain/Learning Rate": 1.4245333107977937e-05, "Pretrain/Loss": 2.037689447402954, "Pretrain/Loss (Raw)": 2.5281500816345215, "Pretrain/Step": 6221, "Pretrain/Step Time": 8.557036025449634} +{"Pretrain/Learning Rate": 1.4237669580586736e-05, "Pretrain/Loss": 2.0390095710754395, "Pretrain/Loss (Raw)": 2.0005831718444824, "Pretrain/Step": 6222, "Pretrain/Step Time": 8.557355552911758} +{"Pretrain/Learning Rate": 1.4230007294358173e-05, "Pretrain/Loss": 2.0364537239074707, "Pretrain/Loss (Raw)": 1.8451677560806274, "Pretrain/Step": 6223, "Pretrain/Step Time": 8.558684838935733} +{"Pretrain/Learning Rate": 1.4222346250175928e-05, "Pretrain/Loss": 2.0385875701904297, "Pretrain/Loss (Raw)": 2.0664215087890625, "Pretrain/Step": 6224, "Pretrain/Step Time": 8.559934493154287} +{"Pretrain/Learning Rate": 1.4214686448923498e-05, "Pretrain/Loss": 2.039301872253418, "Pretrain/Loss (Raw)": 2.1770074367523193, "Pretrain/Step": 6225, "Pretrain/Step Time": 8.55696115270257} +{"Pretrain/Learning Rate": 1.420702789148425e-05, "Pretrain/Loss": 2.0383119583129883, "Pretrain/Loss (Raw)": 2.0328218936920166, "Pretrain/Step": 6226, "Pretrain/Step Time": 8.55787475220859} +{"Pretrain/Learning Rate": 1.4199370578741395e-05, "Pretrain/Loss": 2.042646646499634, "Pretrain/Loss (Raw)": 2.450639247894287, "Pretrain/Step": 6227, "Pretrain/Step Time": 8.556633478030562} +{"Pretrain/Learning Rate": 1.419171451157803e-05, "Pretrain/Loss": 2.04467511177063, "Pretrain/Loss (Raw)": 2.0232808589935303, "Pretrain/Step": 6228, "Pretrain/Step Time": 8.553796108812094} +{"Pretrain/Learning Rate": 1.4184059690877075e-05, "Pretrain/Loss": 2.046327590942383, "Pretrain/Loss (Raw)": 2.0538506507873535, "Pretrain/Step": 6229, "Pretrain/Step Time": 8.558475390076637} +{"Pretrain/Learning Rate": 1.4176406117521324e-05, "Pretrain/Loss": 2.047722816467285, "Pretrain/Loss (Raw)": 2.0799808502197266, "Pretrain/Step": 6230, "Pretrain/Step Time": 8.560306329280138} +{"Pretrain/Learning Rate": 1.4168753792393414e-05, "Pretrain/Loss": 2.048875570297241, "Pretrain/Loss (Raw)": 1.9739657640457153, "Pretrain/Step": 6231, "Pretrain/Step Time": 8.559034019708633} +{"Pretrain/Learning Rate": 1.4161102716375863e-05, "Pretrain/Loss": 2.050502300262451, "Pretrain/Loss (Raw)": 2.167318344116211, "Pretrain/Step": 6232, "Pretrain/Step Time": 8.561760526150465} +{"Pretrain/Learning Rate": 1.4153452890351022e-05, "Pretrain/Loss": 2.050011157989502, "Pretrain/Loss (Raw)": 1.9526921510696411, "Pretrain/Step": 6233, "Pretrain/Step Time": 8.562161838635802} +{"Pretrain/Learning Rate": 1.41458043152011e-05, "Pretrain/Loss": 2.0509207248687744, "Pretrain/Loss (Raw)": 1.9813107252120972, "Pretrain/Step": 6234, "Pretrain/Step Time": 8.557194605469704} +{"Pretrain/Learning Rate": 1.4138156991808165e-05, "Pretrain/Loss": 2.0491533279418945, "Pretrain/Loss (Raw)": 1.899632453918457, "Pretrain/Step": 6235, "Pretrain/Step Time": 8.560623290017247} +{"Pretrain/Learning Rate": 1.4130510921054157e-05, "Pretrain/Loss": 2.0479679107666016, "Pretrain/Loss (Raw)": 1.8542864322662354, "Pretrain/Step": 6236, "Pretrain/Step Time": 8.559398353099823} +{"Pretrain/Learning Rate": 1.4122866103820854e-05, "Pretrain/Loss": 2.0485167503356934, "Pretrain/Loss (Raw)": 1.9607518911361694, "Pretrain/Step": 6237, "Pretrain/Step Time": 8.555210104212165} +{"Pretrain/Learning Rate": 1.411522254098988e-05, "Pretrain/Loss": 2.0490100383758545, "Pretrain/Loss (Raw)": 1.9791970252990723, "Pretrain/Step": 6238, "Pretrain/Step Time": 8.555776225402951} +{"Pretrain/Learning Rate": 1.4107580233442725e-05, "Pretrain/Loss": 2.049668788909912, "Pretrain/Loss (Raw)": 2.097625732421875, "Pretrain/Step": 6239, "Pretrain/Step Time": 8.554041104391217} +{"Pretrain/Learning Rate": 1.4099939182060755e-05, "Pretrain/Loss": 2.0498287677764893, "Pretrain/Loss (Raw)": 2.0768821239471436, "Pretrain/Step": 6240, "Pretrain/Step Time": 8.551316507160664} +{"Pretrain/Learning Rate": 1.409229938772516e-05, "Pretrain/Loss": 2.0519585609436035, "Pretrain/Loss (Raw)": 2.1281158924102783, "Pretrain/Step": 6241, "Pretrain/Step Time": 8.54425398260355} +{"Pretrain/Learning Rate": 1.4084660851316999e-05, "Pretrain/Loss": 2.0519533157348633, "Pretrain/Loss (Raw)": 2.174184560775757, "Pretrain/Step": 6242, "Pretrain/Step Time": 8.549858445301652} +{"Pretrain/Learning Rate": 1.4077023573717174e-05, "Pretrain/Loss": 2.0546011924743652, "Pretrain/Loss (Raw)": 2.029999256134033, "Pretrain/Step": 6243, "Pretrain/Step Time": 8.54479931294918} +{"Pretrain/Learning Rate": 1.4069387555806473e-05, "Pretrain/Loss": 2.0555620193481445, "Pretrain/Loss (Raw)": 2.1695284843444824, "Pretrain/Step": 6244, "Pretrain/Step Time": 8.552972611039877} +{"Pretrain/Learning Rate": 1.4061752798465503e-05, "Pretrain/Loss": 2.0551276206970215, "Pretrain/Loss (Raw)": 2.170370101928711, "Pretrain/Step": 6245, "Pretrain/Step Time": 8.554785698652267} +{"Pretrain/Learning Rate": 1.4054119302574741e-05, "Pretrain/Loss": 2.0573620796203613, "Pretrain/Loss (Raw)": 2.108487367630005, "Pretrain/Step": 6246, "Pretrain/Step Time": 8.550873523578048} +{"Pretrain/Learning Rate": 1.4046487069014513e-05, "Pretrain/Loss": 2.0590310096740723, "Pretrain/Loss (Raw)": 2.2468152046203613, "Pretrain/Step": 6247, "Pretrain/Step Time": 8.550883498042822} +{"Pretrain/Learning Rate": 1.403885609866502e-05, "Pretrain/Loss": 2.0637590885162354, "Pretrain/Loss (Raw)": 2.3676319122314453, "Pretrain/Step": 6248, "Pretrain/Step Time": 8.55003579519689} +{"Pretrain/Learning Rate": 1.4031226392406293e-05, "Pretrain/Loss": 2.0627517700195312, "Pretrain/Loss (Raw)": 1.9910446405410767, "Pretrain/Step": 6249, "Pretrain/Step Time": 8.554205894470215} +{"Pretrain/Learning Rate": 1.4023597951118217e-05, "Pretrain/Loss": 2.0642104148864746, "Pretrain/Loss (Raw)": 2.125013589859009, "Pretrain/Step": 6250, "Pretrain/Step Time": 8.558053858578205} +{"Pretrain/Learning Rate": 1.4015970775680554e-05, "Pretrain/Loss": 2.065778970718384, "Pretrain/Loss (Raw)": 2.0247700214385986, "Pretrain/Step": 6251, "Pretrain/Step Time": 8.553487360477448} +{"Pretrain/Learning Rate": 1.4008344866972902e-05, "Pretrain/Loss": 2.064223051071167, "Pretrain/Loss (Raw)": 1.9541521072387695, "Pretrain/Step": 6252, "Pretrain/Step Time": 8.554430970922112} +{"Pretrain/Learning Rate": 1.4000720225874714e-05, "Pretrain/Loss": 2.0650482177734375, "Pretrain/Loss (Raw)": 2.054553985595703, "Pretrain/Step": 6253, "Pretrain/Step Time": 8.554841378703713} +{"Pretrain/Learning Rate": 1.399309685326529e-05, "Pretrain/Loss": 2.064758062362671, "Pretrain/Loss (Raw)": 1.9035533666610718, "Pretrain/Step": 6254, "Pretrain/Step Time": 8.556329121813178} +{"Pretrain/Learning Rate": 1.3985474750023821e-05, "Pretrain/Loss": 2.0642168521881104, "Pretrain/Loss (Raw)": 2.1130638122558594, "Pretrain/Step": 6255, "Pretrain/Step Time": 8.561054594814777} +{"Pretrain/Learning Rate": 1.3977853917029287e-05, "Pretrain/Loss": 2.064054489135742, "Pretrain/Loss (Raw)": 2.111522674560547, "Pretrain/Step": 6256, "Pretrain/Step Time": 8.555877588689327} +{"Pretrain/Learning Rate": 1.3970234355160588e-05, "Pretrain/Loss": 2.0667524337768555, "Pretrain/Loss (Raw)": 2.312229871749878, "Pretrain/Step": 6257, "Pretrain/Step Time": 8.554483655840158} +{"Pretrain/Learning Rate": 1.3962616065296428e-05, "Pretrain/Loss": 2.0674855709075928, "Pretrain/Loss (Raw)": 2.119776725769043, "Pretrain/Step": 6258, "Pretrain/Step Time": 8.558029057458043} +{"Pretrain/Learning Rate": 1.395499904831541e-05, "Pretrain/Loss": 2.0668015480041504, "Pretrain/Loss (Raw)": 1.9004144668579102, "Pretrain/Step": 6259, "Pretrain/Step Time": 8.553984194993973} +{"Pretrain/Learning Rate": 1.394738330509593e-05, "Pretrain/Loss": 2.06695556640625, "Pretrain/Loss (Raw)": 2.0421900749206543, "Pretrain/Step": 6260, "Pretrain/Step Time": 8.556380331516266} +{"Pretrain/Learning Rate": 1.3939768836516299e-05, "Pretrain/Loss": 2.066465377807617, "Pretrain/Loss (Raw)": 2.0074892044067383, "Pretrain/Step": 6261, "Pretrain/Step Time": 8.553050553426147} +{"Pretrain/Learning Rate": 1.393215564345463e-05, "Pretrain/Loss": 2.067695140838623, "Pretrain/Loss (Raw)": 2.057093381881714, "Pretrain/Step": 6262, "Pretrain/Step Time": 8.561939420178533} +{"Pretrain/Learning Rate": 1.3924543726788953e-05, "Pretrain/Loss": 2.070004463195801, "Pretrain/Loss (Raw)": 2.3705008029937744, "Pretrain/Step": 6263, "Pretrain/Step Time": 8.558174712583423} +{"Pretrain/Learning Rate": 1.3916933087397055e-05, "Pretrain/Loss": 2.0687875747680664, "Pretrain/Loss (Raw)": 2.0588126182556152, "Pretrain/Step": 6264, "Pretrain/Step Time": 8.557250758633018} +{"Pretrain/Learning Rate": 1.3909323726156672e-05, "Pretrain/Loss": 2.067772150039673, "Pretrain/Loss (Raw)": 1.9778454303741455, "Pretrain/Step": 6265, "Pretrain/Step Time": 8.558560330420732} +{"Pretrain/Learning Rate": 1.3901715643945337e-05, "Pretrain/Loss": 2.068854570388794, "Pretrain/Loss (Raw)": 1.9380898475646973, "Pretrain/Step": 6266, "Pretrain/Step Time": 8.557983495295048} +{"Pretrain/Learning Rate": 1.3894108841640452e-05, "Pretrain/Loss": 2.0678763389587402, "Pretrain/Loss (Raw)": 1.9861520528793335, "Pretrain/Step": 6267, "Pretrain/Step Time": 8.555248429998755} +{"Pretrain/Learning Rate": 1.3886503320119256e-05, "Pretrain/Loss": 2.066443681716919, "Pretrain/Loss (Raw)": 1.9069697856903076, "Pretrain/Step": 6268, "Pretrain/Step Time": 8.560119537636638} +{"Pretrain/Learning Rate": 1.3878899080258878e-05, "Pretrain/Loss": 2.0682320594787598, "Pretrain/Loss (Raw)": 2.327842950820923, "Pretrain/Step": 6269, "Pretrain/Step Time": 8.55741143040359} +{"Pretrain/Learning Rate": 1.3871296122936261e-05, "Pretrain/Loss": 2.06430721282959, "Pretrain/Loss (Raw)": 2.0728065967559814, "Pretrain/Step": 6270, "Pretrain/Step Time": 8.56146796606481} +{"Pretrain/Learning Rate": 1.3863694449028214e-05, "Pretrain/Loss": 2.0653812885284424, "Pretrain/Loss (Raw)": 2.237896203994751, "Pretrain/Step": 6271, "Pretrain/Step Time": 8.561236528679729} +{"Pretrain/Learning Rate": 1.3856094059411392e-05, "Pretrain/Loss": 2.0638153553009033, "Pretrain/Loss (Raw)": 1.9985699653625488, "Pretrain/Step": 6272, "Pretrain/Step Time": 8.560501676052809} +{"Pretrain/Learning Rate": 1.3848494954962324e-05, "Pretrain/Loss": 2.062828779220581, "Pretrain/Loss (Raw)": 2.0247621536254883, "Pretrain/Step": 6273, "Pretrain/Step Time": 8.55552783422172} +{"Pretrain/Learning Rate": 1.3840897136557366e-05, "Pretrain/Loss": 2.0633230209350586, "Pretrain/Loss (Raw)": 1.9816704988479614, "Pretrain/Step": 6274, "Pretrain/Step Time": 8.560285553336143} +{"Pretrain/Learning Rate": 1.383330060507273e-05, "Pretrain/Loss": 2.063070297241211, "Pretrain/Loss (Raw)": 2.1086618900299072, "Pretrain/Step": 6275, "Pretrain/Step Time": 8.553432231768966} +{"Pretrain/Learning Rate": 1.382570536138448e-05, "Pretrain/Loss": 2.062880039215088, "Pretrain/Loss (Raw)": 2.0843071937561035, "Pretrain/Step": 6276, "Pretrain/Step Time": 8.550145626068115} +{"Pretrain/Learning Rate": 1.3818111406368555e-05, "Pretrain/Loss": 2.0623855590820312, "Pretrain/Loss (Raw)": 2.102179527282715, "Pretrain/Step": 6277, "Pretrain/Step Time": 8.550089372321963} +{"Pretrain/Learning Rate": 1.381051874090071e-05, "Pretrain/Loss": 2.0618093013763428, "Pretrain/Loss (Raw)": 2.007542371749878, "Pretrain/Step": 6278, "Pretrain/Step Time": 8.549608577042818} +{"Pretrain/Learning Rate": 1.3802927365856571e-05, "Pretrain/Loss": 2.0602712631225586, "Pretrain/Loss (Raw)": 1.9533631801605225, "Pretrain/Step": 6279, "Pretrain/Step Time": 8.552211336791515} +{"Pretrain/Learning Rate": 1.3795337282111604e-05, "Pretrain/Loss": 2.0607354640960693, "Pretrain/Loss (Raw)": 1.9744114875793457, "Pretrain/Step": 6280, "Pretrain/Step Time": 8.552954114973545} +{"Pretrain/Learning Rate": 1.3787748490541144e-05, "Pretrain/Loss": 2.0607924461364746, "Pretrain/Loss (Raw)": 2.061326026916504, "Pretrain/Step": 6281, "Pretrain/Step Time": 8.54569530300796} +{"Pretrain/Learning Rate": 1.3780160992020364e-05, "Pretrain/Loss": 2.0603625774383545, "Pretrain/Loss (Raw)": 1.9753135442733765, "Pretrain/Step": 6282, "Pretrain/Step Time": 8.541763335466385} +{"Pretrain/Learning Rate": 1.3772574787424291e-05, "Pretrain/Loss": 2.06242299079895, "Pretrain/Loss (Raw)": 2.3000433444976807, "Pretrain/Step": 6283, "Pretrain/Step Time": 8.538900872692466} +{"Pretrain/Learning Rate": 1.3764989877627785e-05, "Pretrain/Loss": 2.062074661254883, "Pretrain/Loss (Raw)": 1.9118382930755615, "Pretrain/Step": 6284, "Pretrain/Step Time": 8.539142264053226} +{"Pretrain/Learning Rate": 1.3757406263505602e-05, "Pretrain/Loss": 2.0629124641418457, "Pretrain/Loss (Raw)": 2.1205053329467773, "Pretrain/Step": 6285, "Pretrain/Step Time": 8.537612896412611} +{"Pretrain/Learning Rate": 1.37498239459323e-05, "Pretrain/Loss": 2.0614945888519287, "Pretrain/Loss (Raw)": 1.924353003501892, "Pretrain/Step": 6286, "Pretrain/Step Time": 8.54152380488813} +{"Pretrain/Learning Rate": 1.3742242925782317e-05, "Pretrain/Loss": 2.0606932640075684, "Pretrain/Loss (Raw)": 2.2832820415496826, "Pretrain/Step": 6287, "Pretrain/Step Time": 8.540178753435612} +{"Pretrain/Learning Rate": 1.3734663203929916e-05, "Pretrain/Loss": 2.060483455657959, "Pretrain/Loss (Raw)": 2.128290891647339, "Pretrain/Step": 6288, "Pretrain/Step Time": 8.540719512850046} +{"Pretrain/Learning Rate": 1.372708478124925e-05, "Pretrain/Loss": 2.060922622680664, "Pretrain/Loss (Raw)": 2.1686818599700928, "Pretrain/Step": 6289, "Pretrain/Step Time": 8.53689762018621} +{"Pretrain/Learning Rate": 1.3719507658614284e-05, "Pretrain/Loss": 2.058969497680664, "Pretrain/Loss (Raw)": 1.7826505899429321, "Pretrain/Step": 6290, "Pretrain/Step Time": 8.538764441385865} +{"Pretrain/Learning Rate": 1.3711931836898842e-05, "Pretrain/Loss": 2.060060977935791, "Pretrain/Loss (Raw)": 2.1091065406799316, "Pretrain/Step": 6291, "Pretrain/Step Time": 8.541826281696558} +{"Pretrain/Learning Rate": 1.3704357316976623e-05, "Pretrain/Loss": 2.0580615997314453, "Pretrain/Loss (Raw)": 2.041236639022827, "Pretrain/Step": 6292, "Pretrain/Step Time": 8.545837001875043} +{"Pretrain/Learning Rate": 1.3696784099721143e-05, "Pretrain/Loss": 2.058530330657959, "Pretrain/Loss (Raw)": 2.240077018737793, "Pretrain/Step": 6293, "Pretrain/Step Time": 8.542780980467796} +{"Pretrain/Learning Rate": 1.3689212186005784e-05, "Pretrain/Loss": 2.0622336864471436, "Pretrain/Loss (Raw)": 2.129805564880371, "Pretrain/Step": 6294, "Pretrain/Step Time": 8.54419724456966} +{"Pretrain/Learning Rate": 1.3681641576703763e-05, "Pretrain/Loss": 2.061728000640869, "Pretrain/Loss (Raw)": 2.1274898052215576, "Pretrain/Step": 6295, "Pretrain/Step Time": 8.546684922650456} +{"Pretrain/Learning Rate": 1.3674072272688182e-05, "Pretrain/Loss": 2.061840057373047, "Pretrain/Loss (Raw)": 2.118478536605835, "Pretrain/Step": 6296, "Pretrain/Step Time": 8.545339953154325} +{"Pretrain/Learning Rate": 1.3666504274831954e-05, "Pretrain/Loss": 2.0612919330596924, "Pretrain/Loss (Raw)": 2.1491987705230713, "Pretrain/Step": 6297, "Pretrain/Step Time": 8.539542939513922} +{"Pretrain/Learning Rate": 1.3658937584007859e-05, "Pretrain/Loss": 2.0573790073394775, "Pretrain/Loss (Raw)": 1.5223034620285034, "Pretrain/Step": 6298, "Pretrain/Step Time": 8.541576309129596} +{"Pretrain/Learning Rate": 1.3651372201088508e-05, "Pretrain/Loss": 2.0564427375793457, "Pretrain/Loss (Raw)": 2.0110301971435547, "Pretrain/Step": 6299, "Pretrain/Step Time": 8.541242079809308} +{"Pretrain/Learning Rate": 1.3643808126946417e-05, "Pretrain/Loss": 2.0535998344421387, "Pretrain/Loss (Raw)": 1.9990267753601074, "Pretrain/Step": 6300, "Pretrain/Step Time": 8.54196147993207} +{"Pretrain/Learning Rate": 1.3636245362453865e-05, "Pretrain/Loss": 2.0546178817749023, "Pretrain/Loss (Raw)": 2.04044246673584, "Pretrain/Step": 6301, "Pretrain/Step Time": 8.548428820446134} +{"Pretrain/Learning Rate": 1.3628683908483054e-05, "Pretrain/Loss": 2.0510592460632324, "Pretrain/Loss (Raw)": 1.703194499015808, "Pretrain/Step": 6302, "Pretrain/Step Time": 8.547721726819873} +{"Pretrain/Learning Rate": 1.3621123765905985e-05, "Pretrain/Loss": 2.050983428955078, "Pretrain/Loss (Raw)": 2.072798252105713, "Pretrain/Step": 6303, "Pretrain/Step Time": 8.547172144055367} +{"Pretrain/Learning Rate": 1.3613564935594565e-05, "Pretrain/Loss": 2.0494027137756348, "Pretrain/Loss (Raw)": 2.0305769443511963, "Pretrain/Step": 6304, "Pretrain/Step Time": 8.549813935533166} +{"Pretrain/Learning Rate": 1.3606007418420472e-05, "Pretrain/Loss": 2.049032688140869, "Pretrain/Loss (Raw)": 2.1304614543914795, "Pretrain/Step": 6305, "Pretrain/Step Time": 8.549422577023506} +{"Pretrain/Learning Rate": 1.3598451215255303e-05, "Pretrain/Loss": 2.0483193397521973, "Pretrain/Loss (Raw)": 1.9612904787063599, "Pretrain/Step": 6306, "Pretrain/Step Time": 8.547400675714016} +{"Pretrain/Learning Rate": 1.3590896326970465e-05, "Pretrain/Loss": 2.048704147338867, "Pretrain/Loss (Raw)": 2.1273105144500732, "Pretrain/Step": 6307, "Pretrain/Step Time": 8.550354799255729} +{"Pretrain/Learning Rate": 1.3583342754437226e-05, "Pretrain/Loss": 2.049488067626953, "Pretrain/Loss (Raw)": 2.1490368843078613, "Pretrain/Step": 6308, "Pretrain/Step Time": 8.543153071776032} +{"Pretrain/Learning Rate": 1.3575790498526687e-05, "Pretrain/Loss": 2.0504863262176514, "Pretrain/Loss (Raw)": 2.0869319438934326, "Pretrain/Step": 6309, "Pretrain/Step Time": 8.543196821585298} +{"Pretrain/Learning Rate": 1.356823956010983e-05, "Pretrain/Loss": 2.0494399070739746, "Pretrain/Loss (Raw)": 1.9318372011184692, "Pretrain/Step": 6310, "Pretrain/Step Time": 8.546023722738028} +{"Pretrain/Learning Rate": 1.3560689940057453e-05, "Pretrain/Loss": 2.0480294227600098, "Pretrain/Loss (Raw)": 1.9292019605636597, "Pretrain/Step": 6311, "Pretrain/Step Time": 8.549294631928205} +{"Pretrain/Learning Rate": 1.3553141639240218e-05, "Pretrain/Loss": 2.0479862689971924, "Pretrain/Loss (Raw)": 1.9241241216659546, "Pretrain/Step": 6312, "Pretrain/Step Time": 8.546115327626467} +{"Pretrain/Learning Rate": 1.354559465852862e-05, "Pretrain/Loss": 2.0477757453918457, "Pretrain/Loss (Raw)": 2.017570734024048, "Pretrain/Step": 6313, "Pretrain/Step Time": 8.548447001725435} +{"Pretrain/Learning Rate": 1.353804899879303e-05, "Pretrain/Loss": 2.047327995300293, "Pretrain/Loss (Raw)": 1.8954942226409912, "Pretrain/Step": 6314, "Pretrain/Step Time": 8.546318346634507} +{"Pretrain/Learning Rate": 1.3530504660903637e-05, "Pretrain/Loss": 2.04693865776062, "Pretrain/Loss (Raw)": 2.090986490249634, "Pretrain/Step": 6315, "Pretrain/Step Time": 8.549192378297448} +{"Pretrain/Learning Rate": 1.3522961645730498e-05, "Pretrain/Loss": 2.0463483333587646, "Pretrain/Loss (Raw)": 2.030308961868286, "Pretrain/Step": 6316, "Pretrain/Step Time": 8.54616660811007} +{"Pretrain/Learning Rate": 1.3515419954143489e-05, "Pretrain/Loss": 2.0460307598114014, "Pretrain/Loss (Raw)": 2.0554728507995605, "Pretrain/Step": 6317, "Pretrain/Step Time": 8.54914815351367} +{"Pretrain/Learning Rate": 1.3507879587012378e-05, "Pretrain/Loss": 2.0477864742279053, "Pretrain/Loss (Raw)": 2.020049810409546, "Pretrain/Step": 6318, "Pretrain/Step Time": 8.547376276925206} +{"Pretrain/Learning Rate": 1.3500340545206747e-05, "Pretrain/Loss": 2.0451254844665527, "Pretrain/Loss (Raw)": 1.8420032262802124, "Pretrain/Step": 6319, "Pretrain/Step Time": 8.551717886701226} +{"Pretrain/Learning Rate": 1.3492802829596035e-05, "Pretrain/Loss": 2.045051336288452, "Pretrain/Loss (Raw)": 2.0730342864990234, "Pretrain/Step": 6320, "Pretrain/Step Time": 8.544759688898921} +{"Pretrain/Learning Rate": 1.348526644104951e-05, "Pretrain/Loss": 2.044863224029541, "Pretrain/Loss (Raw)": 2.136475086212158, "Pretrain/Step": 6321, "Pretrain/Step Time": 8.554324463009834} +{"Pretrain/Learning Rate": 1.3477731380436332e-05, "Pretrain/Loss": 2.046541213989258, "Pretrain/Loss (Raw)": 2.1345877647399902, "Pretrain/Step": 6322, "Pretrain/Step Time": 8.552947761490941} +{"Pretrain/Learning Rate": 1.3470197648625463e-05, "Pretrain/Loss": 2.0483899116516113, "Pretrain/Loss (Raw)": 2.089750051498413, "Pretrain/Step": 6323, "Pretrain/Step Time": 8.55116518959403} +{"Pretrain/Learning Rate": 1.3462665246485734e-05, "Pretrain/Loss": 2.047269105911255, "Pretrain/Loss (Raw)": 1.8296457529067993, "Pretrain/Step": 6324, "Pretrain/Step Time": 8.549043755978346} +{"Pretrain/Learning Rate": 1.3455134174885802e-05, "Pretrain/Loss": 2.0474138259887695, "Pretrain/Loss (Raw)": 1.8649455308914185, "Pretrain/Step": 6325, "Pretrain/Step Time": 8.549876730889082} +{"Pretrain/Learning Rate": 1.3447604434694207e-05, "Pretrain/Loss": 2.0481791496276855, "Pretrain/Loss (Raw)": 2.031412363052368, "Pretrain/Step": 6326, "Pretrain/Step Time": 8.55158151499927} +{"Pretrain/Learning Rate": 1.3440076026779309e-05, "Pretrain/Loss": 2.0482165813446045, "Pretrain/Loss (Raw)": 1.8740938901901245, "Pretrain/Step": 6327, "Pretrain/Step Time": 8.56298847682774} +{"Pretrain/Learning Rate": 1.3432548952009313e-05, "Pretrain/Loss": 2.048250675201416, "Pretrain/Loss (Raw)": 2.0522913932800293, "Pretrain/Step": 6328, "Pretrain/Step Time": 8.555924063548446} +{"Pretrain/Learning Rate": 1.3425023211252272e-05, "Pretrain/Loss": 2.051297187805176, "Pretrain/Loss (Raw)": 2.391441822052002, "Pretrain/Step": 6329, "Pretrain/Step Time": 8.554947759956121} +{"Pretrain/Learning Rate": 1.3417498805376105e-05, "Pretrain/Loss": 2.0510833263397217, "Pretrain/Loss (Raw)": 1.9366464614868164, "Pretrain/Step": 6330, "Pretrain/Step Time": 8.556422751396894} +{"Pretrain/Learning Rate": 1.3409975735248556e-05, "Pretrain/Loss": 2.0484042167663574, "Pretrain/Loss (Raw)": 1.9854098558425903, "Pretrain/Step": 6331, "Pretrain/Step Time": 8.555125758051872} +{"Pretrain/Learning Rate": 1.3402454001737209e-05, "Pretrain/Loss": 2.048621654510498, "Pretrain/Loss (Raw)": 2.181123733520508, "Pretrain/Step": 6332, "Pretrain/Step Time": 8.555613255128264} +{"Pretrain/Learning Rate": 1.3394933605709525e-05, "Pretrain/Loss": 2.0484416484832764, "Pretrain/Loss (Raw)": 2.1034960746765137, "Pretrain/Step": 6333, "Pretrain/Step Time": 8.55808875337243} +{"Pretrain/Learning Rate": 1.3387414548032783e-05, "Pretrain/Loss": 2.0495712757110596, "Pretrain/Loss (Raw)": 2.114877462387085, "Pretrain/Step": 6334, "Pretrain/Step Time": 8.558871634304523} +{"Pretrain/Learning Rate": 1.3379896829574115e-05, "Pretrain/Loss": 2.0496177673339844, "Pretrain/Loss (Raw)": 2.1553750038146973, "Pretrain/Step": 6335, "Pretrain/Step Time": 8.553959511220455} +{"Pretrain/Learning Rate": 1.337238045120049e-05, "Pretrain/Loss": 2.0513651371002197, "Pretrain/Loss (Raw)": 2.216355085372925, "Pretrain/Step": 6336, "Pretrain/Step Time": 8.552416894584894} +{"Pretrain/Learning Rate": 1.3364865413778755e-05, "Pretrain/Loss": 2.052915096282959, "Pretrain/Loss (Raw)": 2.034205913543701, "Pretrain/Step": 6337, "Pretrain/Step Time": 8.555200524628162} +{"Pretrain/Learning Rate": 1.3357351718175564e-05, "Pretrain/Loss": 2.0537242889404297, "Pretrain/Loss (Raw)": 2.1531448364257812, "Pretrain/Step": 6338, "Pretrain/Step Time": 8.558099444955587} +{"Pretrain/Learning Rate": 1.3349839365257438e-05, "Pretrain/Loss": 2.0559260845184326, "Pretrain/Loss (Raw)": 2.1299500465393066, "Pretrain/Step": 6339, "Pretrain/Step Time": 8.563147004693747} +{"Pretrain/Learning Rate": 1.3342328355890721e-05, "Pretrain/Loss": 2.0558552742004395, "Pretrain/Loss (Raw)": 1.9809142351150513, "Pretrain/Step": 6340, "Pretrain/Step Time": 8.556029612198472} +{"Pretrain/Learning Rate": 1.3334818690941652e-05, "Pretrain/Loss": 2.0563302040100098, "Pretrain/Loss (Raw)": 2.0405960083007812, "Pretrain/Step": 6341, "Pretrain/Step Time": 8.552234573289752} +{"Pretrain/Learning Rate": 1.332731037127624e-05, "Pretrain/Loss": 2.054687738418579, "Pretrain/Loss (Raw)": 1.9932186603546143, "Pretrain/Step": 6342, "Pretrain/Step Time": 8.558686638250947} +{"Pretrain/Learning Rate": 1.3319803397760408e-05, "Pretrain/Loss": 2.0562422275543213, "Pretrain/Loss (Raw)": 2.099233627319336, "Pretrain/Step": 6343, "Pretrain/Step Time": 8.556989511474967} +{"Pretrain/Learning Rate": 1.331229777125988e-05, "Pretrain/Loss": 2.0560057163238525, "Pretrain/Loss (Raw)": 1.9459280967712402, "Pretrain/Step": 6344, "Pretrain/Step Time": 8.55780011229217} +{"Pretrain/Learning Rate": 1.3304793492640263e-05, "Pretrain/Loss": 2.0556552410125732, "Pretrain/Loss (Raw)": 1.9228957891464233, "Pretrain/Step": 6345, "Pretrain/Step Time": 8.559834286570549} +{"Pretrain/Learning Rate": 1.329729056276695e-05, "Pretrain/Loss": 2.0545363426208496, "Pretrain/Loss (Raw)": 1.9478540420532227, "Pretrain/Step": 6346, "Pretrain/Step Time": 8.553215617313981} +{"Pretrain/Learning Rate": 1.328978898250525e-05, "Pretrain/Loss": 2.055783271789551, "Pretrain/Loss (Raw)": 2.0446274280548096, "Pretrain/Step": 6347, "Pretrain/Step Time": 8.55713490396738} +{"Pretrain/Learning Rate": 1.3282288752720262e-05, "Pretrain/Loss": 2.0529205799102783, "Pretrain/Loss (Raw)": 1.7412267923355103, "Pretrain/Step": 6348, "Pretrain/Step Time": 8.553321078419685} +{"Pretrain/Learning Rate": 1.3274789874276949e-05, "Pretrain/Loss": 2.050563097000122, "Pretrain/Loss (Raw)": 2.226374626159668, "Pretrain/Step": 6349, "Pretrain/Step Time": 8.552598109468818} +{"Pretrain/Learning Rate": 1.3267292348040111e-05, "Pretrain/Loss": 2.0519800186157227, "Pretrain/Loss (Raw)": 2.181938886642456, "Pretrain/Step": 6350, "Pretrain/Step Time": 8.551265474408865} +{"Pretrain/Learning Rate": 1.3259796174874411e-05, "Pretrain/Loss": 2.0538508892059326, "Pretrain/Loss (Raw)": 2.0846445560455322, "Pretrain/Step": 6351, "Pretrain/Step Time": 8.553000781685114} +{"Pretrain/Learning Rate": 1.3252301355644341e-05, "Pretrain/Loss": 2.0532021522521973, "Pretrain/Loss (Raw)": 1.9834041595458984, "Pretrain/Step": 6352, "Pretrain/Step Time": 8.555543448776007} +{"Pretrain/Learning Rate": 1.324480789121424e-05, "Pretrain/Loss": 2.0498950481414795, "Pretrain/Loss (Raw)": 1.753687858581543, "Pretrain/Step": 6353, "Pretrain/Step Time": 8.55415416508913} +{"Pretrain/Learning Rate": 1.323731578244827e-05, "Pretrain/Loss": 2.050126552581787, "Pretrain/Loss (Raw)": 2.062471628189087, "Pretrain/Step": 6354, "Pretrain/Step Time": 8.552964519709349} +{"Pretrain/Learning Rate": 1.3229825030210482e-05, "Pretrain/Loss": 2.046884298324585, "Pretrain/Loss (Raw)": 2.035625696182251, "Pretrain/Step": 6355, "Pretrain/Step Time": 8.55304971896112} +{"Pretrain/Learning Rate": 1.3222335635364736e-05, "Pretrain/Loss": 2.0483922958374023, "Pretrain/Loss (Raw)": 2.216270685195923, "Pretrain/Step": 6356, "Pretrain/Step Time": 8.549098474904895} +{"Pretrain/Learning Rate": 1.3214847598774744e-05, "Pretrain/Loss": 2.047657012939453, "Pretrain/Loss (Raw)": 1.9597724676132202, "Pretrain/Step": 6357, "Pretrain/Step Time": 8.551598763093352} +{"Pretrain/Learning Rate": 1.3207360921304046e-05, "Pretrain/Loss": 2.0467700958251953, "Pretrain/Loss (Raw)": 1.9664403200149536, "Pretrain/Step": 6358, "Pretrain/Step Time": 8.558764351531863} +{"Pretrain/Learning Rate": 1.319987560381607e-05, "Pretrain/Loss": 2.048323631286621, "Pretrain/Loss (Raw)": 2.1728243827819824, "Pretrain/Step": 6359, "Pretrain/Step Time": 8.54896279424429} +{"Pretrain/Learning Rate": 1.319239164717404e-05, "Pretrain/Loss": 2.045988082885742, "Pretrain/Loss (Raw)": 1.8683414459228516, "Pretrain/Step": 6360, "Pretrain/Step Time": 8.547359416261315} +{"Pretrain/Learning Rate": 1.3184909052241046e-05, "Pretrain/Loss": 2.045133113861084, "Pretrain/Loss (Raw)": 1.8432502746582031, "Pretrain/Step": 6361, "Pretrain/Step Time": 8.547927068546414} +{"Pretrain/Learning Rate": 1.3177427819880002e-05, "Pretrain/Loss": 2.046145439147949, "Pretrain/Loss (Raw)": 2.1109185218811035, "Pretrain/Step": 6362, "Pretrain/Step Time": 8.553527800366282} +{"Pretrain/Learning Rate": 1.3169947950953704e-05, "Pretrain/Loss": 2.0500268936157227, "Pretrain/Loss (Raw)": 2.396458864212036, "Pretrain/Step": 6363, "Pretrain/Step Time": 8.550870165228844} +{"Pretrain/Learning Rate": 1.3162469446324755e-05, "Pretrain/Loss": 2.053102970123291, "Pretrain/Loss (Raw)": 2.2480077743530273, "Pretrain/Step": 6364, "Pretrain/Step Time": 8.556355457752943} +{"Pretrain/Learning Rate": 1.3154992306855607e-05, "Pretrain/Loss": 2.054837703704834, "Pretrain/Loss (Raw)": 2.182798385620117, "Pretrain/Step": 6365, "Pretrain/Step Time": 8.551573313772678} +{"Pretrain/Learning Rate": 1.3147516533408552e-05, "Pretrain/Loss": 2.0546114444732666, "Pretrain/Loss (Raw)": 1.9502540826797485, "Pretrain/Step": 6366, "Pretrain/Step Time": 8.551467046141624} +{"Pretrain/Learning Rate": 1.3140042126845753e-05, "Pretrain/Loss": 2.054737091064453, "Pretrain/Loss (Raw)": 2.1136927604675293, "Pretrain/Step": 6367, "Pretrain/Step Time": 8.550906397402287} +{"Pretrain/Learning Rate": 1.3132569088029179e-05, "Pretrain/Loss": 2.0546460151672363, "Pretrain/Loss (Raw)": 2.065223455429077, "Pretrain/Step": 6368, "Pretrain/Step Time": 8.554341649636626} +{"Pretrain/Learning Rate": 1.312509741782066e-05, "Pretrain/Loss": 2.0514440536499023, "Pretrain/Loss (Raw)": 1.718273401260376, "Pretrain/Step": 6369, "Pretrain/Step Time": 8.555556494742632} +{"Pretrain/Learning Rate": 1.3117627117081854e-05, "Pretrain/Loss": 2.049485206604004, "Pretrain/Loss (Raw)": 1.9234594106674194, "Pretrain/Step": 6370, "Pretrain/Step Time": 8.556389398872852} +{"Pretrain/Learning Rate": 1.3110158186674293e-05, "Pretrain/Loss": 2.049471616744995, "Pretrain/Loss (Raw)": 2.0282676219940186, "Pretrain/Step": 6371, "Pretrain/Step Time": 8.55557339079678} +{"Pretrain/Learning Rate": 1.3102690627459314e-05, "Pretrain/Loss": 2.0479683876037598, "Pretrain/Loss (Raw)": 1.9770961999893188, "Pretrain/Step": 6372, "Pretrain/Step Time": 8.551541624590755} +{"Pretrain/Learning Rate": 1.30952244402981e-05, "Pretrain/Loss": 2.045024871826172, "Pretrain/Loss (Raw)": 1.7936153411865234, "Pretrain/Step": 6373, "Pretrain/Step Time": 8.554811766371131} +{"Pretrain/Learning Rate": 1.3087759626051716e-05, "Pretrain/Loss": 2.043407678604126, "Pretrain/Loss (Raw)": 1.9014800786972046, "Pretrain/Step": 6374, "Pretrain/Step Time": 8.557573862373829} +{"Pretrain/Learning Rate": 1.308029618558102e-05, "Pretrain/Loss": 2.042123317718506, "Pretrain/Loss (Raw)": 2.082392454147339, "Pretrain/Step": 6375, "Pretrain/Step Time": 8.553960673511028} +{"Pretrain/Learning Rate": 1.3072834119746741e-05, "Pretrain/Loss": 2.038989782333374, "Pretrain/Loss (Raw)": 1.9665554761886597, "Pretrain/Step": 6376, "Pretrain/Step Time": 8.56430446729064} +{"Pretrain/Learning Rate": 1.3065373429409419e-05, "Pretrain/Loss": 2.040712356567383, "Pretrain/Loss (Raw)": 2.2115612030029297, "Pretrain/Step": 6377, "Pretrain/Step Time": 8.556742120534182} +{"Pretrain/Learning Rate": 1.3057914115429482e-05, "Pretrain/Loss": 2.03812313079834, "Pretrain/Loss (Raw)": 1.7935727834701538, "Pretrain/Step": 6378, "Pretrain/Step Time": 8.55583638139069} +{"Pretrain/Learning Rate": 1.3050456178667165e-05, "Pretrain/Loss": 2.0373499393463135, "Pretrain/Loss (Raw)": 1.9258078336715698, "Pretrain/Step": 6379, "Pretrain/Step Time": 8.555821502581239} +{"Pretrain/Learning Rate": 1.3042999619982546e-05, "Pretrain/Loss": 2.040567398071289, "Pretrain/Loss (Raw)": 2.365992784500122, "Pretrain/Step": 6380, "Pretrain/Step Time": 8.555154170840979} +{"Pretrain/Learning Rate": 1.3035544440235548e-05, "Pretrain/Loss": 2.039128065109253, "Pretrain/Loss (Raw)": 1.87031090259552, "Pretrain/Step": 6381, "Pretrain/Step Time": 8.555040182545781} +{"Pretrain/Learning Rate": 1.3028090640285958e-05, "Pretrain/Loss": 2.040523052215576, "Pretrain/Loss (Raw)": 2.0821309089660645, "Pretrain/Step": 6382, "Pretrain/Step Time": 8.560830110684037} +{"Pretrain/Learning Rate": 1.3020638220993353e-05, "Pretrain/Loss": 2.0406253337860107, "Pretrain/Loss (Raw)": 2.126136064529419, "Pretrain/Step": 6383, "Pretrain/Step Time": 8.551168842241168} +{"Pretrain/Learning Rate": 1.3013187183217206e-05, "Pretrain/Loss": 2.0388922691345215, "Pretrain/Loss (Raw)": 1.889673113822937, "Pretrain/Step": 6384, "Pretrain/Step Time": 8.554716981947422} +{"Pretrain/Learning Rate": 1.3005737527816786e-05, "Pretrain/Loss": 2.0360679626464844, "Pretrain/Loss (Raw)": 1.9507524967193604, "Pretrain/Step": 6385, "Pretrain/Step Time": 8.552407961338758} +{"Pretrain/Learning Rate": 1.2998289255651253e-05, "Pretrain/Loss": 2.036229372024536, "Pretrain/Loss (Raw)": 2.140413999557495, "Pretrain/Step": 6386, "Pretrain/Step Time": 8.548723485320807} +{"Pretrain/Learning Rate": 1.2990842367579539e-05, "Pretrain/Loss": 2.0355212688446045, "Pretrain/Loss (Raw)": 1.8098045587539673, "Pretrain/Step": 6387, "Pretrain/Step Time": 8.549283880740404} +{"Pretrain/Learning Rate": 1.2983396864460482e-05, "Pretrain/Loss": 2.0367207527160645, "Pretrain/Loss (Raw)": 2.1957032680511475, "Pretrain/Step": 6388, "Pretrain/Step Time": 8.554003722965717} +{"Pretrain/Learning Rate": 1.2975952747152709e-05, "Pretrain/Loss": 2.037688732147217, "Pretrain/Loss (Raw)": 2.1313977241516113, "Pretrain/Step": 6389, "Pretrain/Step Time": 8.5516784992069} +{"Pretrain/Learning Rate": 1.2968510016514749e-05, "Pretrain/Loss": 2.0372722148895264, "Pretrain/Loss (Raw)": 2.0037777423858643, "Pretrain/Step": 6390, "Pretrain/Step Time": 8.545402966439724} +{"Pretrain/Learning Rate": 1.2961068673404886e-05, "Pretrain/Loss": 2.0338382720947266, "Pretrain/Loss (Raw)": 1.9309521913528442, "Pretrain/Step": 6391, "Pretrain/Step Time": 8.546921417117119} +{"Pretrain/Learning Rate": 1.295362871868132e-05, "Pretrain/Loss": 2.032594680786133, "Pretrain/Loss (Raw)": 1.8996310234069824, "Pretrain/Step": 6392, "Pretrain/Step Time": 8.550086097791791} +{"Pretrain/Learning Rate": 1.2946190153202059e-05, "Pretrain/Loss": 2.0331735610961914, "Pretrain/Loss (Raw)": 2.05195689201355, "Pretrain/Step": 6393, "Pretrain/Step Time": 8.547902010381222} +{"Pretrain/Learning Rate": 1.2938752977824947e-05, "Pretrain/Loss": 2.0348756313323975, "Pretrain/Loss (Raw)": 2.155953884124756, "Pretrain/Step": 6394, "Pretrain/Step Time": 8.548667313531041} +{"Pretrain/Learning Rate": 1.2931317193407665e-05, "Pretrain/Loss": 2.0352559089660645, "Pretrain/Loss (Raw)": 2.034823417663574, "Pretrain/Step": 6395, "Pretrain/Step Time": 8.545833170413971} +{"Pretrain/Learning Rate": 1.2923882800807768e-05, "Pretrain/Loss": 2.0374202728271484, "Pretrain/Loss (Raw)": 2.183999538421631, "Pretrain/Step": 6396, "Pretrain/Step Time": 8.542094899341464} +{"Pretrain/Learning Rate": 1.2916449800882607e-05, "Pretrain/Loss": 2.034360885620117, "Pretrain/Loss (Raw)": 1.9362611770629883, "Pretrain/Step": 6397, "Pretrain/Step Time": 8.545947691425681} +{"Pretrain/Learning Rate": 1.2909018194489397e-05, "Pretrain/Loss": 2.0318479537963867, "Pretrain/Loss (Raw)": 1.7511175870895386, "Pretrain/Step": 6398, "Pretrain/Step Time": 8.548206282779574} +{"Pretrain/Learning Rate": 1.2901587982485172e-05, "Pretrain/Loss": 2.0309667587280273, "Pretrain/Loss (Raw)": 2.1251258850097656, "Pretrain/Step": 6399, "Pretrain/Step Time": 8.54516881890595} +{"Pretrain/Learning Rate": 1.289415916572684e-05, "Pretrain/Loss": 2.031778573989868, "Pretrain/Loss (Raw)": 2.1024816036224365, "Pretrain/Step": 6400, "Pretrain/Step Time": 8.551737548783422} +{"Pretrain/Learning Rate": 1.2886731745071117e-05, "Pretrain/Loss": 2.031949996948242, "Pretrain/Loss (Raw)": 2.0467002391815186, "Pretrain/Step": 6401, "Pretrain/Step Time": 8.549242848530412} +{"Pretrain/Learning Rate": 1.287930572137457e-05, "Pretrain/Loss": 2.031468152999878, "Pretrain/Loss (Raw)": 1.920005202293396, "Pretrain/Step": 6402, "Pretrain/Step Time": 8.549935536459088} +{"Pretrain/Learning Rate": 1.2871881095493592e-05, "Pretrain/Loss": 2.03078031539917, "Pretrain/Loss (Raw)": 2.0206239223480225, "Pretrain/Step": 6403, "Pretrain/Step Time": 8.549184955656528} +{"Pretrain/Learning Rate": 1.2864457868284446e-05, "Pretrain/Loss": 2.0312135219573975, "Pretrain/Loss (Raw)": 2.139723539352417, "Pretrain/Step": 6404, "Pretrain/Step Time": 8.552636742591858} +{"Pretrain/Learning Rate": 1.2857036040603205e-05, "Pretrain/Loss": 2.031170129776001, "Pretrain/Loss (Raw)": 2.096648693084717, "Pretrain/Step": 6405, "Pretrain/Step Time": 8.548937829211354} +{"Pretrain/Learning Rate": 1.2849615613305782e-05, "Pretrain/Loss": 2.0315957069396973, "Pretrain/Loss (Raw)": 2.06201434135437, "Pretrain/Step": 6406, "Pretrain/Step Time": 8.55467675998807} +{"Pretrain/Learning Rate": 1.2842196587247935e-05, "Pretrain/Loss": 2.033719539642334, "Pretrain/Loss (Raw)": 2.225212812423706, "Pretrain/Step": 6407, "Pretrain/Step Time": 8.54741301573813} +{"Pretrain/Learning Rate": 1.2834778963285276e-05, "Pretrain/Loss": 2.034214735031128, "Pretrain/Loss (Raw)": 2.0377914905548096, "Pretrain/Step": 6408, "Pretrain/Step Time": 8.555907405912876} +{"Pretrain/Learning Rate": 1.282736274227323e-05, "Pretrain/Loss": 2.033554792404175, "Pretrain/Loss (Raw)": 1.9768561124801636, "Pretrain/Step": 6409, "Pretrain/Step Time": 8.557092683389783} +{"Pretrain/Learning Rate": 1.2819947925067071e-05, "Pretrain/Loss": 2.0337536334991455, "Pretrain/Loss (Raw)": 2.000765085220337, "Pretrain/Step": 6410, "Pretrain/Step Time": 8.554099509492517} +{"Pretrain/Learning Rate": 1.2812534512521906e-05, "Pretrain/Loss": 2.032360315322876, "Pretrain/Loss (Raw)": 2.1217055320739746, "Pretrain/Step": 6411, "Pretrain/Step Time": 8.55628951266408} +{"Pretrain/Learning Rate": 1.2805122505492697e-05, "Pretrain/Loss": 2.0331361293792725, "Pretrain/Loss (Raw)": 2.01112961769104, "Pretrain/Step": 6412, "Pretrain/Step Time": 8.551360446959734} +{"Pretrain/Learning Rate": 1.2797711904834226e-05, "Pretrain/Loss": 2.0306551456451416, "Pretrain/Loss (Raw)": 1.8029462099075317, "Pretrain/Step": 6413, "Pretrain/Step Time": 8.55542765557766} +{"Pretrain/Learning Rate": 1.279030271140111e-05, "Pretrain/Loss": 2.0307974815368652, "Pretrain/Loss (Raw)": 1.9425691366195679, "Pretrain/Step": 6414, "Pretrain/Step Time": 8.55559991300106} +{"Pretrain/Learning Rate": 1.2782894926047822e-05, "Pretrain/Loss": 2.0293221473693848, "Pretrain/Loss (Raw)": 2.0944395065307617, "Pretrain/Step": 6415, "Pretrain/Step Time": 8.551041051745415} +{"Pretrain/Learning Rate": 1.2775488549628667e-05, "Pretrain/Loss": 2.0284881591796875, "Pretrain/Loss (Raw)": 2.021528482437134, "Pretrain/Step": 6416, "Pretrain/Step Time": 8.551732432097197} +{"Pretrain/Learning Rate": 1.2768083582997772e-05, "Pretrain/Loss": 2.0273661613464355, "Pretrain/Loss (Raw)": 2.0250916481018066, "Pretrain/Step": 6417, "Pretrain/Step Time": 8.555291429162025} +{"Pretrain/Learning Rate": 1.2760680027009109e-05, "Pretrain/Loss": 2.02700138092041, "Pretrain/Loss (Raw)": 1.7359609603881836, "Pretrain/Step": 6418, "Pretrain/Step Time": 8.55710213445127} +{"Pretrain/Learning Rate": 1.2753277882516507e-05, "Pretrain/Loss": 2.0243537425994873, "Pretrain/Loss (Raw)": 1.7701866626739502, "Pretrain/Step": 6419, "Pretrain/Step Time": 8.559385364875197} +{"Pretrain/Learning Rate": 1.2745877150373612e-05, "Pretrain/Loss": 2.0282957553863525, "Pretrain/Loss (Raw)": 2.5457961559295654, "Pretrain/Step": 6420, "Pretrain/Step Time": 8.55635229125619} +{"Pretrain/Learning Rate": 1.2738477831433904e-05, "Pretrain/Loss": 2.02616024017334, "Pretrain/Loss (Raw)": 1.966762900352478, "Pretrain/Step": 6421, "Pretrain/Step Time": 8.553311865776777} +{"Pretrain/Learning Rate": 1.2731079926550701e-05, "Pretrain/Loss": 2.0259008407592773, "Pretrain/Loss (Raw)": 2.096586227416992, "Pretrain/Step": 6422, "Pretrain/Step Time": 8.5544094145298} +{"Pretrain/Learning Rate": 1.2723683436577195e-05, "Pretrain/Loss": 2.025273323059082, "Pretrain/Loss (Raw)": 2.047177791595459, "Pretrain/Step": 6423, "Pretrain/Step Time": 8.55326778255403} +{"Pretrain/Learning Rate": 1.271628836236634e-05, "Pretrain/Loss": 2.0251553058624268, "Pretrain/Loss (Raw)": 2.1033692359924316, "Pretrain/Step": 6424, "Pretrain/Step Time": 8.561103817075491} +{"Pretrain/Learning Rate": 1.2708894704771007e-05, "Pretrain/Loss": 2.024815797805786, "Pretrain/Loss (Raw)": 2.105734348297119, "Pretrain/Step": 6425, "Pretrain/Step Time": 8.55364011414349} +{"Pretrain/Learning Rate": 1.2701502464643844e-05, "Pretrain/Loss": 2.0310802459716797, "Pretrain/Loss (Raw)": 2.3241629600524902, "Pretrain/Step": 6426, "Pretrain/Step Time": 8.560001287609339} +{"Pretrain/Learning Rate": 1.2694111642837386e-05, "Pretrain/Loss": 2.0315139293670654, "Pretrain/Loss (Raw)": 2.0665435791015625, "Pretrain/Step": 6427, "Pretrain/Step Time": 8.559342972934246} +{"Pretrain/Learning Rate": 1.2686722240203946e-05, "Pretrain/Loss": 2.032229423522949, "Pretrain/Loss (Raw)": 2.0906128883361816, "Pretrain/Step": 6428, "Pretrain/Step Time": 8.559747552499175} +{"Pretrain/Learning Rate": 1.2679334257595727e-05, "Pretrain/Loss": 2.035966396331787, "Pretrain/Loss (Raw)": 2.518758535385132, "Pretrain/Step": 6429, "Pretrain/Step Time": 8.556334141641855} +{"Pretrain/Learning Rate": 1.2671947695864727e-05, "Pretrain/Loss": 2.0385043621063232, "Pretrain/Loss (Raw)": 2.0280559062957764, "Pretrain/Step": 6430, "Pretrain/Step Time": 8.559079954400659} +{"Pretrain/Learning Rate": 1.266456255586283e-05, "Pretrain/Loss": 2.0374772548675537, "Pretrain/Loss (Raw)": 1.9413259029388428, "Pretrain/Step": 6431, "Pretrain/Step Time": 8.549984484910965} +{"Pretrain/Learning Rate": 1.2657178838441686e-05, "Pretrain/Loss": 2.035961389541626, "Pretrain/Loss (Raw)": 1.8365364074707031, "Pretrain/Step": 6432, "Pretrain/Step Time": 8.554697094485164} +{"Pretrain/Learning Rate": 1.2649796544452852e-05, "Pretrain/Loss": 2.036245822906494, "Pretrain/Loss (Raw)": 2.1668684482574463, "Pretrain/Step": 6433, "Pretrain/Step Time": 8.551607007160783} +{"Pretrain/Learning Rate": 1.2642415674747673e-05, "Pretrain/Loss": 2.0362496376037598, "Pretrain/Loss (Raw)": 1.9617983102798462, "Pretrain/Step": 6434, "Pretrain/Step Time": 8.552244303748012} +{"Pretrain/Learning Rate": 1.263503623017735e-05, "Pretrain/Loss": 2.0393855571746826, "Pretrain/Loss (Raw)": 2.528702974319458, "Pretrain/Step": 6435, "Pretrain/Step Time": 8.549781011417508} +{"Pretrain/Learning Rate": 1.2627658211592907e-05, "Pretrain/Loss": 2.0391554832458496, "Pretrain/Loss (Raw)": 2.119579315185547, "Pretrain/Step": 6436, "Pretrain/Step Time": 8.551741074770689} +{"Pretrain/Learning Rate": 1.262028161984523e-05, "Pretrain/Loss": 2.0382533073425293, "Pretrain/Loss (Raw)": 1.9714587926864624, "Pretrain/Step": 6437, "Pretrain/Step Time": 8.55481624417007} +{"Pretrain/Learning Rate": 1.2612906455785006e-05, "Pretrain/Loss": 2.0389137268066406, "Pretrain/Loss (Raw)": 2.0163633823394775, "Pretrain/Step": 6438, "Pretrain/Step Time": 8.559379832819104} +{"Pretrain/Learning Rate": 1.2605532720262785e-05, "Pretrain/Loss": 2.0389456748962402, "Pretrain/Loss (Raw)": 1.9333139657974243, "Pretrain/Step": 6439, "Pretrain/Step Time": 8.553715143352747} +{"Pretrain/Learning Rate": 1.2598160414128924e-05, "Pretrain/Loss": 2.0401952266693115, "Pretrain/Loss (Raw)": 2.0840671062469482, "Pretrain/Step": 6440, "Pretrain/Step Time": 8.556086577475071} +{"Pretrain/Learning Rate": 1.2590789538233652e-05, "Pretrain/Loss": 2.040034294128418, "Pretrain/Loss (Raw)": 1.996942162513733, "Pretrain/Step": 6441, "Pretrain/Step Time": 8.556698774918914} +{"Pretrain/Learning Rate": 1.2583420093427006e-05, "Pretrain/Loss": 2.039961814880371, "Pretrain/Loss (Raw)": 1.8862290382385254, "Pretrain/Step": 6442, "Pretrain/Step Time": 8.556651011109352} +{"Pretrain/Learning Rate": 1.2576052080558864e-05, "Pretrain/Loss": 2.0396487712860107, "Pretrain/Loss (Raw)": 2.050931930541992, "Pretrain/Step": 6443, "Pretrain/Step Time": 8.554768854752183} +{"Pretrain/Learning Rate": 1.2568685500478927e-05, "Pretrain/Loss": 2.0392773151397705, "Pretrain/Loss (Raw)": 1.9827693700790405, "Pretrain/Step": 6444, "Pretrain/Step Time": 8.559080196544528} +{"Pretrain/Learning Rate": 1.256132035403677e-05, "Pretrain/Loss": 2.038447380065918, "Pretrain/Loss (Raw)": 1.949205756187439, "Pretrain/Step": 6445, "Pretrain/Step Time": 8.551805049180984} +{"Pretrain/Learning Rate": 1.255395664208176e-05, "Pretrain/Loss": 2.0387558937072754, "Pretrain/Loss (Raw)": 2.0595765113830566, "Pretrain/Step": 6446, "Pretrain/Step Time": 8.5597739610821} +{"Pretrain/Learning Rate": 1.2546594365463119e-05, "Pretrain/Loss": 2.040025234222412, "Pretrain/Loss (Raw)": 2.004443645477295, "Pretrain/Step": 6447, "Pretrain/Step Time": 8.556039579212666} +{"Pretrain/Learning Rate": 1.2539233525029886e-05, "Pretrain/Loss": 2.0421526432037354, "Pretrain/Loss (Raw)": 2.3453571796417236, "Pretrain/Step": 6448, "Pretrain/Step Time": 8.557782476767898} +{"Pretrain/Learning Rate": 1.2531874121630973e-05, "Pretrain/Loss": 2.0403528213500977, "Pretrain/Loss (Raw)": 1.906111240386963, "Pretrain/Step": 6449, "Pretrain/Step Time": 8.558706795796752} +{"Pretrain/Learning Rate": 1.2524516156115088e-05, "Pretrain/Loss": 2.0418190956115723, "Pretrain/Loss (Raw)": 2.3222451210021973, "Pretrain/Step": 6450, "Pretrain/Step Time": 8.561383066698909} +{"Pretrain/Learning Rate": 1.2517159629330783e-05, "Pretrain/Loss": 2.040926218032837, "Pretrain/Loss (Raw)": 1.9754830598831177, "Pretrain/Step": 6451, "Pretrain/Step Time": 8.565763050690293} +{"Pretrain/Learning Rate": 1.2509804542126444e-05, "Pretrain/Loss": 2.0439581871032715, "Pretrain/Loss (Raw)": 2.217742919921875, "Pretrain/Step": 6452, "Pretrain/Step Time": 8.56728420779109} +{"Pretrain/Learning Rate": 1.250245089535031e-05, "Pretrain/Loss": 2.0448684692382812, "Pretrain/Loss (Raw)": 1.9814672470092773, "Pretrain/Step": 6453, "Pretrain/Step Time": 8.56633235141635} +{"Pretrain/Learning Rate": 1.2495098689850429e-05, "Pretrain/Loss": 2.045267105102539, "Pretrain/Loss (Raw)": 2.0824360847473145, "Pretrain/Step": 6454, "Pretrain/Step Time": 8.563826953992248} +{"Pretrain/Learning Rate": 1.2487747926474683e-05, "Pretrain/Loss": 2.0477614402770996, "Pretrain/Loss (Raw)": 2.1933445930480957, "Pretrain/Step": 6455, "Pretrain/Step Time": 8.562349025160074} +{"Pretrain/Learning Rate": 1.2480398606070815e-05, "Pretrain/Loss": 2.049295663833618, "Pretrain/Loss (Raw)": 2.248692750930786, "Pretrain/Step": 6456, "Pretrain/Step Time": 8.561600372195244} +{"Pretrain/Learning Rate": 1.2473050729486371e-05, "Pretrain/Loss": 2.046820878982544, "Pretrain/Loss (Raw)": 2.074657440185547, "Pretrain/Step": 6457, "Pretrain/Step Time": 8.560625094920397} +{"Pretrain/Learning Rate": 1.246570429756875e-05, "Pretrain/Loss": 2.0475692749023438, "Pretrain/Loss (Raw)": 2.032421112060547, "Pretrain/Step": 6458, "Pretrain/Step Time": 8.556951904669404} +{"Pretrain/Learning Rate": 1.245835931116516e-05, "Pretrain/Loss": 2.0481061935424805, "Pretrain/Loss (Raw)": 2.0541555881500244, "Pretrain/Step": 6459, "Pretrain/Step Time": 8.557683549821377} +{"Pretrain/Learning Rate": 1.2451015771122684e-05, "Pretrain/Loss": 2.0455639362335205, "Pretrain/Loss (Raw)": 1.855718731880188, "Pretrain/Step": 6460, "Pretrain/Step Time": 8.557666812092066} +{"Pretrain/Learning Rate": 1.2443673678288204e-05, "Pretrain/Loss": 2.0442404747009277, "Pretrain/Loss (Raw)": 1.934078335762024, "Pretrain/Step": 6461, "Pretrain/Step Time": 8.560294987633824} +{"Pretrain/Learning Rate": 1.243633303350844e-05, "Pretrain/Loss": 2.043394088745117, "Pretrain/Loss (Raw)": 2.006556749343872, "Pretrain/Step": 6462, "Pretrain/Step Time": 8.559701140969992} +{"Pretrain/Learning Rate": 1.2428993837629943e-05, "Pretrain/Loss": 2.0454461574554443, "Pretrain/Loss (Raw)": 2.418039321899414, "Pretrain/Step": 6463, "Pretrain/Step Time": 8.559241281822324} +{"Pretrain/Learning Rate": 1.2421656091499123e-05, "Pretrain/Loss": 2.0426149368286133, "Pretrain/Loss (Raw)": 1.8539493083953857, "Pretrain/Step": 6464, "Pretrain/Step Time": 8.55657160654664} +{"Pretrain/Learning Rate": 1.2414319795962196e-05, "Pretrain/Loss": 2.043511152267456, "Pretrain/Loss (Raw)": 2.148939609527588, "Pretrain/Step": 6465, "Pretrain/Step Time": 8.555014433339238} +{"Pretrain/Learning Rate": 1.240698495186521e-05, "Pretrain/Loss": 2.041618824005127, "Pretrain/Loss (Raw)": 1.9108895063400269, "Pretrain/Step": 6466, "Pretrain/Step Time": 8.550757620483637} +{"Pretrain/Learning Rate": 1.2399651560054056e-05, "Pretrain/Loss": 2.0422728061676025, "Pretrain/Loss (Raw)": 2.2136988639831543, "Pretrain/Step": 6467, "Pretrain/Step Time": 8.549960045143962} diff --git a/obelics+phi3-3b-continue-training-hq-run1+stage-pretrain+x7/run-metrics.jsonl b/obelics+phi3-3b-continue-training-hq-run1+stage-pretrain+x7/run-metrics.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..48bfeb3a2b009c63dc2f364a6fb07fe8e54769ce --- /dev/null +++ b/obelics+phi3-3b-continue-training-hq-run1+stage-pretrain+x7/run-metrics.jsonl @@ -0,0 +1 @@ +{"hparams": {"dataset": {"align_stage_components": ["download/llava-laion-cc-sbu-558k/chat.json", "download/llava-laion-cc-sbu-558k"], "dataset_id": "obelics", "dataset_resampled": true, "dataset_root_dir": "/fsx-Training/shopqa-training-fsx-prod-us-east-1/home/wzwang/data/datacomp/datacomp_hq_single_pkl:/fsx-Training/shopqa-training-fsx-prod-us-east-1/home/wzwang/data/OBELICS/obelics_hq_single_pkl:/fsx-Training/shopqa-training-fsx-prod-us-east-1/home/wzwang/data/synthdog-en/synthdog_single_pkl/", "finetune_stage_components": ["/fsx-training/shopqa-training-fsx-prod-us-east-1/home/wzwang/data/llava/llava_v1_5_mix665k.json", "/fsx-training/shopqa-training-fsx-prod-us-east-1/home/wzwang/data/llava/data"], "max_num_images": 6, "min_num_images": 1, "train_num_samples": 2441407, "type": "obelics", "workers": 4}, "model": {"align_epochs": 1, "align_global_batch_size": 256, "align_learning_rate": 0.001, "align_lr_scheduler_type": "linear-warmup+cosine-decay", "align_max_grad_norm": 1.0, "align_max_steps": null, "align_per_device_batch_size": 16, "align_train_strategy": "fsdp-shard-grad-op", "align_warmup_ratio": 0.03, "align_weight_decay": 0.0, "arch_specifier": "no-align+avgpool", "enable_gradient_checkpointing": true, "enable_mixed_precision_training": true, "finetune_epochs": 1, "finetune_global_batch_size": 128, "finetune_learning_rate": 2e-05, "finetune_lr_scheduler_type": "linear-warmup+cosine-decay", "finetune_max_grad_norm": 1.0, "finetune_max_steps": null, "finetune_per_device_batch_size": 16, "finetune_train_strategy": "fsdp-full-shard", "finetune_warmup_ratio": 0.03, "finetune_weight_decay": 0.1, "image_resize_strategy": "resize-naive", "llm_backbone_id": "phi3-3b", "llm_max_length": 4096, "model_id": "phi3-3b-continue-training-hq", "pretrain_epochs": 1, "pretrain_global_batch_size": 256, "pretrain_learning_rate": 5e-05, "pretrain_lr_scheduler_type": "linear-warmup+cosine-decay", "pretrain_max_grad_norm": 1.0, "pretrain_max_steps": 9537, "pretrain_per_device_batch_size": 8, "pretrain_train_strategy": "fsdp-full-shard", "pretrain_warmup_ratio": 0.03, "pretrain_weight_decay": 0.01, "reduce_in_full_precision": false, "type": "one-stage+7b", "vision_backbone_id": "siglip-vit-so400m-384px"}, "mount_path": "/fsx-Training/shopqa-training-fsx-prod-us-east-1/home/wzwang/models", "pretrained_checkpoint": null, "run_id": "obelics+phi3-3b-continue-training-hq+stage-pretrain+x7", "run_root_dir": "/fsx-Training/shopqa-training-fsx-prod-us-east-1/home/wzwang/checkpoints", "seed": 7, "stage": "pretrain", "trackers": ["jsonl", "wandb"], "wandb_entity": null, "wandb_project": "mmpretrain"}, "run_id": "obelics+phi3-3b-continue-training-hq+stage-pretrain+x7"}