diff --git a/obelics+phi3-3b-continue-training-hq-claude3+stage-full-pretrain+x7/checkpoints/latest-checkpoint.pt b/obelics+phi3-3b-continue-training-hq-claude3+stage-full-pretrain+x7/checkpoints/latest-checkpoint.pt new file mode 100644 index 0000000000000000000000000000000000000000..129a907faf295c5588c9acedb041ac5a971ee9b9 --- /dev/null +++ b/obelics+phi3-3b-continue-training-hq-claude3+stage-full-pretrain+x7/checkpoints/latest-checkpoint.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5aaa02614f9fc1dda49e3dd4664acb70948c1090bf29b7322e1ce2477dba8e2c +size 17049347853 diff --git a/obelics+phi3-3b-continue-training-hq-claude3+stage-full-pretrain+x7/checkpoints/latest-optimizer.pt b/obelics+phi3-3b-continue-training-hq-claude3+stage-full-pretrain+x7/checkpoints/latest-optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..c99658222dfa6d1ec5bac61dcee285d000667462 --- /dev/null +++ b/obelics+phi3-3b-continue-training-hq-claude3+stage-full-pretrain+x7/checkpoints/latest-optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb43f2f1713aa50a03ced8fad543aeeeedbb15eb10d2fabe445f284bc6531fe5 +size 33976939737 diff --git a/obelics+phi3-3b-continue-training-hq-claude3+stage-full-pretrain+x7/checkpoints/latest-scheduler.pt b/obelics+phi3-3b-continue-training-hq-claude3+stage-full-pretrain+x7/checkpoints/latest-scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..e4f09f488c3f319b68cc9fde89e14a033705ac40 --- /dev/null +++ b/obelics+phi3-3b-continue-training-hq-claude3+stage-full-pretrain+x7/checkpoints/latest-scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ba4d4ded2fe863df5701c02896d2a60bb9e25903168be9a20a3a5a9fe9e6ba5 +size 1192 diff --git a/obelics+phi3-3b-continue-training-hq-claude3+stage-full-pretrain+x7/config.json b/obelics+phi3-3b-continue-training-hq-claude3+stage-full-pretrain+x7/config.json new file mode 100644 index 0000000000000000000000000000000000000000..791c7915dbecd96d60b096ac4c2e1ab270401c4a --- /dev/null +++ b/obelics+phi3-3b-continue-training-hq-claude3+stage-full-pretrain+x7/config.json @@ -0,0 +1,74 @@ +{ + "dataset": { + "align_stage_components": [ + "download/llava-laion-cc-sbu-558k/chat.json", + "download/llava-laion-cc-sbu-558k" + ], + "dataset_id": "obelics", + "dataset_resampled": true, + "dataset_root_dir": "/fsx-Training/shopqa-training-fsx-prod-us-east-1/home/wzwang/data/datacomp/datacomp_hq_single_pkl_pil:/fsx-Training/shopqa-training-fsx-prod-us-east-1/home/wzwang/data/OBELICS/obelics_hq_single_pkl_pil:/fsx-Training/shopqa-training-fsx-prod-us-east-1/home/wzwang/data/synthdog-en/synthdog_single_pkl_pil/", + "finetune_stage_components": [ + "/fsx-training/shopqa-training-fsx-prod-us-east-1/home/wzwang/data/llava/llava_v1_5_mix665k.json", + "/fsx-training/shopqa-training-fsx-prod-us-east-1/home/wzwang/data/llava/data" + ], + "max_num_images": 6, + "min_num_images": 1, + "train_num_samples": 2441407, + "type": "obelics", + "workers": 4 + }, + "model": { + "align_epochs": 1, + "align_global_batch_size": 256, + "align_learning_rate": 0.001, + "align_lr_scheduler_type": "linear-warmup+cosine-decay", + "align_max_grad_norm": 1.0, + "align_max_steps": null, + "align_per_device_batch_size": 16, + "align_train_strategy": "fsdp-shard-grad-op", + "align_warmup_ratio": 0.03, + "align_weight_decay": 0.0, + "arch_specifier": "no-align+avgpool", + "enable_gradient_checkpointing": true, + "enable_mixed_precision_training": true, + "finetune_epochs": 1, + "finetune_global_batch_size": 128, + "finetune_learning_rate": 2e-05, + "finetune_lr_scheduler_type": "linear-warmup+cosine-decay", + "finetune_max_grad_norm": 1.0, + "finetune_max_steps": null, + "finetune_per_device_batch_size": 16, + "finetune_train_strategy": "fsdp-full-shard", + "finetune_warmup_ratio": 0.03, + "finetune_weight_decay": 0.1, + "image_resize_strategy": "resize-naive", + "llm_backbone_id": "phi3-3b", + "llm_max_length": 4096, + "model_id": "phi3-3b-continue-training-hq", + "pretrain_epochs": 1, + "pretrain_global_batch_size": 256, + "pretrain_learning_rate": 5e-05, + "pretrain_lr_scheduler_type": "linear-warmup+cosine-decay", + "pretrain_max_grad_norm": 1.0, + "pretrain_max_steps": 9536, + "pretrain_per_device_batch_size": 2, + "pretrain_train_strategy": "fsdp-full-shard", + "pretrain_warmup_ratio": 0.03, + "pretrain_weight_decay": 0.01, + "reduce_in_full_precision": false, + "type": "one-stage+7b", + "vision_backbone_id": "siglip-vit-so400m-384px" + }, + "mount_path": "/fsx-Training/shopqa-training-fsx-prod-us-east-1/home/wzwang/models", + "pretrained_checkpoint": null, + "run_id": "obelics+phi3-3b-continue-training-hq+stage-full-pretrain+x7", + "run_root_dir": "/fsx-Training/shopqa-training-fsx-prod-us-east-1/home/wzwang/checkpoints/mllm_pretrain_checkpoints", + "seed": 7, + "stage": "full-pretrain", + "trackers": [ + "jsonl", + "wandb" + ], + "wandb_entity": null, + "wandb_project": "mmpretrain" +} \ No newline at end of file diff --git a/obelics+phi3-3b-continue-training-hq-claude3+stage-full-pretrain+x7/config.yaml b/obelics+phi3-3b-continue-training-hq-claude3+stage-full-pretrain+x7/config.yaml new file mode 100644 index 0000000000000000000000000000000000000000..fe9d549895ca6a95db3ed2fb9da7dc17afa8806f --- /dev/null +++ b/obelics+phi3-3b-continue-training-hq-claude3+stage-full-pretrain+x7/config.yaml @@ -0,0 +1,67 @@ +dataset: + align_stage_components: + - download/llava-laion-cc-sbu-558k/chat.json + - download/llava-laion-cc-sbu-558k + dataset_id: obelics + dataset_resampled: true + dataset_root_dir: /fsx-Training/shopqa-training-fsx-prod-us-east-1/home/wzwang/data/datacomp/datacomp_hq_single_pkl_pil:/fsx-Training/shopqa-training-fsx-prod-us-east-1/home/wzwang/data/OBELICS/obelics_hq_single_pkl_pil:/fsx-Training/shopqa-training-fsx-prod-us-east-1/home/wzwang/data/synthdog-en/synthdog_single_pkl_pil/ + finetune_stage_components: + - /fsx-training/shopqa-training-fsx-prod-us-east-1/home/wzwang/data/llava/llava_v1_5_mix665k.json + - /fsx-training/shopqa-training-fsx-prod-us-east-1/home/wzwang/data/llava/data + max_num_images: 6 + min_num_images: 1 + train_num_samples: 2441407 + type: obelics + workers: 4 +model: + align_epochs: 1 + align_global_batch_size: 256 + align_learning_rate: 0.001 + align_lr_scheduler_type: linear-warmup+cosine-decay + align_max_grad_norm: 1.0 + align_max_steps: null + align_per_device_batch_size: 16 + align_train_strategy: fsdp-shard-grad-op + align_warmup_ratio: 0.03 + align_weight_decay: 0.0 + arch_specifier: no-align+avgpool + enable_gradient_checkpointing: true + enable_mixed_precision_training: true + finetune_epochs: 1 + finetune_global_batch_size: 128 + finetune_learning_rate: 2.0e-05 + finetune_lr_scheduler_type: linear-warmup+cosine-decay + finetune_max_grad_norm: 1.0 + finetune_max_steps: null + finetune_per_device_batch_size: 16 + finetune_train_strategy: fsdp-full-shard + finetune_warmup_ratio: 0.03 + finetune_weight_decay: 0.1 + image_resize_strategy: resize-naive + llm_backbone_id: phi3-3b + llm_max_length: 4096 + model_id: phi3-3b-continue-training-hq + pretrain_epochs: 1 + pretrain_global_batch_size: 256 + pretrain_learning_rate: 5.0e-05 + pretrain_lr_scheduler_type: linear-warmup+cosine-decay + pretrain_max_grad_norm: 1.0 + pretrain_max_steps: 9536 + pretrain_per_device_batch_size: 2 + pretrain_train_strategy: fsdp-full-shard + pretrain_warmup_ratio: 0.03 + pretrain_weight_decay: 0.01 + reduce_in_full_precision: false + type: one-stage+7b + vision_backbone_id: siglip-vit-so400m-384px +mount_path: /fsx-Training/shopqa-training-fsx-prod-us-east-1/home/wzwang/models +pretrained_checkpoint: null +run_id: obelics+phi3-3b-continue-training-hq+stage-full-pretrain+x7 +run_root_dir: /fsx-Training/shopqa-training-fsx-prod-us-east-1/home/wzwang/checkpoints/mllm_pretrain_checkpoints +seed: 7 +stage: full-pretrain +trackers: +- jsonl +- wandb +wandb_entity: null +wandb_project: mmpretrain diff --git a/obelics+phi3-3b-continue-training-hq-claude3+stage-full-pretrain+x7/obelics+phi3-3b-continue-training-hq+stage-full-pretrain+x7.jsonl b/obelics+phi3-3b-continue-training-hq-claude3+stage-full-pretrain+x7/obelics+phi3-3b-continue-training-hq+stage-full-pretrain+x7.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..caea7548a167dea1d3d89426d36aef3d8e09b655 --- /dev/null +++ b/obelics+phi3-3b-continue-training-hq-claude3+stage-full-pretrain+x7/obelics+phi3-3b-continue-training-hq+stage-full-pretrain+x7.jsonl @@ -0,0 +1,9536 @@ +{"Full-pretrain/Learning Rate": 1.7482517482517484e-07, "Full-pretrain/Loss": 2.956385612487793, "Full-pretrain/Loss (Raw)": 2.956385612487793, "Full-pretrain/Step": 1, "Full-pretrain/Step Time": 21.787632942199707} +{"Full-pretrain/Learning Rate": 3.496503496503497e-07, "Full-pretrain/Loss": 3.4745378494262695, "Full-pretrain/Loss (Raw)": 3.992690324783325, "Full-pretrain/Step": 2, "Full-pretrain/Step Time": 19.769787788391113} +{"Full-pretrain/Learning Rate": 5.244755244755246e-07, "Full-pretrain/Loss": 3.7824227809906006, "Full-pretrain/Loss (Raw)": 4.398192405700684, "Full-pretrain/Step": 3, "Full-pretrain/Step Time": 19.150408109029133} +{"Full-pretrain/Learning Rate": 6.993006993006994e-07, "Full-pretrain/Loss": 3.9603238105773926, "Full-pretrain/Loss (Raw)": 4.494027137756348, "Full-pretrain/Step": 4, "Full-pretrain/Step Time": 18.850386381149292} +{"Full-pretrain/Learning Rate": 8.741258741258743e-07, "Full-pretrain/Loss": 4.223567485809326, "Full-pretrain/Loss (Raw)": 5.276539325714111, "Full-pretrain/Step": 5, "Full-pretrain/Step Time": 18.751159191131592} +{"Full-pretrain/Learning Rate": 1.0489510489510491e-06, "Full-pretrain/Loss": 4.173791408538818, "Full-pretrain/Loss (Raw)": 3.924912214279175, "Full-pretrain/Step": 6, "Full-pretrain/Step Time": 18.529614249865215} +{"Full-pretrain/Learning Rate": 1.2237762237762238e-06, "Full-pretrain/Loss": 4.269876480102539, "Full-pretrain/Loss (Raw)": 4.846385478973389, "Full-pretrain/Step": 7, "Full-pretrain/Step Time": 18.37526719910758} +{"Full-pretrain/Learning Rate": 1.3986013986013987e-06, "Full-pretrain/Loss": 4.373673439025879, "Full-pretrain/Loss (Raw)": 5.100254058837891, "Full-pretrain/Step": 8, "Full-pretrain/Step Time": 18.47487509250641} +{"Full-pretrain/Learning Rate": 1.5734265734265736e-06, "Full-pretrain/Loss": 4.189217567443848, "Full-pretrain/Loss (Raw)": 2.7135705947875977, "Full-pretrain/Step": 9, "Full-pretrain/Step Time": 18.356183979246353} +{"Full-pretrain/Learning Rate": 1.7482517482517485e-06, "Full-pretrain/Loss": 4.205020427703857, "Full-pretrain/Loss (Raw)": 4.347247123718262, "Full-pretrain/Step": 10, "Full-pretrain/Step Time": 18.247130227088928} +{"Full-pretrain/Learning Rate": 1.9230769230769234e-06, "Full-pretrain/Loss": 4.186237335205078, "Full-pretrain/Loss (Raw)": 3.998408794403076, "Full-pretrain/Step": 11, "Full-pretrain/Step Time": 18.262666658921674} +{"Full-pretrain/Learning Rate": 2.0979020979020983e-06, "Full-pretrain/Loss": 4.06561279296875, "Full-pretrain/Loss (Raw)": 2.7387442588806152, "Full-pretrain/Step": 12, "Full-pretrain/Step Time": 18.237130622069042} +{"Full-pretrain/Learning Rate": 2.2727272727272728e-06, "Full-pretrain/Loss": 3.995032787322998, "Full-pretrain/Loss (Raw)": 3.1480705738067627, "Full-pretrain/Step": 13, "Full-pretrain/Step Time": 18.19682810856746} +{"Full-pretrain/Learning Rate": 2.4475524475524477e-06, "Full-pretrain/Loss": 3.9099674224853516, "Full-pretrain/Loss (Raw)": 2.8041155338287354, "Full-pretrain/Step": 14, "Full-pretrain/Step Time": 18.122643419674464} +{"Full-pretrain/Learning Rate": 2.6223776223776225e-06, "Full-pretrain/Loss": 3.826328754425049, "Full-pretrain/Loss (Raw)": 2.6553874015808105, "Full-pretrain/Step": 15, "Full-pretrain/Step Time": 18.03926459948222} +{"Full-pretrain/Learning Rate": 2.7972027972027974e-06, "Full-pretrain/Loss": 3.8459720611572266, "Full-pretrain/Loss (Raw)": 4.140625953674316, "Full-pretrain/Step": 16, "Full-pretrain/Step Time": 18.13856576383114} +{"Full-pretrain/Learning Rate": 2.9720279720279723e-06, "Full-pretrain/Loss": 3.7713801860809326, "Full-pretrain/Loss (Raw)": 2.5779147148132324, "Full-pretrain/Step": 17, "Full-pretrain/Step Time": 18.13031829104704} +{"Full-pretrain/Learning Rate": 3.1468531468531472e-06, "Full-pretrain/Loss": 3.7050087451934814, "Full-pretrain/Loss (Raw)": 2.5766830444335938, "Full-pretrain/Step": 18, "Full-pretrain/Step Time": 18.07896653811137} +{"Full-pretrain/Learning Rate": 3.3216783216783217e-06, "Full-pretrain/Loss": 3.643810510635376, "Full-pretrain/Loss (Raw)": 2.542245388031006, "Full-pretrain/Step": 19, "Full-pretrain/Step Time": 18.021746723275434} +{"Full-pretrain/Learning Rate": 3.496503496503497e-06, "Full-pretrain/Loss": 3.644371747970581, "Full-pretrain/Loss (Raw)": 3.6550326347351074, "Full-pretrain/Step": 20, "Full-pretrain/Step Time": 18.039619898796083} +{"Full-pretrain/Learning Rate": 3.6713286713286715e-06, "Full-pretrain/Loss": 3.604778289794922, "Full-pretrain/Loss (Raw)": 2.812905788421631, "Full-pretrain/Step": 21, "Full-pretrain/Step Time": 18.061832087380544} +{"Full-pretrain/Learning Rate": 3.846153846153847e-06, "Full-pretrain/Loss": 3.5610625743865967, "Full-pretrain/Loss (Raw)": 2.643038034439087, "Full-pretrain/Step": 22, "Full-pretrain/Step Time": 18.01472917470065} +{"Full-pretrain/Learning Rate": 4.020979020979021e-06, "Full-pretrain/Loss": 3.5351245403289795, "Full-pretrain/Loss (Raw)": 2.9644861221313477, "Full-pretrain/Step": 23, "Full-pretrain/Step Time": 17.97752427018207} +{"Full-pretrain/Learning Rate": 4.195804195804197e-06, "Full-pretrain/Loss": 3.4941630363464355, "Full-pretrain/Loss (Raw)": 2.552046298980713, "Full-pretrain/Step": 24, "Full-pretrain/Step Time": 17.954658101002376} +{"Full-pretrain/Learning Rate": 4.370629370629371e-06, "Full-pretrain/Loss": 3.4681780338287354, "Full-pretrain/Loss (Raw)": 2.8445472717285156, "Full-pretrain/Step": 25, "Full-pretrain/Step Time": 17.957984962463378} +{"Full-pretrain/Learning Rate": 4.5454545454545455e-06, "Full-pretrain/Loss": 3.4482953548431396, "Full-pretrain/Loss (Raw)": 2.9512252807617188, "Full-pretrain/Step": 26, "Full-pretrain/Step Time": 17.93578604551462} +{"Full-pretrain/Learning Rate": 4.72027972027972e-06, "Full-pretrain/Loss": 3.4170138835906982, "Full-pretrain/Loss (Raw)": 2.6036927700042725, "Full-pretrain/Step": 27, "Full-pretrain/Step Time": 17.891768013989484} +{"Full-pretrain/Learning Rate": 4.895104895104895e-06, "Full-pretrain/Loss": 3.3791286945343018, "Full-pretrain/Loss (Raw)": 2.3562309741973877, "Full-pretrain/Step": 28, "Full-pretrain/Step Time": 17.868757682187216} +{"Full-pretrain/Learning Rate": 5.06993006993007e-06, "Full-pretrain/Loss": 3.350975751876831, "Full-pretrain/Loss (Raw)": 2.56269907951355, "Full-pretrain/Step": 29, "Full-pretrain/Step Time": 17.883728117778382} +{"Full-pretrain/Learning Rate": 5.244755244755245e-06, "Full-pretrain/Loss": 3.315340757369995, "Full-pretrain/Loss (Raw)": 2.2819125652313232, "Full-pretrain/Step": 30, "Full-pretrain/Step Time": 17.86326772371928} +{"Full-pretrain/Learning Rate": 5.419580419580419e-06, "Full-pretrain/Loss": 3.2818992137908936, "Full-pretrain/Loss (Raw)": 2.2786641120910645, "Full-pretrain/Step": 31, "Full-pretrain/Step Time": 17.834812994926207} +{"Full-pretrain/Learning Rate": 5.594405594405595e-06, "Full-pretrain/Loss": 3.254014730453491, "Full-pretrain/Loss (Raw)": 2.3895907402038574, "Full-pretrain/Step": 32, "Full-pretrain/Step Time": 17.82331942766905} +{"Full-pretrain/Learning Rate": 5.76923076923077e-06, "Full-pretrain/Loss": 3.25718355178833, "Full-pretrain/Loss (Raw)": 3.057786464691162, "Full-pretrain/Step": 33, "Full-pretrain/Step Time": 17.818923523931794} +{"Full-pretrain/Learning Rate": 5.944055944055945e-06, "Full-pretrain/Loss": 3.2065584659576416, "Full-pretrain/Loss (Raw)": 2.3726887702941895, "Full-pretrain/Step": 34, "Full-pretrain/Step Time": 17.833133536226608} +{"Full-pretrain/Learning Rate": 6.1188811188811196e-06, "Full-pretrain/Loss": 3.151601791381836, "Full-pretrain/Loss (Raw)": 2.639575958251953, "Full-pretrain/Step": 35, "Full-pretrain/Step Time": 17.82230314527239} +{"Full-pretrain/Learning Rate": 6.2937062937062944e-06, "Full-pretrain/Loss": 3.092717170715332, "Full-pretrain/Loss (Raw)": 2.609724283218384, "Full-pretrain/Step": 36, "Full-pretrain/Step Time": 17.810628341303932} +{"Full-pretrain/Learning Rate": 6.468531468531469e-06, "Full-pretrain/Loss": 3.0096120834350586, "Full-pretrain/Loss (Raw)": 2.6171774864196777, "Full-pretrain/Step": 37, "Full-pretrain/Step Time": 17.838135667749352} +{"Full-pretrain/Learning Rate": 6.643356643356643e-06, "Full-pretrain/Loss": 2.9655370712280273, "Full-pretrain/Loss (Raw)": 2.514511823654175, "Full-pretrain/Step": 38, "Full-pretrain/Step Time": 17.837194963505393} +{"Full-pretrain/Learning Rate": 6.818181818181818e-06, "Full-pretrain/Loss": 2.896817445755005, "Full-pretrain/Loss (Raw)": 2.6473536491394043, "Full-pretrain/Step": 39, "Full-pretrain/Step Time": 17.820460472351467} +{"Full-pretrain/Learning Rate": 6.993006993006994e-06, "Full-pretrain/Loss": 2.80672025680542, "Full-pretrain/Loss (Raw)": 2.2171430587768555, "Full-pretrain/Step": 40, "Full-pretrain/Step Time": 17.809495168924332} +{"Full-pretrain/Learning Rate": 7.167832167832168e-06, "Full-pretrain/Loss": 2.804598331451416, "Full-pretrain/Loss (Raw)": 2.6456785202026367, "Full-pretrain/Step": 41, "Full-pretrain/Step Time": 17.80375024167503} +{"Full-pretrain/Learning Rate": 7.342657342657343e-06, "Full-pretrain/Loss": 2.749075412750244, "Full-pretrain/Loss (Raw)": 2.570507049560547, "Full-pretrain/Step": 42, "Full-pretrain/Step Time": 17.823405560993013} +{"Full-pretrain/Learning Rate": 7.517482517482517e-06, "Full-pretrain/Loss": 2.7010810375213623, "Full-pretrain/Loss (Raw)": 2.462589740753174, "Full-pretrain/Step": 43, "Full-pretrain/Step Time": 17.80874205744544} +{"Full-pretrain/Learning Rate": 7.692307692307694e-06, "Full-pretrain/Loss": 2.693193197250366, "Full-pretrain/Loss (Raw)": 2.486332654953003, "Full-pretrain/Step": 44, "Full-pretrain/Step Time": 17.804288186810233} +{"Full-pretrain/Learning Rate": 7.867132867132867e-06, "Full-pretrain/Loss": 2.6718902587890625, "Full-pretrain/Loss (Raw)": 2.4663820266723633, "Full-pretrain/Step": 45, "Full-pretrain/Step Time": 17.80200743675232} +{"Full-pretrain/Learning Rate": 8.041958041958042e-06, "Full-pretrain/Loss": 2.658491849899292, "Full-pretrain/Loss (Raw)": 2.3753557205200195, "Full-pretrain/Step": 46, "Full-pretrain/Step Time": 17.801320459531702} +{"Full-pretrain/Learning Rate": 8.216783216783217e-06, "Full-pretrain/Loss": 2.6482114791870117, "Full-pretrain/Loss (Raw)": 2.3264212608337402, "Full-pretrain/Step": 47, "Full-pretrain/Step Time": 17.797302200439127} +{"Full-pretrain/Learning Rate": 8.391608391608393e-06, "Full-pretrain/Loss": 2.5855839252471924, "Full-pretrain/Loss (Raw)": 2.136544704437256, "Full-pretrain/Step": 48, "Full-pretrain/Step Time": 17.79114327331384} +{"Full-pretrain/Learning Rate": 8.566433566433566e-06, "Full-pretrain/Loss": 2.577399253845215, "Full-pretrain/Loss (Raw)": 2.3160059452056885, "Full-pretrain/Step": 49, "Full-pretrain/Step Time": 17.775948641251546} +{"Full-pretrain/Learning Rate": 8.741258741258741e-06, "Full-pretrain/Loss": 2.5915491580963135, "Full-pretrain/Loss (Raw)": 3.0294740200042725, "Full-pretrain/Step": 50, "Full-pretrain/Step Time": 17.778688669204712} +{"Full-pretrain/Learning Rate": 8.916083916083918e-06, "Full-pretrain/Loss": 2.5957512855529785, "Full-pretrain/Loss (Raw)": 2.676718235015869, "Full-pretrain/Step": 51, "Full-pretrain/Step Time": 17.77631992452285} +{"Full-pretrain/Learning Rate": 9.090909090909091e-06, "Full-pretrain/Loss": 2.5546345710754395, "Full-pretrain/Loss (Raw)": 2.339296579360962, "Full-pretrain/Step": 52, "Full-pretrain/Step Time": 17.772014095233036} +{"Full-pretrain/Learning Rate": 9.265734265734266e-06, "Full-pretrain/Loss": 2.54644513130188, "Full-pretrain/Loss (Raw)": 2.550842523574829, "Full-pretrain/Step": 53, "Full-pretrain/Step Time": 17.761630044793183} +{"Full-pretrain/Learning Rate": 9.44055944055944e-06, "Full-pretrain/Loss": 2.5372819900512695, "Full-pretrain/Loss (Raw)": 2.349821090698242, "Full-pretrain/Step": 54, "Full-pretrain/Step Time": 17.760763477396083} +{"Full-pretrain/Learning Rate": 9.615384615384616e-06, "Full-pretrain/Loss": 2.510408878326416, "Full-pretrain/Loss (Raw)": 2.1045405864715576, "Full-pretrain/Step": 55, "Full-pretrain/Step Time": 17.767324833436447} +{"Full-pretrain/Learning Rate": 9.79020979020979e-06, "Full-pretrain/Loss": 2.5101208686828613, "Full-pretrain/Loss (Raw)": 2.5428295135498047, "Full-pretrain/Step": 56, "Full-pretrain/Step Time": 17.76024032490594} +{"Full-pretrain/Learning Rate": 9.965034965034966e-06, "Full-pretrain/Loss": 2.512364149093628, "Full-pretrain/Loss (Raw)": 2.9163339138031006, "Full-pretrain/Step": 57, "Full-pretrain/Step Time": 17.756750654755976} +{"Full-pretrain/Learning Rate": 1.013986013986014e-05, "Full-pretrain/Loss": 2.4987192153930664, "Full-pretrain/Loss (Raw)": 2.5145840644836426, "Full-pretrain/Step": 58, "Full-pretrain/Step Time": 17.75900847747408} +{"Full-pretrain/Learning Rate": 1.0314685314685315e-05, "Full-pretrain/Loss": 2.4987030029296875, "Full-pretrain/Loss (Raw)": 2.6031761169433594, "Full-pretrain/Step": 59, "Full-pretrain/Step Time": 17.762171862489087} +{"Full-pretrain/Learning Rate": 1.048951048951049e-05, "Full-pretrain/Loss": 2.5000271797180176, "Full-pretrain/Loss (Raw)": 2.3986034393310547, "Full-pretrain/Step": 60, "Full-pretrain/Step Time": 17.75277738571167} +{"Full-pretrain/Learning Rate": 1.0664335664335665e-05, "Full-pretrain/Loss": 2.508906841278076, "Full-pretrain/Loss (Raw)": 2.846848249435425, "Full-pretrain/Step": 61, "Full-pretrain/Step Time": 17.747208583550375} +{"Full-pretrain/Learning Rate": 1.0839160839160838e-05, "Full-pretrain/Loss": 2.520927906036377, "Full-pretrain/Loss (Raw)": 2.666592597961426, "Full-pretrain/Step": 62, "Full-pretrain/Step Time": 17.745386977349558} +{"Full-pretrain/Learning Rate": 1.1013986013986015e-05, "Full-pretrain/Loss": 2.532991409301758, "Full-pretrain/Loss (Raw)": 2.66469669342041, "Full-pretrain/Step": 63, "Full-pretrain/Step Time": 17.759588597312806} +{"Full-pretrain/Learning Rate": 1.118881118881119e-05, "Full-pretrain/Loss": 2.540055990219116, "Full-pretrain/Loss (Raw)": 2.6156539916992188, "Full-pretrain/Step": 64, "Full-pretrain/Step Time": 17.760466367006302} +{"Full-pretrain/Learning Rate": 1.1363636363636365e-05, "Full-pretrain/Loss": 2.5126724243164062, "Full-pretrain/Loss (Raw)": 2.1815176010131836, "Full-pretrain/Step": 65, "Full-pretrain/Step Time": 17.747444141828097} +{"Full-pretrain/Learning Rate": 1.153846153846154e-05, "Full-pretrain/Loss": 2.5155739784240723, "Full-pretrain/Loss (Raw)": 2.4655327796936035, "Full-pretrain/Step": 66, "Full-pretrain/Step Time": 17.758645845182013} +{"Full-pretrain/Learning Rate": 1.1713286713286714e-05, "Full-pretrain/Loss": 2.5096991062164307, "Full-pretrain/Loss (Raw)": 2.4515786170959473, "Full-pretrain/Step": 67, "Full-pretrain/Step Time": 17.75746396406373} +{"Full-pretrain/Learning Rate": 1.188811188811189e-05, "Full-pretrain/Loss": 2.505296468734741, "Full-pretrain/Loss (Raw)": 2.468843460083008, "Full-pretrain/Step": 68, "Full-pretrain/Step Time": 17.746785945752087} +{"Full-pretrain/Learning Rate": 1.2062937062937063e-05, "Full-pretrain/Loss": 2.5054025650024414, "Full-pretrain/Loss (Raw)": 2.6205759048461914, "Full-pretrain/Step": 69, "Full-pretrain/Step Time": 17.74694938245027} +{"Full-pretrain/Learning Rate": 1.2237762237762239e-05, "Full-pretrain/Loss": 2.500459671020508, "Full-pretrain/Loss (Raw)": 2.3563315868377686, "Full-pretrain/Step": 70, "Full-pretrain/Step Time": 17.747683906555174} +{"Full-pretrain/Learning Rate": 1.2412587412587414e-05, "Full-pretrain/Loss": 2.494940757751465, "Full-pretrain/Loss (Raw)": 2.4707531929016113, "Full-pretrain/Step": 71, "Full-pretrain/Step Time": 17.746393217167384} +{"Full-pretrain/Learning Rate": 1.2587412587412589e-05, "Full-pretrain/Loss": 2.5020360946655273, "Full-pretrain/Loss (Raw)": 2.4441885948181152, "Full-pretrain/Step": 72, "Full-pretrain/Step Time": 17.741761022143894} +{"Full-pretrain/Learning Rate": 1.2762237762237764e-05, "Full-pretrain/Loss": 2.496438980102539, "Full-pretrain/Loss (Raw)": 2.4665780067443848, "Full-pretrain/Step": 73, "Full-pretrain/Step Time": 17.74264820961103} +{"Full-pretrain/Learning Rate": 1.2937062937062939e-05, "Full-pretrain/Loss": 2.4895236492156982, "Full-pretrain/Loss (Raw)": 2.3492116928100586, "Full-pretrain/Step": 74, "Full-pretrain/Step Time": 17.7438102316212} +{"Full-pretrain/Learning Rate": 1.3111888111888112e-05, "Full-pretrain/Loss": 2.4877400398254395, "Full-pretrain/Loss (Raw)": 2.405517101287842, "Full-pretrain/Step": 75, "Full-pretrain/Step Time": 17.742701059977215} +{"Full-pretrain/Learning Rate": 1.3286713286713287e-05, "Full-pretrain/Loss": 2.4842529296875, "Full-pretrain/Loss (Raw)": 2.3747382164001465, "Full-pretrain/Step": 76, "Full-pretrain/Step Time": 17.73785982633892} +{"Full-pretrain/Learning Rate": 1.3461538461538462e-05, "Full-pretrain/Loss": 2.4834885597229004, "Full-pretrain/Loss (Raw)": 2.4419314861297607, "Full-pretrain/Step": 77, "Full-pretrain/Step Time": 17.743937671958626} +{"Full-pretrain/Learning Rate": 1.3636363636363637e-05, "Full-pretrain/Loss": 2.483997344970703, "Full-pretrain/Loss (Raw)": 2.3916268348693848, "Full-pretrain/Step": 78, "Full-pretrain/Step Time": 17.74028463852711} +{"Full-pretrain/Learning Rate": 1.381118881118881e-05, "Full-pretrain/Loss": 2.4815011024475098, "Full-pretrain/Loss (Raw)": 2.246549367904663, "Full-pretrain/Step": 79, "Full-pretrain/Step Time": 17.742644430715828} +{"Full-pretrain/Learning Rate": 1.3986013986013988e-05, "Full-pretrain/Loss": 2.4941818714141846, "Full-pretrain/Loss (Raw)": 2.542327404022217, "Full-pretrain/Step": 80, "Full-pretrain/Step Time": 17.739482846856117} +{"Full-pretrain/Learning Rate": 1.4160839160839163e-05, "Full-pretrain/Loss": 2.4931373596191406, "Full-pretrain/Loss (Raw)": 2.282585620880127, "Full-pretrain/Step": 81, "Full-pretrain/Step Time": 17.739487362496646} +{"Full-pretrain/Learning Rate": 1.4335664335664336e-05, "Full-pretrain/Loss": 2.4759521484375, "Full-pretrain/Loss (Raw)": 2.479544162750244, "Full-pretrain/Step": 82, "Full-pretrain/Step Time": 17.74488452294978} +{"Full-pretrain/Learning Rate": 1.4510489510489511e-05, "Full-pretrain/Loss": 2.472342014312744, "Full-pretrain/Loss (Raw)": 2.561187744140625, "Full-pretrain/Step": 83, "Full-pretrain/Step Time": 17.738490136272937} +{"Full-pretrain/Learning Rate": 1.4685314685314686e-05, "Full-pretrain/Loss": 2.4746506214141846, "Full-pretrain/Loss (Raw)": 2.413179874420166, "Full-pretrain/Step": 84, "Full-pretrain/Step Time": 17.73585767121542} +{"Full-pretrain/Learning Rate": 1.486013986013986e-05, "Full-pretrain/Loss": 2.4652693271636963, "Full-pretrain/Loss (Raw)": 2.250636577606201, "Full-pretrain/Step": 85, "Full-pretrain/Step Time": 17.736966105068433} +{"Full-pretrain/Learning Rate": 1.5034965034965034e-05, "Full-pretrain/Loss": 2.4728832244873047, "Full-pretrain/Loss (Raw)": 2.5934722423553467, "Full-pretrain/Step": 86, "Full-pretrain/Step Time": 17.734175476917002} +{"Full-pretrain/Learning Rate": 1.5209790209790212e-05, "Full-pretrain/Loss": 2.4853124618530273, "Full-pretrain/Loss (Raw)": 2.502272605895996, "Full-pretrain/Step": 87, "Full-pretrain/Step Time": 17.727165235870185} +{"Full-pretrain/Learning Rate": 1.5384615384615387e-05, "Full-pretrain/Loss": 2.4847617149353027, "Full-pretrain/Loss (Raw)": 2.525212526321411, "Full-pretrain/Step": 88, "Full-pretrain/Step Time": 17.72776551138271} +{"Full-pretrain/Learning Rate": 1.555944055944056e-05, "Full-pretrain/Loss": 2.4703807830810547, "Full-pretrain/Loss (Raw)": 2.45613431930542, "Full-pretrain/Step": 89, "Full-pretrain/Step Time": 17.736318014980704} +{"Full-pretrain/Learning Rate": 1.5734265734265734e-05, "Full-pretrain/Loss": 2.459644317626953, "Full-pretrain/Loss (Raw)": 2.1710145473480225, "Full-pretrain/Step": 90, "Full-pretrain/Step Time": 17.739301784833273} +{"Full-pretrain/Learning Rate": 1.590909090909091e-05, "Full-pretrain/Loss": 2.457369327545166, "Full-pretrain/Loss (Raw)": 2.5303797721862793, "Full-pretrain/Step": 91, "Full-pretrain/Step Time": 17.739316974367416} +{"Full-pretrain/Learning Rate": 1.6083916083916083e-05, "Full-pretrain/Loss": 2.4534382820129395, "Full-pretrain/Loss (Raw)": 2.272814989089966, "Full-pretrain/Step": 92, "Full-pretrain/Step Time": 17.739631238191023} +{"Full-pretrain/Learning Rate": 1.625874125874126e-05, "Full-pretrain/Loss": 2.4330575466156006, "Full-pretrain/Loss (Raw)": 2.1946585178375244, "Full-pretrain/Step": 93, "Full-pretrain/Step Time": 17.735987950396794} +{"Full-pretrain/Learning Rate": 1.6433566433566433e-05, "Full-pretrain/Loss": 2.43107271194458, "Full-pretrain/Loss (Raw)": 2.6030831336975098, "Full-pretrain/Step": 94, "Full-pretrain/Step Time": 17.737125934438502} +{"Full-pretrain/Learning Rate": 1.660839160839161e-05, "Full-pretrain/Loss": 2.425527811050415, "Full-pretrain/Loss (Raw)": 2.4872570037841797, "Full-pretrain/Step": 95, "Full-pretrain/Step Time": 17.731110803704514} +{"Full-pretrain/Learning Rate": 1.6783216783216786e-05, "Full-pretrain/Loss": 2.419416666030884, "Full-pretrain/Loss (Raw)": 2.420098066329956, "Full-pretrain/Step": 96, "Full-pretrain/Step Time": 17.729144754509132} +{"Full-pretrain/Learning Rate": 1.695804195804196e-05, "Full-pretrain/Loss": 2.431959629058838, "Full-pretrain/Loss (Raw)": 2.5828933715820312, "Full-pretrain/Step": 97, "Full-pretrain/Step Time": 17.73256215360976} +{"Full-pretrain/Learning Rate": 1.7132867132867133e-05, "Full-pretrain/Loss": 2.428513526916504, "Full-pretrain/Loss (Raw)": 2.355260133743286, "Full-pretrain/Step": 98, "Full-pretrain/Step Time": 17.730922635720702} +{"Full-pretrain/Learning Rate": 1.730769230769231e-05, "Full-pretrain/Loss": 2.4283676147460938, "Full-pretrain/Loss (Raw)": 2.4469032287597656, "Full-pretrain/Step": 99, "Full-pretrain/Step Time": 17.734894555024425} +{"Full-pretrain/Learning Rate": 1.7482517482517483e-05, "Full-pretrain/Loss": 2.423102855682373, "Full-pretrain/Loss (Raw)": 2.3003721237182617, "Full-pretrain/Step": 100, "Full-pretrain/Step Time": 17.7303786277771} +{"Full-pretrain/Learning Rate": 1.7657342657342656e-05, "Full-pretrain/Loss": 2.4113821983337402, "Full-pretrain/Loss (Raw)": 2.2455155849456787, "Full-pretrain/Step": 101, "Full-pretrain/Step Time": 17.733387276677803} +{"Full-pretrain/Learning Rate": 1.7832167832167836e-05, "Full-pretrain/Loss": 2.4074149131774902, "Full-pretrain/Loss (Raw)": 2.229377269744873, "Full-pretrain/Step": 102, "Full-pretrain/Step Time": 17.730086702926485} +{"Full-pretrain/Learning Rate": 1.800699300699301e-05, "Full-pretrain/Loss": 2.4061481952667236, "Full-pretrain/Loss (Raw)": 2.430218458175659, "Full-pretrain/Step": 103, "Full-pretrain/Step Time": 17.727416925059938} +{"Full-pretrain/Learning Rate": 1.8181818181818182e-05, "Full-pretrain/Loss": 2.393758773803711, "Full-pretrain/Loss (Raw)": 2.047726631164551, "Full-pretrain/Step": 104, "Full-pretrain/Step Time": 17.719613439761677} +{"Full-pretrain/Learning Rate": 1.835664335664336e-05, "Full-pretrain/Loss": 2.3956379890441895, "Full-pretrain/Loss (Raw)": 2.5267133712768555, "Full-pretrain/Step": 105, "Full-pretrain/Step Time": 17.719036590485345} +{"Full-pretrain/Learning Rate": 1.8531468531468532e-05, "Full-pretrain/Loss": 2.400634765625, "Full-pretrain/Loss (Raw)": 2.50911283493042, "Full-pretrain/Step": 106, "Full-pretrain/Step Time": 17.718622844174224} +{"Full-pretrain/Learning Rate": 1.8706293706293705e-05, "Full-pretrain/Loss": 2.3977646827697754, "Full-pretrain/Loss (Raw)": 2.3136682510375977, "Full-pretrain/Step": 107, "Full-pretrain/Step Time": 17.714975954216218} +{"Full-pretrain/Learning Rate": 1.888111888111888e-05, "Full-pretrain/Loss": 2.3967840671539307, "Full-pretrain/Loss (Raw)": 2.3433609008789062, "Full-pretrain/Step": 108, "Full-pretrain/Step Time": 17.710320940724127} +{"Full-pretrain/Learning Rate": 1.9055944055944055e-05, "Full-pretrain/Loss": 2.3897409439086914, "Full-pretrain/Loss (Raw)": 2.216548442840576, "Full-pretrain/Step": 109, "Full-pretrain/Step Time": 17.707898621165423} +{"Full-pretrain/Learning Rate": 1.923076923076923e-05, "Full-pretrain/Loss": 2.384075164794922, "Full-pretrain/Loss (Raw)": 2.2103192806243896, "Full-pretrain/Step": 110, "Full-pretrain/Step Time": 17.705216134678235} +{"Full-pretrain/Learning Rate": 1.9405594405594408e-05, "Full-pretrain/Loss": 2.3906960487365723, "Full-pretrain/Loss (Raw)": 2.458423614501953, "Full-pretrain/Step": 111, "Full-pretrain/Step Time": 17.705416952167546} +{"Full-pretrain/Learning Rate": 1.958041958041958e-05, "Full-pretrain/Loss": 2.3803153038024902, "Full-pretrain/Loss (Raw)": 2.210139036178589, "Full-pretrain/Step": 112, "Full-pretrain/Step Time": 17.699570193886757} +{"Full-pretrain/Learning Rate": 1.9755244755244758e-05, "Full-pretrain/Loss": 2.3795273303985596, "Full-pretrain/Loss (Raw)": 2.257376194000244, "Full-pretrain/Step": 113, "Full-pretrain/Step Time": 17.697608768412497} +{"Full-pretrain/Learning Rate": 1.993006993006993e-05, "Full-pretrain/Loss": 2.39111065864563, "Full-pretrain/Loss (Raw)": 2.8502087593078613, "Full-pretrain/Step": 114, "Full-pretrain/Step Time": 17.700596200792415} +{"Full-pretrain/Learning Rate": 2.0104895104895104e-05, "Full-pretrain/Loss": 2.3924708366394043, "Full-pretrain/Loss (Raw)": 2.604715585708618, "Full-pretrain/Step": 115, "Full-pretrain/Step Time": 17.699150093742038} +{"Full-pretrain/Learning Rate": 2.027972027972028e-05, "Full-pretrain/Loss": 2.3925540447235107, "Full-pretrain/Loss (Raw)": 2.4158406257629395, "Full-pretrain/Step": 116, "Full-pretrain/Step Time": 17.69246648508927} +{"Full-pretrain/Learning Rate": 2.0454545454545457e-05, "Full-pretrain/Loss": 2.3893229961395264, "Full-pretrain/Loss (Raw)": 2.1472463607788086, "Full-pretrain/Step": 117, "Full-pretrain/Step Time": 17.6938914335691} +{"Full-pretrain/Learning Rate": 2.062937062937063e-05, "Full-pretrain/Loss": 2.377553939819336, "Full-pretrain/Loss (Raw)": 2.216862440109253, "Full-pretrain/Step": 118, "Full-pretrain/Step Time": 17.697399996094784} +{"Full-pretrain/Learning Rate": 2.0804195804195807e-05, "Full-pretrain/Loss": 2.369455337524414, "Full-pretrain/Loss (Raw)": 2.2431154251098633, "Full-pretrain/Step": 119, "Full-pretrain/Step Time": 17.692317626055548} +{"Full-pretrain/Learning Rate": 2.097902097902098e-05, "Full-pretrain/Loss": 2.3612289428710938, "Full-pretrain/Loss (Raw)": 2.2619643211364746, "Full-pretrain/Step": 120, "Full-pretrain/Step Time": 17.689015982548394} +{"Full-pretrain/Learning Rate": 2.1153846153846154e-05, "Full-pretrain/Loss": 2.3562123775482178, "Full-pretrain/Loss (Raw)": 2.2956106662750244, "Full-pretrain/Step": 121, "Full-pretrain/Step Time": 17.685171150964155} +{"Full-pretrain/Learning Rate": 2.132867132867133e-05, "Full-pretrain/Loss": 2.361546039581299, "Full-pretrain/Loss (Raw)": 2.3416943550109863, "Full-pretrain/Step": 122, "Full-pretrain/Step Time": 17.690528343935483} +{"Full-pretrain/Learning Rate": 2.1503496503496503e-05, "Full-pretrain/Loss": 2.357400894165039, "Full-pretrain/Loss (Raw)": 2.397726535797119, "Full-pretrain/Step": 123, "Full-pretrain/Step Time": 17.68956783728871} +{"Full-pretrain/Learning Rate": 2.1678321678321677e-05, "Full-pretrain/Loss": 2.370567798614502, "Full-pretrain/Loss (Raw)": 2.6941637992858887, "Full-pretrain/Step": 124, "Full-pretrain/Step Time": 17.681832380833164} +{"Full-pretrain/Learning Rate": 2.1853146853146857e-05, "Full-pretrain/Loss": 2.3698954582214355, "Full-pretrain/Loss (Raw)": 2.1731412410736084, "Full-pretrain/Step": 125, "Full-pretrain/Step Time": 17.67973394203186} +{"Full-pretrain/Learning Rate": 2.202797202797203e-05, "Full-pretrain/Loss": 2.3657546043395996, "Full-pretrain/Loss (Raw)": 2.4705734252929688, "Full-pretrain/Step": 126, "Full-pretrain/Step Time": 17.68356640376742} +{"Full-pretrain/Learning Rate": 2.2202797202797203e-05, "Full-pretrain/Loss": 2.3567728996276855, "Full-pretrain/Loss (Raw)": 2.1998414993286133, "Full-pretrain/Step": 127, "Full-pretrain/Step Time": 17.686162306567816} +{"Full-pretrain/Learning Rate": 2.237762237762238e-05, "Full-pretrain/Loss": 2.352224349975586, "Full-pretrain/Loss (Raw)": 2.274550437927246, "Full-pretrain/Step": 128, "Full-pretrain/Step Time": 17.68028506077826} +{"Full-pretrain/Learning Rate": 2.2552447552447553e-05, "Full-pretrain/Loss": 2.3442230224609375, "Full-pretrain/Loss (Raw)": 2.3268465995788574, "Full-pretrain/Step": 129, "Full-pretrain/Step Time": 17.64991289936006} +{"Full-pretrain/Learning Rate": 2.272727272727273e-05, "Full-pretrain/Loss": 2.350882053375244, "Full-pretrain/Loss (Raw)": 2.568345069885254, "Full-pretrain/Step": 130, "Full-pretrain/Step Time": 17.65155733935535} +{"Full-pretrain/Learning Rate": 2.2902097902097902e-05, "Full-pretrain/Loss": 2.3442325592041016, "Full-pretrain/Loss (Raw)": 2.2341248989105225, "Full-pretrain/Step": 131, "Full-pretrain/Step Time": 17.6517701074481} +{"Full-pretrain/Learning Rate": 2.307692307692308e-05, "Full-pretrain/Loss": 2.348130226135254, "Full-pretrain/Loss (Raw)": 2.42509126663208, "Full-pretrain/Step": 132, "Full-pretrain/Step Time": 17.646906407549977} +{"Full-pretrain/Learning Rate": 2.3251748251748252e-05, "Full-pretrain/Loss": 2.358604669570923, "Full-pretrain/Loss (Raw)": 2.5806992053985596, "Full-pretrain/Step": 133, "Full-pretrain/Step Time": 17.642579071223736} +{"Full-pretrain/Learning Rate": 2.342657342657343e-05, "Full-pretrain/Loss": 2.3701159954071045, "Full-pretrain/Loss (Raw)": 2.5977394580841064, "Full-pretrain/Step": 134, "Full-pretrain/Step Time": 17.642837077379227} +{"Full-pretrain/Learning Rate": 2.3601398601398602e-05, "Full-pretrain/Loss": 2.3825836181640625, "Full-pretrain/Loss (Raw)": 2.8291802406311035, "Full-pretrain/Step": 135, "Full-pretrain/Step Time": 17.648007191717625} +{"Full-pretrain/Learning Rate": 2.377622377622378e-05, "Full-pretrain/Loss": 2.3876466751098633, "Full-pretrain/Loss (Raw)": 2.2097506523132324, "Full-pretrain/Step": 136, "Full-pretrain/Step Time": 17.634839538484812} +{"Full-pretrain/Learning Rate": 2.3951048951048952e-05, "Full-pretrain/Loss": 2.3738951683044434, "Full-pretrain/Loss (Raw)": 2.086665153503418, "Full-pretrain/Step": 137, "Full-pretrain/Step Time": 17.635356575250626} +{"Full-pretrain/Learning Rate": 2.4125874125874125e-05, "Full-pretrain/Loss": 2.368170738220215, "Full-pretrain/Loss (Raw)": 2.325925588607788, "Full-pretrain/Step": 138, "Full-pretrain/Step Time": 17.640584368258715} +{"Full-pretrain/Learning Rate": 2.43006993006993e-05, "Full-pretrain/Loss": 2.371790885925293, "Full-pretrain/Loss (Raw)": 2.4295129776000977, "Full-pretrain/Step": 139, "Full-pretrain/Step Time": 17.632398657500744} +{"Full-pretrain/Learning Rate": 2.4475524475524478e-05, "Full-pretrain/Loss": 2.367018699645996, "Full-pretrain/Loss (Raw)": 2.190657615661621, "Full-pretrain/Step": 140, "Full-pretrain/Step Time": 17.628062712028623} +{"Full-pretrain/Learning Rate": 2.465034965034965e-05, "Full-pretrain/Loss": 2.371650218963623, "Full-pretrain/Loss (Raw)": 2.3647544384002686, "Full-pretrain/Step": 141, "Full-pretrain/Step Time": 17.625106433406472} +{"Full-pretrain/Learning Rate": 2.4825174825174828e-05, "Full-pretrain/Loss": 2.3741326332092285, "Full-pretrain/Loss (Raw)": 2.2897486686706543, "Full-pretrain/Step": 142, "Full-pretrain/Step Time": 17.628641981631517} +{"Full-pretrain/Learning Rate": 2.5e-05, "Full-pretrain/Loss": 2.3724563121795654, "Full-pretrain/Loss (Raw)": 2.404787063598633, "Full-pretrain/Step": 143, "Full-pretrain/Step Time": 17.63568497635424} +{"Full-pretrain/Learning Rate": 2.5174825174825178e-05, "Full-pretrain/Loss": 2.3764045238494873, "Full-pretrain/Loss (Raw)": 2.336480140686035, "Full-pretrain/Step": 144, "Full-pretrain/Step Time": 17.618263876065612} +{"Full-pretrain/Learning Rate": 2.534965034965035e-05, "Full-pretrain/Loss": 2.3788959980010986, "Full-pretrain/Loss (Raw)": 2.3371050357818604, "Full-pretrain/Step": 145, "Full-pretrain/Step Time": 17.615230737254024} +{"Full-pretrain/Learning Rate": 2.5524475524475528e-05, "Full-pretrain/Loss": 2.3638181686401367, "Full-pretrain/Loss (Raw)": 2.367720603942871, "Full-pretrain/Step": 146, "Full-pretrain/Step Time": 17.616698877885938} +{"Full-pretrain/Learning Rate": 2.5699300699300697e-05, "Full-pretrain/Loss": 2.3572678565979004, "Full-pretrain/Loss (Raw)": 2.3951051235198975, "Full-pretrain/Step": 147, "Full-pretrain/Step Time": 17.624759308993816} +{"Full-pretrain/Learning Rate": 2.5874125874125877e-05, "Full-pretrain/Loss": 2.3505959510803223, "Full-pretrain/Loss (Raw)": 2.202332019805908, "Full-pretrain/Step": 148, "Full-pretrain/Step Time": 17.614213751628995} +{"Full-pretrain/Learning Rate": 2.6048951048951047e-05, "Full-pretrain/Loss": 2.3551249504089355, "Full-pretrain/Loss (Raw)": 2.2921814918518066, "Full-pretrain/Step": 149, "Full-pretrain/Step Time": 17.6043848246336} +{"Full-pretrain/Learning Rate": 2.6223776223776224e-05, "Full-pretrain/Loss": 2.3498780727386475, "Full-pretrain/Loss (Raw)": 2.0489649772644043, "Full-pretrain/Step": 150, "Full-pretrain/Step Time": 17.606800731271505} +{"Full-pretrain/Learning Rate": 2.6398601398601404e-05, "Full-pretrain/Loss": 2.3517448902130127, "Full-pretrain/Loss (Raw)": 2.302854061126709, "Full-pretrain/Step": 151, "Full-pretrain/Step Time": 17.611692732200027} +{"Full-pretrain/Learning Rate": 2.6573426573426574e-05, "Full-pretrain/Loss": 2.353682279586792, "Full-pretrain/Loss (Raw)": 2.32395601272583, "Full-pretrain/Step": 152, "Full-pretrain/Step Time": 17.6122017595917} +{"Full-pretrain/Learning Rate": 2.674825174825175e-05, "Full-pretrain/Loss": 2.3517799377441406, "Full-pretrain/Loss (Raw)": 2.2347426414489746, "Full-pretrain/Step": 153, "Full-pretrain/Step Time": 17.602521259337664} +{"Full-pretrain/Learning Rate": 2.6923076923076923e-05, "Full-pretrain/Loss": 2.350602626800537, "Full-pretrain/Loss (Raw)": 2.304015636444092, "Full-pretrain/Step": 154, "Full-pretrain/Step Time": 17.608599338680506} +{"Full-pretrain/Learning Rate": 2.70979020979021e-05, "Full-pretrain/Loss": 2.349372625350952, "Full-pretrain/Loss (Raw)": 2.3583664894104004, "Full-pretrain/Step": 155, "Full-pretrain/Step Time": 17.612156754359603} +{"Full-pretrain/Learning Rate": 2.7272727272727273e-05, "Full-pretrain/Loss": 2.3409008979797363, "Full-pretrain/Loss (Raw)": 2.4230690002441406, "Full-pretrain/Step": 156, "Full-pretrain/Step Time": 17.616753067821264} +{"Full-pretrain/Learning Rate": 2.744755244755245e-05, "Full-pretrain/Loss": 2.3422904014587402, "Full-pretrain/Loss (Raw)": 2.217604160308838, "Full-pretrain/Step": 157, "Full-pretrain/Step Time": 17.60806338302791} +{"Full-pretrain/Learning Rate": 2.762237762237762e-05, "Full-pretrain/Loss": 2.339308261871338, "Full-pretrain/Loss (Raw)": 2.375150680541992, "Full-pretrain/Step": 158, "Full-pretrain/Step Time": 17.61105198599398} +{"Full-pretrain/Learning Rate": 2.77972027972028e-05, "Full-pretrain/Loss": 2.344454288482666, "Full-pretrain/Loss (Raw)": 2.3645081520080566, "Full-pretrain/Step": 159, "Full-pretrain/Step Time": 17.619851702824235} +{"Full-pretrain/Learning Rate": 2.7972027972027976e-05, "Full-pretrain/Loss": 2.3337976932525635, "Full-pretrain/Loss (Raw)": 1.9335448741912842, "Full-pretrain/Step": 160, "Full-pretrain/Step Time": 17.618995267897844} +{"Full-pretrain/Learning Rate": 2.8146853146853146e-05, "Full-pretrain/Loss": 2.335977792739868, "Full-pretrain/Loss (Raw)": 2.3966054916381836, "Full-pretrain/Step": 161, "Full-pretrain/Step Time": 17.616553952917457} +{"Full-pretrain/Learning Rate": 2.8321678321678326e-05, "Full-pretrain/Loss": 2.3270039558410645, "Full-pretrain/Loss (Raw)": 2.2811830043792725, "Full-pretrain/Step": 162, "Full-pretrain/Step Time": 17.609943693503737} +{"Full-pretrain/Learning Rate": 2.8496503496503496e-05, "Full-pretrain/Loss": 2.3359766006469727, "Full-pretrain/Loss (Raw)": 2.521249771118164, "Full-pretrain/Step": 163, "Full-pretrain/Step Time": 17.613215221092105} +{"Full-pretrain/Learning Rate": 2.8671328671328672e-05, "Full-pretrain/Loss": 2.332341432571411, "Full-pretrain/Loss (Raw)": 2.308769702911377, "Full-pretrain/Step": 164, "Full-pretrain/Step Time": 17.61568285897374} +{"Full-pretrain/Learning Rate": 2.8846153846153845e-05, "Full-pretrain/Loss": 2.3215065002441406, "Full-pretrain/Loss (Raw)": 2.2339744567871094, "Full-pretrain/Step": 165, "Full-pretrain/Step Time": 17.607780531048775} +{"Full-pretrain/Learning Rate": 2.9020979020979022e-05, "Full-pretrain/Loss": 2.3075790405273438, "Full-pretrain/Loss (Raw)": 2.152062177658081, "Full-pretrain/Step": 166, "Full-pretrain/Step Time": 17.604819230735302} +{"Full-pretrain/Learning Rate": 2.91958041958042e-05, "Full-pretrain/Loss": 2.2846384048461914, "Full-pretrain/Loss (Raw)": 2.0950865745544434, "Full-pretrain/Step": 167, "Full-pretrain/Step Time": 17.610039960592985} +{"Full-pretrain/Learning Rate": 2.9370629370629372e-05, "Full-pretrain/Loss": 2.287402629852295, "Full-pretrain/Loss (Raw)": 2.298201084136963, "Full-pretrain/Step": 168, "Full-pretrain/Step Time": 17.61007510125637} +{"Full-pretrain/Learning Rate": 2.954545454545455e-05, "Full-pretrain/Loss": 2.2924017906188965, "Full-pretrain/Loss (Raw)": 2.246640682220459, "Full-pretrain/Step": 169, "Full-pretrain/Step Time": 17.61378590017557} +{"Full-pretrain/Learning Rate": 2.972027972027972e-05, "Full-pretrain/Loss": 2.291863441467285, "Full-pretrain/Loss (Raw)": 2.308694362640381, "Full-pretrain/Step": 170, "Full-pretrain/Step Time": 17.60226279683411} +{"Full-pretrain/Learning Rate": 2.9895104895104898e-05, "Full-pretrain/Loss": 2.293942928314209, "Full-pretrain/Loss (Raw)": 2.4960618019104004, "Full-pretrain/Step": 171, "Full-pretrain/Step Time": 17.610816357657313} +{"Full-pretrain/Learning Rate": 3.0069930069930068e-05, "Full-pretrain/Loss": 2.293041706085205, "Full-pretrain/Loss (Raw)": 2.1618170738220215, "Full-pretrain/Step": 172, "Full-pretrain/Step Time": 17.61400919780135} +{"Full-pretrain/Learning Rate": 3.0244755244755245e-05, "Full-pretrain/Loss": 2.288443088531494, "Full-pretrain/Loss (Raw)": 2.2175896167755127, "Full-pretrain/Step": 173, "Full-pretrain/Step Time": 17.61107743345201} +{"Full-pretrain/Learning Rate": 3.0419580419580425e-05, "Full-pretrain/Loss": 2.292367458343506, "Full-pretrain/Loss (Raw)": 2.415334701538086, "Full-pretrain/Step": 174, "Full-pretrain/Step Time": 17.609460650011897} +{"Full-pretrain/Learning Rate": 3.0594405594405594e-05, "Full-pretrain/Loss": 2.283578872680664, "Full-pretrain/Loss (Raw)": 2.1235504150390625, "Full-pretrain/Step": 175, "Full-pretrain/Step Time": 17.608549447730184} +{"Full-pretrain/Learning Rate": 3.0769230769230774e-05, "Full-pretrain/Loss": 2.2836732864379883, "Full-pretrain/Loss (Raw)": 2.3395042419433594, "Full-pretrain/Step": 176, "Full-pretrain/Step Time": 17.617208916693926} +{"Full-pretrain/Learning Rate": 3.094405594405594e-05, "Full-pretrain/Loss": 2.280701160430908, "Full-pretrain/Loss (Raw)": 2.241992950439453, "Full-pretrain/Step": 177, "Full-pretrain/Step Time": 17.623572055250406} +{"Full-pretrain/Learning Rate": 3.111888111888112e-05, "Full-pretrain/Loss": 2.2776131629943848, "Full-pretrain/Loss (Raw)": 2.2689032554626465, "Full-pretrain/Step": 178, "Full-pretrain/Step Time": 17.621300920844078} +{"Full-pretrain/Learning Rate": 3.1293706293706294e-05, "Full-pretrain/Loss": 2.2741105556488037, "Full-pretrain/Loss (Raw)": 2.283022880554199, "Full-pretrain/Step": 179, "Full-pretrain/Step Time": 17.619399452582} +{"Full-pretrain/Learning Rate": 3.146853146853147e-05, "Full-pretrain/Loss": 2.27595853805542, "Full-pretrain/Loss (Raw)": 2.261465072631836, "Full-pretrain/Step": 180, "Full-pretrain/Step Time": 17.62176539003849} +{"Full-pretrain/Learning Rate": 3.164335664335665e-05, "Full-pretrain/Loss": 2.275791883468628, "Full-pretrain/Loss (Raw)": 2.2868518829345703, "Full-pretrain/Step": 181, "Full-pretrain/Step Time": 17.627906017005444} +{"Full-pretrain/Learning Rate": 3.181818181818182e-05, "Full-pretrain/Loss": 2.2793455123901367, "Full-pretrain/Loss (Raw)": 2.1626861095428467, "Full-pretrain/Step": 182, "Full-pretrain/Step Time": 17.625575862824917} +{"Full-pretrain/Learning Rate": 3.1993006993006994e-05, "Full-pretrain/Loss": 2.278348922729492, "Full-pretrain/Loss (Raw)": 2.2709569931030273, "Full-pretrain/Step": 183, "Full-pretrain/Step Time": 17.620169814676046} +{"Full-pretrain/Learning Rate": 3.216783216783217e-05, "Full-pretrain/Loss": 2.283242702484131, "Full-pretrain/Loss (Raw)": 2.4805641174316406, "Full-pretrain/Step": 184, "Full-pretrain/Step Time": 17.625290310010314} +{"Full-pretrain/Learning Rate": 3.234265734265735e-05, "Full-pretrain/Loss": 2.2826428413391113, "Full-pretrain/Loss (Raw)": 2.215546131134033, "Full-pretrain/Step": 185, "Full-pretrain/Step Time": 17.623831778764725} +{"Full-pretrain/Learning Rate": 3.251748251748252e-05, "Full-pretrain/Loss": 2.274026393890381, "Full-pretrain/Loss (Raw)": 2.028286933898926, "Full-pretrain/Step": 186, "Full-pretrain/Step Time": 17.623458417132497} +{"Full-pretrain/Learning Rate": 3.269230769230769e-05, "Full-pretrain/Loss": 2.2715556621551514, "Full-pretrain/Loss (Raw)": 2.2793049812316895, "Full-pretrain/Step": 187, "Full-pretrain/Step Time": 17.619387596845627} +{"Full-pretrain/Learning Rate": 3.2867132867132866e-05, "Full-pretrain/Loss": 2.278155565261841, "Full-pretrain/Loss (Raw)": 2.6342620849609375, "Full-pretrain/Step": 188, "Full-pretrain/Step Time": 17.6296706199646} +{"Full-pretrain/Learning Rate": 3.3041958041958046e-05, "Full-pretrain/Loss": 2.2814221382141113, "Full-pretrain/Loss (Raw)": 2.3221399784088135, "Full-pretrain/Step": 189, "Full-pretrain/Step Time": 17.628070067614317} +{"Full-pretrain/Learning Rate": 3.321678321678322e-05, "Full-pretrain/Loss": 2.276815414428711, "Full-pretrain/Loss (Raw)": 2.2277283668518066, "Full-pretrain/Step": 190, "Full-pretrain/Step Time": 17.626179821789265} +{"Full-pretrain/Learning Rate": 3.339160839160839e-05, "Full-pretrain/Loss": 2.277039051055908, "Full-pretrain/Loss (Raw)": 2.3716726303100586, "Full-pretrain/Step": 191, "Full-pretrain/Step Time": 17.619067803025246} +{"Full-pretrain/Learning Rate": 3.356643356643357e-05, "Full-pretrain/Loss": 2.2784600257873535, "Full-pretrain/Loss (Raw)": 1.9790087938308716, "Full-pretrain/Step": 192, "Full-pretrain/Step Time": 17.616391653195024} +{"Full-pretrain/Learning Rate": 3.374125874125874e-05, "Full-pretrain/Loss": 2.273700475692749, "Full-pretrain/Loss (Raw)": 2.2442994117736816, "Full-pretrain/Step": 193, "Full-pretrain/Step Time": 17.621076818555593} +{"Full-pretrain/Learning Rate": 3.391608391608392e-05, "Full-pretrain/Loss": 2.2750039100646973, "Full-pretrain/Loss (Raw)": 2.3229010105133057, "Full-pretrain/Step": 194, "Full-pretrain/Step Time": 17.612045565620065} +{"Full-pretrain/Learning Rate": 3.409090909090909e-05, "Full-pretrain/Loss": 2.268221855163574, "Full-pretrain/Loss (Raw)": 2.3042235374450684, "Full-pretrain/Step": 195, "Full-pretrain/Step Time": 17.613690609112382} +{"Full-pretrain/Learning Rate": 3.4265734265734265e-05, "Full-pretrain/Loss": 2.26545786857605, "Full-pretrain/Loss (Raw)": 2.220317840576172, "Full-pretrain/Step": 196, "Full-pretrain/Step Time": 17.61580199562013} +{"Full-pretrain/Learning Rate": 3.4440559440559445e-05, "Full-pretrain/Loss": 2.2736382484436035, "Full-pretrain/Loss (Raw)": 2.49574875831604, "Full-pretrain/Step": 197, "Full-pretrain/Step Time": 17.611449481919408} +{"Full-pretrain/Learning Rate": 3.461538461538462e-05, "Full-pretrain/Loss": 2.2809643745422363, "Full-pretrain/Loss (Raw)": 2.386500358581543, "Full-pretrain/Step": 198, "Full-pretrain/Step Time": 17.606081746518612} +{"Full-pretrain/Learning Rate": 3.479020979020979e-05, "Full-pretrain/Loss": 2.2848806381225586, "Full-pretrain/Loss (Raw)": 2.220397710800171, "Full-pretrain/Step": 199, "Full-pretrain/Step Time": 17.609084187075496} +{"Full-pretrain/Learning Rate": 3.4965034965034965e-05, "Full-pretrain/Loss": 2.2850635051727295, "Full-pretrain/Loss (Raw)": 2.304060935974121, "Full-pretrain/Step": 200, "Full-pretrain/Step Time": 17.605544039979577} +{"Full-pretrain/Learning Rate": 3.5139860139860145e-05, "Full-pretrain/Loss": 2.2841978073120117, "Full-pretrain/Loss (Raw)": 2.218942165374756, "Full-pretrain/Step": 201, "Full-pretrain/Step Time": 17.605579882860184} +{"Full-pretrain/Learning Rate": 3.531468531468531e-05, "Full-pretrain/Loss": 2.2950282096862793, "Full-pretrain/Loss (Raw)": 2.655259132385254, "Full-pretrain/Step": 202, "Full-pretrain/Step Time": 17.60762817785144} +{"Full-pretrain/Learning Rate": 3.548951048951049e-05, "Full-pretrain/Loss": 2.2841880321502686, "Full-pretrain/Loss (Raw)": 2.1491737365722656, "Full-pretrain/Step": 203, "Full-pretrain/Step Time": 17.609390072524548} +{"Full-pretrain/Learning Rate": 3.566433566433567e-05, "Full-pretrain/Loss": 2.283463954925537, "Full-pretrain/Loss (Raw)": 2.1386561393737793, "Full-pretrain/Step": 204, "Full-pretrain/Step Time": 17.60601164959371} +{"Full-pretrain/Learning Rate": 3.583916083916084e-05, "Full-pretrain/Loss": 2.284975290298462, "Full-pretrain/Loss (Raw)": 2.2659499645233154, "Full-pretrain/Step": 205, "Full-pretrain/Step Time": 17.602690069004893} +{"Full-pretrain/Learning Rate": 3.601398601398602e-05, "Full-pretrain/Loss": 2.2749383449554443, "Full-pretrain/Loss (Raw)": 2.094149112701416, "Full-pretrain/Step": 206, "Full-pretrain/Step Time": 17.60089728422463} +{"Full-pretrain/Learning Rate": 3.618881118881119e-05, "Full-pretrain/Loss": 2.2825136184692383, "Full-pretrain/Loss (Raw)": 2.3659610748291016, "Full-pretrain/Step": 207, "Full-pretrain/Step Time": 17.60215832479298} +{"Full-pretrain/Learning Rate": 3.6363636363636364e-05, "Full-pretrain/Loss": 2.2795772552490234, "Full-pretrain/Loss (Raw)": 2.245537281036377, "Full-pretrain/Step": 208, "Full-pretrain/Step Time": 17.60186872445047} +{"Full-pretrain/Learning Rate": 3.653846153846154e-05, "Full-pretrain/Loss": 2.280552864074707, "Full-pretrain/Loss (Raw)": 2.273219585418701, "Full-pretrain/Step": 209, "Full-pretrain/Step Time": 17.599217606708407} +{"Full-pretrain/Learning Rate": 3.671328671328672e-05, "Full-pretrain/Loss": 2.2767066955566406, "Full-pretrain/Loss (Raw)": 2.1458210945129395, "Full-pretrain/Step": 210, "Full-pretrain/Step Time": 17.593530409038067} +{"Full-pretrain/Learning Rate": 3.688811188811189e-05, "Full-pretrain/Loss": 2.2825160026550293, "Full-pretrain/Loss (Raw)": 2.4689178466796875, "Full-pretrain/Step": 211, "Full-pretrain/Step Time": 17.59740144573152} +{"Full-pretrain/Learning Rate": 3.7062937062937064e-05, "Full-pretrain/Loss": 2.2858963012695312, "Full-pretrain/Loss (Raw)": 2.3696417808532715, "Full-pretrain/Step": 212, "Full-pretrain/Step Time": 17.597805373370647} +{"Full-pretrain/Learning Rate": 3.7237762237762244e-05, "Full-pretrain/Loss": 2.284372091293335, "Full-pretrain/Loss (Raw)": 2.2380709648132324, "Full-pretrain/Step": 213, "Full-pretrain/Step Time": 17.59593452140689} +{"Full-pretrain/Learning Rate": 3.741258741258741e-05, "Full-pretrain/Loss": 2.294215202331543, "Full-pretrain/Loss (Raw)": 2.4776670932769775, "Full-pretrain/Step": 214, "Full-pretrain/Step Time": 17.60096567682922} +{"Full-pretrain/Learning Rate": 3.758741258741259e-05, "Full-pretrain/Loss": 2.2979660034179688, "Full-pretrain/Loss (Raw)": 2.3909811973571777, "Full-pretrain/Step": 215, "Full-pretrain/Step Time": 17.60901656933129} +{"Full-pretrain/Learning Rate": 3.776223776223776e-05, "Full-pretrain/Loss": 2.29209303855896, "Full-pretrain/Loss (Raw)": 2.292631149291992, "Full-pretrain/Step": 216, "Full-pretrain/Step Time": 17.606718165799975} +{"Full-pretrain/Learning Rate": 3.7937062937062936e-05, "Full-pretrain/Loss": 2.2909798622131348, "Full-pretrain/Loss (Raw)": 2.1799275875091553, "Full-pretrain/Step": 217, "Full-pretrain/Step Time": 17.597297063097358} +{"Full-pretrain/Learning Rate": 3.811188811188811e-05, "Full-pretrain/Loss": 2.297795295715332, "Full-pretrain/Loss (Raw)": 2.24638032913208, "Full-pretrain/Step": 218, "Full-pretrain/Step Time": 17.596692262217402} +{"Full-pretrain/Learning Rate": 3.828671328671329e-05, "Full-pretrain/Loss": 2.2968125343322754, "Full-pretrain/Loss (Raw)": 2.247854471206665, "Full-pretrain/Step": 219, "Full-pretrain/Step Time": 17.602213948965073} +{"Full-pretrain/Learning Rate": 3.846153846153846e-05, "Full-pretrain/Loss": 2.2796213626861572, "Full-pretrain/Loss (Raw)": 2.084141731262207, "Full-pretrain/Step": 220, "Full-pretrain/Step Time": 17.599893156439066} +{"Full-pretrain/Learning Rate": 3.8636363636363636e-05, "Full-pretrain/Loss": 2.2777509689331055, "Full-pretrain/Loss (Raw)": 2.2622900009155273, "Full-pretrain/Step": 221, "Full-pretrain/Step Time": 17.601096834987402} +{"Full-pretrain/Learning Rate": 3.8811188811188816e-05, "Full-pretrain/Loss": 2.2760262489318848, "Full-pretrain/Loss (Raw)": 2.1725330352783203, "Full-pretrain/Step": 222, "Full-pretrain/Step Time": 17.595069497823715} +{"Full-pretrain/Learning Rate": 3.898601398601399e-05, "Full-pretrain/Loss": 2.275251865386963, "Full-pretrain/Loss (Raw)": 2.346900224685669, "Full-pretrain/Step": 223, "Full-pretrain/Step Time": 17.60195429250598} +{"Full-pretrain/Learning Rate": 3.916083916083916e-05, "Full-pretrain/Loss": 2.2744688987731934, "Full-pretrain/Loss (Raw)": 1.9539413452148438, "Full-pretrain/Step": 224, "Full-pretrain/Step Time": 17.60216056369245} +{"Full-pretrain/Learning Rate": 3.9335664335664336e-05, "Full-pretrain/Loss": 2.272345542907715, "Full-pretrain/Loss (Raw)": 2.1763548851013184, "Full-pretrain/Step": 225, "Full-pretrain/Step Time": 17.597854044288397} +{"Full-pretrain/Learning Rate": 3.9510489510489516e-05, "Full-pretrain/Loss": 2.272411823272705, "Full-pretrain/Loss (Raw)": 2.3250203132629395, "Full-pretrain/Step": 226, "Full-pretrain/Step Time": 17.599331626668572} +{"Full-pretrain/Learning Rate": 3.968531468531469e-05, "Full-pretrain/Loss": 2.2763028144836426, "Full-pretrain/Loss (Raw)": 2.4287424087524414, "Full-pretrain/Step": 227, "Full-pretrain/Step Time": 17.59279560483992} +{"Full-pretrain/Learning Rate": 3.986013986013986e-05, "Full-pretrain/Loss": 2.2797069549560547, "Full-pretrain/Loss (Raw)": 2.329245090484619, "Full-pretrain/Step": 228, "Full-pretrain/Step Time": 17.590088983997703} +{"Full-pretrain/Learning Rate": 4.0034965034965035e-05, "Full-pretrain/Loss": 2.2719836235046387, "Full-pretrain/Loss (Raw)": 2.2486000061035156, "Full-pretrain/Step": 229, "Full-pretrain/Step Time": 17.589998906478286} +{"Full-pretrain/Learning Rate": 4.020979020979021e-05, "Full-pretrain/Loss": 2.258922576904297, "Full-pretrain/Loss (Raw)": 1.9685560464859009, "Full-pretrain/Step": 230, "Full-pretrain/Step Time": 17.59135092049837} +{"Full-pretrain/Learning Rate": 4.038461538461539e-05, "Full-pretrain/Loss": 2.2575578689575195, "Full-pretrain/Loss (Raw)": 2.1767282485961914, "Full-pretrain/Step": 231, "Full-pretrain/Step Time": 17.594289673492312} +{"Full-pretrain/Learning Rate": 4.055944055944056e-05, "Full-pretrain/Loss": 2.2540340423583984, "Full-pretrain/Loss (Raw)": 2.191287040710449, "Full-pretrain/Step": 232, "Full-pretrain/Step Time": 17.594126649200916} +{"Full-pretrain/Learning Rate": 4.0734265734265735e-05, "Full-pretrain/Loss": 2.2537472248077393, "Full-pretrain/Loss (Raw)": 2.2097673416137695, "Full-pretrain/Step": 233, "Full-pretrain/Step Time": 17.593385947868228} +{"Full-pretrain/Learning Rate": 4.0909090909090915e-05, "Full-pretrain/Loss": 2.2528741359710693, "Full-pretrain/Loss (Raw)": 2.627323865890503, "Full-pretrain/Step": 234, "Full-pretrain/Step Time": 17.589843729510903} +{"Full-pretrain/Learning Rate": 4.108391608391609e-05, "Full-pretrain/Loss": 2.2552783489227295, "Full-pretrain/Loss (Raw)": 2.226107120513916, "Full-pretrain/Step": 235, "Full-pretrain/Step Time": 17.592183416709304} +{"Full-pretrain/Learning Rate": 4.125874125874126e-05, "Full-pretrain/Loss": 2.2612180709838867, "Full-pretrain/Loss (Raw)": 2.328726291656494, "Full-pretrain/Step": 236, "Full-pretrain/Step Time": 17.591211216524243} +{"Full-pretrain/Learning Rate": 4.1433566433566434e-05, "Full-pretrain/Loss": 2.26106595993042, "Full-pretrain/Loss (Raw)": 2.261080741882324, "Full-pretrain/Step": 237, "Full-pretrain/Step Time": 17.601250998675823} +{"Full-pretrain/Learning Rate": 4.1608391608391614e-05, "Full-pretrain/Loss": 2.263763904571533, "Full-pretrain/Loss (Raw)": 2.180492401123047, "Full-pretrain/Step": 238, "Full-pretrain/Step Time": 17.600915618240833} +{"Full-pretrain/Learning Rate": 4.178321678321678e-05, "Full-pretrain/Loss": 2.257570266723633, "Full-pretrain/Loss (Raw)": 2.1677637100219727, "Full-pretrain/Step": 239, "Full-pretrain/Step Time": 17.60141441784799} +{"Full-pretrain/Learning Rate": 4.195804195804196e-05, "Full-pretrain/Loss": 2.2621870040893555, "Full-pretrain/Loss (Raw)": 2.39327073097229, "Full-pretrain/Step": 240, "Full-pretrain/Step Time": 17.6010510828346} +{"Full-pretrain/Learning Rate": 4.213286713286714e-05, "Full-pretrain/Loss": 2.264650344848633, "Full-pretrain/Loss (Raw)": 2.352039337158203, "Full-pretrain/Step": 241, "Full-pretrain/Step Time": 17.60063854791224} +{"Full-pretrain/Learning Rate": 4.230769230769231e-05, "Full-pretrain/Loss": 2.2685751914978027, "Full-pretrain/Loss (Raw)": 2.2714178562164307, "Full-pretrain/Step": 242, "Full-pretrain/Step Time": 17.599930940195918} +{"Full-pretrain/Learning Rate": 4.248251748251749e-05, "Full-pretrain/Loss": 2.2560980319976807, "Full-pretrain/Loss (Raw)": 2.069654703140259, "Full-pretrain/Step": 243, "Full-pretrain/Step Time": 17.60268242843449} +{"Full-pretrain/Learning Rate": 4.265734265734266e-05, "Full-pretrain/Loss": 2.2533392906188965, "Full-pretrain/Loss (Raw)": 2.2813620567321777, "Full-pretrain/Step": 244, "Full-pretrain/Step Time": 17.604679133743048} +{"Full-pretrain/Learning Rate": 4.2832167832167833e-05, "Full-pretrain/Loss": 2.2534871101379395, "Full-pretrain/Loss (Raw)": 2.242798328399658, "Full-pretrain/Step": 245, "Full-pretrain/Step Time": 17.603650834411383} +{"Full-pretrain/Learning Rate": 4.300699300699301e-05, "Full-pretrain/Loss": 2.24623966217041, "Full-pretrain/Loss (Raw)": 2.245750665664673, "Full-pretrain/Step": 246, "Full-pretrain/Step Time": 17.600864863023162} +{"Full-pretrain/Learning Rate": 4.318181818181819e-05, "Full-pretrain/Loss": 2.239321231842041, "Full-pretrain/Loss (Raw)": 2.169588565826416, "Full-pretrain/Step": 247, "Full-pretrain/Step Time": 17.60484859906137} +{"Full-pretrain/Learning Rate": 4.335664335664335e-05, "Full-pretrain/Loss": 2.235301971435547, "Full-pretrain/Loss (Raw)": 2.164015531539917, "Full-pretrain/Step": 248, "Full-pretrain/Step Time": 17.606402151286602} +{"Full-pretrain/Learning Rate": 4.353146853146853e-05, "Full-pretrain/Loss": 2.235013008117676, "Full-pretrain/Loss (Raw)": 2.1706767082214355, "Full-pretrain/Step": 249, "Full-pretrain/Step Time": 17.607487708330154} +{"Full-pretrain/Learning Rate": 4.370629370629371e-05, "Full-pretrain/Loss": 2.2345314025878906, "Full-pretrain/Loss (Raw)": 2.2309746742248535, "Full-pretrain/Step": 250, "Full-pretrain/Step Time": 17.60618708655238} +{"Full-pretrain/Learning Rate": 4.388111888111888e-05, "Full-pretrain/Loss": 2.227437973022461, "Full-pretrain/Loss (Raw)": 2.0208628177642822, "Full-pretrain/Step": 251, "Full-pretrain/Step Time": 17.605835117399693} +{"Full-pretrain/Learning Rate": 4.405594405594406e-05, "Full-pretrain/Loss": 2.223203182220459, "Full-pretrain/Loss (Raw)": 1.9486311674118042, "Full-pretrain/Step": 252, "Full-pretrain/Step Time": 17.614317500963807} +{"Full-pretrain/Learning Rate": 4.423076923076923e-05, "Full-pretrain/Loss": 2.222386598587036, "Full-pretrain/Loss (Raw)": 2.236158847808838, "Full-pretrain/Step": 253, "Full-pretrain/Step Time": 17.61350386403501} +{"Full-pretrain/Learning Rate": 4.4405594405594406e-05, "Full-pretrain/Loss": 2.229820728302002, "Full-pretrain/Loss (Raw)": 2.410426378250122, "Full-pretrain/Step": 254, "Full-pretrain/Step Time": 17.613127253949642} +{"Full-pretrain/Learning Rate": 4.458041958041958e-05, "Full-pretrain/Loss": 2.228335380554199, "Full-pretrain/Loss (Raw)": 2.2993743419647217, "Full-pretrain/Step": 255, "Full-pretrain/Step Time": 17.61766368150711} +{"Full-pretrain/Learning Rate": 4.475524475524476e-05, "Full-pretrain/Loss": 2.230043888092041, "Full-pretrain/Loss (Raw)": 2.008608341217041, "Full-pretrain/Step": 256, "Full-pretrain/Step Time": 17.624356243759394} +{"Full-pretrain/Learning Rate": 4.493006993006993e-05, "Full-pretrain/Loss": 2.234293222427368, "Full-pretrain/Loss (Raw)": 2.312333822250366, "Full-pretrain/Step": 257, "Full-pretrain/Step Time": 17.62417438067496} +{"Full-pretrain/Learning Rate": 4.5104895104895105e-05, "Full-pretrain/Loss": 2.23201322555542, "Full-pretrain/Loss (Raw)": 2.2520649433135986, "Full-pretrain/Step": 258, "Full-pretrain/Step Time": 17.622869916260242} +{"Full-pretrain/Learning Rate": 4.5279720279720285e-05, "Full-pretrain/Loss": 2.221184730529785, "Full-pretrain/Loss (Raw)": 2.0822200775146484, "Full-pretrain/Step": 259, "Full-pretrain/Step Time": 17.62840968556702} +{"Full-pretrain/Learning Rate": 4.545454545454546e-05, "Full-pretrain/Loss": 2.2115681171417236, "Full-pretrain/Loss (Raw)": 2.021516799926758, "Full-pretrain/Step": 260, "Full-pretrain/Step Time": 17.629528110846877} +{"Full-pretrain/Learning Rate": 4.562937062937063e-05, "Full-pretrain/Loss": 2.210681915283203, "Full-pretrain/Loss (Raw)": 2.220236301422119, "Full-pretrain/Step": 261, "Full-pretrain/Step Time": 17.62991330958903} +{"Full-pretrain/Learning Rate": 4.5804195804195805e-05, "Full-pretrain/Loss": 2.226487636566162, "Full-pretrain/Loss (Raw)": 2.474337339401245, "Full-pretrain/Step": 262, "Full-pretrain/Step Time": 17.630009254440665} +{"Full-pretrain/Learning Rate": 4.597902097902098e-05, "Full-pretrain/Loss": 2.2301723957061768, "Full-pretrain/Loss (Raw)": 2.294642448425293, "Full-pretrain/Step": 263, "Full-pretrain/Step Time": 17.634197967126966} +{"Full-pretrain/Learning Rate": 4.615384615384616e-05, "Full-pretrain/Loss": 2.2307887077331543, "Full-pretrain/Loss (Raw)": 2.2110133171081543, "Full-pretrain/Step": 264, "Full-pretrain/Step Time": 17.634891539812088} +{"Full-pretrain/Learning Rate": 4.632867132867133e-05, "Full-pretrain/Loss": 2.232266902923584, "Full-pretrain/Loss (Raw)": 2.257071018218994, "Full-pretrain/Step": 265, "Full-pretrain/Step Time": 17.635059541091323} +{"Full-pretrain/Learning Rate": 4.6503496503496505e-05, "Full-pretrain/Loss": 2.2234511375427246, "Full-pretrain/Loss (Raw)": 2.3452155590057373, "Full-pretrain/Step": 266, "Full-pretrain/Step Time": 17.63328268006444} +{"Full-pretrain/Learning Rate": 4.667832167832168e-05, "Full-pretrain/Loss": 2.218543767929077, "Full-pretrain/Loss (Raw)": 2.0690689086914062, "Full-pretrain/Step": 267, "Full-pretrain/Step Time": 17.63940687663853} +{"Full-pretrain/Learning Rate": 4.685314685314686e-05, "Full-pretrain/Loss": 2.2180120944976807, "Full-pretrain/Loss (Raw)": 2.3117170333862305, "Full-pretrain/Step": 268, "Full-pretrain/Step Time": 17.64001845009625} +{"Full-pretrain/Learning Rate": 4.702797202797203e-05, "Full-pretrain/Loss": 2.2174112796783447, "Full-pretrain/Loss (Raw)": 2.241854667663574, "Full-pretrain/Step": 269, "Full-pretrain/Step Time": 17.641083169728518} +{"Full-pretrain/Learning Rate": 4.7202797202797204e-05, "Full-pretrain/Loss": 2.2157182693481445, "Full-pretrain/Loss (Raw)": 2.126321792602539, "Full-pretrain/Step": 270, "Full-pretrain/Step Time": 17.642802910879254} +{"Full-pretrain/Learning Rate": 4.7377622377622384e-05, "Full-pretrain/Loss": 2.2162585258483887, "Full-pretrain/Loss (Raw)": 2.1850454807281494, "Full-pretrain/Step": 271, "Full-pretrain/Step Time": 17.647682905197144} +{"Full-pretrain/Learning Rate": 4.755244755244756e-05, "Full-pretrain/Loss": 2.209033966064453, "Full-pretrain/Loss (Raw)": 2.162091016769409, "Full-pretrain/Step": 272, "Full-pretrain/Step Time": 17.644633838906884} +{"Full-pretrain/Learning Rate": 4.772727272727273e-05, "Full-pretrain/Loss": 2.2089080810546875, "Full-pretrain/Loss (Raw)": 2.348003387451172, "Full-pretrain/Step": 273, "Full-pretrain/Step Time": 17.646665642037988} +{"Full-pretrain/Learning Rate": 4.7902097902097904e-05, "Full-pretrain/Loss": 2.2043089866638184, "Full-pretrain/Loss (Raw)": 2.124253988265991, "Full-pretrain/Step": 274, "Full-pretrain/Step Time": 17.649189172312617} +{"Full-pretrain/Learning Rate": 4.8076923076923084e-05, "Full-pretrain/Loss": 2.212877035140991, "Full-pretrain/Loss (Raw)": 2.34382963180542, "Full-pretrain/Step": 275, "Full-pretrain/Step Time": 17.650630151852965} +{"Full-pretrain/Learning Rate": 4.825174825174825e-05, "Full-pretrain/Loss": 2.2103519439697266, "Full-pretrain/Loss (Raw)": 2.200559616088867, "Full-pretrain/Step": 276, "Full-pretrain/Step Time": 17.655262496322393} +{"Full-pretrain/Learning Rate": 4.842657342657343e-05, "Full-pretrain/Loss": 2.2163758277893066, "Full-pretrain/Loss (Raw)": 2.4355626106262207, "Full-pretrain/Step": 277, "Full-pretrain/Step Time": 17.660466806963086} +{"Full-pretrain/Learning Rate": 4.86013986013986e-05, "Full-pretrain/Loss": 2.218207836151123, "Full-pretrain/Loss (Raw)": 2.3043770790100098, "Full-pretrain/Step": 278, "Full-pretrain/Step Time": 17.659154096618295} +{"Full-pretrain/Learning Rate": 4.8776223776223776e-05, "Full-pretrain/Loss": 2.2224395275115967, "Full-pretrain/Loss (Raw)": 2.3049991130828857, "Full-pretrain/Step": 279, "Full-pretrain/Step Time": 17.659552037715912} +{"Full-pretrain/Learning Rate": 4.8951048951048956e-05, "Full-pretrain/Loss": 2.221039056777954, "Full-pretrain/Loss (Raw)": 2.11920166015625, "Full-pretrain/Step": 280, "Full-pretrain/Step Time": 17.66153551824391} +{"Full-pretrain/Learning Rate": 4.912587412587413e-05, "Full-pretrain/Loss": 2.227308750152588, "Full-pretrain/Loss (Raw)": 2.3713066577911377, "Full-pretrain/Step": 281, "Full-pretrain/Step Time": 17.666069768369198} +{"Full-pretrain/Learning Rate": 4.93006993006993e-05, "Full-pretrain/Loss": 2.225775718688965, "Full-pretrain/Loss (Raw)": 2.181922197341919, "Full-pretrain/Step": 282, "Full-pretrain/Step Time": 17.665721667930484} +{"Full-pretrain/Learning Rate": 4.9475524475524476e-05, "Full-pretrain/Loss": 2.2311336994171143, "Full-pretrain/Loss (Raw)": 2.192309617996216, "Full-pretrain/Step": 283, "Full-pretrain/Step Time": 17.66783912666142} +{"Full-pretrain/Learning Rate": 4.9650349650349656e-05, "Full-pretrain/Loss": 2.2391772270202637, "Full-pretrain/Loss (Raw)": 2.206033945083618, "Full-pretrain/Step": 284, "Full-pretrain/Step Time": 17.66685999557376} +{"Full-pretrain/Learning Rate": 4.982517482517482e-05, "Full-pretrain/Loss": 2.2411537170410156, "Full-pretrain/Loss (Raw)": 2.299398899078369, "Full-pretrain/Step": 285, "Full-pretrain/Step Time": 17.670744813978672} +{"Full-pretrain/Learning Rate": 5e-05, "Full-pretrain/Loss": 2.2411553859710693, "Full-pretrain/Loss (Raw)": 2.4104812145233154, "Full-pretrain/Step": 286, "Full-pretrain/Step Time": 17.669895688071847} +{"Full-pretrain/Learning Rate": 4.99999985581294e-05, "Full-pretrain/Loss": 2.2333431243896484, "Full-pretrain/Loss (Raw)": 2.049384355545044, "Full-pretrain/Step": 287, "Full-pretrain/Step Time": 17.668655982241035} +{"Full-pretrain/Learning Rate": 4.9999994232517746e-05, "Full-pretrain/Loss": 2.235287666320801, "Full-pretrain/Loss (Raw)": 2.0708298683166504, "Full-pretrain/Step": 288, "Full-pretrain/Step Time": 17.665234867483377} +{"Full-pretrain/Learning Rate": 4.999998702316553e-05, "Full-pretrain/Loss": 2.2277002334594727, "Full-pretrain/Loss (Raw)": 2.069540500640869, "Full-pretrain/Step": 289, "Full-pretrain/Step Time": 17.6719679068774} +{"Full-pretrain/Learning Rate": 4.999997693007361e-05, "Full-pretrain/Loss": 2.2249855995178223, "Full-pretrain/Loss (Raw)": 2.165194034576416, "Full-pretrain/Step": 290, "Full-pretrain/Step Time": 17.67365050688386} +{"Full-pretrain/Learning Rate": 4.999996395324314e-05, "Full-pretrain/Loss": 2.229271411895752, "Full-pretrain/Loss (Raw)": 2.2193708419799805, "Full-pretrain/Step": 291, "Full-pretrain/Step Time": 17.668392995372415} +{"Full-pretrain/Learning Rate": 4.999994809267561e-05, "Full-pretrain/Loss": 2.2383599281311035, "Full-pretrain/Loss (Raw)": 2.312349796295166, "Full-pretrain/Step": 292, "Full-pretrain/Step Time": 17.66722335293889} +{"Full-pretrain/Learning Rate": 4.999992934837285e-05, "Full-pretrain/Loss": 2.2352304458618164, "Full-pretrain/Loss (Raw)": 2.1200857162475586, "Full-pretrain/Step": 293, "Full-pretrain/Step Time": 17.668465150520205} +{"Full-pretrain/Learning Rate": 4.9999907720337026e-05, "Full-pretrain/Loss": 2.2289233207702637, "Full-pretrain/Loss (Raw)": 2.2725095748901367, "Full-pretrain/Step": 294, "Full-pretrain/Step Time": 17.67075820825994} +{"Full-pretrain/Learning Rate": 4.999988320857063e-05, "Full-pretrain/Loss": 2.229548931121826, "Full-pretrain/Loss (Raw)": 2.314662456512451, "Full-pretrain/Step": 295, "Full-pretrain/Step Time": 17.671037206426263} +{"Full-pretrain/Learning Rate": 4.999985581307649e-05, "Full-pretrain/Loss": 2.22641658782959, "Full-pretrain/Loss (Raw)": 2.1107778549194336, "Full-pretrain/Step": 296, "Full-pretrain/Step Time": 17.669558737426996} +{"Full-pretrain/Learning Rate": 4.999982553385778e-05, "Full-pretrain/Loss": 2.2215070724487305, "Full-pretrain/Loss (Raw)": 2.0999670028686523, "Full-pretrain/Step": 297, "Full-pretrain/Step Time": 17.667061924934387} +{"Full-pretrain/Learning Rate": 4.999979237091797e-05, "Full-pretrain/Loss": 2.214339256286621, "Full-pretrain/Loss (Raw)": 2.1158435344696045, "Full-pretrain/Step": 298, "Full-pretrain/Step Time": 17.670249650254846} +{"Full-pretrain/Learning Rate": 4.99997563242609e-05, "Full-pretrain/Loss": 2.219111680984497, "Full-pretrain/Loss (Raw)": 2.2217860221862793, "Full-pretrain/Step": 299, "Full-pretrain/Step Time": 17.664211861789227} +{"Full-pretrain/Learning Rate": 4.999971739389072e-05, "Full-pretrain/Loss": 2.2187585830688477, "Full-pretrain/Loss (Raw)": 2.3004183769226074, "Full-pretrain/Step": 300, "Full-pretrain/Step Time": 17.660327369347215} +{"Full-pretrain/Learning Rate": 4.999967557981192e-05, "Full-pretrain/Loss": 2.2080297470092773, "Full-pretrain/Loss (Raw)": 1.8985304832458496, "Full-pretrain/Step": 301, "Full-pretrain/Step Time": 17.65896850451827} +{"Full-pretrain/Learning Rate": 4.999963088202934e-05, "Full-pretrain/Loss": 2.2136356830596924, "Full-pretrain/Loss (Raw)": 2.305713415145874, "Full-pretrain/Step": 302, "Full-pretrain/Step Time": 17.660407001152635} +{"Full-pretrain/Learning Rate": 4.9999583300548115e-05, "Full-pretrain/Loss": 2.213040828704834, "Full-pretrain/Loss (Raw)": 2.166013240814209, "Full-pretrain/Step": 303, "Full-pretrain/Step Time": 17.659842398017645} +{"Full-pretrain/Learning Rate": 4.9999532835373744e-05, "Full-pretrain/Loss": 2.2116074562072754, "Full-pretrain/Loss (Raw)": 2.116227388381958, "Full-pretrain/Step": 304, "Full-pretrain/Step Time": 17.648945806548} +{"Full-pretrain/Learning Rate": 4.999947948651204e-05, "Full-pretrain/Loss": 2.2100977897644043, "Full-pretrain/Loss (Raw)": 2.2996885776519775, "Full-pretrain/Step": 305, "Full-pretrain/Step Time": 17.649526512250304} +{"Full-pretrain/Learning Rate": 4.9999423253969166e-05, "Full-pretrain/Loss": 2.2137322425842285, "Full-pretrain/Loss (Raw)": 2.2405519485473633, "Full-pretrain/Step": 306, "Full-pretrain/Step Time": 17.648143181577325} +{"Full-pretrain/Learning Rate": 4.999936413775161e-05, "Full-pretrain/Loss": 2.2129721641540527, "Full-pretrain/Loss (Raw)": 2.319514274597168, "Full-pretrain/Step": 307, "Full-pretrain/Step Time": 17.648078011348844} +{"Full-pretrain/Learning Rate": 4.9999302137866186e-05, "Full-pretrain/Loss": 2.2162835597991943, "Full-pretrain/Loss (Raw)": 2.306520938873291, "Full-pretrain/Step": 308, "Full-pretrain/Step Time": 17.649292644113302} +{"Full-pretrain/Learning Rate": 4.999923725432004e-05, "Full-pretrain/Loss": 2.208204507827759, "Full-pretrain/Loss (Raw)": 2.177032232284546, "Full-pretrain/Step": 309, "Full-pretrain/Step Time": 17.64886467717588} +{"Full-pretrain/Learning Rate": 4.999916948712066e-05, "Full-pretrain/Loss": 2.204550266265869, "Full-pretrain/Loss (Raw)": 2.1874377727508545, "Full-pretrain/Step": 310, "Full-pretrain/Step Time": 17.648984245955944} +{"Full-pretrain/Learning Rate": 4.999909883627587e-05, "Full-pretrain/Loss": 2.201127529144287, "Full-pretrain/Loss (Raw)": 2.1954681873321533, "Full-pretrain/Step": 311, "Full-pretrain/Step Time": 17.645237093791366} +{"Full-pretrain/Learning Rate": 4.999902530179381e-05, "Full-pretrain/Loss": 2.2053654193878174, "Full-pretrain/Loss (Raw)": 2.2548184394836426, "Full-pretrain/Step": 312, "Full-pretrain/Step Time": 17.640948547050357} +{"Full-pretrain/Learning Rate": 4.999894888368297e-05, "Full-pretrain/Loss": 2.2024073600769043, "Full-pretrain/Loss (Raw)": 2.27665114402771, "Full-pretrain/Step": 313, "Full-pretrain/Step Time": 17.647460117936134} +{"Full-pretrain/Learning Rate": 4.9998869581952165e-05, "Full-pretrain/Loss": 2.2050065994262695, "Full-pretrain/Loss (Raw)": 2.2651004791259766, "Full-pretrain/Step": 314, "Full-pretrain/Step Time": 17.641582952812314} +{"Full-pretrain/Learning Rate": 4.999878739661054e-05, "Full-pretrain/Loss": 2.2064499855041504, "Full-pretrain/Loss (Raw)": 2.2384963035583496, "Full-pretrain/Step": 315, "Full-pretrain/Step Time": 17.64102110080421} +{"Full-pretrain/Learning Rate": 4.9998702327667565e-05, "Full-pretrain/Loss": 2.2035953998565674, "Full-pretrain/Loss (Raw)": 2.1146883964538574, "Full-pretrain/Step": 316, "Full-pretrain/Step Time": 17.627935143187642} +{"Full-pretrain/Learning Rate": 4.999861437513307e-05, "Full-pretrain/Loss": 2.193246364593506, "Full-pretrain/Loss (Raw)": 1.968224048614502, "Full-pretrain/Step": 317, "Full-pretrain/Step Time": 17.635518841445446} +{"Full-pretrain/Learning Rate": 4.999852353901719e-05, "Full-pretrain/Loss": 2.1907477378845215, "Full-pretrain/Loss (Raw)": 2.3305280208587646, "Full-pretrain/Step": 318, "Full-pretrain/Step Time": 17.638352155685425} +{"Full-pretrain/Learning Rate": 4.999842981933041e-05, "Full-pretrain/Loss": 2.19085431098938, "Full-pretrain/Loss (Raw)": 2.052795648574829, "Full-pretrain/Step": 319, "Full-pretrain/Step Time": 17.63344614394009} +{"Full-pretrain/Learning Rate": 4.999833321608352e-05, "Full-pretrain/Loss": 2.1918952465057373, "Full-pretrain/Loss (Raw)": 2.1041440963745117, "Full-pretrain/Step": 320, "Full-pretrain/Step Time": 17.632964681833982} +{"Full-pretrain/Learning Rate": 4.999823372928769e-05, "Full-pretrain/Loss": 2.1972570419311523, "Full-pretrain/Loss (Raw)": 2.2411093711853027, "Full-pretrain/Step": 321, "Full-pretrain/Step Time": 17.639181070029736} +{"Full-pretrain/Learning Rate": 4.999813135895438e-05, "Full-pretrain/Loss": 2.198660373687744, "Full-pretrain/Loss (Raw)": 2.2101058959960938, "Full-pretrain/Step": 322, "Full-pretrain/Step Time": 17.63980907201767} +{"Full-pretrain/Learning Rate": 4.9998026105095405e-05, "Full-pretrain/Loss": 2.1960363388061523, "Full-pretrain/Loss (Raw)": 2.1354050636291504, "Full-pretrain/Step": 323, "Full-pretrain/Step Time": 17.635757002979517} +{"Full-pretrain/Learning Rate": 4.999791796772291e-05, "Full-pretrain/Loss": 2.18881893157959, "Full-pretrain/Loss (Raw)": 2.081395387649536, "Full-pretrain/Step": 324, "Full-pretrain/Step Time": 17.640092259272933} +{"Full-pretrain/Learning Rate": 4.999780694684934e-05, "Full-pretrain/Loss": 2.1935667991638184, "Full-pretrain/Loss (Raw)": 2.272010326385498, "Full-pretrain/Step": 325, "Full-pretrain/Step Time": 17.645765585824847} +{"Full-pretrain/Learning Rate": 4.999769304248755e-05, "Full-pretrain/Loss": 2.1839332580566406, "Full-pretrain/Loss (Raw)": 1.9642393589019775, "Full-pretrain/Step": 326, "Full-pretrain/Step Time": 17.650068992748857} +{"Full-pretrain/Learning Rate": 4.9997576254650635e-05, "Full-pretrain/Loss": 2.179645538330078, "Full-pretrain/Loss (Raw)": 2.1774563789367676, "Full-pretrain/Step": 327, "Full-pretrain/Step Time": 17.644596207886934} +{"Full-pretrain/Learning Rate": 4.9997456583352096e-05, "Full-pretrain/Loss": 2.17979097366333, "Full-pretrain/Loss (Raw)": 2.115432024002075, "Full-pretrain/Step": 328, "Full-pretrain/Step Time": 17.64874397777021} +{"Full-pretrain/Learning Rate": 4.999733402860572e-05, "Full-pretrain/Loss": 2.182776927947998, "Full-pretrain/Loss (Raw)": 2.195514678955078, "Full-pretrain/Step": 329, "Full-pretrain/Step Time": 17.645085694268346} +{"Full-pretrain/Learning Rate": 4.999720859042565e-05, "Full-pretrain/Loss": 2.1829025745391846, "Full-pretrain/Loss (Raw)": 2.1198666095733643, "Full-pretrain/Step": 330, "Full-pretrain/Step Time": 17.638209046795964} +{"Full-pretrain/Learning Rate": 4.9997080268826344e-05, "Full-pretrain/Loss": 2.1826906204223633, "Full-pretrain/Loss (Raw)": 2.214996814727783, "Full-pretrain/Step": 331, "Full-pretrain/Step Time": 17.639521803706884} +{"Full-pretrain/Learning Rate": 4.999694906382262e-05, "Full-pretrain/Loss": 2.1780266761779785, "Full-pretrain/Loss (Raw)": 2.1511759757995605, "Full-pretrain/Step": 332, "Full-pretrain/Step Time": 17.642311487346888} +{"Full-pretrain/Learning Rate": 4.9996814975429604e-05, "Full-pretrain/Loss": 2.187446117401123, "Full-pretrain/Loss (Raw)": 2.1999495029449463, "Full-pretrain/Step": 333, "Full-pretrain/Step Time": 17.64217366464436} +{"Full-pretrain/Learning Rate": 4.9996678003662776e-05, "Full-pretrain/Loss": 2.1819543838500977, "Full-pretrain/Loss (Raw)": 2.12998366355896, "Full-pretrain/Step": 334, "Full-pretrain/Step Time": 17.643882788717747} +{"Full-pretrain/Learning Rate": 4.999653814853791e-05, "Full-pretrain/Loss": 2.183450222015381, "Full-pretrain/Loss (Raw)": 2.2138800621032715, "Full-pretrain/Step": 335, "Full-pretrain/Step Time": 17.641540491953492} +{"Full-pretrain/Learning Rate": 4.999639541007116e-05, "Full-pretrain/Loss": 2.1829700469970703, "Full-pretrain/Loss (Raw)": 2.100855827331543, "Full-pretrain/Step": 336, "Full-pretrain/Step Time": 17.642106195911765} +{"Full-pretrain/Learning Rate": 4.999624978827899e-05, "Full-pretrain/Loss": 2.1793675422668457, "Full-pretrain/Loss (Raw)": 2.1844141483306885, "Full-pretrain/Step": 337, "Full-pretrain/Step Time": 17.64018694497645} +{"Full-pretrain/Learning Rate": 4.999610128317818e-05, "Full-pretrain/Loss": 2.1771485805511475, "Full-pretrain/Loss (Raw)": 2.1695473194122314, "Full-pretrain/Step": 338, "Full-pretrain/Step Time": 17.642082987353206} +{"Full-pretrain/Learning Rate": 4.9995949894785874e-05, "Full-pretrain/Loss": 2.17581844329834, "Full-pretrain/Loss (Raw)": 2.2769412994384766, "Full-pretrain/Step": 339, "Full-pretrain/Step Time": 17.64310336485505} +{"Full-pretrain/Learning Rate": 4.9995795623119537e-05, "Full-pretrain/Loss": 2.175666570663452, "Full-pretrain/Loss (Raw)": 2.301666736602783, "Full-pretrain/Step": 340, "Full-pretrain/Step Time": 17.640380267053843} +{"Full-pretrain/Learning Rate": 4.999563846819696e-05, "Full-pretrain/Loss": 2.178757667541504, "Full-pretrain/Loss (Raw)": 2.2759411334991455, "Full-pretrain/Step": 341, "Full-pretrain/Step Time": 17.636882008984685} +{"Full-pretrain/Learning Rate": 4.999547843003626e-05, "Full-pretrain/Loss": 2.181117057800293, "Full-pretrain/Loss (Raw)": 2.262948513031006, "Full-pretrain/Step": 342, "Full-pretrain/Step Time": 17.634649666026235} +{"Full-pretrain/Learning Rate": 4.9995315508655916e-05, "Full-pretrain/Loss": 2.1801252365112305, "Full-pretrain/Loss (Raw)": 2.163721799850464, "Full-pretrain/Step": 343, "Full-pretrain/Step Time": 17.63148015551269} +{"Full-pretrain/Learning Rate": 4.99951497040747e-05, "Full-pretrain/Loss": 2.1737136840820312, "Full-pretrain/Loss (Raw)": 2.0496506690979004, "Full-pretrain/Step": 344, "Full-pretrain/Step Time": 17.624766232445836} +{"Full-pretrain/Learning Rate": 4.999498101631177e-05, "Full-pretrain/Loss": 2.1712865829467773, "Full-pretrain/Loss (Raw)": 2.198983669281006, "Full-pretrain/Step": 345, "Full-pretrain/Step Time": 17.628814794123173} +{"Full-pretrain/Learning Rate": 4.999480944538655e-05, "Full-pretrain/Loss": 2.166534423828125, "Full-pretrain/Loss (Raw)": 2.1130404472351074, "Full-pretrain/Step": 346, "Full-pretrain/Step Time": 17.624167378991842} +{"Full-pretrain/Learning Rate": 4.999463499131885e-05, "Full-pretrain/Loss": 2.169116258621216, "Full-pretrain/Loss (Raw)": 2.3211052417755127, "Full-pretrain/Step": 347, "Full-pretrain/Step Time": 17.620049502700567} +{"Full-pretrain/Learning Rate": 4.9994457654128776e-05, "Full-pretrain/Loss": 2.178349494934082, "Full-pretrain/Loss (Raw)": 2.410153388977051, "Full-pretrain/Step": 348, "Full-pretrain/Step Time": 17.619513535872102} +{"Full-pretrain/Learning Rate": 4.99942774338368e-05, "Full-pretrain/Loss": 2.187595844268799, "Full-pretrain/Loss (Raw)": 2.264110565185547, "Full-pretrain/Step": 349, "Full-pretrain/Step Time": 17.616378996521235} +{"Full-pretrain/Learning Rate": 4.999409433046372e-05, "Full-pretrain/Loss": 2.1841273307800293, "Full-pretrain/Loss (Raw)": 2.219534158706665, "Full-pretrain/Step": 350, "Full-pretrain/Step Time": 17.61587398312986} +{"Full-pretrain/Learning Rate": 4.999390834403063e-05, "Full-pretrain/Loss": 2.1829001903533936, "Full-pretrain/Loss (Raw)": 2.013522148132324, "Full-pretrain/Step": 351, "Full-pretrain/Step Time": 17.61675265803933} +{"Full-pretrain/Learning Rate": 4.999371947455899e-05, "Full-pretrain/Loss": 2.186985969543457, "Full-pretrain/Loss (Raw)": 2.234891653060913, "Full-pretrain/Step": 352, "Full-pretrain/Step Time": 17.61667519621551} +{"Full-pretrain/Learning Rate": 4.99935277220706e-05, "Full-pretrain/Loss": 2.183155059814453, "Full-pretrain/Loss (Raw)": 2.118523120880127, "Full-pretrain/Step": 353, "Full-pretrain/Step Time": 17.613752283155918} +{"Full-pretrain/Learning Rate": 4.999333308658757e-05, "Full-pretrain/Loss": 2.1829066276550293, "Full-pretrain/Loss (Raw)": 2.2021560668945312, "Full-pretrain/Step": 354, "Full-pretrain/Step Time": 17.612115755677223} +{"Full-pretrain/Learning Rate": 4.999313556813236e-05, "Full-pretrain/Loss": 2.186643123626709, "Full-pretrain/Loss (Raw)": 2.2549707889556885, "Full-pretrain/Step": 355, "Full-pretrain/Step Time": 17.621026718989015} +{"Full-pretrain/Learning Rate": 4.9992935166727725e-05, "Full-pretrain/Loss": 2.1860969066619873, "Full-pretrain/Loss (Raw)": 2.063915252685547, "Full-pretrain/Step": 356, "Full-pretrain/Step Time": 17.624138075858355} +{"Full-pretrain/Learning Rate": 4.9992731882396815e-05, "Full-pretrain/Loss": 2.1800715923309326, "Full-pretrain/Loss (Raw)": 2.07920503616333, "Full-pretrain/Step": 357, "Full-pretrain/Step Time": 17.617287488654256} +{"Full-pretrain/Learning Rate": 4.9992525715163065e-05, "Full-pretrain/Loss": 2.182249069213867, "Full-pretrain/Loss (Raw)": 2.033916473388672, "Full-pretrain/Step": 358, "Full-pretrain/Step Time": 17.612282432615757} +{"Full-pretrain/Learning Rate": 4.999231666505025e-05, "Full-pretrain/Loss": 2.1826236248016357, "Full-pretrain/Loss (Raw)": 2.189445972442627, "Full-pretrain/Step": 359, "Full-pretrain/Step Time": 17.612126974388957} +{"Full-pretrain/Learning Rate": 4.99921047320825e-05, "Full-pretrain/Loss": 2.18003511428833, "Full-pretrain/Loss (Raw)": 2.0325937271118164, "Full-pretrain/Step": 360, "Full-pretrain/Step Time": 17.619445372372866} +{"Full-pretrain/Learning Rate": 4.999188991628425e-05, "Full-pretrain/Loss": 2.1816623210906982, "Full-pretrain/Loss (Raw)": 2.247586488723755, "Full-pretrain/Step": 361, "Full-pretrain/Step Time": 17.618135053664446} +{"Full-pretrain/Learning Rate": 4.999167221768028e-05, "Full-pretrain/Loss": 2.18328857421875, "Full-pretrain/Loss (Raw)": 2.171901226043701, "Full-pretrain/Step": 362, "Full-pretrain/Step Time": 17.619305312633514} +{"Full-pretrain/Learning Rate": 4.99914516362957e-05, "Full-pretrain/Loss": 2.183415412902832, "Full-pretrain/Loss (Raw)": 2.2190611362457275, "Full-pretrain/Step": 363, "Full-pretrain/Step Time": 17.618505099788308} +{"Full-pretrain/Learning Rate": 4.999122817215596e-05, "Full-pretrain/Loss": 2.188706874847412, "Full-pretrain/Loss (Raw)": 2.320504665374756, "Full-pretrain/Step": 364, "Full-pretrain/Step Time": 17.62112132832408} +{"Full-pretrain/Learning Rate": 4.999100182528683e-05, "Full-pretrain/Loss": 2.191094398498535, "Full-pretrain/Loss (Raw)": 2.2763476371765137, "Full-pretrain/Step": 365, "Full-pretrain/Step Time": 17.613087937235832} +{"Full-pretrain/Learning Rate": 4.999077259571442e-05, "Full-pretrain/Loss": 2.1875953674316406, "Full-pretrain/Loss (Raw)": 2.0180110931396484, "Full-pretrain/Step": 366, "Full-pretrain/Step Time": 17.611185736954212} +{"Full-pretrain/Learning Rate": 4.9990540483465174e-05, "Full-pretrain/Loss": 2.1881444454193115, "Full-pretrain/Loss (Raw)": 2.2314517498016357, "Full-pretrain/Step": 367, "Full-pretrain/Step Time": 17.611975990235806} +{"Full-pretrain/Learning Rate": 4.999030548856587e-05, "Full-pretrain/Loss": 2.186957836151123, "Full-pretrain/Loss (Raw)": 2.062885046005249, "Full-pretrain/Step": 368, "Full-pretrain/Step Time": 17.6139061357826} +{"Full-pretrain/Learning Rate": 4.999006761104361e-05, "Full-pretrain/Loss": 2.180166721343994, "Full-pretrain/Loss (Raw)": 1.967104434967041, "Full-pretrain/Step": 369, "Full-pretrain/Step Time": 17.615313982591033} +{"Full-pretrain/Learning Rate": 4.998982685092583e-05, "Full-pretrain/Loss": 2.178884744644165, "Full-pretrain/Loss (Raw)": 2.128519058227539, "Full-pretrain/Step": 370, "Full-pretrain/Step Time": 17.60846314765513} +{"Full-pretrain/Learning Rate": 4.998958320824031e-05, "Full-pretrain/Loss": 2.1677353382110596, "Full-pretrain/Loss (Raw)": 1.9201658964157104, "Full-pretrain/Step": 371, "Full-pretrain/Step Time": 17.604289084672928} +{"Full-pretrain/Learning Rate": 4.9989336683015145e-05, "Full-pretrain/Loss": 2.1640729904174805, "Full-pretrain/Loss (Raw)": 2.1844677925109863, "Full-pretrain/Step": 372, "Full-pretrain/Step Time": 17.60571894608438} +{"Full-pretrain/Learning Rate": 4.9989087275278766e-05, "Full-pretrain/Loss": 2.1562283039093018, "Full-pretrain/Loss (Raw)": 2.0249125957489014, "Full-pretrain/Step": 373, "Full-pretrain/Step Time": 17.602112859487534} +{"Full-pretrain/Learning Rate": 4.9988834985059966e-05, "Full-pretrain/Loss": 2.1498913764953613, "Full-pretrain/Loss (Raw)": 2.0601654052734375, "Full-pretrain/Step": 374, "Full-pretrain/Step Time": 17.600481498986483} +{"Full-pretrain/Learning Rate": 4.998857981238782e-05, "Full-pretrain/Loss": 2.1463260650634766, "Full-pretrain/Loss (Raw)": 2.0496344566345215, "Full-pretrain/Step": 375, "Full-pretrain/Step Time": 17.60013189725578} +{"Full-pretrain/Learning Rate": 4.9988321757291786e-05, "Full-pretrain/Loss": 2.1520538330078125, "Full-pretrain/Loss (Raw)": 2.232938289642334, "Full-pretrain/Step": 376, "Full-pretrain/Step Time": 17.59848141297698} +{"Full-pretrain/Learning Rate": 4.998806081980162e-05, "Full-pretrain/Loss": 2.1461844444274902, "Full-pretrain/Loss (Raw)": 2.0111632347106934, "Full-pretrain/Step": 377, "Full-pretrain/Step Time": 17.60090043209493} +{"Full-pretrain/Learning Rate": 4.998779699994741e-05, "Full-pretrain/Loss": 2.1581027507781982, "Full-pretrain/Loss (Raw)": 2.4944214820861816, "Full-pretrain/Step": 378, "Full-pretrain/Step Time": 17.59670232795179} +{"Full-pretrain/Learning Rate": 4.99875302977596e-05, "Full-pretrain/Loss": 2.145836353302002, "Full-pretrain/Loss (Raw)": 1.9285824298858643, "Full-pretrain/Step": 379, "Full-pretrain/Step Time": 17.595543263480067} +{"Full-pretrain/Learning Rate": 4.9987260713268954e-05, "Full-pretrain/Loss": 2.1329526901245117, "Full-pretrain/Loss (Raw)": 1.997872233390808, "Full-pretrain/Step": 380, "Full-pretrain/Step Time": 17.592935658991337} +{"Full-pretrain/Learning Rate": 4.998698824650656e-05, "Full-pretrain/Loss": 2.136721611022949, "Full-pretrain/Loss (Raw)": 2.3847174644470215, "Full-pretrain/Step": 381, "Full-pretrain/Step Time": 17.595982803031802} +{"Full-pretrain/Learning Rate": 4.998671289750386e-05, "Full-pretrain/Loss": 2.1340744495391846, "Full-pretrain/Loss (Raw)": 2.1348252296447754, "Full-pretrain/Step": 382, "Full-pretrain/Step Time": 17.58984251692891} +{"Full-pretrain/Learning Rate": 4.998643466629261e-05, "Full-pretrain/Loss": 2.135531425476074, "Full-pretrain/Loss (Raw)": 2.0601532459259033, "Full-pretrain/Step": 383, "Full-pretrain/Step Time": 17.584779342636466} +{"Full-pretrain/Learning Rate": 4.9986153552904894e-05, "Full-pretrain/Loss": 2.1355204582214355, "Full-pretrain/Loss (Raw)": 2.2345409393310547, "Full-pretrain/Step": 384, "Full-pretrain/Step Time": 17.581577060744166} +{"Full-pretrain/Learning Rate": 4.998586955737315e-05, "Full-pretrain/Loss": 2.1437766551971436, "Full-pretrain/Loss (Raw)": 2.382716417312622, "Full-pretrain/Step": 385, "Full-pretrain/Step Time": 17.57923761755228} +{"Full-pretrain/Learning Rate": 4.998558267973014e-05, "Full-pretrain/Loss": 2.1359283924102783, "Full-pretrain/Loss (Raw)": 1.9510133266448975, "Full-pretrain/Step": 386, "Full-pretrain/Step Time": 17.58164196461439} +{"Full-pretrain/Learning Rate": 4.998529292000894e-05, "Full-pretrain/Loss": 2.1353988647460938, "Full-pretrain/Loss (Raw)": 2.2380247116088867, "Full-pretrain/Step": 387, "Full-pretrain/Step Time": 17.570862950757146} +{"Full-pretrain/Learning Rate": 4.9985000278242974e-05, "Full-pretrain/Loss": 2.1388447284698486, "Full-pretrain/Loss (Raw)": 2.1741833686828613, "Full-pretrain/Step": 388, "Full-pretrain/Step Time": 17.57516391016543} +{"Full-pretrain/Learning Rate": 4.998470475446602e-05, "Full-pretrain/Loss": 2.146148681640625, "Full-pretrain/Loss (Raw)": 2.3129372596740723, "Full-pretrain/Step": 389, "Full-pretrain/Step Time": 17.56657106988132} +{"Full-pretrain/Learning Rate": 4.998440634871215e-05, "Full-pretrain/Loss": 2.1519718170166016, "Full-pretrain/Loss (Raw)": 2.2202515602111816, "Full-pretrain/Step": 390, "Full-pretrain/Step Time": 17.567183196544647} +{"Full-pretrain/Learning Rate": 4.998410506101578e-05, "Full-pretrain/Loss": 2.1474599838256836, "Full-pretrain/Loss (Raw)": 2.0450727939605713, "Full-pretrain/Step": 391, "Full-pretrain/Step Time": 17.556075962260365} +{"Full-pretrain/Learning Rate": 4.998380089141169e-05, "Full-pretrain/Loss": 2.1435623168945312, "Full-pretrain/Loss (Raw)": 1.9078662395477295, "Full-pretrain/Step": 392, "Full-pretrain/Step Time": 17.559836076572537} +{"Full-pretrain/Learning Rate": 4.998349383993493e-05, "Full-pretrain/Loss": 2.1465377807617188, "Full-pretrain/Loss (Raw)": 2.342801332473755, "Full-pretrain/Step": 393, "Full-pretrain/Step Time": 17.556784853339195} +{"Full-pretrain/Learning Rate": 4.998318390662094e-05, "Full-pretrain/Loss": 2.1477508544921875, "Full-pretrain/Loss (Raw)": 2.21071195602417, "Full-pretrain/Step": 394, "Full-pretrain/Step Time": 17.555174697190523} +{"Full-pretrain/Learning Rate": 4.998287109150547e-05, "Full-pretrain/Loss": 2.14414119720459, "Full-pretrain/Loss (Raw)": 2.1035568714141846, "Full-pretrain/Step": 395, "Full-pretrain/Step Time": 17.549683686345816} +{"Full-pretrain/Learning Rate": 4.9982555394624595e-05, "Full-pretrain/Loss": 2.1400012969970703, "Full-pretrain/Loss (Raw)": 2.1880195140838623, "Full-pretrain/Step": 396, "Full-pretrain/Step Time": 17.5522339399904} +{"Full-pretrain/Learning Rate": 4.998223681601473e-05, "Full-pretrain/Loss": 2.1373391151428223, "Full-pretrain/Loss (Raw)": 2.1911544799804688, "Full-pretrain/Step": 397, "Full-pretrain/Step Time": 17.551761461421847} +{"Full-pretrain/Learning Rate": 4.9981915355712636e-05, "Full-pretrain/Loss": 2.14141845703125, "Full-pretrain/Loss (Raw)": 2.1485533714294434, "Full-pretrain/Step": 398, "Full-pretrain/Step Time": 17.545711843296885} +{"Full-pretrain/Learning Rate": 4.998159101375538e-05, "Full-pretrain/Loss": 2.135833978652954, "Full-pretrain/Loss (Raw)": 2.0527544021606445, "Full-pretrain/Step": 399, "Full-pretrain/Step Time": 17.540060887113214} +{"Full-pretrain/Learning Rate": 4.998126379018039e-05, "Full-pretrain/Loss": 2.1406655311584473, "Full-pretrain/Loss (Raw)": 2.2174954414367676, "Full-pretrain/Step": 400, "Full-pretrain/Step Time": 17.545658888295293} +{"Full-pretrain/Learning Rate": 4.9980933685025385e-05, "Full-pretrain/Loss": 2.1402781009674072, "Full-pretrain/Loss (Raw)": 1.9547038078308105, "Full-pretrain/Step": 401, "Full-pretrain/Step Time": 17.543396644294262} +{"Full-pretrain/Learning Rate": 4.998060069832847e-05, "Full-pretrain/Loss": 2.1480722427368164, "Full-pretrain/Loss (Raw)": 2.3779311180114746, "Full-pretrain/Step": 402, "Full-pretrain/Step Time": 17.540782479569316} +{"Full-pretrain/Learning Rate": 4.9980264830128035e-05, "Full-pretrain/Loss": 2.1579294204711914, "Full-pretrain/Loss (Raw)": 2.2355942726135254, "Full-pretrain/Step": 403, "Full-pretrain/Step Time": 17.536581909283996} +{"Full-pretrain/Learning Rate": 4.9979926080462834e-05, "Full-pretrain/Loss": 2.1498312950134277, "Full-pretrain/Loss (Raw)": 1.9253365993499756, "Full-pretrain/Step": 404, "Full-pretrain/Step Time": 17.533545829355717} +{"Full-pretrain/Learning Rate": 4.997958444937194e-05, "Full-pretrain/Loss": 2.153622627258301, "Full-pretrain/Loss (Raw)": 2.146230697631836, "Full-pretrain/Step": 405, "Full-pretrain/Step Time": 17.53466052748263} +{"Full-pretrain/Learning Rate": 4.9979239936894765e-05, "Full-pretrain/Loss": 2.1599984169006348, "Full-pretrain/Loss (Raw)": 2.2641916275024414, "Full-pretrain/Step": 406, "Full-pretrain/Step Time": 17.53682160936296} +{"Full-pretrain/Learning Rate": 4.997889254307103e-05, "Full-pretrain/Loss": 2.1716790199279785, "Full-pretrain/Loss (Raw)": 2.4234137535095215, "Full-pretrain/Step": 407, "Full-pretrain/Step Time": 17.533499678596854} +{"Full-pretrain/Learning Rate": 4.997854226794082e-05, "Full-pretrain/Loss": 2.1713781356811523, "Full-pretrain/Loss (Raw)": 2.2233080863952637, "Full-pretrain/Step": 408, "Full-pretrain/Step Time": 17.53686454333365} +{"Full-pretrain/Learning Rate": 4.997818911154454e-05, "Full-pretrain/Loss": 2.1715729236602783, "Full-pretrain/Loss (Raw)": 2.017394542694092, "Full-pretrain/Step": 409, "Full-pretrain/Step Time": 17.54037146642804} +{"Full-pretrain/Learning Rate": 4.997783307392292e-05, "Full-pretrain/Loss": 2.154414653778076, "Full-pretrain/Loss (Raw)": 1.9453566074371338, "Full-pretrain/Step": 410, "Full-pretrain/Step Time": 17.535956289619207} +{"Full-pretrain/Learning Rate": 4.9977474155117045e-05, "Full-pretrain/Loss": 2.1536734104156494, "Full-pretrain/Loss (Raw)": 1.9048608541488647, "Full-pretrain/Step": 411, "Full-pretrain/Step Time": 17.536027604714036} +{"Full-pretrain/Learning Rate": 4.9977112355168286e-05, "Full-pretrain/Loss": 2.1547188758850098, "Full-pretrain/Loss (Raw)": 2.0313382148742676, "Full-pretrain/Step": 412, "Full-pretrain/Step Time": 17.534599551931024} +{"Full-pretrain/Learning Rate": 4.997674767411841e-05, "Full-pretrain/Loss": 2.156765937805176, "Full-pretrain/Loss (Raw)": 2.4502174854278564, "Full-pretrain/Step": 413, "Full-pretrain/Step Time": 17.534165089949965} +{"Full-pretrain/Learning Rate": 4.997638011200946e-05, "Full-pretrain/Loss": 2.158466339111328, "Full-pretrain/Loss (Raw)": 2.189234733581543, "Full-pretrain/Step": 414, "Full-pretrain/Step Time": 17.536088990047574} +{"Full-pretrain/Learning Rate": 4.997600966888384e-05, "Full-pretrain/Loss": 2.160496950149536, "Full-pretrain/Loss (Raw)": 2.1251327991485596, "Full-pretrain/Step": 415, "Full-pretrain/Step Time": 17.533223131671548} +{"Full-pretrain/Learning Rate": 4.997563634478428e-05, "Full-pretrain/Loss": 2.159311056137085, "Full-pretrain/Loss (Raw)": 2.1965928077697754, "Full-pretrain/Step": 416, "Full-pretrain/Step Time": 17.536238476634026} +{"Full-pretrain/Learning Rate": 4.9975260139753856e-05, "Full-pretrain/Loss": 2.1475391387939453, "Full-pretrain/Loss (Raw)": 2.0060126781463623, "Full-pretrain/Step": 417, "Full-pretrain/Step Time": 17.531400062143803} +{"Full-pretrain/Learning Rate": 4.997488105383594e-05, "Full-pretrain/Loss": 2.1549150943756104, "Full-pretrain/Loss (Raw)": 2.1870439052581787, "Full-pretrain/Step": 418, "Full-pretrain/Step Time": 17.52880983427167} +{"Full-pretrain/Learning Rate": 4.997449908707428e-05, "Full-pretrain/Loss": 2.1470320224761963, "Full-pretrain/Loss (Raw)": 1.9857678413391113, "Full-pretrain/Step": 419, "Full-pretrain/Step Time": 17.53065087646246} +{"Full-pretrain/Learning Rate": 4.997411423951292e-05, "Full-pretrain/Loss": 2.1433217525482178, "Full-pretrain/Loss (Raw)": 2.0554513931274414, "Full-pretrain/Step": 420, "Full-pretrain/Step Time": 17.527226792648435} +{"Full-pretrain/Learning Rate": 4.997372651119626e-05, "Full-pretrain/Loss": 2.133510112762451, "Full-pretrain/Loss (Raw)": 1.9989649057388306, "Full-pretrain/Step": 421, "Full-pretrain/Step Time": 17.527248604223132} +{"Full-pretrain/Learning Rate": 4.9973335902169026e-05, "Full-pretrain/Loss": 2.129368782043457, "Full-pretrain/Loss (Raw)": 2.0877342224121094, "Full-pretrain/Step": 422, "Full-pretrain/Step Time": 17.52677822113037} +{"Full-pretrain/Learning Rate": 4.997294241247628e-05, "Full-pretrain/Loss": 2.131094455718994, "Full-pretrain/Loss (Raw)": 2.100295066833496, "Full-pretrain/Step": 423, "Full-pretrain/Step Time": 17.521020395681262} +{"Full-pretrain/Learning Rate": 4.9972546042163385e-05, "Full-pretrain/Loss": 2.1357858180999756, "Full-pretrain/Loss (Raw)": 2.057983875274658, "Full-pretrain/Step": 424, "Full-pretrain/Step Time": 17.51940586976707} +{"Full-pretrain/Learning Rate": 4.997214679127608e-05, "Full-pretrain/Loss": 2.1397058963775635, "Full-pretrain/Loss (Raw)": 2.4682457447052, "Full-pretrain/Step": 425, "Full-pretrain/Step Time": 17.51874008961022} +{"Full-pretrain/Learning Rate": 4.997174465986044e-05, "Full-pretrain/Loss": 2.1392159461975098, "Full-pretrain/Loss (Raw)": 2.1950416564941406, "Full-pretrain/Step": 426, "Full-pretrain/Step Time": 17.521085876971483} +{"Full-pretrain/Learning Rate": 4.997133964796281e-05, "Full-pretrain/Loss": 2.13930082321167, "Full-pretrain/Loss (Raw)": 2.1062700748443604, "Full-pretrain/Step": 427, "Full-pretrain/Step Time": 17.521364444866776} +{"Full-pretrain/Learning Rate": 4.997093175562994e-05, "Full-pretrain/Loss": 2.138502597808838, "Full-pretrain/Loss (Raw)": 2.1624703407287598, "Full-pretrain/Step": 428, "Full-pretrain/Step Time": 17.515519397333264} +{"Full-pretrain/Learning Rate": 4.997052098290886e-05, "Full-pretrain/Loss": 2.135822057723999, "Full-pretrain/Loss (Raw)": 2.1053781509399414, "Full-pretrain/Step": 429, "Full-pretrain/Step Time": 17.51840803399682} +{"Full-pretrain/Learning Rate": 4.997010732984696e-05, "Full-pretrain/Loss": 2.135004997253418, "Full-pretrain/Loss (Raw)": 2.1224095821380615, "Full-pretrain/Step": 430, "Full-pretrain/Step Time": 17.518538035452366} +{"Full-pretrain/Learning Rate": 4.996969079649195e-05, "Full-pretrain/Loss": 2.1328248977661133, "Full-pretrain/Loss (Raw)": 1.9829890727996826, "Full-pretrain/Step": 431, "Full-pretrain/Step Time": 17.5221089720726} +{"Full-pretrain/Learning Rate": 4.996927138289189e-05, "Full-pretrain/Loss": 2.1361045837402344, "Full-pretrain/Loss (Raw)": 2.322453022003174, "Full-pretrain/Step": 432, "Full-pretrain/Step Time": 17.522650385275483} +{"Full-pretrain/Learning Rate": 4.996884908909515e-05, "Full-pretrain/Loss": 2.144843101501465, "Full-pretrain/Loss (Raw)": 2.2343363761901855, "Full-pretrain/Step": 433, "Full-pretrain/Step Time": 17.520301066339016} +{"Full-pretrain/Learning Rate": 4.996842391515044e-05, "Full-pretrain/Loss": 2.1322860717773438, "Full-pretrain/Loss (Raw)": 1.9761037826538086, "Full-pretrain/Step": 434, "Full-pretrain/Step Time": 17.525248112156987} +{"Full-pretrain/Learning Rate": 4.9967995861106806e-05, "Full-pretrain/Loss": 2.126277208328247, "Full-pretrain/Loss (Raw)": 2.0433101654052734, "Full-pretrain/Step": 435, "Full-pretrain/Step Time": 17.52660552226007} +{"Full-pretrain/Learning Rate": 4.996756492701362e-05, "Full-pretrain/Loss": 2.1366822719573975, "Full-pretrain/Loss (Raw)": 2.25830078125, "Full-pretrain/Step": 436, "Full-pretrain/Step Time": 17.523318266496062} +{"Full-pretrain/Learning Rate": 4.99671311129206e-05, "Full-pretrain/Loss": 2.1423864364624023, "Full-pretrain/Loss (Raw)": 2.328763961791992, "Full-pretrain/Step": 437, "Full-pretrain/Step Time": 17.51794433221221} +{"Full-pretrain/Learning Rate": 4.9966694418877776e-05, "Full-pretrain/Loss": 2.1382970809936523, "Full-pretrain/Loss (Raw)": 2.1333346366882324, "Full-pretrain/Step": 438, "Full-pretrain/Step Time": 17.51859119348228} +{"Full-pretrain/Learning Rate": 4.9966254844935535e-05, "Full-pretrain/Loss": 2.129864454269409, "Full-pretrain/Loss (Raw)": 2.153571128845215, "Full-pretrain/Step": 439, "Full-pretrain/Step Time": 17.525389160960913} +{"Full-pretrain/Learning Rate": 4.996581239114456e-05, "Full-pretrain/Loss": 2.126169443130493, "Full-pretrain/Loss (Raw)": 2.1050608158111572, "Full-pretrain/Step": 440, "Full-pretrain/Step Time": 17.528009036555886} +{"Full-pretrain/Learning Rate": 4.99653670575559e-05, "Full-pretrain/Loss": 2.1306838989257812, "Full-pretrain/Loss (Raw)": 2.1618542671203613, "Full-pretrain/Step": 441, "Full-pretrain/Step Time": 17.520944729447365} +{"Full-pretrain/Learning Rate": 4.996491884422093e-05, "Full-pretrain/Loss": 2.1338937282562256, "Full-pretrain/Loss (Raw)": 2.0480759143829346, "Full-pretrain/Step": 442, "Full-pretrain/Step Time": 17.527884433045983} +{"Full-pretrain/Learning Rate": 4.9964467751191334e-05, "Full-pretrain/Loss": 2.1418280601501465, "Full-pretrain/Loss (Raw)": 2.158757209777832, "Full-pretrain/Step": 443, "Full-pretrain/Step Time": 17.527844158932567} +{"Full-pretrain/Learning Rate": 4.996401377851916e-05, "Full-pretrain/Loss": 2.1454310417175293, "Full-pretrain/Loss (Raw)": 2.1466355323791504, "Full-pretrain/Step": 444, "Full-pretrain/Step Time": 17.53154785372317} +{"Full-pretrain/Learning Rate": 4.9963556926256776e-05, "Full-pretrain/Loss": 2.136780023574829, "Full-pretrain/Loss (Raw)": 2.173384428024292, "Full-pretrain/Step": 445, "Full-pretrain/Step Time": 17.523927798494697} +{"Full-pretrain/Learning Rate": 4.996309719445687e-05, "Full-pretrain/Loss": 2.1384332180023193, "Full-pretrain/Loss (Raw)": 2.2421345710754395, "Full-pretrain/Step": 446, "Full-pretrain/Step Time": 17.52486958913505} +{"Full-pretrain/Learning Rate": 4.9962634583172475e-05, "Full-pretrain/Loss": 2.1387877464294434, "Full-pretrain/Loss (Raw)": 2.1364734172821045, "Full-pretrain/Step": 447, "Full-pretrain/Step Time": 17.530696334317327} +{"Full-pretrain/Learning Rate": 4.9962169092456956e-05, "Full-pretrain/Loss": 2.1386678218841553, "Full-pretrain/Loss (Raw)": 2.1927576065063477, "Full-pretrain/Step": 448, "Full-pretrain/Step Time": 17.533497294411063} +{"Full-pretrain/Learning Rate": 4.9961700722364e-05, "Full-pretrain/Loss": 2.1430933475494385, "Full-pretrain/Loss (Raw)": 2.147636890411377, "Full-pretrain/Step": 449, "Full-pretrain/Step Time": 17.525892194360495} +{"Full-pretrain/Learning Rate": 4.9961229472947634e-05, "Full-pretrain/Loss": 2.1416077613830566, "Full-pretrain/Loss (Raw)": 2.1395037174224854, "Full-pretrain/Step": 450, "Full-pretrain/Step Time": 17.528928484767675} +{"Full-pretrain/Learning Rate": 4.9960755344262225e-05, "Full-pretrain/Loss": 2.1412060260772705, "Full-pretrain/Loss (Raw)": 1.9729100465774536, "Full-pretrain/Step": 451, "Full-pretrain/Step Time": 17.532594554126263} +{"Full-pretrain/Learning Rate": 4.9960278336362465e-05, "Full-pretrain/Loss": 2.139707326889038, "Full-pretrain/Loss (Raw)": 2.00748872756958, "Full-pretrain/Step": 452, "Full-pretrain/Step Time": 17.530220549553633} +{"Full-pretrain/Learning Rate": 4.9959798449303365e-05, "Full-pretrain/Loss": 2.130652666091919, "Full-pretrain/Loss (Raw)": 1.7092201709747314, "Full-pretrain/Step": 453, "Full-pretrain/Step Time": 17.5300416611135} +{"Full-pretrain/Learning Rate": 4.995931568314029e-05, "Full-pretrain/Loss": 2.1379175186157227, "Full-pretrain/Loss (Raw)": 2.3202085494995117, "Full-pretrain/Step": 454, "Full-pretrain/Step Time": 17.528807105496526} +{"Full-pretrain/Learning Rate": 4.995883003792891e-05, "Full-pretrain/Loss": 2.139054298400879, "Full-pretrain/Loss (Raw)": 2.136672019958496, "Full-pretrain/Step": 455, "Full-pretrain/Step Time": 17.530740041285753} +{"Full-pretrain/Learning Rate": 4.9958341513725264e-05, "Full-pretrain/Loss": 2.141639471054077, "Full-pretrain/Loss (Raw)": 2.1407055854797363, "Full-pretrain/Step": 456, "Full-pretrain/Step Time": 17.528970265761018} +{"Full-pretrain/Learning Rate": 4.9957850110585696e-05, "Full-pretrain/Loss": 2.1279373168945312, "Full-pretrain/Loss (Raw)": 2.0297837257385254, "Full-pretrain/Step": 457, "Full-pretrain/Step Time": 17.530870439484715} +{"Full-pretrain/Learning Rate": 4.9957355828566884e-05, "Full-pretrain/Loss": 2.129723072052002, "Full-pretrain/Loss (Raw)": 2.2521824836730957, "Full-pretrain/Step": 458, "Full-pretrain/Step Time": 17.5355591122061} +{"Full-pretrain/Learning Rate": 4.995685866772586e-05, "Full-pretrain/Loss": 2.127239465713501, "Full-pretrain/Loss (Raw)": 2.0267975330352783, "Full-pretrain/Step": 459, "Full-pretrain/Step Time": 17.530998215079308} +{"Full-pretrain/Learning Rate": 4.9956358628119945e-05, "Full-pretrain/Loss": 2.1199543476104736, "Full-pretrain/Loss (Raw)": 1.9293423891067505, "Full-pretrain/Step": 460, "Full-pretrain/Step Time": 17.53713587857783} +{"Full-pretrain/Learning Rate": 4.9955855709806845e-05, "Full-pretrain/Loss": 2.1188197135925293, "Full-pretrain/Loss (Raw)": 2.069080352783203, "Full-pretrain/Step": 461, "Full-pretrain/Step Time": 17.535066569224} +{"Full-pretrain/Learning Rate": 4.9955349912844554e-05, "Full-pretrain/Loss": 2.1191983222961426, "Full-pretrain/Loss (Raw)": 2.134512424468994, "Full-pretrain/Step": 462, "Full-pretrain/Step Time": 17.535740623250604} +{"Full-pretrain/Learning Rate": 4.995484123729141e-05, "Full-pretrain/Loss": 2.1224050521850586, "Full-pretrain/Loss (Raw)": 2.0856070518493652, "Full-pretrain/Step": 463, "Full-pretrain/Step Time": 17.53773056715727} +{"Full-pretrain/Learning Rate": 4.995432968320611e-05, "Full-pretrain/Loss": 2.107997417449951, "Full-pretrain/Loss (Raw)": 1.8614078760147095, "Full-pretrain/Step": 464, "Full-pretrain/Step Time": 17.539313251152635} +{"Full-pretrain/Learning Rate": 4.995381525064765e-05, "Full-pretrain/Loss": 2.110152244567871, "Full-pretrain/Loss (Raw)": 2.303295135498047, "Full-pretrain/Step": 465, "Full-pretrain/Step Time": 17.54530488885939} +{"Full-pretrain/Learning Rate": 4.995329793967537e-05, "Full-pretrain/Loss": 2.1183362007141113, "Full-pretrain/Loss (Raw)": 2.237985134124756, "Full-pretrain/Step": 466, "Full-pretrain/Step Time": 17.545850668102503} +{"Full-pretrain/Learning Rate": 4.995277775034893e-05, "Full-pretrain/Loss": 2.1210505962371826, "Full-pretrain/Loss (Raw)": 2.1301772594451904, "Full-pretrain/Step": 467, "Full-pretrain/Step Time": 17.543927805498242} +{"Full-pretrain/Learning Rate": 4.995225468272836e-05, "Full-pretrain/Loss": 2.111940622329712, "Full-pretrain/Loss (Raw)": 1.9667725563049316, "Full-pretrain/Step": 468, "Full-pretrain/Step Time": 17.541336936876178} +{"Full-pretrain/Learning Rate": 4.995172873687398e-05, "Full-pretrain/Loss": 2.1061816215515137, "Full-pretrain/Loss (Raw)": 2.144484043121338, "Full-pretrain/Step": 469, "Full-pretrain/Step Time": 17.54934016801417} +{"Full-pretrain/Learning Rate": 4.995119991284646e-05, "Full-pretrain/Loss": 2.1120517253875732, "Full-pretrain/Loss (Raw)": 2.321174144744873, "Full-pretrain/Step": 470, "Full-pretrain/Step Time": 17.543817782774568} +{"Full-pretrain/Learning Rate": 4.995066821070679e-05, "Full-pretrain/Loss": 2.106954574584961, "Full-pretrain/Loss (Raw)": 1.990466833114624, "Full-pretrain/Step": 471, "Full-pretrain/Step Time": 17.54567152261734} +{"Full-pretrain/Learning Rate": 4.9950133630516315e-05, "Full-pretrain/Loss": 2.110534429550171, "Full-pretrain/Loss (Raw)": 2.2196121215820312, "Full-pretrain/Step": 472, "Full-pretrain/Step Time": 17.55194006115198} +{"Full-pretrain/Learning Rate": 4.9949596172336696e-05, "Full-pretrain/Loss": 2.109316349029541, "Full-pretrain/Loss (Raw)": 2.122875690460205, "Full-pretrain/Step": 473, "Full-pretrain/Step Time": 17.548869850113988} +{"Full-pretrain/Learning Rate": 4.994905583622992e-05, "Full-pretrain/Loss": 2.108884572982788, "Full-pretrain/Loss (Raw)": 2.034259557723999, "Full-pretrain/Step": 474, "Full-pretrain/Step Time": 17.55012564174831} +{"Full-pretrain/Learning Rate": 4.9948512622258325e-05, "Full-pretrain/Loss": 2.113504409790039, "Full-pretrain/Loss (Raw)": 2.306596517562866, "Full-pretrain/Step": 475, "Full-pretrain/Step Time": 17.547730151563883} +{"Full-pretrain/Learning Rate": 4.994796653048457e-05, "Full-pretrain/Loss": 2.110790967941284, "Full-pretrain/Loss (Raw)": 2.0598068237304688, "Full-pretrain/Step": 476, "Full-pretrain/Step Time": 17.553531052544713} +{"Full-pretrain/Learning Rate": 4.994741756097164e-05, "Full-pretrain/Loss": 2.110478401184082, "Full-pretrain/Loss (Raw)": 2.1633777618408203, "Full-pretrain/Step": 477, "Full-pretrain/Step Time": 17.556276870891452} +{"Full-pretrain/Learning Rate": 4.994686571378286e-05, "Full-pretrain/Loss": 2.1111130714416504, "Full-pretrain/Loss (Raw)": 2.262441635131836, "Full-pretrain/Step": 478, "Full-pretrain/Step Time": 17.56287706270814} +{"Full-pretrain/Learning Rate": 4.994631098898189e-05, "Full-pretrain/Loss": 2.1128790378570557, "Full-pretrain/Loss (Raw)": 2.192990779876709, "Full-pretrain/Step": 479, "Full-pretrain/Step Time": 17.560345694422722} +{"Full-pretrain/Learning Rate": 4.994575338663271e-05, "Full-pretrain/Loss": 2.1079647541046143, "Full-pretrain/Loss (Raw)": 2.0354976654052734, "Full-pretrain/Step": 480, "Full-pretrain/Step Time": 17.558780504390597} +{"Full-pretrain/Learning Rate": 4.994519290679964e-05, "Full-pretrain/Loss": 2.1088955402374268, "Full-pretrain/Loss (Raw)": 2.177419900894165, "Full-pretrain/Step": 481, "Full-pretrain/Step Time": 17.55799220688641} +{"Full-pretrain/Learning Rate": 4.994462954954734e-05, "Full-pretrain/Loss": 2.1124958992004395, "Full-pretrain/Loss (Raw)": 2.2547197341918945, "Full-pretrain/Step": 482, "Full-pretrain/Step Time": 17.565431097522378} +{"Full-pretrain/Learning Rate": 4.994406331494079e-05, "Full-pretrain/Loss": 2.119962215423584, "Full-pretrain/Loss (Raw)": 2.2118287086486816, "Full-pretrain/Step": 483, "Full-pretrain/Step Time": 17.563679622486234} +{"Full-pretrain/Learning Rate": 4.994349420304531e-05, "Full-pretrain/Loss": 2.1216061115264893, "Full-pretrain/Loss (Raw)": 2.0600948333740234, "Full-pretrain/Step": 484, "Full-pretrain/Step Time": 17.562611447647214} +{"Full-pretrain/Learning Rate": 4.9942922213926525e-05, "Full-pretrain/Loss": 2.1356189250946045, "Full-pretrain/Loss (Raw)": 2.15762996673584, "Full-pretrain/Step": 485, "Full-pretrain/Step Time": 17.563118621706963} +{"Full-pretrain/Learning Rate": 4.994234734765043e-05, "Full-pretrain/Loss": 2.1313257217407227, "Full-pretrain/Loss (Raw)": 2.1828267574310303, "Full-pretrain/Step": 486, "Full-pretrain/Step Time": 17.565680094063282} +{"Full-pretrain/Learning Rate": 4.994176960428334e-05, "Full-pretrain/Loss": 2.134598731994629, "Full-pretrain/Loss (Raw)": 2.2414064407348633, "Full-pretrain/Step": 487, "Full-pretrain/Step Time": 17.56472653336823} +{"Full-pretrain/Learning Rate": 4.9941188983891885e-05, "Full-pretrain/Loss": 2.1391777992248535, "Full-pretrain/Loss (Raw)": 2.287234306335449, "Full-pretrain/Step": 488, "Full-pretrain/Step Time": 17.566028125584126} +{"Full-pretrain/Learning Rate": 4.9940605486543045e-05, "Full-pretrain/Loss": 2.1441268920898438, "Full-pretrain/Loss (Raw)": 2.188161849975586, "Full-pretrain/Step": 489, "Full-pretrain/Step Time": 17.563857620581985} +{"Full-pretrain/Learning Rate": 4.994001911230414e-05, "Full-pretrain/Loss": 2.1425986289978027, "Full-pretrain/Loss (Raw)": 2.203268051147461, "Full-pretrain/Step": 490, "Full-pretrain/Step Time": 17.569916123524308} +{"Full-pretrain/Learning Rate": 4.993942986124278e-05, "Full-pretrain/Loss": 2.1454639434814453, "Full-pretrain/Loss (Raw)": 2.1184964179992676, "Full-pretrain/Step": 491, "Full-pretrain/Step Time": 17.576593292877078} +{"Full-pretrain/Learning Rate": 4.9938837733426955e-05, "Full-pretrain/Loss": 2.1422250270843506, "Full-pretrain/Loss (Raw)": 1.8256908655166626, "Full-pretrain/Step": 492, "Full-pretrain/Step Time": 17.58010215871036} +{"Full-pretrain/Learning Rate": 4.993824272892497e-05, "Full-pretrain/Loss": 2.1430749893188477, "Full-pretrain/Loss (Raw)": 2.096283435821533, "Full-pretrain/Step": 493, "Full-pretrain/Step Time": 17.579486455768347} +{"Full-pretrain/Learning Rate": 4.993764484780543e-05, "Full-pretrain/Loss": 2.1389524936676025, "Full-pretrain/Loss (Raw)": 2.002584934234619, "Full-pretrain/Step": 494, "Full-pretrain/Step Time": 17.584242736920714} +{"Full-pretrain/Learning Rate": 4.993704409013734e-05, "Full-pretrain/Loss": 2.1425137519836426, "Full-pretrain/Loss (Raw)": 2.1995749473571777, "Full-pretrain/Step": 495, "Full-pretrain/Step Time": 17.5852411929518} +{"Full-pretrain/Learning Rate": 4.993644045598997e-05, "Full-pretrain/Loss": 2.1546926498413086, "Full-pretrain/Loss (Raw)": 2.251126289367676, "Full-pretrain/Step": 496, "Full-pretrain/Step Time": 17.584199380129576} +{"Full-pretrain/Learning Rate": 4.9935833945432955e-05, "Full-pretrain/Loss": 2.1470344066619873, "Full-pretrain/Loss (Raw)": 2.058230400085449, "Full-pretrain/Step": 497, "Full-pretrain/Step Time": 17.57968778349459} +{"Full-pretrain/Learning Rate": 4.993522455853626e-05, "Full-pretrain/Loss": 2.1440036296844482, "Full-pretrain/Loss (Raw)": 2.1410000324249268, "Full-pretrain/Step": 498, "Full-pretrain/Step Time": 17.585440007969737} +{"Full-pretrain/Learning Rate": 4.9934612295370174e-05, "Full-pretrain/Loss": 2.146733522415161, "Full-pretrain/Loss (Raw)": 2.217536211013794, "Full-pretrain/Step": 499, "Full-pretrain/Step Time": 17.593953855335712} +{"Full-pretrain/Learning Rate": 4.993399715600532e-05, "Full-pretrain/Loss": 2.1480062007904053, "Full-pretrain/Loss (Raw)": 2.0074996948242188, "Full-pretrain/Step": 500, "Full-pretrain/Step Time": 17.596486615017056} +{"Full-pretrain/Learning Rate": 4.993337914051266e-05, "Full-pretrain/Loss": 2.157349109649658, "Full-pretrain/Loss (Raw)": 2.443453788757324, "Full-pretrain/Step": 501, "Full-pretrain/Step Time": 17.595276679843664} +{"Full-pretrain/Learning Rate": 4.993275824896348e-05, "Full-pretrain/Loss": 2.154670476913452, "Full-pretrain/Loss (Raw)": 2.2354602813720703, "Full-pretrain/Step": 502, "Full-pretrain/Step Time": 17.600697608664632} +{"Full-pretrain/Learning Rate": 4.993213448142939e-05, "Full-pretrain/Loss": 2.1598353385925293, "Full-pretrain/Loss (Raw)": 2.1557469367980957, "Full-pretrain/Step": 503, "Full-pretrain/Step Time": 17.600194377824664} +{"Full-pretrain/Learning Rate": 4.993150783798236e-05, "Full-pretrain/Loss": 2.1641180515289307, "Full-pretrain/Loss (Raw)": 2.3566555976867676, "Full-pretrain/Step": 504, "Full-pretrain/Step Time": 17.604419400915504} +{"Full-pretrain/Learning Rate": 4.9930878318694655e-05, "Full-pretrain/Loss": 2.1623411178588867, "Full-pretrain/Loss (Raw)": 2.0660128593444824, "Full-pretrain/Step": 505, "Full-pretrain/Step Time": 17.59890465810895} +{"Full-pretrain/Learning Rate": 4.99302459236389e-05, "Full-pretrain/Loss": 2.168377161026001, "Full-pretrain/Loss (Raw)": 2.2274169921875, "Full-pretrain/Step": 506, "Full-pretrain/Step Time": 17.604117900133133} +{"Full-pretrain/Learning Rate": 4.992961065288804e-05, "Full-pretrain/Loss": 2.1551671028137207, "Full-pretrain/Loss (Raw)": 1.883874535560608, "Full-pretrain/Step": 507, "Full-pretrain/Step Time": 17.605495892465115} +{"Full-pretrain/Learning Rate": 4.992897250651535e-05, "Full-pretrain/Loss": 2.155790328979492, "Full-pretrain/Loss (Raw)": 2.0797548294067383, "Full-pretrain/Step": 508, "Full-pretrain/Step Time": 17.603682616725564} +{"Full-pretrain/Learning Rate": 4.992833148459444e-05, "Full-pretrain/Loss": 2.159043312072754, "Full-pretrain/Loss (Raw)": 2.2674665451049805, "Full-pretrain/Step": 509, "Full-pretrain/Step Time": 17.601689351722598} +{"Full-pretrain/Learning Rate": 4.992768758719926e-05, "Full-pretrain/Loss": 2.1535377502441406, "Full-pretrain/Loss (Raw)": 2.08626389503479, "Full-pretrain/Step": 510, "Full-pretrain/Step Time": 17.60834465548396} +{"Full-pretrain/Learning Rate": 4.992704081440407e-05, "Full-pretrain/Loss": 2.1479849815368652, "Full-pretrain/Loss (Raw)": 2.015305995941162, "Full-pretrain/Step": 511, "Full-pretrain/Step Time": 17.606824051588774} +{"Full-pretrain/Learning Rate": 4.992639116628349e-05, "Full-pretrain/Loss": 2.1500797271728516, "Full-pretrain/Loss (Raw)": 2.10252046585083, "Full-pretrain/Step": 512, "Full-pretrain/Step Time": 17.607367986813188} +{"Full-pretrain/Learning Rate": 4.9925738642912447e-05, "Full-pretrain/Loss": 2.1526310443878174, "Full-pretrain/Loss (Raw)": 2.2590696811676025, "Full-pretrain/Step": 513, "Full-pretrain/Step Time": 17.608024643734097} +{"Full-pretrain/Learning Rate": 4.99250832443662e-05, "Full-pretrain/Loss": 2.1622681617736816, "Full-pretrain/Loss (Raw)": 2.5631017684936523, "Full-pretrain/Step": 514, "Full-pretrain/Step Time": 17.605822909623384} +{"Full-pretrain/Learning Rate": 4.9924424970720376e-05, "Full-pretrain/Loss": 2.1587181091308594, "Full-pretrain/Loss (Raw)": 2.098231792449951, "Full-pretrain/Step": 515, "Full-pretrain/Step Time": 17.609439315274358} +{"Full-pretrain/Learning Rate": 4.992376382205088e-05, "Full-pretrain/Loss": 2.156428337097168, "Full-pretrain/Loss (Raw)": 1.9868178367614746, "Full-pretrain/Step": 516, "Full-pretrain/Step Time": 17.605655182152987} +{"Full-pretrain/Learning Rate": 4.9923099798433985e-05, "Full-pretrain/Loss": 2.154344081878662, "Full-pretrain/Loss (Raw)": 2.090941905975342, "Full-pretrain/Step": 517, "Full-pretrain/Step Time": 17.60905939899385} +{"Full-pretrain/Learning Rate": 4.992243289994629e-05, "Full-pretrain/Loss": 2.1495108604431152, "Full-pretrain/Loss (Raw)": 2.028158664703369, "Full-pretrain/Step": 518, "Full-pretrain/Step Time": 17.609473356977105} +{"Full-pretrain/Learning Rate": 4.992176312666472e-05, "Full-pretrain/Loss": 2.147829055786133, "Full-pretrain/Loss (Raw)": 2.187589645385742, "Full-pretrain/Step": 519, "Full-pretrain/Step Time": 17.615257864817977} +{"Full-pretrain/Learning Rate": 4.992109047866653e-05, "Full-pretrain/Loss": 2.141611099243164, "Full-pretrain/Loss (Raw)": 2.0882608890533447, "Full-pretrain/Step": 520, "Full-pretrain/Step Time": 17.608517859131098} +{"Full-pretrain/Learning Rate": 4.992041495602932e-05, "Full-pretrain/Loss": 2.1408379077911377, "Full-pretrain/Loss (Raw)": 2.1634154319763184, "Full-pretrain/Step": 521, "Full-pretrain/Step Time": 17.61146137677133} +{"Full-pretrain/Learning Rate": 4.9919736558830984e-05, "Full-pretrain/Loss": 2.137601375579834, "Full-pretrain/Loss (Raw)": 2.099696159362793, "Full-pretrain/Step": 522, "Full-pretrain/Step Time": 17.611338138580322} +{"Full-pretrain/Learning Rate": 4.9919055287149805e-05, "Full-pretrain/Loss": 2.13618803024292, "Full-pretrain/Loss (Raw)": 2.073268413543701, "Full-pretrain/Step": 523, "Full-pretrain/Step Time": 17.614799370989203} +{"Full-pretrain/Learning Rate": 4.991837114106436e-05, "Full-pretrain/Loss": 2.1422910690307617, "Full-pretrain/Loss (Raw)": 2.020998001098633, "Full-pretrain/Step": 524, "Full-pretrain/Step Time": 17.611132288351655} +{"Full-pretrain/Learning Rate": 4.991768412065355e-05, "Full-pretrain/Loss": 2.1423301696777344, "Full-pretrain/Loss (Raw)": 2.097534656524658, "Full-pretrain/Step": 525, "Full-pretrain/Step Time": 17.614547926932573} +{"Full-pretrain/Learning Rate": 4.991699422599664e-05, "Full-pretrain/Loss": 2.1461849212646484, "Full-pretrain/Loss (Raw)": 2.1259303092956543, "Full-pretrain/Step": 526, "Full-pretrain/Step Time": 17.61767360754311} +{"Full-pretrain/Learning Rate": 4.99163014571732e-05, "Full-pretrain/Loss": 2.139267921447754, "Full-pretrain/Loss (Raw)": 1.9782319068908691, "Full-pretrain/Step": 527, "Full-pretrain/Step Time": 17.622853176668286} +{"Full-pretrain/Learning Rate": 4.991560581426315e-05, "Full-pretrain/Loss": 2.1344027519226074, "Full-pretrain/Loss (Raw)": 2.095439910888672, "Full-pretrain/Step": 528, "Full-pretrain/Step Time": 17.617742206901312} +{"Full-pretrain/Learning Rate": 4.991490729734671e-05, "Full-pretrain/Loss": 2.1354141235351562, "Full-pretrain/Loss (Raw)": 2.090592622756958, "Full-pretrain/Step": 529, "Full-pretrain/Step Time": 17.620469100773335} +{"Full-pretrain/Learning Rate": 4.991420590650448e-05, "Full-pretrain/Loss": 2.1314034461975098, "Full-pretrain/Loss (Raw)": 2.0126688480377197, "Full-pretrain/Step": 530, "Full-pretrain/Step Time": 17.620386412367225} +{"Full-pretrain/Learning Rate": 4.9913501641817354e-05, "Full-pretrain/Loss": 2.129753589630127, "Full-pretrain/Loss (Raw)": 2.164736270904541, "Full-pretrain/Step": 531, "Full-pretrain/Step Time": 17.62072023563087} +{"Full-pretrain/Learning Rate": 4.9912794503366566e-05, "Full-pretrain/Loss": 2.139029026031494, "Full-pretrain/Loss (Raw)": 2.3043196201324463, "Full-pretrain/Step": 532, "Full-pretrain/Step Time": 17.621559405699372} +{"Full-pretrain/Learning Rate": 4.991208449123369e-05, "Full-pretrain/Loss": 2.1264290809631348, "Full-pretrain/Loss (Raw)": 2.040250062942505, "Full-pretrain/Step": 533, "Full-pretrain/Step Time": 17.615455336868763} +{"Full-pretrain/Learning Rate": 4.991137160550062e-05, "Full-pretrain/Loss": 2.1225523948669434, "Full-pretrain/Loss (Raw)": 2.111402988433838, "Full-pretrain/Step": 534, "Full-pretrain/Step Time": 17.61831190995872} +{"Full-pretrain/Learning Rate": 4.991065584624959e-05, "Full-pretrain/Loss": 2.124511241912842, "Full-pretrain/Loss (Raw)": 2.2184300422668457, "Full-pretrain/Step": 535, "Full-pretrain/Step Time": 17.620369501411915} +{"Full-pretrain/Learning Rate": 4.9909937213563165e-05, "Full-pretrain/Loss": 2.119119644165039, "Full-pretrain/Loss (Raw)": 2.184128522872925, "Full-pretrain/Step": 536, "Full-pretrain/Step Time": 17.61536243930459} +{"Full-pretrain/Learning Rate": 4.9909215707524236e-05, "Full-pretrain/Loss": 2.1328656673431396, "Full-pretrain/Loss (Raw)": 2.5058860778808594, "Full-pretrain/Step": 537, "Full-pretrain/Step Time": 17.609150238335133} +{"Full-pretrain/Learning Rate": 4.9908491328216025e-05, "Full-pretrain/Loss": 2.138068675994873, "Full-pretrain/Loss (Raw)": 2.3939175605773926, "Full-pretrain/Step": 538, "Full-pretrain/Step Time": 17.61224924772978} +{"Full-pretrain/Learning Rate": 4.9907764075722094e-05, "Full-pretrain/Loss": 2.1491289138793945, "Full-pretrain/Loss (Raw)": 2.2377943992614746, "Full-pretrain/Step": 539, "Full-pretrain/Step Time": 17.615412905812263} +{"Full-pretrain/Learning Rate": 4.9907033950126336e-05, "Full-pretrain/Loss": 2.156754970550537, "Full-pretrain/Loss (Raw)": 2.323787212371826, "Full-pretrain/Step": 540, "Full-pretrain/Step Time": 17.61250756494701} +{"Full-pretrain/Learning Rate": 4.990630095151296e-05, "Full-pretrain/Loss": 2.1551942825317383, "Full-pretrain/Loss (Raw)": 2.2175261974334717, "Full-pretrain/Step": 541, "Full-pretrain/Step Time": 17.613153252750635} +{"Full-pretrain/Learning Rate": 4.990556507996652e-05, "Full-pretrain/Loss": 2.1469886302948, "Full-pretrain/Loss (Raw)": 1.8236875534057617, "Full-pretrain/Step": 542, "Full-pretrain/Step Time": 17.611874086782336} +{"Full-pretrain/Learning Rate": 4.99048263355719e-05, "Full-pretrain/Loss": 2.1547670364379883, "Full-pretrain/Loss (Raw)": 2.264209747314453, "Full-pretrain/Step": 543, "Full-pretrain/Step Time": 17.614056270569563} +{"Full-pretrain/Learning Rate": 4.990408471841432e-05, "Full-pretrain/Loss": 2.1575047969818115, "Full-pretrain/Loss (Raw)": 2.1901309490203857, "Full-pretrain/Step": 544, "Full-pretrain/Step Time": 17.618639262393117} +{"Full-pretrain/Learning Rate": 4.990334022857932e-05, "Full-pretrain/Loss": 2.1467580795288086, "Full-pretrain/Loss (Raw)": 1.9151711463928223, "Full-pretrain/Step": 545, "Full-pretrain/Step Time": 17.61467137373984} +{"Full-pretrain/Learning Rate": 4.990259286615276e-05, "Full-pretrain/Loss": 2.130547046661377, "Full-pretrain/Loss (Raw)": 2.044349193572998, "Full-pretrain/Step": 546, "Full-pretrain/Step Time": 17.621255364269018} +{"Full-pretrain/Learning Rate": 4.9901842631220884e-05, "Full-pretrain/Loss": 2.1352031230926514, "Full-pretrain/Loss (Raw)": 2.2472267150878906, "Full-pretrain/Step": 547, "Full-pretrain/Step Time": 17.622571444138885} +{"Full-pretrain/Learning Rate": 4.9901089523870205e-05, "Full-pretrain/Loss": 2.139681100845337, "Full-pretrain/Loss (Raw)": 2.130115032196045, "Full-pretrain/Step": 548, "Full-pretrain/Step Time": 17.623990627005696} +{"Full-pretrain/Learning Rate": 4.99003335441876e-05, "Full-pretrain/Loss": 2.138186454772949, "Full-pretrain/Loss (Raw)": 2.0431101322174072, "Full-pretrain/Step": 549, "Full-pretrain/Step Time": 17.619628528133035} +{"Full-pretrain/Learning Rate": 4.989957469226027e-05, "Full-pretrain/Loss": 2.1404967308044434, "Full-pretrain/Loss (Raw)": 2.102083444595337, "Full-pretrain/Step": 550, "Full-pretrain/Step Time": 17.62407662346959} +{"Full-pretrain/Learning Rate": 4.989881296817575e-05, "Full-pretrain/Loss": 2.142651319503784, "Full-pretrain/Loss (Raw)": 2.2565395832061768, "Full-pretrain/Step": 551, "Full-pretrain/Step Time": 17.62640676088631} +{"Full-pretrain/Learning Rate": 4.9898048372021905e-05, "Full-pretrain/Loss": 2.1435117721557617, "Full-pretrain/Loss (Raw)": 2.1157984733581543, "Full-pretrain/Step": 552, "Full-pretrain/Step Time": 17.629904923960567} +{"Full-pretrain/Learning Rate": 4.9897280903886937e-05, "Full-pretrain/Loss": 2.142157554626465, "Full-pretrain/Loss (Raw)": 2.120081663131714, "Full-pretrain/Step": 553, "Full-pretrain/Step Time": 17.62504466623068} +{"Full-pretrain/Learning Rate": 4.989651056385936e-05, "Full-pretrain/Loss": 2.147108793258667, "Full-pretrain/Loss (Raw)": 2.2581286430358887, "Full-pretrain/Step": 554, "Full-pretrain/Step Time": 17.625954980030656} +{"Full-pretrain/Learning Rate": 4.989573735202803e-05, "Full-pretrain/Loss": 2.1463980674743652, "Full-pretrain/Loss (Raw)": 2.0505270957946777, "Full-pretrain/Step": 555, "Full-pretrain/Step Time": 17.627559948712587} +{"Full-pretrain/Learning Rate": 4.989496126848215e-05, "Full-pretrain/Loss": 2.154247760772705, "Full-pretrain/Loss (Raw)": 2.272193431854248, "Full-pretrain/Step": 556, "Full-pretrain/Step Time": 17.632194397971034} +{"Full-pretrain/Learning Rate": 4.9894182313311244e-05, "Full-pretrain/Loss": 2.1593680381774902, "Full-pretrain/Loss (Raw)": 2.2613840103149414, "Full-pretrain/Step": 557, "Full-pretrain/Step Time": 17.626747181639075} +{"Full-pretrain/Learning Rate": 4.9893400486605154e-05, "Full-pretrain/Loss": 2.1613001823425293, "Full-pretrain/Loss (Raw)": 2.1877527236938477, "Full-pretrain/Step": 558, "Full-pretrain/Step Time": 17.62967475131154} +{"Full-pretrain/Learning Rate": 4.9892615788454065e-05, "Full-pretrain/Loss": 2.1647205352783203, "Full-pretrain/Loss (Raw)": 2.08768892288208, "Full-pretrain/Step": 559, "Full-pretrain/Step Time": 17.629710217937827} +{"Full-pretrain/Learning Rate": 4.989182821894849e-05, "Full-pretrain/Loss": 2.169231653213501, "Full-pretrain/Loss (Raw)": 2.2397944927215576, "Full-pretrain/Step": 560, "Full-pretrain/Step Time": 17.62913645245135} +{"Full-pretrain/Learning Rate": 4.989103777817928e-05, "Full-pretrain/Loss": 2.1624486446380615, "Full-pretrain/Loss (Raw)": 1.8735371828079224, "Full-pretrain/Step": 561, "Full-pretrain/Step Time": 17.62501478381455} +{"Full-pretrain/Learning Rate": 4.989024446623761e-05, "Full-pretrain/Loss": 2.176265239715576, "Full-pretrain/Loss (Raw)": 2.4547982215881348, "Full-pretrain/Step": 562, "Full-pretrain/Step Time": 17.62606581300497} +{"Full-pretrain/Learning Rate": 4.988944828321498e-05, "Full-pretrain/Loss": 2.1753878593444824, "Full-pretrain/Loss (Raw)": 2.1366682052612305, "Full-pretrain/Step": 563, "Full-pretrain/Step Time": 17.625845786184072} +{"Full-pretrain/Learning Rate": 4.988864922920325e-05, "Full-pretrain/Loss": 2.168436050415039, "Full-pretrain/Loss (Raw)": 2.0818519592285156, "Full-pretrain/Step": 564, "Full-pretrain/Step Time": 17.628468880429864} +{"Full-pretrain/Learning Rate": 4.988784730429457e-05, "Full-pretrain/Loss": 2.174088478088379, "Full-pretrain/Loss (Raw)": 2.2211337089538574, "Full-pretrain/Step": 565, "Full-pretrain/Step Time": 17.629012435674667} +{"Full-pretrain/Learning Rate": 4.988704250858145e-05, "Full-pretrain/Loss": 2.173025131225586, "Full-pretrain/Loss (Raw)": 2.0773744583129883, "Full-pretrain/Step": 566, "Full-pretrain/Step Time": 17.62823927588761} +{"Full-pretrain/Learning Rate": 4.9886234842156724e-05, "Full-pretrain/Loss": 2.166989326477051, "Full-pretrain/Loss (Raw)": 2.025287628173828, "Full-pretrain/Step": 567, "Full-pretrain/Step Time": 17.62947910837829} +{"Full-pretrain/Learning Rate": 4.988542430511356e-05, "Full-pretrain/Loss": 2.1588215827941895, "Full-pretrain/Loss (Raw)": 1.9227522611618042, "Full-pretrain/Step": 568, "Full-pretrain/Step Time": 17.62989019602537} +{"Full-pretrain/Learning Rate": 4.988461089754544e-05, "Full-pretrain/Loss": 2.1418545246124268, "Full-pretrain/Loss (Raw)": 1.9629452228546143, "Full-pretrain/Step": 569, "Full-pretrain/Step Time": 17.628674434497952} +{"Full-pretrain/Learning Rate": 4.98837946195462e-05, "Full-pretrain/Loss": 2.1397714614868164, "Full-pretrain/Loss (Raw)": 2.327263355255127, "Full-pretrain/Step": 570, "Full-pretrain/Step Time": 17.6199423186481} +{"Full-pretrain/Learning Rate": 4.988297547121e-05, "Full-pretrain/Loss": 2.1402535438537598, "Full-pretrain/Loss (Raw)": 2.2532176971435547, "Full-pretrain/Step": 571, "Full-pretrain/Step Time": 17.625801157206297} +{"Full-pretrain/Learning Rate": 4.988215345263132e-05, "Full-pretrain/Loss": 2.132887840270996, "Full-pretrain/Loss (Raw)": 2.0880863666534424, "Full-pretrain/Step": 572, "Full-pretrain/Step Time": 17.626430423930287} +{"Full-pretrain/Learning Rate": 4.9881328563904984e-05, "Full-pretrain/Loss": 2.129866123199463, "Full-pretrain/Loss (Raw)": 2.1208338737487793, "Full-pretrain/Step": 573, "Full-pretrain/Step Time": 17.626948116347194} +{"Full-pretrain/Learning Rate": 4.988050080512614e-05, "Full-pretrain/Loss": 2.138890266418457, "Full-pretrain/Loss (Raw)": 2.112448215484619, "Full-pretrain/Step": 574, "Full-pretrain/Step Time": 17.624330937862396} +{"Full-pretrain/Learning Rate": 4.987967017639027e-05, "Full-pretrain/Loss": 2.131633996963501, "Full-pretrain/Loss (Raw)": 2.032015800476074, "Full-pretrain/Step": 575, "Full-pretrain/Step Time": 17.622175686061382} +{"Full-pretrain/Learning Rate": 4.9878836677793196e-05, "Full-pretrain/Loss": 2.120614767074585, "Full-pretrain/Loss (Raw)": 1.8375087976455688, "Full-pretrain/Step": 576, "Full-pretrain/Step Time": 17.625953260809183} +{"Full-pretrain/Learning Rate": 4.987800030943105e-05, "Full-pretrain/Loss": 2.123154878616333, "Full-pretrain/Loss (Raw)": 1.996460199356079, "Full-pretrain/Step": 577, "Full-pretrain/Step Time": 17.621890796348453} +{"Full-pretrain/Learning Rate": 4.9877161071400314e-05, "Full-pretrain/Loss": 2.125514030456543, "Full-pretrain/Loss (Raw)": 2.119839668273926, "Full-pretrain/Step": 578, "Full-pretrain/Step Time": 17.616090316325426} +{"Full-pretrain/Learning Rate": 4.9876318963797786e-05, "Full-pretrain/Loss": 2.1214776039123535, "Full-pretrain/Loss (Raw)": 2.1180620193481445, "Full-pretrain/Step": 579, "Full-pretrain/Step Time": 17.612490503117442} +{"Full-pretrain/Learning Rate": 4.987547398672061e-05, "Full-pretrain/Loss": 2.116748571395874, "Full-pretrain/Loss (Raw)": 1.9787824153900146, "Full-pretrain/Step": 580, "Full-pretrain/Step Time": 17.615565126761794} +{"Full-pretrain/Learning Rate": 4.987462614026625e-05, "Full-pretrain/Loss": 2.121448040008545, "Full-pretrain/Loss (Raw)": 2.193497657775879, "Full-pretrain/Step": 581, "Full-pretrain/Step Time": 17.613259391859174} +{"Full-pretrain/Learning Rate": 4.987377542453251e-05, "Full-pretrain/Loss": 2.1235179901123047, "Full-pretrain/Loss (Raw)": 2.168323516845703, "Full-pretrain/Step": 582, "Full-pretrain/Step Time": 17.611877290531993} +{"Full-pretrain/Learning Rate": 4.987292183961751e-05, "Full-pretrain/Loss": 2.1275081634521484, "Full-pretrain/Loss (Raw)": 2.384223461151123, "Full-pretrain/Step": 583, "Full-pretrain/Step Time": 17.61096191778779} +{"Full-pretrain/Learning Rate": 4.987206538561972e-05, "Full-pretrain/Loss": 2.126044273376465, "Full-pretrain/Loss (Raw)": 2.0689520835876465, "Full-pretrain/Step": 584, "Full-pretrain/Step Time": 17.609523316845298} +{"Full-pretrain/Learning Rate": 4.987120606263793e-05, "Full-pretrain/Loss": 2.118475914001465, "Full-pretrain/Loss (Raw)": 1.8779007196426392, "Full-pretrain/Step": 585, "Full-pretrain/Step Time": 17.607017062604427} +{"Full-pretrain/Learning Rate": 4.9870343870771256e-05, "Full-pretrain/Loss": 2.109920024871826, "Full-pretrain/Loss (Raw)": 1.9843348264694214, "Full-pretrain/Step": 586, "Full-pretrain/Step Time": 17.60818576067686} +{"Full-pretrain/Learning Rate": 4.9869478810119164e-05, "Full-pretrain/Loss": 2.113426685333252, "Full-pretrain/Loss (Raw)": 2.1627368927001953, "Full-pretrain/Step": 587, "Full-pretrain/Step Time": 17.60858504474163} +{"Full-pretrain/Learning Rate": 4.986861088078143e-05, "Full-pretrain/Loss": 2.118037223815918, "Full-pretrain/Loss (Raw)": 2.41973614692688, "Full-pretrain/Step": 588, "Full-pretrain/Step Time": 17.606186090037227} +{"Full-pretrain/Learning Rate": 4.986774008285816e-05, "Full-pretrain/Loss": 2.112955093383789, "Full-pretrain/Loss (Raw)": 2.0987539291381836, "Full-pretrain/Step": 589, "Full-pretrain/Step Time": 17.603498466312885} +{"Full-pretrain/Learning Rate": 4.986686641644982e-05, "Full-pretrain/Loss": 2.108574151992798, "Full-pretrain/Loss (Raw)": 2.04756236076355, "Full-pretrain/Step": 590, "Full-pretrain/Step Time": 17.60067735426128} +{"Full-pretrain/Learning Rate": 4.986598988165718e-05, "Full-pretrain/Loss": 2.111678123474121, "Full-pretrain/Loss (Raw)": 2.1870126724243164, "Full-pretrain/Step": 591, "Full-pretrain/Step Time": 17.599842682480812} +{"Full-pretrain/Learning Rate": 4.986511047858134e-05, "Full-pretrain/Loss": 2.105381965637207, "Full-pretrain/Loss (Raw)": 2.038321018218994, "Full-pretrain/Step": 592, "Full-pretrain/Step Time": 17.595472026616335} +{"Full-pretrain/Learning Rate": 4.986422820732375e-05, "Full-pretrain/Loss": 2.107058048248291, "Full-pretrain/Loss (Raw)": 1.9271748065948486, "Full-pretrain/Step": 593, "Full-pretrain/Step Time": 17.594157559797168} +{"Full-pretrain/Learning Rate": 4.986334306798617e-05, "Full-pretrain/Loss": 2.1002793312072754, "Full-pretrain/Loss (Raw)": 2.2378764152526855, "Full-pretrain/Step": 594, "Full-pretrain/Step Time": 17.59057948552072} +{"Full-pretrain/Learning Rate": 4.9862455060670696e-05, "Full-pretrain/Loss": 2.0967583656311035, "Full-pretrain/Loss (Raw)": 2.0239992141723633, "Full-pretrain/Step": 595, "Full-pretrain/Step Time": 17.59133325703442} +{"Full-pretrain/Learning Rate": 4.9861564185479784e-05, "Full-pretrain/Loss": 2.101853370666504, "Full-pretrain/Loss (Raw)": 2.244886636734009, "Full-pretrain/Step": 596, "Full-pretrain/Step Time": 17.597689893096685} +{"Full-pretrain/Learning Rate": 4.9860670442516175e-05, "Full-pretrain/Loss": 2.0923147201538086, "Full-pretrain/Loss (Raw)": 1.9159026145935059, "Full-pretrain/Step": 597, "Full-pretrain/Step Time": 17.590950530022383} +{"Full-pretrain/Learning Rate": 4.985977383188296e-05, "Full-pretrain/Loss": 2.089292287826538, "Full-pretrain/Loss (Raw)": 1.9806503057479858, "Full-pretrain/Step": 598, "Full-pretrain/Step Time": 17.596911331638694} +{"Full-pretrain/Learning Rate": 4.9858874353683574e-05, "Full-pretrain/Loss": 2.081751823425293, "Full-pretrain/Loss (Raw)": 1.7840020656585693, "Full-pretrain/Step": 599, "Full-pretrain/Step Time": 17.59362062625587} +{"Full-pretrain/Learning Rate": 4.985797200802177e-05, "Full-pretrain/Loss": 2.090848922729492, "Full-pretrain/Loss (Raw)": 2.2138490676879883, "Full-pretrain/Step": 600, "Full-pretrain/Step Time": 17.597173806279898} +{"Full-pretrain/Learning Rate": 4.9857066795001625e-05, "Full-pretrain/Loss": 2.0952000617980957, "Full-pretrain/Loss (Raw)": 2.102193593978882, "Full-pretrain/Step": 601, "Full-pretrain/Step Time": 17.5996504612267} +{"Full-pretrain/Learning Rate": 4.985615871472758e-05, "Full-pretrain/Loss": 2.083519458770752, "Full-pretrain/Loss (Raw)": 1.9534698724746704, "Full-pretrain/Step": 602, "Full-pretrain/Step Time": 17.598298590630293} +{"Full-pretrain/Learning Rate": 4.9855247767304337e-05, "Full-pretrain/Loss": 2.0802903175354004, "Full-pretrain/Loss (Raw)": 2.149897336959839, "Full-pretrain/Step": 603, "Full-pretrain/Step Time": 17.595028653740883} +{"Full-pretrain/Learning Rate": 4.985433395283701e-05, "Full-pretrain/Loss": 2.0819084644317627, "Full-pretrain/Loss (Raw)": 2.139859199523926, "Full-pretrain/Step": 604, "Full-pretrain/Step Time": 17.592020016163588} +{"Full-pretrain/Learning Rate": 4.985341727143099e-05, "Full-pretrain/Loss": 2.0886926651000977, "Full-pretrain/Loss (Raw)": 2.337935447692871, "Full-pretrain/Step": 605, "Full-pretrain/Step Time": 17.59514005854726} +{"Full-pretrain/Learning Rate": 4.9852497723192024e-05, "Full-pretrain/Loss": 2.091456413269043, "Full-pretrain/Loss (Raw)": 2.200878381729126, "Full-pretrain/Step": 606, "Full-pretrain/Step Time": 17.59155410528183} +{"Full-pretrain/Learning Rate": 4.985157530822619e-05, "Full-pretrain/Loss": 2.0947513580322266, "Full-pretrain/Loss (Raw)": 2.137460231781006, "Full-pretrain/Step": 607, "Full-pretrain/Step Time": 17.585348170250654} +{"Full-pretrain/Learning Rate": 4.985065002663987e-05, "Full-pretrain/Loss": 2.104278802871704, "Full-pretrain/Loss (Raw)": 2.1423850059509277, "Full-pretrain/Step": 608, "Full-pretrain/Step Time": 17.583233952522278} +{"Full-pretrain/Learning Rate": 4.9849721878539804e-05, "Full-pretrain/Loss": 2.104221820831299, "Full-pretrain/Loss (Raw)": 1.9946380853652954, "Full-pretrain/Step": 609, "Full-pretrain/Step Time": 17.594527285546064} +{"Full-pretrain/Learning Rate": 4.984879086403304e-05, "Full-pretrain/Loss": 2.1047863960266113, "Full-pretrain/Loss (Raw)": 2.137906074523926, "Full-pretrain/Step": 610, "Full-pretrain/Step Time": 17.5892626773566} +{"Full-pretrain/Learning Rate": 4.9847856983226996e-05, "Full-pretrain/Loss": 2.106963634490967, "Full-pretrain/Loss (Raw)": 2.187739610671997, "Full-pretrain/Step": 611, "Full-pretrain/Step Time": 17.58080993965268} +{"Full-pretrain/Learning Rate": 4.984692023622938e-05, "Full-pretrain/Loss": 2.113851547241211, "Full-pretrain/Loss (Raw)": 2.1991868019104004, "Full-pretrain/Step": 612, "Full-pretrain/Step Time": 17.587545681744814} +{"Full-pretrain/Learning Rate": 4.984598062314825e-05, "Full-pretrain/Loss": 2.115496873855591, "Full-pretrain/Loss (Raw)": 2.2461535930633545, "Full-pretrain/Step": 613, "Full-pretrain/Step Time": 17.593682078644633} +{"Full-pretrain/Learning Rate": 4.984503814409198e-05, "Full-pretrain/Loss": 2.1117568016052246, "Full-pretrain/Loss (Raw)": 2.0486416816711426, "Full-pretrain/Step": 614, "Full-pretrain/Step Time": 17.59602760337293} +{"Full-pretrain/Learning Rate": 4.984409279916929e-05, "Full-pretrain/Loss": 2.103743553161621, "Full-pretrain/Loss (Raw)": 2.127802848815918, "Full-pretrain/Step": 615, "Full-pretrain/Step Time": 17.59416765719652} +{"Full-pretrain/Learning Rate": 4.984314458848923e-05, "Full-pretrain/Loss": 2.101386547088623, "Full-pretrain/Loss (Raw)": 1.9935187101364136, "Full-pretrain/Step": 616, "Full-pretrain/Step Time": 17.589984385296702} +{"Full-pretrain/Learning Rate": 4.9842193512161165e-05, "Full-pretrain/Loss": 2.1128897666931152, "Full-pretrain/Loss (Raw)": 2.2460036277770996, "Full-pretrain/Step": 617, "Full-pretrain/Step Time": 17.59327789209783} +{"Full-pretrain/Learning Rate": 4.9841239570294815e-05, "Full-pretrain/Loss": 2.115128755569458, "Full-pretrain/Loss (Raw)": 2.0559844970703125, "Full-pretrain/Step": 618, "Full-pretrain/Step Time": 17.591058630496264} +{"Full-pretrain/Learning Rate": 4.984028276300021e-05, "Full-pretrain/Loss": 2.1134634017944336, "Full-pretrain/Loss (Raw)": 2.1094424724578857, "Full-pretrain/Step": 619, "Full-pretrain/Step Time": 17.586069433018565} +{"Full-pretrain/Learning Rate": 4.9839323090387725e-05, "Full-pretrain/Loss": 2.105828046798706, "Full-pretrain/Loss (Raw)": 2.1754093170166016, "Full-pretrain/Step": 620, "Full-pretrain/Step Time": 17.581380223855376} +{"Full-pretrain/Learning Rate": 4.983836055256804e-05, "Full-pretrain/Loss": 2.104226589202881, "Full-pretrain/Loss (Raw)": 2.0475006103515625, "Full-pretrain/Step": 621, "Full-pretrain/Step Time": 17.584641095250845} +{"Full-pretrain/Learning Rate": 4.98373951496522e-05, "Full-pretrain/Loss": 2.107687473297119, "Full-pretrain/Loss (Raw)": 2.1583235263824463, "Full-pretrain/Step": 622, "Full-pretrain/Step Time": 17.585374446585774} +{"Full-pretrain/Learning Rate": 4.9836426881751554e-05, "Full-pretrain/Loss": 2.1083011627197266, "Full-pretrain/Loss (Raw)": 2.2066457271575928, "Full-pretrain/Step": 623, "Full-pretrain/Step Time": 17.577799201011658} +{"Full-pretrain/Learning Rate": 4.9835455748977795e-05, "Full-pretrain/Loss": 2.1092405319213867, "Full-pretrain/Loss (Raw)": 2.0683791637420654, "Full-pretrain/Step": 624, "Full-pretrain/Step Time": 17.58072647638619} +{"Full-pretrain/Learning Rate": 4.983448175144294e-05, "Full-pretrain/Loss": 2.112058639526367, "Full-pretrain/Loss (Raw)": 2.017352342605591, "Full-pretrain/Step": 625, "Full-pretrain/Step Time": 17.58456751331687} +{"Full-pretrain/Learning Rate": 4.983350488925935e-05, "Full-pretrain/Loss": 2.107060432434082, "Full-pretrain/Loss (Raw)": 2.0779364109039307, "Full-pretrain/Step": 626, "Full-pretrain/Step Time": 17.582542521879077} +{"Full-pretrain/Learning Rate": 4.9832525162539696e-05, "Full-pretrain/Loss": 2.1059927940368652, "Full-pretrain/Loss (Raw)": 1.9898293018341064, "Full-pretrain/Step": 627, "Full-pretrain/Step Time": 17.573685489594936} +{"Full-pretrain/Learning Rate": 4.9831542571396995e-05, "Full-pretrain/Loss": 2.1022496223449707, "Full-pretrain/Loss (Raw)": 2.1251132488250732, "Full-pretrain/Step": 628, "Full-pretrain/Step Time": 17.57174332253635} +{"Full-pretrain/Learning Rate": 4.983055711594457e-05, "Full-pretrain/Loss": 2.1169934272766113, "Full-pretrain/Loss (Raw)": 2.3877041339874268, "Full-pretrain/Step": 629, "Full-pretrain/Step Time": 17.57460887171328} +{"Full-pretrain/Learning Rate": 4.982956879629612e-05, "Full-pretrain/Loss": 2.1259281635284424, "Full-pretrain/Loss (Raw)": 2.266556739807129, "Full-pretrain/Step": 630, "Full-pretrain/Step Time": 17.57045583613217} +{"Full-pretrain/Learning Rate": 4.982857761256564e-05, "Full-pretrain/Loss": 2.130751609802246, "Full-pretrain/Loss (Raw)": 1.9383559226989746, "Full-pretrain/Step": 631, "Full-pretrain/Step Time": 17.571842012926936} +{"Full-pretrain/Learning Rate": 4.982758356486745e-05, "Full-pretrain/Loss": 2.124268054962158, "Full-pretrain/Loss (Raw)": 2.0063681602478027, "Full-pretrain/Step": 632, "Full-pretrain/Step Time": 17.566205952316523} +{"Full-pretrain/Learning Rate": 4.982658665331622e-05, "Full-pretrain/Loss": 2.1226940155029297, "Full-pretrain/Loss (Raw)": 2.0518300533294678, "Full-pretrain/Step": 633, "Full-pretrain/Step Time": 17.568197790533304} +{"Full-pretrain/Learning Rate": 4.982558687802695e-05, "Full-pretrain/Loss": 2.1261487007141113, "Full-pretrain/Loss (Raw)": 2.064021348953247, "Full-pretrain/Step": 634, "Full-pretrain/Step Time": 17.564348071813583} +{"Full-pretrain/Learning Rate": 4.982458423911495e-05, "Full-pretrain/Loss": 2.132139205932617, "Full-pretrain/Loss (Raw)": 2.3415908813476562, "Full-pretrain/Step": 635, "Full-pretrain/Step Time": 17.566307863220572} +{"Full-pretrain/Learning Rate": 4.982357873669589e-05, "Full-pretrain/Loss": 2.127445697784424, "Full-pretrain/Loss (Raw)": 1.9896608591079712, "Full-pretrain/Step": 636, "Full-pretrain/Step Time": 17.564869675785303} +{"Full-pretrain/Learning Rate": 4.9822570370885733e-05, "Full-pretrain/Loss": 2.124403476715088, "Full-pretrain/Loss (Raw)": 2.240586280822754, "Full-pretrain/Step": 637, "Full-pretrain/Step Time": 17.569530161097646} +{"Full-pretrain/Learning Rate": 4.982155914180082e-05, "Full-pretrain/Loss": 2.1192941665649414, "Full-pretrain/Loss (Raw)": 2.0373873710632324, "Full-pretrain/Step": 638, "Full-pretrain/Step Time": 17.56532051973045} +{"Full-pretrain/Learning Rate": 4.982054504955778e-05, "Full-pretrain/Loss": 2.1135687828063965, "Full-pretrain/Loss (Raw)": 1.9542495012283325, "Full-pretrain/Step": 639, "Full-pretrain/Step Time": 17.566954091191292} +{"Full-pretrain/Learning Rate": 4.981952809427359e-05, "Full-pretrain/Loss": 2.1121506690979004, "Full-pretrain/Loss (Raw)": 2.097001552581787, "Full-pretrain/Step": 640, "Full-pretrain/Step Time": 17.566376443952322} +{"Full-pretrain/Learning Rate": 4.9818508276065554e-05, "Full-pretrain/Loss": 2.1186013221740723, "Full-pretrain/Loss (Raw)": 2.2010574340820312, "Full-pretrain/Step": 641, "Full-pretrain/Step Time": 17.565211148932576} +{"Full-pretrain/Learning Rate": 4.981748559505132e-05, "Full-pretrain/Loss": 2.111353874206543, "Full-pretrain/Loss (Raw)": 1.9059855937957764, "Full-pretrain/Step": 642, "Full-pretrain/Step Time": 17.560737773776054} +{"Full-pretrain/Learning Rate": 4.9816460051348835e-05, "Full-pretrain/Loss": 2.104206085205078, "Full-pretrain/Loss (Raw)": 1.9590154886245728, "Full-pretrain/Step": 643, "Full-pretrain/Step Time": 17.5621631834656} +{"Full-pretrain/Learning Rate": 4.98154316450764e-05, "Full-pretrain/Loss": 2.089730739593506, "Full-pretrain/Loss (Raw)": 1.7359740734100342, "Full-pretrain/Step": 644, "Full-pretrain/Step Time": 17.562312120571733} +{"Full-pretrain/Learning Rate": 4.981440037635266e-05, "Full-pretrain/Loss": 2.0855696201324463, "Full-pretrain/Loss (Raw)": 2.1129984855651855, "Full-pretrain/Step": 645, "Full-pretrain/Step Time": 17.564584596082568} +{"Full-pretrain/Learning Rate": 4.981336624529655e-05, "Full-pretrain/Loss": 2.0920002460479736, "Full-pretrain/Loss (Raw)": 2.2544209957122803, "Full-pretrain/Step": 646, "Full-pretrain/Step Time": 17.562007816508412} +{"Full-pretrain/Learning Rate": 4.981232925202736e-05, "Full-pretrain/Loss": 2.088268756866455, "Full-pretrain/Loss (Raw)": 2.008397102355957, "Full-pretrain/Step": 647, "Full-pretrain/Step Time": 17.560303619131446} +{"Full-pretrain/Learning Rate": 4.9811289396664715e-05, "Full-pretrain/Loss": 2.091362476348877, "Full-pretrain/Loss (Raw)": 2.092522144317627, "Full-pretrain/Step": 648, "Full-pretrain/Step Time": 17.565269634127617} +{"Full-pretrain/Learning Rate": 4.9810246679328554e-05, "Full-pretrain/Loss": 2.0899815559387207, "Full-pretrain/Loss (Raw)": 2.2018094062805176, "Full-pretrain/Step": 649, "Full-pretrain/Step Time": 17.569373635575175} +{"Full-pretrain/Learning Rate": 4.9809201100139156e-05, "Full-pretrain/Loss": 2.088529109954834, "Full-pretrain/Loss (Raw)": 2.0095038414001465, "Full-pretrain/Step": 650, "Full-pretrain/Step Time": 17.565795274451375} +{"Full-pretrain/Learning Rate": 4.980815265921713e-05, "Full-pretrain/Loss": 2.0828442573547363, "Full-pretrain/Loss (Raw)": 1.9275341033935547, "Full-pretrain/Step": 651, "Full-pretrain/Step Time": 17.56713756918907} +{"Full-pretrain/Learning Rate": 4.9807101356683415e-05, "Full-pretrain/Loss": 2.0789413452148438, "Full-pretrain/Loss (Raw)": 2.050511360168457, "Full-pretrain/Step": 652, "Full-pretrain/Step Time": 17.567792857065797} +{"Full-pretrain/Learning Rate": 4.9806047192659276e-05, "Full-pretrain/Loss": 2.0880699157714844, "Full-pretrain/Loss (Raw)": 2.339611053466797, "Full-pretrain/Step": 653, "Full-pretrain/Step Time": 17.56511515378952} +{"Full-pretrain/Learning Rate": 4.980499016726632e-05, "Full-pretrain/Loss": 2.087348461151123, "Full-pretrain/Loss (Raw)": 2.1352412700653076, "Full-pretrain/Step": 654, "Full-pretrain/Step Time": 17.56547106988728} +{"Full-pretrain/Learning Rate": 4.9803930280626455e-05, "Full-pretrain/Loss": 2.081094741821289, "Full-pretrain/Loss (Raw)": 2.0065319538116455, "Full-pretrain/Step": 655, "Full-pretrain/Step Time": 17.5644972641021} +{"Full-pretrain/Learning Rate": 4.980286753286195e-05, "Full-pretrain/Loss": 2.0808563232421875, "Full-pretrain/Loss (Raw)": 2.0607454776763916, "Full-pretrain/Step": 656, "Full-pretrain/Step Time": 17.56806488521397} +{"Full-pretrain/Learning Rate": 4.980180192409539e-05, "Full-pretrain/Loss": 2.0849413871765137, "Full-pretrain/Loss (Raw)": 2.148073196411133, "Full-pretrain/Step": 657, "Full-pretrain/Step Time": 17.563284372910857} +{"Full-pretrain/Learning Rate": 4.98007334544497e-05, "Full-pretrain/Loss": 2.086002826690674, "Full-pretrain/Loss (Raw)": 2.1119093894958496, "Full-pretrain/Step": 658, "Full-pretrain/Step Time": 17.563214745372534} +{"Full-pretrain/Learning Rate": 4.979966212404811e-05, "Full-pretrain/Loss": 2.0922935009002686, "Full-pretrain/Loss (Raw)": 2.1911256313323975, "Full-pretrain/Step": 659, "Full-pretrain/Step Time": 17.562845155596733} +{"Full-pretrain/Learning Rate": 4.979858793301422e-05, "Full-pretrain/Loss": 2.094125270843506, "Full-pretrain/Loss (Raw)": 2.183727502822876, "Full-pretrain/Step": 660, "Full-pretrain/Step Time": 17.572020398452878} +{"Full-pretrain/Learning Rate": 4.979751088147192e-05, "Full-pretrain/Loss": 2.0878171920776367, "Full-pretrain/Loss (Raw)": 2.18584942817688, "Full-pretrain/Step": 661, "Full-pretrain/Step Time": 17.570370377972722} +{"Full-pretrain/Learning Rate": 4.979643096954546e-05, "Full-pretrain/Loss": 2.074695348739624, "Full-pretrain/Loss (Raw)": 1.8466554880142212, "Full-pretrain/Step": 662, "Full-pretrain/Step Time": 17.56399000622332} +{"Full-pretrain/Learning Rate": 4.97953481973594e-05, "Full-pretrain/Loss": 2.0817055702209473, "Full-pretrain/Loss (Raw)": 2.1626763343811035, "Full-pretrain/Step": 663, "Full-pretrain/Step Time": 17.56896019540727} +{"Full-pretrain/Learning Rate": 4.979426256503864e-05, "Full-pretrain/Loss": 2.0847811698913574, "Full-pretrain/Loss (Raw)": 2.1047892570495605, "Full-pretrain/Step": 664, "Full-pretrain/Step Time": 17.571388142183423} +{"Full-pretrain/Learning Rate": 4.9793174072708405e-05, "Full-pretrain/Loss": 2.0836215019226074, "Full-pretrain/Loss (Raw)": 2.0147275924682617, "Full-pretrain/Step": 665, "Full-pretrain/Step Time": 17.576303901150823} +{"Full-pretrain/Learning Rate": 4.979208272049425e-05, "Full-pretrain/Loss": 2.09501576423645, "Full-pretrain/Loss (Raw)": 2.42863392829895, "Full-pretrain/Step": 666, "Full-pretrain/Step Time": 17.570264438167214} +{"Full-pretrain/Learning Rate": 4.9790988508522076e-05, "Full-pretrain/Loss": 2.0947508811950684, "Full-pretrain/Loss (Raw)": 2.333115577697754, "Full-pretrain/Step": 667, "Full-pretrain/Step Time": 17.570610858500004} +{"Full-pretrain/Learning Rate": 4.978989143691808e-05, "Full-pretrain/Loss": 2.1008412837982178, "Full-pretrain/Loss (Raw)": 2.1845521926879883, "Full-pretrain/Step": 668, "Full-pretrain/Step Time": 17.57260313630104} +{"Full-pretrain/Learning Rate": 4.978879150580882e-05, "Full-pretrain/Loss": 2.0996012687683105, "Full-pretrain/Loss (Raw)": 2.20090389251709, "Full-pretrain/Step": 669, "Full-pretrain/Step Time": 17.57410667091608} +{"Full-pretrain/Learning Rate": 4.978768871532118e-05, "Full-pretrain/Loss": 2.1010098457336426, "Full-pretrain/Loss (Raw)": 2.0824673175811768, "Full-pretrain/Step": 670, "Full-pretrain/Step Time": 17.569218819960952} +{"Full-pretrain/Learning Rate": 4.978658306558235e-05, "Full-pretrain/Loss": 2.1087098121643066, "Full-pretrain/Loss (Raw)": 2.2006406784057617, "Full-pretrain/Step": 671, "Full-pretrain/Step Time": 17.56857111863792} +{"Full-pretrain/Learning Rate": 4.978547455671987e-05, "Full-pretrain/Loss": 2.1086039543151855, "Full-pretrain/Loss (Raw)": 2.0936174392700195, "Full-pretrain/Step": 672, "Full-pretrain/Step Time": 17.566910035908222} +{"Full-pretrain/Learning Rate": 4.978436318886162e-05, "Full-pretrain/Loss": 2.10260272026062, "Full-pretrain/Loss (Raw)": 2.009016513824463, "Full-pretrain/Step": 673, "Full-pretrain/Step Time": 17.5731765832752} +{"Full-pretrain/Learning Rate": 4.978324896213577e-05, "Full-pretrain/Loss": 2.11572527885437, "Full-pretrain/Loss (Raw)": 2.325911045074463, "Full-pretrain/Step": 674, "Full-pretrain/Step Time": 17.56590940244496} +{"Full-pretrain/Learning Rate": 4.978213187667088e-05, "Full-pretrain/Loss": 2.119809865951538, "Full-pretrain/Loss (Raw)": 2.0897161960601807, "Full-pretrain/Step": 675, "Full-pretrain/Step Time": 17.5641627330333} +{"Full-pretrain/Learning Rate": 4.978101193259578e-05, "Full-pretrain/Loss": 2.1399893760681152, "Full-pretrain/Loss (Raw)": 2.3817267417907715, "Full-pretrain/Step": 676, "Full-pretrain/Step Time": 17.567120047286153} +{"Full-pretrain/Learning Rate": 4.977988913003967e-05, "Full-pretrain/Loss": 2.1336164474487305, "Full-pretrain/Loss (Raw)": 1.9090580940246582, "Full-pretrain/Step": 677, "Full-pretrain/Step Time": 17.56937346421182} +{"Full-pretrain/Learning Rate": 4.977876346913204e-05, "Full-pretrain/Loss": 2.122990131378174, "Full-pretrain/Loss (Raw)": 1.9143824577331543, "Full-pretrain/Step": 678, "Full-pretrain/Step Time": 17.561898536980152} +{"Full-pretrain/Learning Rate": 4.977763495000276e-05, "Full-pretrain/Loss": 2.123023509979248, "Full-pretrain/Loss (Raw)": 2.009460926055908, "Full-pretrain/Step": 679, "Full-pretrain/Step Time": 17.560521099716425} +{"Full-pretrain/Learning Rate": 4.9776503572782e-05, "Full-pretrain/Loss": 2.121901035308838, "Full-pretrain/Loss (Raw)": 2.056603193283081, "Full-pretrain/Step": 680, "Full-pretrain/Step Time": 17.56663996167481} +{"Full-pretrain/Learning Rate": 4.9775369337600255e-05, "Full-pretrain/Loss": 2.117788553237915, "Full-pretrain/Loss (Raw)": 2.070214033126831, "Full-pretrain/Step": 681, "Full-pretrain/Step Time": 17.57026121020317} +{"Full-pretrain/Learning Rate": 4.977423224458837e-05, "Full-pretrain/Loss": 2.11767840385437, "Full-pretrain/Loss (Raw)": 2.0059762001037598, "Full-pretrain/Step": 682, "Full-pretrain/Step Time": 17.56454803980887} +{"Full-pretrain/Learning Rate": 4.9773092293877496e-05, "Full-pretrain/Loss": 2.124103546142578, "Full-pretrain/Loss (Raw)": 2.133140802383423, "Full-pretrain/Step": 683, "Full-pretrain/Step Time": 17.564093368127942} +{"Full-pretrain/Learning Rate": 4.9771949485599134e-05, "Full-pretrain/Loss": 2.127857208251953, "Full-pretrain/Loss (Raw)": 2.170628070831299, "Full-pretrain/Step": 684, "Full-pretrain/Step Time": 17.568373434245586} +{"Full-pretrain/Learning Rate": 4.9770803819885104e-05, "Full-pretrain/Loss": 2.1231837272644043, "Full-pretrain/Loss (Raw)": 2.1900529861450195, "Full-pretrain/Step": 685, "Full-pretrain/Step Time": 17.57478612102568} +{"Full-pretrain/Learning Rate": 4.9769655296867554e-05, "Full-pretrain/Loss": 2.1190237998962402, "Full-pretrain/Loss (Raw)": 2.00213623046875, "Full-pretrain/Step": 686, "Full-pretrain/Step Time": 17.569156168028712} +{"Full-pretrain/Learning Rate": 4.9768503916678976e-05, "Full-pretrain/Loss": 2.1250994205474854, "Full-pretrain/Loss (Raw)": 2.200946807861328, "Full-pretrain/Step": 687, "Full-pretrain/Step Time": 17.571897817775607} +{"Full-pretrain/Learning Rate": 4.976734967945217e-05, "Full-pretrain/Loss": 2.128840446472168, "Full-pretrain/Loss (Raw)": 2.1804561614990234, "Full-pretrain/Step": 688, "Full-pretrain/Step Time": 17.575127843767405} +{"Full-pretrain/Learning Rate": 4.976619258532029e-05, "Full-pretrain/Loss": 2.118149757385254, "Full-pretrain/Loss (Raw)": 1.8059678077697754, "Full-pretrain/Step": 689, "Full-pretrain/Step Time": 17.582763521000743} +{"Full-pretrain/Learning Rate": 4.976503263441679e-05, "Full-pretrain/Loss": 2.1184041500091553, "Full-pretrain/Loss (Raw)": 2.1200599670410156, "Full-pretrain/Step": 690, "Full-pretrain/Step Time": 17.57560008391738} +{"Full-pretrain/Learning Rate": 4.976386982687549e-05, "Full-pretrain/Loss": 2.1085033416748047, "Full-pretrain/Loss (Raw)": 1.8742947578430176, "Full-pretrain/Step": 691, "Full-pretrain/Step Time": 17.57501263730228} +{"Full-pretrain/Learning Rate": 4.97627041628305e-05, "Full-pretrain/Loss": 2.1004648208618164, "Full-pretrain/Loss (Raw)": 1.9265007972717285, "Full-pretrain/Step": 692, "Full-pretrain/Step Time": 17.572509925812483} +{"Full-pretrain/Learning Rate": 4.976153564241628e-05, "Full-pretrain/Loss": 2.100775718688965, "Full-pretrain/Loss (Raw)": 2.1957898139953613, "Full-pretrain/Step": 693, "Full-pretrain/Step Time": 17.575426004827023} +{"Full-pretrain/Learning Rate": 4.976036426576763e-05, "Full-pretrain/Loss": 2.1094422340393066, "Full-pretrain/Loss (Raw)": 2.1239893436431885, "Full-pretrain/Step": 694, "Full-pretrain/Step Time": 17.574232060462236} +{"Full-pretrain/Learning Rate": 4.975919003301968e-05, "Full-pretrain/Loss": 2.1076462268829346, "Full-pretrain/Loss (Raw)": 2.105203866958618, "Full-pretrain/Step": 695, "Full-pretrain/Step Time": 17.569224312901497} +{"Full-pretrain/Learning Rate": 4.9758012944307844e-05, "Full-pretrain/Loss": 2.1034698486328125, "Full-pretrain/Loss (Raw)": 1.9711437225341797, "Full-pretrain/Step": 696, "Full-pretrain/Step Time": 17.561263754963875} +{"Full-pretrain/Learning Rate": 4.9756832999767914e-05, "Full-pretrain/Loss": 2.104072093963623, "Full-pretrain/Loss (Raw)": 2.034001350402832, "Full-pretrain/Step": 697, "Full-pretrain/Step Time": 17.565299348905683} +{"Full-pretrain/Learning Rate": 4.975565019953601e-05, "Full-pretrain/Loss": 2.0850980281829834, "Full-pretrain/Loss (Raw)": 1.8214589357376099, "Full-pretrain/Step": 698, "Full-pretrain/Step Time": 17.572459680959582} +{"Full-pretrain/Learning Rate": 4.9754464543748546e-05, "Full-pretrain/Loss": 2.079193115234375, "Full-pretrain/Loss (Raw)": 2.1441640853881836, "Full-pretrain/Step": 699, "Full-pretrain/Step Time": 17.566752571612597} +{"Full-pretrain/Learning Rate": 4.975327603254229e-05, "Full-pretrain/Loss": 2.0742130279541016, "Full-pretrain/Loss (Raw)": 2.0251834392547607, "Full-pretrain/Step": 700, "Full-pretrain/Step Time": 17.56856078468263} +{"Full-pretrain/Learning Rate": 4.9752084666054353e-05, "Full-pretrain/Loss": 2.0705466270446777, "Full-pretrain/Loss (Raw)": 2.0835824012756348, "Full-pretrain/Step": 701, "Full-pretrain/Step Time": 17.57090776786208} +{"Full-pretrain/Learning Rate": 4.975089044442215e-05, "Full-pretrain/Loss": 2.0760393142700195, "Full-pretrain/Loss (Raw)": 2.2582364082336426, "Full-pretrain/Step": 702, "Full-pretrain/Step Time": 17.568885823711753} +{"Full-pretrain/Learning Rate": 4.974969336778343e-05, "Full-pretrain/Loss": 2.0747036933898926, "Full-pretrain/Loss (Raw)": 2.157902240753174, "Full-pretrain/Step": 703, "Full-pretrain/Step Time": 17.568962020799518} +{"Full-pretrain/Learning Rate": 4.974849343627628e-05, "Full-pretrain/Loss": 2.0734946727752686, "Full-pretrain/Loss (Raw)": 2.0549230575561523, "Full-pretrain/Step": 704, "Full-pretrain/Step Time": 17.561202585697174} +{"Full-pretrain/Learning Rate": 4.97472906500391e-05, "Full-pretrain/Loss": 2.083508014678955, "Full-pretrain/Loss (Raw)": 2.3294410705566406, "Full-pretrain/Step": 705, "Full-pretrain/Step Time": 17.56777873635292} +{"Full-pretrain/Learning Rate": 4.974608500921064e-05, "Full-pretrain/Loss": 2.072775363922119, "Full-pretrain/Loss (Raw)": 1.9824672937393188, "Full-pretrain/Step": 706, "Full-pretrain/Step Time": 17.580548299476504} +{"Full-pretrain/Learning Rate": 4.974487651392998e-05, "Full-pretrain/Loss": 2.070427894592285, "Full-pretrain/Loss (Raw)": 2.014594316482544, "Full-pretrain/Step": 707, "Full-pretrain/Step Time": 17.579287929460406} +{"Full-pretrain/Learning Rate": 4.974366516433651e-05, "Full-pretrain/Loss": 2.0644049644470215, "Full-pretrain/Loss (Raw)": 2.188993453979492, "Full-pretrain/Step": 708, "Full-pretrain/Step Time": 17.575049825012684} +{"Full-pretrain/Learning Rate": 4.974245096056995e-05, "Full-pretrain/Loss": 2.068283796310425, "Full-pretrain/Loss (Raw)": 2.033186435699463, "Full-pretrain/Step": 709, "Full-pretrain/Step Time": 17.573086459189653} +{"Full-pretrain/Learning Rate": 4.974123390277038e-05, "Full-pretrain/Loss": 2.070725917816162, "Full-pretrain/Loss (Raw)": 1.9925322532653809, "Full-pretrain/Step": 710, "Full-pretrain/Step Time": 17.577944986522198} +{"Full-pretrain/Learning Rate": 4.974001399107816e-05, "Full-pretrain/Loss": 2.076115608215332, "Full-pretrain/Loss (Raw)": 2.181929111480713, "Full-pretrain/Step": 711, "Full-pretrain/Step Time": 17.573064886033535} +{"Full-pretrain/Learning Rate": 4.9738791225634027e-05, "Full-pretrain/Loss": 2.079766273498535, "Full-pretrain/Loss (Raw)": 2.1734180450439453, "Full-pretrain/Step": 712, "Full-pretrain/Step Time": 17.575777938589454} +{"Full-pretrain/Learning Rate": 4.973756560657902e-05, "Full-pretrain/Loss": 2.081862688064575, "Full-pretrain/Loss (Raw)": 2.1373019218444824, "Full-pretrain/Step": 713, "Full-pretrain/Step Time": 17.576712584123015} +{"Full-pretrain/Learning Rate": 4.973633713405451e-05, "Full-pretrain/Loss": 2.1100525856018066, "Full-pretrain/Loss (Raw)": 2.908053159713745, "Full-pretrain/Step": 714, "Full-pretrain/Step Time": 17.572596622630954} +{"Full-pretrain/Learning Rate": 4.973510580820221e-05, "Full-pretrain/Loss": 2.114593029022217, "Full-pretrain/Loss (Raw)": 2.278440475463867, "Full-pretrain/Step": 715, "Full-pretrain/Step Time": 17.572054903954268} +{"Full-pretrain/Learning Rate": 4.973387162916415e-05, "Full-pretrain/Loss": 2.1152095794677734, "Full-pretrain/Loss (Raw)": 2.190359115600586, "Full-pretrain/Step": 716, "Full-pretrain/Step Time": 17.56558771803975} +{"Full-pretrain/Learning Rate": 4.9732634597082685e-05, "Full-pretrain/Loss": 2.107348918914795, "Full-pretrain/Loss (Raw)": 1.9385052919387817, "Full-pretrain/Step": 717, "Full-pretrain/Step Time": 17.57135411351919} +{"Full-pretrain/Learning Rate": 4.973139471210051e-05, "Full-pretrain/Loss": 2.113419532775879, "Full-pretrain/Loss (Raw)": 2.196394681930542, "Full-pretrain/Step": 718, "Full-pretrain/Step Time": 17.57510270178318} +{"Full-pretrain/Learning Rate": 4.973015197436064e-05, "Full-pretrain/Loss": 2.1060614585876465, "Full-pretrain/Loss (Raw)": 1.965498447418213, "Full-pretrain/Step": 719, "Full-pretrain/Step Time": 17.569849202409387} +{"Full-pretrain/Learning Rate": 4.972890638400644e-05, "Full-pretrain/Loss": 2.1073153018951416, "Full-pretrain/Loss (Raw)": 2.2205748558044434, "Full-pretrain/Step": 720, "Full-pretrain/Step Time": 17.571526816114783} +{"Full-pretrain/Learning Rate": 4.972765794118158e-05, "Full-pretrain/Loss": 2.118196487426758, "Full-pretrain/Loss (Raw)": 2.154169797897339, "Full-pretrain/Step": 721, "Full-pretrain/Step Time": 17.568761399015784} +{"Full-pretrain/Learning Rate": 4.972640664603006e-05, "Full-pretrain/Loss": 2.1224734783172607, "Full-pretrain/Loss (Raw)": 2.2569174766540527, "Full-pretrain/Step": 722, "Full-pretrain/Step Time": 17.57177109271288} +{"Full-pretrain/Learning Rate": 4.972515249869622e-05, "Full-pretrain/Loss": 2.1302762031555176, "Full-pretrain/Loss (Raw)": 2.12397837638855, "Full-pretrain/Step": 723, "Full-pretrain/Step Time": 17.57033321261406} +{"Full-pretrain/Learning Rate": 4.972389549932474e-05, "Full-pretrain/Loss": 2.1334588527679443, "Full-pretrain/Loss (Raw)": 2.0283455848693848, "Full-pretrain/Step": 724, "Full-pretrain/Step Time": 17.566619500517845} +{"Full-pretrain/Learning Rate": 4.97226356480606e-05, "Full-pretrain/Loss": 2.127530097961426, "Full-pretrain/Loss (Raw)": 2.0060744285583496, "Full-pretrain/Step": 725, "Full-pretrain/Step Time": 17.57061142846942} +{"Full-pretrain/Learning Rate": 4.972137294504912e-05, "Full-pretrain/Loss": 2.130218029022217, "Full-pretrain/Loss (Raw)": 2.2100019454956055, "Full-pretrain/Step": 726, "Full-pretrain/Step Time": 17.566069655120373} +{"Full-pretrain/Learning Rate": 4.972010739043596e-05, "Full-pretrain/Loss": 2.1315858364105225, "Full-pretrain/Loss (Raw)": 2.1489720344543457, "Full-pretrain/Step": 727, "Full-pretrain/Step Time": 17.569319682195783} +{"Full-pretrain/Learning Rate": 4.97188389843671e-05, "Full-pretrain/Loss": 2.1348228454589844, "Full-pretrain/Loss (Raw)": 2.074730157852173, "Full-pretrain/Step": 728, "Full-pretrain/Step Time": 17.562535014003515} +{"Full-pretrain/Learning Rate": 4.971756772698886e-05, "Full-pretrain/Loss": 2.1348841190338135, "Full-pretrain/Loss (Raw)": 2.0359606742858887, "Full-pretrain/Step": 729, "Full-pretrain/Step Time": 17.561440594494343} +{"Full-pretrain/Learning Rate": 4.971629361844785e-05, "Full-pretrain/Loss": 2.1360068321228027, "Full-pretrain/Loss (Raw)": 1.857380986213684, "Full-pretrain/Step": 730, "Full-pretrain/Step Time": 17.5655988547951} +{"Full-pretrain/Learning Rate": 4.9715016658891064e-05, "Full-pretrain/Loss": 2.1349868774414062, "Full-pretrain/Loss (Raw)": 2.111527919769287, "Full-pretrain/Step": 731, "Full-pretrain/Step Time": 17.569496346637607} +{"Full-pretrain/Learning Rate": 4.97137368484658e-05, "Full-pretrain/Loss": 2.1358203887939453, "Full-pretrain/Loss (Raw)": 2.0518555641174316, "Full-pretrain/Step": 732, "Full-pretrain/Step Time": 17.56502583809197} +{"Full-pretrain/Learning Rate": 4.9712454187319666e-05, "Full-pretrain/Loss": 2.131721019744873, "Full-pretrain/Loss (Raw)": 1.9524073600769043, "Full-pretrain/Step": 733, "Full-pretrain/Step Time": 17.56324947066605} +{"Full-pretrain/Learning Rate": 4.971116867560064e-05, "Full-pretrain/Loss": 2.132742166519165, "Full-pretrain/Loss (Raw)": 2.2909140586853027, "Full-pretrain/Step": 734, "Full-pretrain/Step Time": 17.56730506569147} +{"Full-pretrain/Learning Rate": 4.970988031345698e-05, "Full-pretrain/Loss": 2.1349334716796875, "Full-pretrain/Loss (Raw)": 2.2280232906341553, "Full-pretrain/Step": 735, "Full-pretrain/Step Time": 17.569761304184794} +{"Full-pretrain/Learning Rate": 4.9708589101037306e-05, "Full-pretrain/Loss": 2.1386592388153076, "Full-pretrain/Loss (Raw)": 2.1741466522216797, "Full-pretrain/Step": 736, "Full-pretrain/Step Time": 17.57541644014418} +{"Full-pretrain/Learning Rate": 4.970729503849058e-05, "Full-pretrain/Loss": 2.1337361335754395, "Full-pretrain/Loss (Raw)": 2.1718976497650146, "Full-pretrain/Step": 737, "Full-pretrain/Step Time": 17.56532609462738} +{"Full-pretrain/Learning Rate": 4.970599812596603e-05, "Full-pretrain/Loss": 2.1323275566101074, "Full-pretrain/Loss (Raw)": 1.937395453453064, "Full-pretrain/Step": 738, "Full-pretrain/Step Time": 17.567450350150466} +{"Full-pretrain/Learning Rate": 4.9704698363613294e-05, "Full-pretrain/Loss": 2.1326088905334473, "Full-pretrain/Loss (Raw)": 2.02359938621521, "Full-pretrain/Step": 739, "Full-pretrain/Step Time": 17.57239027507603} +{"Full-pretrain/Learning Rate": 4.9703395751582284e-05, "Full-pretrain/Loss": 2.1269588470458984, "Full-pretrain/Loss (Raw)": 2.008195400238037, "Full-pretrain/Step": 740, "Full-pretrain/Step Time": 17.569001369178295} +{"Full-pretrain/Learning Rate": 4.9702090290023253e-05, "Full-pretrain/Loss": 2.128260850906372, "Full-pretrain/Loss (Raw)": 2.074845314025879, "Full-pretrain/Step": 741, "Full-pretrain/Step Time": 17.561831638216972} +{"Full-pretrain/Learning Rate": 4.970078197908678e-05, "Full-pretrain/Loss": 2.1277782917022705, "Full-pretrain/Loss (Raw)": 1.9770870208740234, "Full-pretrain/Step": 742, "Full-pretrain/Step Time": 17.56920030526817} +{"Full-pretrain/Learning Rate": 4.969947081892379e-05, "Full-pretrain/Loss": 2.12705135345459, "Full-pretrain/Loss (Raw)": 2.1586713790893555, "Full-pretrain/Step": 743, "Full-pretrain/Step Time": 17.568027200177312} +{"Full-pretrain/Learning Rate": 4.969815680968553e-05, "Full-pretrain/Loss": 2.121859312057495, "Full-pretrain/Loss (Raw)": 2.007272958755493, "Full-pretrain/Step": 744, "Full-pretrain/Step Time": 17.565993323922157} +{"Full-pretrain/Learning Rate": 4.969683995152356e-05, "Full-pretrain/Loss": 2.121407985687256, "Full-pretrain/Loss (Raw)": 2.122863531112671, "Full-pretrain/Step": 745, "Full-pretrain/Step Time": 17.564663380384445} +{"Full-pretrain/Learning Rate": 4.969552024458977e-05, "Full-pretrain/Loss": 2.098323345184326, "Full-pretrain/Loss (Raw)": 2.169341564178467, "Full-pretrain/Step": 746, "Full-pretrain/Step Time": 17.565253026783466} +{"Full-pretrain/Learning Rate": 4.96941976890364e-05, "Full-pretrain/Loss": 2.09092116355896, "Full-pretrain/Loss (Raw)": 2.041567802429199, "Full-pretrain/Step": 747, "Full-pretrain/Step Time": 17.563322143629193} +{"Full-pretrain/Learning Rate": 4.969287228501601e-05, "Full-pretrain/Loss": 2.085367202758789, "Full-pretrain/Loss (Raw)": 2.0126357078552246, "Full-pretrain/Step": 748, "Full-pretrain/Step Time": 17.5645460691303} +{"Full-pretrain/Learning Rate": 4.969154403268148e-05, "Full-pretrain/Loss": 2.0903844833374023, "Full-pretrain/Loss (Raw)": 2.099055290222168, "Full-pretrain/Step": 749, "Full-pretrain/Step Time": 17.56112914904952} +{"Full-pretrain/Learning Rate": 4.969021293218602e-05, "Full-pretrain/Loss": 2.0979819297790527, "Full-pretrain/Loss (Raw)": 2.439513921737671, "Full-pretrain/Step": 750, "Full-pretrain/Step Time": 17.558759296312928} +{"Full-pretrain/Learning Rate": 4.968887898368318e-05, "Full-pretrain/Loss": 2.100862741470337, "Full-pretrain/Loss (Raw)": 2.057684898376465, "Full-pretrain/Step": 751, "Full-pretrain/Step Time": 17.56696437112987} +{"Full-pretrain/Learning Rate": 4.968754218732682e-05, "Full-pretrain/Loss": 2.097088575363159, "Full-pretrain/Loss (Raw)": 2.099797010421753, "Full-pretrain/Step": 752, "Full-pretrain/Step Time": 17.567727530375123} +{"Full-pretrain/Learning Rate": 4.968620254327115e-05, "Full-pretrain/Loss": 2.0969643592834473, "Full-pretrain/Loss (Raw)": 2.150198221206665, "Full-pretrain/Step": 753, "Full-pretrain/Step Time": 17.571806797757745} +{"Full-pretrain/Learning Rate": 4.968486005167069e-05, "Full-pretrain/Loss": 2.0881197452545166, "Full-pretrain/Loss (Raw)": 1.9738857746124268, "Full-pretrain/Step": 754, "Full-pretrain/Step Time": 17.568542882800102} +{"Full-pretrain/Learning Rate": 4.968351471268029e-05, "Full-pretrain/Loss": 2.0867490768432617, "Full-pretrain/Loss (Raw)": 2.0801191329956055, "Full-pretrain/Step": 755, "Full-pretrain/Step Time": 17.57551241479814} +{"Full-pretrain/Learning Rate": 4.968216652645515e-05, "Full-pretrain/Loss": 2.0869851112365723, "Full-pretrain/Loss (Raw)": 2.035900831222534, "Full-pretrain/Step": 756, "Full-pretrain/Step Time": 17.572739774361253} +{"Full-pretrain/Learning Rate": 4.9680815493150776e-05, "Full-pretrain/Loss": 2.091834306716919, "Full-pretrain/Loss (Raw)": 2.161247491836548, "Full-pretrain/Step": 757, "Full-pretrain/Step Time": 17.5720454454422} +{"Full-pretrain/Learning Rate": 4.9679461612923006e-05, "Full-pretrain/Loss": 2.0882818698883057, "Full-pretrain/Loss (Raw)": 2.096322774887085, "Full-pretrain/Step": 758, "Full-pretrain/Step Time": 17.566826509311795} +{"Full-pretrain/Learning Rate": 4.9678104885928015e-05, "Full-pretrain/Loss": 2.092360734939575, "Full-pretrain/Loss (Raw)": 2.2795000076293945, "Full-pretrain/Step": 759, "Full-pretrain/Step Time": 17.56985325552523} +{"Full-pretrain/Learning Rate": 4.967674531232229e-05, "Full-pretrain/Loss": 2.0953822135925293, "Full-pretrain/Loss (Raw)": 2.1714224815368652, "Full-pretrain/Step": 760, "Full-pretrain/Step Time": 17.57123572193086} +{"Full-pretrain/Learning Rate": 4.967538289226267e-05, "Full-pretrain/Loss": 2.0976927280426025, "Full-pretrain/Loss (Raw)": 2.109889507293701, "Full-pretrain/Step": 761, "Full-pretrain/Step Time": 17.571248941123486} +{"Full-pretrain/Learning Rate": 4.967401762590631e-05, "Full-pretrain/Loss": 2.104966402053833, "Full-pretrain/Loss (Raw)": 2.0901412963867188, "Full-pretrain/Step": 762, "Full-pretrain/Step Time": 17.56832299940288} +{"Full-pretrain/Learning Rate": 4.967264951341069e-05, "Full-pretrain/Loss": 2.105590343475342, "Full-pretrain/Loss (Raw)": 2.131495952606201, "Full-pretrain/Step": 763, "Full-pretrain/Step Time": 17.567654699087143} +{"Full-pretrain/Learning Rate": 4.96712785549336e-05, "Full-pretrain/Loss": 2.109318256378174, "Full-pretrain/Loss (Raw)": 2.171140193939209, "Full-pretrain/Step": 764, "Full-pretrain/Step Time": 17.57419630140066} +{"Full-pretrain/Learning Rate": 4.966990475063321e-05, "Full-pretrain/Loss": 2.10685396194458, "Full-pretrain/Loss (Raw)": 1.8735578060150146, "Full-pretrain/Step": 765, "Full-pretrain/Step Time": 17.571048259735107} +{"Full-pretrain/Learning Rate": 4.9668528100667986e-05, "Full-pretrain/Loss": 2.100412607192993, "Full-pretrain/Loss (Raw)": 2.084787607192993, "Full-pretrain/Step": 766, "Full-pretrain/Step Time": 17.571195475757122} +{"Full-pretrain/Learning Rate": 4.96671486051967e-05, "Full-pretrain/Loss": 2.098778247833252, "Full-pretrain/Loss (Raw)": 2.1757194995880127, "Full-pretrain/Step": 767, "Full-pretrain/Step Time": 17.573536179959774} +{"Full-pretrain/Learning Rate": 4.96657662643785e-05, "Full-pretrain/Loss": 2.0889856815338135, "Full-pretrain/Loss (Raw)": 1.8607866764068604, "Full-pretrain/Step": 768, "Full-pretrain/Step Time": 17.577756175771356} +{"Full-pretrain/Learning Rate": 4.966438107837283e-05, "Full-pretrain/Loss": 2.0905709266662598, "Full-pretrain/Loss (Raw)": 2.2226223945617676, "Full-pretrain/Step": 769, "Full-pretrain/Step Time": 17.577442215755582} +{"Full-pretrain/Learning Rate": 4.966299304733947e-05, "Full-pretrain/Loss": 2.0936837196350098, "Full-pretrain/Loss (Raw)": 2.0370073318481445, "Full-pretrain/Step": 770, "Full-pretrain/Step Time": 17.576457614079118} +{"Full-pretrain/Learning Rate": 4.9661602171438524e-05, "Full-pretrain/Loss": 2.098156452178955, "Full-pretrain/Loss (Raw)": 2.1667275428771973, "Full-pretrain/Step": 771, "Full-pretrain/Step Time": 17.59027822688222} +{"Full-pretrain/Learning Rate": 4.966020845083044e-05, "Full-pretrain/Loss": 2.0965960025787354, "Full-pretrain/Loss (Raw)": 1.9582641124725342, "Full-pretrain/Step": 772, "Full-pretrain/Step Time": 17.588642109185457} +{"Full-pretrain/Learning Rate": 4.965881188567597e-05, "Full-pretrain/Loss": 2.092820644378662, "Full-pretrain/Loss (Raw)": 1.9540282487869263, "Full-pretrain/Step": 773, "Full-pretrain/Step Time": 17.58924785628915} +{"Full-pretrain/Learning Rate": 4.965741247613622e-05, "Full-pretrain/Loss": 2.0944771766662598, "Full-pretrain/Loss (Raw)": 2.030104398727417, "Full-pretrain/Step": 774, "Full-pretrain/Step Time": 17.588471353054047} +{"Full-pretrain/Learning Rate": 4.9656010222372604e-05, "Full-pretrain/Loss": 2.092094659805298, "Full-pretrain/Loss (Raw)": 2.082425594329834, "Full-pretrain/Step": 775, "Full-pretrain/Step Time": 17.590110393241048} +{"Full-pretrain/Learning Rate": 4.965460512454687e-05, "Full-pretrain/Loss": 2.0965256690979004, "Full-pretrain/Loss (Raw)": 2.14906907081604, "Full-pretrain/Step": 776, "Full-pretrain/Step Time": 17.58760883845389} +{"Full-pretrain/Learning Rate": 4.965319718282111e-05, "Full-pretrain/Loss": 2.0915236473083496, "Full-pretrain/Loss (Raw)": 1.962799310684204, "Full-pretrain/Step": 777, "Full-pretrain/Step Time": 17.58182419091463} +{"Full-pretrain/Learning Rate": 4.965178639735771e-05, "Full-pretrain/Loss": 2.08302640914917, "Full-pretrain/Loss (Raw)": 1.8974347114562988, "Full-pretrain/Step": 778, "Full-pretrain/Step Time": 17.58321669511497} +{"Full-pretrain/Learning Rate": 4.965037276831942e-05, "Full-pretrain/Loss": 2.098684787750244, "Full-pretrain/Loss (Raw)": 2.542623519897461, "Full-pretrain/Step": 779, "Full-pretrain/Step Time": 17.581912657245994} +{"Full-pretrain/Learning Rate": 4.9648956295869284e-05, "Full-pretrain/Loss": 2.095855474472046, "Full-pretrain/Loss (Raw)": 1.9221041202545166, "Full-pretrain/Step": 780, "Full-pretrain/Step Time": 17.579689839854836} +{"Full-pretrain/Learning Rate": 4.9647536980170704e-05, "Full-pretrain/Loss": 2.0976243019104004, "Full-pretrain/Loss (Raw)": 2.155651330947876, "Full-pretrain/Step": 781, "Full-pretrain/Step Time": 17.582814157009125} +{"Full-pretrain/Learning Rate": 4.96461148213874e-05, "Full-pretrain/Loss": 2.084214687347412, "Full-pretrain/Loss (Raw)": 2.0104143619537354, "Full-pretrain/Step": 782, "Full-pretrain/Step Time": 17.581094475463033} +{"Full-pretrain/Learning Rate": 4.964468981968341e-05, "Full-pretrain/Loss": 2.090031862258911, "Full-pretrain/Loss (Raw)": 2.2438278198242188, "Full-pretrain/Step": 783, "Full-pretrain/Step Time": 17.575703153386712} +{"Full-pretrain/Learning Rate": 4.964326197522311e-05, "Full-pretrain/Loss": 2.09238862991333, "Full-pretrain/Loss (Raw)": 2.1752190589904785, "Full-pretrain/Step": 784, "Full-pretrain/Step Time": 17.57935498468578} +{"Full-pretrain/Learning Rate": 4.96418312881712e-05, "Full-pretrain/Loss": 2.08998441696167, "Full-pretrain/Loss (Raw)": 2.073256015777588, "Full-pretrain/Step": 785, "Full-pretrain/Step Time": 17.582595394924283} +{"Full-pretrain/Learning Rate": 4.9640397758692715e-05, "Full-pretrain/Loss": 2.096902370452881, "Full-pretrain/Loss (Raw)": 2.1952624320983887, "Full-pretrain/Step": 786, "Full-pretrain/Step Time": 17.58106603100896} +{"Full-pretrain/Learning Rate": 4.9638961386953006e-05, "Full-pretrain/Loss": 2.0964062213897705, "Full-pretrain/Loss (Raw)": 2.0642476081848145, "Full-pretrain/Step": 787, "Full-pretrain/Step Time": 17.58148523978889} +{"Full-pretrain/Learning Rate": 4.963752217311775e-05, "Full-pretrain/Loss": 2.095898389816284, "Full-pretrain/Loss (Raw)": 2.019646406173706, "Full-pretrain/Step": 788, "Full-pretrain/Step Time": 17.572142904624343} +{"Full-pretrain/Learning Rate": 4.963608011735298e-05, "Full-pretrain/Loss": 2.0955095291137695, "Full-pretrain/Loss (Raw)": 2.1488089561462402, "Full-pretrain/Step": 789, "Full-pretrain/Step Time": 17.575249657034874} +{"Full-pretrain/Learning Rate": 4.963463521982503e-05, "Full-pretrain/Loss": 2.10532808303833, "Full-pretrain/Loss (Raw)": 2.4105074405670166, "Full-pretrain/Step": 790, "Full-pretrain/Step Time": 17.576213842257857} +{"Full-pretrain/Learning Rate": 4.963318748070056e-05, "Full-pretrain/Loss": 2.0975050926208496, "Full-pretrain/Loss (Raw)": 2.0291686058044434, "Full-pretrain/Step": 791, "Full-pretrain/Step Time": 17.569051971659064} +{"Full-pretrain/Learning Rate": 4.963173690014656e-05, "Full-pretrain/Loss": 2.094674587249756, "Full-pretrain/Loss (Raw)": 2.0808522701263428, "Full-pretrain/Step": 792, "Full-pretrain/Step Time": 17.570626061409712} +{"Full-pretrain/Learning Rate": 4.9630283478330386e-05, "Full-pretrain/Loss": 2.10261869430542, "Full-pretrain/Loss (Raw)": 2.3640942573547363, "Full-pretrain/Step": 793, "Full-pretrain/Step Time": 17.5707230232656} +{"Full-pretrain/Learning Rate": 4.962882721541966e-05, "Full-pretrain/Loss": 2.1094107627868652, "Full-pretrain/Loss (Raw)": 2.307490110397339, "Full-pretrain/Step": 794, "Full-pretrain/Step Time": 17.57605690136552} +{"Full-pretrain/Learning Rate": 4.9627368111582365e-05, "Full-pretrain/Loss": 2.1094818115234375, "Full-pretrain/Loss (Raw)": 2.1337718963623047, "Full-pretrain/Step": 795, "Full-pretrain/Step Time": 17.57497161999345} +{"Full-pretrain/Learning Rate": 4.962590616698681e-05, "Full-pretrain/Loss": 2.1051554679870605, "Full-pretrain/Loss (Raw)": 2.0326945781707764, "Full-pretrain/Step": 796, "Full-pretrain/Step Time": 17.578555876389146} +{"Full-pretrain/Learning Rate": 4.962444138180164e-05, "Full-pretrain/Loss": 2.1073098182678223, "Full-pretrain/Loss (Raw)": 1.9425021409988403, "Full-pretrain/Step": 797, "Full-pretrain/Step Time": 17.57693394087255} +{"Full-pretrain/Learning Rate": 4.962297375619581e-05, "Full-pretrain/Loss": 2.110429286956787, "Full-pretrain/Loss (Raw)": 2.18460750579834, "Full-pretrain/Step": 798, "Full-pretrain/Step Time": 17.581483963876963} +{"Full-pretrain/Learning Rate": 4.962150329033861e-05, "Full-pretrain/Loss": 2.107548475265503, "Full-pretrain/Loss (Raw)": 2.0835328102111816, "Full-pretrain/Step": 799, "Full-pretrain/Step Time": 17.57683178782463} +{"Full-pretrain/Learning Rate": 4.962002998439965e-05, "Full-pretrain/Loss": 2.1127517223358154, "Full-pretrain/Loss (Raw)": 2.0272903442382812, "Full-pretrain/Step": 800, "Full-pretrain/Step Time": 17.57083328254521} +{"Full-pretrain/Learning Rate": 4.961855383854889e-05, "Full-pretrain/Loss": 2.1085550785064697, "Full-pretrain/Loss (Raw)": 2.0883285999298096, "Full-pretrain/Step": 801, "Full-pretrain/Step Time": 17.570041611790657} +{"Full-pretrain/Learning Rate": 4.96170748529566e-05, "Full-pretrain/Loss": 2.1094770431518555, "Full-pretrain/Loss (Raw)": 2.06650972366333, "Full-pretrain/Step": 802, "Full-pretrain/Step Time": 17.572620978578925} +{"Full-pretrain/Learning Rate": 4.9615593027793374e-05, "Full-pretrain/Loss": 2.108454704284668, "Full-pretrain/Loss (Raw)": 2.1340062618255615, "Full-pretrain/Step": 803, "Full-pretrain/Step Time": 17.576003996655345} +{"Full-pretrain/Learning Rate": 4.9614108363230135e-05, "Full-pretrain/Loss": 2.1162853240966797, "Full-pretrain/Loss (Raw)": 2.2088475227355957, "Full-pretrain/Step": 804, "Full-pretrain/Step Time": 17.571771129965782} +{"Full-pretrain/Learning Rate": 4.961262085943815e-05, "Full-pretrain/Loss": 2.117979049682617, "Full-pretrain/Loss (Raw)": 2.0082340240478516, "Full-pretrain/Step": 805, "Full-pretrain/Step Time": 17.567757554352283} +{"Full-pretrain/Learning Rate": 4.961113051658901e-05, "Full-pretrain/Loss": 2.1164464950561523, "Full-pretrain/Loss (Raw)": 1.9810633659362793, "Full-pretrain/Step": 806, "Full-pretrain/Step Time": 17.575308356434107} +{"Full-pretrain/Learning Rate": 4.9609637334854596e-05, "Full-pretrain/Loss": 2.116952419281006, "Full-pretrain/Loss (Raw)": 2.0986061096191406, "Full-pretrain/Step": 807, "Full-pretrain/Step Time": 17.576457384973764} +{"Full-pretrain/Learning Rate": 4.9608141314407174e-05, "Full-pretrain/Loss": 2.112982749938965, "Full-pretrain/Loss (Raw)": 2.0220484733581543, "Full-pretrain/Step": 808, "Full-pretrain/Step Time": 17.57241695933044} +{"Full-pretrain/Learning Rate": 4.960664245541931e-05, "Full-pretrain/Loss": 2.108036518096924, "Full-pretrain/Loss (Raw)": 1.8045145273208618, "Full-pretrain/Step": 809, "Full-pretrain/Step Time": 17.57226115092635} +{"Full-pretrain/Learning Rate": 4.9605140758063866e-05, "Full-pretrain/Loss": 2.113992691040039, "Full-pretrain/Loss (Raw)": 2.08803391456604, "Full-pretrain/Step": 810, "Full-pretrain/Step Time": 17.574711924418807} +{"Full-pretrain/Learning Rate": 4.960363622251409e-05, "Full-pretrain/Loss": 2.096675395965576, "Full-pretrain/Loss (Raw)": 1.9884687662124634, "Full-pretrain/Step": 811, "Full-pretrain/Step Time": 17.574711930006742} +{"Full-pretrain/Learning Rate": 4.960212884894352e-05, "Full-pretrain/Loss": 2.1004862785339355, "Full-pretrain/Loss (Raw)": 2.0440542697906494, "Full-pretrain/Step": 812, "Full-pretrain/Step Time": 17.573719583451748} +{"Full-pretrain/Learning Rate": 4.960061863752604e-05, "Full-pretrain/Loss": 2.096703052520752, "Full-pretrain/Loss (Raw)": 2.0345892906188965, "Full-pretrain/Step": 813, "Full-pretrain/Step Time": 17.573475213721395} +{"Full-pretrain/Learning Rate": 4.9599105588435846e-05, "Full-pretrain/Loss": 2.097337245941162, "Full-pretrain/Loss (Raw)": 2.0307037830352783, "Full-pretrain/Step": 814, "Full-pretrain/Step Time": 17.57251249998808} +{"Full-pretrain/Learning Rate": 4.959758970184746e-05, "Full-pretrain/Loss": 2.099116563796997, "Full-pretrain/Loss (Raw)": 2.3007678985595703, "Full-pretrain/Step": 815, "Full-pretrain/Step Time": 17.56820104084909} +{"Full-pretrain/Learning Rate": 4.959607097793575e-05, "Full-pretrain/Loss": 2.096597909927368, "Full-pretrain/Loss (Raw)": 2.0946226119995117, "Full-pretrain/Step": 816, "Full-pretrain/Step Time": 17.565388683229685} +{"Full-pretrain/Learning Rate": 4.959454941687589e-05, "Full-pretrain/Loss": 2.101567268371582, "Full-pretrain/Loss (Raw)": 2.2322773933410645, "Full-pretrain/Step": 817, "Full-pretrain/Step Time": 17.561119182035327} +{"Full-pretrain/Learning Rate": 4.9593025018843406e-05, "Full-pretrain/Loss": 2.0927391052246094, "Full-pretrain/Loss (Raw)": 1.9127593040466309, "Full-pretrain/Step": 818, "Full-pretrain/Step Time": 17.556466998532414} +{"Full-pretrain/Learning Rate": 4.959149778401412e-05, "Full-pretrain/Loss": 2.088010311126709, "Full-pretrain/Loss (Raw)": 1.9129242897033691, "Full-pretrain/Step": 819, "Full-pretrain/Step Time": 17.559662571176887} +{"Full-pretrain/Learning Rate": 4.958996771256422e-05, "Full-pretrain/Loss": 2.0953662395477295, "Full-pretrain/Loss (Raw)": 2.2550411224365234, "Full-pretrain/Step": 820, "Full-pretrain/Step Time": 17.55969661846757} +{"Full-pretrain/Learning Rate": 4.9588434804670174e-05, "Full-pretrain/Loss": 2.0943987369537354, "Full-pretrain/Loss (Raw)": 2.1178464889526367, "Full-pretrain/Step": 821, "Full-pretrain/Step Time": 17.560254387557507} +{"Full-pretrain/Learning Rate": 4.958689906050882e-05, "Full-pretrain/Loss": 2.084726333618164, "Full-pretrain/Loss (Raw)": 2.100991725921631, "Full-pretrain/Step": 822, "Full-pretrain/Step Time": 17.560656243935227} +{"Full-pretrain/Learning Rate": 4.95853604802573e-05, "Full-pretrain/Loss": 2.08674955368042, "Full-pretrain/Loss (Raw)": 2.0939102172851562, "Full-pretrain/Step": 823, "Full-pretrain/Step Time": 17.55785639025271} +{"Full-pretrain/Learning Rate": 4.958381906409308e-05, "Full-pretrain/Loss": 2.0831639766693115, "Full-pretrain/Loss (Raw)": 1.9661153554916382, "Full-pretrain/Step": 824, "Full-pretrain/Step Time": 17.5708970669657} +{"Full-pretrain/Learning Rate": 4.9582274812193984e-05, "Full-pretrain/Loss": 2.0695669651031494, "Full-pretrain/Loss (Raw)": 1.928987979888916, "Full-pretrain/Step": 825, "Full-pretrain/Step Time": 17.56879311054945} +{"Full-pretrain/Learning Rate": 4.958072772473812e-05, "Full-pretrain/Loss": 2.0653223991394043, "Full-pretrain/Loss (Raw)": 2.171661615371704, "Full-pretrain/Step": 826, "Full-pretrain/Step Time": 17.566401122137904} +{"Full-pretrain/Learning Rate": 4.9579177801903945e-05, "Full-pretrain/Loss": 2.061042070388794, "Full-pretrain/Loss (Raw)": 1.996805191040039, "Full-pretrain/Step": 827, "Full-pretrain/Step Time": 17.570267517119646} +{"Full-pretrain/Learning Rate": 4.9577625043870255e-05, "Full-pretrain/Loss": 2.0631303787231445, "Full-pretrain/Loss (Raw)": 2.099515914916992, "Full-pretrain/Step": 828, "Full-pretrain/Step Time": 17.57254783809185} +{"Full-pretrain/Learning Rate": 4.957606945081615e-05, "Full-pretrain/Loss": 2.062819004058838, "Full-pretrain/Loss (Raw)": 1.9325426816940308, "Full-pretrain/Step": 829, "Full-pretrain/Step Time": 17.571034885942936} +{"Full-pretrain/Learning Rate": 4.957451102292108e-05, "Full-pretrain/Loss": 2.0556349754333496, "Full-pretrain/Loss (Raw)": 1.954717993736267, "Full-pretrain/Step": 830, "Full-pretrain/Step Time": 17.574414141476154} +{"Full-pretrain/Learning Rate": 4.9572949760364795e-05, "Full-pretrain/Loss": 2.0594916343688965, "Full-pretrain/Loss (Raw)": 2.20695161819458, "Full-pretrain/Step": 831, "Full-pretrain/Step Time": 17.574950305745006} +{"Full-pretrain/Learning Rate": 4.957138566332739e-05, "Full-pretrain/Loss": 2.0592989921569824, "Full-pretrain/Loss (Raw)": 2.0211167335510254, "Full-pretrain/Step": 832, "Full-pretrain/Step Time": 17.583845937624574} +{"Full-pretrain/Learning Rate": 4.956981873198928e-05, "Full-pretrain/Loss": 2.058959484100342, "Full-pretrain/Loss (Raw)": 2.0774688720703125, "Full-pretrain/Step": 833, "Full-pretrain/Step Time": 17.58101662993431} +{"Full-pretrain/Learning Rate": 4.956824896653122e-05, "Full-pretrain/Loss": 2.0560691356658936, "Full-pretrain/Loss (Raw)": 1.974016547203064, "Full-pretrain/Step": 834, "Full-pretrain/Step Time": 17.576292537152767} +{"Full-pretrain/Learning Rate": 4.956667636713427e-05, "Full-pretrain/Loss": 2.056811571121216, "Full-pretrain/Loss (Raw)": 2.157763957977295, "Full-pretrain/Step": 835, "Full-pretrain/Step Time": 17.582364559173584} +{"Full-pretrain/Learning Rate": 4.956510093397983e-05, "Full-pretrain/Loss": 2.0489063262939453, "Full-pretrain/Loss (Raw)": 1.9558831453323364, "Full-pretrain/Step": 836, "Full-pretrain/Step Time": 17.582688635215163} +{"Full-pretrain/Learning Rate": 4.956352266724964e-05, "Full-pretrain/Loss": 2.0531227588653564, "Full-pretrain/Loss (Raw)": 2.1431617736816406, "Full-pretrain/Step": 837, "Full-pretrain/Step Time": 17.58150820992887} +{"Full-pretrain/Learning Rate": 4.9561941567125736e-05, "Full-pretrain/Loss": 2.0661001205444336, "Full-pretrain/Loss (Raw)": 2.396336078643799, "Full-pretrain/Step": 838, "Full-pretrain/Step Time": 17.581120662391186} +{"Full-pretrain/Learning Rate": 4.956035763379051e-05, "Full-pretrain/Loss": 2.0672595500946045, "Full-pretrain/Loss (Raw)": 2.135707139968872, "Full-pretrain/Step": 839, "Full-pretrain/Step Time": 17.59177177399397} +{"Full-pretrain/Learning Rate": 4.955877086742666e-05, "Full-pretrain/Loss": 2.065767288208008, "Full-pretrain/Loss (Raw)": 1.9742883443832397, "Full-pretrain/Step": 840, "Full-pretrain/Step Time": 17.59441888704896} +{"Full-pretrain/Learning Rate": 4.9557181268217227e-05, "Full-pretrain/Loss": 2.0735416412353516, "Full-pretrain/Loss (Raw)": 2.053300619125366, "Full-pretrain/Step": 841, "Full-pretrain/Step Time": 17.596290485933423} +{"Full-pretrain/Learning Rate": 4.955558883634555e-05, "Full-pretrain/Loss": 2.0700955390930176, "Full-pretrain/Loss (Raw)": 1.9777600765228271, "Full-pretrain/Step": 842, "Full-pretrain/Step Time": 17.601006833836436} +{"Full-pretrain/Learning Rate": 4.955399357199534e-05, "Full-pretrain/Loss": 2.077916383743286, "Full-pretrain/Loss (Raw)": 2.238736629486084, "Full-pretrain/Step": 843, "Full-pretrain/Step Time": 17.59811480715871} +{"Full-pretrain/Learning Rate": 4.95523954753506e-05, "Full-pretrain/Loss": 2.0696961879730225, "Full-pretrain/Loss (Raw)": 1.7810025215148926, "Full-pretrain/Step": 844, "Full-pretrain/Step Time": 17.60534880310297} +{"Full-pretrain/Learning Rate": 4.9550794546595664e-05, "Full-pretrain/Loss": 2.0706632137298584, "Full-pretrain/Loss (Raw)": 2.0655357837677, "Full-pretrain/Step": 845, "Full-pretrain/Step Time": 17.603606306016445} +{"Full-pretrain/Learning Rate": 4.954919078591521e-05, "Full-pretrain/Loss": 2.0761382579803467, "Full-pretrain/Loss (Raw)": 2.2059080600738525, "Full-pretrain/Step": 846, "Full-pretrain/Step Time": 17.60604808665812} +{"Full-pretrain/Learning Rate": 4.9547584193494224e-05, "Full-pretrain/Loss": 2.0732781887054443, "Full-pretrain/Loss (Raw)": 2.2092444896698, "Full-pretrain/Step": 847, "Full-pretrain/Step Time": 17.610556406900287} +{"Full-pretrain/Learning Rate": 4.9545974769518033e-05, "Full-pretrain/Loss": 2.068330764770508, "Full-pretrain/Loss (Raw)": 1.9363007545471191, "Full-pretrain/Step": 848, "Full-pretrain/Step Time": 17.610014595091343} +{"Full-pretrain/Learning Rate": 4.954436251417227e-05, "Full-pretrain/Loss": 2.066364288330078, "Full-pretrain/Loss (Raw)": 2.1693553924560547, "Full-pretrain/Step": 849, "Full-pretrain/Step Time": 17.61086671985686} +{"Full-pretrain/Learning Rate": 4.9542747427642924e-05, "Full-pretrain/Loss": 2.0708487033843994, "Full-pretrain/Loss (Raw)": 2.0562570095062256, "Full-pretrain/Step": 850, "Full-pretrain/Step Time": 17.609566394239664} +{"Full-pretrain/Learning Rate": 4.954112951011628e-05, "Full-pretrain/Loss": 2.079599142074585, "Full-pretrain/Loss (Raw)": 2.1929380893707275, "Full-pretrain/Step": 851, "Full-pretrain/Step Time": 17.610079277306795} +{"Full-pretrain/Learning Rate": 4.953950876177898e-05, "Full-pretrain/Loss": 2.0740277767181396, "Full-pretrain/Loss (Raw)": 2.0767555236816406, "Full-pretrain/Step": 852, "Full-pretrain/Step Time": 17.61455112695694} +{"Full-pretrain/Learning Rate": 4.953788518281796e-05, "Full-pretrain/Loss": 2.0635063648223877, "Full-pretrain/Loss (Raw)": 1.781163215637207, "Full-pretrain/Step": 853, "Full-pretrain/Step Time": 17.612319378182292} +{"Full-pretrain/Learning Rate": 4.953625877342051e-05, "Full-pretrain/Loss": 2.06430721282959, "Full-pretrain/Loss (Raw)": 2.126617431640625, "Full-pretrain/Step": 854, "Full-pretrain/Step Time": 17.61618123948574} +{"Full-pretrain/Learning Rate": 4.9534629533774235e-05, "Full-pretrain/Loss": 2.0618631839752197, "Full-pretrain/Loss (Raw)": 2.01570200920105, "Full-pretrain/Step": 855, "Full-pretrain/Step Time": 17.61163079738617} +{"Full-pretrain/Learning Rate": 4.9532997464067065e-05, "Full-pretrain/Loss": 2.0698251724243164, "Full-pretrain/Loss (Raw)": 2.220898389816284, "Full-pretrain/Step": 856, "Full-pretrain/Step Time": 17.616450559347868} +{"Full-pretrain/Learning Rate": 4.953136256448726e-05, "Full-pretrain/Loss": 2.0738391876220703, "Full-pretrain/Loss (Raw)": 2.057441473007202, "Full-pretrain/Step": 857, "Full-pretrain/Step Time": 17.617782356217504} +{"Full-pretrain/Learning Rate": 4.9529724835223404e-05, "Full-pretrain/Loss": 2.0698740482330322, "Full-pretrain/Loss (Raw)": 2.0447745323181152, "Full-pretrain/Step": 858, "Full-pretrain/Step Time": 17.615010971203446} +{"Full-pretrain/Learning Rate": 4.9528084276464406e-05, "Full-pretrain/Loss": 2.0768299102783203, "Full-pretrain/Loss (Raw)": 2.219391345977783, "Full-pretrain/Step": 859, "Full-pretrain/Step Time": 17.612236952409148} +{"Full-pretrain/Learning Rate": 4.9526440888399506e-05, "Full-pretrain/Loss": 2.0784974098205566, "Full-pretrain/Loss (Raw)": 2.1528711318969727, "Full-pretrain/Step": 860, "Full-pretrain/Step Time": 17.616400396451354} +{"Full-pretrain/Learning Rate": 4.952479467121827e-05, "Full-pretrain/Loss": 2.0757718086242676, "Full-pretrain/Loss (Raw)": 1.8453352451324463, "Full-pretrain/Step": 861, "Full-pretrain/Step Time": 17.620979826897383} +{"Full-pretrain/Learning Rate": 4.952314562511059e-05, "Full-pretrain/Loss": 2.0808990001678467, "Full-pretrain/Loss (Raw)": 2.1187853813171387, "Full-pretrain/Step": 862, "Full-pretrain/Step Time": 17.616782318800688} +{"Full-pretrain/Learning Rate": 4.952149375026668e-05, "Full-pretrain/Loss": 2.0771422386169434, "Full-pretrain/Loss (Raw)": 2.086733818054199, "Full-pretrain/Step": 863, "Full-pretrain/Step Time": 17.618307380005717} +{"Full-pretrain/Learning Rate": 4.951983904687708e-05, "Full-pretrain/Loss": 2.080622673034668, "Full-pretrain/Loss (Raw)": 2.1324920654296875, "Full-pretrain/Step": 864, "Full-pretrain/Step Time": 17.61471839249134} +{"Full-pretrain/Learning Rate": 4.9518181515132666e-05, "Full-pretrain/Loss": 2.0783331394195557, "Full-pretrain/Loss (Raw)": 2.0042028427124023, "Full-pretrain/Step": 865, "Full-pretrain/Step Time": 17.61595181375742} +{"Full-pretrain/Learning Rate": 4.9516521155224625e-05, "Full-pretrain/Loss": 2.079496383666992, "Full-pretrain/Loss (Raw)": 2.0112409591674805, "Full-pretrain/Step": 866, "Full-pretrain/Step Time": 17.60972028411925} +{"Full-pretrain/Learning Rate": 4.951485796734449e-05, "Full-pretrain/Loss": 2.079601764678955, "Full-pretrain/Loss (Raw)": 2.161139965057373, "Full-pretrain/Step": 867, "Full-pretrain/Step Time": 17.609145315364003} +{"Full-pretrain/Learning Rate": 4.95131919516841e-05, "Full-pretrain/Loss": 2.0829427242279053, "Full-pretrain/Loss (Raw)": 2.0627894401550293, "Full-pretrain/Step": 868, "Full-pretrain/Step Time": 17.606842262670398} +{"Full-pretrain/Learning Rate": 4.951152310843564e-05, "Full-pretrain/Loss": 2.078495502471924, "Full-pretrain/Loss (Raw)": 2.000851631164551, "Full-pretrain/Step": 869, "Full-pretrain/Step Time": 17.612444011494517} +{"Full-pretrain/Learning Rate": 4.950985143779159e-05, "Full-pretrain/Loss": 2.0756123065948486, "Full-pretrain/Loss (Raw)": 2.3040714263916016, "Full-pretrain/Step": 870, "Full-pretrain/Step Time": 17.605944411829114} +{"Full-pretrain/Learning Rate": 4.950817693994481e-05, "Full-pretrain/Loss": 2.07523250579834, "Full-pretrain/Loss (Raw)": 2.1235575675964355, "Full-pretrain/Step": 871, "Full-pretrain/Step Time": 17.60513479448855} +{"Full-pretrain/Learning Rate": 4.950649961508841e-05, "Full-pretrain/Loss": 2.0774383544921875, "Full-pretrain/Loss (Raw)": 2.0448718070983887, "Full-pretrain/Step": 872, "Full-pretrain/Step Time": 17.60776911303401} +{"Full-pretrain/Learning Rate": 4.9504819463415906e-05, "Full-pretrain/Loss": 2.074214458465576, "Full-pretrain/Loss (Raw)": 1.9501349925994873, "Full-pretrain/Step": 873, "Full-pretrain/Step Time": 17.60692174360156} +{"Full-pretrain/Learning Rate": 4.950313648512108e-05, "Full-pretrain/Loss": 2.0732178688049316, "Full-pretrain/Loss (Raw)": 1.9458739757537842, "Full-pretrain/Step": 874, "Full-pretrain/Step Time": 17.604555336758494} +{"Full-pretrain/Learning Rate": 4.9501450680398084e-05, "Full-pretrain/Loss": 2.0670666694641113, "Full-pretrain/Loss (Raw)": 2.0418899059295654, "Full-pretrain/Step": 875, "Full-pretrain/Step Time": 17.609763709828258} +{"Full-pretrain/Learning Rate": 4.949976204944135e-05, "Full-pretrain/Loss": 2.067612886428833, "Full-pretrain/Loss (Raw)": 1.7984843254089355, "Full-pretrain/Step": 876, "Full-pretrain/Step Time": 17.609402490779757} +{"Full-pretrain/Learning Rate": 4.949807059244568e-05, "Full-pretrain/Loss": 2.0669784545898438, "Full-pretrain/Loss (Raw)": 2.045236110687256, "Full-pretrain/Step": 877, "Full-pretrain/Step Time": 17.60873662866652} +{"Full-pretrain/Learning Rate": 4.949637630960617e-05, "Full-pretrain/Loss": 2.070431709289551, "Full-pretrain/Loss (Raw)": 2.3164174556732178, "Full-pretrain/Step": 878, "Full-pretrain/Step Time": 17.60672076791525} +{"Full-pretrain/Learning Rate": 4.949467920111827e-05, "Full-pretrain/Loss": 2.067518711090088, "Full-pretrain/Loss (Raw)": 2.1160287857055664, "Full-pretrain/Step": 879, "Full-pretrain/Step Time": 17.601408630609512} +{"Full-pretrain/Learning Rate": 4.949297926717773e-05, "Full-pretrain/Loss": 2.066532850265503, "Full-pretrain/Loss (Raw)": 1.9047489166259766, "Full-pretrain/Step": 880, "Full-pretrain/Step Time": 17.59907709993422} +{"Full-pretrain/Learning Rate": 4.949127650798063e-05, "Full-pretrain/Loss": 2.0567758083343506, "Full-pretrain/Loss (Raw)": 1.857124924659729, "Full-pretrain/Step": 881, "Full-pretrain/Step Time": 17.597047716379166} +{"Full-pretrain/Learning Rate": 4.9489570923723404e-05, "Full-pretrain/Loss": 2.057131052017212, "Full-pretrain/Loss (Raw)": 2.0676302909851074, "Full-pretrain/Step": 882, "Full-pretrain/Step Time": 17.59648096561432} +{"Full-pretrain/Learning Rate": 4.948786251460277e-05, "Full-pretrain/Loss": 2.057647228240967, "Full-pretrain/Loss (Raw)": 2.209459066390991, "Full-pretrain/Step": 883, "Full-pretrain/Step Time": 17.594757931306958} +{"Full-pretrain/Learning Rate": 4.948615128081581e-05, "Full-pretrain/Loss": 2.061051368713379, "Full-pretrain/Loss (Raw)": 2.1856837272644043, "Full-pretrain/Step": 884, "Full-pretrain/Step Time": 17.596183110028505} +{"Full-pretrain/Learning Rate": 4.94844372225599e-05, "Full-pretrain/Loss": 2.070070743560791, "Full-pretrain/Loss (Raw)": 2.069779396057129, "Full-pretrain/Step": 885, "Full-pretrain/Step Time": 17.59886579401791} +{"Full-pretrain/Learning Rate": 4.948272034003275e-05, "Full-pretrain/Loss": 2.063654899597168, "Full-pretrain/Loss (Raw)": 1.9213162660598755, "Full-pretrain/Step": 886, "Full-pretrain/Step Time": 17.60113582573831} +{"Full-pretrain/Learning Rate": 4.948100063343243e-05, "Full-pretrain/Loss": 2.069783926010132, "Full-pretrain/Loss (Raw)": 2.2118313312530518, "Full-pretrain/Step": 887, "Full-pretrain/Step Time": 17.595309937372804} +{"Full-pretrain/Learning Rate": 4.947927810295728e-05, "Full-pretrain/Loss": 2.064213752746582, "Full-pretrain/Loss (Raw)": 2.042649030685425, "Full-pretrain/Step": 888, "Full-pretrain/Step Time": 17.602241029962897} +{"Full-pretrain/Learning Rate": 4.9477552748805996e-05, "Full-pretrain/Loss": 2.0657310485839844, "Full-pretrain/Loss (Raw)": 2.1059985160827637, "Full-pretrain/Step": 889, "Full-pretrain/Step Time": 17.605430928990245} +{"Full-pretrain/Learning Rate": 4.947582457117762e-05, "Full-pretrain/Loss": 2.078014850616455, "Full-pretrain/Loss (Raw)": 2.4378609657287598, "Full-pretrain/Step": 890, "Full-pretrain/Step Time": 17.606701837852597} +{"Full-pretrain/Learning Rate": 4.947409357027147e-05, "Full-pretrain/Loss": 2.0728938579559326, "Full-pretrain/Loss (Raw)": 2.0555152893066406, "Full-pretrain/Step": 891, "Full-pretrain/Step Time": 17.602027559652925} +{"Full-pretrain/Learning Rate": 4.947235974628724e-05, "Full-pretrain/Loss": 2.072108030319214, "Full-pretrain/Loss (Raw)": 2.1277248859405518, "Full-pretrain/Step": 892, "Full-pretrain/Step Time": 17.599224772304296} +{"Full-pretrain/Learning Rate": 4.947062309942491e-05, "Full-pretrain/Loss": 2.0811047554016113, "Full-pretrain/Loss (Raw)": 2.133227825164795, "Full-pretrain/Step": 893, "Full-pretrain/Step Time": 17.59771566465497} +{"Full-pretrain/Learning Rate": 4.946888362988479e-05, "Full-pretrain/Loss": 2.076563835144043, "Full-pretrain/Loss (Raw)": 1.9734692573547363, "Full-pretrain/Step": 894, "Full-pretrain/Step Time": 17.59940379485488} +{"Full-pretrain/Learning Rate": 4.9467141337867556e-05, "Full-pretrain/Loss": 2.075003147125244, "Full-pretrain/Loss (Raw)": 2.036799430847168, "Full-pretrain/Step": 895, "Full-pretrain/Step Time": 17.598001712933183} +{"Full-pretrain/Learning Rate": 4.946539622357417e-05, "Full-pretrain/Loss": 2.0756094455718994, "Full-pretrain/Loss (Raw)": 2.1518964767456055, "Full-pretrain/Step": 896, "Full-pretrain/Step Time": 17.596494616940618} +{"Full-pretrain/Learning Rate": 4.9463648287205924e-05, "Full-pretrain/Loss": 2.078979969024658, "Full-pretrain/Loss (Raw)": 2.1120519638061523, "Full-pretrain/Step": 897, "Full-pretrain/Step Time": 17.593602104112506} +{"Full-pretrain/Learning Rate": 4.946189752896444e-05, "Full-pretrain/Loss": 2.080726146697998, "Full-pretrain/Loss (Raw)": 2.06711745262146, "Full-pretrain/Step": 898, "Full-pretrain/Step Time": 17.598200924694538} +{"Full-pretrain/Learning Rate": 4.946014394905167e-05, "Full-pretrain/Loss": 2.076622486114502, "Full-pretrain/Loss (Raw)": 2.0298266410827637, "Full-pretrain/Step": 899, "Full-pretrain/Step Time": 17.579079242423177} +{"Full-pretrain/Learning Rate": 4.94583875476699e-05, "Full-pretrain/Loss": 2.075092315673828, "Full-pretrain/Loss (Raw)": 2.013824939727783, "Full-pretrain/Step": 900, "Full-pretrain/Step Time": 17.583456644788384} +{"Full-pretrain/Learning Rate": 4.9456628325021714e-05, "Full-pretrain/Loss": 2.0754566192626953, "Full-pretrain/Loss (Raw)": 2.012510299682617, "Full-pretrain/Step": 901, "Full-pretrain/Step Time": 17.58396547846496} +{"Full-pretrain/Learning Rate": 4.945486628131005e-05, "Full-pretrain/Loss": 2.0776147842407227, "Full-pretrain/Loss (Raw)": 2.373131275177002, "Full-pretrain/Step": 902, "Full-pretrain/Step Time": 17.58575054258108} +{"Full-pretrain/Learning Rate": 4.9453101416738155e-05, "Full-pretrain/Loss": 2.0723228454589844, "Full-pretrain/Loss (Raw)": 1.9542170763015747, "Full-pretrain/Step": 903, "Full-pretrain/Step Time": 17.58080656453967} +{"Full-pretrain/Learning Rate": 4.945133373150961e-05, "Full-pretrain/Loss": 2.0753259658813477, "Full-pretrain/Loss (Raw)": 2.1409711837768555, "Full-pretrain/Step": 904, "Full-pretrain/Step Time": 17.578561766073108} +{"Full-pretrain/Learning Rate": 4.94495632258283e-05, "Full-pretrain/Loss": 2.0832128524780273, "Full-pretrain/Loss (Raw)": 2.2025132179260254, "Full-pretrain/Step": 905, "Full-pretrain/Step Time": 17.587059760466218} +{"Full-pretrain/Learning Rate": 4.944778989989847e-05, "Full-pretrain/Loss": 2.0904598236083984, "Full-pretrain/Loss (Raw)": 2.177783489227295, "Full-pretrain/Step": 906, "Full-pretrain/Step Time": 17.59020427800715} +{"Full-pretrain/Learning Rate": 4.944601375392467e-05, "Full-pretrain/Loss": 2.094999074935913, "Full-pretrain/Loss (Raw)": 2.1871440410614014, "Full-pretrain/Step": 907, "Full-pretrain/Step Time": 17.587320594117045} +{"Full-pretrain/Learning Rate": 4.944423478811177e-05, "Full-pretrain/Loss": 2.103415012359619, "Full-pretrain/Loss (Raw)": 2.067793369293213, "Full-pretrain/Step": 908, "Full-pretrain/Step Time": 17.588828053325415} +{"Full-pretrain/Learning Rate": 4.944245300266498e-05, "Full-pretrain/Loss": 2.1075267791748047, "Full-pretrain/Loss (Raw)": 2.17681884765625, "Full-pretrain/Step": 909, "Full-pretrain/Step Time": 17.589868869632483} +{"Full-pretrain/Learning Rate": 4.944066839778982e-05, "Full-pretrain/Loss": 2.0994606018066406, "Full-pretrain/Loss (Raw)": 2.0582962036132812, "Full-pretrain/Step": 910, "Full-pretrain/Step Time": 17.59776671975851} +{"Full-pretrain/Learning Rate": 4.943888097369216e-05, "Full-pretrain/Loss": 2.0886483192443848, "Full-pretrain/Loss (Raw)": 1.7700295448303223, "Full-pretrain/Step": 911, "Full-pretrain/Step Time": 17.594696873798966} +{"Full-pretrain/Learning Rate": 4.943709073057816e-05, "Full-pretrain/Loss": 2.0932998657226562, "Full-pretrain/Loss (Raw)": 2.053598403930664, "Full-pretrain/Step": 912, "Full-pretrain/Step Time": 17.58445161767304} +{"Full-pretrain/Learning Rate": 4.943529766865434e-05, "Full-pretrain/Loss": 2.102792739868164, "Full-pretrain/Loss (Raw)": 2.1609020233154297, "Full-pretrain/Step": 913, "Full-pretrain/Step Time": 17.588111774995923} +{"Full-pretrain/Learning Rate": 4.9433501788127514e-05, "Full-pretrain/Loss": 2.1036906242370605, "Full-pretrain/Loss (Raw)": 2.096362590789795, "Full-pretrain/Step": 914, "Full-pretrain/Step Time": 17.590512089431286} +{"Full-pretrain/Learning Rate": 4.943170308920484e-05, "Full-pretrain/Loss": 2.0902934074401855, "Full-pretrain/Loss (Raw)": 1.7807389497756958, "Full-pretrain/Step": 915, "Full-pretrain/Step Time": 17.59261593595147} +{"Full-pretrain/Learning Rate": 4.9429901572093807e-05, "Full-pretrain/Loss": 2.0875327587127686, "Full-pretrain/Loss (Raw)": 2.0973525047302246, "Full-pretrain/Step": 916, "Full-pretrain/Step Time": 17.59122965298593} +{"Full-pretrain/Learning Rate": 4.942809723700221e-05, "Full-pretrain/Loss": 2.088660717010498, "Full-pretrain/Loss (Raw)": 2.105865955352783, "Full-pretrain/Step": 917, "Full-pretrain/Step Time": 17.594722788780928} +{"Full-pretrain/Learning Rate": 4.9426290084138186e-05, "Full-pretrain/Loss": 2.0904717445373535, "Full-pretrain/Loss (Raw)": 1.9792759418487549, "Full-pretrain/Step": 918, "Full-pretrain/Step Time": 17.60047853179276} +{"Full-pretrain/Learning Rate": 4.9424480113710175e-05, "Full-pretrain/Loss": 2.097092390060425, "Full-pretrain/Loss (Raw)": 2.423691749572754, "Full-pretrain/Step": 919, "Full-pretrain/Step Time": 17.603138556703925} +{"Full-pretrain/Learning Rate": 4.9422667325926975e-05, "Full-pretrain/Loss": 2.1025171279907227, "Full-pretrain/Loss (Raw)": 2.216235876083374, "Full-pretrain/Step": 920, "Full-pretrain/Step Time": 17.598028250038624} +{"Full-pretrain/Learning Rate": 4.9420851720997676e-05, "Full-pretrain/Loss": 2.090470790863037, "Full-pretrain/Loss (Raw)": 1.720524787902832, "Full-pretrain/Step": 921, "Full-pretrain/Step Time": 17.595103733241558} +{"Full-pretrain/Learning Rate": 4.941903329913172e-05, "Full-pretrain/Loss": 2.0738089084625244, "Full-pretrain/Loss (Raw)": 1.904675006866455, "Full-pretrain/Step": 922, "Full-pretrain/Step Time": 17.599208941683173} +{"Full-pretrain/Learning Rate": 4.9417212060538845e-05, "Full-pretrain/Loss": 2.073428153991699, "Full-pretrain/Loss (Raw)": 2.043335437774658, "Full-pretrain/Step": 923, "Full-pretrain/Step Time": 17.597159519791603} +{"Full-pretrain/Learning Rate": 4.9415388005429144e-05, "Full-pretrain/Loss": 2.0750820636749268, "Full-pretrain/Loss (Raw)": 2.18064022064209, "Full-pretrain/Step": 924, "Full-pretrain/Step Time": 17.589987875893712} +{"Full-pretrain/Learning Rate": 4.941356113401302e-05, "Full-pretrain/Loss": 2.0927014350891113, "Full-pretrain/Loss (Raw)": 2.6970508098602295, "Full-pretrain/Step": 925, "Full-pretrain/Step Time": 17.583486940711737} +{"Full-pretrain/Learning Rate": 4.94117314465012e-05, "Full-pretrain/Loss": 2.0947265625, "Full-pretrain/Loss (Raw)": 2.0382747650146484, "Full-pretrain/Step": 926, "Full-pretrain/Step Time": 17.59285737015307} +{"Full-pretrain/Learning Rate": 4.940989894310473e-05, "Full-pretrain/Loss": 2.0955588817596436, "Full-pretrain/Loss (Raw)": 2.0634334087371826, "Full-pretrain/Step": 927, "Full-pretrain/Step Time": 17.59623323753476} +{"Full-pretrain/Learning Rate": 4.9408063624034994e-05, "Full-pretrain/Loss": 2.1010613441467285, "Full-pretrain/Loss (Raw)": 2.3279783725738525, "Full-pretrain/Step": 928, "Full-pretrain/Step Time": 17.597659721970558} +{"Full-pretrain/Learning Rate": 4.9406225489503704e-05, "Full-pretrain/Loss": 2.1019644737243652, "Full-pretrain/Loss (Raw)": 2.1409456729888916, "Full-pretrain/Step": 929, "Full-pretrain/Step Time": 17.593712272122502} +{"Full-pretrain/Learning Rate": 4.940438453972288e-05, "Full-pretrain/Loss": 2.107059955596924, "Full-pretrain/Loss (Raw)": 2.2301764488220215, "Full-pretrain/Step": 930, "Full-pretrain/Step Time": 17.604591829702258} +{"Full-pretrain/Learning Rate": 4.940254077490487e-05, "Full-pretrain/Loss": 2.105870008468628, "Full-pretrain/Loss (Raw)": 1.9917467832565308, "Full-pretrain/Step": 931, "Full-pretrain/Step Time": 17.602312171831727} +{"Full-pretrain/Learning Rate": 4.9400694195262365e-05, "Full-pretrain/Loss": 2.1083507537841797, "Full-pretrain/Loss (Raw)": 2.093209743499756, "Full-pretrain/Step": 932, "Full-pretrain/Step Time": 17.602727435529232} +{"Full-pretrain/Learning Rate": 4.9398844801008354e-05, "Full-pretrain/Loss": 2.1008806228637695, "Full-pretrain/Loss (Raw)": 1.7734659910202026, "Full-pretrain/Step": 933, "Full-pretrain/Step Time": 17.602423656731844} +{"Full-pretrain/Learning Rate": 4.9396992592356174e-05, "Full-pretrain/Loss": 2.0886363983154297, "Full-pretrain/Loss (Raw)": 1.9813227653503418, "Full-pretrain/Step": 934, "Full-pretrain/Step Time": 17.60266457684338} +{"Full-pretrain/Learning Rate": 4.939513756951947e-05, "Full-pretrain/Loss": 2.0917375087738037, "Full-pretrain/Loss (Raw)": 2.0534496307373047, "Full-pretrain/Step": 935, "Full-pretrain/Step Time": 17.607797645032406} +{"Full-pretrain/Learning Rate": 4.939327973271221e-05, "Full-pretrain/Loss": 2.095118522644043, "Full-pretrain/Loss (Raw)": 2.2491674423217773, "Full-pretrain/Step": 936, "Full-pretrain/Step Time": 17.601032031700015} +{"Full-pretrain/Learning Rate": 4.939141908214871e-05, "Full-pretrain/Loss": 2.0893478393554688, "Full-pretrain/Loss (Raw)": 2.0178399085998535, "Full-pretrain/Step": 937, "Full-pretrain/Step Time": 17.597729317843914} +{"Full-pretrain/Learning Rate": 4.93895556180436e-05, "Full-pretrain/Loss": 2.086599826812744, "Full-pretrain/Loss (Raw)": 2.0898594856262207, "Full-pretrain/Step": 938, "Full-pretrain/Step Time": 17.602197660133243} +{"Full-pretrain/Learning Rate": 4.938768934061182e-05, "Full-pretrain/Loss": 2.0877959728240967, "Full-pretrain/Loss (Raw)": 2.225419521331787, "Full-pretrain/Step": 939, "Full-pretrain/Step Time": 17.59911723062396} +{"Full-pretrain/Learning Rate": 4.9385820250068635e-05, "Full-pretrain/Loss": 2.086732864379883, "Full-pretrain/Loss (Raw)": 2.0337724685668945, "Full-pretrain/Step": 940, "Full-pretrain/Step Time": 17.59916878864169} +{"Full-pretrain/Learning Rate": 4.938394834662966e-05, "Full-pretrain/Loss": 2.0880773067474365, "Full-pretrain/Loss (Raw)": 2.2198336124420166, "Full-pretrain/Step": 941, "Full-pretrain/Step Time": 17.593971287831664} +{"Full-pretrain/Learning Rate": 4.9382073630510816e-05, "Full-pretrain/Loss": 2.097188711166382, "Full-pretrain/Loss (Raw)": 2.349867820739746, "Full-pretrain/Step": 942, "Full-pretrain/Step Time": 17.604495659470558} +{"Full-pretrain/Learning Rate": 4.938019610192835e-05, "Full-pretrain/Loss": 2.0997259616851807, "Full-pretrain/Loss (Raw)": 1.8512214422225952, "Full-pretrain/Step": 943, "Full-pretrain/Step Time": 17.603694569319487} +{"Full-pretrain/Learning Rate": 4.9378315761098814e-05, "Full-pretrain/Loss": 2.099626302719116, "Full-pretrain/Loss (Raw)": 2.0504040718078613, "Full-pretrain/Step": 944, "Full-pretrain/Step Time": 17.606538211926818} +{"Full-pretrain/Learning Rate": 4.937643260823914e-05, "Full-pretrain/Loss": 2.0972445011138916, "Full-pretrain/Loss (Raw)": 2.0846855640411377, "Full-pretrain/Step": 945, "Full-pretrain/Step Time": 17.600170243531466} +{"Full-pretrain/Learning Rate": 4.9374546643566525e-05, "Full-pretrain/Loss": 2.1040306091308594, "Full-pretrain/Loss (Raw)": 2.3135151863098145, "Full-pretrain/Step": 946, "Full-pretrain/Step Time": 17.609499225392938} +{"Full-pretrain/Learning Rate": 4.9372657867298514e-05, "Full-pretrain/Loss": 2.114654541015625, "Full-pretrain/Loss (Raw)": 2.120710611343384, "Full-pretrain/Step": 947, "Full-pretrain/Step Time": 17.606391889974475} +{"Full-pretrain/Learning Rate": 4.937076627965299e-05, "Full-pretrain/Loss": 2.113863945007324, "Full-pretrain/Loss (Raw)": 2.0720508098602295, "Full-pretrain/Step": 948, "Full-pretrain/Step Time": 17.607250222936273} +{"Full-pretrain/Learning Rate": 4.936887188084813e-05, "Full-pretrain/Loss": 2.1159958839416504, "Full-pretrain/Loss (Raw)": 2.174091339111328, "Full-pretrain/Step": 949, "Full-pretrain/Step Time": 17.60494676977396} +{"Full-pretrain/Learning Rate": 4.9366974671102475e-05, "Full-pretrain/Loss": 2.1156773567199707, "Full-pretrain/Loss (Raw)": 1.9690848588943481, "Full-pretrain/Step": 950, "Full-pretrain/Step Time": 17.60896016098559} +{"Full-pretrain/Learning Rate": 4.9365074650634855e-05, "Full-pretrain/Loss": 2.1042723655700684, "Full-pretrain/Loss (Raw)": 2.058730125427246, "Full-pretrain/Step": 951, "Full-pretrain/Step Time": 17.61360094510019} +{"Full-pretrain/Learning Rate": 4.9363171819664434e-05, "Full-pretrain/Loss": 2.103123188018799, "Full-pretrain/Loss (Raw)": 2.1794607639312744, "Full-pretrain/Step": 952, "Full-pretrain/Step Time": 17.60565087199211} +{"Full-pretrain/Learning Rate": 4.9361266178410704e-05, "Full-pretrain/Loss": 2.1111011505126953, "Full-pretrain/Loss (Raw)": 1.9758155345916748, "Full-pretrain/Step": 953, "Full-pretrain/Step Time": 17.60820109769702} +{"Full-pretrain/Learning Rate": 4.935935772709348e-05, "Full-pretrain/Loss": 2.1144590377807617, "Full-pretrain/Loss (Raw)": 2.0121304988861084, "Full-pretrain/Step": 954, "Full-pretrain/Step Time": 17.608822867274284} +{"Full-pretrain/Learning Rate": 4.93574464659329e-05, "Full-pretrain/Loss": 2.119286060333252, "Full-pretrain/Loss (Raw)": 2.1978015899658203, "Full-pretrain/Step": 955, "Full-pretrain/Step Time": 17.605038356035948} +{"Full-pretrain/Learning Rate": 4.935553239514944e-05, "Full-pretrain/Loss": 2.1186461448669434, "Full-pretrain/Loss (Raw)": 2.1601603031158447, "Full-pretrain/Step": 956, "Full-pretrain/Step Time": 17.603004360571504} +{"Full-pretrain/Learning Rate": 4.935361551496387e-05, "Full-pretrain/Loss": 2.0988118648529053, "Full-pretrain/Loss (Raw)": 2.062346935272217, "Full-pretrain/Step": 957, "Full-pretrain/Step Time": 17.604688081890345} +{"Full-pretrain/Learning Rate": 4.935169582559731e-05, "Full-pretrain/Loss": 2.1013386249542236, "Full-pretrain/Loss (Raw)": 2.1191349029541016, "Full-pretrain/Step": 958, "Full-pretrain/Step Time": 17.602931590750813} +{"Full-pretrain/Learning Rate": 4.934977332727119e-05, "Full-pretrain/Loss": 2.10215425491333, "Full-pretrain/Loss (Raw)": 2.089531898498535, "Full-pretrain/Step": 959, "Full-pretrain/Step Time": 17.598617373034358} +{"Full-pretrain/Learning Rate": 4.934784802020728e-05, "Full-pretrain/Loss": 2.09403920173645, "Full-pretrain/Loss (Raw)": 2.068301200866699, "Full-pretrain/Step": 960, "Full-pretrain/Step Time": 17.591769797727466} +{"Full-pretrain/Learning Rate": 4.934591990462766e-05, "Full-pretrain/Loss": 2.0934371948242188, "Full-pretrain/Loss (Raw)": 2.121674060821533, "Full-pretrain/Step": 961, "Full-pretrain/Step Time": 17.59072018787265} +{"Full-pretrain/Learning Rate": 4.9343988980754724e-05, "Full-pretrain/Loss": 2.0844316482543945, "Full-pretrain/Loss (Raw)": 1.9420064687728882, "Full-pretrain/Step": 962, "Full-pretrain/Step Time": 17.591497527435422} +{"Full-pretrain/Learning Rate": 4.9342055248811226e-05, "Full-pretrain/Loss": 2.0935287475585938, "Full-pretrain/Loss (Raw)": 2.2828545570373535, "Full-pretrain/Step": 963, "Full-pretrain/Step Time": 17.5882374253124} +{"Full-pretrain/Learning Rate": 4.93401187090202e-05, "Full-pretrain/Loss": 2.0917606353759766, "Full-pretrain/Loss (Raw)": 2.0366368293762207, "Full-pretrain/Step": 964, "Full-pretrain/Step Time": 17.58881858550012} +{"Full-pretrain/Learning Rate": 4.933817936160504e-05, "Full-pretrain/Loss": 2.093583106994629, "Full-pretrain/Loss (Raw)": 1.8317829370498657, "Full-pretrain/Step": 965, "Full-pretrain/Step Time": 17.587246065959334} +{"Full-pretrain/Learning Rate": 4.933623720678944e-05, "Full-pretrain/Loss": 2.098583221435547, "Full-pretrain/Loss (Raw)": 2.1413254737854004, "Full-pretrain/Step": 966, "Full-pretrain/Step Time": 17.5875141993165} +{"Full-pretrain/Learning Rate": 4.933429224479743e-05, "Full-pretrain/Loss": 2.102048397064209, "Full-pretrain/Loss (Raw)": 2.1643333435058594, "Full-pretrain/Step": 967, "Full-pretrain/Step Time": 17.58047629147768} +{"Full-pretrain/Learning Rate": 4.933234447585337e-05, "Full-pretrain/Loss": 2.0903971195220947, "Full-pretrain/Loss (Raw)": 1.8763240575790405, "Full-pretrain/Step": 968, "Full-pretrain/Step Time": 17.580891171470284} +{"Full-pretrain/Learning Rate": 4.933039390018191e-05, "Full-pretrain/Loss": 2.088339328765869, "Full-pretrain/Loss (Raw)": 1.9519890546798706, "Full-pretrain/Step": 969, "Full-pretrain/Step Time": 17.576749369502068} +{"Full-pretrain/Learning Rate": 4.932844051800808e-05, "Full-pretrain/Loss": 2.0870580673217773, "Full-pretrain/Loss (Raw)": 2.048853635787964, "Full-pretrain/Step": 970, "Full-pretrain/Step Time": 17.57533478550613} +{"Full-pretrain/Learning Rate": 4.9326484329557175e-05, "Full-pretrain/Loss": 2.0872979164123535, "Full-pretrain/Loss (Raw)": 2.2331020832061768, "Full-pretrain/Step": 971, "Full-pretrain/Step Time": 17.581413308158517} +{"Full-pretrain/Learning Rate": 4.932452533505486e-05, "Full-pretrain/Loss": 2.0905494689941406, "Full-pretrain/Loss (Raw)": 2.1378235816955566, "Full-pretrain/Step": 972, "Full-pretrain/Step Time": 17.58059717528522} +{"Full-pretrain/Learning Rate": 4.932256353472709e-05, "Full-pretrain/Loss": 2.0825109481811523, "Full-pretrain/Loss (Raw)": 1.962602972984314, "Full-pretrain/Step": 973, "Full-pretrain/Step Time": 17.58370498381555} +{"Full-pretrain/Learning Rate": 4.9320598928800166e-05, "Full-pretrain/Loss": 2.0718812942504883, "Full-pretrain/Loss (Raw)": 2.0097129344940186, "Full-pretrain/Step": 974, "Full-pretrain/Step Time": 17.57755515910685} +{"Full-pretrain/Learning Rate": 4.93186315175007e-05, "Full-pretrain/Loss": 2.080779552459717, "Full-pretrain/Loss (Raw)": 2.1359658241271973, "Full-pretrain/Step": 975, "Full-pretrain/Step Time": 17.57396288588643} +{"Full-pretrain/Learning Rate": 4.9316661301055637e-05, "Full-pretrain/Loss": 2.079897403717041, "Full-pretrain/Loss (Raw)": 2.0221729278564453, "Full-pretrain/Step": 976, "Full-pretrain/Step Time": 17.577438443899155} +{"Full-pretrain/Learning Rate": 4.931468827969224e-05, "Full-pretrain/Loss": 2.080256223678589, "Full-pretrain/Loss (Raw)": 2.0961720943450928, "Full-pretrain/Step": 977, "Full-pretrain/Step Time": 17.575816025957465} +{"Full-pretrain/Learning Rate": 4.9312712453638096e-05, "Full-pretrain/Loss": 2.076733350753784, "Full-pretrain/Loss (Raw)": 2.2007803916931152, "Full-pretrain/Step": 978, "Full-pretrain/Step Time": 17.572393177077174} +{"Full-pretrain/Learning Rate": 4.931073382312111e-05, "Full-pretrain/Loss": 2.0749588012695312, "Full-pretrain/Loss (Raw)": 2.0639305114746094, "Full-pretrain/Step": 979, "Full-pretrain/Step Time": 17.573476575315} +{"Full-pretrain/Learning Rate": 4.930875238836952e-05, "Full-pretrain/Loss": 2.070983409881592, "Full-pretrain/Loss (Raw)": 1.9448347091674805, "Full-pretrain/Step": 980, "Full-pretrain/Step Time": 17.56875211931765} +{"Full-pretrain/Learning Rate": 4.930676814961189e-05, "Full-pretrain/Loss": 2.0644266605377197, "Full-pretrain/Loss (Raw)": 1.964276671409607, "Full-pretrain/Step": 981, "Full-pretrain/Step Time": 17.57036542519927} +{"Full-pretrain/Learning Rate": 4.930478110707709e-05, "Full-pretrain/Loss": 2.064114570617676, "Full-pretrain/Loss (Raw)": 1.9590959548950195, "Full-pretrain/Step": 982, "Full-pretrain/Step Time": 17.56646842882037} +{"Full-pretrain/Learning Rate": 4.930279126099433e-05, "Full-pretrain/Loss": 2.06866455078125, "Full-pretrain/Loss (Raw)": 2.2043352127075195, "Full-pretrain/Step": 983, "Full-pretrain/Step Time": 17.56609946489334} +{"Full-pretrain/Learning Rate": 4.930079861159315e-05, "Full-pretrain/Loss": 2.059969425201416, "Full-pretrain/Loss (Raw)": 1.9012080430984497, "Full-pretrain/Step": 984, "Full-pretrain/Step Time": 17.560384333133698} +{"Full-pretrain/Learning Rate": 4.929880315910338e-05, "Full-pretrain/Loss": 2.0648770332336426, "Full-pretrain/Loss (Raw)": 2.1328673362731934, "Full-pretrain/Step": 985, "Full-pretrain/Step Time": 17.5622020624578} +{"Full-pretrain/Learning Rate": 4.92968049037552e-05, "Full-pretrain/Loss": 2.067348003387451, "Full-pretrain/Loss (Raw)": 2.091203212738037, "Full-pretrain/Step": 986, "Full-pretrain/Step Time": 17.561372043564916} +{"Full-pretrain/Learning Rate": 4.9294803845779124e-05, "Full-pretrain/Loss": 2.0586764812469482, "Full-pretrain/Loss (Raw)": 1.9203131198883057, "Full-pretrain/Step": 987, "Full-pretrain/Step Time": 17.56074697524309} +{"Full-pretrain/Learning Rate": 4.929279998540596e-05, "Full-pretrain/Loss": 2.0542845726013184, "Full-pretrain/Loss (Raw)": 2.0196189880371094, "Full-pretrain/Step": 988, "Full-pretrain/Step Time": 17.55769222229719} +{"Full-pretrain/Learning Rate": 4.929079332286685e-05, "Full-pretrain/Loss": 2.052029609680176, "Full-pretrain/Loss (Raw)": 1.9901847839355469, "Full-pretrain/Step": 989, "Full-pretrain/Step Time": 17.557082045823336} +{"Full-pretrain/Learning Rate": 4.9288783858393273e-05, "Full-pretrain/Loss": 2.0467865467071533, "Full-pretrain/Loss (Raw)": 1.9513587951660156, "Full-pretrain/Step": 990, "Full-pretrain/Step Time": 17.558150419965386} +{"Full-pretrain/Learning Rate": 4.928677159221701e-05, "Full-pretrain/Loss": 2.0491745471954346, "Full-pretrain/Loss (Raw)": 2.165945053100586, "Full-pretrain/Step": 991, "Full-pretrain/Step Time": 17.55744530633092} +{"Full-pretrain/Learning Rate": 4.928475652457017e-05, "Full-pretrain/Loss": 2.0523934364318848, "Full-pretrain/Loss (Raw)": 2.1713016033172607, "Full-pretrain/Step": 992, "Full-pretrain/Step Time": 17.558028610423207} +{"Full-pretrain/Learning Rate": 4.9282738655685215e-05, "Full-pretrain/Loss": 2.052725315093994, "Full-pretrain/Loss (Raw)": 2.13230037689209, "Full-pretrain/Step": 993, "Full-pretrain/Step Time": 17.55784921720624} +{"Full-pretrain/Learning Rate": 4.928071798579488e-05, "Full-pretrain/Loss": 2.0523834228515625, "Full-pretrain/Loss (Raw)": 1.9310672283172607, "Full-pretrain/Step": 994, "Full-pretrain/Step Time": 17.56145802885294} +{"Full-pretrain/Learning Rate": 4.9278694515132265e-05, "Full-pretrain/Loss": 2.043921947479248, "Full-pretrain/Loss (Raw)": 2.0120787620544434, "Full-pretrain/Step": 995, "Full-pretrain/Step Time": 17.56042441725731} +{"Full-pretrain/Learning Rate": 4.9276668243930765e-05, "Full-pretrain/Loss": 2.0456008911132812, "Full-pretrain/Loss (Raw)": 2.0903663635253906, "Full-pretrain/Step": 996, "Full-pretrain/Step Time": 17.560050889849663} +{"Full-pretrain/Learning Rate": 4.927463917242411e-05, "Full-pretrain/Loss": 2.052671194076538, "Full-pretrain/Loss (Raw)": 2.0580334663391113, "Full-pretrain/Step": 997, "Full-pretrain/Step Time": 17.558033069595695} +{"Full-pretrain/Learning Rate": 4.927260730084636e-05, "Full-pretrain/Loss": 2.0496392250061035, "Full-pretrain/Loss (Raw)": 2.044299602508545, "Full-pretrain/Step": 998, "Full-pretrain/Step Time": 17.56007356196642} +{"Full-pretrain/Learning Rate": 4.9270572629431896e-05, "Full-pretrain/Loss": 2.048038959503174, "Full-pretrain/Loss (Raw)": 2.1131277084350586, "Full-pretrain/Step": 999, "Full-pretrain/Step Time": 17.563560400158167} +{"Full-pretrain/Learning Rate": 4.92685351584154e-05, "Full-pretrain/Loss": 2.048429489135742, "Full-pretrain/Loss (Raw)": 1.888826608657837, "Full-pretrain/Step": 1000, "Full-pretrain/Step Time": 17.560423305258155} +{"Full-pretrain/Learning Rate": 4.926649488803191e-05, "Full-pretrain/Loss": 2.0687355995178223, "Full-pretrain/Loss (Raw)": 2.601787567138672, "Full-pretrain/Step": 1001, "Full-pretrain/Step Time": 17.561295814812183} +{"Full-pretrain/Learning Rate": 4.926445181851676e-05, "Full-pretrain/Loss": 2.0783586502075195, "Full-pretrain/Loss (Raw)": 2.356778621673584, "Full-pretrain/Step": 1002, "Full-pretrain/Step Time": 17.562207460403442} +{"Full-pretrain/Learning Rate": 4.9262405950105606e-05, "Full-pretrain/Loss": 2.086808204650879, "Full-pretrain/Loss (Raw)": 2.503491163253784, "Full-pretrain/Step": 1003, "Full-pretrain/Step Time": 17.55863907933235} +{"Full-pretrain/Learning Rate": 4.926035728303446e-05, "Full-pretrain/Loss": 2.085844039916992, "Full-pretrain/Loss (Raw)": 2.106968641281128, "Full-pretrain/Step": 1004, "Full-pretrain/Step Time": 17.561067700386047} +{"Full-pretrain/Learning Rate": 4.925830581753964e-05, "Full-pretrain/Loss": 2.0949809551239014, "Full-pretrain/Loss (Raw)": 2.2549877166748047, "Full-pretrain/Step": 1005, "Full-pretrain/Step Time": 17.561639923602343} +{"Full-pretrain/Learning Rate": 4.925625155385776e-05, "Full-pretrain/Loss": 2.09363055229187, "Full-pretrain/Loss (Raw)": 1.9665004014968872, "Full-pretrain/Step": 1006, "Full-pretrain/Step Time": 17.563700335100293} +{"Full-pretrain/Learning Rate": 4.925419449222578e-05, "Full-pretrain/Loss": 2.0934786796569824, "Full-pretrain/Loss (Raw)": 2.131108283996582, "Full-pretrain/Step": 1007, "Full-pretrain/Step Time": 17.568271651864052} +{"Full-pretrain/Learning Rate": 4.9252134632881e-05, "Full-pretrain/Loss": 2.0893049240112305, "Full-pretrain/Loss (Raw)": 1.8886053562164307, "Full-pretrain/Step": 1008, "Full-pretrain/Step Time": 17.57011510618031} +{"Full-pretrain/Learning Rate": 4.925007197606101e-05, "Full-pretrain/Loss": 2.087934970855713, "Full-pretrain/Loss (Raw)": 2.0523300170898438, "Full-pretrain/Step": 1009, "Full-pretrain/Step Time": 17.56778290309012} +{"Full-pretrain/Learning Rate": 4.924800652200373e-05, "Full-pretrain/Loss": 2.081420421600342, "Full-pretrain/Loss (Raw)": 1.9923229217529297, "Full-pretrain/Step": 1010, "Full-pretrain/Step Time": 17.571783198043704} +{"Full-pretrain/Learning Rate": 4.9245938270947435e-05, "Full-pretrain/Loss": 2.0801172256469727, "Full-pretrain/Loss (Raw)": 2.022226333618164, "Full-pretrain/Step": 1011, "Full-pretrain/Step Time": 17.57044374011457} +{"Full-pretrain/Learning Rate": 4.924386722313067e-05, "Full-pretrain/Loss": 2.0900373458862305, "Full-pretrain/Loss (Raw)": 2.2622756958007812, "Full-pretrain/Step": 1012, "Full-pretrain/Step Time": 17.57468457520008} +{"Full-pretrain/Learning Rate": 4.924179337879234e-05, "Full-pretrain/Loss": 2.0905654430389404, "Full-pretrain/Loss (Raw)": 1.9811742305755615, "Full-pretrain/Step": 1013, "Full-pretrain/Step Time": 17.573017107322812} +{"Full-pretrain/Learning Rate": 4.923971673817167e-05, "Full-pretrain/Loss": 2.0936264991760254, "Full-pretrain/Loss (Raw)": 2.05704927444458, "Full-pretrain/Step": 1014, "Full-pretrain/Step Time": 17.57592187821865} +{"Full-pretrain/Learning Rate": 4.9237637301508187e-05, "Full-pretrain/Loss": 2.087865114212036, "Full-pretrain/Loss (Raw)": 2.019975185394287, "Full-pretrain/Step": 1015, "Full-pretrain/Step Time": 17.578847451135516} +{"Full-pretrain/Learning Rate": 4.923555506904176e-05, "Full-pretrain/Loss": 2.0952320098876953, "Full-pretrain/Loss (Raw)": 2.136951446533203, "Full-pretrain/Step": 1016, "Full-pretrain/Step Time": 17.571449659764767} +{"Full-pretrain/Learning Rate": 4.9233470041012576e-05, "Full-pretrain/Loss": 2.0978851318359375, "Full-pretrain/Loss (Raw)": 2.2177581787109375, "Full-pretrain/Step": 1017, "Full-pretrain/Step Time": 17.573725648224354} +{"Full-pretrain/Learning Rate": 4.923138221766114e-05, "Full-pretrain/Loss": 2.093400001525879, "Full-pretrain/Loss (Raw)": 1.9476866722106934, "Full-pretrain/Step": 1018, "Full-pretrain/Step Time": 17.57118651084602} +{"Full-pretrain/Learning Rate": 4.9229291599228277e-05, "Full-pretrain/Loss": 2.101010322570801, "Full-pretrain/Loss (Raw)": 2.16384220123291, "Full-pretrain/Step": 1019, "Full-pretrain/Step Time": 17.577022274956107} +{"Full-pretrain/Learning Rate": 4.922719818595514e-05, "Full-pretrain/Loss": 2.088019371032715, "Full-pretrain/Loss (Raw)": 1.6039128303527832, "Full-pretrain/Step": 1020, "Full-pretrain/Step Time": 17.581071676686406} +{"Full-pretrain/Learning Rate": 4.922510197808321e-05, "Full-pretrain/Loss": 2.092123508453369, "Full-pretrain/Loss (Raw)": 2.121508836746216, "Full-pretrain/Step": 1021, "Full-pretrain/Step Time": 17.581155816093087} +{"Full-pretrain/Learning Rate": 4.922300297585428e-05, "Full-pretrain/Loss": 2.0888161659240723, "Full-pretrain/Loss (Raw)": 1.84552001953125, "Full-pretrain/Step": 1022, "Full-pretrain/Step Time": 17.576593616977334} +{"Full-pretrain/Learning Rate": 4.922090117951047e-05, "Full-pretrain/Loss": 2.0859665870666504, "Full-pretrain/Loss (Raw)": 2.0747666358947754, "Full-pretrain/Step": 1023, "Full-pretrain/Step Time": 17.575390182435513} +{"Full-pretrain/Learning Rate": 4.921879658929422e-05, "Full-pretrain/Loss": 2.0941689014434814, "Full-pretrain/Loss (Raw)": 2.433776378631592, "Full-pretrain/Step": 1024, "Full-pretrain/Step Time": 17.5740822609514} +{"Full-pretrain/Learning Rate": 4.92166892054483e-05, "Full-pretrain/Loss": 2.0912299156188965, "Full-pretrain/Loss (Raw)": 2.0382542610168457, "Full-pretrain/Step": 1025, "Full-pretrain/Step Time": 17.58135164529085} +{"Full-pretrain/Learning Rate": 4.9214579028215776e-05, "Full-pretrain/Loss": 2.0909647941589355, "Full-pretrain/Loss (Raw)": 1.9225807189941406, "Full-pretrain/Step": 1026, "Full-pretrain/Step Time": 17.5804722327739} +{"Full-pretrain/Learning Rate": 4.921246605784008e-05, "Full-pretrain/Loss": 2.08979868888855, "Full-pretrain/Loss (Raw)": 1.9747631549835205, "Full-pretrain/Step": 1027, "Full-pretrain/Step Time": 17.58479045331478} +{"Full-pretrain/Learning Rate": 4.921035029456493e-05, "Full-pretrain/Loss": 2.095515727996826, "Full-pretrain/Loss (Raw)": 2.2733113765716553, "Full-pretrain/Step": 1028, "Full-pretrain/Step Time": 17.58356940187514} +{"Full-pretrain/Learning Rate": 4.920823173863439e-05, "Full-pretrain/Loss": 2.1003313064575195, "Full-pretrain/Loss (Raw)": 2.212132215499878, "Full-pretrain/Step": 1029, "Full-pretrain/Step Time": 17.583691269159317} +{"Full-pretrain/Learning Rate": 4.920611039029282e-05, "Full-pretrain/Loss": 2.097456932067871, "Full-pretrain/Loss (Raw)": 1.952318549156189, "Full-pretrain/Step": 1030, "Full-pretrain/Step Time": 17.583265654742718} +{"Full-pretrain/Learning Rate": 4.920398624978493e-05, "Full-pretrain/Loss": 2.1060638427734375, "Full-pretrain/Loss (Raw)": 2.3885531425476074, "Full-pretrain/Step": 1031, "Full-pretrain/Step Time": 17.58224143087864} +{"Full-pretrain/Learning Rate": 4.920185931735572e-05, "Full-pretrain/Loss": 2.1131529808044434, "Full-pretrain/Loss (Raw)": 2.1156725883483887, "Full-pretrain/Step": 1032, "Full-pretrain/Step Time": 17.591126324608922} +{"Full-pretrain/Learning Rate": 4.9199729593250555e-05, "Full-pretrain/Loss": 2.0982296466827393, "Full-pretrain/Loss (Raw)": 2.1242406368255615, "Full-pretrain/Step": 1033, "Full-pretrain/Step Time": 17.582487611100078} +{"Full-pretrain/Learning Rate": 4.919759707771507e-05, "Full-pretrain/Loss": 2.088320255279541, "Full-pretrain/Loss (Raw)": 2.0396761894226074, "Full-pretrain/Step": 1034, "Full-pretrain/Step Time": 17.58256594464183} +{"Full-pretrain/Learning Rate": 4.9195461770995274e-05, "Full-pretrain/Loss": 2.0778775215148926, "Full-pretrain/Loss (Raw)": 2.169325351715088, "Full-pretrain/Step": 1035, "Full-pretrain/Step Time": 17.580000264570117} +{"Full-pretrain/Learning Rate": 4.9193323673337476e-05, "Full-pretrain/Loss": 2.0804190635681152, "Full-pretrain/Loss (Raw)": 2.1882972717285156, "Full-pretrain/Step": 1036, "Full-pretrain/Step Time": 17.584919607266784} +{"Full-pretrain/Learning Rate": 4.919118278498828e-05, "Full-pretrain/Loss": 2.0789923667907715, "Full-pretrain/Loss (Raw)": 2.2093327045440674, "Full-pretrain/Step": 1037, "Full-pretrain/Step Time": 17.583977557718754} +{"Full-pretrain/Learning Rate": 4.9189039106194655e-05, "Full-pretrain/Loss": 2.0837886333465576, "Full-pretrain/Loss (Raw)": 2.1199817657470703, "Full-pretrain/Step": 1038, "Full-pretrain/Step Time": 17.57530421949923} +{"Full-pretrain/Learning Rate": 4.918689263720387e-05, "Full-pretrain/Loss": 2.085329294204712, "Full-pretrain/Loss (Raw)": 2.1804118156433105, "Full-pretrain/Step": 1039, "Full-pretrain/Step Time": 17.571891644969583} +{"Full-pretrain/Learning Rate": 4.918474337826352e-05, "Full-pretrain/Loss": 2.0920915603637695, "Full-pretrain/Loss (Raw)": 2.1050031185150146, "Full-pretrain/Step": 1040, "Full-pretrain/Step Time": 17.57862987741828} +{"Full-pretrain/Learning Rate": 4.918259132962153e-05, "Full-pretrain/Loss": 2.075944423675537, "Full-pretrain/Loss (Raw)": 1.5356228351593018, "Full-pretrain/Step": 1041, "Full-pretrain/Step Time": 17.575503434985876} +{"Full-pretrain/Learning Rate": 4.918043649152612e-05, "Full-pretrain/Loss": 2.083998680114746, "Full-pretrain/Loss (Raw)": 2.2500548362731934, "Full-pretrain/Step": 1042, "Full-pretrain/Step Time": 17.578557662665844} +{"Full-pretrain/Learning Rate": 4.917827886422585e-05, "Full-pretrain/Loss": 2.0844385623931885, "Full-pretrain/Loss (Raw)": 2.0363011360168457, "Full-pretrain/Step": 1043, "Full-pretrain/Step Time": 17.5719921477139} +{"Full-pretrain/Learning Rate": 4.9176118447969625e-05, "Full-pretrain/Loss": 2.079575777053833, "Full-pretrain/Loss (Raw)": 2.1066699028015137, "Full-pretrain/Step": 1044, "Full-pretrain/Step Time": 17.573355611413717} +{"Full-pretrain/Learning Rate": 4.917395524300662e-05, "Full-pretrain/Loss": 2.076545238494873, "Full-pretrain/Loss (Raw)": 1.8841936588287354, "Full-pretrain/Step": 1045, "Full-pretrain/Step Time": 17.570558857172728} +{"Full-pretrain/Learning Rate": 4.917178924958638e-05, "Full-pretrain/Loss": 2.0798070430755615, "Full-pretrain/Loss (Raw)": 2.1614320278167725, "Full-pretrain/Step": 1046, "Full-pretrain/Step Time": 17.57232734747231} +{"Full-pretrain/Learning Rate": 4.9169620467958746e-05, "Full-pretrain/Loss": 2.0800137519836426, "Full-pretrain/Loss (Raw)": 2.0265908241271973, "Full-pretrain/Step": 1047, "Full-pretrain/Step Time": 17.56426795013249} +{"Full-pretrain/Learning Rate": 4.916744889837388e-05, "Full-pretrain/Loss": 2.0781822204589844, "Full-pretrain/Loss (Raw)": 2.078341484069824, "Full-pretrain/Step": 1048, "Full-pretrain/Step Time": 17.564915154129267} +{"Full-pretrain/Learning Rate": 4.916527454108227e-05, "Full-pretrain/Loss": 2.070873260498047, "Full-pretrain/Loss (Raw)": 1.9838671684265137, "Full-pretrain/Step": 1049, "Full-pretrain/Step Time": 17.56755301915109} +{"Full-pretrain/Learning Rate": 4.916309739633475e-05, "Full-pretrain/Loss": 2.0707578659057617, "Full-pretrain/Loss (Raw)": 1.9439935684204102, "Full-pretrain/Step": 1050, "Full-pretrain/Step Time": 17.563308430835605} +{"Full-pretrain/Learning Rate": 4.916091746438243e-05, "Full-pretrain/Loss": 2.06872296333313, "Full-pretrain/Loss (Raw)": 2.0987274646759033, "Full-pretrain/Step": 1051, "Full-pretrain/Step Time": 17.564074374735355} +{"Full-pretrain/Learning Rate": 4.915873474547677e-05, "Full-pretrain/Loss": 2.0878665447235107, "Full-pretrain/Loss (Raw)": 2.2165026664733887, "Full-pretrain/Step": 1052, "Full-pretrain/Step Time": 17.567704308778048} +{"Full-pretrain/Learning Rate": 4.915654923986955e-05, "Full-pretrain/Loss": 2.091862678527832, "Full-pretrain/Loss (Raw)": 2.2493903636932373, "Full-pretrain/Step": 1053, "Full-pretrain/Step Time": 17.577544763684273} +{"Full-pretrain/Learning Rate": 4.915436094781286e-05, "Full-pretrain/Loss": 2.099362850189209, "Full-pretrain/Loss (Raw)": 2.085524559020996, "Full-pretrain/Step": 1054, "Full-pretrain/Step Time": 17.573176335543394} +{"Full-pretrain/Learning Rate": 4.9152169869559126e-05, "Full-pretrain/Loss": 2.099979877471924, "Full-pretrain/Loss (Raw)": 2.0945096015930176, "Full-pretrain/Step": 1055, "Full-pretrain/Step Time": 17.572541069239378} +{"Full-pretrain/Learning Rate": 4.9149976005361085e-05, "Full-pretrain/Loss": 2.0821633338928223, "Full-pretrain/Loss (Raw)": 1.863648533821106, "Full-pretrain/Step": 1056, "Full-pretrain/Step Time": 17.569916784763336} +{"Full-pretrain/Learning Rate": 4.9147779355471796e-05, "Full-pretrain/Loss": 2.0863375663757324, "Full-pretrain/Loss (Raw)": 2.1718287467956543, "Full-pretrain/Step": 1057, "Full-pretrain/Step Time": 17.574612002819777} +{"Full-pretrain/Learning Rate": 4.9145579920144645e-05, "Full-pretrain/Loss": 2.0928072929382324, "Full-pretrain/Loss (Raw)": 2.1296188831329346, "Full-pretrain/Step": 1058, "Full-pretrain/Step Time": 17.568564634770155} +{"Full-pretrain/Learning Rate": 4.914337769963334e-05, "Full-pretrain/Loss": 2.093366861343384, "Full-pretrain/Loss (Raw)": 1.992664098739624, "Full-pretrain/Step": 1059, "Full-pretrain/Step Time": 17.56751917861402} +{"Full-pretrain/Learning Rate": 4.9141172694191896e-05, "Full-pretrain/Loss": 2.0922489166259766, "Full-pretrain/Loss (Raw)": 2.2375364303588867, "Full-pretrain/Step": 1060, "Full-pretrain/Step Time": 17.563755221664906} +{"Full-pretrain/Learning Rate": 4.9138964904074667e-05, "Full-pretrain/Loss": 2.087246894836426, "Full-pretrain/Loss (Raw)": 2.052070379257202, "Full-pretrain/Step": 1061, "Full-pretrain/Step Time": 17.571509823203087} +{"Full-pretrain/Learning Rate": 4.9136754329536326e-05, "Full-pretrain/Loss": 2.0972514152526855, "Full-pretrain/Loss (Raw)": 2.2724668979644775, "Full-pretrain/Step": 1062, "Full-pretrain/Step Time": 17.568679651245475} +{"Full-pretrain/Learning Rate": 4.913454097083185e-05, "Full-pretrain/Loss": 2.0849204063415527, "Full-pretrain/Loss (Raw)": 1.993951439857483, "Full-pretrain/Step": 1063, "Full-pretrain/Step Time": 17.56129909865558} +{"Full-pretrain/Learning Rate": 4.913232482821656e-05, "Full-pretrain/Loss": 2.098798990249634, "Full-pretrain/Loss (Raw)": 2.5597901344299316, "Full-pretrain/Step": 1064, "Full-pretrain/Step Time": 17.562993610277772} +{"Full-pretrain/Learning Rate": 4.913010590194607e-05, "Full-pretrain/Loss": 2.09963321685791, "Full-pretrain/Loss (Raw)": 2.1509437561035156, "Full-pretrain/Step": 1065, "Full-pretrain/Step Time": 17.570999078452587} +{"Full-pretrain/Learning Rate": 4.9127884192276354e-05, "Full-pretrain/Loss": 2.100128173828125, "Full-pretrain/Loss (Raw)": 2.055508852005005, "Full-pretrain/Step": 1066, "Full-pretrain/Step Time": 17.56453189626336} +{"Full-pretrain/Learning Rate": 4.9125659699463664e-05, "Full-pretrain/Loss": 2.0982322692871094, "Full-pretrain/Loss (Raw)": 2.1086511611938477, "Full-pretrain/Step": 1067, "Full-pretrain/Step Time": 17.565208561718464} +{"Full-pretrain/Learning Rate": 4.912343242376462e-05, "Full-pretrain/Loss": 2.095332145690918, "Full-pretrain/Loss (Raw)": 2.095503330230713, "Full-pretrain/Step": 1068, "Full-pretrain/Step Time": 17.56404173746705} +{"Full-pretrain/Learning Rate": 4.9121202365436114e-05, "Full-pretrain/Loss": 2.093212127685547, "Full-pretrain/Loss (Raw)": 2.1414947509765625, "Full-pretrain/Step": 1069, "Full-pretrain/Step Time": 17.570307271555066} +{"Full-pretrain/Learning Rate": 4.9118969524735403e-05, "Full-pretrain/Loss": 2.0972418785095215, "Full-pretrain/Loss (Raw)": 2.2489259243011475, "Full-pretrain/Step": 1070, "Full-pretrain/Step Time": 17.563641745597124} +{"Full-pretrain/Learning Rate": 4.911673390192002e-05, "Full-pretrain/Loss": 2.091679573059082, "Full-pretrain/Loss (Raw)": 2.002418279647827, "Full-pretrain/Step": 1071, "Full-pretrain/Step Time": 17.564919652417302} +{"Full-pretrain/Learning Rate": 4.9114495497247864e-05, "Full-pretrain/Loss": 2.092310905456543, "Full-pretrain/Loss (Raw)": 2.125211000442505, "Full-pretrain/Step": 1072, "Full-pretrain/Step Time": 17.56450942158699} +{"Full-pretrain/Learning Rate": 4.911225431097712e-05, "Full-pretrain/Loss": 2.101259231567383, "Full-pretrain/Loss (Raw)": 1.8219587802886963, "Full-pretrain/Step": 1073, "Full-pretrain/Step Time": 17.569252274930477} +{"Full-pretrain/Learning Rate": 4.911001034336633e-05, "Full-pretrain/Loss": 2.0869548320770264, "Full-pretrain/Loss (Raw)": 1.7923182249069214, "Full-pretrain/Step": 1074, "Full-pretrain/Step Time": 17.570495365187526} +{"Full-pretrain/Learning Rate": 4.9107763594674303e-05, "Full-pretrain/Loss": 2.089498281478882, "Full-pretrain/Loss (Raw)": 2.117690324783325, "Full-pretrain/Step": 1075, "Full-pretrain/Step Time": 17.575976002961397} +{"Full-pretrain/Learning Rate": 4.910551406516023e-05, "Full-pretrain/Loss": 2.089888572692871, "Full-pretrain/Loss (Raw)": 2.1191635131835938, "Full-pretrain/Step": 1076, "Full-pretrain/Step Time": 17.572349769994617} +{"Full-pretrain/Learning Rate": 4.910326175508357e-05, "Full-pretrain/Loss": 2.0939931869506836, "Full-pretrain/Loss (Raw)": 2.0155389308929443, "Full-pretrain/Step": 1077, "Full-pretrain/Step Time": 17.572386825457215} +{"Full-pretrain/Learning Rate": 4.9101006664704145e-05, "Full-pretrain/Loss": 2.092533588409424, "Full-pretrain/Loss (Raw)": 2.114717483520508, "Full-pretrain/Step": 1078, "Full-pretrain/Step Time": 17.572918185964227} +{"Full-pretrain/Learning Rate": 4.909874879428207e-05, "Full-pretrain/Loss": 2.0969457626342773, "Full-pretrain/Loss (Raw)": 2.167781352996826, "Full-pretrain/Step": 1079, "Full-pretrain/Step Time": 17.577410588040948} +{"Full-pretrain/Learning Rate": 4.909648814407779e-05, "Full-pretrain/Loss": 2.0902857780456543, "Full-pretrain/Loss (Raw)": 1.8652245998382568, "Full-pretrain/Step": 1080, "Full-pretrain/Step Time": 17.579412499442697} +{"Full-pretrain/Learning Rate": 4.909422471435207e-05, "Full-pretrain/Loss": 2.093156337738037, "Full-pretrain/Loss (Raw)": 2.0757315158843994, "Full-pretrain/Step": 1081, "Full-pretrain/Step Time": 17.573087457567453} +{"Full-pretrain/Learning Rate": 4.9091958505366e-05, "Full-pretrain/Loss": 2.1058928966522217, "Full-pretrain/Loss (Raw)": 2.351559638977051, "Full-pretrain/Step": 1082, "Full-pretrain/Step Time": 17.5717541705817} +{"Full-pretrain/Learning Rate": 4.9089689517380974e-05, "Full-pretrain/Loss": 2.09968900680542, "Full-pretrain/Loss (Raw)": 1.900202751159668, "Full-pretrain/Step": 1083, "Full-pretrain/Step Time": 17.580272251740098} +{"Full-pretrain/Learning Rate": 4.908741775065873e-05, "Full-pretrain/Loss": 2.0910305976867676, "Full-pretrain/Loss (Raw)": 1.9394283294677734, "Full-pretrain/Step": 1084, "Full-pretrain/Step Time": 17.575892876833677} +{"Full-pretrain/Learning Rate": 4.908514320546131e-05, "Full-pretrain/Loss": 2.080848455429077, "Full-pretrain/Loss (Raw)": 1.9235692024230957, "Full-pretrain/Step": 1085, "Full-pretrain/Step Time": 17.569792410358787} +{"Full-pretrain/Learning Rate": 4.90828658820511e-05, "Full-pretrain/Loss": 2.0859718322753906, "Full-pretrain/Loss (Raw)": 2.249464750289917, "Full-pretrain/Step": 1086, "Full-pretrain/Step Time": 17.573289323598146} +{"Full-pretrain/Learning Rate": 4.908058578069077e-05, "Full-pretrain/Loss": 2.0829126834869385, "Full-pretrain/Loss (Raw)": 1.9966237545013428, "Full-pretrain/Step": 1087, "Full-pretrain/Step Time": 17.577045077458024} +{"Full-pretrain/Learning Rate": 4.907830290164332e-05, "Full-pretrain/Loss": 2.0861124992370605, "Full-pretrain/Loss (Raw)": 1.966037631034851, "Full-pretrain/Step": 1088, "Full-pretrain/Step Time": 17.576878622174263} +{"Full-pretrain/Learning Rate": 4.90760172451721e-05, "Full-pretrain/Loss": 2.084414482116699, "Full-pretrain/Loss (Raw)": 2.117502212524414, "Full-pretrain/Step": 1089, "Full-pretrain/Step Time": 17.577532647177577} +{"Full-pretrain/Learning Rate": 4.9073728811540756e-05, "Full-pretrain/Loss": 2.082970142364502, "Full-pretrain/Loss (Raw)": 2.0833919048309326, "Full-pretrain/Step": 1090, "Full-pretrain/Step Time": 17.576184721663594} +{"Full-pretrain/Learning Rate": 4.907143760101325e-05, "Full-pretrain/Loss": 2.087109088897705, "Full-pretrain/Loss (Raw)": 2.1251115798950195, "Full-pretrain/Step": 1091, "Full-pretrain/Step Time": 17.5764914881438} +{"Full-pretrain/Learning Rate": 4.9069143613853876e-05, "Full-pretrain/Loss": 2.0868513584136963, "Full-pretrain/Loss (Raw)": 2.2292895317077637, "Full-pretrain/Step": 1092, "Full-pretrain/Step Time": 17.57670077867806} +{"Full-pretrain/Learning Rate": 4.906684685032724e-05, "Full-pretrain/Loss": 2.0883069038391113, "Full-pretrain/Loss (Raw)": 2.098644971847534, "Full-pretrain/Step": 1093, "Full-pretrain/Step Time": 17.575273383408785} +{"Full-pretrain/Learning Rate": 4.9064547310698285e-05, "Full-pretrain/Loss": 2.0815796852111816, "Full-pretrain/Loss (Raw)": 2.057199478149414, "Full-pretrain/Step": 1094, "Full-pretrain/Step Time": 17.57800410874188} +{"Full-pretrain/Learning Rate": 4.906224499523225e-05, "Full-pretrain/Loss": 2.0825111865997314, "Full-pretrain/Loss (Raw)": 2.0237574577331543, "Full-pretrain/Step": 1095, "Full-pretrain/Step Time": 17.579513425007463} +{"Full-pretrain/Learning Rate": 4.9059939904194716e-05, "Full-pretrain/Loss": 2.063908338546753, "Full-pretrain/Loss (Raw)": 1.9645013809204102, "Full-pretrain/Step": 1096, "Full-pretrain/Step Time": 17.580348785966635} +{"Full-pretrain/Learning Rate": 4.905763203785156e-05, "Full-pretrain/Loss": 2.058598756790161, "Full-pretrain/Loss (Raw)": 1.9810353517532349, "Full-pretrain/Step": 1097, "Full-pretrain/Step Time": 17.587948951870203} +{"Full-pretrain/Learning Rate": 4.905532139646901e-05, "Full-pretrain/Loss": 2.059227466583252, "Full-pretrain/Loss (Raw)": 2.075634479522705, "Full-pretrain/Step": 1098, "Full-pretrain/Step Time": 17.582732807844877} +{"Full-pretrain/Learning Rate": 4.9053007980313594e-05, "Full-pretrain/Loss": 2.062955141067505, "Full-pretrain/Loss (Raw)": 2.2279281616210938, "Full-pretrain/Step": 1099, "Full-pretrain/Step Time": 17.580314982682467} +{"Full-pretrain/Learning Rate": 4.905069178965215e-05, "Full-pretrain/Loss": 2.0584466457366943, "Full-pretrain/Loss (Raw)": 1.9512310028076172, "Full-pretrain/Step": 1100, "Full-pretrain/Step Time": 17.582800179719925} +{"Full-pretrain/Learning Rate": 4.904837282475187e-05, "Full-pretrain/Loss": 2.0556044578552246, "Full-pretrain/Loss (Raw)": 2.050550699234009, "Full-pretrain/Step": 1101, "Full-pretrain/Step Time": 17.577835319563746} +{"Full-pretrain/Learning Rate": 4.904605108588023e-05, "Full-pretrain/Loss": 2.0462136268615723, "Full-pretrain/Loss (Raw)": 1.9484217166900635, "Full-pretrain/Step": 1102, "Full-pretrain/Step Time": 17.581232177093625} +{"Full-pretrain/Learning Rate": 4.9043726573305045e-05, "Full-pretrain/Loss": 2.049351930618286, "Full-pretrain/Loss (Raw)": 2.102837562561035, "Full-pretrain/Step": 1103, "Full-pretrain/Step Time": 17.58551201969385} +{"Full-pretrain/Learning Rate": 4.904139928729445e-05, "Full-pretrain/Loss": 2.0499277114868164, "Full-pretrain/Loss (Raw)": 2.143634796142578, "Full-pretrain/Step": 1104, "Full-pretrain/Step Time": 17.582110043615103} +{"Full-pretrain/Learning Rate": 4.90390692281169e-05, "Full-pretrain/Loss": 2.0514273643493652, "Full-pretrain/Loss (Raw)": 1.8699485063552856, "Full-pretrain/Step": 1105, "Full-pretrain/Step Time": 17.583099054172635} +{"Full-pretrain/Learning Rate": 4.903673639604116e-05, "Full-pretrain/Loss": 2.0622448921203613, "Full-pretrain/Loss (Raw)": 2.138477325439453, "Full-pretrain/Step": 1106, "Full-pretrain/Step Time": 17.584333831444383} +{"Full-pretrain/Learning Rate": 4.903440079133633e-05, "Full-pretrain/Loss": 2.066840648651123, "Full-pretrain/Loss (Raw)": 2.264761209487915, "Full-pretrain/Step": 1107, "Full-pretrain/Step Time": 17.581576293334365} +{"Full-pretrain/Learning Rate": 4.9032062414271804e-05, "Full-pretrain/Loss": 2.0595703125, "Full-pretrain/Loss (Raw)": 1.886509656906128, "Full-pretrain/Step": 1108, "Full-pretrain/Step Time": 17.588943637907505} +{"Full-pretrain/Learning Rate": 4.9029721265117335e-05, "Full-pretrain/Loss": 2.0606565475463867, "Full-pretrain/Loss (Raw)": 2.0503032207489014, "Full-pretrain/Step": 1109, "Full-pretrain/Step Time": 17.584522508084774} +{"Full-pretrain/Learning Rate": 4.9027377344142955e-05, "Full-pretrain/Loss": 2.055229663848877, "Full-pretrain/Loss (Raw)": 1.9410607814788818, "Full-pretrain/Step": 1110, "Full-pretrain/Step Time": 17.581704845651984} +{"Full-pretrain/Learning Rate": 4.9025030651619046e-05, "Full-pretrain/Loss": 2.0527901649475098, "Full-pretrain/Loss (Raw)": 2.0897090435028076, "Full-pretrain/Step": 1111, "Full-pretrain/Step Time": 17.58422975987196} +{"Full-pretrain/Learning Rate": 4.90226811878163e-05, "Full-pretrain/Loss": 2.065430164337158, "Full-pretrain/Loss (Raw)": 2.269706964492798, "Full-pretrain/Step": 1112, "Full-pretrain/Step Time": 17.592342276126146} +{"Full-pretrain/Learning Rate": 4.902032895300571e-05, "Full-pretrain/Loss": 2.0687007904052734, "Full-pretrain/Loss (Raw)": 2.180387496948242, "Full-pretrain/Step": 1113, "Full-pretrain/Step Time": 17.58983780257404} +{"Full-pretrain/Learning Rate": 4.901797394745862e-05, "Full-pretrain/Loss": 2.0624423027038574, "Full-pretrain/Loss (Raw)": 2.1512908935546875, "Full-pretrain/Step": 1114, "Full-pretrain/Step Time": 17.589259328320622} +{"Full-pretrain/Learning Rate": 4.9015616171446674e-05, "Full-pretrain/Loss": 2.064232349395752, "Full-pretrain/Loss (Raw)": 1.9574856758117676, "Full-pretrain/Step": 1115, "Full-pretrain/Step Time": 17.591160817071795} +{"Full-pretrain/Learning Rate": 4.9013255625241846e-05, "Full-pretrain/Loss": 2.0652551651000977, "Full-pretrain/Loss (Raw)": 1.97215735912323, "Full-pretrain/Step": 1116, "Full-pretrain/Step Time": 17.597436862066388} +{"Full-pretrain/Learning Rate": 4.901089230911642e-05, "Full-pretrain/Loss": 2.0685360431671143, "Full-pretrain/Loss (Raw)": 2.0285511016845703, "Full-pretrain/Step": 1117, "Full-pretrain/Step Time": 17.589482970535755} +{"Full-pretrain/Learning Rate": 4.900852622334301e-05, "Full-pretrain/Loss": 2.0582435131073, "Full-pretrain/Loss (Raw)": 1.9201107025146484, "Full-pretrain/Step": 1118, "Full-pretrain/Step Time": 17.589178819209337} +{"Full-pretrain/Learning Rate": 4.900615736819453e-05, "Full-pretrain/Loss": 2.060396194458008, "Full-pretrain/Loss (Raw)": 2.0655057430267334, "Full-pretrain/Step": 1119, "Full-pretrain/Step Time": 17.58884465135634} +{"Full-pretrain/Learning Rate": 4.900378574394423e-05, "Full-pretrain/Loss": 2.063122272491455, "Full-pretrain/Loss (Raw)": 2.0532727241516113, "Full-pretrain/Step": 1120, "Full-pretrain/Step Time": 17.592081025242805} +{"Full-pretrain/Learning Rate": 4.900141135086569e-05, "Full-pretrain/Loss": 2.0658907890319824, "Full-pretrain/Loss (Raw)": 2.2060930728912354, "Full-pretrain/Step": 1121, "Full-pretrain/Step Time": 17.595004165545106} +{"Full-pretrain/Learning Rate": 4.899903418923278e-05, "Full-pretrain/Loss": 2.060335636138916, "Full-pretrain/Loss (Raw)": 1.9056282043457031, "Full-pretrain/Step": 1122, "Full-pretrain/Step Time": 17.588648159056902} +{"Full-pretrain/Learning Rate": 4.8996654259319705e-05, "Full-pretrain/Loss": 2.06054425239563, "Full-pretrain/Loss (Raw)": 2.131791114807129, "Full-pretrain/Step": 1123, "Full-pretrain/Step Time": 17.58743591606617} +{"Full-pretrain/Learning Rate": 4.8994271561401e-05, "Full-pretrain/Loss": 2.051819324493408, "Full-pretrain/Loss (Raw)": 1.9500923156738281, "Full-pretrain/Step": 1124, "Full-pretrain/Step Time": 17.59621572867036} +{"Full-pretrain/Learning Rate": 4.899188609575151e-05, "Full-pretrain/Loss": 2.0546634197235107, "Full-pretrain/Loss (Raw)": 2.189657211303711, "Full-pretrain/Step": 1125, "Full-pretrain/Step Time": 17.602427046746016} +{"Full-pretrain/Learning Rate": 4.8989497862646374e-05, "Full-pretrain/Loss": 2.0614113807678223, "Full-pretrain/Loss (Raw)": 2.2731363773345947, "Full-pretrain/Step": 1126, "Full-pretrain/Step Time": 17.592730965465307} +{"Full-pretrain/Learning Rate": 4.89871068623611e-05, "Full-pretrain/Loss": 2.054597854614258, "Full-pretrain/Loss (Raw)": 1.8057218790054321, "Full-pretrain/Step": 1127, "Full-pretrain/Step Time": 17.593775145709515} +{"Full-pretrain/Learning Rate": 4.898471309517148e-05, "Full-pretrain/Loss": 2.058272123336792, "Full-pretrain/Loss (Raw)": 2.0820767879486084, "Full-pretrain/Step": 1128, "Full-pretrain/Step Time": 17.59896382689476} +{"Full-pretrain/Learning Rate": 4.898231656135363e-05, "Full-pretrain/Loss": 2.063866138458252, "Full-pretrain/Loss (Raw)": 2.1600499153137207, "Full-pretrain/Step": 1129, "Full-pretrain/Step Time": 17.604126995429397} +{"Full-pretrain/Learning Rate": 4.897991726118399e-05, "Full-pretrain/Loss": 2.0650687217712402, "Full-pretrain/Loss (Raw)": 2.1141061782836914, "Full-pretrain/Step": 1130, "Full-pretrain/Step Time": 17.60073136165738} +{"Full-pretrain/Learning Rate": 4.8977515194939325e-05, "Full-pretrain/Loss": 2.0593678951263428, "Full-pretrain/Loss (Raw)": 2.0455095767974854, "Full-pretrain/Step": 1131, "Full-pretrain/Step Time": 17.595834841951728} +{"Full-pretrain/Learning Rate": 4.8975110362896716e-05, "Full-pretrain/Loss": 2.065159797668457, "Full-pretrain/Loss (Raw)": 2.1365652084350586, "Full-pretrain/Step": 1132, "Full-pretrain/Step Time": 17.596268652006984} +{"Full-pretrain/Learning Rate": 4.897270276533354e-05, "Full-pretrain/Loss": 2.068692207336426, "Full-pretrain/Loss (Raw)": 2.1635890007019043, "Full-pretrain/Step": 1133, "Full-pretrain/Step Time": 17.599118500947952} +{"Full-pretrain/Learning Rate": 4.897029240252753e-05, "Full-pretrain/Loss": 2.0705878734588623, "Full-pretrain/Loss (Raw)": 2.0090861320495605, "Full-pretrain/Step": 1134, "Full-pretrain/Step Time": 17.597072517499328} +{"Full-pretrain/Learning Rate": 4.896787927475671e-05, "Full-pretrain/Loss": 2.0773215293884277, "Full-pretrain/Loss (Raw)": 2.3183159828186035, "Full-pretrain/Step": 1135, "Full-pretrain/Step Time": 17.59316861629486} +{"Full-pretrain/Learning Rate": 4.896546338229945e-05, "Full-pretrain/Loss": 2.078763961791992, "Full-pretrain/Loss (Raw)": 2.1897881031036377, "Full-pretrain/Step": 1136, "Full-pretrain/Step Time": 17.598352113738656} +{"Full-pretrain/Learning Rate": 4.89630447254344e-05, "Full-pretrain/Loss": 2.104404926300049, "Full-pretrain/Loss (Raw)": 2.6904637813568115, "Full-pretrain/Step": 1137, "Full-pretrain/Step Time": 17.60525467246771} +{"Full-pretrain/Learning Rate": 4.8960623304440565e-05, "Full-pretrain/Loss": 2.102973699569702, "Full-pretrain/Loss (Raw)": 2.0926804542541504, "Full-pretrain/Step": 1138, "Full-pretrain/Step Time": 17.602156177163124} +{"Full-pretrain/Learning Rate": 4.8958199119597256e-05, "Full-pretrain/Loss": 2.097748041152954, "Full-pretrain/Loss (Raw)": 2.0975379943847656, "Full-pretrain/Step": 1139, "Full-pretrain/Step Time": 17.60095672495663} +{"Full-pretrain/Learning Rate": 4.895577217118409e-05, "Full-pretrain/Loss": 2.106663465499878, "Full-pretrain/Loss (Raw)": 2.171802282333374, "Full-pretrain/Step": 1140, "Full-pretrain/Step Time": 17.60282347165048} +{"Full-pretrain/Learning Rate": 4.895334245948103e-05, "Full-pretrain/Loss": 2.100733995437622, "Full-pretrain/Loss (Raw)": 1.8605594635009766, "Full-pretrain/Step": 1141, "Full-pretrain/Step Time": 17.604789255186915} +{"Full-pretrain/Learning Rate": 4.8950909984768335e-05, "Full-pretrain/Loss": 2.107158899307251, "Full-pretrain/Loss (Raw)": 2.1466569900512695, "Full-pretrain/Step": 1142, "Full-pretrain/Step Time": 17.600164528936148} +{"Full-pretrain/Learning Rate": 4.894847474732658e-05, "Full-pretrain/Loss": 2.108733654022217, "Full-pretrain/Loss (Raw)": 2.140103816986084, "Full-pretrain/Step": 1143, "Full-pretrain/Step Time": 17.595397220924497} +{"Full-pretrain/Learning Rate": 4.894603674743669e-05, "Full-pretrain/Loss": 2.0951733589172363, "Full-pretrain/Loss (Raw)": 1.8357770442962646, "Full-pretrain/Step": 1144, "Full-pretrain/Step Time": 17.596033480018377} +{"Full-pretrain/Learning Rate": 4.894359598537988e-05, "Full-pretrain/Loss": 2.0847787857055664, "Full-pretrain/Loss (Raw)": 1.8477591276168823, "Full-pretrain/Step": 1145, "Full-pretrain/Step Time": 17.601323844864964} +{"Full-pretrain/Learning Rate": 4.894115246143768e-05, "Full-pretrain/Loss": 2.0812463760375977, "Full-pretrain/Loss (Raw)": 2.0382490158081055, "Full-pretrain/Step": 1146, "Full-pretrain/Step Time": 17.601430762559175} +{"Full-pretrain/Learning Rate": 4.893870617589196e-05, "Full-pretrain/Loss": 2.086501359939575, "Full-pretrain/Loss (Raw)": 2.125649929046631, "Full-pretrain/Step": 1147, "Full-pretrain/Step Time": 17.59636940062046} +{"Full-pretrain/Learning Rate": 4.893625712902489e-05, "Full-pretrain/Loss": 2.080699920654297, "Full-pretrain/Loss (Raw)": 1.786514401435852, "Full-pretrain/Step": 1148, "Full-pretrain/Step Time": 17.59432429075241} +{"Full-pretrain/Learning Rate": 4.8933805321118975e-05, "Full-pretrain/Loss": 2.085347890853882, "Full-pretrain/Loss (Raw)": 2.177281618118286, "Full-pretrain/Step": 1149, "Full-pretrain/Step Time": 17.600119752809405} +{"Full-pretrain/Learning Rate": 4.893135075245702e-05, "Full-pretrain/Loss": 2.082082509994507, "Full-pretrain/Loss (Raw)": 1.8156206607818604, "Full-pretrain/Step": 1150, "Full-pretrain/Step Time": 17.602858582511544} +{"Full-pretrain/Learning Rate": 4.892889342332218e-05, "Full-pretrain/Loss": 2.0782248973846436, "Full-pretrain/Loss (Raw)": 1.942061424255371, "Full-pretrain/Step": 1151, "Full-pretrain/Step Time": 17.600026154890656} +{"Full-pretrain/Learning Rate": 4.892643333399788e-05, "Full-pretrain/Loss": 2.0653347969055176, "Full-pretrain/Loss (Raw)": 1.6407963037490845, "Full-pretrain/Step": 1152, "Full-pretrain/Step Time": 17.601096354424953} +{"Full-pretrain/Learning Rate": 4.892397048476791e-05, "Full-pretrain/Loss": 2.0654451847076416, "Full-pretrain/Loss (Raw)": 2.2096195220947266, "Full-pretrain/Step": 1153, "Full-pretrain/Step Time": 17.599046235904098} +{"Full-pretrain/Learning Rate": 4.892150487591635e-05, "Full-pretrain/Loss": 2.072310447692871, "Full-pretrain/Loss (Raw)": 2.125321388244629, "Full-pretrain/Step": 1154, "Full-pretrain/Step Time": 17.600046506151557} +{"Full-pretrain/Learning Rate": 4.891903650772761e-05, "Full-pretrain/Loss": 2.0638651847839355, "Full-pretrain/Loss (Raw)": 1.8615385293960571, "Full-pretrain/Step": 1155, "Full-pretrain/Step Time": 17.59399320371449} +{"Full-pretrain/Learning Rate": 4.891656538048642e-05, "Full-pretrain/Loss": 2.073282241821289, "Full-pretrain/Loss (Raw)": 2.2514381408691406, "Full-pretrain/Step": 1156, "Full-pretrain/Step Time": 17.59156516008079} +{"Full-pretrain/Learning Rate": 4.891409149447781e-05, "Full-pretrain/Loss": 2.062321186065674, "Full-pretrain/Loss (Raw)": 1.8389005661010742, "Full-pretrain/Step": 1157, "Full-pretrain/Step Time": 17.592551488429308} +{"Full-pretrain/Learning Rate": 4.8911614849987154e-05, "Full-pretrain/Loss": 2.061089038848877, "Full-pretrain/Loss (Raw)": 2.2337088584899902, "Full-pretrain/Step": 1158, "Full-pretrain/Step Time": 17.595059018582106} +{"Full-pretrain/Learning Rate": 4.890913544730013e-05, "Full-pretrain/Loss": 2.0677356719970703, "Full-pretrain/Loss (Raw)": 2.01841402053833, "Full-pretrain/Step": 1159, "Full-pretrain/Step Time": 17.596922954544425} +{"Full-pretrain/Learning Rate": 4.890665328670273e-05, "Full-pretrain/Loss": 2.069629669189453, "Full-pretrain/Loss (Raw)": 2.1426804065704346, "Full-pretrain/Step": 1160, "Full-pretrain/Step Time": 17.584837779402733} +{"Full-pretrain/Learning Rate": 4.890416836848127e-05, "Full-pretrain/Loss": 2.069932699203491, "Full-pretrain/Loss (Raw)": 2.1697499752044678, "Full-pretrain/Step": 1161, "Full-pretrain/Step Time": 17.594812661409378} +{"Full-pretrain/Learning Rate": 4.89016806929224e-05, "Full-pretrain/Loss": 2.073819160461426, "Full-pretrain/Loss (Raw)": 2.238480806350708, "Full-pretrain/Step": 1162, "Full-pretrain/Step Time": 17.59019960835576} +{"Full-pretrain/Learning Rate": 4.889919026031306e-05, "Full-pretrain/Loss": 2.0695250034332275, "Full-pretrain/Loss (Raw)": 1.908087968826294, "Full-pretrain/Step": 1163, "Full-pretrain/Step Time": 17.594864636659622} +{"Full-pretrain/Learning Rate": 4.889669707094052e-05, "Full-pretrain/Loss": 2.0699567794799805, "Full-pretrain/Loss (Raw)": 2.150377035140991, "Full-pretrain/Step": 1164, "Full-pretrain/Step Time": 17.593499910086393} +{"Full-pretrain/Learning Rate": 4.889420112509237e-05, "Full-pretrain/Loss": 2.070377826690674, "Full-pretrain/Loss (Raw)": 2.177067756652832, "Full-pretrain/Step": 1165, "Full-pretrain/Step Time": 17.589317863807082} +{"Full-pretrain/Learning Rate": 4.889170242305652e-05, "Full-pretrain/Loss": 2.075639247894287, "Full-pretrain/Loss (Raw)": 2.1774587631225586, "Full-pretrain/Step": 1166, "Full-pretrain/Step Time": 17.592642698436975} +{"Full-pretrain/Learning Rate": 4.8889200965121184e-05, "Full-pretrain/Loss": 2.0673818588256836, "Full-pretrain/Loss (Raw)": 2.0540716648101807, "Full-pretrain/Step": 1167, "Full-pretrain/Step Time": 17.600923171266913} +{"Full-pretrain/Learning Rate": 4.8886696751574926e-05, "Full-pretrain/Loss": 2.059483051300049, "Full-pretrain/Loss (Raw)": 1.9370315074920654, "Full-pretrain/Step": 1168, "Full-pretrain/Step Time": 17.602887392044067} +{"Full-pretrain/Learning Rate": 4.888418978270658e-05, "Full-pretrain/Loss": 2.04714035987854, "Full-pretrain/Loss (Raw)": 2.295491933822632, "Full-pretrain/Step": 1169, "Full-pretrain/Step Time": 17.598739501088858} +{"Full-pretrain/Learning Rate": 4.888168005880533e-05, "Full-pretrain/Loss": 2.0442004203796387, "Full-pretrain/Loss (Raw)": 1.998600959777832, "Full-pretrain/Step": 1170, "Full-pretrain/Step Time": 17.597808677703142} +{"Full-pretrain/Learning Rate": 4.887916758016069e-05, "Full-pretrain/Loss": 2.0424795150756836, "Full-pretrain/Loss (Raw)": 2.042468547821045, "Full-pretrain/Step": 1171, "Full-pretrain/Step Time": 17.60231913998723} +{"Full-pretrain/Learning Rate": 4.887665234706246e-05, "Full-pretrain/Loss": 2.0326123237609863, "Full-pretrain/Loss (Raw)": 1.8560527563095093, "Full-pretrain/Step": 1172, "Full-pretrain/Step Time": 17.60880828090012} +{"Full-pretrain/Learning Rate": 4.887413435980077e-05, "Full-pretrain/Loss": 2.037482738494873, "Full-pretrain/Loss (Raw)": 2.0164108276367188, "Full-pretrain/Step": 1173, "Full-pretrain/Step Time": 17.60776331461966} +{"Full-pretrain/Learning Rate": 4.887161361866608e-05, "Full-pretrain/Loss": 2.0339016914367676, "Full-pretrain/Loss (Raw)": 2.032073974609375, "Full-pretrain/Step": 1174, "Full-pretrain/Step Time": 17.60242792405188} +{"Full-pretrain/Learning Rate": 4.886909012394913e-05, "Full-pretrain/Loss": 2.02917742729187, "Full-pretrain/Loss (Raw)": 1.9889219999313354, "Full-pretrain/Step": 1175, "Full-pretrain/Step Time": 17.61411647684872} +{"Full-pretrain/Learning Rate": 4.886656387594104e-05, "Full-pretrain/Loss": 2.0386829376220703, "Full-pretrain/Loss (Raw)": 2.139951705932617, "Full-pretrain/Step": 1176, "Full-pretrain/Step Time": 17.613186268135905} +{"Full-pretrain/Learning Rate": 4.886403487493319e-05, "Full-pretrain/Loss": 2.049093723297119, "Full-pretrain/Loss (Raw)": 2.180905342102051, "Full-pretrain/Step": 1177, "Full-pretrain/Step Time": 17.614180751144886} +{"Full-pretrain/Learning Rate": 4.88615031212173e-05, "Full-pretrain/Loss": 2.0487020015716553, "Full-pretrain/Loss (Raw)": 2.0257153511047363, "Full-pretrain/Step": 1178, "Full-pretrain/Step Time": 17.61083936318755} +{"Full-pretrain/Learning Rate": 4.885896861508541e-05, "Full-pretrain/Loss": 2.048900604248047, "Full-pretrain/Loss (Raw)": 2.132009506225586, "Full-pretrain/Step": 1179, "Full-pretrain/Step Time": 17.611069820821285} +{"Full-pretrain/Learning Rate": 4.885643135682988e-05, "Full-pretrain/Loss": 2.055846691131592, "Full-pretrain/Loss (Raw)": 2.0087857246398926, "Full-pretrain/Step": 1180, "Full-pretrain/Step Time": 17.6134225204587} +{"Full-pretrain/Learning Rate": 4.885389134674338e-05, "Full-pretrain/Loss": 2.054515838623047, "Full-pretrain/Loss (Raw)": 2.1346988677978516, "Full-pretrain/Step": 1181, "Full-pretrain/Step Time": 17.60903597995639} +{"Full-pretrain/Learning Rate": 4.885134858511888e-05, "Full-pretrain/Loss": 2.058807373046875, "Full-pretrain/Loss (Raw)": 1.9529480934143066, "Full-pretrain/Step": 1182, "Full-pretrain/Step Time": 17.60352393053472} +{"Full-pretrain/Learning Rate": 4.8848803072249715e-05, "Full-pretrain/Loss": 2.062340259552002, "Full-pretrain/Loss (Raw)": 2.0551159381866455, "Full-pretrain/Step": 1183, "Full-pretrain/Step Time": 17.605113992467523} +{"Full-pretrain/Learning Rate": 4.884625480842949e-05, "Full-pretrain/Loss": 2.0753073692321777, "Full-pretrain/Loss (Raw)": 2.055734634399414, "Full-pretrain/Step": 1184, "Full-pretrain/Step Time": 17.60827787965536} +{"Full-pretrain/Learning Rate": 4.884370379395215e-05, "Full-pretrain/Loss": 2.0738372802734375, "Full-pretrain/Loss (Raw)": 2.1625826358795166, "Full-pretrain/Step": 1185, "Full-pretrain/Step Time": 17.60335136204958} +{"Full-pretrain/Learning Rate": 4.884115002911197e-05, "Full-pretrain/Loss": 2.072157144546509, "Full-pretrain/Loss (Raw)": 2.0715537071228027, "Full-pretrain/Step": 1186, "Full-pretrain/Step Time": 17.595648439601064} +{"Full-pretrain/Learning Rate": 4.8838593514203505e-05, "Full-pretrain/Loss": 2.0798001289367676, "Full-pretrain/Loss (Raw)": 2.106119155883789, "Full-pretrain/Step": 1187, "Full-pretrain/Step Time": 17.60008417069912} +{"Full-pretrain/Learning Rate": 4.8836034249521653e-05, "Full-pretrain/Loss": 2.073098659515381, "Full-pretrain/Loss (Raw)": 2.036987066268921, "Full-pretrain/Step": 1188, "Full-pretrain/Step Time": 17.604933939874172} +{"Full-pretrain/Learning Rate": 4.883347223536163e-05, "Full-pretrain/Loss": 2.079404592514038, "Full-pretrain/Loss (Raw)": 2.0406885147094727, "Full-pretrain/Step": 1189, "Full-pretrain/Step Time": 17.59921457991004} +{"Full-pretrain/Learning Rate": 4.883090747201897e-05, "Full-pretrain/Loss": 2.069037914276123, "Full-pretrain/Loss (Raw)": 1.9019721746444702, "Full-pretrain/Step": 1190, "Full-pretrain/Step Time": 17.599650274962187} +{"Full-pretrain/Learning Rate": 4.8828339959789493e-05, "Full-pretrain/Loss": 2.062788248062134, "Full-pretrain/Loss (Raw)": 1.818429946899414, "Full-pretrain/Step": 1191, "Full-pretrain/Step Time": 17.60695148445666} +{"Full-pretrain/Learning Rate": 4.8825769698969384e-05, "Full-pretrain/Loss": 2.054266929626465, "Full-pretrain/Loss (Raw)": 1.8699952363967896, "Full-pretrain/Step": 1192, "Full-pretrain/Step Time": 17.610022800043225} +{"Full-pretrain/Learning Rate": 4.882319668985511e-05, "Full-pretrain/Loss": 2.0477113723754883, "Full-pretrain/Loss (Raw)": 1.9599740505218506, "Full-pretrain/Step": 1193, "Full-pretrain/Step Time": 17.60687099210918} +{"Full-pretrain/Learning Rate": 4.8820620932743465e-05, "Full-pretrain/Loss": 2.0417885780334473, "Full-pretrain/Loss (Raw)": 2.0489509105682373, "Full-pretrain/Step": 1194, "Full-pretrain/Step Time": 17.608417684212327} +{"Full-pretrain/Learning Rate": 4.8818042427931576e-05, "Full-pretrain/Loss": 2.045459508895874, "Full-pretrain/Loss (Raw)": 2.0255544185638428, "Full-pretrain/Step": 1195, "Full-pretrain/Step Time": 17.60768142156303} +{"Full-pretrain/Learning Rate": 4.8815461175716857e-05, "Full-pretrain/Loss": 2.0523757934570312, "Full-pretrain/Loss (Raw)": 2.371704578399658, "Full-pretrain/Step": 1196, "Full-pretrain/Step Time": 17.60745563171804} +{"Full-pretrain/Learning Rate": 4.881287717639706e-05, "Full-pretrain/Loss": 2.0509347915649414, "Full-pretrain/Loss (Raw)": 2.1309499740600586, "Full-pretrain/Step": 1197, "Full-pretrain/Step Time": 17.60499283671379} +{"Full-pretrain/Learning Rate": 4.8810290430270255e-05, "Full-pretrain/Loss": 2.06510591506958, "Full-pretrain/Loss (Raw)": 2.6309385299682617, "Full-pretrain/Step": 1198, "Full-pretrain/Step Time": 17.6051832921803} +{"Full-pretrain/Learning Rate": 4.8807700937634814e-05, "Full-pretrain/Loss": 2.069056510925293, "Full-pretrain/Loss (Raw)": 2.180485248565674, "Full-pretrain/Step": 1199, "Full-pretrain/Step Time": 17.606441468000412} +{"Full-pretrain/Learning Rate": 4.8805108698789435e-05, "Full-pretrain/Loss": 2.0828773975372314, "Full-pretrain/Loss (Raw)": 2.3793065547943115, "Full-pretrain/Step": 1200, "Full-pretrain/Step Time": 17.60574566014111} +{"Full-pretrain/Learning Rate": 4.880251371403313e-05, "Full-pretrain/Loss": 2.0812158584594727, "Full-pretrain/Loss (Raw)": 2.2423181533813477, "Full-pretrain/Step": 1201, "Full-pretrain/Step Time": 17.60491611622274} +{"Full-pretrain/Learning Rate": 4.879991598366524e-05, "Full-pretrain/Loss": 2.0753135681152344, "Full-pretrain/Loss (Raw)": 1.8097285032272339, "Full-pretrain/Step": 1202, "Full-pretrain/Step Time": 17.59853081777692} +{"Full-pretrain/Learning Rate": 4.87973155079854e-05, "Full-pretrain/Loss": 2.0751378536224365, "Full-pretrain/Loss (Raw)": 2.0368447303771973, "Full-pretrain/Step": 1203, "Full-pretrain/Step Time": 17.59736499376595} +{"Full-pretrain/Learning Rate": 4.879471228729358e-05, "Full-pretrain/Loss": 2.0790464878082275, "Full-pretrain/Loss (Raw)": 1.9811352491378784, "Full-pretrain/Step": 1204, "Full-pretrain/Step Time": 17.601175740361214} +{"Full-pretrain/Learning Rate": 4.8792106321890063e-05, "Full-pretrain/Loss": 2.080582618713379, "Full-pretrain/Loss (Raw)": 2.065568447113037, "Full-pretrain/Step": 1205, "Full-pretrain/Step Time": 17.60135466605425} +{"Full-pretrain/Learning Rate": 4.878949761207544e-05, "Full-pretrain/Loss": 2.088334560394287, "Full-pretrain/Loss (Raw)": 2.2801294326782227, "Full-pretrain/Step": 1206, "Full-pretrain/Step Time": 17.595591943711042} +{"Full-pretrain/Learning Rate": 4.8786886158150627e-05, "Full-pretrain/Loss": 2.0919899940490723, "Full-pretrain/Loss (Raw)": 2.105898380279541, "Full-pretrain/Step": 1207, "Full-pretrain/Step Time": 17.58996649645269} +{"Full-pretrain/Learning Rate": 4.878427196041686e-05, "Full-pretrain/Loss": 2.0869252681732178, "Full-pretrain/Loss (Raw)": 1.97788405418396, "Full-pretrain/Step": 1208, "Full-pretrain/Step Time": 17.587768463417888} +{"Full-pretrain/Learning Rate": 4.878165501917568e-05, "Full-pretrain/Loss": 2.0817840099334717, "Full-pretrain/Loss (Raw)": 2.0163822174072266, "Full-pretrain/Step": 1209, "Full-pretrain/Step Time": 17.598511481657624} +{"Full-pretrain/Learning Rate": 4.877903533472894e-05, "Full-pretrain/Loss": 2.0798146724700928, "Full-pretrain/Loss (Raw)": 1.962693691253662, "Full-pretrain/Step": 1210, "Full-pretrain/Step Time": 17.597169982269406} +{"Full-pretrain/Learning Rate": 4.877641290737884e-05, "Full-pretrain/Loss": 2.0797784328460693, "Full-pretrain/Loss (Raw)": 2.130850315093994, "Full-pretrain/Step": 1211, "Full-pretrain/Step Time": 17.589438498020172} +{"Full-pretrain/Learning Rate": 4.877378773742787e-05, "Full-pretrain/Loss": 2.0860908031463623, "Full-pretrain/Loss (Raw)": 2.2107858657836914, "Full-pretrain/Step": 1212, "Full-pretrain/Step Time": 17.5965757612139} +{"Full-pretrain/Learning Rate": 4.877115982517883e-05, "Full-pretrain/Loss": 2.085268974304199, "Full-pretrain/Loss (Raw)": 2.1084001064300537, "Full-pretrain/Step": 1213, "Full-pretrain/Step Time": 17.601549552753568} +{"Full-pretrain/Learning Rate": 4.8768529170934866e-05, "Full-pretrain/Loss": 2.0856692790985107, "Full-pretrain/Loss (Raw)": 1.9657526016235352, "Full-pretrain/Step": 1214, "Full-pretrain/Step Time": 17.60120357014239} +{"Full-pretrain/Learning Rate": 4.876589577499941e-05, "Full-pretrain/Loss": 2.0871996879577637, "Full-pretrain/Loss (Raw)": 2.104093551635742, "Full-pretrain/Step": 1215, "Full-pretrain/Step Time": 17.598394222557545} +{"Full-pretrain/Learning Rate": 4.876325963767623e-05, "Full-pretrain/Loss": 2.0765199661254883, "Full-pretrain/Loss (Raw)": 1.71397864818573, "Full-pretrain/Step": 1216, "Full-pretrain/Step Time": 17.59771047346294} +{"Full-pretrain/Learning Rate": 4.876062075926941e-05, "Full-pretrain/Loss": 2.0684499740600586, "Full-pretrain/Loss (Raw)": 1.9043406248092651, "Full-pretrain/Step": 1217, "Full-pretrain/Step Time": 17.604342628270388} +{"Full-pretrain/Learning Rate": 4.8757979140083324e-05, "Full-pretrain/Loss": 2.0637755393981934, "Full-pretrain/Loss (Raw)": 1.9219765663146973, "Full-pretrain/Step": 1218, "Full-pretrain/Step Time": 17.604434875771403} +{"Full-pretrain/Learning Rate": 4.875533478042269e-05, "Full-pretrain/Loss": 2.059675693511963, "Full-pretrain/Loss (Raw)": 1.9749271869659424, "Full-pretrain/Step": 1219, "Full-pretrain/Step Time": 17.598369089886546} +{"Full-pretrain/Learning Rate": 4.875268768059255e-05, "Full-pretrain/Loss": 2.058534622192383, "Full-pretrain/Loss (Raw)": 2.000469207763672, "Full-pretrain/Step": 1220, "Full-pretrain/Step Time": 17.598499294370413} +{"Full-pretrain/Learning Rate": 4.875003784089822e-05, "Full-pretrain/Loss": 2.060788154602051, "Full-pretrain/Loss (Raw)": 2.1128017902374268, "Full-pretrain/Step": 1221, "Full-pretrain/Step Time": 17.609090145677328} +{"Full-pretrain/Learning Rate": 4.874738526164538e-05, "Full-pretrain/Loss": 2.067722797393799, "Full-pretrain/Loss (Raw)": 2.123880386352539, "Full-pretrain/Step": 1222, "Full-pretrain/Step Time": 17.605558024719357} +{"Full-pretrain/Learning Rate": 4.8744729943139996e-05, "Full-pretrain/Loss": 2.076612949371338, "Full-pretrain/Loss (Raw)": 2.1029233932495117, "Full-pretrain/Step": 1223, "Full-pretrain/Step Time": 17.600993735715747} +{"Full-pretrain/Learning Rate": 4.8742071885688356e-05, "Full-pretrain/Loss": 2.079575300216675, "Full-pretrain/Loss (Raw)": 1.96478271484375, "Full-pretrain/Step": 1224, "Full-pretrain/Step Time": 17.597726058214903} +{"Full-pretrain/Learning Rate": 4.8739411089597065e-05, "Full-pretrain/Loss": 2.076493501663208, "Full-pretrain/Loss (Raw)": 1.8613590002059937, "Full-pretrain/Step": 1225, "Full-pretrain/Step Time": 17.59410554356873} +{"Full-pretrain/Learning Rate": 4.8736747555173047e-05, "Full-pretrain/Loss": 2.075622797012329, "Full-pretrain/Loss (Raw)": 2.0210824012756348, "Full-pretrain/Step": 1226, "Full-pretrain/Step Time": 17.598675748333335} +{"Full-pretrain/Learning Rate": 4.8734081282723544e-05, "Full-pretrain/Loss": 2.081871271133423, "Full-pretrain/Loss (Raw)": 2.225511074066162, "Full-pretrain/Step": 1227, "Full-pretrain/Step Time": 17.597294168546796} +{"Full-pretrain/Learning Rate": 4.8731412272556105e-05, "Full-pretrain/Loss": 2.0675387382507324, "Full-pretrain/Loss (Raw)": 1.9130637645721436, "Full-pretrain/Step": 1228, "Full-pretrain/Step Time": 17.59199116937816} +{"Full-pretrain/Learning Rate": 4.87287405249786e-05, "Full-pretrain/Loss": 2.0670957565307617, "Full-pretrain/Loss (Raw)": 2.116774082183838, "Full-pretrain/Step": 1229, "Full-pretrain/Step Time": 17.59728330746293} +{"Full-pretrain/Learning Rate": 4.872606604029921e-05, "Full-pretrain/Loss": 2.0529332160949707, "Full-pretrain/Loss (Raw)": 2.177737236022949, "Full-pretrain/Step": 1230, "Full-pretrain/Step Time": 17.60025619342923} +{"Full-pretrain/Learning Rate": 4.872338881882644e-05, "Full-pretrain/Loss": 2.053401470184326, "Full-pretrain/Loss (Raw)": 2.1954703330993652, "Full-pretrain/Step": 1231, "Full-pretrain/Step Time": 17.59480180591345} +{"Full-pretrain/Learning Rate": 4.872070886086912e-05, "Full-pretrain/Loss": 2.044869899749756, "Full-pretrain/Loss (Raw)": 2.106293201446533, "Full-pretrain/Step": 1232, "Full-pretrain/Step Time": 17.598414067178965} +{"Full-pretrain/Learning Rate": 4.8718026166736357e-05, "Full-pretrain/Loss": 2.0336179733276367, "Full-pretrain/Loss (Raw)": 1.8822537660598755, "Full-pretrain/Step": 1233, "Full-pretrain/Step Time": 17.59429942443967} +{"Full-pretrain/Learning Rate": 4.8715340736737616e-05, "Full-pretrain/Loss": 2.039527177810669, "Full-pretrain/Loss (Raw)": 1.9988285303115845, "Full-pretrain/Step": 1234, "Full-pretrain/Step Time": 17.601834440603852} +{"Full-pretrain/Learning Rate": 4.871265257118265e-05, "Full-pretrain/Loss": 2.0398356914520264, "Full-pretrain/Loss (Raw)": 2.0467147827148438, "Full-pretrain/Step": 1235, "Full-pretrain/Step Time": 17.608258923515677} +{"Full-pretrain/Learning Rate": 4.870996167038154e-05, "Full-pretrain/Loss": 2.042900562286377, "Full-pretrain/Loss (Raw)": 2.079214096069336, "Full-pretrain/Step": 1236, "Full-pretrain/Step Time": 17.604042815044522} +{"Full-pretrain/Learning Rate": 4.870726803464469e-05, "Full-pretrain/Loss": 2.045280933380127, "Full-pretrain/Loss (Raw)": 2.1417431831359863, "Full-pretrain/Step": 1237, "Full-pretrain/Step Time": 17.60627321153879} +{"Full-pretrain/Learning Rate": 4.8704571664282806e-05, "Full-pretrain/Loss": 2.0362439155578613, "Full-pretrain/Loss (Raw)": 1.990943193435669, "Full-pretrain/Step": 1238, "Full-pretrain/Step Time": 17.61113976687193} +{"Full-pretrain/Learning Rate": 4.870187255960691e-05, "Full-pretrain/Loss": 2.0405526161193848, "Full-pretrain/Loss (Raw)": 2.2437682151794434, "Full-pretrain/Step": 1239, "Full-pretrain/Step Time": 17.611935902386904} +{"Full-pretrain/Learning Rate": 4.869917072092834e-05, "Full-pretrain/Loss": 2.0389368534088135, "Full-pretrain/Loss (Raw)": 1.9261877536773682, "Full-pretrain/Step": 1240, "Full-pretrain/Step Time": 17.609250025823712} +{"Full-pretrain/Learning Rate": 4.869646614855876e-05, "Full-pretrain/Loss": 2.0406625270843506, "Full-pretrain/Loss (Raw)": 2.071603298187256, "Full-pretrain/Step": 1241, "Full-pretrain/Step Time": 17.614070910960436} +{"Full-pretrain/Learning Rate": 4.869375884281013e-05, "Full-pretrain/Loss": 2.043940544128418, "Full-pretrain/Loss (Raw)": 2.067591428756714, "Full-pretrain/Step": 1242, "Full-pretrain/Step Time": 17.613779462873936} +{"Full-pretrain/Learning Rate": 4.869104880399475e-05, "Full-pretrain/Loss": 2.03518009185791, "Full-pretrain/Loss (Raw)": 1.8505058288574219, "Full-pretrain/Step": 1243, "Full-pretrain/Step Time": 17.619220035150647} +{"Full-pretrain/Learning Rate": 4.868833603242522e-05, "Full-pretrain/Loss": 2.021749496459961, "Full-pretrain/Loss (Raw)": 1.7810182571411133, "Full-pretrain/Step": 1244, "Full-pretrain/Step Time": 17.608846956864} +{"Full-pretrain/Learning Rate": 4.8685620528414445e-05, "Full-pretrain/Loss": 2.02355694770813, "Full-pretrain/Loss (Raw)": 2.166236162185669, "Full-pretrain/Step": 1245, "Full-pretrain/Step Time": 17.61507390625775} +{"Full-pretrain/Learning Rate": 4.8682902292275664e-05, "Full-pretrain/Loss": 2.0349764823913574, "Full-pretrain/Loss (Raw)": 2.331171989440918, "Full-pretrain/Step": 1246, "Full-pretrain/Step Time": 17.615211471915245} +{"Full-pretrain/Learning Rate": 4.868018132432244e-05, "Full-pretrain/Loss": 2.0348880290985107, "Full-pretrain/Loss (Raw)": 2.101262092590332, "Full-pretrain/Step": 1247, "Full-pretrain/Step Time": 17.618699410930276} +{"Full-pretrain/Learning Rate": 4.867745762486861e-05, "Full-pretrain/Loss": 2.0490245819091797, "Full-pretrain/Loss (Raw)": 2.166349411010742, "Full-pretrain/Step": 1248, "Full-pretrain/Step Time": 17.613875227048993} +{"Full-pretrain/Learning Rate": 4.867473119422837e-05, "Full-pretrain/Loss": 2.0582070350646973, "Full-pretrain/Loss (Raw)": 2.198183536529541, "Full-pretrain/Step": 1249, "Full-pretrain/Step Time": 17.619095051661134} +{"Full-pretrain/Learning Rate": 4.8672002032716203e-05, "Full-pretrain/Loss": 2.0565311908721924, "Full-pretrain/Loss (Raw)": 1.8683457374572754, "Full-pretrain/Step": 1250, "Full-pretrain/Step Time": 17.6235460806638} +{"Full-pretrain/Learning Rate": 4.866927014064692e-05, "Full-pretrain/Loss": 2.0635299682617188, "Full-pretrain/Loss (Raw)": 2.1988914012908936, "Full-pretrain/Step": 1251, "Full-pretrain/Step Time": 17.624841429293156} +{"Full-pretrain/Learning Rate": 4.866653551833564e-05, "Full-pretrain/Loss": 2.0665855407714844, "Full-pretrain/Loss (Raw)": 2.0982418060302734, "Full-pretrain/Step": 1252, "Full-pretrain/Step Time": 17.615782853215933} +{"Full-pretrain/Learning Rate": 4.8663798166097816e-05, "Full-pretrain/Loss": 2.067328453063965, "Full-pretrain/Loss (Raw)": 2.1365718841552734, "Full-pretrain/Step": 1253, "Full-pretrain/Step Time": 17.614921279251575} +{"Full-pretrain/Learning Rate": 4.8661058084249176e-05, "Full-pretrain/Loss": 2.067121982574463, "Full-pretrain/Loss (Raw)": 2.117281675338745, "Full-pretrain/Step": 1254, "Full-pretrain/Step Time": 17.62128254957497} +{"Full-pretrain/Learning Rate": 4.865831527310581e-05, "Full-pretrain/Loss": 2.059459686279297, "Full-pretrain/Loss (Raw)": 1.8577332496643066, "Full-pretrain/Step": 1255, "Full-pretrain/Step Time": 17.623356010764837} +{"Full-pretrain/Learning Rate": 4.86555697329841e-05, "Full-pretrain/Loss": 2.0576066970825195, "Full-pretrain/Loss (Raw)": 1.9054794311523438, "Full-pretrain/Step": 1256, "Full-pretrain/Step Time": 17.620764557272196} +{"Full-pretrain/Learning Rate": 4.865282146420072e-05, "Full-pretrain/Loss": 2.0635712146759033, "Full-pretrain/Loss (Raw)": 2.0522255897521973, "Full-pretrain/Step": 1257, "Full-pretrain/Step Time": 17.618373619392514} +{"Full-pretrain/Learning Rate": 4.86500704670727e-05, "Full-pretrain/Loss": 2.066711187362671, "Full-pretrain/Loss (Raw)": 2.1215577125549316, "Full-pretrain/Step": 1258, "Full-pretrain/Step Time": 17.61947369016707} +{"Full-pretrain/Learning Rate": 4.8647316741917366e-05, "Full-pretrain/Loss": 2.060703754425049, "Full-pretrain/Loss (Raw)": 2.033276081085205, "Full-pretrain/Step": 1259, "Full-pretrain/Step Time": 17.62591015174985} +{"Full-pretrain/Learning Rate": 4.8644560289052354e-05, "Full-pretrain/Loss": 2.0585360527038574, "Full-pretrain/Loss (Raw)": 1.8437004089355469, "Full-pretrain/Step": 1260, "Full-pretrain/Step Time": 17.621064314618707} +{"Full-pretrain/Learning Rate": 4.864180110879562e-05, "Full-pretrain/Loss": 2.0555899143218994, "Full-pretrain/Loss (Raw)": 2.0224907398223877, "Full-pretrain/Step": 1261, "Full-pretrain/Step Time": 17.61989052966237} +{"Full-pretrain/Learning Rate": 4.8639039201465444e-05, "Full-pretrain/Loss": 2.0419042110443115, "Full-pretrain/Loss (Raw)": 1.7397935390472412, "Full-pretrain/Step": 1262, "Full-pretrain/Step Time": 17.622277157381177} +{"Full-pretrain/Learning Rate": 4.8636274567380394e-05, "Full-pretrain/Loss": 2.0415477752685547, "Full-pretrain/Loss (Raw)": 2.184065341949463, "Full-pretrain/Step": 1263, "Full-pretrain/Step Time": 17.625450851395726} +{"Full-pretrain/Learning Rate": 4.8633507206859385e-05, "Full-pretrain/Loss": 2.0401673316955566, "Full-pretrain/Loss (Raw)": 2.0621235370635986, "Full-pretrain/Step": 1264, "Full-pretrain/Step Time": 17.62218659184873} +{"Full-pretrain/Learning Rate": 4.863073712022162e-05, "Full-pretrain/Loss": 2.056788206100464, "Full-pretrain/Loss (Raw)": 2.4141147136688232, "Full-pretrain/Step": 1265, "Full-pretrain/Step Time": 17.619760839268565} +{"Full-pretrain/Learning Rate": 4.862796430778663e-05, "Full-pretrain/Loss": 2.061558485031128, "Full-pretrain/Loss (Raw)": 2.151479721069336, "Full-pretrain/Step": 1266, "Full-pretrain/Step Time": 17.620498487725854} +{"Full-pretrain/Learning Rate": 4.8625188769874274e-05, "Full-pretrain/Loss": 2.058326244354248, "Full-pretrain/Loss (Raw)": 1.943281650543213, "Full-pretrain/Step": 1267, "Full-pretrain/Step Time": 17.62250868231058} +{"Full-pretrain/Learning Rate": 4.8622410506804686e-05, "Full-pretrain/Loss": 2.058884620666504, "Full-pretrain/Loss (Raw)": 2.09708833694458, "Full-pretrain/Step": 1268, "Full-pretrain/Step Time": 17.621101062744856} +{"Full-pretrain/Learning Rate": 4.8619629518898344e-05, "Full-pretrain/Loss": 2.0598156452178955, "Full-pretrain/Loss (Raw)": 2.171534538269043, "Full-pretrain/Step": 1269, "Full-pretrain/Step Time": 17.61889623105526} +{"Full-pretrain/Learning Rate": 4.861684580647605e-05, "Full-pretrain/Loss": 2.063551425933838, "Full-pretrain/Loss (Raw)": 2.1104884147644043, "Full-pretrain/Step": 1270, "Full-pretrain/Step Time": 17.62100002542138} +{"Full-pretrain/Learning Rate": 4.861405936985888e-05, "Full-pretrain/Loss": 2.0597469806671143, "Full-pretrain/Loss (Raw)": 2.1220273971557617, "Full-pretrain/Step": 1271, "Full-pretrain/Step Time": 17.626820420846343} +{"Full-pretrain/Learning Rate": 4.861127020936827e-05, "Full-pretrain/Loss": 2.0638771057128906, "Full-pretrain/Loss (Raw)": 2.0583460330963135, "Full-pretrain/Step": 1272, "Full-pretrain/Step Time": 17.624981831759214} +{"Full-pretrain/Learning Rate": 4.8608478325325935e-05, "Full-pretrain/Loss": 2.078523874282837, "Full-pretrain/Loss (Raw)": 2.5403079986572266, "Full-pretrain/Step": 1273, "Full-pretrain/Step Time": 17.62019906193018} +{"Full-pretrain/Learning Rate": 4.860568371805392e-05, "Full-pretrain/Loss": 2.0864758491516113, "Full-pretrain/Loss (Raw)": 2.3220484256744385, "Full-pretrain/Step": 1274, "Full-pretrain/Step Time": 17.620698461309075} +{"Full-pretrain/Learning Rate": 4.860288638787458e-05, "Full-pretrain/Loss": 2.088283061981201, "Full-pretrain/Loss (Raw)": 1.9083425998687744, "Full-pretrain/Step": 1275, "Full-pretrain/Step Time": 17.62303213775158} +{"Full-pretrain/Learning Rate": 4.860008633511059e-05, "Full-pretrain/Loss": 2.090258836746216, "Full-pretrain/Loss (Raw)": 1.8442397117614746, "Full-pretrain/Step": 1276, "Full-pretrain/Step Time": 17.618332916870713} +{"Full-pretrain/Learning Rate": 4.859728356008495e-05, "Full-pretrain/Loss": 2.0827527046203613, "Full-pretrain/Loss (Raw)": 1.9260393381118774, "Full-pretrain/Step": 1277, "Full-pretrain/Step Time": 17.61348182335496} +{"Full-pretrain/Learning Rate": 4.859447806312093e-05, "Full-pretrain/Loss": 2.0695595741271973, "Full-pretrain/Loss (Raw)": 1.9089934825897217, "Full-pretrain/Step": 1278, "Full-pretrain/Step Time": 17.61382037959993} +{"Full-pretrain/Learning Rate": 4.859166984454216e-05, "Full-pretrain/Loss": 2.0615386962890625, "Full-pretrain/Loss (Raw)": 1.8445968627929688, "Full-pretrain/Step": 1279, "Full-pretrain/Step Time": 17.618965834379196} +{"Full-pretrain/Learning Rate": 4.858885890467256e-05, "Full-pretrain/Loss": 2.058868646621704, "Full-pretrain/Loss (Raw)": 2.080904960632324, "Full-pretrain/Step": 1280, "Full-pretrain/Step Time": 17.610236017033458} +{"Full-pretrain/Learning Rate": 4.8586045243836386e-05, "Full-pretrain/Loss": 2.0570855140686035, "Full-pretrain/Loss (Raw)": 2.14111590385437, "Full-pretrain/Step": 1281, "Full-pretrain/Step Time": 17.60974499769509} +{"Full-pretrain/Learning Rate": 4.858322886235817e-05, "Full-pretrain/Loss": 2.063046932220459, "Full-pretrain/Loss (Raw)": 2.0591139793395996, "Full-pretrain/Step": 1282, "Full-pretrain/Step Time": 17.611834932118654} +{"Full-pretrain/Learning Rate": 4.85804097605628e-05, "Full-pretrain/Loss": 2.066193103790283, "Full-pretrain/Loss (Raw)": 2.299570083618164, "Full-pretrain/Step": 1283, "Full-pretrain/Step Time": 17.61601012572646} +{"Full-pretrain/Learning Rate": 4.857758793877545e-05, "Full-pretrain/Loss": 2.0665173530578613, "Full-pretrain/Loss (Raw)": 2.1086249351501465, "Full-pretrain/Step": 1284, "Full-pretrain/Step Time": 17.620612295344472} +{"Full-pretrain/Learning Rate": 4.8574763397321614e-05, "Full-pretrain/Loss": 2.0662074089050293, "Full-pretrain/Loss (Raw)": 2.126648426055908, "Full-pretrain/Step": 1285, "Full-pretrain/Step Time": 17.612863149493933} +{"Full-pretrain/Learning Rate": 4.857193613652711e-05, "Full-pretrain/Loss": 2.0622177124023438, "Full-pretrain/Loss (Raw)": 1.9896115064620972, "Full-pretrain/Step": 1286, "Full-pretrain/Step Time": 17.616507289931178} +{"Full-pretrain/Learning Rate": 4.856910615671805e-05, "Full-pretrain/Loss": 2.071295738220215, "Full-pretrain/Loss (Raw)": 2.1482317447662354, "Full-pretrain/Step": 1287, "Full-pretrain/Step Time": 17.61797965504229} +{"Full-pretrain/Learning Rate": 4.856627345822088e-05, "Full-pretrain/Loss": 2.0713486671447754, "Full-pretrain/Loss (Raw)": 1.9071705341339111, "Full-pretrain/Step": 1288, "Full-pretrain/Step Time": 17.623752918094397} +{"Full-pretrain/Learning Rate": 4.8563438041362354e-05, "Full-pretrain/Loss": 2.0812840461730957, "Full-pretrain/Loss (Raw)": 2.3701536655426025, "Full-pretrain/Step": 1289, "Full-pretrain/Step Time": 17.61332083493471} +{"Full-pretrain/Learning Rate": 4.8560599906469515e-05, "Full-pretrain/Loss": 2.079730987548828, "Full-pretrain/Loss (Raw)": 2.07185959815979, "Full-pretrain/Step": 1290, "Full-pretrain/Step Time": 17.6138698104769} +{"Full-pretrain/Learning Rate": 4.855775905386977e-05, "Full-pretrain/Loss": 2.084181308746338, "Full-pretrain/Loss (Raw)": 2.1756880283355713, "Full-pretrain/Step": 1291, "Full-pretrain/Step Time": 17.622071197256446} +{"Full-pretrain/Learning Rate": 4.855491548389079e-05, "Full-pretrain/Loss": 2.0904541015625, "Full-pretrain/Loss (Raw)": 2.0444343090057373, "Full-pretrain/Step": 1292, "Full-pretrain/Step Time": 17.61638561822474} +{"Full-pretrain/Learning Rate": 4.8552069196860595e-05, "Full-pretrain/Loss": 2.089481830596924, "Full-pretrain/Loss (Raw)": 1.9913723468780518, "Full-pretrain/Step": 1293, "Full-pretrain/Step Time": 17.621864980086684} +{"Full-pretrain/Learning Rate": 4.8549220193107494e-05, "Full-pretrain/Loss": 2.0961947441101074, "Full-pretrain/Loss (Raw)": 1.9546128511428833, "Full-pretrain/Step": 1294, "Full-pretrain/Step Time": 17.62126993946731} +{"Full-pretrain/Learning Rate": 4.854636847296011e-05, "Full-pretrain/Loss": 2.092747211456299, "Full-pretrain/Loss (Raw)": 2.0737390518188477, "Full-pretrain/Step": 1295, "Full-pretrain/Step Time": 17.622303375974298} +{"Full-pretrain/Learning Rate": 4.8543514036747405e-05, "Full-pretrain/Loss": 2.0889883041381836, "Full-pretrain/Loss (Raw)": 1.9418476819992065, "Full-pretrain/Step": 1296, "Full-pretrain/Step Time": 17.62005632929504} +{"Full-pretrain/Learning Rate": 4.854065688479863e-05, "Full-pretrain/Loss": 2.0741825103759766, "Full-pretrain/Loss (Raw)": 1.9403274059295654, "Full-pretrain/Step": 1297, "Full-pretrain/Step Time": 17.62197893485427} +{"Full-pretrain/Learning Rate": 4.8537797017443356e-05, "Full-pretrain/Loss": 2.069831371307373, "Full-pretrain/Loss (Raw)": 2.0122461318969727, "Full-pretrain/Step": 1298, "Full-pretrain/Step Time": 17.62279214709997} +{"Full-pretrain/Learning Rate": 4.853493443501147e-05, "Full-pretrain/Loss": 2.077877998352051, "Full-pretrain/Loss (Raw)": 2.2007627487182617, "Full-pretrain/Step": 1299, "Full-pretrain/Step Time": 17.619128555059433} +{"Full-pretrain/Learning Rate": 4.8532069137833156e-05, "Full-pretrain/Loss": 2.077868700027466, "Full-pretrain/Loss (Raw)": 2.096795082092285, "Full-pretrain/Step": 1300, "Full-pretrain/Step Time": 17.613386081531644} +{"Full-pretrain/Learning Rate": 4.852920112623895e-05, "Full-pretrain/Loss": 2.079711437225342, "Full-pretrain/Loss (Raw)": 2.230498790740967, "Full-pretrain/Step": 1301, "Full-pretrain/Step Time": 17.617380117997527} +{"Full-pretrain/Learning Rate": 4.8526330400559664e-05, "Full-pretrain/Loss": 2.0733017921447754, "Full-pretrain/Loss (Raw)": 1.905378818511963, "Full-pretrain/Step": 1302, "Full-pretrain/Step Time": 17.62236139923334} +{"Full-pretrain/Learning Rate": 4.8523456961126425e-05, "Full-pretrain/Loss": 2.0777463912963867, "Full-pretrain/Loss (Raw)": 2.2642602920532227, "Full-pretrain/Step": 1303, "Full-pretrain/Step Time": 17.61570749245584} +{"Full-pretrain/Learning Rate": 4.852058080827069e-05, "Full-pretrain/Loss": 2.074950695037842, "Full-pretrain/Loss (Raw)": 1.968885898590088, "Full-pretrain/Step": 1304, "Full-pretrain/Step Time": 17.621946090832353} +{"Full-pretrain/Learning Rate": 4.851770194232423e-05, "Full-pretrain/Loss": 2.0598905086517334, "Full-pretrain/Loss (Raw)": 2.0583815574645996, "Full-pretrain/Step": 1305, "Full-pretrain/Step Time": 17.62272540293634} +{"Full-pretrain/Learning Rate": 4.8514820363619115e-05, "Full-pretrain/Loss": 2.050849437713623, "Full-pretrain/Loss (Raw)": 2.032728433609009, "Full-pretrain/Step": 1306, "Full-pretrain/Step Time": 17.6268680524081} +{"Full-pretrain/Learning Rate": 4.8511936072487735e-05, "Full-pretrain/Loss": 2.052309513092041, "Full-pretrain/Loss (Raw)": 1.9550676345825195, "Full-pretrain/Step": 1307, "Full-pretrain/Step Time": 17.625976962968707} +{"Full-pretrain/Learning Rate": 4.850904906926279e-05, "Full-pretrain/Loss": 2.0527749061584473, "Full-pretrain/Loss (Raw)": 1.8591320514678955, "Full-pretrain/Step": 1308, "Full-pretrain/Step Time": 17.62348524853587} +{"Full-pretrain/Learning Rate": 4.85061593542773e-05, "Full-pretrain/Loss": 2.0492238998413086, "Full-pretrain/Loss (Raw)": 1.8124113082885742, "Full-pretrain/Step": 1309, "Full-pretrain/Step Time": 17.62527588941157} +{"Full-pretrain/Learning Rate": 4.850326692786459e-05, "Full-pretrain/Loss": 2.05802845954895, "Full-pretrain/Loss (Raw)": 2.1907360553741455, "Full-pretrain/Step": 1310, "Full-pretrain/Step Time": 17.624898049980402} +{"Full-pretrain/Learning Rate": 4.850037179035829e-05, "Full-pretrain/Loss": 2.064842939376831, "Full-pretrain/Loss (Raw)": 2.0626635551452637, "Full-pretrain/Step": 1311, "Full-pretrain/Step Time": 17.61840659379959} +{"Full-pretrain/Learning Rate": 4.849747394209237e-05, "Full-pretrain/Loss": 2.062243938446045, "Full-pretrain/Loss (Raw)": 1.9977368116378784, "Full-pretrain/Step": 1312, "Full-pretrain/Step Time": 17.623341359198093} +{"Full-pretrain/Learning Rate": 4.849457338340109e-05, "Full-pretrain/Loss": 2.062406063079834, "Full-pretrain/Loss (Raw)": 2.1463067531585693, "Full-pretrain/Step": 1313, "Full-pretrain/Step Time": 17.62431207485497} +{"Full-pretrain/Learning Rate": 4.849167011461903e-05, "Full-pretrain/Loss": 2.0625030994415283, "Full-pretrain/Loss (Raw)": 2.062216281890869, "Full-pretrain/Step": 1314, "Full-pretrain/Step Time": 17.63026027008891} +{"Full-pretrain/Learning Rate": 4.8488764136081065e-05, "Full-pretrain/Loss": 2.055774211883545, "Full-pretrain/Loss (Raw)": 2.0842506885528564, "Full-pretrain/Step": 1315, "Full-pretrain/Step Time": 17.62566809915006} +{"Full-pretrain/Learning Rate": 4.848585544812242e-05, "Full-pretrain/Loss": 2.0529959201812744, "Full-pretrain/Loss (Raw)": 2.019714832305908, "Full-pretrain/Step": 1316, "Full-pretrain/Step Time": 17.62663316167891} +{"Full-pretrain/Learning Rate": 4.84829440510786e-05, "Full-pretrain/Loss": 2.0522031784057617, "Full-pretrain/Loss (Raw)": 2.101278781890869, "Full-pretrain/Step": 1317, "Full-pretrain/Step Time": 17.628865737468004} +{"Full-pretrain/Learning Rate": 4.848002994528543e-05, "Full-pretrain/Loss": 2.056478261947632, "Full-pretrain/Loss (Raw)": 2.126415729522705, "Full-pretrain/Step": 1318, "Full-pretrain/Step Time": 17.625459169968963} +{"Full-pretrain/Learning Rate": 4.847711313107907e-05, "Full-pretrain/Loss": 2.050288438796997, "Full-pretrain/Loss (Raw)": 1.9501609802246094, "Full-pretrain/Step": 1319, "Full-pretrain/Step Time": 17.619952423498034} +{"Full-pretrain/Learning Rate": 4.847419360879596e-05, "Full-pretrain/Loss": 2.055081367492676, "Full-pretrain/Loss (Raw)": 2.0605390071868896, "Full-pretrain/Step": 1320, "Full-pretrain/Step Time": 17.623964516445994} +{"Full-pretrain/Learning Rate": 4.847127137877286e-05, "Full-pretrain/Loss": 2.0498995780944824, "Full-pretrain/Loss (Raw)": 2.204333782196045, "Full-pretrain/Step": 1321, "Full-pretrain/Step Time": 17.622884625568986} +{"Full-pretrain/Learning Rate": 4.846834644134686e-05, "Full-pretrain/Loss": 2.050619125366211, "Full-pretrain/Loss (Raw)": 2.0948915481567383, "Full-pretrain/Step": 1322, "Full-pretrain/Step Time": 17.617612270638347} +{"Full-pretrain/Learning Rate": 4.846541879685533e-05, "Full-pretrain/Loss": 2.0466837882995605, "Full-pretrain/Loss (Raw)": 2.0497608184814453, "Full-pretrain/Step": 1323, "Full-pretrain/Step Time": 17.620837479829788} +{"Full-pretrain/Learning Rate": 4.846248844563601e-05, "Full-pretrain/Loss": 2.0503575801849365, "Full-pretrain/Loss (Raw)": 2.161985397338867, "Full-pretrain/Step": 1324, "Full-pretrain/Step Time": 17.619879575446248} +{"Full-pretrain/Learning Rate": 4.845955538802688e-05, "Full-pretrain/Loss": 2.055039405822754, "Full-pretrain/Loss (Raw)": 2.1411972045898438, "Full-pretrain/Step": 1325, "Full-pretrain/Step Time": 17.62132959626615} +{"Full-pretrain/Learning Rate": 4.8456619624366286e-05, "Full-pretrain/Loss": 2.058558225631714, "Full-pretrain/Loss (Raw)": 2.0672130584716797, "Full-pretrain/Step": 1326, "Full-pretrain/Step Time": 17.617149274796247} +{"Full-pretrain/Learning Rate": 4.845368115499286e-05, "Full-pretrain/Loss": 2.058772563934326, "Full-pretrain/Loss (Raw)": 2.080601692199707, "Full-pretrain/Step": 1327, "Full-pretrain/Step Time": 17.614289121702313} +{"Full-pretrain/Learning Rate": 4.8450739980245555e-05, "Full-pretrain/Loss": 2.0617215633392334, "Full-pretrain/Loss (Raw)": 2.036210775375366, "Full-pretrain/Step": 1328, "Full-pretrain/Step Time": 17.6181173697114} +{"Full-pretrain/Learning Rate": 4.8447796100463626e-05, "Full-pretrain/Loss": 2.0642781257629395, "Full-pretrain/Loss (Raw)": 2.0221333503723145, "Full-pretrain/Step": 1329, "Full-pretrain/Step Time": 17.616846105083823} +{"Full-pretrain/Learning Rate": 4.844484951598667e-05, "Full-pretrain/Loss": 2.061786651611328, "Full-pretrain/Loss (Raw)": 1.9325228929519653, "Full-pretrain/Step": 1330, "Full-pretrain/Step Time": 17.621703170239925} +{"Full-pretrain/Learning Rate": 4.844190022715456e-05, "Full-pretrain/Loss": 2.0460798740386963, "Full-pretrain/Loss (Raw)": 1.6981430053710938, "Full-pretrain/Step": 1331, "Full-pretrain/Step Time": 17.61569087021053} +{"Full-pretrain/Learning Rate": 4.843894823430749e-05, "Full-pretrain/Loss": 2.0453529357910156, "Full-pretrain/Loss (Raw)": 2.073533296585083, "Full-pretrain/Step": 1332, "Full-pretrain/Step Time": 17.616327043622732} +{"Full-pretrain/Learning Rate": 4.843599353778598e-05, "Full-pretrain/Loss": 2.0403239727020264, "Full-pretrain/Loss (Raw)": 2.069568634033203, "Full-pretrain/Step": 1333, "Full-pretrain/Step Time": 17.616695262491703} +{"Full-pretrain/Learning Rate": 4.843303613793085e-05, "Full-pretrain/Loss": 2.039675235748291, "Full-pretrain/Loss (Raw)": 1.8846232891082764, "Full-pretrain/Step": 1334, "Full-pretrain/Step Time": 17.62179276160896} +{"Full-pretrain/Learning Rate": 4.843007603508324e-05, "Full-pretrain/Loss": 2.0332722663879395, "Full-pretrain/Loss (Raw)": 2.059359550476074, "Full-pretrain/Step": 1335, "Full-pretrain/Step Time": 17.626621713861823} +{"Full-pretrain/Learning Rate": 4.842711322958459e-05, "Full-pretrain/Loss": 2.039900779724121, "Full-pretrain/Loss (Raw)": 2.1810035705566406, "Full-pretrain/Step": 1336, "Full-pretrain/Step Time": 17.632477406412363} +{"Full-pretrain/Learning Rate": 4.842414772177667e-05, "Full-pretrain/Loss": 2.0435142517089844, "Full-pretrain/Loss (Raw)": 2.1740105152130127, "Full-pretrain/Step": 1337, "Full-pretrain/Step Time": 17.625411342829466} +{"Full-pretrain/Learning Rate": 4.842117951200153e-05, "Full-pretrain/Loss": 2.0399749279022217, "Full-pretrain/Loss (Raw)": 1.91947340965271, "Full-pretrain/Step": 1338, "Full-pretrain/Step Time": 17.630793321877718} +{"Full-pretrain/Learning Rate": 4.841820860060157e-05, "Full-pretrain/Loss": 2.0441715717315674, "Full-pretrain/Loss (Raw)": 2.0893592834472656, "Full-pretrain/Step": 1339, "Full-pretrain/Step Time": 17.632465356960893} +{"Full-pretrain/Learning Rate": 4.841523498791948e-05, "Full-pretrain/Loss": 2.052077293395996, "Full-pretrain/Loss (Raw)": 2.1121225357055664, "Full-pretrain/Step": 1340, "Full-pretrain/Step Time": 17.631613163277507} +{"Full-pretrain/Learning Rate": 4.841225867429826e-05, "Full-pretrain/Loss": 2.0561022758483887, "Full-pretrain/Loss (Raw)": 1.9412027597427368, "Full-pretrain/Step": 1341, "Full-pretrain/Step Time": 17.63237687200308} +{"Full-pretrain/Learning Rate": 4.840927966008123e-05, "Full-pretrain/Loss": 2.055387020111084, "Full-pretrain/Loss (Raw)": 2.1678528785705566, "Full-pretrain/Step": 1342, "Full-pretrain/Step Time": 17.630942337214947} +{"Full-pretrain/Learning Rate": 4.840629794561202e-05, "Full-pretrain/Loss": 2.060422897338867, "Full-pretrain/Loss (Raw)": 2.2238121032714844, "Full-pretrain/Step": 1343, "Full-pretrain/Step Time": 17.63423104584217} +{"Full-pretrain/Learning Rate": 4.840331353123456e-05, "Full-pretrain/Loss": 2.0540037155151367, "Full-pretrain/Loss (Raw)": 1.7923226356506348, "Full-pretrain/Step": 1344, "Full-pretrain/Step Time": 17.63303149305284} +{"Full-pretrain/Learning Rate": 4.8400326417293115e-05, "Full-pretrain/Loss": 2.055253028869629, "Full-pretrain/Loss (Raw)": 2.1862809658050537, "Full-pretrain/Step": 1345, "Full-pretrain/Step Time": 17.629093259572983} +{"Full-pretrain/Learning Rate": 4.839733660413224e-05, "Full-pretrain/Loss": 2.054752826690674, "Full-pretrain/Loss (Raw)": 2.046215057373047, "Full-pretrain/Step": 1346, "Full-pretrain/Step Time": 17.6239194534719} +{"Full-pretrain/Learning Rate": 4.8394344092096814e-05, "Full-pretrain/Loss": 2.0532631874084473, "Full-pretrain/Loss (Raw)": 2.0365772247314453, "Full-pretrain/Step": 1347, "Full-pretrain/Step Time": 17.63204431720078} +{"Full-pretrain/Learning Rate": 4.839134888153202e-05, "Full-pretrain/Loss": 2.059816837310791, "Full-pretrain/Loss (Raw)": 2.229435920715332, "Full-pretrain/Step": 1348, "Full-pretrain/Step Time": 17.632718455046415} +{"Full-pretrain/Learning Rate": 4.8388350972783346e-05, "Full-pretrain/Loss": 2.063650608062744, "Full-pretrain/Loss (Raw)": 2.223954200744629, "Full-pretrain/Step": 1349, "Full-pretrain/Step Time": 17.628334745764732} +{"Full-pretrain/Learning Rate": 4.8385350366196605e-05, "Full-pretrain/Loss": 2.0666792392730713, "Full-pretrain/Loss (Raw)": 2.2233335971832275, "Full-pretrain/Step": 1350, "Full-pretrain/Step Time": 17.622349184006453} +{"Full-pretrain/Learning Rate": 4.838234706211792e-05, "Full-pretrain/Loss": 2.069492816925049, "Full-pretrain/Loss (Raw)": 2.040191650390625, "Full-pretrain/Step": 1351, "Full-pretrain/Step Time": 17.6353868432343} +{"Full-pretrain/Learning Rate": 4.8379341060893725e-05, "Full-pretrain/Loss": 2.067728281021118, "Full-pretrain/Loss (Raw)": 2.0040807723999023, "Full-pretrain/Step": 1352, "Full-pretrain/Step Time": 17.639045460149646} +{"Full-pretrain/Learning Rate": 4.8376332362870745e-05, "Full-pretrain/Loss": 2.057274103164673, "Full-pretrain/Loss (Raw)": 1.8697961568832397, "Full-pretrain/Step": 1353, "Full-pretrain/Step Time": 17.641346339136362} +{"Full-pretrain/Learning Rate": 4.8373320968396046e-05, "Full-pretrain/Loss": 2.057539939880371, "Full-pretrain/Loss (Raw)": 2.1033997535705566, "Full-pretrain/Step": 1354, "Full-pretrain/Step Time": 17.634518841281533} +{"Full-pretrain/Learning Rate": 4.837030687781699e-05, "Full-pretrain/Loss": 2.0522453784942627, "Full-pretrain/Loss (Raw)": 1.880333662033081, "Full-pretrain/Step": 1355, "Full-pretrain/Step Time": 17.646200651302934} +{"Full-pretrain/Learning Rate": 4.8367290091481245e-05, "Full-pretrain/Loss": 2.047478675842285, "Full-pretrain/Loss (Raw)": 2.0094518661499023, "Full-pretrain/Step": 1356, "Full-pretrain/Step Time": 17.646601689979434} +{"Full-pretrain/Learning Rate": 4.8364270609736794e-05, "Full-pretrain/Loss": 2.0387253761291504, "Full-pretrain/Loss (Raw)": 1.8610916137695312, "Full-pretrain/Step": 1357, "Full-pretrain/Step Time": 17.644410146400332} +{"Full-pretrain/Learning Rate": 4.836124843293195e-05, "Full-pretrain/Loss": 2.0351357460021973, "Full-pretrain/Loss (Raw)": 1.9523470401763916, "Full-pretrain/Step": 1358, "Full-pretrain/Step Time": 17.638888413086534} +{"Full-pretrain/Learning Rate": 4.8358223561415304e-05, "Full-pretrain/Loss": 2.0314877033233643, "Full-pretrain/Loss (Raw)": 1.9638619422912598, "Full-pretrain/Step": 1359, "Full-pretrain/Step Time": 17.64077964052558} +{"Full-pretrain/Learning Rate": 4.835519599553578e-05, "Full-pretrain/Loss": 2.034162998199463, "Full-pretrain/Loss (Raw)": 2.1218161582946777, "Full-pretrain/Step": 1360, "Full-pretrain/Step Time": 17.63736356422305} +{"Full-pretrain/Learning Rate": 4.8352165735642604e-05, "Full-pretrain/Loss": 2.030874252319336, "Full-pretrain/Loss (Raw)": 1.916900873184204, "Full-pretrain/Step": 1361, "Full-pretrain/Step Time": 17.640924433246255} +{"Full-pretrain/Learning Rate": 4.8349132782085316e-05, "Full-pretrain/Loss": 2.031280517578125, "Full-pretrain/Loss (Raw)": 1.9455208778381348, "Full-pretrain/Step": 1362, "Full-pretrain/Step Time": 17.63607414998114} +{"Full-pretrain/Learning Rate": 4.8346097135213766e-05, "Full-pretrain/Loss": 2.0461926460266113, "Full-pretrain/Loss (Raw)": 2.175333023071289, "Full-pretrain/Step": 1363, "Full-pretrain/Step Time": 17.633918678388} +{"Full-pretrain/Learning Rate": 4.834305879537813e-05, "Full-pretrain/Loss": 2.0468199253082275, "Full-pretrain/Loss (Raw)": 2.0936036109924316, "Full-pretrain/Step": 1364, "Full-pretrain/Step Time": 17.62862773053348} +{"Full-pretrain/Learning Rate": 4.8340017762928845e-05, "Full-pretrain/Loss": 2.0451693534851074, "Full-pretrain/Loss (Raw)": 2.016751766204834, "Full-pretrain/Step": 1365, "Full-pretrain/Step Time": 17.631861543282866} +{"Full-pretrain/Learning Rate": 4.833697403821672e-05, "Full-pretrain/Loss": 2.0559067726135254, "Full-pretrain/Loss (Raw)": 2.228222370147705, "Full-pretrain/Step": 1366, "Full-pretrain/Step Time": 17.628261171281338} +{"Full-pretrain/Learning Rate": 4.833392762159285e-05, "Full-pretrain/Loss": 2.0578155517578125, "Full-pretrain/Loss (Raw)": 2.12044095993042, "Full-pretrain/Step": 1367, "Full-pretrain/Step Time": 17.626764707267284} +{"Full-pretrain/Learning Rate": 4.833087851340862e-05, "Full-pretrain/Loss": 2.054537296295166, "Full-pretrain/Loss (Raw)": 2.076096534729004, "Full-pretrain/Step": 1368, "Full-pretrain/Step Time": 17.625183565542102} +{"Full-pretrain/Learning Rate": 4.832782671401575e-05, "Full-pretrain/Loss": 2.051176071166992, "Full-pretrain/Loss (Raw)": 2.06644344329834, "Full-pretrain/Step": 1369, "Full-pretrain/Step Time": 17.616445103660226} +{"Full-pretrain/Learning Rate": 4.8324772223766276e-05, "Full-pretrain/Loss": 2.0583314895629883, "Full-pretrain/Loss (Raw)": 2.1484522819519043, "Full-pretrain/Step": 1370, "Full-pretrain/Step Time": 17.622609484940767} +{"Full-pretrain/Learning Rate": 4.832171504301252e-05, "Full-pretrain/Loss": 2.0552921295166016, "Full-pretrain/Loss (Raw)": 1.992103099822998, "Full-pretrain/Step": 1371, "Full-pretrain/Step Time": 17.617438979446888} +{"Full-pretrain/Learning Rate": 4.8318655172107126e-05, "Full-pretrain/Loss": 2.048107147216797, "Full-pretrain/Loss (Raw)": 1.882200837135315, "Full-pretrain/Step": 1372, "Full-pretrain/Step Time": 17.625590013340116} +{"Full-pretrain/Learning Rate": 4.831559261140305e-05, "Full-pretrain/Loss": 2.0555601119995117, "Full-pretrain/Loss (Raw)": 2.1796977519989014, "Full-pretrain/Step": 1373, "Full-pretrain/Step Time": 17.617460016161203} +{"Full-pretrain/Learning Rate": 4.831252736125357e-05, "Full-pretrain/Loss": 2.051116943359375, "Full-pretrain/Loss (Raw)": 2.0256693363189697, "Full-pretrain/Step": 1374, "Full-pretrain/Step Time": 17.625477373600006} +{"Full-pretrain/Learning Rate": 4.830945942201224e-05, "Full-pretrain/Loss": 2.0434162616729736, "Full-pretrain/Loss (Raw)": 1.9773964881896973, "Full-pretrain/Step": 1375, "Full-pretrain/Step Time": 17.619557293131948} +{"Full-pretrain/Learning Rate": 4.830638879403297e-05, "Full-pretrain/Loss": 2.048518180847168, "Full-pretrain/Loss (Raw)": 1.9555797576904297, "Full-pretrain/Step": 1376, "Full-pretrain/Step Time": 17.62474991194904} +{"Full-pretrain/Learning Rate": 4.830331547766993e-05, "Full-pretrain/Loss": 2.0381922721862793, "Full-pretrain/Loss (Raw)": 1.8558517694473267, "Full-pretrain/Step": 1377, "Full-pretrain/Step Time": 17.61689938046038} +{"Full-pretrain/Learning Rate": 4.830023947327764e-05, "Full-pretrain/Loss": 2.034367561340332, "Full-pretrain/Loss (Raw)": 1.9238253831863403, "Full-pretrain/Step": 1378, "Full-pretrain/Step Time": 17.61905610561371} +{"Full-pretrain/Learning Rate": 4.8297160781210925e-05, "Full-pretrain/Loss": 2.0348117351531982, "Full-pretrain/Loss (Raw)": 2.0507941246032715, "Full-pretrain/Step": 1379, "Full-pretrain/Step Time": 17.61889691092074} +{"Full-pretrain/Learning Rate": 4.82940794018249e-05, "Full-pretrain/Loss": 2.0274863243103027, "Full-pretrain/Loss (Raw)": 1.9950190782546997, "Full-pretrain/Step": 1380, "Full-pretrain/Step Time": 17.620580445975065} +{"Full-pretrain/Learning Rate": 4.8290995335475e-05, "Full-pretrain/Loss": 2.016897678375244, "Full-pretrain/Loss (Raw)": 1.8851158618927002, "Full-pretrain/Step": 1381, "Full-pretrain/Step Time": 17.612581381574273} +{"Full-pretrain/Learning Rate": 4.828790858251697e-05, "Full-pretrain/Loss": 2.0160348415374756, "Full-pretrain/Loss (Raw)": 2.1957273483276367, "Full-pretrain/Step": 1382, "Full-pretrain/Step Time": 17.612322088330984} +{"Full-pretrain/Learning Rate": 4.828481914330687e-05, "Full-pretrain/Loss": 2.0154776573181152, "Full-pretrain/Loss (Raw)": 2.022359848022461, "Full-pretrain/Step": 1383, "Full-pretrain/Step Time": 17.60989724099636} +{"Full-pretrain/Learning Rate": 4.828172701820106e-05, "Full-pretrain/Loss": 2.0150647163391113, "Full-pretrain/Loss (Raw)": 1.990868091583252, "Full-pretrain/Step": 1384, "Full-pretrain/Step Time": 17.610371198505163} +{"Full-pretrain/Learning Rate": 4.827863220755623e-05, "Full-pretrain/Loss": 2.025970935821533, "Full-pretrain/Loss (Raw)": 2.2187881469726562, "Full-pretrain/Step": 1385, "Full-pretrain/Step Time": 17.607219396159053} +{"Full-pretrain/Learning Rate": 4.827553471172935e-05, "Full-pretrain/Loss": 2.0252435207366943, "Full-pretrain/Loss (Raw)": 2.080127716064453, "Full-pretrain/Step": 1386, "Full-pretrain/Step Time": 17.607826804742217} +{"Full-pretrain/Learning Rate": 4.827243453107772e-05, "Full-pretrain/Loss": 2.028757095336914, "Full-pretrain/Loss (Raw)": 1.9927647113800049, "Full-pretrain/Step": 1387, "Full-pretrain/Step Time": 17.60506552644074} +{"Full-pretrain/Learning Rate": 4.826933166595895e-05, "Full-pretrain/Loss": 2.0382606983184814, "Full-pretrain/Loss (Raw)": 2.3135673999786377, "Full-pretrain/Step": 1388, "Full-pretrain/Step Time": 17.61150981672108} +{"Full-pretrain/Learning Rate": 4.826622611673094e-05, "Full-pretrain/Loss": 2.0380401611328125, "Full-pretrain/Loss (Raw)": 1.8540409803390503, "Full-pretrain/Step": 1389, "Full-pretrain/Step Time": 17.60324042662978} +{"Full-pretrain/Learning Rate": 4.826311788375193e-05, "Full-pretrain/Loss": 2.0404067039489746, "Full-pretrain/Loss (Raw)": 2.0280683040618896, "Full-pretrain/Step": 1390, "Full-pretrain/Step Time": 17.60993203893304} +{"Full-pretrain/Learning Rate": 4.826000696738045e-05, "Full-pretrain/Loss": 2.0351696014404297, "Full-pretrain/Loss (Raw)": 1.796286702156067, "Full-pretrain/Step": 1391, "Full-pretrain/Step Time": 17.609073139727116} +{"Full-pretrain/Learning Rate": 4.825689336797534e-05, "Full-pretrain/Loss": 2.0347232818603516, "Full-pretrain/Loss (Raw)": 2.1075215339660645, "Full-pretrain/Step": 1392, "Full-pretrain/Step Time": 17.606008434668183} +{"Full-pretrain/Learning Rate": 4.825377708589575e-05, "Full-pretrain/Loss": 2.0332093238830566, "Full-pretrain/Loss (Raw)": 1.8684598207473755, "Full-pretrain/Step": 1393, "Full-pretrain/Step Time": 17.601461488753557} +{"Full-pretrain/Learning Rate": 4.8250658121501144e-05, "Full-pretrain/Loss": 2.0351691246032715, "Full-pretrain/Loss (Raw)": 2.0082385540008545, "Full-pretrain/Step": 1394, "Full-pretrain/Step Time": 17.59966387040913} +{"Full-pretrain/Learning Rate": 4.82475364751513e-05, "Full-pretrain/Loss": 2.032454252243042, "Full-pretrain/Loss (Raw)": 2.088452100753784, "Full-pretrain/Step": 1395, "Full-pretrain/Step Time": 17.599921133369207} +{"Full-pretrain/Learning Rate": 4.8244412147206284e-05, "Full-pretrain/Loss": 2.0260839462280273, "Full-pretrain/Loss (Raw)": 1.8897520303726196, "Full-pretrain/Step": 1396, "Full-pretrain/Step Time": 17.595176888629794} +{"Full-pretrain/Learning Rate": 4.8241285138026506e-05, "Full-pretrain/Loss": 2.0274887084960938, "Full-pretrain/Loss (Raw)": 2.0617032051086426, "Full-pretrain/Step": 1397, "Full-pretrain/Step Time": 17.589559951797128} +{"Full-pretrain/Learning Rate": 4.823815544797265e-05, "Full-pretrain/Loss": 2.0195255279541016, "Full-pretrain/Loss (Raw)": 1.9734069108963013, "Full-pretrain/Step": 1398, "Full-pretrain/Step Time": 17.58883836492896} +{"Full-pretrain/Learning Rate": 4.823502307740573e-05, "Full-pretrain/Loss": 2.0092649459838867, "Full-pretrain/Loss (Raw)": 1.792090892791748, "Full-pretrain/Step": 1399, "Full-pretrain/Step Time": 17.590818095952272} +{"Full-pretrain/Learning Rate": 4.823188802668707e-05, "Full-pretrain/Loss": 2.003180503845215, "Full-pretrain/Loss (Raw)": 1.8814021348953247, "Full-pretrain/Step": 1400, "Full-pretrain/Step Time": 17.592094598338008} +{"Full-pretrain/Learning Rate": 4.8228750296178275e-05, "Full-pretrain/Loss": 2.003441333770752, "Full-pretrain/Loss (Raw)": 2.0747945308685303, "Full-pretrain/Step": 1401, "Full-pretrain/Step Time": 17.586905520409346} +{"Full-pretrain/Learning Rate": 4.822560988624131e-05, "Full-pretrain/Loss": 2.001157283782959, "Full-pretrain/Loss (Raw)": 2.075355052947998, "Full-pretrain/Step": 1402, "Full-pretrain/Step Time": 17.590768042951822} +{"Full-pretrain/Learning Rate": 4.8222466797238396e-05, "Full-pretrain/Loss": 2.0048255920410156, "Full-pretrain/Loss (Raw)": 2.1094958782196045, "Full-pretrain/Step": 1403, "Full-pretrain/Step Time": 17.589719677343965} +{"Full-pretrain/Learning Rate": 4.821932102953211e-05, "Full-pretrain/Loss": 2.0107898712158203, "Full-pretrain/Loss (Raw)": 2.0730502605438232, "Full-pretrain/Step": 1404, "Full-pretrain/Step Time": 17.5925357285887} +{"Full-pretrain/Learning Rate": 4.821617258348529e-05, "Full-pretrain/Loss": 2.0028738975524902, "Full-pretrain/Loss (Raw)": 1.926392912864685, "Full-pretrain/Step": 1405, "Full-pretrain/Step Time": 17.5893350020051} +{"Full-pretrain/Learning Rate": 4.821302145946113e-05, "Full-pretrain/Loss": 2.001237392425537, "Full-pretrain/Loss (Raw)": 1.9732952117919922, "Full-pretrain/Step": 1406, "Full-pretrain/Step Time": 17.581758487969637} +{"Full-pretrain/Learning Rate": 4.8209867657823104e-05, "Full-pretrain/Loss": 1.99049711227417, "Full-pretrain/Loss (Raw)": 1.6337140798568726, "Full-pretrain/Step": 1407, "Full-pretrain/Step Time": 17.579797161743045} +{"Full-pretrain/Learning Rate": 4.8206711178934996e-05, "Full-pretrain/Loss": 1.989609718322754, "Full-pretrain/Loss (Raw)": 1.9271750450134277, "Full-pretrain/Step": 1408, "Full-pretrain/Step Time": 17.59279366955161} +{"Full-pretrain/Learning Rate": 4.8203552023160905e-05, "Full-pretrain/Loss": 1.9871457815170288, "Full-pretrain/Loss (Raw)": 1.7770087718963623, "Full-pretrain/Step": 1409, "Full-pretrain/Step Time": 17.586843671277165} +{"Full-pretrain/Learning Rate": 4.8200390190865254e-05, "Full-pretrain/Loss": 1.9941961765289307, "Full-pretrain/Loss (Raw)": 2.149444103240967, "Full-pretrain/Step": 1410, "Full-pretrain/Step Time": 17.584729900583625} +{"Full-pretrain/Learning Rate": 4.819722568241274e-05, "Full-pretrain/Loss": 1.9929203987121582, "Full-pretrain/Loss (Raw)": 2.009967803955078, "Full-pretrain/Step": 1411, "Full-pretrain/Step Time": 17.58515614643693} +{"Full-pretrain/Learning Rate": 4.819405849816839e-05, "Full-pretrain/Loss": 1.993126630783081, "Full-pretrain/Loss (Raw)": 2.0016157627105713, "Full-pretrain/Step": 1412, "Full-pretrain/Step Time": 17.58406911790371} +{"Full-pretrain/Learning Rate": 4.8190888638497556e-05, "Full-pretrain/Loss": 1.9926867485046387, "Full-pretrain/Loss (Raw)": 1.8710379600524902, "Full-pretrain/Step": 1413, "Full-pretrain/Step Time": 17.58581188134849} +{"Full-pretrain/Learning Rate": 4.8187716103765856e-05, "Full-pretrain/Loss": 1.983891487121582, "Full-pretrain/Loss (Raw)": 1.9142838716506958, "Full-pretrain/Step": 1414, "Full-pretrain/Step Time": 17.57916454412043} +{"Full-pretrain/Learning Rate": 4.818454089433926e-05, "Full-pretrain/Loss": 1.9787166118621826, "Full-pretrain/Loss (Raw)": 1.8567614555358887, "Full-pretrain/Step": 1415, "Full-pretrain/Step Time": 17.578814646229148} +{"Full-pretrain/Learning Rate": 4.8181363010584013e-05, "Full-pretrain/Loss": 1.9781681299209595, "Full-pretrain/Loss (Raw)": 1.9733176231384277, "Full-pretrain/Step": 1416, "Full-pretrain/Step Time": 17.580729389563203} +{"Full-pretrain/Learning Rate": 4.81781824528667e-05, "Full-pretrain/Loss": 1.978211522102356, "Full-pretrain/Loss (Raw)": 2.2201733589172363, "Full-pretrain/Step": 1417, "Full-pretrain/Step Time": 17.57765461690724} +{"Full-pretrain/Learning Rate": 4.8174999221554176e-05, "Full-pretrain/Loss": 1.977372646331787, "Full-pretrain/Loss (Raw)": 2.053285598754883, "Full-pretrain/Step": 1418, "Full-pretrain/Step Time": 17.58069788850844} +{"Full-pretrain/Learning Rate": 4.8171813317013635e-05, "Full-pretrain/Loss": 1.9738826751708984, "Full-pretrain/Loss (Raw)": 1.8810853958129883, "Full-pretrain/Step": 1419, "Full-pretrain/Step Time": 17.567256830632687} +{"Full-pretrain/Learning Rate": 4.816862473961258e-05, "Full-pretrain/Loss": 1.9657427072525024, "Full-pretrain/Loss (Raw)": 2.0530900955200195, "Full-pretrain/Step": 1420, "Full-pretrain/Step Time": 17.574855661019683} +{"Full-pretrain/Learning Rate": 4.8165433489718795e-05, "Full-pretrain/Loss": 1.97602379322052, "Full-pretrain/Loss (Raw)": 2.183035373687744, "Full-pretrain/Step": 1421, "Full-pretrain/Step Time": 17.56644089706242} +{"Full-pretrain/Learning Rate": 4.81622395677004e-05, "Full-pretrain/Loss": 1.9764524698257446, "Full-pretrain/Loss (Raw)": 2.041785717010498, "Full-pretrain/Step": 1422, "Full-pretrain/Step Time": 17.566538240760565} +{"Full-pretrain/Learning Rate": 4.8159042973925814e-05, "Full-pretrain/Loss": 1.9841878414154053, "Full-pretrain/Loss (Raw)": 2.043816089630127, "Full-pretrain/Step": 1423, "Full-pretrain/Step Time": 17.558544350787997} +{"Full-pretrain/Learning Rate": 4.815584370876376e-05, "Full-pretrain/Loss": 1.980545997619629, "Full-pretrain/Loss (Raw)": 1.9909849166870117, "Full-pretrain/Step": 1424, "Full-pretrain/Step Time": 17.566849499940872} +{"Full-pretrain/Learning Rate": 4.815264177258326e-05, "Full-pretrain/Loss": 1.9937312602996826, "Full-pretrain/Loss (Raw)": 2.2903847694396973, "Full-pretrain/Step": 1425, "Full-pretrain/Step Time": 17.563192829489708} +{"Full-pretrain/Learning Rate": 4.814943716575369e-05, "Full-pretrain/Loss": 1.9952733516693115, "Full-pretrain/Loss (Raw)": 2.057589054107666, "Full-pretrain/Step": 1426, "Full-pretrain/Step Time": 17.56143557652831} +{"Full-pretrain/Learning Rate": 4.8146229888644656e-05, "Full-pretrain/Loss": 1.996387243270874, "Full-pretrain/Loss (Raw)": 2.124091625213623, "Full-pretrain/Step": 1427, "Full-pretrain/Step Time": 17.56530235335231} +{"Full-pretrain/Learning Rate": 4.814301994162615e-05, "Full-pretrain/Loss": 2.005509614944458, "Full-pretrain/Loss (Raw)": 2.1816701889038086, "Full-pretrain/Step": 1428, "Full-pretrain/Step Time": 17.565313775092363} +{"Full-pretrain/Learning Rate": 4.8139807325068425e-05, "Full-pretrain/Loss": 2.003635883331299, "Full-pretrain/Loss (Raw)": 2.001739978790283, "Full-pretrain/Step": 1429, "Full-pretrain/Step Time": 17.561185026541352} +{"Full-pretrain/Learning Rate": 4.813659203934205e-05, "Full-pretrain/Loss": 2.0121731758117676, "Full-pretrain/Loss (Raw)": 2.246608257293701, "Full-pretrain/Step": 1430, "Full-pretrain/Step Time": 17.555395931005478} +{"Full-pretrain/Learning Rate": 4.8133374084817927e-05, "Full-pretrain/Loss": 2.01933217048645, "Full-pretrain/Loss (Raw)": 2.0211739540100098, "Full-pretrain/Step": 1431, "Full-pretrain/Step Time": 17.56003556959331} +{"Full-pretrain/Learning Rate": 4.8130153461867225e-05, "Full-pretrain/Loss": 2.021448850631714, "Full-pretrain/Loss (Raw)": 1.9491379261016846, "Full-pretrain/Step": 1432, "Full-pretrain/Step Time": 17.556814052164555} +{"Full-pretrain/Learning Rate": 4.812693017086145e-05, "Full-pretrain/Loss": 2.020369529724121, "Full-pretrain/Loss (Raw)": 2.0402603149414062, "Full-pretrain/Step": 1433, "Full-pretrain/Step Time": 17.55731008015573} +{"Full-pretrain/Learning Rate": 4.8123704212172415e-05, "Full-pretrain/Loss": 2.0127646923065186, "Full-pretrain/Loss (Raw)": 1.8319958448410034, "Full-pretrain/Step": 1434, "Full-pretrain/Step Time": 17.551169991493225} +{"Full-pretrain/Learning Rate": 4.8120475586172223e-05, "Full-pretrain/Loss": 2.004237174987793, "Full-pretrain/Loss (Raw)": 1.836620569229126, "Full-pretrain/Step": 1435, "Full-pretrain/Step Time": 17.548127913847566} +{"Full-pretrain/Learning Rate": 4.811724429323329e-05, "Full-pretrain/Loss": 1.9958462715148926, "Full-pretrain/Loss (Raw)": 1.8045343160629272, "Full-pretrain/Step": 1436, "Full-pretrain/Step Time": 17.555125320330262} +{"Full-pretrain/Learning Rate": 4.811401033372835e-05, "Full-pretrain/Loss": 1.9986361265182495, "Full-pretrain/Loss (Raw)": 2.0156736373901367, "Full-pretrain/Step": 1437, "Full-pretrain/Step Time": 17.550928108394146} +{"Full-pretrain/Learning Rate": 4.811077370803044e-05, "Full-pretrain/Loss": 2.0068869590759277, "Full-pretrain/Loss (Raw)": 2.2373147010803223, "Full-pretrain/Step": 1438, "Full-pretrain/Step Time": 17.548707153648138} +{"Full-pretrain/Learning Rate": 4.810753441651292e-05, "Full-pretrain/Loss": 2.021934747695923, "Full-pretrain/Loss (Raw)": 2.1152501106262207, "Full-pretrain/Step": 1439, "Full-pretrain/Step Time": 17.554274125024676} +{"Full-pretrain/Learning Rate": 4.8104292459549415e-05, "Full-pretrain/Loss": 2.026479721069336, "Full-pretrain/Loss (Raw)": 2.0726118087768555, "Full-pretrain/Step": 1440, "Full-pretrain/Step Time": 17.54877963848412} +{"Full-pretrain/Learning Rate": 4.810104783751389e-05, "Full-pretrain/Loss": 2.0386738777160645, "Full-pretrain/Loss (Raw)": 2.1672255992889404, "Full-pretrain/Step": 1441, "Full-pretrain/Step Time": 17.55568155273795} +{"Full-pretrain/Learning Rate": 4.8097800550780625e-05, "Full-pretrain/Loss": 2.030470848083496, "Full-pretrain/Loss (Raw)": 1.886941909790039, "Full-pretrain/Step": 1442, "Full-pretrain/Step Time": 17.551653180271387} +{"Full-pretrain/Learning Rate": 4.809455059972418e-05, "Full-pretrain/Loss": 2.031233787536621, "Full-pretrain/Loss (Raw)": 2.034379005432129, "Full-pretrain/Step": 1443, "Full-pretrain/Step Time": 17.553043756633997} +{"Full-pretrain/Learning Rate": 4.809129798471944e-05, "Full-pretrain/Loss": 2.039501190185547, "Full-pretrain/Loss (Raw)": 2.2661795616149902, "Full-pretrain/Step": 1444, "Full-pretrain/Step Time": 17.55604187399149} +{"Full-pretrain/Learning Rate": 4.808804270614159e-05, "Full-pretrain/Loss": 2.0436172485351562, "Full-pretrain/Loss (Raw)": 2.002749443054199, "Full-pretrain/Step": 1445, "Full-pretrain/Step Time": 17.558704279363155} +{"Full-pretrain/Learning Rate": 4.8084784764366123e-05, "Full-pretrain/Loss": 2.043917417526245, "Full-pretrain/Loss (Raw)": 1.9238903522491455, "Full-pretrain/Step": 1446, "Full-pretrain/Step Time": 17.561148861423135} +{"Full-pretrain/Learning Rate": 4.8081524159768855e-05, "Full-pretrain/Loss": 2.0529897212982178, "Full-pretrain/Loss (Raw)": 2.147073745727539, "Full-pretrain/Step": 1447, "Full-pretrain/Step Time": 17.559191770851612} +{"Full-pretrain/Learning Rate": 4.8078260892725876e-05, "Full-pretrain/Loss": 2.0561795234680176, "Full-pretrain/Loss (Raw)": 2.0753862857818604, "Full-pretrain/Step": 1448, "Full-pretrain/Step Time": 17.563044883310795} +{"Full-pretrain/Learning Rate": 4.807499496361362e-05, "Full-pretrain/Loss": 2.0466723442077637, "Full-pretrain/Loss (Raw)": 1.9159517288208008, "Full-pretrain/Step": 1449, "Full-pretrain/Step Time": 17.566010165959597} +{"Full-pretrain/Learning Rate": 4.807172637280881e-05, "Full-pretrain/Loss": 2.0505475997924805, "Full-pretrain/Loss (Raw)": 2.1772913932800293, "Full-pretrain/Step": 1450, "Full-pretrain/Step Time": 17.571642281487584} +{"Full-pretrain/Learning Rate": 4.806845512068846e-05, "Full-pretrain/Loss": 2.053562879562378, "Full-pretrain/Loss (Raw)": 1.9775736331939697, "Full-pretrain/Step": 1451, "Full-pretrain/Step Time": 17.570470048114657} +{"Full-pretrain/Learning Rate": 4.806518120762993e-05, "Full-pretrain/Loss": 2.056230068206787, "Full-pretrain/Loss (Raw)": 2.1384410858154297, "Full-pretrain/Step": 1452, "Full-pretrain/Step Time": 17.573275085538626} +{"Full-pretrain/Learning Rate": 4.806190463401085e-05, "Full-pretrain/Loss": 2.05303692817688, "Full-pretrain/Loss (Raw)": 2.0808565616607666, "Full-pretrain/Step": 1453, "Full-pretrain/Step Time": 17.571209767833352} +{"Full-pretrain/Learning Rate": 4.8058625400209165e-05, "Full-pretrain/Loss": 2.055191993713379, "Full-pretrain/Loss (Raw)": 2.1107430458068848, "Full-pretrain/Step": 1454, "Full-pretrain/Step Time": 17.574037896469235} +{"Full-pretrain/Learning Rate": 4.805534350660315e-05, "Full-pretrain/Loss": 2.051438570022583, "Full-pretrain/Loss (Raw)": 1.9237066507339478, "Full-pretrain/Step": 1455, "Full-pretrain/Step Time": 17.574453121051192} +{"Full-pretrain/Learning Rate": 4.805205895357137e-05, "Full-pretrain/Loss": 2.0422964096069336, "Full-pretrain/Loss (Raw)": 1.6984355449676514, "Full-pretrain/Step": 1456, "Full-pretrain/Step Time": 17.575015619397163} +{"Full-pretrain/Learning Rate": 4.804877174149268e-05, "Full-pretrain/Loss": 2.0402719974517822, "Full-pretrain/Loss (Raw)": 2.225602626800537, "Full-pretrain/Step": 1457, "Full-pretrain/Step Time": 17.576150050386786} +{"Full-pretrain/Learning Rate": 4.804548187074628e-05, "Full-pretrain/Loss": 2.037662982940674, "Full-pretrain/Loss (Raw)": 1.974096655845642, "Full-pretrain/Step": 1458, "Full-pretrain/Step Time": 17.5760043784976} +{"Full-pretrain/Learning Rate": 4.804218934171163e-05, "Full-pretrain/Loss": 2.04176926612854, "Full-pretrain/Loss (Raw)": 2.2554988861083984, "Full-pretrain/Step": 1459, "Full-pretrain/Step Time": 17.57800708897412} +{"Full-pretrain/Learning Rate": 4.8038894154768554e-05, "Full-pretrain/Loss": 2.0350000858306885, "Full-pretrain/Loss (Raw)": 1.9650577306747437, "Full-pretrain/Step": 1460, "Full-pretrain/Step Time": 17.57630328461528} +{"Full-pretrain/Learning Rate": 4.8035596310297124e-05, "Full-pretrain/Loss": 2.0355029106140137, "Full-pretrain/Loss (Raw)": 2.017827033996582, "Full-pretrain/Step": 1461, "Full-pretrain/Step Time": 17.571443999186158} +{"Full-pretrain/Learning Rate": 4.8032295808677754e-05, "Full-pretrain/Loss": 2.026759386062622, "Full-pretrain/Loss (Raw)": 1.9668183326721191, "Full-pretrain/Step": 1462, "Full-pretrain/Step Time": 17.57623885013163} +{"Full-pretrain/Learning Rate": 4.802899265029116e-05, "Full-pretrain/Loss": 2.019944906234741, "Full-pretrain/Loss (Raw)": 1.8031117916107178, "Full-pretrain/Step": 1463, "Full-pretrain/Step Time": 17.57467408105731} +{"Full-pretrain/Learning Rate": 4.802568683551836e-05, "Full-pretrain/Loss": 2.0157814025878906, "Full-pretrain/Loss (Raw)": 1.8159105777740479, "Full-pretrain/Step": 1464, "Full-pretrain/Step Time": 17.5655849725008} +{"Full-pretrain/Learning Rate": 4.802237836474067e-05, "Full-pretrain/Loss": 2.0173864364624023, "Full-pretrain/Loss (Raw)": 2.0916192531585693, "Full-pretrain/Step": 1465, "Full-pretrain/Step Time": 17.570994965732098} +{"Full-pretrain/Learning Rate": 4.801906723833973e-05, "Full-pretrain/Loss": 2.0232434272766113, "Full-pretrain/Loss (Raw)": 2.019415855407715, "Full-pretrain/Step": 1466, "Full-pretrain/Step Time": 17.568747486919165} +{"Full-pretrain/Learning Rate": 4.8015753456697465e-05, "Full-pretrain/Loss": 2.027590036392212, "Full-pretrain/Loss (Raw)": 1.9757137298583984, "Full-pretrain/Step": 1467, "Full-pretrain/Step Time": 17.57044936530292} +{"Full-pretrain/Learning Rate": 4.801243702019614e-05, "Full-pretrain/Loss": 2.040107488632202, "Full-pretrain/Loss (Raw)": 2.2050929069519043, "Full-pretrain/Step": 1468, "Full-pretrain/Step Time": 17.565812524408102} +{"Full-pretrain/Learning Rate": 4.8009117929218285e-05, "Full-pretrain/Loss": 2.048877716064453, "Full-pretrain/Loss (Raw)": 2.2963156700134277, "Full-pretrain/Step": 1469, "Full-pretrain/Step Time": 17.567871810868382} +{"Full-pretrain/Learning Rate": 4.800579618414676e-05, "Full-pretrain/Loss": 2.0466036796569824, "Full-pretrain/Loss (Raw)": 2.1645541191101074, "Full-pretrain/Step": 1470, "Full-pretrain/Step Time": 17.568322394043207} +{"Full-pretrain/Learning Rate": 4.8002471785364734e-05, "Full-pretrain/Loss": 2.033752918243408, "Full-pretrain/Loss (Raw)": 1.704017162322998, "Full-pretrain/Step": 1471, "Full-pretrain/Step Time": 17.56691719777882} +{"Full-pretrain/Learning Rate": 4.799914473325567e-05, "Full-pretrain/Loss": 2.032125473022461, "Full-pretrain/Loss (Raw)": 2.0205416679382324, "Full-pretrain/Step": 1472, "Full-pretrain/Step Time": 17.569816261529922} +{"Full-pretrain/Learning Rate": 4.7995815028203344e-05, "Full-pretrain/Loss": 2.03310227394104, "Full-pretrain/Loss (Raw)": 2.198479175567627, "Full-pretrain/Step": 1473, "Full-pretrain/Step Time": 17.57298055663705} +{"Full-pretrain/Learning Rate": 4.799248267059183e-05, "Full-pretrain/Loss": 2.042511224746704, "Full-pretrain/Loss (Raw)": 2.188028335571289, "Full-pretrain/Step": 1474, "Full-pretrain/Step Time": 17.571899266913533} +{"Full-pretrain/Learning Rate": 4.798914766080554e-05, "Full-pretrain/Loss": 2.0434060096740723, "Full-pretrain/Loss (Raw)": 2.0630083084106445, "Full-pretrain/Step": 1475, "Full-pretrain/Step Time": 17.569574382156134} +{"Full-pretrain/Learning Rate": 4.798580999922912e-05, "Full-pretrain/Loss": 2.039544105529785, "Full-pretrain/Loss (Raw)": 2.142601490020752, "Full-pretrain/Step": 1476, "Full-pretrain/Step Time": 17.56733184121549} +{"Full-pretrain/Learning Rate": 4.7982469686247614e-05, "Full-pretrain/Loss": 2.0398848056793213, "Full-pretrain/Loss (Raw)": 2.013653039932251, "Full-pretrain/Step": 1477, "Full-pretrain/Step Time": 17.5685346852988} +{"Full-pretrain/Learning Rate": 4.797912672224629e-05, "Full-pretrain/Loss": 2.0465941429138184, "Full-pretrain/Loss (Raw)": 2.138587474822998, "Full-pretrain/Step": 1478, "Full-pretrain/Step Time": 17.572041146457195} +{"Full-pretrain/Learning Rate": 4.797578110761078e-05, "Full-pretrain/Loss": 2.0491890907287598, "Full-pretrain/Loss (Raw)": 2.2301108837127686, "Full-pretrain/Step": 1479, "Full-pretrain/Step Time": 17.564350550994277} +{"Full-pretrain/Learning Rate": 4.797243284272701e-05, "Full-pretrain/Loss": 2.04691219329834, "Full-pretrain/Loss (Raw)": 2.0025265216827393, "Full-pretrain/Step": 1480, "Full-pretrain/Step Time": 17.554572321474552} +{"Full-pretrain/Learning Rate": 4.7969081927981165e-05, "Full-pretrain/Loss": 2.0435678958892822, "Full-pretrain/Loss (Raw)": 1.8089380264282227, "Full-pretrain/Step": 1481, "Full-pretrain/Step Time": 17.55662169493735} +{"Full-pretrain/Learning Rate": 4.79657283637598e-05, "Full-pretrain/Loss": 2.036158561706543, "Full-pretrain/Loss (Raw)": 1.9401905536651611, "Full-pretrain/Step": 1482, "Full-pretrain/Step Time": 17.558500304818153} +{"Full-pretrain/Learning Rate": 4.796237215044973e-05, "Full-pretrain/Loss": 2.0396876335144043, "Full-pretrain/Loss (Raw)": 2.0905017852783203, "Full-pretrain/Step": 1483, "Full-pretrain/Step Time": 17.54732263274491} +{"Full-pretrain/Learning Rate": 4.795901328843811e-05, "Full-pretrain/Loss": 2.0363657474517822, "Full-pretrain/Loss (Raw)": 2.032142162322998, "Full-pretrain/Step": 1484, "Full-pretrain/Step Time": 17.547503035515547} +{"Full-pretrain/Learning Rate": 4.7955651778112375e-05, "Full-pretrain/Loss": 2.030752182006836, "Full-pretrain/Loss (Raw)": 1.901226282119751, "Full-pretrain/Step": 1485, "Full-pretrain/Step Time": 17.54479070752859} +{"Full-pretrain/Learning Rate": 4.795228761986028e-05, "Full-pretrain/Loss": 2.029932737350464, "Full-pretrain/Loss (Raw)": 2.0845186710357666, "Full-pretrain/Step": 1486, "Full-pretrain/Step Time": 17.545878291130066} +{"Full-pretrain/Learning Rate": 4.7948920814069866e-05, "Full-pretrain/Loss": 2.035900354385376, "Full-pretrain/Loss (Raw)": 2.11466908454895, "Full-pretrain/Step": 1487, "Full-pretrain/Step Time": 17.539299307391047} +{"Full-pretrain/Learning Rate": 4.79455513611295e-05, "Full-pretrain/Loss": 2.0526416301727295, "Full-pretrain/Loss (Raw)": 2.234158515930176, "Full-pretrain/Step": 1488, "Full-pretrain/Step Time": 17.539628364145756} +{"Full-pretrain/Learning Rate": 4.794217926142785e-05, "Full-pretrain/Loss": 2.047219753265381, "Full-pretrain/Loss (Raw)": 2.0520973205566406, "Full-pretrain/Step": 1489, "Full-pretrain/Step Time": 17.545840822160244} +{"Full-pretrain/Learning Rate": 4.7938804515353887e-05, "Full-pretrain/Loss": 2.0450284481048584, "Full-pretrain/Loss (Raw)": 1.903976321220398, "Full-pretrain/Step": 1490, "Full-pretrain/Step Time": 17.54406432621181} +{"Full-pretrain/Learning Rate": 4.793542712329688e-05, "Full-pretrain/Loss": 2.0377228260040283, "Full-pretrain/Loss (Raw)": 2.0217208862304688, "Full-pretrain/Step": 1491, "Full-pretrain/Step Time": 17.538871947675943} +{"Full-pretrain/Learning Rate": 4.793204708564641e-05, "Full-pretrain/Loss": 2.0302579402923584, "Full-pretrain/Loss (Raw)": 1.726184368133545, "Full-pretrain/Step": 1492, "Full-pretrain/Step Time": 17.54626427218318} +{"Full-pretrain/Learning Rate": 4.792866440279238e-05, "Full-pretrain/Loss": 2.018494129180908, "Full-pretrain/Loss (Raw)": 1.6413860321044922, "Full-pretrain/Step": 1493, "Full-pretrain/Step Time": 17.54494603909552} +{"Full-pretrain/Learning Rate": 4.792527907512496e-05, "Full-pretrain/Loss": 2.027683734893799, "Full-pretrain/Loss (Raw)": 2.2608776092529297, "Full-pretrain/Step": 1494, "Full-pretrain/Step Time": 17.542911421507597} +{"Full-pretrain/Learning Rate": 4.792189110303467e-05, "Full-pretrain/Loss": 2.041628837585449, "Full-pretrain/Loss (Raw)": 2.249358892440796, "Full-pretrain/Step": 1495, "Full-pretrain/Step Time": 17.546065470203757} +{"Full-pretrain/Learning Rate": 4.7918500486912274e-05, "Full-pretrain/Loss": 2.0522539615631104, "Full-pretrain/Loss (Raw)": 2.155919075012207, "Full-pretrain/Step": 1496, "Full-pretrain/Step Time": 17.5441586766392} +{"Full-pretrain/Learning Rate": 4.791510722714892e-05, "Full-pretrain/Loss": 2.0552845001220703, "Full-pretrain/Loss (Raw)": 2.1885881423950195, "Full-pretrain/Step": 1497, "Full-pretrain/Step Time": 17.547745794057846} +{"Full-pretrain/Learning Rate": 4.791171132413599e-05, "Full-pretrain/Loss": 2.058145523071289, "Full-pretrain/Loss (Raw)": 2.110976219177246, "Full-pretrain/Step": 1498, "Full-pretrain/Step Time": 17.54229503683746} +{"Full-pretrain/Learning Rate": 4.790831277826521e-05, "Full-pretrain/Loss": 2.0658726692199707, "Full-pretrain/Loss (Raw)": 2.222977876663208, "Full-pretrain/Step": 1499, "Full-pretrain/Step Time": 17.54071382060647} +{"Full-pretrain/Learning Rate": 4.790491158992861e-05, "Full-pretrain/Loss": 2.0639030933380127, "Full-pretrain/Loss (Raw)": 2.142068862915039, "Full-pretrain/Step": 1500, "Full-pretrain/Step Time": 17.540961116552353} +{"Full-pretrain/Learning Rate": 4.79015077595185e-05, "Full-pretrain/Loss": 2.0570249557495117, "Full-pretrain/Loss (Raw)": 2.0762181282043457, "Full-pretrain/Step": 1501, "Full-pretrain/Step Time": 17.547694316133857} +{"Full-pretrain/Learning Rate": 4.789810128742752e-05, "Full-pretrain/Loss": 2.056305408477783, "Full-pretrain/Loss (Raw)": 2.1415300369262695, "Full-pretrain/Step": 1502, "Full-pretrain/Step Time": 17.538422776386142} +{"Full-pretrain/Learning Rate": 4.789469217404861e-05, "Full-pretrain/Loss": 2.0648961067199707, "Full-pretrain/Loss (Raw)": 1.9789140224456787, "Full-pretrain/Step": 1503, "Full-pretrain/Step Time": 17.542651714757085} +{"Full-pretrain/Learning Rate": 4.7891280419774985e-05, "Full-pretrain/Loss": 2.065697431564331, "Full-pretrain/Loss (Raw)": 2.046182632446289, "Full-pretrain/Step": 1504, "Full-pretrain/Step Time": 17.539389360696077} +{"Full-pretrain/Learning Rate": 4.7887866025000225e-05, "Full-pretrain/Loss": 2.058537483215332, "Full-pretrain/Loss (Raw)": 1.969364047050476, "Full-pretrain/Step": 1505, "Full-pretrain/Step Time": 17.5399071238935} +{"Full-pretrain/Learning Rate": 4.788444899011816e-05, "Full-pretrain/Loss": 2.050118923187256, "Full-pretrain/Loss (Raw)": 1.918631911277771, "Full-pretrain/Step": 1506, "Full-pretrain/Step Time": 17.538479482755065} +{"Full-pretrain/Learning Rate": 4.788102931552294e-05, "Full-pretrain/Loss": 2.0448474884033203, "Full-pretrain/Loss (Raw)": 1.8943194150924683, "Full-pretrain/Step": 1507, "Full-pretrain/Step Time": 17.542026784271002} +{"Full-pretrain/Learning Rate": 4.787760700160904e-05, "Full-pretrain/Loss": 2.0456199645996094, "Full-pretrain/Loss (Raw)": 2.1673269271850586, "Full-pretrain/Step": 1508, "Full-pretrain/Step Time": 17.543320851400495} +{"Full-pretrain/Learning Rate": 4.78741820487712e-05, "Full-pretrain/Loss": 2.045177459716797, "Full-pretrain/Loss (Raw)": 1.9994933605194092, "Full-pretrain/Step": 1509, "Full-pretrain/Step Time": 17.54709043726325} +{"Full-pretrain/Learning Rate": 4.78707544574045e-05, "Full-pretrain/Loss": 2.041140556335449, "Full-pretrain/Loss (Raw)": 2.0094079971313477, "Full-pretrain/Step": 1510, "Full-pretrain/Step Time": 17.55160883255303} +{"Full-pretrain/Learning Rate": 4.786732422790432e-05, "Full-pretrain/Loss": 2.040928840637207, "Full-pretrain/Loss (Raw)": 2.223334789276123, "Full-pretrain/Step": 1511, "Full-pretrain/Step Time": 17.55039450712502} +{"Full-pretrain/Learning Rate": 4.786389136066633e-05, "Full-pretrain/Loss": 2.0430946350097656, "Full-pretrain/Loss (Raw)": 2.0718326568603516, "Full-pretrain/Step": 1512, "Full-pretrain/Step Time": 17.55279965698719} +{"Full-pretrain/Learning Rate": 4.7860455856086487e-05, "Full-pretrain/Loss": 2.044930934906006, "Full-pretrain/Loss (Raw)": 1.8677008152008057, "Full-pretrain/Step": 1513, "Full-pretrain/Step Time": 17.551692802459} +{"Full-pretrain/Learning Rate": 4.785701771456111e-05, "Full-pretrain/Loss": 2.052769184112549, "Full-pretrain/Loss (Raw)": 2.191012144088745, "Full-pretrain/Step": 1514, "Full-pretrain/Step Time": 17.55188950896263} +{"Full-pretrain/Learning Rate": 4.785357693648677e-05, "Full-pretrain/Loss": 2.0455663204193115, "Full-pretrain/Loss (Raw)": 1.8600082397460938, "Full-pretrain/Step": 1515, "Full-pretrain/Step Time": 17.55815645866096} +{"Full-pretrain/Learning Rate": 4.785013352226036e-05, "Full-pretrain/Loss": 2.048640727996826, "Full-pretrain/Loss (Raw)": 2.130524158477783, "Full-pretrain/Step": 1516, "Full-pretrain/Step Time": 17.556934274733067} +{"Full-pretrain/Learning Rate": 4.784668747227907e-05, "Full-pretrain/Loss": 2.0557668209075928, "Full-pretrain/Loss (Raw)": 2.1292612552642822, "Full-pretrain/Step": 1517, "Full-pretrain/Step Time": 17.55968031845987} +{"Full-pretrain/Learning Rate": 4.7843238786940425e-05, "Full-pretrain/Loss": 2.05336856842041, "Full-pretrain/Loss (Raw)": 2.007767915725708, "Full-pretrain/Step": 1518, "Full-pretrain/Step Time": 17.556200796738267} +{"Full-pretrain/Learning Rate": 4.783978746664221e-05, "Full-pretrain/Loss": 2.05376935005188, "Full-pretrain/Loss (Raw)": 2.127500534057617, "Full-pretrain/Step": 1519, "Full-pretrain/Step Time": 17.55890260823071} +{"Full-pretrain/Learning Rate": 4.783633351178253e-05, "Full-pretrain/Loss": 2.0490942001342773, "Full-pretrain/Loss (Raw)": 2.084547519683838, "Full-pretrain/Step": 1520, "Full-pretrain/Step Time": 17.55907777696848} +{"Full-pretrain/Learning Rate": 4.783287692275981e-05, "Full-pretrain/Loss": 2.041808605194092, "Full-pretrain/Loss (Raw)": 1.8189622163772583, "Full-pretrain/Step": 1521, "Full-pretrain/Step Time": 17.556149343028665} +{"Full-pretrain/Learning Rate": 4.7829417699972754e-05, "Full-pretrain/Loss": 2.055088996887207, "Full-pretrain/Loss (Raw)": 2.328946352005005, "Full-pretrain/Step": 1522, "Full-pretrain/Step Time": 17.555097987875342} +{"Full-pretrain/Learning Rate": 4.782595584382039e-05, "Full-pretrain/Loss": 2.0595738887786865, "Full-pretrain/Loss (Raw)": 2.165240526199341, "Full-pretrain/Step": 1523, "Full-pretrain/Step Time": 17.556917391717434} +{"Full-pretrain/Learning Rate": 4.782249135470205e-05, "Full-pretrain/Loss": 2.0717101097106934, "Full-pretrain/Loss (Raw)": 2.1145358085632324, "Full-pretrain/Step": 1524, "Full-pretrain/Step Time": 17.559976745396852} +{"Full-pretrain/Learning Rate": 4.781902423301734e-05, "Full-pretrain/Loss": 2.0867156982421875, "Full-pretrain/Loss (Raw)": 2.121572494506836, "Full-pretrain/Step": 1525, "Full-pretrain/Step Time": 17.561173738911748} +{"Full-pretrain/Learning Rate": 4.781555447916621e-05, "Full-pretrain/Loss": 2.0775015354156494, "Full-pretrain/Loss (Raw)": 1.96602463722229, "Full-pretrain/Step": 1526, "Full-pretrain/Step Time": 17.5693990457803} +{"Full-pretrain/Learning Rate": 4.7812082093548894e-05, "Full-pretrain/Loss": 2.0709657669067383, "Full-pretrain/Loss (Raw)": 2.040210247039795, "Full-pretrain/Step": 1527, "Full-pretrain/Step Time": 17.560310950502753} +{"Full-pretrain/Learning Rate": 4.780860707656592e-05, "Full-pretrain/Loss": 2.065275192260742, "Full-pretrain/Loss (Raw)": 1.9738287925720215, "Full-pretrain/Step": 1528, "Full-pretrain/Step Time": 17.567727711051702} +{"Full-pretrain/Learning Rate": 4.780512942861813e-05, "Full-pretrain/Loss": 2.065925359725952, "Full-pretrain/Loss (Raw)": 2.209390640258789, "Full-pretrain/Step": 1529, "Full-pretrain/Step Time": 17.568948443979025} +{"Full-pretrain/Learning Rate": 4.780164915010669e-05, "Full-pretrain/Loss": 2.072040557861328, "Full-pretrain/Loss (Raw)": 2.3066658973693848, "Full-pretrain/Step": 1530, "Full-pretrain/Step Time": 17.570996114984155} +{"Full-pretrain/Learning Rate": 4.779816624143302e-05, "Full-pretrain/Loss": 2.0639755725860596, "Full-pretrain/Loss (Raw)": 1.9648900032043457, "Full-pretrain/Step": 1531, "Full-pretrain/Step Time": 17.57022636011243} +{"Full-pretrain/Learning Rate": 4.7794680702998895e-05, "Full-pretrain/Loss": 2.0658936500549316, "Full-pretrain/Loss (Raw)": 2.2034525871276855, "Full-pretrain/Step": 1532, "Full-pretrain/Step Time": 17.57190339639783} +{"Full-pretrain/Learning Rate": 4.7791192535206355e-05, "Full-pretrain/Loss": 2.0660817623138428, "Full-pretrain/Loss (Raw)": 2.082235097885132, "Full-pretrain/Step": 1533, "Full-pretrain/Step Time": 17.572748126462102} +{"Full-pretrain/Learning Rate": 4.778770173845777e-05, "Full-pretrain/Loss": 2.064591884613037, "Full-pretrain/Loss (Raw)": 2.093852996826172, "Full-pretrain/Step": 1534, "Full-pretrain/Step Time": 17.577322943136096} +{"Full-pretrain/Learning Rate": 4.778420831315579e-05, "Full-pretrain/Loss": 2.064781665802002, "Full-pretrain/Loss (Raw)": 1.9849878549575806, "Full-pretrain/Step": 1535, "Full-pretrain/Step Time": 17.571941435337067} +{"Full-pretrain/Learning Rate": 4.77807122597034e-05, "Full-pretrain/Loss": 2.069117546081543, "Full-pretrain/Loss (Raw)": 2.184938430786133, "Full-pretrain/Step": 1536, "Full-pretrain/Step Time": 17.570501705631614} +{"Full-pretrain/Learning Rate": 4.777721357850384e-05, "Full-pretrain/Loss": 2.078700065612793, "Full-pretrain/Loss (Raw)": 2.2759952545166016, "Full-pretrain/Step": 1537, "Full-pretrain/Step Time": 17.57045350037515} +{"Full-pretrain/Learning Rate": 4.7773712269960716e-05, "Full-pretrain/Loss": 2.0734152793884277, "Full-pretrain/Loss (Raw)": 1.7495193481445312, "Full-pretrain/Step": 1538, "Full-pretrain/Step Time": 17.569244919344783} +{"Full-pretrain/Learning Rate": 4.7770208334477875e-05, "Full-pretrain/Loss": 2.073856830596924, "Full-pretrain/Loss (Raw)": 1.9084482192993164, "Full-pretrain/Step": 1539, "Full-pretrain/Step Time": 17.57096252962947} +{"Full-pretrain/Learning Rate": 4.77667017724595e-05, "Full-pretrain/Loss": 2.0669353008270264, "Full-pretrain/Loss (Raw)": 1.9458431005477905, "Full-pretrain/Step": 1540, "Full-pretrain/Step Time": 17.575743885710835} +{"Full-pretrain/Learning Rate": 4.776319258431009e-05, "Full-pretrain/Loss": 2.071758270263672, "Full-pretrain/Loss (Raw)": 2.1538238525390625, "Full-pretrain/Step": 1541, "Full-pretrain/Step Time": 17.578395688906312} +{"Full-pretrain/Learning Rate": 4.7759680770434404e-05, "Full-pretrain/Loss": 2.078589916229248, "Full-pretrain/Loss (Raw)": 2.2280235290527344, "Full-pretrain/Step": 1542, "Full-pretrain/Step Time": 17.58376097306609} +{"Full-pretrain/Learning Rate": 4.775616633123754e-05, "Full-pretrain/Loss": 2.0742545127868652, "Full-pretrain/Loss (Raw)": 2.0846011638641357, "Full-pretrain/Step": 1543, "Full-pretrain/Step Time": 17.58383064903319} +{"Full-pretrain/Learning Rate": 4.775264926712489e-05, "Full-pretrain/Loss": 2.0692389011383057, "Full-pretrain/Loss (Raw)": 1.9113328456878662, "Full-pretrain/Step": 1544, "Full-pretrain/Step Time": 17.584880141541362} +{"Full-pretrain/Learning Rate": 4.774912957850215e-05, "Full-pretrain/Loss": 2.0744848251342773, "Full-pretrain/Loss (Raw)": 2.0355632305145264, "Full-pretrain/Step": 1545, "Full-pretrain/Step Time": 17.59253782965243} +{"Full-pretrain/Learning Rate": 4.7745607265775295e-05, "Full-pretrain/Loss": 2.062864303588867, "Full-pretrain/Loss (Raw)": 1.8191624879837036, "Full-pretrain/Step": 1546, "Full-pretrain/Step Time": 17.594156114384532} +{"Full-pretrain/Learning Rate": 4.7742082329350644e-05, "Full-pretrain/Loss": 2.072322130203247, "Full-pretrain/Loss (Raw)": 2.162656307220459, "Full-pretrain/Step": 1547, "Full-pretrain/Step Time": 17.602286595851183} +{"Full-pretrain/Learning Rate": 4.773855476963479e-05, "Full-pretrain/Loss": 2.069624185562134, "Full-pretrain/Loss (Raw)": 2.044191837310791, "Full-pretrain/Step": 1548, "Full-pretrain/Step Time": 17.599261241033673} +{"Full-pretrain/Learning Rate": 4.773502458703463e-05, "Full-pretrain/Loss": 2.066235065460205, "Full-pretrain/Loss (Raw)": 2.020811080932617, "Full-pretrain/Step": 1549, "Full-pretrain/Step Time": 17.6063689365983} +{"Full-pretrain/Learning Rate": 4.773149178195737e-05, "Full-pretrain/Loss": 2.0743956565856934, "Full-pretrain/Loss (Raw)": 2.2689008712768555, "Full-pretrain/Step": 1550, "Full-pretrain/Step Time": 17.602906309068203} +{"Full-pretrain/Learning Rate": 4.772795635481052e-05, "Full-pretrain/Loss": 2.0733325481414795, "Full-pretrain/Loss (Raw)": 2.0934863090515137, "Full-pretrain/Step": 1551, "Full-pretrain/Step Time": 17.61444109492004} +{"Full-pretrain/Learning Rate": 4.77244183060019e-05, "Full-pretrain/Loss": 2.075042247772217, "Full-pretrain/Loss (Raw)": 2.1392581462860107, "Full-pretrain/Step": 1552, "Full-pretrain/Step Time": 17.60584837757051} +{"Full-pretrain/Learning Rate": 4.772087763593961e-05, "Full-pretrain/Loss": 2.0846452713012695, "Full-pretrain/Loss (Raw)": 2.1262576580047607, "Full-pretrain/Step": 1553, "Full-pretrain/Step Time": 17.608479915186763} +{"Full-pretrain/Learning Rate": 4.7717334345032065e-05, "Full-pretrain/Loss": 2.0752530097961426, "Full-pretrain/Loss (Raw)": 2.0283937454223633, "Full-pretrain/Step": 1554, "Full-pretrain/Step Time": 17.605546694248915} +{"Full-pretrain/Learning Rate": 4.7713788433687995e-05, "Full-pretrain/Loss": 2.0752644538879395, "Full-pretrain/Loss (Raw)": 2.1656136512756348, "Full-pretrain/Step": 1555, "Full-pretrain/Step Time": 17.606748919934034} +{"Full-pretrain/Learning Rate": 4.7710239902316405e-05, "Full-pretrain/Loss": 2.0689401626586914, "Full-pretrain/Loss (Raw)": 1.912156343460083, "Full-pretrain/Step": 1556, "Full-pretrain/Step Time": 17.607077684253454} +{"Full-pretrain/Learning Rate": 4.770668875132663e-05, "Full-pretrain/Loss": 2.0674266815185547, "Full-pretrain/Loss (Raw)": 2.0731406211853027, "Full-pretrain/Step": 1557, "Full-pretrain/Step Time": 17.607446705922484} +{"Full-pretrain/Learning Rate": 4.7703134981128285e-05, "Full-pretrain/Loss": 2.0725555419921875, "Full-pretrain/Loss (Raw)": 2.130143165588379, "Full-pretrain/Step": 1558, "Full-pretrain/Step Time": 17.609839610755444} +{"Full-pretrain/Learning Rate": 4.76995785921313e-05, "Full-pretrain/Loss": 2.0761663913726807, "Full-pretrain/Loss (Raw)": 2.155759572982788, "Full-pretrain/Step": 1559, "Full-pretrain/Step Time": 17.60902313143015} +{"Full-pretrain/Learning Rate": 4.7696019584745886e-05, "Full-pretrain/Loss": 2.0694072246551514, "Full-pretrain/Loss (Raw)": 1.757535457611084, "Full-pretrain/Step": 1560, "Full-pretrain/Step Time": 17.60680105537176} +{"Full-pretrain/Learning Rate": 4.769245795938261e-05, "Full-pretrain/Loss": 2.0665881633758545, "Full-pretrain/Loss (Raw)": 2.119182586669922, "Full-pretrain/Step": 1561, "Full-pretrain/Step Time": 17.606710420921445} +{"Full-pretrain/Learning Rate": 4.768889371645227e-05, "Full-pretrain/Loss": 2.0590620040893555, "Full-pretrain/Loss (Raw)": 2.065825939178467, "Full-pretrain/Step": 1562, "Full-pretrain/Step Time": 17.61212350986898} +{"Full-pretrain/Learning Rate": 4.768532685636602e-05, "Full-pretrain/Loss": 2.061037540435791, "Full-pretrain/Loss (Raw)": 2.0281074047088623, "Full-pretrain/Step": 1563, "Full-pretrain/Step Time": 17.619147315621376} +{"Full-pretrain/Learning Rate": 4.768175737953529e-05, "Full-pretrain/Loss": 2.05855393409729, "Full-pretrain/Loss (Raw)": 2.1239805221557617, "Full-pretrain/Step": 1564, "Full-pretrain/Step Time": 17.613234993070364} +{"Full-pretrain/Learning Rate": 4.767818528637181e-05, "Full-pretrain/Loss": 2.0578784942626953, "Full-pretrain/Loss (Raw)": 2.060617685317993, "Full-pretrain/Step": 1565, "Full-pretrain/Step Time": 17.6179464943707} +{"Full-pretrain/Learning Rate": 4.767461057728763e-05, "Full-pretrain/Loss": 2.0504159927368164, "Full-pretrain/Loss (Raw)": 1.8550567626953125, "Full-pretrain/Step": 1566, "Full-pretrain/Step Time": 17.62008319608867} +{"Full-pretrain/Learning Rate": 4.7671033252695083e-05, "Full-pretrain/Loss": 2.056644916534424, "Full-pretrain/Loss (Raw)": 2.1843132972717285, "Full-pretrain/Step": 1567, "Full-pretrain/Step Time": 17.624220306053758} +{"Full-pretrain/Learning Rate": 4.7667453313006825e-05, "Full-pretrain/Loss": 2.0590317249298096, "Full-pretrain/Loss (Raw)": 2.2613189220428467, "Full-pretrain/Step": 1568, "Full-pretrain/Step Time": 17.628795770928264} +{"Full-pretrain/Learning Rate": 4.76638707586358e-05, "Full-pretrain/Loss": 2.048884153366089, "Full-pretrain/Loss (Raw)": 1.9512661695480347, "Full-pretrain/Step": 1569, "Full-pretrain/Step Time": 17.624175287783146} +{"Full-pretrain/Learning Rate": 4.766028558999524e-05, "Full-pretrain/Loss": 2.0559539794921875, "Full-pretrain/Loss (Raw)": 1.9757634401321411, "Full-pretrain/Step": 1570, "Full-pretrain/Step Time": 17.623975183814764} +{"Full-pretrain/Learning Rate": 4.765669780749869e-05, "Full-pretrain/Loss": 2.0614569187164307, "Full-pretrain/Loss (Raw)": 2.0845389366149902, "Full-pretrain/Step": 1571, "Full-pretrain/Step Time": 17.627792105078697} +{"Full-pretrain/Learning Rate": 4.7653107411560026e-05, "Full-pretrain/Loss": 2.072378635406494, "Full-pretrain/Loss (Raw)": 2.295337200164795, "Full-pretrain/Step": 1572, "Full-pretrain/Step Time": 17.626886432990432} +{"Full-pretrain/Learning Rate": 4.7649514402593374e-05, "Full-pretrain/Loss": 2.0715622901916504, "Full-pretrain/Loss (Raw)": 2.1276988983154297, "Full-pretrain/Step": 1573, "Full-pretrain/Step Time": 17.621273633092642} +{"Full-pretrain/Learning Rate": 4.76459187810132e-05, "Full-pretrain/Loss": 2.065897226333618, "Full-pretrain/Loss (Raw)": 2.0467417240142822, "Full-pretrain/Step": 1574, "Full-pretrain/Step Time": 17.623008059337735} +{"Full-pretrain/Learning Rate": 4.764232054723425e-05, "Full-pretrain/Loss": 2.067964553833008, "Full-pretrain/Loss (Raw)": 2.1507534980773926, "Full-pretrain/Step": 1575, "Full-pretrain/Step Time": 17.628265177831054} +{"Full-pretrain/Learning Rate": 4.7638719701671584e-05, "Full-pretrain/Loss": 2.0763721466064453, "Full-pretrain/Loss (Raw)": 2.180375814437866, "Full-pretrain/Step": 1576, "Full-pretrain/Step Time": 17.620049560442567} +{"Full-pretrain/Learning Rate": 4.763511624474055e-05, "Full-pretrain/Loss": 2.0774741172790527, "Full-pretrain/Loss (Raw)": 2.0708236694335938, "Full-pretrain/Step": 1577, "Full-pretrain/Step Time": 17.62139680609107} +{"Full-pretrain/Learning Rate": 4.763151017685682e-05, "Full-pretrain/Loss": 2.0827722549438477, "Full-pretrain/Loss (Raw)": 1.9886997938156128, "Full-pretrain/Step": 1578, "Full-pretrain/Step Time": 17.623953389003873} +{"Full-pretrain/Learning Rate": 4.762790149843634e-05, "Full-pretrain/Loss": 2.0759479999542236, "Full-pretrain/Loss (Raw)": 1.9442851543426514, "Full-pretrain/Step": 1579, "Full-pretrain/Step Time": 17.625349760055542} +{"Full-pretrain/Learning Rate": 4.7624290209895384e-05, "Full-pretrain/Loss": 2.073617935180664, "Full-pretrain/Loss (Raw)": 1.9696292877197266, "Full-pretrain/Step": 1580, "Full-pretrain/Step Time": 17.622509544715285} +{"Full-pretrain/Learning Rate": 4.762067631165049e-05, "Full-pretrain/Loss": 2.0660767555236816, "Full-pretrain/Loss (Raw)": 1.7794908285140991, "Full-pretrain/Step": 1581, "Full-pretrain/Step Time": 17.627784974873066} +{"Full-pretrain/Learning Rate": 4.7617059804118534e-05, "Full-pretrain/Loss": 2.0665173530578613, "Full-pretrain/Loss (Raw)": 2.28299880027771, "Full-pretrain/Step": 1582, "Full-pretrain/Step Time": 17.627125907689333} +{"Full-pretrain/Learning Rate": 4.761344068771668e-05, "Full-pretrain/Loss": 2.0663928985595703, "Full-pretrain/Loss (Raw)": 2.089506149291992, "Full-pretrain/Step": 1583, "Full-pretrain/Step Time": 17.624750029295683} +{"Full-pretrain/Learning Rate": 4.7609818962862394e-05, "Full-pretrain/Loss": 2.0656561851501465, "Full-pretrain/Loss (Raw)": 2.115687608718872, "Full-pretrain/Step": 1584, "Full-pretrain/Step Time": 17.61983210593462} +{"Full-pretrain/Learning Rate": 4.760619462997343e-05, "Full-pretrain/Loss": 2.0644404888153076, "Full-pretrain/Loss (Raw)": 2.087352752685547, "Full-pretrain/Step": 1585, "Full-pretrain/Step Time": 17.62391320616007} +{"Full-pretrain/Learning Rate": 4.760256768946787e-05, "Full-pretrain/Loss": 2.0559744834899902, "Full-pretrain/Loss (Raw)": 1.7574859857559204, "Full-pretrain/Step": 1586, "Full-pretrain/Step Time": 17.62318965420127} +{"Full-pretrain/Learning Rate": 4.759893814176406e-05, "Full-pretrain/Loss": 2.048569679260254, "Full-pretrain/Loss (Raw)": 1.928654670715332, "Full-pretrain/Step": 1587, "Full-pretrain/Step Time": 17.623460214585066} +{"Full-pretrain/Learning Rate": 4.759530598728068e-05, "Full-pretrain/Loss": 2.0542068481445312, "Full-pretrain/Loss (Raw)": 2.0925493240356445, "Full-pretrain/Step": 1588, "Full-pretrain/Step Time": 17.62373878993094} +{"Full-pretrain/Learning Rate": 4.7591671226436695e-05, "Full-pretrain/Loss": 2.050285816192627, "Full-pretrain/Loss (Raw)": 1.947660207748413, "Full-pretrain/Step": 1589, "Full-pretrain/Step Time": 17.629197290167212} +{"Full-pretrain/Learning Rate": 4.7588033859651376e-05, "Full-pretrain/Loss": 2.049750328063965, "Full-pretrain/Loss (Raw)": 2.1130080223083496, "Full-pretrain/Step": 1590, "Full-pretrain/Step Time": 17.62700998224318} +{"Full-pretrain/Learning Rate": 4.758439388734429e-05, "Full-pretrain/Loss": 2.0471816062927246, "Full-pretrain/Loss (Raw)": 2.0735557079315186, "Full-pretrain/Step": 1591, "Full-pretrain/Step Time": 17.626715909689665} +{"Full-pretrain/Learning Rate": 4.75807513099353e-05, "Full-pretrain/Loss": 2.0502564907073975, "Full-pretrain/Loss (Raw)": 1.8559422492980957, "Full-pretrain/Step": 1592, "Full-pretrain/Step Time": 17.630869077518582} +{"Full-pretrain/Learning Rate": 4.7577106127844585e-05, "Full-pretrain/Loss": 2.0558018684387207, "Full-pretrain/Loss (Raw)": 2.296635627746582, "Full-pretrain/Step": 1593, "Full-pretrain/Step Time": 17.6211298070848} +{"Full-pretrain/Learning Rate": 4.757345834149261e-05, "Full-pretrain/Loss": 2.058250665664673, "Full-pretrain/Loss (Raw)": 2.1441853046417236, "Full-pretrain/Step": 1594, "Full-pretrain/Step Time": 17.630031680688262} +{"Full-pretrain/Learning Rate": 4.756980795130015e-05, "Full-pretrain/Loss": 2.063308000564575, "Full-pretrain/Loss (Raw)": 2.1899378299713135, "Full-pretrain/Step": 1595, "Full-pretrain/Step Time": 17.623754592612386} +{"Full-pretrain/Learning Rate": 4.7566154957688274e-05, "Full-pretrain/Loss": 2.054839611053467, "Full-pretrain/Loss (Raw)": 1.8530009984970093, "Full-pretrain/Step": 1596, "Full-pretrain/Step Time": 17.628825755789876} +{"Full-pretrain/Learning Rate": 4.7562499361078356e-05, "Full-pretrain/Loss": 2.051502227783203, "Full-pretrain/Loss (Raw)": 1.9538145065307617, "Full-pretrain/Step": 1597, "Full-pretrain/Step Time": 17.624857963994145} +{"Full-pretrain/Learning Rate": 4.755884116189207e-05, "Full-pretrain/Loss": 2.0497703552246094, "Full-pretrain/Loss (Raw)": 1.7996433973312378, "Full-pretrain/Step": 1598, "Full-pretrain/Step Time": 17.626274842768908} +{"Full-pretrain/Learning Rate": 4.755518036055137e-05, "Full-pretrain/Loss": 2.0461857318878174, "Full-pretrain/Loss (Raw)": 2.0696005821228027, "Full-pretrain/Step": 1599, "Full-pretrain/Step Time": 17.6251226272434} +{"Full-pretrain/Learning Rate": 4.7551516957478546e-05, "Full-pretrain/Loss": 2.040161609649658, "Full-pretrain/Loss (Raw)": 2.06854248046875, "Full-pretrain/Step": 1600, "Full-pretrain/Step Time": 17.629175815731287} +{"Full-pretrain/Learning Rate": 4.754785095309617e-05, "Full-pretrain/Loss": 2.043710708618164, "Full-pretrain/Loss (Raw)": 2.0648412704467773, "Full-pretrain/Step": 1601, "Full-pretrain/Step Time": 17.624876625835896} +{"Full-pretrain/Learning Rate": 4.7544182347827116e-05, "Full-pretrain/Loss": 2.044867753982544, "Full-pretrain/Loss (Raw)": 2.0127878189086914, "Full-pretrain/Step": 1602, "Full-pretrain/Step Time": 17.627882920205593} +{"Full-pretrain/Learning Rate": 4.754051114209455e-05, "Full-pretrain/Loss": 2.04522442817688, "Full-pretrain/Loss (Raw)": 2.095957040786743, "Full-pretrain/Step": 1603, "Full-pretrain/Step Time": 17.62967904098332} +{"Full-pretrain/Learning Rate": 4.753683733632193e-05, "Full-pretrain/Loss": 2.031431198120117, "Full-pretrain/Loss (Raw)": 1.8539443016052246, "Full-pretrain/Step": 1604, "Full-pretrain/Step Time": 17.63104913942516} +{"Full-pretrain/Learning Rate": 4.7533160930933056e-05, "Full-pretrain/Loss": 2.0298352241516113, "Full-pretrain/Loss (Raw)": 2.0766360759735107, "Full-pretrain/Step": 1605, "Full-pretrain/Step Time": 17.628948723897338} +{"Full-pretrain/Learning Rate": 4.752948192635198e-05, "Full-pretrain/Loss": 2.0408496856689453, "Full-pretrain/Loss (Raw)": 2.399200677871704, "Full-pretrain/Step": 1606, "Full-pretrain/Step Time": 17.631199026480317} +{"Full-pretrain/Learning Rate": 4.752580032300309e-05, "Full-pretrain/Loss": 2.0327820777893066, "Full-pretrain/Loss (Raw)": 1.8925925493240356, "Full-pretrain/Step": 1607, "Full-pretrain/Step Time": 17.63360949419439} +{"Full-pretrain/Learning Rate": 4.752211612131104e-05, "Full-pretrain/Loss": 2.0295886993408203, "Full-pretrain/Loss (Raw)": 2.0781781673431396, "Full-pretrain/Step": 1608, "Full-pretrain/Step Time": 17.63799975812435} +{"Full-pretrain/Learning Rate": 4.751842932170082e-05, "Full-pretrain/Loss": 2.031970500946045, "Full-pretrain/Loss (Raw)": 2.147052764892578, "Full-pretrain/Step": 1609, "Full-pretrain/Step Time": 17.634449247270823} +{"Full-pretrain/Learning Rate": 4.7514739924597686e-05, "Full-pretrain/Loss": 2.0482254028320312, "Full-pretrain/Loss (Raw)": 2.5088515281677246, "Full-pretrain/Step": 1610, "Full-pretrain/Step Time": 17.638338653370738} +{"Full-pretrain/Learning Rate": 4.751104793042722e-05, "Full-pretrain/Loss": 2.0443310737609863, "Full-pretrain/Loss (Raw)": 1.8196723461151123, "Full-pretrain/Step": 1611, "Full-pretrain/Step Time": 17.63881553336978} +{"Full-pretrain/Learning Rate": 4.7507353339615275e-05, "Full-pretrain/Loss": 2.04777193069458, "Full-pretrain/Loss (Raw)": 2.0797359943389893, "Full-pretrain/Step": 1612, "Full-pretrain/Step Time": 17.63978567160666} +{"Full-pretrain/Learning Rate": 4.7503656152588036e-05, "Full-pretrain/Loss": 2.052675724029541, "Full-pretrain/Loss (Raw)": 1.9364080429077148, "Full-pretrain/Step": 1613, "Full-pretrain/Step Time": 17.642469011247158} +{"Full-pretrain/Learning Rate": 4.749995636977197e-05, "Full-pretrain/Loss": 2.0310497283935547, "Full-pretrain/Loss (Raw)": 1.5909662246704102, "Full-pretrain/Step": 1614, "Full-pretrain/Step Time": 17.644142411649227} +{"Full-pretrain/Learning Rate": 4.7496253991593844e-05, "Full-pretrain/Loss": 2.0467453002929688, "Full-pretrain/Loss (Raw)": 2.5917704105377197, "Full-pretrain/Step": 1615, "Full-pretrain/Step Time": 17.655523689463735} +{"Full-pretrain/Learning Rate": 4.749254901848073e-05, "Full-pretrain/Loss": 2.0395076274871826, "Full-pretrain/Loss (Raw)": 1.8840800523757935, "Full-pretrain/Step": 1616, "Full-pretrain/Step Time": 17.658660165965557} +{"Full-pretrain/Learning Rate": 4.7488841450859975e-05, "Full-pretrain/Loss": 2.0294222831726074, "Full-pretrain/Loss (Raw)": 1.7646198272705078, "Full-pretrain/Step": 1617, "Full-pretrain/Step Time": 17.64919582940638} +{"Full-pretrain/Learning Rate": 4.7485131289159276e-05, "Full-pretrain/Loss": 2.0367820262908936, "Full-pretrain/Loss (Raw)": 1.9929969310760498, "Full-pretrain/Step": 1618, "Full-pretrain/Step Time": 17.653669321909547} +{"Full-pretrain/Learning Rate": 4.7481418533806586e-05, "Full-pretrain/Loss": 2.037875175476074, "Full-pretrain/Loss (Raw)": 1.963633418083191, "Full-pretrain/Step": 1619, "Full-pretrain/Step Time": 17.65410508029163} +{"Full-pretrain/Learning Rate": 4.747770318523016e-05, "Full-pretrain/Loss": 2.0363874435424805, "Full-pretrain/Loss (Raw)": 2.0449416637420654, "Full-pretrain/Step": 1620, "Full-pretrain/Step Time": 17.656021907925606} +{"Full-pretrain/Learning Rate": 4.7473985243858575e-05, "Full-pretrain/Loss": 2.0405774116516113, "Full-pretrain/Loss (Raw)": 2.0817456245422363, "Full-pretrain/Step": 1621, "Full-pretrain/Step Time": 17.650939801707864} +{"Full-pretrain/Learning Rate": 4.7470264710120697e-05, "Full-pretrain/Loss": 2.0396459102630615, "Full-pretrain/Loss (Raw)": 2.083198308944702, "Full-pretrain/Step": 1622, "Full-pretrain/Step Time": 17.657101886346936} +{"Full-pretrain/Learning Rate": 4.746654158444567e-05, "Full-pretrain/Loss": 2.030996322631836, "Full-pretrain/Loss (Raw)": 1.7967641353607178, "Full-pretrain/Step": 1623, "Full-pretrain/Step Time": 17.65797788836062} +{"Full-pretrain/Learning Rate": 4.7462815867262964e-05, "Full-pretrain/Loss": 2.0321409702301025, "Full-pretrain/Loss (Raw)": 1.8925790786743164, "Full-pretrain/Step": 1624, "Full-pretrain/Step Time": 17.66203329153359} +{"Full-pretrain/Learning Rate": 4.745908755900236e-05, "Full-pretrain/Loss": 2.0261106491088867, "Full-pretrain/Loss (Raw)": 2.1036601066589355, "Full-pretrain/Step": 1625, "Full-pretrain/Step Time": 17.65560291148722} +{"Full-pretrain/Learning Rate": 4.7455356660093886e-05, "Full-pretrain/Loss": 2.024665117263794, "Full-pretrain/Loss (Raw)": 2.097930431365967, "Full-pretrain/Step": 1626, "Full-pretrain/Step Time": 17.660719215869904} +{"Full-pretrain/Learning Rate": 4.745162317096791e-05, "Full-pretrain/Loss": 2.014281749725342, "Full-pretrain/Loss (Raw)": 1.85767662525177, "Full-pretrain/Step": 1627, "Full-pretrain/Step Time": 17.66334694996476} +{"Full-pretrain/Learning Rate": 4.7447887092055095e-05, "Full-pretrain/Loss": 2.0203213691711426, "Full-pretrain/Loss (Raw)": 2.0462634563446045, "Full-pretrain/Step": 1628, "Full-pretrain/Step Time": 17.665799057111144} +{"Full-pretrain/Learning Rate": 4.744414842378639e-05, "Full-pretrain/Loss": 2.025176525115967, "Full-pretrain/Loss (Raw)": 2.109182834625244, "Full-pretrain/Step": 1629, "Full-pretrain/Step Time": 17.663214636966586} +{"Full-pretrain/Learning Rate": 4.744040716659306e-05, "Full-pretrain/Loss": 2.0328965187072754, "Full-pretrain/Loss (Raw)": 2.046677350997925, "Full-pretrain/Step": 1630, "Full-pretrain/Step Time": 17.664916813373566} +{"Full-pretrain/Learning Rate": 4.7436663320906636e-05, "Full-pretrain/Loss": 2.0339207649230957, "Full-pretrain/Loss (Raw)": 2.102381467819214, "Full-pretrain/Step": 1631, "Full-pretrain/Step Time": 17.665269574150443} +{"Full-pretrain/Learning Rate": 4.7432916887158993e-05, "Full-pretrain/Loss": 2.0380959510803223, "Full-pretrain/Loss (Raw)": 2.2021427154541016, "Full-pretrain/Step": 1632, "Full-pretrain/Step Time": 17.66683003678918} +{"Full-pretrain/Learning Rate": 4.742916786578227e-05, "Full-pretrain/Loss": 2.034025192260742, "Full-pretrain/Loss (Raw)": 1.9345755577087402, "Full-pretrain/Step": 1633, "Full-pretrain/Step Time": 17.66448518075049} +{"Full-pretrain/Learning Rate": 4.742541625720892e-05, "Full-pretrain/Loss": 2.0324227809906006, "Full-pretrain/Loss (Raw)": 1.961515188217163, "Full-pretrain/Step": 1634, "Full-pretrain/Step Time": 17.669030275195837} +{"Full-pretrain/Learning Rate": 4.7421662061871674e-05, "Full-pretrain/Loss": 2.0260331630706787, "Full-pretrain/Loss (Raw)": 1.8914868831634521, "Full-pretrain/Step": 1635, "Full-pretrain/Step Time": 17.66815094090998} +{"Full-pretrain/Learning Rate": 4.7417905280203594e-05, "Full-pretrain/Loss": 2.026310443878174, "Full-pretrain/Loss (Raw)": 1.8628178834915161, "Full-pretrain/Step": 1636, "Full-pretrain/Step Time": 17.669092506170273} +{"Full-pretrain/Learning Rate": 4.741414591263802e-05, "Full-pretrain/Loss": 2.0168867111206055, "Full-pretrain/Loss (Raw)": 1.7750718593597412, "Full-pretrain/Step": 1637, "Full-pretrain/Step Time": 17.668884048238397} +{"Full-pretrain/Learning Rate": 4.741038395960859e-05, "Full-pretrain/Loss": 2.0097639560699463, "Full-pretrain/Loss (Raw)": 2.171278476715088, "Full-pretrain/Step": 1638, "Full-pretrain/Step Time": 17.668191323056817} +{"Full-pretrain/Learning Rate": 4.740661942154925e-05, "Full-pretrain/Loss": 2.009012222290039, "Full-pretrain/Loss (Raw)": 1.8685332536697388, "Full-pretrain/Step": 1639, "Full-pretrain/Step Time": 17.669103944674134} +{"Full-pretrain/Learning Rate": 4.740285229889423e-05, "Full-pretrain/Loss": 1.9972221851348877, "Full-pretrain/Loss (Raw)": 1.7009003162384033, "Full-pretrain/Step": 1640, "Full-pretrain/Step Time": 17.667739674448967} +{"Full-pretrain/Learning Rate": 4.739908259207807e-05, "Full-pretrain/Loss": 2.000365972518921, "Full-pretrain/Loss (Raw)": 2.247654438018799, "Full-pretrain/Step": 1641, "Full-pretrain/Step Time": 17.668866984546185} +{"Full-pretrain/Learning Rate": 4.73953103015356e-05, "Full-pretrain/Loss": 1.9845242500305176, "Full-pretrain/Loss (Raw)": 2.001917839050293, "Full-pretrain/Step": 1642, "Full-pretrain/Step Time": 17.66590970568359} +{"Full-pretrain/Learning Rate": 4.7391535427701966e-05, "Full-pretrain/Loss": 1.9920034408569336, "Full-pretrain/Loss (Raw)": 2.059001922607422, "Full-pretrain/Step": 1643, "Full-pretrain/Step Time": 17.666214836761355} +{"Full-pretrain/Learning Rate": 4.738775797101258e-05, "Full-pretrain/Loss": 1.9866352081298828, "Full-pretrain/Loss (Raw)": 1.9079539775848389, "Full-pretrain/Step": 1644, "Full-pretrain/Step Time": 17.668533535674214} +{"Full-pretrain/Learning Rate": 4.738397793190319e-05, "Full-pretrain/Loss": 1.9935353994369507, "Full-pretrain/Loss (Raw)": 2.1572139263153076, "Full-pretrain/Step": 1645, "Full-pretrain/Step Time": 17.66479679197073} +{"Full-pretrain/Learning Rate": 4.7380195310809806e-05, "Full-pretrain/Loss": 1.9974241256713867, "Full-pretrain/Loss (Raw)": 1.7154057025909424, "Full-pretrain/Step": 1646, "Full-pretrain/Step Time": 17.660495597869158} +{"Full-pretrain/Learning Rate": 4.7376410108168753e-05, "Full-pretrain/Loss": 1.9802093505859375, "Full-pretrain/Loss (Raw)": 2.0408976078033447, "Full-pretrain/Step": 1647, "Full-pretrain/Step Time": 17.65804897993803} +{"Full-pretrain/Learning Rate": 4.737262232441667e-05, "Full-pretrain/Loss": 1.9974334239959717, "Full-pretrain/Loss (Raw)": 2.435253620147705, "Full-pretrain/Step": 1648, "Full-pretrain/Step Time": 17.66081009991467} +{"Full-pretrain/Learning Rate": 4.736883195999045e-05, "Full-pretrain/Loss": 2.0156893730163574, "Full-pretrain/Loss (Raw)": 2.348802089691162, "Full-pretrain/Step": 1649, "Full-pretrain/Step Time": 17.661969354376197} +{"Full-pretrain/Learning Rate": 4.736503901532734e-05, "Full-pretrain/Loss": 2.022686004638672, "Full-pretrain/Loss (Raw)": 2.216897964477539, "Full-pretrain/Step": 1650, "Full-pretrain/Step Time": 17.665048887953162} +{"Full-pretrain/Learning Rate": 4.736124349086482e-05, "Full-pretrain/Loss": 2.0214579105377197, "Full-pretrain/Loss (Raw)": 1.9243342876434326, "Full-pretrain/Step": 1651, "Full-pretrain/Step Time": 17.65823931619525} +{"Full-pretrain/Learning Rate": 4.7357445387040746e-05, "Full-pretrain/Loss": 2.0318098068237305, "Full-pretrain/Loss (Raw)": 2.37620210647583, "Full-pretrain/Step": 1652, "Full-pretrain/Step Time": 17.659644735977054} +{"Full-pretrain/Learning Rate": 4.7353644704293185e-05, "Full-pretrain/Loss": 2.031113624572754, "Full-pretrain/Loss (Raw)": 2.059462785720825, "Full-pretrain/Step": 1653, "Full-pretrain/Step Time": 17.66324796155095} +{"Full-pretrain/Learning Rate": 4.734984144306057e-05, "Full-pretrain/Loss": 2.0225110054016113, "Full-pretrain/Loss (Raw)": 1.8079184293746948, "Full-pretrain/Step": 1654, "Full-pretrain/Step Time": 17.658066034317017} +{"Full-pretrain/Learning Rate": 4.73460356037816e-05, "Full-pretrain/Loss": 2.032895565032959, "Full-pretrain/Loss (Raw)": 2.1290698051452637, "Full-pretrain/Step": 1655, "Full-pretrain/Step Time": 17.664199374616146} +{"Full-pretrain/Learning Rate": 4.7342227186895275e-05, "Full-pretrain/Loss": 2.0308403968811035, "Full-pretrain/Loss (Raw)": 1.8268102407455444, "Full-pretrain/Step": 1656, "Full-pretrain/Step Time": 17.658734615892172} +{"Full-pretrain/Learning Rate": 4.733841619284089e-05, "Full-pretrain/Loss": 2.0328266620635986, "Full-pretrain/Loss (Raw)": 2.167222738265991, "Full-pretrain/Step": 1657, "Full-pretrain/Step Time": 17.65617671236396} +{"Full-pretrain/Learning Rate": 4.733460262205805e-05, "Full-pretrain/Loss": 2.0295300483703613, "Full-pretrain/Loss (Raw)": 1.9924355745315552, "Full-pretrain/Step": 1658, "Full-pretrain/Step Time": 17.65458944439888} +{"Full-pretrain/Learning Rate": 4.733078647498665e-05, "Full-pretrain/Loss": 2.03069806098938, "Full-pretrain/Loss (Raw)": 1.8950583934783936, "Full-pretrain/Step": 1659, "Full-pretrain/Step Time": 17.65976599045098} +{"Full-pretrain/Learning Rate": 4.732696775206688e-05, "Full-pretrain/Loss": 2.023540496826172, "Full-pretrain/Loss (Raw)": 1.817215919494629, "Full-pretrain/Step": 1660, "Full-pretrain/Step Time": 17.656083354726434} +{"Full-pretrain/Learning Rate": 4.732314645373921e-05, "Full-pretrain/Loss": 2.0142643451690674, "Full-pretrain/Loss (Raw)": 1.8123502731323242, "Full-pretrain/Step": 1661, "Full-pretrain/Step Time": 17.65594041533768} +{"Full-pretrain/Learning Rate": 4.731932258044446e-05, "Full-pretrain/Loss": 2.0171031951904297, "Full-pretrain/Loss (Raw)": 2.1375255584716797, "Full-pretrain/Step": 1662, "Full-pretrain/Step Time": 17.658451745286584} +{"Full-pretrain/Learning Rate": 4.731549613262368e-05, "Full-pretrain/Loss": 2.011866569519043, "Full-pretrain/Loss (Raw)": 1.9348063468933105, "Full-pretrain/Step": 1663, "Full-pretrain/Step Time": 17.662494285032153} +{"Full-pretrain/Learning Rate": 4.731166711071827e-05, "Full-pretrain/Loss": 2.0038676261901855, "Full-pretrain/Loss (Raw)": 1.9461766481399536, "Full-pretrain/Step": 1664, "Full-pretrain/Step Time": 17.657293409109116} +{"Full-pretrain/Learning Rate": 4.730783551516991e-05, "Full-pretrain/Loss": 2.006330728530884, "Full-pretrain/Loss (Raw)": 2.0133886337280273, "Full-pretrain/Step": 1665, "Full-pretrain/Step Time": 17.659079944714904} +{"Full-pretrain/Learning Rate": 4.730400134642055e-05, "Full-pretrain/Loss": 2.0070180892944336, "Full-pretrain/Loss (Raw)": 1.9835090637207031, "Full-pretrain/Step": 1666, "Full-pretrain/Step Time": 17.660353308543563} +{"Full-pretrain/Learning Rate": 4.7300164604912475e-05, "Full-pretrain/Loss": 2.0146000385284424, "Full-pretrain/Loss (Raw)": 2.1341142654418945, "Full-pretrain/Step": 1667, "Full-pretrain/Step Time": 17.65922012552619} +{"Full-pretrain/Learning Rate": 4.729632529108825e-05, "Full-pretrain/Loss": 2.029446840286255, "Full-pretrain/Loss (Raw)": 2.337916135787964, "Full-pretrain/Step": 1668, "Full-pretrain/Step Time": 17.652114177122712} +{"Full-pretrain/Learning Rate": 4.7292483405390736e-05, "Full-pretrain/Loss": 2.033888578414917, "Full-pretrain/Loss (Raw)": 1.9172059297561646, "Full-pretrain/Step": 1669, "Full-pretrain/Step Time": 17.648783519864082} +{"Full-pretrain/Learning Rate": 4.72886389482631e-05, "Full-pretrain/Loss": 2.021902084350586, "Full-pretrain/Loss (Raw)": 1.7877098321914673, "Full-pretrain/Step": 1670, "Full-pretrain/Step Time": 17.649380469694734} +{"Full-pretrain/Learning Rate": 4.7284791920148784e-05, "Full-pretrain/Loss": 2.028904914855957, "Full-pretrain/Loss (Raw)": 2.0926215648651123, "Full-pretrain/Step": 1671, "Full-pretrain/Step Time": 17.650914112105966} +{"Full-pretrain/Learning Rate": 4.728094232149156e-05, "Full-pretrain/Loss": 2.039750814437866, "Full-pretrain/Loss (Raw)": 2.047968864440918, "Full-pretrain/Step": 1672, "Full-pretrain/Step Time": 17.646227398887277} +{"Full-pretrain/Learning Rate": 4.727709015273547e-05, "Full-pretrain/Loss": 2.0359809398651123, "Full-pretrain/Loss (Raw)": 2.127023935317993, "Full-pretrain/Step": 1673, "Full-pretrain/Step Time": 17.646850435063243} +{"Full-pretrain/Learning Rate": 4.727323541432486e-05, "Full-pretrain/Loss": 2.035701036453247, "Full-pretrain/Loss (Raw)": 1.992958664894104, "Full-pretrain/Step": 1674, "Full-pretrain/Step Time": 17.648138623684645} +{"Full-pretrain/Learning Rate": 4.726937810670437e-05, "Full-pretrain/Loss": 2.0327582359313965, "Full-pretrain/Loss (Raw)": 1.964832067489624, "Full-pretrain/Step": 1675, "Full-pretrain/Step Time": 17.644628826528788} +{"Full-pretrain/Learning Rate": 4.7265518230318944e-05, "Full-pretrain/Loss": 2.033433198928833, "Full-pretrain/Loss (Raw)": 1.9295538663864136, "Full-pretrain/Step": 1676, "Full-pretrain/Step Time": 17.642670784145594} +{"Full-pretrain/Learning Rate": 4.7261655785613814e-05, "Full-pretrain/Loss": 2.0274643898010254, "Full-pretrain/Loss (Raw)": 1.9662058353424072, "Full-pretrain/Step": 1677, "Full-pretrain/Step Time": 17.637660715728998} +{"Full-pretrain/Learning Rate": 4.725779077303451e-05, "Full-pretrain/Loss": 2.038431167602539, "Full-pretrain/Loss (Raw)": 2.0663504600524902, "Full-pretrain/Step": 1678, "Full-pretrain/Step Time": 17.6409472245723} +{"Full-pretrain/Learning Rate": 4.7253923193026863e-05, "Full-pretrain/Loss": 2.0376553535461426, "Full-pretrain/Loss (Raw)": 2.016066551208496, "Full-pretrain/Step": 1679, "Full-pretrain/Step Time": 17.639655405655503} +{"Full-pretrain/Learning Rate": 4.7250053046036994e-05, "Full-pretrain/Loss": 2.0211563110351562, "Full-pretrain/Loss (Raw)": 1.9072825908660889, "Full-pretrain/Step": 1680, "Full-pretrain/Step Time": 17.641350466758013} +{"Full-pretrain/Learning Rate": 4.724618033251133e-05, "Full-pretrain/Loss": 2.0085887908935547, "Full-pretrain/Loss (Raw)": 1.9466383457183838, "Full-pretrain/Step": 1681, "Full-pretrain/Step Time": 17.641145398840308} +{"Full-pretrain/Learning Rate": 4.724230505289658e-05, "Full-pretrain/Loss": 1.9984610080718994, "Full-pretrain/Loss (Raw)": 1.8928149938583374, "Full-pretrain/Step": 1682, "Full-pretrain/Step Time": 17.6427429523319} +{"Full-pretrain/Learning Rate": 4.723842720763976e-05, "Full-pretrain/Loss": 2.0065014362335205, "Full-pretrain/Loss (Raw)": 2.181628704071045, "Full-pretrain/Step": 1683, "Full-pretrain/Step Time": 17.640809919685125} +{"Full-pretrain/Learning Rate": 4.723454679718817e-05, "Full-pretrain/Loss": 1.9998239278793335, "Full-pretrain/Loss (Raw)": 2.1625232696533203, "Full-pretrain/Step": 1684, "Full-pretrain/Step Time": 17.643479676917195} +{"Full-pretrain/Learning Rate": 4.723066382198943e-05, "Full-pretrain/Loss": 1.9878884553909302, "Full-pretrain/Loss (Raw)": 1.6775258779525757, "Full-pretrain/Step": 1685, "Full-pretrain/Step Time": 17.647611251100898} +{"Full-pretrain/Learning Rate": 4.7226778282491424e-05, "Full-pretrain/Loss": 1.9979403018951416, "Full-pretrain/Loss (Raw)": 2.1295762062072754, "Full-pretrain/Step": 1686, "Full-pretrain/Step Time": 17.65021854825318} +{"Full-pretrain/Learning Rate": 4.722289017914236e-05, "Full-pretrain/Loss": 1.9956936836242676, "Full-pretrain/Loss (Raw)": 2.0571789741516113, "Full-pretrain/Step": 1687, "Full-pretrain/Step Time": 17.644069585949183} +{"Full-pretrain/Learning Rate": 4.721899951239072e-05, "Full-pretrain/Loss": 2.0037336349487305, "Full-pretrain/Loss (Raw)": 2.084089756011963, "Full-pretrain/Step": 1688, "Full-pretrain/Step Time": 17.64633120968938} +{"Full-pretrain/Learning Rate": 4.72151062826853e-05, "Full-pretrain/Loss": 2.000638484954834, "Full-pretrain/Loss (Raw)": 2.068183422088623, "Full-pretrain/Step": 1689, "Full-pretrain/Step Time": 17.63950409181416} +{"Full-pretrain/Learning Rate": 4.721121049047517e-05, "Full-pretrain/Loss": 2.007519245147705, "Full-pretrain/Loss (Raw)": 2.212610960006714, "Full-pretrain/Step": 1690, "Full-pretrain/Step Time": 17.63836338557303} +{"Full-pretrain/Learning Rate": 4.720731213620972e-05, "Full-pretrain/Loss": 2.016606569290161, "Full-pretrain/Loss (Raw)": 2.1858553886413574, "Full-pretrain/Step": 1691, "Full-pretrain/Step Time": 17.6316757183522} +{"Full-pretrain/Learning Rate": 4.720341122033862e-05, "Full-pretrain/Loss": 2.025575637817383, "Full-pretrain/Loss (Raw)": 2.1042284965515137, "Full-pretrain/Step": 1692, "Full-pretrain/Step Time": 17.63429019600153} +{"Full-pretrain/Learning Rate": 4.719950774331183e-05, "Full-pretrain/Loss": 2.0339431762695312, "Full-pretrain/Loss (Raw)": 2.080111026763916, "Full-pretrain/Step": 1693, "Full-pretrain/Step Time": 17.627971524372697} +{"Full-pretrain/Learning Rate": 4.7195601705579626e-05, "Full-pretrain/Loss": 2.027580738067627, "Full-pretrain/Loss (Raw)": 1.9339251518249512, "Full-pretrain/Step": 1694, "Full-pretrain/Step Time": 17.62947141751647} +{"Full-pretrain/Learning Rate": 4.719169310759257e-05, "Full-pretrain/Loss": 2.0330376625061035, "Full-pretrain/Loss (Raw)": 2.1094281673431396, "Full-pretrain/Step": 1695, "Full-pretrain/Step Time": 17.627548662945628} +{"Full-pretrain/Learning Rate": 4.7187781949801514e-05, "Full-pretrain/Loss": 2.03834867477417, "Full-pretrain/Loss (Raw)": 2.1161341667175293, "Full-pretrain/Step": 1696, "Full-pretrain/Step Time": 17.622964546084404} +{"Full-pretrain/Learning Rate": 4.71838682326576e-05, "Full-pretrain/Loss": 2.0381431579589844, "Full-pretrain/Loss (Raw)": 2.006809711456299, "Full-pretrain/Step": 1697, "Full-pretrain/Step Time": 17.62274939380586} +{"Full-pretrain/Learning Rate": 4.717995195661229e-05, "Full-pretrain/Loss": 2.0417966842651367, "Full-pretrain/Loss (Raw)": 2.100421905517578, "Full-pretrain/Step": 1698, "Full-pretrain/Step Time": 17.628761371597648} +{"Full-pretrain/Learning Rate": 4.7176033122117317e-05, "Full-pretrain/Loss": 2.04091215133667, "Full-pretrain/Loss (Raw)": 2.1058106422424316, "Full-pretrain/Step": 1699, "Full-pretrain/Step Time": 17.621859069913626} +{"Full-pretrain/Learning Rate": 4.7172111729624706e-05, "Full-pretrain/Loss": 2.032395839691162, "Full-pretrain/Loss (Raw)": 2.065394878387451, "Full-pretrain/Step": 1700, "Full-pretrain/Step Time": 17.62578647583723} +{"Full-pretrain/Learning Rate": 4.71681877795868e-05, "Full-pretrain/Loss": 2.040147304534912, "Full-pretrain/Loss (Raw)": 2.165256977081299, "Full-pretrain/Step": 1701, "Full-pretrain/Step Time": 17.624932451173663} +{"Full-pretrain/Learning Rate": 4.716426127245624e-05, "Full-pretrain/Loss": 2.0410008430480957, "Full-pretrain/Loss (Raw)": 1.8150136470794678, "Full-pretrain/Step": 1702, "Full-pretrain/Step Time": 17.621496479958296} +{"Full-pretrain/Learning Rate": 4.716033220868592e-05, "Full-pretrain/Loss": 2.0344653129577637, "Full-pretrain/Loss (Raw)": 1.8834893703460693, "Full-pretrain/Step": 1703, "Full-pretrain/Step Time": 17.614922372624278} +{"Full-pretrain/Learning Rate": 4.7156400588729066e-05, "Full-pretrain/Loss": 2.034320592880249, "Full-pretrain/Loss (Raw)": 2.043337106704712, "Full-pretrain/Step": 1704, "Full-pretrain/Step Time": 17.61956214159727} +{"Full-pretrain/Learning Rate": 4.7152466413039184e-05, "Full-pretrain/Loss": 2.021273612976074, "Full-pretrain/Loss (Raw)": 1.7095215320587158, "Full-pretrain/Step": 1705, "Full-pretrain/Step Time": 17.611894454807043} +{"Full-pretrain/Learning Rate": 4.71485296820701e-05, "Full-pretrain/Loss": 2.025519371032715, "Full-pretrain/Loss (Raw)": 2.1288199424743652, "Full-pretrain/Step": 1706, "Full-pretrain/Step Time": 17.611730121076107} +{"Full-pretrain/Learning Rate": 4.7144590396275896e-05, "Full-pretrain/Loss": 2.0243752002716064, "Full-pretrain/Loss (Raw)": 1.9282203912734985, "Full-pretrain/Step": 1707, "Full-pretrain/Step Time": 17.605368826538324} +{"Full-pretrain/Learning Rate": 4.714064855611097e-05, "Full-pretrain/Loss": 2.028517246246338, "Full-pretrain/Loss (Raw)": 2.0620970726013184, "Full-pretrain/Step": 1708, "Full-pretrain/Step Time": 17.609828451648355} +{"Full-pretrain/Learning Rate": 4.713670416203001e-05, "Full-pretrain/Loss": 2.0298550128936768, "Full-pretrain/Loss (Raw)": 2.0090107917785645, "Full-pretrain/Step": 1709, "Full-pretrain/Step Time": 17.607653820887208} +{"Full-pretrain/Learning Rate": 4.7132757214488013e-05, "Full-pretrain/Loss": 2.0328965187072754, "Full-pretrain/Loss (Raw)": 2.1636791229248047, "Full-pretrain/Step": 1710, "Full-pretrain/Step Time": 17.607927607372403} +{"Full-pretrain/Learning Rate": 4.712880771394024e-05, "Full-pretrain/Loss": 2.0259311199188232, "Full-pretrain/Loss (Raw)": 1.793174386024475, "Full-pretrain/Step": 1711, "Full-pretrain/Step Time": 17.609630594030023} +{"Full-pretrain/Learning Rate": 4.712485566084228e-05, "Full-pretrain/Loss": 2.0337677001953125, "Full-pretrain/Loss (Raw)": 2.1580557823181152, "Full-pretrain/Step": 1712, "Full-pretrain/Step Time": 17.610082713887095} +{"Full-pretrain/Learning Rate": 4.712090105565e-05, "Full-pretrain/Loss": 2.036531925201416, "Full-pretrain/Loss (Raw)": 2.0350942611694336, "Full-pretrain/Step": 1713, "Full-pretrain/Step Time": 17.60798236913979} +{"Full-pretrain/Learning Rate": 4.7116943898819546e-05, "Full-pretrain/Loss": 2.043233871459961, "Full-pretrain/Loss (Raw)": 2.107273578643799, "Full-pretrain/Step": 1714, "Full-pretrain/Step Time": 17.601402197033167} +{"Full-pretrain/Learning Rate": 4.711298419080739e-05, "Full-pretrain/Loss": 2.0357513427734375, "Full-pretrain/Loss (Raw)": 1.9421887397766113, "Full-pretrain/Step": 1715, "Full-pretrain/Step Time": 17.60513362661004} +{"Full-pretrain/Learning Rate": 4.710902193207029e-05, "Full-pretrain/Loss": 2.03639554977417, "Full-pretrain/Loss (Raw)": 2.183143138885498, "Full-pretrain/Step": 1716, "Full-pretrain/Step Time": 17.607176246121526} +{"Full-pretrain/Learning Rate": 4.710505712306526e-05, "Full-pretrain/Loss": 2.0406150817871094, "Full-pretrain/Loss (Raw)": 1.8125495910644531, "Full-pretrain/Step": 1717, "Full-pretrain/Step Time": 17.60866274125874} +{"Full-pretrain/Learning Rate": 4.710108976424967e-05, "Full-pretrain/Loss": 2.0403223037719727, "Full-pretrain/Loss (Raw)": 2.1202049255371094, "Full-pretrain/Step": 1718, "Full-pretrain/Step Time": 17.601993817836046} +{"Full-pretrain/Learning Rate": 4.709711985608114e-05, "Full-pretrain/Loss": 2.0374269485473633, "Full-pretrain/Loss (Raw)": 1.964524507522583, "Full-pretrain/Step": 1719, "Full-pretrain/Step Time": 17.599096219986677} +{"Full-pretrain/Learning Rate": 4.7093147399017604e-05, "Full-pretrain/Loss": 2.0228261947631836, "Full-pretrain/Loss (Raw)": 1.616869330406189, "Full-pretrain/Step": 1720, "Full-pretrain/Step Time": 17.600518319755793} +{"Full-pretrain/Learning Rate": 4.708917239351727e-05, "Full-pretrain/Loss": 2.0275990962982178, "Full-pretrain/Loss (Raw)": 2.220916748046875, "Full-pretrain/Step": 1721, "Full-pretrain/Step Time": 17.60581485927105} +{"Full-pretrain/Learning Rate": 4.708519484003867e-05, "Full-pretrain/Loss": 2.0180137157440186, "Full-pretrain/Loss (Raw)": 1.9058802127838135, "Full-pretrain/Step": 1722, "Full-pretrain/Step Time": 17.59794794395566} +{"Full-pretrain/Learning Rate": 4.708121473904061e-05, "Full-pretrain/Loss": 2.018383264541626, "Full-pretrain/Loss (Raw)": 2.197678565979004, "Full-pretrain/Step": 1723, "Full-pretrain/Step Time": 17.605789674445987} +{"Full-pretrain/Learning Rate": 4.707723209098218e-05, "Full-pretrain/Loss": 2.01702880859375, "Full-pretrain/Loss (Raw)": 2.0608859062194824, "Full-pretrain/Step": 1724, "Full-pretrain/Step Time": 17.598697802051902} +{"Full-pretrain/Learning Rate": 4.70732468963228e-05, "Full-pretrain/Loss": 2.015275478363037, "Full-pretrain/Loss (Raw)": 2.0240015983581543, "Full-pretrain/Step": 1725, "Full-pretrain/Step Time": 17.60541162826121} +{"Full-pretrain/Learning Rate": 4.7069259155522135e-05, "Full-pretrain/Loss": 2.0194671154022217, "Full-pretrain/Loss (Raw)": 2.0680594444274902, "Full-pretrain/Step": 1726, "Full-pretrain/Step Time": 17.603064604103565} +{"Full-pretrain/Learning Rate": 4.706526886904019e-05, "Full-pretrain/Loss": 2.0132150650024414, "Full-pretrain/Loss (Raw)": 1.9093639850616455, "Full-pretrain/Step": 1727, "Full-pretrain/Step Time": 17.60546311363578} +{"Full-pretrain/Learning Rate": 4.706127603733723e-05, "Full-pretrain/Loss": 2.0158472061157227, "Full-pretrain/Loss (Raw)": 2.200364112854004, "Full-pretrain/Step": 1728, "Full-pretrain/Step Time": 17.60126625932753} +{"Full-pretrain/Learning Rate": 4.7057280660873835e-05, "Full-pretrain/Loss": 2.0180745124816895, "Full-pretrain/Loss (Raw)": 2.0780816078186035, "Full-pretrain/Step": 1729, "Full-pretrain/Step Time": 17.60293329693377} +{"Full-pretrain/Learning Rate": 4.705328274011086e-05, "Full-pretrain/Loss": 2.01995587348938, "Full-pretrain/Loss (Raw)": 2.1606225967407227, "Full-pretrain/Step": 1730, "Full-pretrain/Step Time": 17.599931851029396} +{"Full-pretrain/Learning Rate": 4.704928227550949e-05, "Full-pretrain/Loss": 2.0147361755371094, "Full-pretrain/Loss (Raw)": 1.9387800693511963, "Full-pretrain/Step": 1731, "Full-pretrain/Step Time": 17.598829029127955} +{"Full-pretrain/Learning Rate": 4.704527926753114e-05, "Full-pretrain/Loss": 2.0129876136779785, "Full-pretrain/Loss (Raw)": 2.0094451904296875, "Full-pretrain/Step": 1732, "Full-pretrain/Step Time": 17.60786994546652} +{"Full-pretrain/Learning Rate": 4.704127371663758e-05, "Full-pretrain/Loss": 2.0119853019714355, "Full-pretrain/Loss (Raw)": 2.1331799030303955, "Full-pretrain/Step": 1733, "Full-pretrain/Step Time": 17.601249430328608} +{"Full-pretrain/Learning Rate": 4.7037265623290836e-05, "Full-pretrain/Loss": 2.0106565952301025, "Full-pretrain/Loss (Raw)": 1.7724947929382324, "Full-pretrain/Step": 1734, "Full-pretrain/Step Time": 17.600370401516557} +{"Full-pretrain/Learning Rate": 4.703325498795326e-05, "Full-pretrain/Loss": 2.0120787620544434, "Full-pretrain/Loss (Raw)": 1.9289995431900024, "Full-pretrain/Step": 1735, "Full-pretrain/Step Time": 17.59888150729239} +{"Full-pretrain/Learning Rate": 4.7029241811087457e-05, "Full-pretrain/Loss": 2.0175063610076904, "Full-pretrain/Loss (Raw)": 2.217024087905884, "Full-pretrain/Step": 1736, "Full-pretrain/Step Time": 17.6023679189384} +{"Full-pretrain/Learning Rate": 4.702522609315635e-05, "Full-pretrain/Loss": 2.0206382274627686, "Full-pretrain/Loss (Raw)": 1.8097383975982666, "Full-pretrain/Step": 1737, "Full-pretrain/Step Time": 17.597698451951146} +{"Full-pretrain/Learning Rate": 4.702120783462316e-05, "Full-pretrain/Loss": 2.0208323001861572, "Full-pretrain/Loss (Raw)": 2.1350302696228027, "Full-pretrain/Step": 1738, "Full-pretrain/Step Time": 17.597243677824736} +{"Full-pretrain/Learning Rate": 4.7017187035951384e-05, "Full-pretrain/Loss": 2.0268959999084473, "Full-pretrain/Loss (Raw)": 2.1222598552703857, "Full-pretrain/Step": 1739, "Full-pretrain/Step Time": 17.59822665527463} +{"Full-pretrain/Learning Rate": 4.7013163697604814e-05, "Full-pretrain/Loss": 2.0305087566375732, "Full-pretrain/Loss (Raw)": 2.1777055263519287, "Full-pretrain/Step": 1740, "Full-pretrain/Step Time": 17.602876167744398} +{"Full-pretrain/Learning Rate": 4.7009137820047546e-05, "Full-pretrain/Loss": 2.028165340423584, "Full-pretrain/Loss (Raw)": 1.934028148651123, "Full-pretrain/Step": 1741, "Full-pretrain/Step Time": 17.59760166145861} +{"Full-pretrain/Learning Rate": 4.700510940374397e-05, "Full-pretrain/Loss": 2.0329079627990723, "Full-pretrain/Loss (Raw)": 2.315434455871582, "Full-pretrain/Step": 1742, "Full-pretrain/Step Time": 17.598104840144515} +{"Full-pretrain/Learning Rate": 4.700107844915876e-05, "Full-pretrain/Loss": 2.0374999046325684, "Full-pretrain/Loss (Raw)": 1.940124750137329, "Full-pretrain/Step": 1743, "Full-pretrain/Step Time": 17.594611613079906} +{"Full-pretrain/Learning Rate": 4.699704495675689e-05, "Full-pretrain/Loss": 2.0398237705230713, "Full-pretrain/Loss (Raw)": 2.2324166297912598, "Full-pretrain/Step": 1744, "Full-pretrain/Step Time": 17.595461195334792} +{"Full-pretrain/Learning Rate": 4.69930089270036e-05, "Full-pretrain/Loss": 2.0392282009124756, "Full-pretrain/Loss (Raw)": 2.0160329341888428, "Full-pretrain/Step": 1745, "Full-pretrain/Step Time": 17.6002120282501} +{"Full-pretrain/Learning Rate": 4.698897036036446e-05, "Full-pretrain/Loss": 2.053800106048584, "Full-pretrain/Loss (Raw)": 2.5735719203948975, "Full-pretrain/Step": 1746, "Full-pretrain/Step Time": 17.59584116190672} +{"Full-pretrain/Learning Rate": 4.6984929257305323e-05, "Full-pretrain/Loss": 2.0547561645507812, "Full-pretrain/Loss (Raw)": 1.9727931022644043, "Full-pretrain/Step": 1747, "Full-pretrain/Step Time": 17.595011232420802} +{"Full-pretrain/Learning Rate": 4.698088561829232e-05, "Full-pretrain/Loss": 2.040457248687744, "Full-pretrain/Loss (Raw)": 1.7255710363388062, "Full-pretrain/Step": 1748, "Full-pretrain/Step Time": 17.595671759918332} +{"Full-pretrain/Learning Rate": 4.697683944379189e-05, "Full-pretrain/Loss": 2.0348927974700928, "Full-pretrain/Loss (Raw)": 1.6344887018203735, "Full-pretrain/Step": 1749, "Full-pretrain/Step Time": 17.599348455667496} +{"Full-pretrain/Learning Rate": 4.697279073427074e-05, "Full-pretrain/Loss": 2.0389370918273926, "Full-pretrain/Loss (Raw)": 2.2496228218078613, "Full-pretrain/Step": 1750, "Full-pretrain/Step Time": 17.60180637612939} +{"Full-pretrain/Learning Rate": 4.696873949019591e-05, "Full-pretrain/Loss": 2.0436766147613525, "Full-pretrain/Loss (Raw)": 2.1161909103393555, "Full-pretrain/Step": 1751, "Full-pretrain/Step Time": 17.591299204155803} +{"Full-pretrain/Learning Rate": 4.69646857120347e-05, "Full-pretrain/Loss": 2.058852434158325, "Full-pretrain/Loss (Raw)": 2.102492332458496, "Full-pretrain/Step": 1752, "Full-pretrain/Step Time": 17.59361796081066} +{"Full-pretrain/Learning Rate": 4.696062940025471e-05, "Full-pretrain/Loss": 2.0467870235443115, "Full-pretrain/Loss (Raw)": 1.8348300457000732, "Full-pretrain/Step": 1753, "Full-pretrain/Step Time": 17.602351570501924} +{"Full-pretrain/Learning Rate": 4.695657055532384e-05, "Full-pretrain/Loss": 2.0488715171813965, "Full-pretrain/Loss (Raw)": 1.9725770950317383, "Full-pretrain/Step": 1754, "Full-pretrain/Step Time": 17.597114875912666} +{"Full-pretrain/Learning Rate": 4.695250917771027e-05, "Full-pretrain/Loss": 2.0393645763397217, "Full-pretrain/Loss (Raw)": 1.8934568166732788, "Full-pretrain/Step": 1755, "Full-pretrain/Step Time": 17.595282044261694} +{"Full-pretrain/Learning Rate": 4.6948445267882486e-05, "Full-pretrain/Loss": 2.037985324859619, "Full-pretrain/Loss (Raw)": 2.0167489051818848, "Full-pretrain/Step": 1756, "Full-pretrain/Step Time": 17.591753751039505} +{"Full-pretrain/Learning Rate": 4.6944378826309247e-05, "Full-pretrain/Loss": 2.0379161834716797, "Full-pretrain/Loss (Raw)": 2.0217976570129395, "Full-pretrain/Step": 1757, "Full-pretrain/Step Time": 17.592258416116238} +{"Full-pretrain/Learning Rate": 4.694030985345962e-05, "Full-pretrain/Loss": 2.036891222000122, "Full-pretrain/Loss (Raw)": 2.035250186920166, "Full-pretrain/Step": 1758, "Full-pretrain/Step Time": 17.592388410121202} +{"Full-pretrain/Learning Rate": 4.693623834980297e-05, "Full-pretrain/Loss": 2.0463733673095703, "Full-pretrain/Loss (Raw)": 2.212794542312622, "Full-pretrain/Step": 1759, "Full-pretrain/Step Time": 17.59279116988182} +{"Full-pretrain/Learning Rate": 4.6932164315808936e-05, "Full-pretrain/Loss": 2.0429153442382812, "Full-pretrain/Loss (Raw)": 2.0897114276885986, "Full-pretrain/Step": 1760, "Full-pretrain/Step Time": 17.592567164450884} +{"Full-pretrain/Learning Rate": 4.692808775194745e-05, "Full-pretrain/Loss": 2.0402183532714844, "Full-pretrain/Loss (Raw)": 1.9917722940444946, "Full-pretrain/Step": 1761, "Full-pretrain/Step Time": 17.59915285371244} +{"Full-pretrain/Learning Rate": 4.692400865868874e-05, "Full-pretrain/Loss": 2.037446975708008, "Full-pretrain/Loss (Raw)": 2.071944236755371, "Full-pretrain/Step": 1762, "Full-pretrain/Step Time": 17.592494543641806} +{"Full-pretrain/Learning Rate": 4.691992703650335e-05, "Full-pretrain/Loss": 2.039295196533203, "Full-pretrain/Loss (Raw)": 1.9979145526885986, "Full-pretrain/Step": 1763, "Full-pretrain/Step Time": 17.59191363491118} +{"Full-pretrain/Learning Rate": 4.691584288586207e-05, "Full-pretrain/Loss": 2.0384445190429688, "Full-pretrain/Loss (Raw)": 1.9822301864624023, "Full-pretrain/Step": 1764, "Full-pretrain/Step Time": 17.585393646731973} +{"Full-pretrain/Learning Rate": 4.691175620723602e-05, "Full-pretrain/Loss": 2.032895088195801, "Full-pretrain/Loss (Raw)": 1.9555937051773071, "Full-pretrain/Step": 1765, "Full-pretrain/Step Time": 17.583797799423337} +{"Full-pretrain/Learning Rate": 4.690766700109659e-05, "Full-pretrain/Loss": 2.0358786582946777, "Full-pretrain/Loss (Raw)": 1.8679678440093994, "Full-pretrain/Step": 1766, "Full-pretrain/Step Time": 17.5858834721148} +{"Full-pretrain/Learning Rate": 4.690357526791547e-05, "Full-pretrain/Loss": 2.031754732131958, "Full-pretrain/Loss (Raw)": 1.7970390319824219, "Full-pretrain/Step": 1767, "Full-pretrain/Step Time": 17.586379803717136} +{"Full-pretrain/Learning Rate": 4.689948100816465e-05, "Full-pretrain/Loss": 2.02860426902771, "Full-pretrain/Loss (Raw)": 2.116205930709839, "Full-pretrain/Step": 1768, "Full-pretrain/Step Time": 17.579974126070738} +{"Full-pretrain/Learning Rate": 4.6895384222316375e-05, "Full-pretrain/Loss": 2.037649154663086, "Full-pretrain/Loss (Raw)": 2.099177122116089, "Full-pretrain/Step": 1769, "Full-pretrain/Step Time": 17.57948124781251} +{"Full-pretrain/Learning Rate": 4.689128491084324e-05, "Full-pretrain/Loss": 2.0318870544433594, "Full-pretrain/Loss (Raw)": 1.9506385326385498, "Full-pretrain/Step": 1770, "Full-pretrain/Step Time": 17.58854365721345} +{"Full-pretrain/Learning Rate": 4.688718307421807e-05, "Full-pretrain/Loss": 2.032466411590576, "Full-pretrain/Loss (Raw)": 2.140800952911377, "Full-pretrain/Step": 1771, "Full-pretrain/Step Time": 17.57970936410129} +{"Full-pretrain/Learning Rate": 4.688307871291403e-05, "Full-pretrain/Loss": 2.0310754776000977, "Full-pretrain/Loss (Raw)": 2.13320255279541, "Full-pretrain/Step": 1772, "Full-pretrain/Step Time": 17.576112497597933} +{"Full-pretrain/Learning Rate": 4.687897182740455e-05, "Full-pretrain/Loss": 2.0297024250030518, "Full-pretrain/Loss (Raw)": 1.890087604522705, "Full-pretrain/Step": 1773, "Full-pretrain/Step Time": 17.580750711262226} +{"Full-pretrain/Learning Rate": 4.6874862418163364e-05, "Full-pretrain/Loss": 2.0259270668029785, "Full-pretrain/Loss (Raw)": 2.194620132446289, "Full-pretrain/Step": 1774, "Full-pretrain/Step Time": 17.5849198885262} +{"Full-pretrain/Learning Rate": 4.687075048566448e-05, "Full-pretrain/Loss": 2.0260009765625, "Full-pretrain/Loss (Raw)": 1.9424870014190674, "Full-pretrain/Step": 1775, "Full-pretrain/Step Time": 17.583427235484123} +{"Full-pretrain/Learning Rate": 4.686663603038222e-05, "Full-pretrain/Loss": 2.0225467681884766, "Full-pretrain/Loss (Raw)": 2.1218888759613037, "Full-pretrain/Step": 1776, "Full-pretrain/Step Time": 17.57922156341374} +{"Full-pretrain/Learning Rate": 4.6862519052791165e-05, "Full-pretrain/Loss": 2.02183198928833, "Full-pretrain/Loss (Raw)": 1.9931526184082031, "Full-pretrain/Step": 1777, "Full-pretrain/Step Time": 17.586067831143737} +{"Full-pretrain/Learning Rate": 4.685839955336623e-05, "Full-pretrain/Loss": 2.0070953369140625, "Full-pretrain/Loss (Raw)": 2.1020007133483887, "Full-pretrain/Step": 1778, "Full-pretrain/Step Time": 17.596269950270653} +{"Full-pretrain/Learning Rate": 4.6854277532582584e-05, "Full-pretrain/Loss": 2.012507200241089, "Full-pretrain/Loss (Raw)": 2.1459741592407227, "Full-pretrain/Step": 1779, "Full-pretrain/Step Time": 17.594863679260015} +{"Full-pretrain/Learning Rate": 4.6850152990915706e-05, "Full-pretrain/Loss": 2.015463352203369, "Full-pretrain/Loss (Raw)": 1.8201664686203003, "Full-pretrain/Step": 1780, "Full-pretrain/Step Time": 17.59605496749282} +{"Full-pretrain/Learning Rate": 4.684602592884136e-05, "Full-pretrain/Loss": 2.031217575073242, "Full-pretrain/Loss (Raw)": 2.1386215686798096, "Full-pretrain/Step": 1781, "Full-pretrain/Step Time": 17.594758454710245} +{"Full-pretrain/Learning Rate": 4.68418963468356e-05, "Full-pretrain/Loss": 2.023386240005493, "Full-pretrain/Loss (Raw)": 1.9990278482437134, "Full-pretrain/Step": 1782, "Full-pretrain/Step Time": 17.59556102193892} +{"Full-pretrain/Learning Rate": 4.6837764245374774e-05, "Full-pretrain/Loss": 2.01794171333313, "Full-pretrain/Loss (Raw)": 1.941957712173462, "Full-pretrain/Step": 1783, "Full-pretrain/Step Time": 17.59271034412086} +{"Full-pretrain/Learning Rate": 4.683362962493552e-05, "Full-pretrain/Loss": 2.0172433853149414, "Full-pretrain/Loss (Raw)": 2.0801453590393066, "Full-pretrain/Step": 1784, "Full-pretrain/Step Time": 17.592918634414673} +{"Full-pretrain/Learning Rate": 4.6829492485994756e-05, "Full-pretrain/Loss": 2.024064302444458, "Full-pretrain/Loss (Raw)": 2.05310320854187, "Full-pretrain/Step": 1785, "Full-pretrain/Step Time": 17.598088279366493} +{"Full-pretrain/Learning Rate": 4.6825352829029705e-05, "Full-pretrain/Loss": 2.0266497135162354, "Full-pretrain/Loss (Raw)": 2.0553135871887207, "Full-pretrain/Step": 1786, "Full-pretrain/Step Time": 17.595087492838502} +{"Full-pretrain/Learning Rate": 4.6821210654517875e-05, "Full-pretrain/Loss": 2.0283477306365967, "Full-pretrain/Loss (Raw)": 1.9477909803390503, "Full-pretrain/Step": 1787, "Full-pretrain/Step Time": 17.590941237285733} +{"Full-pretrain/Learning Rate": 4.681706596293707e-05, "Full-pretrain/Loss": 2.0276408195495605, "Full-pretrain/Loss (Raw)": 1.9941240549087524, "Full-pretrain/Step": 1788, "Full-pretrain/Step Time": 17.588595425710082} +{"Full-pretrain/Learning Rate": 4.681291875476537e-05, "Full-pretrain/Loss": 2.028139114379883, "Full-pretrain/Loss (Raw)": 2.037753105163574, "Full-pretrain/Step": 1789, "Full-pretrain/Step Time": 17.596567878499627} +{"Full-pretrain/Learning Rate": 4.680876903048115e-05, "Full-pretrain/Loss": 2.02839994430542, "Full-pretrain/Loss (Raw)": 2.0435898303985596, "Full-pretrain/Step": 1790, "Full-pretrain/Step Time": 17.5944387819618} +{"Full-pretrain/Learning Rate": 4.6804616790563097e-05, "Full-pretrain/Loss": 2.027414321899414, "Full-pretrain/Loss (Raw)": 2.1812546253204346, "Full-pretrain/Step": 1791, "Full-pretrain/Step Time": 17.589574912562966} +{"Full-pretrain/Learning Rate": 4.6800462035490155e-05, "Full-pretrain/Loss": 2.030392646789551, "Full-pretrain/Loss (Raw)": 2.1850152015686035, "Full-pretrain/Step": 1792, "Full-pretrain/Step Time": 17.594155717641115} +{"Full-pretrain/Learning Rate": 4.6796304765741585e-05, "Full-pretrain/Loss": 2.0338377952575684, "Full-pretrain/Loss (Raw)": 2.1020264625549316, "Full-pretrain/Step": 1793, "Full-pretrain/Step Time": 17.597925037145615} +{"Full-pretrain/Learning Rate": 4.679214498179691e-05, "Full-pretrain/Loss": 2.029325008392334, "Full-pretrain/Loss (Raw)": 1.927522897720337, "Full-pretrain/Step": 1794, "Full-pretrain/Step Time": 17.595880307257175} +{"Full-pretrain/Learning Rate": 4.678798268413597e-05, "Full-pretrain/Loss": 2.0348784923553467, "Full-pretrain/Loss (Raw)": 2.175631046295166, "Full-pretrain/Step": 1795, "Full-pretrain/Step Time": 17.593108035624027} +{"Full-pretrain/Learning Rate": 4.678381787323889e-05, "Full-pretrain/Loss": 2.0190038681030273, "Full-pretrain/Loss (Raw)": 1.4742374420166016, "Full-pretrain/Step": 1796, "Full-pretrain/Step Time": 17.59369750879705} +{"Full-pretrain/Learning Rate": 4.677965054958607e-05, "Full-pretrain/Loss": 2.01589298248291, "Full-pretrain/Loss (Raw)": 1.8560549020767212, "Full-pretrain/Step": 1797, "Full-pretrain/Step Time": 17.603258907794952} +{"Full-pretrain/Learning Rate": 4.6775480713658216e-05, "Full-pretrain/Loss": 2.023883819580078, "Full-pretrain/Loss (Raw)": 2.123668909072876, "Full-pretrain/Step": 1798, "Full-pretrain/Step Time": 17.59839321114123} +{"Full-pretrain/Learning Rate": 4.677130836593632e-05, "Full-pretrain/Loss": 2.031736135482788, "Full-pretrain/Loss (Raw)": 2.0483131408691406, "Full-pretrain/Step": 1799, "Full-pretrain/Step Time": 17.59665391407907} +{"Full-pretrain/Learning Rate": 4.676713350690164e-05, "Full-pretrain/Loss": 2.019618034362793, "Full-pretrain/Loss (Raw)": 1.728432059288025, "Full-pretrain/Step": 1800, "Full-pretrain/Step Time": 17.601952612400055} +{"Full-pretrain/Learning Rate": 4.6762956137035774e-05, "Full-pretrain/Loss": 2.0120689868927, "Full-pretrain/Loss (Raw)": 1.8576042652130127, "Full-pretrain/Step": 1801, "Full-pretrain/Step Time": 17.598333910107613} +{"Full-pretrain/Learning Rate": 4.675877625682055e-05, "Full-pretrain/Loss": 2.024625778198242, "Full-pretrain/Loss (Raw)": 2.3524529933929443, "Full-pretrain/Step": 1802, "Full-pretrain/Step Time": 17.5956314727664} +{"Full-pretrain/Learning Rate": 4.675459386673815e-05, "Full-pretrain/Loss": 2.0231618881225586, "Full-pretrain/Loss (Raw)": 2.0939583778381348, "Full-pretrain/Step": 1803, "Full-pretrain/Step Time": 17.591122414916754} +{"Full-pretrain/Learning Rate": 4.6750408967270976e-05, "Full-pretrain/Loss": 2.0117387771606445, "Full-pretrain/Loss (Raw)": 1.7676661014556885, "Full-pretrain/Step": 1804, "Full-pretrain/Step Time": 17.598280627280474} +{"Full-pretrain/Learning Rate": 4.674622155890178e-05, "Full-pretrain/Loss": 2.013014078140259, "Full-pretrain/Loss (Raw)": 1.9308946132659912, "Full-pretrain/Step": 1805, "Full-pretrain/Step Time": 17.60342837125063} +{"Full-pretrain/Learning Rate": 4.674203164211357e-05, "Full-pretrain/Loss": 2.0154120922088623, "Full-pretrain/Loss (Raw)": 2.2713589668273926, "Full-pretrain/Step": 1806, "Full-pretrain/Step Time": 17.597325341776013} +{"Full-pretrain/Learning Rate": 4.673783921738964e-05, "Full-pretrain/Loss": 2.0182077884674072, "Full-pretrain/Loss (Raw)": 2.031947135925293, "Full-pretrain/Step": 1807, "Full-pretrain/Step Time": 17.59197629801929} +{"Full-pretrain/Learning Rate": 4.673364428521361e-05, "Full-pretrain/Loss": 2.0119245052337646, "Full-pretrain/Loss (Raw)": 1.9208266735076904, "Full-pretrain/Step": 1808, "Full-pretrain/Step Time": 17.59405128657818} +{"Full-pretrain/Learning Rate": 4.672944684606934e-05, "Full-pretrain/Loss": 2.0140230655670166, "Full-pretrain/Loss (Raw)": 2.060305595397949, "Full-pretrain/Step": 1809, "Full-pretrain/Step Time": 17.599965326488018} +{"Full-pretrain/Learning Rate": 4.672524690044102e-05, "Full-pretrain/Loss": 2.016069173812866, "Full-pretrain/Loss (Raw)": 2.1674742698669434, "Full-pretrain/Step": 1810, "Full-pretrain/Step Time": 17.598740324378014} +{"Full-pretrain/Learning Rate": 4.67210444488131e-05, "Full-pretrain/Loss": 2.0182251930236816, "Full-pretrain/Loss (Raw)": 2.214972496032715, "Full-pretrain/Step": 1811, "Full-pretrain/Step Time": 17.600194916129112} +{"Full-pretrain/Learning Rate": 4.671683949167034e-05, "Full-pretrain/Loss": 2.033273696899414, "Full-pretrain/Loss (Raw)": 2.30171537399292, "Full-pretrain/Step": 1812, "Full-pretrain/Step Time": 17.60545409657061} +{"Full-pretrain/Learning Rate": 4.6712632029497765e-05, "Full-pretrain/Loss": 2.0257296562194824, "Full-pretrain/Loss (Raw)": 1.8972094058990479, "Full-pretrain/Step": 1813, "Full-pretrain/Step Time": 17.60334763675928} +{"Full-pretrain/Learning Rate": 4.670842206278073e-05, "Full-pretrain/Loss": 2.0287587642669678, "Full-pretrain/Loss (Raw)": 2.095958948135376, "Full-pretrain/Step": 1814, "Full-pretrain/Step Time": 17.59883321635425} +{"Full-pretrain/Learning Rate": 4.6704209592004836e-05, "Full-pretrain/Loss": 2.030555248260498, "Full-pretrain/Loss (Raw)": 1.9994462728500366, "Full-pretrain/Step": 1815, "Full-pretrain/Step Time": 17.598316054791212} +{"Full-pretrain/Learning Rate": 4.6699994617655985e-05, "Full-pretrain/Loss": 2.0364437103271484, "Full-pretrain/Loss (Raw)": 2.2685723304748535, "Full-pretrain/Step": 1816, "Full-pretrain/Step Time": 17.599312415346503} +{"Full-pretrain/Learning Rate": 4.669577714022039e-05, "Full-pretrain/Loss": 2.029430389404297, "Full-pretrain/Loss (Raw)": 1.8286832571029663, "Full-pretrain/Step": 1817, "Full-pretrain/Step Time": 17.603524785488844} +{"Full-pretrain/Learning Rate": 4.6691557160184516e-05, "Full-pretrain/Loss": 2.0313024520874023, "Full-pretrain/Loss (Raw)": 2.115219831466675, "Full-pretrain/Step": 1818, "Full-pretrain/Step Time": 17.60438352636993} +{"Full-pretrain/Learning Rate": 4.668733467803515e-05, "Full-pretrain/Loss": 2.0320608615875244, "Full-pretrain/Loss (Raw)": 1.972057580947876, "Full-pretrain/Step": 1819, "Full-pretrain/Step Time": 17.60603410936892} +{"Full-pretrain/Learning Rate": 4.668310969425935e-05, "Full-pretrain/Loss": 2.0398173332214355, "Full-pretrain/Loss (Raw)": 2.2423291206359863, "Full-pretrain/Step": 1820, "Full-pretrain/Step Time": 17.602869473397732} +{"Full-pretrain/Learning Rate": 4.667888220934448e-05, "Full-pretrain/Loss": 2.0349292755126953, "Full-pretrain/Loss (Raw)": 1.8813376426696777, "Full-pretrain/Step": 1821, "Full-pretrain/Step Time": 17.611316449940205} +{"Full-pretrain/Learning Rate": 4.667465222377815e-05, "Full-pretrain/Loss": 2.035101890563965, "Full-pretrain/Loss (Raw)": 2.0491127967834473, "Full-pretrain/Step": 1822, "Full-pretrain/Step Time": 17.61071522347629} +{"Full-pretrain/Learning Rate": 4.667041973804831e-05, "Full-pretrain/Loss": 2.0274901390075684, "Full-pretrain/Loss (Raw)": 1.937673568725586, "Full-pretrain/Step": 1823, "Full-pretrain/Step Time": 17.60132555104792} +{"Full-pretrain/Learning Rate": 4.666618475264316e-05, "Full-pretrain/Loss": 2.0110561847686768, "Full-pretrain/Loss (Raw)": 1.6591367721557617, "Full-pretrain/Step": 1824, "Full-pretrain/Step Time": 17.611546816304326} +{"Full-pretrain/Learning Rate": 4.666194726805122e-05, "Full-pretrain/Loss": 2.0057334899902344, "Full-pretrain/Loss (Raw)": 1.9316980838775635, "Full-pretrain/Step": 1825, "Full-pretrain/Step Time": 17.6093358527869} +{"Full-pretrain/Learning Rate": 4.6657707284761274e-05, "Full-pretrain/Loss": 2.009321928024292, "Full-pretrain/Loss (Raw)": 2.0423524379730225, "Full-pretrain/Step": 1826, "Full-pretrain/Step Time": 17.603041550144553} +{"Full-pretrain/Learning Rate": 4.665346480326241e-05, "Full-pretrain/Loss": 2.0044546127319336, "Full-pretrain/Loss (Raw)": 2.019878625869751, "Full-pretrain/Step": 1827, "Full-pretrain/Step Time": 17.600824385881424} +{"Full-pretrain/Learning Rate": 4.664921982404399e-05, "Full-pretrain/Loss": 2.016822576522827, "Full-pretrain/Loss (Raw)": 1.8700124025344849, "Full-pretrain/Step": 1828, "Full-pretrain/Step Time": 17.604655468836427} +{"Full-pretrain/Learning Rate": 4.664497234759566e-05, "Full-pretrain/Loss": 2.0257911682128906, "Full-pretrain/Loss (Raw)": 2.1430435180664062, "Full-pretrain/Step": 1829, "Full-pretrain/Step Time": 17.604202050715685} +{"Full-pretrain/Learning Rate": 4.664072237440739e-05, "Full-pretrain/Loss": 2.015692710876465, "Full-pretrain/Loss (Raw)": 1.8005247116088867, "Full-pretrain/Step": 1830, "Full-pretrain/Step Time": 17.601830706000328} +{"Full-pretrain/Learning Rate": 4.6636469904969386e-05, "Full-pretrain/Loss": 2.029792547225952, "Full-pretrain/Loss (Raw)": 2.4995009899139404, "Full-pretrain/Step": 1831, "Full-pretrain/Step Time": 17.609246691688895} +{"Full-pretrain/Learning Rate": 4.663221493977219e-05, "Full-pretrain/Loss": 2.0420618057250977, "Full-pretrain/Loss (Raw)": 2.1210551261901855, "Full-pretrain/Step": 1832, "Full-pretrain/Step Time": 17.60710589773953} +{"Full-pretrain/Learning Rate": 4.66279574793066e-05, "Full-pretrain/Loss": 2.0481796264648438, "Full-pretrain/Loss (Raw)": 2.0533745288848877, "Full-pretrain/Step": 1833, "Full-pretrain/Step Time": 17.610493579879403} +{"Full-pretrain/Learning Rate": 4.6623697524063713e-05, "Full-pretrain/Loss": 2.0357861518859863, "Full-pretrain/Loss (Raw)": 1.9558571577072144, "Full-pretrain/Step": 1834, "Full-pretrain/Step Time": 17.606136709451675} +{"Full-pretrain/Learning Rate": 4.661943507453492e-05, "Full-pretrain/Loss": 2.032745599746704, "Full-pretrain/Loss (Raw)": 1.9966622591018677, "Full-pretrain/Step": 1835, "Full-pretrain/Step Time": 17.610070506110787} +{"Full-pretrain/Learning Rate": 4.661517013121189e-05, "Full-pretrain/Loss": 2.0491104125976562, "Full-pretrain/Loss (Raw)": 2.2913451194763184, "Full-pretrain/Step": 1836, "Full-pretrain/Step Time": 17.606861975044012} +{"Full-pretrain/Learning Rate": 4.6610902694586576e-05, "Full-pretrain/Loss": 2.0494024753570557, "Full-pretrain/Loss (Raw)": 1.9402384757995605, "Full-pretrain/Step": 1837, "Full-pretrain/Step Time": 17.605120366439223} +{"Full-pretrain/Learning Rate": 4.660663276515124e-05, "Full-pretrain/Loss": 2.0421929359436035, "Full-pretrain/Loss (Raw)": 2.0406501293182373, "Full-pretrain/Step": 1838, "Full-pretrain/Step Time": 17.602639144286513} +{"Full-pretrain/Learning Rate": 4.66023603433984e-05, "Full-pretrain/Loss": 2.0425076484680176, "Full-pretrain/Loss (Raw)": 2.042026996612549, "Full-pretrain/Step": 1839, "Full-pretrain/Step Time": 17.6017857901752} +{"Full-pretrain/Learning Rate": 4.659808542982088e-05, "Full-pretrain/Loss": 2.049031972885132, "Full-pretrain/Loss (Raw)": 2.129598617553711, "Full-pretrain/Step": 1840, "Full-pretrain/Step Time": 17.60699287429452} +{"Full-pretrain/Learning Rate": 4.659380802491181e-05, "Full-pretrain/Loss": 2.041398286819458, "Full-pretrain/Loss (Raw)": 1.8160303831100464, "Full-pretrain/Step": 1841, "Full-pretrain/Step Time": 17.60412277467549} +{"Full-pretrain/Learning Rate": 4.6589528129164564e-05, "Full-pretrain/Loss": 2.0399086475372314, "Full-pretrain/Loss (Raw)": 2.1198008060455322, "Full-pretrain/Step": 1842, "Full-pretrain/Step Time": 17.60430376790464} +{"Full-pretrain/Learning Rate": 4.658524574307284e-05, "Full-pretrain/Loss": 2.036804676055908, "Full-pretrain/Loss (Raw)": 2.115643262863159, "Full-pretrain/Step": 1843, "Full-pretrain/Step Time": 17.600261295214295} +{"Full-pretrain/Learning Rate": 4.6580960867130604e-05, "Full-pretrain/Loss": 2.0265841484069824, "Full-pretrain/Loss (Raw)": 1.9746652841567993, "Full-pretrain/Step": 1844, "Full-pretrain/Step Time": 17.600057426840067} +{"Full-pretrain/Learning Rate": 4.6576673501832114e-05, "Full-pretrain/Loss": 2.025439500808716, "Full-pretrain/Loss (Raw)": 1.860581398010254, "Full-pretrain/Step": 1845, "Full-pretrain/Step Time": 17.59861167706549} +{"Full-pretrain/Learning Rate": 4.6572383647671913e-05, "Full-pretrain/Loss": 2.0212600231170654, "Full-pretrain/Loss (Raw)": 1.9622114896774292, "Full-pretrain/Step": 1846, "Full-pretrain/Step Time": 17.5936049092561} +{"Full-pretrain/Learning Rate": 4.6568091305144853e-05, "Full-pretrain/Loss": 2.023366928100586, "Full-pretrain/Loss (Raw)": 2.066863536834717, "Full-pretrain/Step": 1847, "Full-pretrain/Step Time": 17.5970279853791} +{"Full-pretrain/Learning Rate": 4.656379647474603e-05, "Full-pretrain/Loss": 2.022284746170044, "Full-pretrain/Loss (Raw)": 2.233943462371826, "Full-pretrain/Step": 1848, "Full-pretrain/Step Time": 17.595280358567834} +{"Full-pretrain/Learning Rate": 4.655949915697086e-05, "Full-pretrain/Loss": 2.027825117111206, "Full-pretrain/Loss (Raw)": 2.005978584289551, "Full-pretrain/Step": 1849, "Full-pretrain/Step Time": 17.595809765160084} +{"Full-pretrain/Learning Rate": 4.655519935231505e-05, "Full-pretrain/Loss": 2.022955894470215, "Full-pretrain/Loss (Raw)": 1.9594022035598755, "Full-pretrain/Step": 1850, "Full-pretrain/Step Time": 17.594547586515546} +{"Full-pretrain/Learning Rate": 4.655089706127456e-05, "Full-pretrain/Loss": 2.0245301723480225, "Full-pretrain/Loss (Raw)": 2.0224359035491943, "Full-pretrain/Step": 1851, "Full-pretrain/Step Time": 17.591914365068078} +{"Full-pretrain/Learning Rate": 4.654659228434567e-05, "Full-pretrain/Loss": 2.020620822906494, "Full-pretrain/Loss (Raw)": 2.11722731590271, "Full-pretrain/Step": 1852, "Full-pretrain/Step Time": 17.598964799195528} +{"Full-pretrain/Learning Rate": 4.654228502202493e-05, "Full-pretrain/Loss": 2.032475709915161, "Full-pretrain/Loss (Raw)": 2.260695219039917, "Full-pretrain/Step": 1853, "Full-pretrain/Step Time": 17.59569402039051} +{"Full-pretrain/Learning Rate": 4.6537975274809186e-05, "Full-pretrain/Loss": 2.034085750579834, "Full-pretrain/Loss (Raw)": 2.100630044937134, "Full-pretrain/Step": 1854, "Full-pretrain/Step Time": 17.596130955964327} +{"Full-pretrain/Learning Rate": 4.653366304319556e-05, "Full-pretrain/Loss": 2.036665439605713, "Full-pretrain/Loss (Raw)": 2.0202322006225586, "Full-pretrain/Step": 1855, "Full-pretrain/Step Time": 17.594649862498045} +{"Full-pretrain/Learning Rate": 4.652934832768148e-05, "Full-pretrain/Loss": 2.0594494342803955, "Full-pretrain/Loss (Raw)": 2.388218402862549, "Full-pretrain/Step": 1856, "Full-pretrain/Step Time": 17.595753768458962} +{"Full-pretrain/Learning Rate": 4.652503112876463e-05, "Full-pretrain/Loss": 2.064891815185547, "Full-pretrain/Loss (Raw)": 2.105855703353882, "Full-pretrain/Step": 1857, "Full-pretrain/Step Time": 17.594185823574662} +{"Full-pretrain/Learning Rate": 4.6520711446943e-05, "Full-pretrain/Loss": 2.0591862201690674, "Full-pretrain/Loss (Raw)": 1.8597722053527832, "Full-pretrain/Step": 1858, "Full-pretrain/Step Time": 17.600784208625555} +{"Full-pretrain/Learning Rate": 4.651638928271487e-05, "Full-pretrain/Loss": 2.0579564571380615, "Full-pretrain/Loss (Raw)": 1.9805283546447754, "Full-pretrain/Step": 1859, "Full-pretrain/Step Time": 17.599614540115} +{"Full-pretrain/Learning Rate": 4.65120646365788e-05, "Full-pretrain/Loss": 2.063418388366699, "Full-pretrain/Loss (Raw)": 2.0447919368743896, "Full-pretrain/Step": 1860, "Full-pretrain/Step Time": 17.589410038664937} +{"Full-pretrain/Learning Rate": 4.650773750903363e-05, "Full-pretrain/Loss": 2.0623278617858887, "Full-pretrain/Loss (Raw)": 2.1081464290618896, "Full-pretrain/Step": 1861, "Full-pretrain/Step Time": 17.599096285179257} +{"Full-pretrain/Learning Rate": 4.65034079005785e-05, "Full-pretrain/Loss": 2.063011884689331, "Full-pretrain/Loss (Raw)": 1.822417974472046, "Full-pretrain/Step": 1862, "Full-pretrain/Step Time": 17.597404956817627} +{"Full-pretrain/Learning Rate": 4.649907581171282e-05, "Full-pretrain/Loss": 2.0524094104766846, "Full-pretrain/Loss (Raw)": 2.160217761993408, "Full-pretrain/Step": 1863, "Full-pretrain/Step Time": 17.59431365504861} +{"Full-pretrain/Learning Rate": 4.64947412429363e-05, "Full-pretrain/Loss": 2.0515189170837402, "Full-pretrain/Loss (Raw)": 2.0925631523132324, "Full-pretrain/Step": 1864, "Full-pretrain/Step Time": 17.596150632947683} +{"Full-pretrain/Learning Rate": 4.6490404194748937e-05, "Full-pretrain/Loss": 2.053966522216797, "Full-pretrain/Loss (Raw)": 2.1316919326782227, "Full-pretrain/Step": 1865, "Full-pretrain/Step Time": 17.598657181486487} +{"Full-pretrain/Learning Rate": 4.6486064667651003e-05, "Full-pretrain/Loss": 2.054328441619873, "Full-pretrain/Loss (Raw)": 1.9674495458602905, "Full-pretrain/Step": 1866, "Full-pretrain/Step Time": 17.597702896222472} +{"Full-pretrain/Learning Rate": 4.6481722662143056e-05, "Full-pretrain/Loss": 2.0585880279541016, "Full-pretrain/Loss (Raw)": 2.132964611053467, "Full-pretrain/Step": 1867, "Full-pretrain/Step Time": 17.593811471015215} +{"Full-pretrain/Learning Rate": 4.6477378178725954e-05, "Full-pretrain/Loss": 2.0488333702087402, "Full-pretrain/Loss (Raw)": 1.97919499874115, "Full-pretrain/Step": 1868, "Full-pretrain/Step Time": 17.593251653015614} +{"Full-pretrain/Learning Rate": 4.647303121790082e-05, "Full-pretrain/Loss": 2.049555540084839, "Full-pretrain/Loss (Raw)": 1.9633442163467407, "Full-pretrain/Step": 1869, "Full-pretrain/Step Time": 17.5984999332577} +{"Full-pretrain/Learning Rate": 4.646868178016909e-05, "Full-pretrain/Loss": 2.0561137199401855, "Full-pretrain/Loss (Raw)": 2.2505149841308594, "Full-pretrain/Step": 1870, "Full-pretrain/Step Time": 17.597205199301243} +{"Full-pretrain/Learning Rate": 4.646432986603245e-05, "Full-pretrain/Loss": 2.0574355125427246, "Full-pretrain/Loss (Raw)": 2.0843276977539062, "Full-pretrain/Step": 1871, "Full-pretrain/Step Time": 17.595587711781263} +{"Full-pretrain/Learning Rate": 4.645997547599292e-05, "Full-pretrain/Loss": 2.048316478729248, "Full-pretrain/Loss (Raw)": 1.8377928733825684, "Full-pretrain/Step": 1872, "Full-pretrain/Step Time": 17.596794970333576} +{"Full-pretrain/Learning Rate": 4.6455618610552745e-05, "Full-pretrain/Loss": 2.049473524093628, "Full-pretrain/Loss (Raw)": 1.8530523777008057, "Full-pretrain/Step": 1873, "Full-pretrain/Step Time": 17.595706349238753} +{"Full-pretrain/Learning Rate": 4.645125927021451e-05, "Full-pretrain/Loss": 2.0497303009033203, "Full-pretrain/Loss (Raw)": 2.1280155181884766, "Full-pretrain/Step": 1874, "Full-pretrain/Step Time": 17.598511569201946} +{"Full-pretrain/Learning Rate": 4.6446897455481053e-05, "Full-pretrain/Loss": 2.052544116973877, "Full-pretrain/Loss (Raw)": 2.2056894302368164, "Full-pretrain/Step": 1875, "Full-pretrain/Step Time": 17.594577150419354} +{"Full-pretrain/Learning Rate": 4.6442533166855514e-05, "Full-pretrain/Loss": 2.0545599460601807, "Full-pretrain/Loss (Raw)": 2.0391671657562256, "Full-pretrain/Step": 1876, "Full-pretrain/Step Time": 17.592151084914804} +{"Full-pretrain/Learning Rate": 4.643816640484131e-05, "Full-pretrain/Loss": 2.0602004528045654, "Full-pretrain/Loss (Raw)": 2.041078805923462, "Full-pretrain/Step": 1877, "Full-pretrain/Step Time": 17.598291784524918} +{"Full-pretrain/Learning Rate": 4.643379716994214e-05, "Full-pretrain/Loss": 2.058194875717163, "Full-pretrain/Loss (Raw)": 1.8980331420898438, "Full-pretrain/Step": 1878, "Full-pretrain/Step Time": 17.59449521638453} +{"Full-pretrain/Learning Rate": 4.6429425462662e-05, "Full-pretrain/Loss": 2.0622329711914062, "Full-pretrain/Loss (Raw)": 2.196077346801758, "Full-pretrain/Step": 1879, "Full-pretrain/Step Time": 17.602336240932345} +{"Full-pretrain/Learning Rate": 4.642505128350517e-05, "Full-pretrain/Loss": 2.052356481552124, "Full-pretrain/Loss (Raw)": 1.9178963899612427, "Full-pretrain/Step": 1880, "Full-pretrain/Step Time": 17.599111976101995} +{"Full-pretrain/Learning Rate": 4.6420674632976205e-05, "Full-pretrain/Loss": 2.057997226715088, "Full-pretrain/Loss (Raw)": 2.1864829063415527, "Full-pretrain/Step": 1881, "Full-pretrain/Step Time": 17.598049845546484} +{"Full-pretrain/Learning Rate": 4.6416295511579946e-05, "Full-pretrain/Loss": 2.0691676139831543, "Full-pretrain/Loss (Raw)": 2.316864013671875, "Full-pretrain/Step": 1882, "Full-pretrain/Step Time": 17.60586299933493} +{"Full-pretrain/Learning Rate": 4.641191391982152e-05, "Full-pretrain/Loss": 2.0624618530273438, "Full-pretrain/Loss (Raw)": 1.8078407049179077, "Full-pretrain/Step": 1883, "Full-pretrain/Step Time": 17.600525826215744} +{"Full-pretrain/Learning Rate": 4.6407529858206354e-05, "Full-pretrain/Loss": 2.0635948181152344, "Full-pretrain/Loss (Raw)": 2.1534829139709473, "Full-pretrain/Step": 1884, "Full-pretrain/Step Time": 17.599775940179825} +{"Full-pretrain/Learning Rate": 4.640314332724014e-05, "Full-pretrain/Loss": 2.055786371231079, "Full-pretrain/Loss (Raw)": 2.010828971862793, "Full-pretrain/Step": 1885, "Full-pretrain/Step Time": 17.605407377704978} +{"Full-pretrain/Learning Rate": 4.639875432742886e-05, "Full-pretrain/Loss": 2.054687976837158, "Full-pretrain/Loss (Raw)": 2.0654749870300293, "Full-pretrain/Step": 1886, "Full-pretrain/Step Time": 17.60456982627511} +{"Full-pretrain/Learning Rate": 4.6394362859278794e-05, "Full-pretrain/Loss": 2.0522336959838867, "Full-pretrain/Loss (Raw)": 1.9416966438293457, "Full-pretrain/Step": 1887, "Full-pretrain/Step Time": 17.59797379001975} +{"Full-pretrain/Learning Rate": 4.6389968923296494e-05, "Full-pretrain/Loss": 2.0372681617736816, "Full-pretrain/Loss (Raw)": 1.909325361251831, "Full-pretrain/Step": 1888, "Full-pretrain/Step Time": 17.5994104295969} +{"Full-pretrain/Learning Rate": 4.63855725199888e-05, "Full-pretrain/Loss": 2.0374505519866943, "Full-pretrain/Loss (Raw)": 2.111691474914551, "Full-pretrain/Step": 1889, "Full-pretrain/Step Time": 17.60174976848066} +{"Full-pretrain/Learning Rate": 4.638117364986282e-05, "Full-pretrain/Loss": 2.0376439094543457, "Full-pretrain/Loss (Raw)": 1.8659567832946777, "Full-pretrain/Step": 1890, "Full-pretrain/Step Time": 17.606460742652416} +{"Full-pretrain/Learning Rate": 4.637677231342598e-05, "Full-pretrain/Loss": 2.0317251682281494, "Full-pretrain/Loss (Raw)": 1.7911304235458374, "Full-pretrain/Step": 1891, "Full-pretrain/Step Time": 17.598935890942812} +{"Full-pretrain/Learning Rate": 4.637236851118595e-05, "Full-pretrain/Loss": 2.0352301597595215, "Full-pretrain/Loss (Raw)": 2.156956195831299, "Full-pretrain/Step": 1892, "Full-pretrain/Step Time": 17.602175787091255} +{"Full-pretrain/Learning Rate": 4.6367962243650745e-05, "Full-pretrain/Loss": 2.03256893157959, "Full-pretrain/Loss (Raw)": 2.022979259490967, "Full-pretrain/Step": 1893, "Full-pretrain/Step Time": 17.606268694624305} +{"Full-pretrain/Learning Rate": 4.636355351132859e-05, "Full-pretrain/Loss": 2.040616750717163, "Full-pretrain/Loss (Raw)": 2.0799484252929688, "Full-pretrain/Step": 1894, "Full-pretrain/Step Time": 17.607155302539468} +{"Full-pretrain/Learning Rate": 4.635914231472805e-05, "Full-pretrain/Loss": 2.0350799560546875, "Full-pretrain/Loss (Raw)": 1.9830409288406372, "Full-pretrain/Step": 1895, "Full-pretrain/Step Time": 17.605836840346456} +{"Full-pretrain/Learning Rate": 4.635472865435795e-05, "Full-pretrain/Loss": 2.0284247398376465, "Full-pretrain/Loss (Raw)": 1.879602074623108, "Full-pretrain/Step": 1896, "Full-pretrain/Step Time": 17.606248136609793} +{"Full-pretrain/Learning Rate": 4.63503125307274e-05, "Full-pretrain/Loss": 2.0197250843048096, "Full-pretrain/Loss (Raw)": 1.853295087814331, "Full-pretrain/Step": 1897, "Full-pretrain/Step Time": 17.6135741956532} +{"Full-pretrain/Learning Rate": 4.634589394434581e-05, "Full-pretrain/Loss": 2.0200557708740234, "Full-pretrain/Loss (Raw)": 1.9780292510986328, "Full-pretrain/Step": 1898, "Full-pretrain/Step Time": 17.609944872558117} +{"Full-pretrain/Learning Rate": 4.6341472895722854e-05, "Full-pretrain/Loss": 2.0138773918151855, "Full-pretrain/Loss (Raw)": 1.9352598190307617, "Full-pretrain/Step": 1899, "Full-pretrain/Step Time": 17.608065973967314} +{"Full-pretrain/Learning Rate": 4.6337049385368496e-05, "Full-pretrain/Loss": 2.0133895874023438, "Full-pretrain/Loss (Raw)": 1.9635910987854004, "Full-pretrain/Step": 1900, "Full-pretrain/Step Time": 17.605572225525975} +{"Full-pretrain/Learning Rate": 4.633262341379299e-05, "Full-pretrain/Loss": 2.010690689086914, "Full-pretrain/Loss (Raw)": 1.8769749402999878, "Full-pretrain/Step": 1901, "Full-pretrain/Step Time": 17.6143911331892} +{"Full-pretrain/Learning Rate": 4.632819498150688e-05, "Full-pretrain/Loss": 2.0117053985595703, "Full-pretrain/Loss (Raw)": 2.282982349395752, "Full-pretrain/Step": 1902, "Full-pretrain/Step Time": 17.611702477559447} +{"Full-pretrain/Learning Rate": 4.632376408902096e-05, "Full-pretrain/Loss": 2.01200008392334, "Full-pretrain/Loss (Raw)": 2.0937633514404297, "Full-pretrain/Step": 1903, "Full-pretrain/Step Time": 17.61013895832002} +{"Full-pretrain/Learning Rate": 4.631933073684635e-05, "Full-pretrain/Loss": 2.0156211853027344, "Full-pretrain/Loss (Raw)": 1.9536612033843994, "Full-pretrain/Step": 1904, "Full-pretrain/Step Time": 17.61305231973529} +{"Full-pretrain/Learning Rate": 4.631489492549443e-05, "Full-pretrain/Loss": 2.0303468704223633, "Full-pretrain/Loss (Raw)": 2.3242790699005127, "Full-pretrain/Step": 1905, "Full-pretrain/Step Time": 17.61069872789085} +{"Full-pretrain/Learning Rate": 4.6310456655476876e-05, "Full-pretrain/Loss": 2.0267388820648193, "Full-pretrain/Loss (Raw)": 2.012558937072754, "Full-pretrain/Step": 1906, "Full-pretrain/Step Time": 17.60501073859632} +{"Full-pretrain/Learning Rate": 4.630601592730564e-05, "Full-pretrain/Loss": 2.022796392440796, "Full-pretrain/Loss (Raw)": 2.0795352458953857, "Full-pretrain/Step": 1907, "Full-pretrain/Step Time": 17.60404135286808} +{"Full-pretrain/Learning Rate": 4.630157274149294e-05, "Full-pretrain/Loss": 2.0237114429473877, "Full-pretrain/Loss (Raw)": 2.0684456825256348, "Full-pretrain/Step": 1908, "Full-pretrain/Step Time": 17.604410706087947} +{"Full-pretrain/Learning Rate": 4.6297127098551316e-05, "Full-pretrain/Loss": 2.0273966789245605, "Full-pretrain/Loss (Raw)": 2.159005641937256, "Full-pretrain/Step": 1909, "Full-pretrain/Step Time": 17.60626882314682} +{"Full-pretrain/Learning Rate": 4.6292678998993576e-05, "Full-pretrain/Loss": 2.0294480323791504, "Full-pretrain/Loss (Raw)": 1.9636825323104858, "Full-pretrain/Step": 1910, "Full-pretrain/Step Time": 17.603317230939865} +{"Full-pretrain/Learning Rate": 4.628822844333278e-05, "Full-pretrain/Loss": 2.023305654525757, "Full-pretrain/Loss (Raw)": 1.9995150566101074, "Full-pretrain/Step": 1911, "Full-pretrain/Step Time": 17.609284391626716} +{"Full-pretrain/Learning Rate": 4.6283775432082325e-05, "Full-pretrain/Loss": 2.027865409851074, "Full-pretrain/Loss (Raw)": 2.0638160705566406, "Full-pretrain/Step": 1912, "Full-pretrain/Step Time": 17.60428519360721} +{"Full-pretrain/Learning Rate": 4.627931996575585e-05, "Full-pretrain/Loss": 2.0232839584350586, "Full-pretrain/Loss (Raw)": 2.0398738384246826, "Full-pretrain/Step": 1913, "Full-pretrain/Step Time": 17.60510751605034} +{"Full-pretrain/Learning Rate": 4.6274862044867304e-05, "Full-pretrain/Loss": 2.010796546936035, "Full-pretrain/Loss (Raw)": 1.917266607284546, "Full-pretrain/Step": 1914, "Full-pretrain/Step Time": 17.609661921858788} +{"Full-pretrain/Learning Rate": 4.627040166993089e-05, "Full-pretrain/Loss": 2.0234153270721436, "Full-pretrain/Loss (Raw)": 2.211635112762451, "Full-pretrain/Step": 1915, "Full-pretrain/Step Time": 17.611734092235565} +{"Full-pretrain/Learning Rate": 4.626593884146111e-05, "Full-pretrain/Loss": 2.021821975708008, "Full-pretrain/Loss (Raw)": 2.1024975776672363, "Full-pretrain/Step": 1916, "Full-pretrain/Step Time": 17.609452923759818} +{"Full-pretrain/Learning Rate": 4.626147355997277e-05, "Full-pretrain/Loss": 2.0241024494171143, "Full-pretrain/Loss (Raw)": 2.083808183670044, "Full-pretrain/Step": 1917, "Full-pretrain/Step Time": 17.605635849758983} +{"Full-pretrain/Learning Rate": 4.625700582598092e-05, "Full-pretrain/Loss": 2.0277795791625977, "Full-pretrain/Loss (Raw)": 2.1831417083740234, "Full-pretrain/Step": 1918, "Full-pretrain/Step Time": 17.6133500225842} +{"Full-pretrain/Learning Rate": 4.6252535640000924e-05, "Full-pretrain/Loss": 2.0375163555145264, "Full-pretrain/Loss (Raw)": 2.253272533416748, "Full-pretrain/Step": 1919, "Full-pretrain/Step Time": 17.61337055824697} +{"Full-pretrain/Learning Rate": 4.6248063002548404e-05, "Full-pretrain/Loss": 2.0381722450256348, "Full-pretrain/Loss (Raw)": 1.9303175210952759, "Full-pretrain/Step": 1920, "Full-pretrain/Step Time": 17.605459548532963} +{"Full-pretrain/Learning Rate": 4.6243587914139285e-05, "Full-pretrain/Loss": 2.032080888748169, "Full-pretrain/Loss (Raw)": 1.916765809059143, "Full-pretrain/Step": 1921, "Full-pretrain/Step Time": 17.604003040120006} +{"Full-pretrain/Learning Rate": 4.6239110375289775e-05, "Full-pretrain/Loss": 2.0350241661071777, "Full-pretrain/Loss (Raw)": 1.960141658782959, "Full-pretrain/Step": 1922, "Full-pretrain/Step Time": 17.610034188255668} +{"Full-pretrain/Learning Rate": 4.623463038651633e-05, "Full-pretrain/Loss": 2.04721999168396, "Full-pretrain/Loss (Raw)": 2.1813955307006836, "Full-pretrain/Step": 1923, "Full-pretrain/Step Time": 17.61397136375308} +{"Full-pretrain/Learning Rate": 4.623014794833574e-05, "Full-pretrain/Loss": 2.038038492202759, "Full-pretrain/Loss (Raw)": 1.8631494045257568, "Full-pretrain/Step": 1924, "Full-pretrain/Step Time": 17.609289733693004} +{"Full-pretrain/Learning Rate": 4.622566306126506e-05, "Full-pretrain/Loss": 2.0376243591308594, "Full-pretrain/Loss (Raw)": 2.0097293853759766, "Full-pretrain/Step": 1925, "Full-pretrain/Step Time": 17.602919032797217} +{"Full-pretrain/Learning Rate": 4.6221175725821586e-05, "Full-pretrain/Loss": 2.032909393310547, "Full-pretrain/Loss (Raw)": 1.929064154624939, "Full-pretrain/Step": 1926, "Full-pretrain/Step Time": 17.607891373336315} +{"Full-pretrain/Learning Rate": 4.6216685942522956e-05, "Full-pretrain/Loss": 2.0245208740234375, "Full-pretrain/Loss (Raw)": 1.7146077156066895, "Full-pretrain/Step": 1927, "Full-pretrain/Step Time": 17.60798902064562} +{"Full-pretrain/Learning Rate": 4.621219371188706e-05, "Full-pretrain/Loss": 2.0270562171936035, "Full-pretrain/Loss (Raw)": 1.9607332944869995, "Full-pretrain/Step": 1928, "Full-pretrain/Step Time": 17.604005033150315} +{"Full-pretrain/Learning Rate": 4.620769903443207e-05, "Full-pretrain/Loss": 2.034442663192749, "Full-pretrain/Loss (Raw)": 2.0896670818328857, "Full-pretrain/Step": 1929, "Full-pretrain/Step Time": 17.60641779564321} +{"Full-pretrain/Learning Rate": 4.620320191067645e-05, "Full-pretrain/Loss": 2.037313461303711, "Full-pretrain/Loss (Raw)": 2.069894313812256, "Full-pretrain/Step": 1930, "Full-pretrain/Step Time": 17.607811687514186} +{"Full-pretrain/Learning Rate": 4.619870234113894e-05, "Full-pretrain/Loss": 2.0357322692871094, "Full-pretrain/Loss (Raw)": 1.8846626281738281, "Full-pretrain/Step": 1931, "Full-pretrain/Step Time": 17.61355764977634} +{"Full-pretrain/Learning Rate": 4.619420032633857e-05, "Full-pretrain/Loss": 2.0400075912475586, "Full-pretrain/Loss (Raw)": 2.1003940105438232, "Full-pretrain/Step": 1932, "Full-pretrain/Step Time": 17.605094023048878} +{"Full-pretrain/Learning Rate": 4.6189695866794635e-05, "Full-pretrain/Loss": 2.047062397003174, "Full-pretrain/Loss (Raw)": 2.102729558944702, "Full-pretrain/Step": 1933, "Full-pretrain/Step Time": 17.606938594952226} +{"Full-pretrain/Learning Rate": 4.618518896302674e-05, "Full-pretrain/Loss": 2.0344767570495605, "Full-pretrain/Loss (Raw)": 1.880244493484497, "Full-pretrain/Step": 1934, "Full-pretrain/Step Time": 17.618612928315997} +{"Full-pretrain/Learning Rate": 4.618067961555473e-05, "Full-pretrain/Loss": 2.0264487266540527, "Full-pretrain/Loss (Raw)": 1.8368644714355469, "Full-pretrain/Step": 1935, "Full-pretrain/Step Time": 17.61797123402357} +{"Full-pretrain/Learning Rate": 4.6176167824898773e-05, "Full-pretrain/Loss": 2.0212597846984863, "Full-pretrain/Loss (Raw)": 1.7876195907592773, "Full-pretrain/Step": 1936, "Full-pretrain/Step Time": 17.610243909060955} +{"Full-pretrain/Learning Rate": 4.61716535915793e-05, "Full-pretrain/Loss": 2.0007431507110596, "Full-pretrain/Loss (Raw)": 1.667741298675537, "Full-pretrain/Step": 1937, "Full-pretrain/Step Time": 17.60977539420128} +{"Full-pretrain/Learning Rate": 4.616713691611703e-05, "Full-pretrain/Loss": 1.998815655708313, "Full-pretrain/Loss (Raw)": 1.9508839845657349, "Full-pretrain/Step": 1938, "Full-pretrain/Step Time": 17.607107285410166} +{"Full-pretrain/Learning Rate": 4.616261779903295e-05, "Full-pretrain/Loss": 1.9940683841705322, "Full-pretrain/Loss (Raw)": 1.9276213645935059, "Full-pretrain/Step": 1939, "Full-pretrain/Step Time": 17.6070042476058} +{"Full-pretrain/Learning Rate": 4.615809624084834e-05, "Full-pretrain/Loss": 1.9874536991119385, "Full-pretrain/Loss (Raw)": 1.8567757606506348, "Full-pretrain/Step": 1940, "Full-pretrain/Step Time": 17.599000995978713} +{"Full-pretrain/Learning Rate": 4.6153572242084776e-05, "Full-pretrain/Loss": 1.9858226776123047, "Full-pretrain/Loss (Raw)": 2.106816291809082, "Full-pretrain/Step": 1941, "Full-pretrain/Step Time": 17.600644301623106} +{"Full-pretrain/Learning Rate": 4.6149045803264076e-05, "Full-pretrain/Loss": 1.9827499389648438, "Full-pretrain/Loss (Raw)": 1.8653532266616821, "Full-pretrain/Step": 1942, "Full-pretrain/Step Time": 17.6015178989619} +{"Full-pretrain/Learning Rate": 4.614451692490838e-05, "Full-pretrain/Loss": 1.9743425846099854, "Full-pretrain/Loss (Raw)": 1.7304800748825073, "Full-pretrain/Step": 1943, "Full-pretrain/Step Time": 17.611134976148605} +{"Full-pretrain/Learning Rate": 4.613998560754009e-05, "Full-pretrain/Loss": 1.978695034980774, "Full-pretrain/Loss (Raw)": 2.2030904293060303, "Full-pretrain/Step": 1944, "Full-pretrain/Step Time": 17.606975998729467} +{"Full-pretrain/Learning Rate": 4.613545185168188e-05, "Full-pretrain/Loss": 1.9861905574798584, "Full-pretrain/Loss (Raw)": 2.2797369956970215, "Full-pretrain/Step": 1945, "Full-pretrain/Step Time": 17.606566317379475} +{"Full-pretrain/Learning Rate": 4.6130915657856734e-05, "Full-pretrain/Loss": 1.9801609516143799, "Full-pretrain/Loss (Raw)": 1.7243181467056274, "Full-pretrain/Step": 1946, "Full-pretrain/Step Time": 17.6092442125082} +{"Full-pretrain/Learning Rate": 4.61263770265879e-05, "Full-pretrain/Loss": 1.9701693058013916, "Full-pretrain/Loss (Raw)": 1.8918967247009277, "Full-pretrain/Step": 1947, "Full-pretrain/Step Time": 17.60855943709612} +{"Full-pretrain/Learning Rate": 4.6121835958398886e-05, "Full-pretrain/Loss": 1.9648820161819458, "Full-pretrain/Loss (Raw)": 1.9333059787750244, "Full-pretrain/Step": 1948, "Full-pretrain/Step Time": 17.609485218301415} +{"Full-pretrain/Learning Rate": 4.611729245381352e-05, "Full-pretrain/Loss": 1.967780351638794, "Full-pretrain/Loss (Raw)": 2.1765551567077637, "Full-pretrain/Step": 1949, "Full-pretrain/Step Time": 17.601535128429532} +{"Full-pretrain/Learning Rate": 4.61127465133559e-05, "Full-pretrain/Loss": 1.9544380903244019, "Full-pretrain/Loss (Raw)": 1.7561906576156616, "Full-pretrain/Step": 1950, "Full-pretrain/Step Time": 17.603464640676975} +{"Full-pretrain/Learning Rate": 4.610819813755038e-05, "Full-pretrain/Loss": 1.9512052536010742, "Full-pretrain/Loss (Raw)": 2.1498184204101562, "Full-pretrain/Step": 1951, "Full-pretrain/Step Time": 17.613988349214196} +{"Full-pretrain/Learning Rate": 4.610364732692163e-05, "Full-pretrain/Loss": 1.9560754299163818, "Full-pretrain/Loss (Raw)": 2.086167335510254, "Full-pretrain/Step": 1952, "Full-pretrain/Step Time": 17.604158656671643} +{"Full-pretrain/Learning Rate": 4.609909408199456e-05, "Full-pretrain/Loss": 1.9670593738555908, "Full-pretrain/Loss (Raw)": 2.268251895904541, "Full-pretrain/Step": 1953, "Full-pretrain/Step Time": 17.604373261332512} +{"Full-pretrain/Learning Rate": 4.609453840329442e-05, "Full-pretrain/Loss": 1.9719696044921875, "Full-pretrain/Loss (Raw)": 2.117264986038208, "Full-pretrain/Step": 1954, "Full-pretrain/Step Time": 17.606402384117246} +{"Full-pretrain/Learning Rate": 4.6089980291346685e-05, "Full-pretrain/Loss": 1.9552148580551147, "Full-pretrain/Loss (Raw)": 1.6452486515045166, "Full-pretrain/Step": 1955, "Full-pretrain/Step Time": 17.615772105753422} +{"Full-pretrain/Learning Rate": 4.608541974667714e-05, "Full-pretrain/Loss": 1.9579179286956787, "Full-pretrain/Loss (Raw)": 1.9496426582336426, "Full-pretrain/Step": 1956, "Full-pretrain/Step Time": 17.60383907146752} +{"Full-pretrain/Learning Rate": 4.608085676981183e-05, "Full-pretrain/Loss": 1.9587956666946411, "Full-pretrain/Loss (Raw)": 2.037823438644409, "Full-pretrain/Step": 1957, "Full-pretrain/Step Time": 17.600165583193302} +{"Full-pretrain/Learning Rate": 4.6076291361277096e-05, "Full-pretrain/Loss": 1.965672492980957, "Full-pretrain/Loss (Raw)": 2.1491174697875977, "Full-pretrain/Step": 1958, "Full-pretrain/Step Time": 17.606584461405873} +{"Full-pretrain/Learning Rate": 4.6071723521599566e-05, "Full-pretrain/Loss": 1.9784549474716187, "Full-pretrain/Loss (Raw)": 2.1236510276794434, "Full-pretrain/Step": 1959, "Full-pretrain/Step Time": 17.607622418552637} +{"Full-pretrain/Learning Rate": 4.606715325130613e-05, "Full-pretrain/Loss": 1.9797554016113281, "Full-pretrain/Loss (Raw)": 2.002342462539673, "Full-pretrain/Step": 1960, "Full-pretrain/Step Time": 17.601664746180177} +{"Full-pretrain/Learning Rate": 4.606258055092397e-05, "Full-pretrain/Loss": 1.9792612791061401, "Full-pretrain/Loss (Raw)": 2.073859691619873, "Full-pretrain/Step": 1961, "Full-pretrain/Step Time": 17.604242984205484} +{"Full-pretrain/Learning Rate": 4.6058005420980544e-05, "Full-pretrain/Loss": 1.983178973197937, "Full-pretrain/Loss (Raw)": 2.195255994796753, "Full-pretrain/Step": 1962, "Full-pretrain/Step Time": 17.606299608945847} +{"Full-pretrain/Learning Rate": 4.605342786200359e-05, "Full-pretrain/Loss": 1.985114336013794, "Full-pretrain/Loss (Raw)": 1.9466009140014648, "Full-pretrain/Step": 1963, "Full-pretrain/Step Time": 17.612388271838427} +{"Full-pretrain/Learning Rate": 4.6048847874521146e-05, "Full-pretrain/Loss": 1.9803473949432373, "Full-pretrain/Loss (Raw)": 1.9478461742401123, "Full-pretrain/Step": 1964, "Full-pretrain/Step Time": 17.608986135572195} +{"Full-pretrain/Learning Rate": 4.6044265459061486e-05, "Full-pretrain/Loss": 1.9798307418823242, "Full-pretrain/Loss (Raw)": 2.0861964225769043, "Full-pretrain/Step": 1965, "Full-pretrain/Step Time": 17.606041826307774} +{"Full-pretrain/Learning Rate": 4.6039680616153204e-05, "Full-pretrain/Loss": 1.985650658607483, "Full-pretrain/Loss (Raw)": 2.0664825439453125, "Full-pretrain/Step": 1966, "Full-pretrain/Step Time": 17.610518984496593} +{"Full-pretrain/Learning Rate": 4.603509334632515e-05, "Full-pretrain/Loss": 1.9945082664489746, "Full-pretrain/Loss (Raw)": 2.1203126907348633, "Full-pretrain/Step": 1967, "Full-pretrain/Step Time": 17.611297385767102} +{"Full-pretrain/Learning Rate": 4.603050365010648e-05, "Full-pretrain/Loss": 2.0028176307678223, "Full-pretrain/Loss (Raw)": 2.053520441055298, "Full-pretrain/Step": 1968, "Full-pretrain/Step Time": 17.60909701511264} +{"Full-pretrain/Learning Rate": 4.6025911528026596e-05, "Full-pretrain/Loss": 2.0215301513671875, "Full-pretrain/Loss (Raw)": 2.266533851623535, "Full-pretrain/Step": 1969, "Full-pretrain/Step Time": 17.610819164663553} +{"Full-pretrain/Learning Rate": 4.6021316980615216e-05, "Full-pretrain/Loss": 2.0288453102111816, "Full-pretrain/Loss (Raw)": 2.184967517852783, "Full-pretrain/Step": 1970, "Full-pretrain/Step Time": 17.620337937027216} +{"Full-pretrain/Learning Rate": 4.60167200084023e-05, "Full-pretrain/Loss": 2.028641939163208, "Full-pretrain/Loss (Raw)": 1.921121597290039, "Full-pretrain/Step": 1971, "Full-pretrain/Step Time": 17.618394752964377} +{"Full-pretrain/Learning Rate": 4.601212061191812e-05, "Full-pretrain/Loss": 2.0369174480438232, "Full-pretrain/Loss (Raw)": 2.121589422225952, "Full-pretrain/Step": 1972, "Full-pretrain/Step Time": 17.62274106964469} +{"Full-pretrain/Learning Rate": 4.6007518791693214e-05, "Full-pretrain/Loss": 2.035830020904541, "Full-pretrain/Loss (Raw)": 2.072014808654785, "Full-pretrain/Step": 1973, "Full-pretrain/Step Time": 17.61898011341691} +{"Full-pretrain/Learning Rate": 4.6002914548258404e-05, "Full-pretrain/Loss": 2.03759503364563, "Full-pretrain/Loss (Raw)": 1.9218330383300781, "Full-pretrain/Step": 1974, "Full-pretrain/Step Time": 17.625349931418896} +{"Full-pretrain/Learning Rate": 4.599830788214477e-05, "Full-pretrain/Loss": 2.048982620239258, "Full-pretrain/Loss (Raw)": 2.0948920249938965, "Full-pretrain/Step": 1975, "Full-pretrain/Step Time": 17.625200752168894} +{"Full-pretrain/Learning Rate": 4.599369879388371e-05, "Full-pretrain/Loss": 2.0437116622924805, "Full-pretrain/Loss (Raw)": 2.034420967102051, "Full-pretrain/Step": 1976, "Full-pretrain/Step Time": 17.628337202593684} +{"Full-pretrain/Learning Rate": 4.598908728400687e-05, "Full-pretrain/Loss": 2.038784980773926, "Full-pretrain/Loss (Raw)": 2.122076988220215, "Full-pretrain/Step": 1977, "Full-pretrain/Step Time": 17.62496922723949} +{"Full-pretrain/Learning Rate": 4.598447335304618e-05, "Full-pretrain/Loss": 2.049051523208618, "Full-pretrain/Loss (Raw)": 2.0528504848480225, "Full-pretrain/Step": 1978, "Full-pretrain/Step Time": 17.623979326337576} +{"Full-pretrain/Learning Rate": 4.597985700153387e-05, "Full-pretrain/Loss": 2.049445152282715, "Full-pretrain/Loss (Raw)": 1.904484510421753, "Full-pretrain/Step": 1979, "Full-pretrain/Step Time": 17.625482063740492} +{"Full-pretrain/Learning Rate": 4.597523823000243e-05, "Full-pretrain/Loss": 2.0493876934051514, "Full-pretrain/Loss (Raw)": 1.9314770698547363, "Full-pretrain/Step": 1980, "Full-pretrain/Step Time": 17.624773539602757} +{"Full-pretrain/Learning Rate": 4.597061703898462e-05, "Full-pretrain/Loss": 2.0520248413085938, "Full-pretrain/Loss (Raw)": 2.2609405517578125, "Full-pretrain/Step": 1981, "Full-pretrain/Step Time": 17.621148262172937} +{"Full-pretrain/Learning Rate": 4.596599342901351e-05, "Full-pretrain/Loss": 2.0612545013427734, "Full-pretrain/Loss (Raw)": 2.051541328430176, "Full-pretrain/Step": 1982, "Full-pretrain/Step Time": 17.62085377238691} +{"Full-pretrain/Learning Rate": 4.596136740062243e-05, "Full-pretrain/Loss": 2.05246639251709, "Full-pretrain/Loss (Raw)": 1.86859130859375, "Full-pretrain/Step": 1983, "Full-pretrain/Step Time": 17.626299424096942} +{"Full-pretrain/Learning Rate": 4.5956738954344985e-05, "Full-pretrain/Loss": 2.050852060317993, "Full-pretrain/Loss (Raw)": 2.0345118045806885, "Full-pretrain/Step": 1984, "Full-pretrain/Step Time": 17.62224778905511} +{"Full-pretrain/Learning Rate": 4.5952108090715066e-05, "Full-pretrain/Loss": 2.037043333053589, "Full-pretrain/Loss (Raw)": 1.8263673782348633, "Full-pretrain/Step": 1985, "Full-pretrain/Step Time": 17.62290397658944} +{"Full-pretrain/Learning Rate": 4.594747481026684e-05, "Full-pretrain/Loss": 2.0384552478790283, "Full-pretrain/Loss (Raw)": 2.162451982498169, "Full-pretrain/Step": 1986, "Full-pretrain/Step Time": 17.618814488872886} +{"Full-pretrain/Learning Rate": 4.5942839113534755e-05, "Full-pretrain/Loss": 2.042182207107544, "Full-pretrain/Loss (Raw)": 1.7645095586776733, "Full-pretrain/Step": 1987, "Full-pretrain/Step Time": 17.626476790755987} +{"Full-pretrain/Learning Rate": 4.593820100105355e-05, "Full-pretrain/Loss": 2.0400919914245605, "Full-pretrain/Loss (Raw)": 1.8827505111694336, "Full-pretrain/Step": 1988, "Full-pretrain/Step Time": 17.628689730539918} +{"Full-pretrain/Learning Rate": 4.5933560473358204e-05, "Full-pretrain/Loss": 2.045619487762451, "Full-pretrain/Loss (Raw)": 2.214707374572754, "Full-pretrain/Step": 1989, "Full-pretrain/Step Time": 17.623042032122612} +{"Full-pretrain/Learning Rate": 4.5928917530984016e-05, "Full-pretrain/Loss": 2.03983998298645, "Full-pretrain/Loss (Raw)": 1.9641783237457275, "Full-pretrain/Step": 1990, "Full-pretrain/Step Time": 17.62356771156192} +{"Full-pretrain/Learning Rate": 4.5924272174466554e-05, "Full-pretrain/Loss": 2.0389764308929443, "Full-pretrain/Loss (Raw)": 2.096017360687256, "Full-pretrain/Step": 1991, "Full-pretrain/Step Time": 17.629566621035337} +{"Full-pretrain/Learning Rate": 4.5919624404341646e-05, "Full-pretrain/Loss": 2.037320852279663, "Full-pretrain/Loss (Raw)": 1.9493616819381714, "Full-pretrain/Step": 1992, "Full-pretrain/Step Time": 17.62829070352018} +{"Full-pretrain/Learning Rate": 4.591497422114541e-05, "Full-pretrain/Loss": 2.0319838523864746, "Full-pretrain/Loss (Raw)": 1.903078317642212, "Full-pretrain/Step": 1993, "Full-pretrain/Step Time": 17.62668632529676} +{"Full-pretrain/Learning Rate": 4.591032162541425e-05, "Full-pretrain/Loss": 2.0376811027526855, "Full-pretrain/Loss (Raw)": 2.377565622329712, "Full-pretrain/Step": 1994, "Full-pretrain/Step Time": 17.627343552187085} +{"Full-pretrain/Learning Rate": 4.590566661768484e-05, "Full-pretrain/Loss": 2.038522243499756, "Full-pretrain/Loss (Raw)": 1.9735205173492432, "Full-pretrain/Step": 1995, "Full-pretrain/Step Time": 17.633202200755477} +{"Full-pretrain/Learning Rate": 4.5901009198494125e-05, "Full-pretrain/Loss": 2.04630708694458, "Full-pretrain/Loss (Raw)": 2.196955680847168, "Full-pretrain/Step": 1996, "Full-pretrain/Step Time": 17.630284192040563} +{"Full-pretrain/Learning Rate": 4.5896349368379356e-05, "Full-pretrain/Loss": 2.0476653575897217, "Full-pretrain/Loss (Raw)": 2.129666805267334, "Full-pretrain/Step": 1997, "Full-pretrain/Step Time": 17.626627111807466} +{"Full-pretrain/Learning Rate": 4.5891687127878025e-05, "Full-pretrain/Loss": 2.0483908653259277, "Full-pretrain/Loss (Raw)": 2.089695453643799, "Full-pretrain/Step": 1998, "Full-pretrain/Step Time": 17.62581213004887} +{"Full-pretrain/Learning Rate": 4.5887022477527926e-05, "Full-pretrain/Loss": 2.0507102012634277, "Full-pretrain/Loss (Raw)": 2.1945319175720215, "Full-pretrain/Step": 1999, "Full-pretrain/Step Time": 17.628055293112993} +{"Full-pretrain/Learning Rate": 4.5882355417867126e-05, "Full-pretrain/Loss": 2.049575090408325, "Full-pretrain/Loss (Raw)": 2.0171992778778076, "Full-pretrain/Step": 2000, "Full-pretrain/Step Time": 17.62418444827199} +{"Full-pretrain/Learning Rate": 4.587768594943396e-05, "Full-pretrain/Loss": 2.039371967315674, "Full-pretrain/Loss (Raw)": 1.940029263496399, "Full-pretrain/Step": 2001, "Full-pretrain/Step Time": 17.619358755648136} +{"Full-pretrain/Learning Rate": 4.587301407276707e-05, "Full-pretrain/Loss": 2.0330984592437744, "Full-pretrain/Loss (Raw)": 1.9842175245285034, "Full-pretrain/Step": 2002, "Full-pretrain/Step Time": 17.616611508652568} +{"Full-pretrain/Learning Rate": 4.5868339788405334e-05, "Full-pretrain/Loss": 2.0372323989868164, "Full-pretrain/Loss (Raw)": 2.053407669067383, "Full-pretrain/Step": 2003, "Full-pretrain/Step Time": 17.62609515711665} +{"Full-pretrain/Learning Rate": 4.586366309688793e-05, "Full-pretrain/Loss": 2.0216121673583984, "Full-pretrain/Loss (Raw)": 1.621744990348816, "Full-pretrain/Step": 2004, "Full-pretrain/Step Time": 17.62752889841795} +{"Full-pretrain/Learning Rate": 4.585898399875433e-05, "Full-pretrain/Loss": 2.0154013633728027, "Full-pretrain/Loss (Raw)": 1.8732590675354004, "Full-pretrain/Step": 2005, "Full-pretrain/Step Time": 17.6177893076092} +{"Full-pretrain/Learning Rate": 4.585430249454426e-05, "Full-pretrain/Loss": 2.0254921913146973, "Full-pretrain/Loss (Raw)": 2.244748115539551, "Full-pretrain/Step": 2006, "Full-pretrain/Step Time": 17.619698654860258} +{"Full-pretrain/Learning Rate": 4.584961858479772e-05, "Full-pretrain/Loss": 2.0216760635375977, "Full-pretrain/Loss (Raw)": 1.9727703332901, "Full-pretrain/Step": 2007, "Full-pretrain/Step Time": 17.61514980532229} +{"Full-pretrain/Learning Rate": 4.5844932270054994e-05, "Full-pretrain/Loss": 2.0282769203186035, "Full-pretrain/Loss (Raw)": 2.2456541061401367, "Full-pretrain/Step": 2008, "Full-pretrain/Step Time": 17.617514980956912} +{"Full-pretrain/Learning Rate": 4.584024355085666e-05, "Full-pretrain/Loss": 2.0247182846069336, "Full-pretrain/Loss (Raw)": 2.008192539215088, "Full-pretrain/Step": 2009, "Full-pretrain/Step Time": 17.61508548259735} +{"Full-pretrain/Learning Rate": 4.583555242774357e-05, "Full-pretrain/Loss": 2.0189199447631836, "Full-pretrain/Loss (Raw)": 1.8673090934753418, "Full-pretrain/Step": 2010, "Full-pretrain/Step Time": 17.606690855696797} +{"Full-pretrain/Learning Rate": 4.5830858901256826e-05, "Full-pretrain/Loss": 2.0185718536376953, "Full-pretrain/Loss (Raw)": 1.8933513164520264, "Full-pretrain/Step": 2011, "Full-pretrain/Step Time": 17.610147796571255} +{"Full-pretrain/Learning Rate": 4.5826162971937816e-05, "Full-pretrain/Loss": 2.0192179679870605, "Full-pretrain/Loss (Raw)": 1.9521404504776, "Full-pretrain/Step": 2012, "Full-pretrain/Step Time": 17.61377900093794} +{"Full-pretrain/Learning Rate": 4.582146464032824e-05, "Full-pretrain/Loss": 2.0122766494750977, "Full-pretrain/Loss (Raw)": 2.0388240814208984, "Full-pretrain/Step": 2013, "Full-pretrain/Step Time": 17.61043781787157} +{"Full-pretrain/Learning Rate": 4.5816763906970025e-05, "Full-pretrain/Loss": 2.012418746948242, "Full-pretrain/Loss (Raw)": 2.056086301803589, "Full-pretrain/Step": 2014, "Full-pretrain/Step Time": 17.6069321539253} +{"Full-pretrain/Learning Rate": 4.5812060772405406e-05, "Full-pretrain/Loss": 2.010284900665283, "Full-pretrain/Loss (Raw)": 1.8003084659576416, "Full-pretrain/Step": 2015, "Full-pretrain/Step Time": 17.612953396514058} +{"Full-pretrain/Learning Rate": 4.58073552371769e-05, "Full-pretrain/Loss": 2.0139429569244385, "Full-pretrain/Loss (Raw)": 2.151569366455078, "Full-pretrain/Step": 2016, "Full-pretrain/Step Time": 17.612721720710397} +{"Full-pretrain/Learning Rate": 4.580264730182727e-05, "Full-pretrain/Loss": 2.0172605514526367, "Full-pretrain/Loss (Raw)": 1.9325363636016846, "Full-pretrain/Step": 2017, "Full-pretrain/Step Time": 17.60756453871727} +{"Full-pretrain/Learning Rate": 4.57979369668996e-05, "Full-pretrain/Loss": 2.0194454193115234, "Full-pretrain/Loss (Raw)": 2.232363700866699, "Full-pretrain/Step": 2018, "Full-pretrain/Step Time": 17.60104521922767} +{"Full-pretrain/Learning Rate": 4.579322423293719e-05, "Full-pretrain/Loss": 2.026520252227783, "Full-pretrain/Loss (Raw)": 1.9909038543701172, "Full-pretrain/Step": 2019, "Full-pretrain/Step Time": 17.60657810047269} +{"Full-pretrain/Learning Rate": 4.578850910048369e-05, "Full-pretrain/Loss": 2.029026508331299, "Full-pretrain/Loss (Raw)": 1.9629504680633545, "Full-pretrain/Step": 2020, "Full-pretrain/Step Time": 17.61077619716525} +{"Full-pretrain/Learning Rate": 4.578379157008296e-05, "Full-pretrain/Loss": 2.0162856578826904, "Full-pretrain/Loss (Raw)": 1.8070032596588135, "Full-pretrain/Step": 2021, "Full-pretrain/Step Time": 17.609237536787987} +{"Full-pretrain/Learning Rate": 4.577907164227918e-05, "Full-pretrain/Loss": 2.010206937789917, "Full-pretrain/Loss (Raw)": 1.7696589231491089, "Full-pretrain/Step": 2022, "Full-pretrain/Step Time": 17.600851180031896} +{"Full-pretrain/Learning Rate": 4.577434931761679e-05, "Full-pretrain/Loss": 2.010993242263794, "Full-pretrain/Loss (Raw)": 2.1211800575256348, "Full-pretrain/Step": 2023, "Full-pretrain/Step Time": 17.59901617281139} +{"Full-pretrain/Learning Rate": 4.57696245966405e-05, "Full-pretrain/Loss": 2.018052816390991, "Full-pretrain/Loss (Raw)": 2.1752679347991943, "Full-pretrain/Step": 2024, "Full-pretrain/Step Time": 17.605186335742474} +{"Full-pretrain/Learning Rate": 4.5764897479895317e-05, "Full-pretrain/Loss": 2.0220885276794434, "Full-pretrain/Loss (Raw)": 2.0322203636169434, "Full-pretrain/Step": 2025, "Full-pretrain/Step Time": 17.600847482681274} +{"Full-pretrain/Learning Rate": 4.57601679679265e-05, "Full-pretrain/Loss": 2.0157601833343506, "Full-pretrain/Loss (Raw)": 2.175058364868164, "Full-pretrain/Step": 2026, "Full-pretrain/Step Time": 17.593271620571613} +{"Full-pretrain/Learning Rate": 4.575543606127962e-05, "Full-pretrain/Loss": 2.016648292541504, "Full-pretrain/Loss (Raw)": 2.0019404888153076, "Full-pretrain/Step": 2027, "Full-pretrain/Step Time": 17.598099576309323} +{"Full-pretrain/Learning Rate": 4.5750701760500466e-05, "Full-pretrain/Loss": 2.0105981826782227, "Full-pretrain/Loss (Raw)": 2.003350257873535, "Full-pretrain/Step": 2028, "Full-pretrain/Step Time": 17.599627980962396} +{"Full-pretrain/Learning Rate": 4.574596506613516e-05, "Full-pretrain/Loss": 2.0052871704101562, "Full-pretrain/Loss (Raw)": 1.9597097635269165, "Full-pretrain/Step": 2029, "Full-pretrain/Step Time": 17.59736029803753} +{"Full-pretrain/Learning Rate": 4.574122597873009e-05, "Full-pretrain/Loss": 2.0056498050689697, "Full-pretrain/Loss (Raw)": 2.1013026237487793, "Full-pretrain/Step": 2030, "Full-pretrain/Step Time": 17.5945728700608} +{"Full-pretrain/Learning Rate": 4.573648449883188e-05, "Full-pretrain/Loss": 2.0020174980163574, "Full-pretrain/Loss (Raw)": 2.0782976150512695, "Full-pretrain/Step": 2031, "Full-pretrain/Step Time": 17.598620615899563} +{"Full-pretrain/Learning Rate": 4.573174062698747e-05, "Full-pretrain/Loss": 1.998030185699463, "Full-pretrain/Loss (Raw)": 1.8896071910858154, "Full-pretrain/Step": 2032, "Full-pretrain/Step Time": 17.593107391148806} +{"Full-pretrain/Learning Rate": 4.572699436374407e-05, "Full-pretrain/Loss": 1.997426152229309, "Full-pretrain/Loss (Raw)": 1.9207013845443726, "Full-pretrain/Step": 2033, "Full-pretrain/Step Time": 17.595751244574785} +{"Full-pretrain/Learning Rate": 4.572224570964915e-05, "Full-pretrain/Loss": 1.9979074001312256, "Full-pretrain/Loss (Raw)": 1.9996159076690674, "Full-pretrain/Step": 2034, "Full-pretrain/Step Time": 17.588082106783986} +{"Full-pretrain/Learning Rate": 4.571749466525047e-05, "Full-pretrain/Loss": 2.000931739807129, "Full-pretrain/Loss (Raw)": 2.1501874923706055, "Full-pretrain/Step": 2035, "Full-pretrain/Step Time": 17.591157097369432} +{"Full-pretrain/Learning Rate": 4.571274123109606e-05, "Full-pretrain/Loss": 2.0225841999053955, "Full-pretrain/Loss (Raw)": 2.3146233558654785, "Full-pretrain/Step": 2036, "Full-pretrain/Step Time": 17.58619219996035} +{"Full-pretrain/Learning Rate": 4.570798540773422e-05, "Full-pretrain/Loss": 2.0222978591918945, "Full-pretrain/Loss (Raw)": 1.8640931844711304, "Full-pretrain/Step": 2037, "Full-pretrain/Step Time": 17.59151699580252} +{"Full-pretrain/Learning Rate": 4.570322719571355e-05, "Full-pretrain/Loss": 2.019474506378174, "Full-pretrain/Loss (Raw)": 2.154407024383545, "Full-pretrain/Step": 2038, "Full-pretrain/Step Time": 17.59478921443224} +{"Full-pretrain/Learning Rate": 4.56984665955829e-05, "Full-pretrain/Loss": 2.021228313446045, "Full-pretrain/Loss (Raw)": 2.028890609741211, "Full-pretrain/Step": 2039, "Full-pretrain/Step Time": 17.587732333689928} +{"Full-pretrain/Learning Rate": 4.56937036078914e-05, "Full-pretrain/Loss": 2.018564224243164, "Full-pretrain/Loss (Raw)": 2.160404682159424, "Full-pretrain/Step": 2040, "Full-pretrain/Step Time": 17.59610728546977} +{"Full-pretrain/Learning Rate": 4.568893823318846e-05, "Full-pretrain/Loss": 2.022693157196045, "Full-pretrain/Loss (Raw)": 2.140317916870117, "Full-pretrain/Step": 2041, "Full-pretrain/Step Time": 17.59481173567474} +{"Full-pretrain/Learning Rate": 4.568417047202377e-05, "Full-pretrain/Loss": 2.018930435180664, "Full-pretrain/Loss (Raw)": 1.7469021081924438, "Full-pretrain/Step": 2042, "Full-pretrain/Step Time": 17.591121261939406} +{"Full-pretrain/Learning Rate": 4.567940032494727e-05, "Full-pretrain/Loss": 2.0284085273742676, "Full-pretrain/Loss (Raw)": 2.196654796600342, "Full-pretrain/Step": 2043, "Full-pretrain/Step Time": 17.58867182955146} +{"Full-pretrain/Learning Rate": 4.5674627792509225e-05, "Full-pretrain/Loss": 2.0285356044769287, "Full-pretrain/Loss (Raw)": 1.9562015533447266, "Full-pretrain/Step": 2044, "Full-pretrain/Step Time": 17.59769356250763} +{"Full-pretrain/Learning Rate": 4.5669852875260134e-05, "Full-pretrain/Loss": 2.0299253463745117, "Full-pretrain/Loss (Raw)": 2.08329439163208, "Full-pretrain/Step": 2045, "Full-pretrain/Step Time": 17.600892866030335} +{"Full-pretrain/Learning Rate": 4.5665075573750766e-05, "Full-pretrain/Loss": 2.026258945465088, "Full-pretrain/Loss (Raw)": 1.9387668371200562, "Full-pretrain/Step": 2046, "Full-pretrain/Step Time": 17.593574080616236} +{"Full-pretrain/Learning Rate": 4.5660295888532195e-05, "Full-pretrain/Loss": 2.0382776260375977, "Full-pretrain/Loss (Raw)": 2.184906482696533, "Full-pretrain/Step": 2047, "Full-pretrain/Step Time": 17.5953357424587} +{"Full-pretrain/Learning Rate": 4.565551382015576e-05, "Full-pretrain/Loss": 2.0287318229675293, "Full-pretrain/Loss (Raw)": 1.8460993766784668, "Full-pretrain/Step": 2048, "Full-pretrain/Step Time": 17.599463468417525} +{"Full-pretrain/Learning Rate": 4.565072936917305e-05, "Full-pretrain/Loss": 2.0307326316833496, "Full-pretrain/Loss (Raw)": 1.9965672492980957, "Full-pretrain/Step": 2049, "Full-pretrain/Step Time": 17.604139108210802} +{"Full-pretrain/Learning Rate": 4.564594253613598e-05, "Full-pretrain/Loss": 2.0212454795837402, "Full-pretrain/Loss (Raw)": 1.928769588470459, "Full-pretrain/Step": 2050, "Full-pretrain/Step Time": 17.602256260812283} +{"Full-pretrain/Learning Rate": 4.564115332159668e-05, "Full-pretrain/Loss": 2.026211738586426, "Full-pretrain/Loss (Raw)": 2.14982533454895, "Full-pretrain/Step": 2051, "Full-pretrain/Step Time": 17.59931237436831} +{"Full-pretrain/Learning Rate": 4.563636172610761e-05, "Full-pretrain/Loss": 2.0314369201660156, "Full-pretrain/Loss (Raw)": 2.1301517486572266, "Full-pretrain/Step": 2052, "Full-pretrain/Step Time": 17.605486107990146} +{"Full-pretrain/Learning Rate": 4.563156775022147e-05, "Full-pretrain/Loss": 2.0505056381225586, "Full-pretrain/Loss (Raw)": 2.417205810546875, "Full-pretrain/Step": 2053, "Full-pretrain/Step Time": 17.61332576163113} +{"Full-pretrain/Learning Rate": 4.562677139449123e-05, "Full-pretrain/Loss": 2.0587189197540283, "Full-pretrain/Loss (Raw)": 2.032482147216797, "Full-pretrain/Step": 2054, "Full-pretrain/Step Time": 17.612862879410386} +{"Full-pretrain/Learning Rate": 4.562197265947016e-05, "Full-pretrain/Loss": 2.052006483078003, "Full-pretrain/Loss (Raw)": 1.906383991241455, "Full-pretrain/Step": 2055, "Full-pretrain/Step Time": 17.606416754424572} +{"Full-pretrain/Learning Rate": 4.561717154571179e-05, "Full-pretrain/Loss": 2.0419411659240723, "Full-pretrain/Loss (Raw)": 1.8531779050827026, "Full-pretrain/Step": 2056, "Full-pretrain/Step Time": 17.60862498730421} +{"Full-pretrain/Learning Rate": 4.561236805376994e-05, "Full-pretrain/Loss": 2.054619789123535, "Full-pretrain/Loss (Raw)": 2.4379358291625977, "Full-pretrain/Step": 2057, "Full-pretrain/Step Time": 17.60556080751121} +{"Full-pretrain/Learning Rate": 4.560756218419867e-05, "Full-pretrain/Loss": 2.0495715141296387, "Full-pretrain/Loss (Raw)": 2.0135159492492676, "Full-pretrain/Step": 2058, "Full-pretrain/Step Time": 17.607984675094485} +{"Full-pretrain/Learning Rate": 4.560275393755233e-05, "Full-pretrain/Loss": 2.0430469512939453, "Full-pretrain/Loss (Raw)": 1.7931472063064575, "Full-pretrain/Step": 2059, "Full-pretrain/Step Time": 17.60699470899999} +{"Full-pretrain/Learning Rate": 4.5597943314385586e-05, "Full-pretrain/Loss": 2.0434370040893555, "Full-pretrain/Loss (Raw)": 2.015840530395508, "Full-pretrain/Step": 2060, "Full-pretrain/Step Time": 17.608946518972516} +{"Full-pretrain/Learning Rate": 4.559313031525331e-05, "Full-pretrain/Loss": 2.050990343093872, "Full-pretrain/Loss (Raw)": 2.2014143466949463, "Full-pretrain/Step": 2061, "Full-pretrain/Step Time": 17.60675393603742} +{"Full-pretrain/Learning Rate": 4.558831494071069e-05, "Full-pretrain/Loss": 2.043790340423584, "Full-pretrain/Loss (Raw)": 1.870897650718689, "Full-pretrain/Step": 2062, "Full-pretrain/Step Time": 17.59914438612759} +{"Full-pretrain/Learning Rate": 4.558349719131317e-05, "Full-pretrain/Loss": 2.0419259071350098, "Full-pretrain/Loss (Raw)": 2.018639087677002, "Full-pretrain/Step": 2063, "Full-pretrain/Step Time": 17.601071901619434} +{"Full-pretrain/Learning Rate": 4.5578677067616494e-05, "Full-pretrain/Loss": 2.0428261756896973, "Full-pretrain/Loss (Raw)": 1.9184132814407349, "Full-pretrain/Step": 2064, "Full-pretrain/Step Time": 17.60128988698125} +{"Full-pretrain/Learning Rate": 4.5573854570176645e-05, "Full-pretrain/Loss": 2.0554633140563965, "Full-pretrain/Loss (Raw)": 2.325099229812622, "Full-pretrain/Step": 2065, "Full-pretrain/Step Time": 17.60189483501017} +{"Full-pretrain/Learning Rate": 4.5569029699549904e-05, "Full-pretrain/Loss": 2.0586490631103516, "Full-pretrain/Loss (Raw)": 2.101559638977051, "Full-pretrain/Step": 2066, "Full-pretrain/Step Time": 17.60237810574472} +{"Full-pretrain/Learning Rate": 4.556420245629281e-05, "Full-pretrain/Loss": 2.0508365631103516, "Full-pretrain/Loss (Raw)": 1.90017831325531, "Full-pretrain/Step": 2067, "Full-pretrain/Step Time": 17.603334590792656} +{"Full-pretrain/Learning Rate": 4.555937284096219e-05, "Full-pretrain/Loss": 2.0389292240142822, "Full-pretrain/Loss (Raw)": 1.933593511581421, "Full-pretrain/Step": 2068, "Full-pretrain/Step Time": 17.602769128978252} +{"Full-pretrain/Learning Rate": 4.555454085411514e-05, "Full-pretrain/Loss": 2.04586124420166, "Full-pretrain/Loss (Raw)": 2.0859193801879883, "Full-pretrain/Step": 2069, "Full-pretrain/Step Time": 17.603456547483802} +{"Full-pretrain/Learning Rate": 4.554970649630903e-05, "Full-pretrain/Loss": 2.039754629135132, "Full-pretrain/Loss (Raw)": 1.9589923620224, "Full-pretrain/Step": 2070, "Full-pretrain/Step Time": 17.60057906061411} +{"Full-pretrain/Learning Rate": 4.554486976810149e-05, "Full-pretrain/Loss": 2.0404744148254395, "Full-pretrain/Loss (Raw)": 2.051928997039795, "Full-pretrain/Step": 2071, "Full-pretrain/Step Time": 17.5988812148571} +{"Full-pretrain/Learning Rate": 4.554003067005045e-05, "Full-pretrain/Loss": 2.0290229320526123, "Full-pretrain/Loss (Raw)": 1.7939512729644775, "Full-pretrain/Step": 2072, "Full-pretrain/Step Time": 17.6025885976851} +{"Full-pretrain/Learning Rate": 4.553518920271408e-05, "Full-pretrain/Loss": 2.0312726497650146, "Full-pretrain/Loss (Raw)": 2.212307929992676, "Full-pretrain/Step": 2073, "Full-pretrain/Step Time": 17.60464223474264} +{"Full-pretrain/Learning Rate": 4.553034536665086e-05, "Full-pretrain/Loss": 2.027853012084961, "Full-pretrain/Loss (Raw)": 1.6374754905700684, "Full-pretrain/Step": 2074, "Full-pretrain/Step Time": 17.594194600358605} +{"Full-pretrain/Learning Rate": 4.552549916241952e-05, "Full-pretrain/Loss": 2.0211403369903564, "Full-pretrain/Loss (Raw)": 1.981850504875183, "Full-pretrain/Step": 2075, "Full-pretrain/Step Time": 17.597423635423183} +{"Full-pretrain/Learning Rate": 4.5520650590579055e-05, "Full-pretrain/Loss": 2.0261549949645996, "Full-pretrain/Loss (Raw)": 2.116666793823242, "Full-pretrain/Step": 2076, "Full-pretrain/Step Time": 17.601722905412316} +{"Full-pretrain/Learning Rate": 4.5515799651688765e-05, "Full-pretrain/Loss": 2.028759479522705, "Full-pretrain/Loss (Raw)": 2.166637420654297, "Full-pretrain/Step": 2077, "Full-pretrain/Step Time": 17.60211587511003} +{"Full-pretrain/Learning Rate": 4.5510946346308185e-05, "Full-pretrain/Loss": 2.0234262943267822, "Full-pretrain/Loss (Raw)": 1.7681057453155518, "Full-pretrain/Step": 2078, "Full-pretrain/Step Time": 17.60120291262865} +{"Full-pretrain/Learning Rate": 4.550609067499716e-05, "Full-pretrain/Loss": 2.0178489685058594, "Full-pretrain/Loss (Raw)": 2.006434440612793, "Full-pretrain/Step": 2079, "Full-pretrain/Step Time": 17.599472228437662} +{"Full-pretrain/Learning Rate": 4.550123263831578e-05, "Full-pretrain/Loss": 2.0244572162628174, "Full-pretrain/Loss (Raw)": 2.0575623512268066, "Full-pretrain/Step": 2080, "Full-pretrain/Step Time": 17.603313772007823} +{"Full-pretrain/Learning Rate": 4.549637223682441e-05, "Full-pretrain/Loss": 2.0228919982910156, "Full-pretrain/Loss (Raw)": 1.9464777708053589, "Full-pretrain/Step": 2081, "Full-pretrain/Step Time": 17.60731866210699} +{"Full-pretrain/Learning Rate": 4.5491509471083724e-05, "Full-pretrain/Loss": 2.0273325443267822, "Full-pretrain/Loss (Raw)": 2.0708656311035156, "Full-pretrain/Step": 2082, "Full-pretrain/Step Time": 17.604258209466934} +{"Full-pretrain/Learning Rate": 4.548664434165461e-05, "Full-pretrain/Loss": 2.018005847930908, "Full-pretrain/Loss (Raw)": 1.8513774871826172, "Full-pretrain/Step": 2083, "Full-pretrain/Step Time": 17.597910400480032} +{"Full-pretrain/Learning Rate": 4.5481776849098274e-05, "Full-pretrain/Loss": 2.0166015625, "Full-pretrain/Loss (Raw)": 2.0852160453796387, "Full-pretrain/Step": 2084, "Full-pretrain/Step Time": 17.603733126074076} +{"Full-pretrain/Learning Rate": 4.547690699397618e-05, "Full-pretrain/Loss": 2.006363868713379, "Full-pretrain/Loss (Raw)": 2.089595317840576, "Full-pretrain/Step": 2085, "Full-pretrain/Step Time": 17.610402032732964} +{"Full-pretrain/Learning Rate": 4.547203477685005e-05, "Full-pretrain/Loss": 2.009997844696045, "Full-pretrain/Loss (Raw)": 2.1487674713134766, "Full-pretrain/Step": 2086, "Full-pretrain/Step Time": 17.607111705467105} +{"Full-pretrain/Learning Rate": 4.546716019828191e-05, "Full-pretrain/Loss": 2.01456356048584, "Full-pretrain/Loss (Raw)": 2.0524890422821045, "Full-pretrain/Step": 2087, "Full-pretrain/Step Time": 17.60037731193006} +{"Full-pretrain/Learning Rate": 4.546228325883403e-05, "Full-pretrain/Loss": 2.020139217376709, "Full-pretrain/Loss (Raw)": 2.0316011905670166, "Full-pretrain/Step": 2088, "Full-pretrain/Step Time": 17.605965765193105} +{"Full-pretrain/Learning Rate": 4.545740395906897e-05, "Full-pretrain/Loss": 2.008500337600708, "Full-pretrain/Loss (Raw)": 2.0654890537261963, "Full-pretrain/Step": 2089, "Full-pretrain/Step Time": 17.603327563032508} +{"Full-pretrain/Learning Rate": 4.545252229954955e-05, "Full-pretrain/Loss": 2.0134482383728027, "Full-pretrain/Loss (Raw)": 2.1718502044677734, "Full-pretrain/Step": 2090, "Full-pretrain/Step Time": 17.608113583177328} +{"Full-pretrain/Learning Rate": 4.5447638280838875e-05, "Full-pretrain/Loss": 2.020203113555908, "Full-pretrain/Loss (Raw)": 2.009302854537964, "Full-pretrain/Step": 2091, "Full-pretrain/Step Time": 17.600852435454726} +{"Full-pretrain/Learning Rate": 4.544275190350031e-05, "Full-pretrain/Loss": 2.0199878215789795, "Full-pretrain/Loss (Raw)": 2.0089523792266846, "Full-pretrain/Step": 2092, "Full-pretrain/Step Time": 17.602293334901333} +{"Full-pretrain/Learning Rate": 4.5437863168097496e-05, "Full-pretrain/Loss": 2.0119547843933105, "Full-pretrain/Loss (Raw)": 1.9443557262420654, "Full-pretrain/Step": 2093, "Full-pretrain/Step Time": 17.61047102510929} +{"Full-pretrain/Learning Rate": 4.543297207519434e-05, "Full-pretrain/Loss": 2.011720657348633, "Full-pretrain/Loss (Raw)": 1.863410234451294, "Full-pretrain/Step": 2094, "Full-pretrain/Step Time": 17.61049935221672} +{"Full-pretrain/Learning Rate": 4.542807862535504e-05, "Full-pretrain/Loss": 2.0187125205993652, "Full-pretrain/Loss (Raw)": 2.2423739433288574, "Full-pretrain/Step": 2095, "Full-pretrain/Step Time": 17.60832673124969} +{"Full-pretrain/Learning Rate": 4.5423182819144055e-05, "Full-pretrain/Loss": 2.0227060317993164, "Full-pretrain/Loss (Raw)": 2.0462074279785156, "Full-pretrain/Step": 2096, "Full-pretrain/Step Time": 17.605195807293057} +{"Full-pretrain/Learning Rate": 4.541828465712611e-05, "Full-pretrain/Loss": 2.01716947555542, "Full-pretrain/Loss (Raw)": 2.14793062210083, "Full-pretrain/Step": 2097, "Full-pretrain/Step Time": 17.613383615389466} +{"Full-pretrain/Learning Rate": 4.54133841398662e-05, "Full-pretrain/Loss": 2.01715087890625, "Full-pretrain/Loss (Raw)": 2.1009573936462402, "Full-pretrain/Step": 2098, "Full-pretrain/Step Time": 17.609750350937247} +{"Full-pretrain/Learning Rate": 4.5408481267929605e-05, "Full-pretrain/Loss": 2.0229153633117676, "Full-pretrain/Loss (Raw)": 2.084646463394165, "Full-pretrain/Step": 2099, "Full-pretrain/Step Time": 17.612385101616383} +{"Full-pretrain/Learning Rate": 4.5403576041881864e-05, "Full-pretrain/Loss": 2.024704694747925, "Full-pretrain/Loss (Raw)": 1.9908509254455566, "Full-pretrain/Step": 2100, "Full-pretrain/Step Time": 17.602061480283737} +{"Full-pretrain/Learning Rate": 4.53986684622888e-05, "Full-pretrain/Loss": 2.020453453063965, "Full-pretrain/Loss (Raw)": 1.949886441230774, "Full-pretrain/Step": 2101, "Full-pretrain/Step Time": 17.61007202602923} +{"Full-pretrain/Learning Rate": 4.539375852971649e-05, "Full-pretrain/Loss": 2.023751735687256, "Full-pretrain/Loss (Raw)": 2.0645265579223633, "Full-pretrain/Step": 2102, "Full-pretrain/Step Time": 17.612642105668783} +{"Full-pretrain/Learning Rate": 4.538884624473131e-05, "Full-pretrain/Loss": 2.016005039215088, "Full-pretrain/Loss (Raw)": 1.8040382862091064, "Full-pretrain/Step": 2103, "Full-pretrain/Step Time": 17.610668981447816} +{"Full-pretrain/Learning Rate": 4.538393160789988e-05, "Full-pretrain/Loss": 2.02504301071167, "Full-pretrain/Loss (Raw)": 2.0831716060638428, "Full-pretrain/Step": 2104, "Full-pretrain/Step Time": 17.608455628156662} +{"Full-pretrain/Learning Rate": 4.5379014619789104e-05, "Full-pretrain/Loss": 2.018657684326172, "Full-pretrain/Loss (Raw)": 2.0079758167266846, "Full-pretrain/Step": 2105, "Full-pretrain/Step Time": 17.611419837921858} +{"Full-pretrain/Learning Rate": 4.537409528096615e-05, "Full-pretrain/Loss": 2.0322909355163574, "Full-pretrain/Loss (Raw)": 2.073737621307373, "Full-pretrain/Step": 2106, "Full-pretrain/Step Time": 17.619196731597185} +{"Full-pretrain/Learning Rate": 4.536917359199847e-05, "Full-pretrain/Loss": 2.0340981483459473, "Full-pretrain/Loss (Raw)": 2.039680242538452, "Full-pretrain/Step": 2107, "Full-pretrain/Step Time": 17.61331593245268} +{"Full-pretrain/Learning Rate": 4.536424955345376e-05, "Full-pretrain/Loss": 2.030637502670288, "Full-pretrain/Loss (Raw)": 2.0059239864349365, "Full-pretrain/Step": 2108, "Full-pretrain/Step Time": 17.610236756503582} +{"Full-pretrain/Learning Rate": 4.5359323165900036e-05, "Full-pretrain/Loss": 2.024453639984131, "Full-pretrain/Loss (Raw)": 1.9687516689300537, "Full-pretrain/Step": 2109, "Full-pretrain/Step Time": 17.61186329089105} +{"Full-pretrain/Learning Rate": 4.535439442990553e-05, "Full-pretrain/Loss": 2.0326004028320312, "Full-pretrain/Loss (Raw)": 2.0288052558898926, "Full-pretrain/Step": 2110, "Full-pretrain/Step Time": 17.614952063187957} +{"Full-pretrain/Learning Rate": 4.534946334603879e-05, "Full-pretrain/Loss": 2.0293784141540527, "Full-pretrain/Loss (Raw)": 1.9033336639404297, "Full-pretrain/Step": 2111, "Full-pretrain/Step Time": 17.61289594694972} +{"Full-pretrain/Learning Rate": 4.5344529914868596e-05, "Full-pretrain/Loss": 2.0337719917297363, "Full-pretrain/Loss (Raw)": 2.198152780532837, "Full-pretrain/Step": 2112, "Full-pretrain/Step Time": 17.61354200169444} +{"Full-pretrain/Learning Rate": 4.533959413696403e-05, "Full-pretrain/Loss": 2.0360679626464844, "Full-pretrain/Loss (Raw)": 2.0199477672576904, "Full-pretrain/Step": 2113, "Full-pretrain/Step Time": 17.618382101878524} +{"Full-pretrain/Learning Rate": 4.533465601289443e-05, "Full-pretrain/Loss": 2.0354769229888916, "Full-pretrain/Loss (Raw)": 2.051955223083496, "Full-pretrain/Step": 2114, "Full-pretrain/Step Time": 17.61897891946137} +{"Full-pretrain/Learning Rate": 4.53297155432294e-05, "Full-pretrain/Loss": 2.0340113639831543, "Full-pretrain/Loss (Raw)": 1.8044817447662354, "Full-pretrain/Step": 2115, "Full-pretrain/Step Time": 17.608260916545987} +{"Full-pretrain/Learning Rate": 4.5324772728538825e-05, "Full-pretrain/Loss": 2.0418219566345215, "Full-pretrain/Loss (Raw)": 2.335153579711914, "Full-pretrain/Step": 2116, "Full-pretrain/Step Time": 17.6054530441761} +{"Full-pretrain/Learning Rate": 4.531982756939286e-05, "Full-pretrain/Loss": 2.0359244346618652, "Full-pretrain/Loss (Raw)": 1.9008759260177612, "Full-pretrain/Step": 2117, "Full-pretrain/Step Time": 17.61052979156375} +{"Full-pretrain/Learning Rate": 4.531488006636193e-05, "Full-pretrain/Loss": 2.02439022064209, "Full-pretrain/Loss (Raw)": 1.7796666622161865, "Full-pretrain/Step": 2118, "Full-pretrain/Step Time": 17.612517040222883} +{"Full-pretrain/Learning Rate": 4.530993022001671e-05, "Full-pretrain/Loss": 2.0142135620117188, "Full-pretrain/Loss (Raw)": 1.7268435955047607, "Full-pretrain/Step": 2119, "Full-pretrain/Step Time": 17.61036740615964} +{"Full-pretrain/Learning Rate": 4.530497803092819e-05, "Full-pretrain/Loss": 2.0097270011901855, "Full-pretrain/Loss (Raw)": 1.8880279064178467, "Full-pretrain/Step": 2120, "Full-pretrain/Step Time": 17.607632271945477} +{"Full-pretrain/Learning Rate": 4.530002349966759e-05, "Full-pretrain/Loss": 2.0082345008850098, "Full-pretrain/Loss (Raw)": 2.017726421356201, "Full-pretrain/Step": 2121, "Full-pretrain/Step Time": 17.609432194381952} +{"Full-pretrain/Learning Rate": 4.529506662680641e-05, "Full-pretrain/Loss": 2.000967025756836, "Full-pretrain/Loss (Raw)": 1.93929123878479, "Full-pretrain/Step": 2122, "Full-pretrain/Step Time": 17.61149975657463} +{"Full-pretrain/Learning Rate": 4.5290107412916427e-05, "Full-pretrain/Loss": 2.0038766860961914, "Full-pretrain/Loss (Raw)": 2.102410078048706, "Full-pretrain/Step": 2123, "Full-pretrain/Step Time": 17.610477421432734} +{"Full-pretrain/Learning Rate": 4.5285145858569686e-05, "Full-pretrain/Loss": 1.9956591129302979, "Full-pretrain/Loss (Raw)": 1.745996117591858, "Full-pretrain/Step": 2124, "Full-pretrain/Step Time": 17.607181256636977} +{"Full-pretrain/Learning Rate": 4.5280181964338495e-05, "Full-pretrain/Loss": 1.9987053871154785, "Full-pretrain/Loss (Raw)": 2.041835308074951, "Full-pretrain/Step": 2125, "Full-pretrain/Step Time": 17.607302129268646} +{"Full-pretrain/Learning Rate": 4.527521573079544e-05, "Full-pretrain/Loss": 2.006736993789673, "Full-pretrain/Loss (Raw)": 2.120424747467041, "Full-pretrain/Step": 2126, "Full-pretrain/Step Time": 17.611810689792037} +{"Full-pretrain/Learning Rate": 4.527024715851338e-05, "Full-pretrain/Loss": 1.9997090101242065, "Full-pretrain/Loss (Raw)": 2.0174741744995117, "Full-pretrain/Step": 2127, "Full-pretrain/Step Time": 17.61421198397875} +{"Full-pretrain/Learning Rate": 4.526527624806543e-05, "Full-pretrain/Loss": 1.9959402084350586, "Full-pretrain/Loss (Raw)": 1.9256072044372559, "Full-pretrain/Step": 2128, "Full-pretrain/Step Time": 17.61829424649477} +{"Full-pretrain/Learning Rate": 4.5260303000025e-05, "Full-pretrain/Loss": 1.9909085035324097, "Full-pretrain/Loss (Raw)": 1.9869160652160645, "Full-pretrain/Step": 2129, "Full-pretrain/Step Time": 17.622833667322993} +{"Full-pretrain/Learning Rate": 4.525532741496572e-05, "Full-pretrain/Loss": 1.9800306558609009, "Full-pretrain/Loss (Raw)": 1.7528669834136963, "Full-pretrain/Step": 2130, "Full-pretrain/Step Time": 17.62345163524151} +{"Full-pretrain/Learning Rate": 4.525034949346155e-05, "Full-pretrain/Loss": 1.9790098667144775, "Full-pretrain/Loss (Raw)": 2.0519816875457764, "Full-pretrain/Step": 2131, "Full-pretrain/Step Time": 17.62265187688172} +{"Full-pretrain/Learning Rate": 4.524536923608668e-05, "Full-pretrain/Loss": 1.9809530973434448, "Full-pretrain/Loss (Raw)": 2.053034782409668, "Full-pretrain/Step": 2132, "Full-pretrain/Step Time": 17.614586299285293} +{"Full-pretrain/Learning Rate": 4.524038664341558e-05, "Full-pretrain/Loss": 1.9908037185668945, "Full-pretrain/Loss (Raw)": 2.265101432800293, "Full-pretrain/Step": 2133, "Full-pretrain/Step Time": 17.617163645103574} +{"Full-pretrain/Learning Rate": 4.5235401716023e-05, "Full-pretrain/Loss": 1.9935810565948486, "Full-pretrain/Loss (Raw)": 2.1534042358398438, "Full-pretrain/Step": 2134, "Full-pretrain/Step Time": 17.616433538496494} +{"Full-pretrain/Learning Rate": 4.523041445448394e-05, "Full-pretrain/Loss": 2.004918336868286, "Full-pretrain/Loss (Raw)": 2.1668317317962646, "Full-pretrain/Step": 2135, "Full-pretrain/Step Time": 17.621110694482923} +{"Full-pretrain/Learning Rate": 4.522542485937369e-05, "Full-pretrain/Loss": 1.9950038194656372, "Full-pretrain/Loss (Raw)": 1.7659077644348145, "Full-pretrain/Step": 2136, "Full-pretrain/Step Time": 17.62156397663057} +{"Full-pretrain/Learning Rate": 4.522043293126778e-05, "Full-pretrain/Loss": 1.9903099536895752, "Full-pretrain/Loss (Raw)": 1.8577678203582764, "Full-pretrain/Step": 2137, "Full-pretrain/Step Time": 17.620534429326653} +{"Full-pretrain/Learning Rate": 4.5215438670742045e-05, "Full-pretrain/Loss": 1.9893540143966675, "Full-pretrain/Loss (Raw)": 2.043149948120117, "Full-pretrain/Step": 2138, "Full-pretrain/Step Time": 17.620751483365893} +{"Full-pretrain/Learning Rate": 4.521044207837256e-05, "Full-pretrain/Loss": 1.9876585006713867, "Full-pretrain/Loss (Raw)": 1.9854278564453125, "Full-pretrain/Step": 2139, "Full-pretrain/Step Time": 17.62067561224103} +{"Full-pretrain/Learning Rate": 4.5205443154735684e-05, "Full-pretrain/Loss": 1.9885445833206177, "Full-pretrain/Loss (Raw)": 2.034275770187378, "Full-pretrain/Step": 2140, "Full-pretrain/Step Time": 17.61997414007783} +{"Full-pretrain/Learning Rate": 4.5200441900408045e-05, "Full-pretrain/Loss": 1.9875352382659912, "Full-pretrain/Loss (Raw)": 1.936450719833374, "Full-pretrain/Step": 2141, "Full-pretrain/Step Time": 17.61966234073043} +{"Full-pretrain/Learning Rate": 4.519543831596652e-05, "Full-pretrain/Loss": 1.9949270486831665, "Full-pretrain/Loss (Raw)": 2.2653446197509766, "Full-pretrain/Step": 2142, "Full-pretrain/Step Time": 17.623173279687762} +{"Full-pretrain/Learning Rate": 4.519043240198829e-05, "Full-pretrain/Loss": 2.0179455280303955, "Full-pretrain/Loss (Raw)": 2.639920473098755, "Full-pretrain/Step": 2143, "Full-pretrain/Step Time": 17.620318606495857} +{"Full-pretrain/Learning Rate": 4.518542415905077e-05, "Full-pretrain/Loss": 2.0118637084960938, "Full-pretrain/Loss (Raw)": 2.00354266166687, "Full-pretrain/Step": 2144, "Full-pretrain/Step Time": 17.61998775973916} +{"Full-pretrain/Learning Rate": 4.518041358773169e-05, "Full-pretrain/Loss": 2.0113823413848877, "Full-pretrain/Loss (Raw)": 2.004539728164673, "Full-pretrain/Step": 2145, "Full-pretrain/Step Time": 17.61376792937517} +{"Full-pretrain/Learning Rate": 4.517540068860897e-05, "Full-pretrain/Loss": 2.0172839164733887, "Full-pretrain/Loss (Raw)": 2.2408084869384766, "Full-pretrain/Step": 2146, "Full-pretrain/Step Time": 17.615575479343534} +{"Full-pretrain/Learning Rate": 4.5170385462260875e-05, "Full-pretrain/Loss": 2.0183563232421875, "Full-pretrain/Loss (Raw)": 1.8387892246246338, "Full-pretrain/Step": 2147, "Full-pretrain/Step Time": 17.61618353240192} +{"Full-pretrain/Learning Rate": 4.516536790926592e-05, "Full-pretrain/Loss": 2.0090811252593994, "Full-pretrain/Loss (Raw)": 2.038351535797119, "Full-pretrain/Step": 2148, "Full-pretrain/Step Time": 17.61610059440136} +{"Full-pretrain/Learning Rate": 4.516034803020285e-05, "Full-pretrain/Loss": 2.0051491260528564, "Full-pretrain/Loss (Raw)": 1.7750575542449951, "Full-pretrain/Step": 2149, "Full-pretrain/Step Time": 17.61459149979055} +{"Full-pretrain/Learning Rate": 4.515532582565072e-05, "Full-pretrain/Loss": 2.015944480895996, "Full-pretrain/Loss (Raw)": 2.1251134872436523, "Full-pretrain/Step": 2150, "Full-pretrain/Step Time": 17.615379728376865} +{"Full-pretrain/Learning Rate": 4.515030129618884e-05, "Full-pretrain/Loss": 2.0217947959899902, "Full-pretrain/Loss (Raw)": 1.914050817489624, "Full-pretrain/Step": 2151, "Full-pretrain/Step Time": 17.616170512512326} +{"Full-pretrain/Learning Rate": 4.514527444239679e-05, "Full-pretrain/Loss": 2.0338642597198486, "Full-pretrain/Loss (Raw)": 2.2742509841918945, "Full-pretrain/Step": 2152, "Full-pretrain/Step Time": 17.613698113709688} +{"Full-pretrain/Learning Rate": 4.514024526485441e-05, "Full-pretrain/Loss": 2.0388002395629883, "Full-pretrain/Loss (Raw)": 2.17568302154541, "Full-pretrain/Step": 2153, "Full-pretrain/Step Time": 17.615640718489885} +{"Full-pretrain/Learning Rate": 4.513521376414181e-05, "Full-pretrain/Loss": 2.042919158935547, "Full-pretrain/Loss (Raw)": 2.0710959434509277, "Full-pretrain/Step": 2154, "Full-pretrain/Step Time": 17.62437440827489} +{"Full-pretrain/Learning Rate": 4.513017994083939e-05, "Full-pretrain/Loss": 2.0421862602233887, "Full-pretrain/Loss (Raw)": 2.0789542198181152, "Full-pretrain/Step": 2155, "Full-pretrain/Step Time": 17.619359927251935} +{"Full-pretrain/Learning Rate": 4.512514379552779e-05, "Full-pretrain/Loss": 2.039170980453491, "Full-pretrain/Loss (Raw)": 1.6495082378387451, "Full-pretrain/Step": 2156, "Full-pretrain/Step Time": 17.624029533937573} +{"Full-pretrain/Learning Rate": 4.512010532878792e-05, "Full-pretrain/Loss": 2.039684772491455, "Full-pretrain/Loss (Raw)": 2.0582752227783203, "Full-pretrain/Step": 2157, "Full-pretrain/Step Time": 17.619866529479623} +{"Full-pretrain/Learning Rate": 4.511506454120097e-05, "Full-pretrain/Loss": 2.0300440788269043, "Full-pretrain/Loss (Raw)": 1.81192946434021, "Full-pretrain/Step": 2158, "Full-pretrain/Step Time": 17.624483939260244} +{"Full-pretrain/Learning Rate": 4.5110021433348396e-05, "Full-pretrain/Loss": 2.028258800506592, "Full-pretrain/Loss (Raw)": 1.9603424072265625, "Full-pretrain/Step": 2159, "Full-pretrain/Step Time": 17.617184903472662} +{"Full-pretrain/Learning Rate": 4.510497600581192e-05, "Full-pretrain/Loss": 2.0369186401367188, "Full-pretrain/Loss (Raw)": 2.202718734741211, "Full-pretrain/Step": 2160, "Full-pretrain/Step Time": 17.62564382329583} +{"Full-pretrain/Learning Rate": 4.5099928259173516e-05, "Full-pretrain/Loss": 2.039484739303589, "Full-pretrain/Loss (Raw)": 2.0690348148345947, "Full-pretrain/Step": 2161, "Full-pretrain/Step Time": 17.62167017161846} +{"Full-pretrain/Learning Rate": 4.509487819401545e-05, "Full-pretrain/Loss": 2.0541019439697266, "Full-pretrain/Loss (Raw)": 2.220620632171631, "Full-pretrain/Step": 2162, "Full-pretrain/Step Time": 17.626647541299462} +{"Full-pretrain/Learning Rate": 4.508982581092026e-05, "Full-pretrain/Loss": 2.0490775108337402, "Full-pretrain/Loss (Raw)": 1.8912012577056885, "Full-pretrain/Step": 2163, "Full-pretrain/Step Time": 17.62676993943751} +{"Full-pretrain/Learning Rate": 4.508477111047072e-05, "Full-pretrain/Loss": 2.0531699657440186, "Full-pretrain/Loss (Raw)": 2.1839911937713623, "Full-pretrain/Step": 2164, "Full-pretrain/Step Time": 17.6295730099082} +{"Full-pretrain/Learning Rate": 4.5079714093249884e-05, "Full-pretrain/Loss": 2.0407819747924805, "Full-pretrain/Loss (Raw)": 1.8686838150024414, "Full-pretrain/Step": 2165, "Full-pretrain/Step Time": 17.62890568561852} +{"Full-pretrain/Learning Rate": 4.507465475984109e-05, "Full-pretrain/Loss": 2.032245635986328, "Full-pretrain/Loss (Raw)": 1.880239725112915, "Full-pretrain/Step": 2166, "Full-pretrain/Step Time": 17.624402726069093} +{"Full-pretrain/Learning Rate": 4.5069593110827926e-05, "Full-pretrain/Loss": 2.0285849571228027, "Full-pretrain/Loss (Raw)": 2.049696445465088, "Full-pretrain/Step": 2167, "Full-pretrain/Step Time": 17.621249878779054} +{"Full-pretrain/Learning Rate": 4.506452914679424e-05, "Full-pretrain/Loss": 2.0334601402282715, "Full-pretrain/Loss (Raw)": 1.921903371810913, "Full-pretrain/Step": 2168, "Full-pretrain/Step Time": 17.622483126819134} +{"Full-pretrain/Learning Rate": 4.505946286832418e-05, "Full-pretrain/Loss": 2.039706230163574, "Full-pretrain/Loss (Raw)": 2.057648181915283, "Full-pretrain/Step": 2169, "Full-pretrain/Step Time": 17.618188481777906} +{"Full-pretrain/Learning Rate": 4.505439427600211e-05, "Full-pretrain/Loss": 2.035567283630371, "Full-pretrain/Loss (Raw)": 1.9107016324996948, "Full-pretrain/Step": 2170, "Full-pretrain/Step Time": 17.62096224538982} +{"Full-pretrain/Learning Rate": 4.5049323370412724e-05, "Full-pretrain/Loss": 2.0399742126464844, "Full-pretrain/Loss (Raw)": 2.1264543533325195, "Full-pretrain/Step": 2171, "Full-pretrain/Step Time": 17.620615983381867} +{"Full-pretrain/Learning Rate": 4.504425015214092e-05, "Full-pretrain/Loss": 2.0298917293548584, "Full-pretrain/Loss (Raw)": 1.7116291522979736, "Full-pretrain/Step": 2172, "Full-pretrain/Step Time": 17.618403021246195} +{"Full-pretrain/Learning Rate": 4.503917462177192e-05, "Full-pretrain/Loss": 2.0389821529388428, "Full-pretrain/Loss (Raw)": 2.227349281311035, "Full-pretrain/Step": 2173, "Full-pretrain/Step Time": 17.61333523131907} +{"Full-pretrain/Learning Rate": 4.503409677989116e-05, "Full-pretrain/Loss": 2.0284323692321777, "Full-pretrain/Loss (Raw)": 1.9277441501617432, "Full-pretrain/Step": 2174, "Full-pretrain/Step Time": 17.61782167479396} +{"Full-pretrain/Learning Rate": 4.502901662708437e-05, "Full-pretrain/Loss": 2.0005204677581787, "Full-pretrain/Loss (Raw)": 1.746746301651001, "Full-pretrain/Step": 2175, "Full-pretrain/Step Time": 17.617197206243873} +{"Full-pretrain/Learning Rate": 4.502393416393756e-05, "Full-pretrain/Loss": 2.000173330307007, "Full-pretrain/Loss (Raw)": 1.9924302101135254, "Full-pretrain/Step": 2176, "Full-pretrain/Step Time": 17.62243109382689} +{"Full-pretrain/Learning Rate": 4.5018849391036986e-05, "Full-pretrain/Loss": 1.99898362159729, "Full-pretrain/Loss (Raw)": 1.966475248336792, "Full-pretrain/Step": 2177, "Full-pretrain/Step Time": 17.616861740127206} +{"Full-pretrain/Learning Rate": 4.501376230896917e-05, "Full-pretrain/Loss": 1.9915162324905396, "Full-pretrain/Loss (Raw)": 2.0018470287323, "Full-pretrain/Step": 2178, "Full-pretrain/Step Time": 17.619870020076632} +{"Full-pretrain/Learning Rate": 4.500867291832089e-05, "Full-pretrain/Loss": 2.001269817352295, "Full-pretrain/Loss (Raw)": 2.150907516479492, "Full-pretrain/Step": 2179, "Full-pretrain/Step Time": 17.618873106315732} +{"Full-pretrain/Learning Rate": 4.5003581219679233e-05, "Full-pretrain/Loss": 1.9999096393585205, "Full-pretrain/Loss (Raw)": 1.9948225021362305, "Full-pretrain/Step": 2180, "Full-pretrain/Step Time": 17.619551111012697} +{"Full-pretrain/Learning Rate": 4.499848721363151e-05, "Full-pretrain/Loss": 2.0061306953430176, "Full-pretrain/Loss (Raw)": 1.9741344451904297, "Full-pretrain/Step": 2181, "Full-pretrain/Step Time": 17.61150055937469} +{"Full-pretrain/Learning Rate": 4.499339090076532e-05, "Full-pretrain/Loss": 2.00742769241333, "Full-pretrain/Loss (Raw)": 2.166614055633545, "Full-pretrain/Step": 2182, "Full-pretrain/Step Time": 17.61277701333165} +{"Full-pretrain/Learning Rate": 4.498829228166851e-05, "Full-pretrain/Loss": 2.0064449310302734, "Full-pretrain/Loss (Raw)": 1.8826018571853638, "Full-pretrain/Step": 2183, "Full-pretrain/Step Time": 17.620195105671883} +{"Full-pretrain/Learning Rate": 4.498319135692921e-05, "Full-pretrain/Loss": 1.9971262216567993, "Full-pretrain/Loss (Raw)": 1.9760559797286987, "Full-pretrain/Step": 2184, "Full-pretrain/Step Time": 17.615680672228336} +{"Full-pretrain/Learning Rate": 4.4978088127135806e-05, "Full-pretrain/Loss": 1.9943532943725586, "Full-pretrain/Loss (Raw)": 2.086946725845337, "Full-pretrain/Step": 2185, "Full-pretrain/Step Time": 17.623073909431696} +{"Full-pretrain/Learning Rate": 4.497298259287696e-05, "Full-pretrain/Loss": 1.9937622547149658, "Full-pretrain/Loss (Raw)": 2.052187442779541, "Full-pretrain/Step": 2186, "Full-pretrain/Step Time": 17.616106720641255} +{"Full-pretrain/Learning Rate": 4.496787475474159e-05, "Full-pretrain/Loss": 1.993799090385437, "Full-pretrain/Loss (Raw)": 2.080132007598877, "Full-pretrain/Step": 2187, "Full-pretrain/Step Time": 17.620192965492606} +{"Full-pretrain/Learning Rate": 4.496276461331889e-05, "Full-pretrain/Loss": 2.010348320007324, "Full-pretrain/Loss (Raw)": 2.179077625274658, "Full-pretrain/Step": 2188, "Full-pretrain/Step Time": 17.623043993487954} +{"Full-pretrain/Learning Rate": 4.49576521691983e-05, "Full-pretrain/Loss": 2.0048675537109375, "Full-pretrain/Loss (Raw)": 1.8828926086425781, "Full-pretrain/Step": 2189, "Full-pretrain/Step Time": 17.62175950780511} +{"Full-pretrain/Learning Rate": 4.495253742296955e-05, "Full-pretrain/Loss": 2.0155837535858154, "Full-pretrain/Loss (Raw)": 2.1548514366149902, "Full-pretrain/Step": 2190, "Full-pretrain/Step Time": 17.62631994113326} +{"Full-pretrain/Learning Rate": 4.4947420375222616e-05, "Full-pretrain/Loss": 2.0238046646118164, "Full-pretrain/Loss (Raw)": 2.2234151363372803, "Full-pretrain/Step": 2191, "Full-pretrain/Step Time": 17.625091223046184} +{"Full-pretrain/Learning Rate": 4.4942301026547755e-05, "Full-pretrain/Loss": 2.0190560817718506, "Full-pretrain/Loss (Raw)": 2.050760507583618, "Full-pretrain/Step": 2192, "Full-pretrain/Step Time": 17.628781836479902} +{"Full-pretrain/Learning Rate": 4.4937179377535476e-05, "Full-pretrain/Loss": 2.0195322036743164, "Full-pretrain/Loss (Raw)": 2.084270477294922, "Full-pretrain/Step": 2193, "Full-pretrain/Step Time": 17.624146703630686} +{"Full-pretrain/Learning Rate": 4.493205542877656e-05, "Full-pretrain/Loss": 2.0157270431518555, "Full-pretrain/Loss (Raw)": 2.0988481044769287, "Full-pretrain/Step": 2194, "Full-pretrain/Step Time": 17.629422897472978} +{"Full-pretrain/Learning Rate": 4.4926929180862064e-05, "Full-pretrain/Loss": 2.021043539047241, "Full-pretrain/Loss (Raw)": 2.061335325241089, "Full-pretrain/Step": 2195, "Full-pretrain/Step Time": 17.632034979760647} +{"Full-pretrain/Learning Rate": 4.4921800634383294e-05, "Full-pretrain/Loss": 2.013479709625244, "Full-pretrain/Loss (Raw)": 1.9419445991516113, "Full-pretrain/Step": 2196, "Full-pretrain/Step Time": 17.633865298703313} +{"Full-pretrain/Learning Rate": 4.491666978993181e-05, "Full-pretrain/Loss": 2.012557029724121, "Full-pretrain/Loss (Raw)": 1.8391591310501099, "Full-pretrain/Step": 2197, "Full-pretrain/Step Time": 17.629334576427937} +{"Full-pretrain/Learning Rate": 4.4911536648099464e-05, "Full-pretrain/Loss": 2.0210933685302734, "Full-pretrain/Loss (Raw)": 2.1534032821655273, "Full-pretrain/Step": 2198, "Full-pretrain/Step Time": 17.635051306337118} +{"Full-pretrain/Learning Rate": 4.4906401209478367e-05, "Full-pretrain/Loss": 2.0183095932006836, "Full-pretrain/Loss (Raw)": 1.9606205224990845, "Full-pretrain/Step": 2199, "Full-pretrain/Step Time": 17.635975124314427} +{"Full-pretrain/Learning Rate": 4.4901263474660894e-05, "Full-pretrain/Loss": 2.0268845558166504, "Full-pretrain/Loss (Raw)": 2.196300983428955, "Full-pretrain/Step": 2200, "Full-pretrain/Step Time": 17.63521990738809} +{"Full-pretrain/Learning Rate": 4.489612344423966e-05, "Full-pretrain/Loss": 2.03340220451355, "Full-pretrain/Loss (Raw)": 2.2662131786346436, "Full-pretrain/Step": 2201, "Full-pretrain/Step Time": 17.63004350475967} +{"Full-pretrain/Learning Rate": 4.489098111880759e-05, "Full-pretrain/Loss": 2.029756546020508, "Full-pretrain/Loss (Raw)": 1.7940336465835571, "Full-pretrain/Step": 2202, "Full-pretrain/Step Time": 17.640214988961816} +{"Full-pretrain/Learning Rate": 4.4885836498957824e-05, "Full-pretrain/Loss": 2.0280492305755615, "Full-pretrain/Loss (Raw)": 2.0718300342559814, "Full-pretrain/Step": 2203, "Full-pretrain/Step Time": 17.638881735503674} +{"Full-pretrain/Learning Rate": 4.488068958528382e-05, "Full-pretrain/Loss": 2.031439781188965, "Full-pretrain/Loss (Raw)": 1.82012140750885, "Full-pretrain/Step": 2204, "Full-pretrain/Step Time": 17.635822465643287} +{"Full-pretrain/Learning Rate": 4.487554037837925e-05, "Full-pretrain/Loss": 2.023237466812134, "Full-pretrain/Loss (Raw)": 1.9648747444152832, "Full-pretrain/Step": 2205, "Full-pretrain/Step Time": 17.638099847361445} +{"Full-pretrain/Learning Rate": 4.487038887883809e-05, "Full-pretrain/Loss": 2.026444435119629, "Full-pretrain/Loss (Raw)": 2.030364751815796, "Full-pretrain/Step": 2206, "Full-pretrain/Step Time": 17.63563211262226} +{"Full-pretrain/Learning Rate": 4.4865235087254545e-05, "Full-pretrain/Loss": 2.031055450439453, "Full-pretrain/Loss (Raw)": 1.894302487373352, "Full-pretrain/Step": 2207, "Full-pretrain/Step Time": 17.631905537098646} +{"Full-pretrain/Learning Rate": 4.486007900422312e-05, "Full-pretrain/Loss": 2.032233953475952, "Full-pretrain/Loss (Raw)": 2.0301413536071777, "Full-pretrain/Step": 2208, "Full-pretrain/Step Time": 17.633574144914746} +{"Full-pretrain/Learning Rate": 4.485492063033856e-05, "Full-pretrain/Loss": 2.0357882976531982, "Full-pretrain/Loss (Raw)": 2.0802128314971924, "Full-pretrain/Step": 2209, "Full-pretrain/Step Time": 17.628115467727184} +{"Full-pretrain/Learning Rate": 4.484975996619589e-05, "Full-pretrain/Loss": 2.0421018600463867, "Full-pretrain/Loss (Raw)": 2.2038848400115967, "Full-pretrain/Step": 2210, "Full-pretrain/Step Time": 17.630452688783407} +{"Full-pretrain/Learning Rate": 4.484459701239038e-05, "Full-pretrain/Loss": 2.0389528274536133, "Full-pretrain/Loss (Raw)": 2.050138473510742, "Full-pretrain/Step": 2211, "Full-pretrain/Step Time": 17.63402133062482} +{"Full-pretrain/Learning Rate": 4.483943176951757e-05, "Full-pretrain/Loss": 2.042938709259033, "Full-pretrain/Loss (Raw)": 2.122368812561035, "Full-pretrain/Step": 2212, "Full-pretrain/Step Time": 17.633240666240454} +{"Full-pretrain/Learning Rate": 4.4834264238173285e-05, "Full-pretrain/Loss": 2.051187038421631, "Full-pretrain/Loss (Raw)": 2.238083600997925, "Full-pretrain/Step": 2213, "Full-pretrain/Step Time": 17.63125553354621} +{"Full-pretrain/Learning Rate": 4.4829094418953586e-05, "Full-pretrain/Loss": 2.0504236221313477, "Full-pretrain/Loss (Raw)": 2.142178535461426, "Full-pretrain/Step": 2214, "Full-pretrain/Step Time": 17.629309562966228} +{"Full-pretrain/Learning Rate": 4.482392231245481e-05, "Full-pretrain/Loss": 2.049783706665039, "Full-pretrain/Loss (Raw)": 1.8621268272399902, "Full-pretrain/Step": 2215, "Full-pretrain/Step Time": 17.633676052093506} +{"Full-pretrain/Learning Rate": 4.4818747919273575e-05, "Full-pretrain/Loss": 2.051828145980835, "Full-pretrain/Loss (Raw)": 2.0414769649505615, "Full-pretrain/Step": 2216, "Full-pretrain/Step Time": 17.634715925902128} +{"Full-pretrain/Learning Rate": 4.4813571240006726e-05, "Full-pretrain/Loss": 2.0437512397766113, "Full-pretrain/Loss (Raw)": 1.828485131263733, "Full-pretrain/Step": 2217, "Full-pretrain/Step Time": 17.63120224699378} +{"Full-pretrain/Learning Rate": 4.48083922752514e-05, "Full-pretrain/Loss": 2.043300151824951, "Full-pretrain/Loss (Raw)": 2.037750244140625, "Full-pretrain/Step": 2218, "Full-pretrain/Step Time": 17.629843812435865} +{"Full-pretrain/Learning Rate": 4.480321102560499e-05, "Full-pretrain/Loss": 2.0400261878967285, "Full-pretrain/Loss (Raw)": 1.9753634929656982, "Full-pretrain/Step": 2219, "Full-pretrain/Step Time": 17.632408883422613} +{"Full-pretrain/Learning Rate": 4.4798027491665134e-05, "Full-pretrain/Loss": 2.0344038009643555, "Full-pretrain/Loss (Raw)": 1.9991657733917236, "Full-pretrain/Step": 2220, "Full-pretrain/Step Time": 17.631814997643232} +{"Full-pretrain/Learning Rate": 4.4792841674029776e-05, "Full-pretrain/Loss": 2.041288375854492, "Full-pretrain/Loss (Raw)": 2.1031951904296875, "Full-pretrain/Step": 2221, "Full-pretrain/Step Time": 17.624777337536216} +{"Full-pretrain/Learning Rate": 4.4787653573297075e-05, "Full-pretrain/Loss": 2.0357580184936523, "Full-pretrain/Loss (Raw)": 1.9778825044631958, "Full-pretrain/Step": 2222, "Full-pretrain/Step Time": 17.627934051677585} +{"Full-pretrain/Learning Rate": 4.47824631900655e-05, "Full-pretrain/Loss": 2.0303573608398438, "Full-pretrain/Loss (Raw)": 2.050593376159668, "Full-pretrain/Step": 2223, "Full-pretrain/Step Time": 17.62971117347479} +{"Full-pretrain/Learning Rate": 4.477727052493375e-05, "Full-pretrain/Loss": 2.034287929534912, "Full-pretrain/Loss (Raw)": 2.176541805267334, "Full-pretrain/Step": 2224, "Full-pretrain/Step Time": 17.634803058579564} +{"Full-pretrain/Learning Rate": 4.4772075578500785e-05, "Full-pretrain/Loss": 2.0312156677246094, "Full-pretrain/Loss (Raw)": 1.9859619140625, "Full-pretrain/Step": 2225, "Full-pretrain/Step Time": 17.62598145008087} +{"Full-pretrain/Learning Rate": 4.476687835136585e-05, "Full-pretrain/Loss": 2.044917106628418, "Full-pretrain/Loss (Raw)": 2.537289619445801, "Full-pretrain/Step": 2226, "Full-pretrain/Step Time": 17.633341621607542} +{"Full-pretrain/Learning Rate": 4.476167884412845e-05, "Full-pretrain/Loss": 2.041790008544922, "Full-pretrain/Loss (Raw)": 1.9612696170806885, "Full-pretrain/Step": 2227, "Full-pretrain/Step Time": 17.63532785885036} +{"Full-pretrain/Learning Rate": 4.475647705738833e-05, "Full-pretrain/Loss": 2.038681983947754, "Full-pretrain/Loss (Raw)": 1.8424909114837646, "Full-pretrain/Step": 2228, "Full-pretrain/Step Time": 17.641269704326987} +{"Full-pretrain/Learning Rate": 4.475127299174554e-05, "Full-pretrain/Loss": 2.0420029163360596, "Full-pretrain/Loss (Raw)": 1.9454286098480225, "Full-pretrain/Step": 2229, "Full-pretrain/Step Time": 17.63209447450936} +{"Full-pretrain/Learning Rate": 4.4746066647800344e-05, "Full-pretrain/Loss": 2.0353055000305176, "Full-pretrain/Loss (Raw)": 1.9390830993652344, "Full-pretrain/Step": 2230, "Full-pretrain/Step Time": 17.63333728350699} +{"Full-pretrain/Learning Rate": 4.4740858026153297e-05, "Full-pretrain/Loss": 2.024468183517456, "Full-pretrain/Loss (Raw)": 1.6138300895690918, "Full-pretrain/Step": 2231, "Full-pretrain/Step Time": 17.63466766476631} +{"Full-pretrain/Learning Rate": 4.4735647127405215e-05, "Full-pretrain/Loss": 2.017444610595703, "Full-pretrain/Loss (Raw)": 1.9715512990951538, "Full-pretrain/Step": 2232, "Full-pretrain/Step Time": 17.629596581682563} +{"Full-pretrain/Learning Rate": 4.473043395215718e-05, "Full-pretrain/Loss": 2.0139966011047363, "Full-pretrain/Loss (Raw)": 2.155867099761963, "Full-pretrain/Step": 2233, "Full-pretrain/Step Time": 17.630854219198227} +{"Full-pretrain/Learning Rate": 4.4725218501010514e-05, "Full-pretrain/Loss": 2.0319747924804688, "Full-pretrain/Loss (Raw)": 2.36933970451355, "Full-pretrain/Step": 2234, "Full-pretrain/Step Time": 17.621143270283937} +{"Full-pretrain/Learning Rate": 4.472000077456683e-05, "Full-pretrain/Loss": 2.0307319164276123, "Full-pretrain/Loss (Raw)": 2.0320558547973633, "Full-pretrain/Step": 2235, "Full-pretrain/Step Time": 17.629626540467143} +{"Full-pretrain/Learning Rate": 4.471478077342798e-05, "Full-pretrain/Loss": 2.0263359546661377, "Full-pretrain/Loss (Raw)": 1.6794500350952148, "Full-pretrain/Step": 2236, "Full-pretrain/Step Time": 17.62928695231676} +{"Full-pretrain/Learning Rate": 4.4709558498196104e-05, "Full-pretrain/Loss": 2.030137777328491, "Full-pretrain/Loss (Raw)": 2.0865323543548584, "Full-pretrain/Step": 2237, "Full-pretrain/Step Time": 17.628940761089325} +{"Full-pretrain/Learning Rate": 4.4704333949473575e-05, "Full-pretrain/Loss": 2.0385825634002686, "Full-pretrain/Loss (Raw)": 2.3005995750427246, "Full-pretrain/Step": 2238, "Full-pretrain/Step Time": 17.624601189047098} +{"Full-pretrain/Learning Rate": 4.469910712786305e-05, "Full-pretrain/Loss": 2.0471882820129395, "Full-pretrain/Loss (Raw)": 2.169687271118164, "Full-pretrain/Step": 2239, "Full-pretrain/Step Time": 17.62186342291534} +{"Full-pretrain/Learning Rate": 4.469387803396745e-05, "Full-pretrain/Loss": 2.0444438457489014, "Full-pretrain/Loss (Raw)": 1.9423184394836426, "Full-pretrain/Step": 2240, "Full-pretrain/Step Time": 17.626850962638855} +{"Full-pretrain/Learning Rate": 4.4688646668389935e-05, "Full-pretrain/Loss": 2.0452446937561035, "Full-pretrain/Loss (Raw)": 2.105841636657715, "Full-pretrain/Step": 2241, "Full-pretrain/Step Time": 17.61973504535854} +{"Full-pretrain/Learning Rate": 4.468341303173394e-05, "Full-pretrain/Loss": 2.0503201484680176, "Full-pretrain/Loss (Raw)": 2.366295576095581, "Full-pretrain/Step": 2242, "Full-pretrain/Step Time": 17.61760315299034} +{"Full-pretrain/Learning Rate": 4.4678177124603174e-05, "Full-pretrain/Loss": 2.049048900604248, "Full-pretrain/Loss (Raw)": 2.009460687637329, "Full-pretrain/Step": 2243, "Full-pretrain/Step Time": 17.621377300471067} +{"Full-pretrain/Learning Rate": 4.46729389476016e-05, "Full-pretrain/Loss": 2.0477285385131836, "Full-pretrain/Loss (Raw)": 2.0801234245300293, "Full-pretrain/Step": 2244, "Full-pretrain/Step Time": 17.6220675483346} +{"Full-pretrain/Learning Rate": 4.466769850133342e-05, "Full-pretrain/Loss": 2.0477356910705566, "Full-pretrain/Loss (Raw)": 2.238304615020752, "Full-pretrain/Step": 2245, "Full-pretrain/Step Time": 17.623519629240036} +{"Full-pretrain/Learning Rate": 4.466245578640313e-05, "Full-pretrain/Loss": 2.0362257957458496, "Full-pretrain/Loss (Raw)": 1.7738627195358276, "Full-pretrain/Step": 2246, "Full-pretrain/Step Time": 17.624589677900076} +{"Full-pretrain/Learning Rate": 4.465721080341547e-05, "Full-pretrain/Loss": 2.0451033115386963, "Full-pretrain/Loss (Raw)": 2.1462087631225586, "Full-pretrain/Step": 2247, "Full-pretrain/Step Time": 17.622252279892564} +{"Full-pretrain/Learning Rate": 4.465196355297546e-05, "Full-pretrain/Loss": 2.035616159439087, "Full-pretrain/Loss (Raw)": 1.737889289855957, "Full-pretrain/Step": 2248, "Full-pretrain/Step Time": 17.619552878662944} +{"Full-pretrain/Learning Rate": 4.464671403568836e-05, "Full-pretrain/Loss": 2.0443222522735596, "Full-pretrain/Loss (Raw)": 2.1070756912231445, "Full-pretrain/Step": 2249, "Full-pretrain/Step Time": 17.624085530638695} +{"Full-pretrain/Learning Rate": 4.46414622521597e-05, "Full-pretrain/Loss": 2.0468273162841797, "Full-pretrain/Loss (Raw)": 2.117914915084839, "Full-pretrain/Step": 2250, "Full-pretrain/Step Time": 17.622460899874568} +{"Full-pretrain/Learning Rate": 4.463620820299528e-05, "Full-pretrain/Loss": 2.0488929748535156, "Full-pretrain/Loss (Raw)": 2.0414626598358154, "Full-pretrain/Step": 2251, "Full-pretrain/Step Time": 17.62527940236032} +{"Full-pretrain/Learning Rate": 4.463095188880113e-05, "Full-pretrain/Loss": 2.043919324874878, "Full-pretrain/Loss (Raw)": 1.8400139808654785, "Full-pretrain/Step": 2252, "Full-pretrain/Step Time": 17.626666015014052} +{"Full-pretrain/Learning Rate": 4.462569331018359e-05, "Full-pretrain/Loss": 2.038952589035034, "Full-pretrain/Loss (Raw)": 1.944258451461792, "Full-pretrain/Step": 2253, "Full-pretrain/Step Time": 17.632726173847914} +{"Full-pretrain/Learning Rate": 4.4620432467749217e-05, "Full-pretrain/Loss": 2.0386383533477783, "Full-pretrain/Loss (Raw)": 1.9678281545639038, "Full-pretrain/Step": 2254, "Full-pretrain/Step Time": 17.630426716059446} +{"Full-pretrain/Learning Rate": 4.461516936210486e-05, "Full-pretrain/Loss": 2.039064884185791, "Full-pretrain/Loss (Raw)": 2.064239740371704, "Full-pretrain/Step": 2255, "Full-pretrain/Step Time": 17.62552348151803} +{"Full-pretrain/Learning Rate": 4.460990399385761e-05, "Full-pretrain/Loss": 2.039849042892456, "Full-pretrain/Loss (Raw)": 2.201637029647827, "Full-pretrain/Step": 2256, "Full-pretrain/Step Time": 17.622070057317615} +{"Full-pretrain/Learning Rate": 4.4604636363614813e-05, "Full-pretrain/Loss": 2.0507829189300537, "Full-pretrain/Loss (Raw)": 2.335843086242676, "Full-pretrain/Step": 2257, "Full-pretrain/Step Time": 17.628512183204293} +{"Full-pretrain/Learning Rate": 4.4599366471984104e-05, "Full-pretrain/Loss": 2.0362443923950195, "Full-pretrain/Loss (Raw)": 2.0720553398132324, "Full-pretrain/Step": 2258, "Full-pretrain/Step Time": 17.62733267247677} +{"Full-pretrain/Learning Rate": 4.459409431957337e-05, "Full-pretrain/Loss": 2.04201078414917, "Full-pretrain/Loss (Raw)": 2.145799160003662, "Full-pretrain/Step": 2259, "Full-pretrain/Step Time": 17.6206593234092} +{"Full-pretrain/Learning Rate": 4.4588819906990745e-05, "Full-pretrain/Loss": 2.0500564575195312, "Full-pretrain/Loss (Raw)": 2.099945545196533, "Full-pretrain/Step": 2260, "Full-pretrain/Step Time": 17.62820973061025} +{"Full-pretrain/Learning Rate": 4.4583543234844616e-05, "Full-pretrain/Loss": 2.052929639816284, "Full-pretrain/Loss (Raw)": 2.0373711585998535, "Full-pretrain/Step": 2261, "Full-pretrain/Step Time": 17.63326996192336} +{"Full-pretrain/Learning Rate": 4.457826430374366e-05, "Full-pretrain/Loss": 2.053304672241211, "Full-pretrain/Loss (Raw)": 1.9510846138000488, "Full-pretrain/Step": 2262, "Full-pretrain/Step Time": 17.63156154938042} +{"Full-pretrain/Learning Rate": 4.45729831142968e-05, "Full-pretrain/Loss": 2.066803216934204, "Full-pretrain/Loss (Raw)": 2.0457863807678223, "Full-pretrain/Step": 2263, "Full-pretrain/Step Time": 17.630757000297308} +{"Full-pretrain/Learning Rate": 4.456769966711321e-05, "Full-pretrain/Loss": 2.0676145553588867, "Full-pretrain/Loss (Raw)": 1.997513771057129, "Full-pretrain/Step": 2264, "Full-pretrain/Step Time": 17.629013745114207} +{"Full-pretrain/Learning Rate": 4.456241396280234e-05, "Full-pretrain/Loss": 2.0629868507385254, "Full-pretrain/Loss (Raw)": 2.0077781677246094, "Full-pretrain/Step": 2265, "Full-pretrain/Step Time": 17.633943924680352} +{"Full-pretrain/Learning Rate": 4.4557126001973904e-05, "Full-pretrain/Loss": 2.0575613975524902, "Full-pretrain/Loss (Raw)": 2.195720672607422, "Full-pretrain/Step": 2266, "Full-pretrain/Step Time": 17.63914893567562} +{"Full-pretrain/Learning Rate": 4.455183578523785e-05, "Full-pretrain/Loss": 2.0629589557647705, "Full-pretrain/Loss (Raw)": 2.204791307449341, "Full-pretrain/Step": 2267, "Full-pretrain/Step Time": 17.64028475061059} +{"Full-pretrain/Learning Rate": 4.4546543313204414e-05, "Full-pretrain/Loss": 2.0761618614196777, "Full-pretrain/Loss (Raw)": 2.1019349098205566, "Full-pretrain/Step": 2268, "Full-pretrain/Step Time": 17.640251936390996} +{"Full-pretrain/Learning Rate": 4.454124858648407e-05, "Full-pretrain/Loss": 2.0739126205444336, "Full-pretrain/Loss (Raw)": 2.0145602226257324, "Full-pretrain/Step": 2269, "Full-pretrain/Step Time": 17.63865969143808} +{"Full-pretrain/Learning Rate": 4.453595160568757e-05, "Full-pretrain/Loss": 2.0742859840393066, "Full-pretrain/Loss (Raw)": 2.312537670135498, "Full-pretrain/Step": 2270, "Full-pretrain/Step Time": 17.644679356366396} +{"Full-pretrain/Learning Rate": 4.453065237142592e-05, "Full-pretrain/Loss": 2.0741689205169678, "Full-pretrain/Loss (Raw)": 2.1659514904022217, "Full-pretrain/Step": 2271, "Full-pretrain/Step Time": 17.64499015547335} +{"Full-pretrain/Learning Rate": 4.452535088431038e-05, "Full-pretrain/Loss": 2.0792980194091797, "Full-pretrain/Loss (Raw)": 2.1064398288726807, "Full-pretrain/Step": 2272, "Full-pretrain/Step Time": 17.64137444831431} +{"Full-pretrain/Learning Rate": 4.452004714495248e-05, "Full-pretrain/Loss": 2.0713388919830322, "Full-pretrain/Loss (Raw)": 1.851161241531372, "Full-pretrain/Step": 2273, "Full-pretrain/Step Time": 17.65144918486476} +{"Full-pretrain/Learning Rate": 4.4514741153964e-05, "Full-pretrain/Loss": 2.060267448425293, "Full-pretrain/Loss (Raw)": 2.0119991302490234, "Full-pretrain/Step": 2274, "Full-pretrain/Step Time": 17.653256652876735} +{"Full-pretrain/Learning Rate": 4.4509432911956985e-05, "Full-pretrain/Loss": 2.0649991035461426, "Full-pretrain/Loss (Raw)": 2.1608810424804688, "Full-pretrain/Step": 2275, "Full-pretrain/Step Time": 17.65333593636751} +{"Full-pretrain/Learning Rate": 4.450412241954374e-05, "Full-pretrain/Loss": 2.0520544052124023, "Full-pretrain/Loss (Raw)": 1.6658905744552612, "Full-pretrain/Step": 2276, "Full-pretrain/Step Time": 17.653985645622015} +{"Full-pretrain/Learning Rate": 4.449880967733683e-05, "Full-pretrain/Loss": 2.0470681190490723, "Full-pretrain/Loss (Raw)": 2.0787458419799805, "Full-pretrain/Step": 2277, "Full-pretrain/Step Time": 17.656736582517624} +{"Full-pretrain/Learning Rate": 4.449349468594908e-05, "Full-pretrain/Loss": 2.0552704334259033, "Full-pretrain/Loss (Raw)": 2.036332607269287, "Full-pretrain/Step": 2278, "Full-pretrain/Step Time": 17.65590782277286} +{"Full-pretrain/Learning Rate": 4.448817744599356e-05, "Full-pretrain/Loss": 2.0595455169677734, "Full-pretrain/Loss (Raw)": 2.2830147743225098, "Full-pretrain/Step": 2279, "Full-pretrain/Step Time": 17.659664513543248} +{"Full-pretrain/Learning Rate": 4.4482857958083625e-05, "Full-pretrain/Loss": 2.0736334323883057, "Full-pretrain/Loss (Raw)": 2.1887006759643555, "Full-pretrain/Step": 2280, "Full-pretrain/Step Time": 17.658773871138692} +{"Full-pretrain/Learning Rate": 4.447753622283287e-05, "Full-pretrain/Loss": 2.0679123401641846, "Full-pretrain/Loss (Raw)": 1.9240014553070068, "Full-pretrain/Step": 2281, "Full-pretrain/Step Time": 17.658268017694354} +{"Full-pretrain/Learning Rate": 4.447221224085516e-05, "Full-pretrain/Loss": 2.063599109649658, "Full-pretrain/Loss (Raw)": 1.9798877239227295, "Full-pretrain/Step": 2282, "Full-pretrain/Step Time": 17.6566975787282} +{"Full-pretrain/Learning Rate": 4.4466886012764605e-05, "Full-pretrain/Loss": 2.0633578300476074, "Full-pretrain/Loss (Raw)": 2.0337448120117188, "Full-pretrain/Step": 2283, "Full-pretrain/Step Time": 17.662701403722167} +{"Full-pretrain/Learning Rate": 4.4461557539175594e-05, "Full-pretrain/Loss": 2.0664243698120117, "Full-pretrain/Loss (Raw)": 1.938143014907837, "Full-pretrain/Step": 2284, "Full-pretrain/Step Time": 17.658346850425005} +{"Full-pretrain/Learning Rate": 4.445622682070275e-05, "Full-pretrain/Loss": 2.0699429512023926, "Full-pretrain/Loss (Raw)": 2.056854724884033, "Full-pretrain/Step": 2285, "Full-pretrain/Step Time": 17.660288540646434} +{"Full-pretrain/Learning Rate": 4.445089385796099e-05, "Full-pretrain/Loss": 2.088148832321167, "Full-pretrain/Loss (Raw)": 2.5504095554351807, "Full-pretrain/Step": 2286, "Full-pretrain/Step Time": 17.65265880152583} +{"Full-pretrain/Learning Rate": 4.4445558651565457e-05, "Full-pretrain/Loss": 2.084620237350464, "Full-pretrain/Loss (Raw)": 1.9513310194015503, "Full-pretrain/Step": 2287, "Full-pretrain/Step Time": 17.6615148819983} +{"Full-pretrain/Learning Rate": 4.444022120213157e-05, "Full-pretrain/Loss": 2.070164918899536, "Full-pretrain/Loss (Raw)": 1.7390661239624023, "Full-pretrain/Step": 2288, "Full-pretrain/Step Time": 17.657066840678453} +{"Full-pretrain/Learning Rate": 4.4434881510274994e-05, "Full-pretrain/Loss": 2.0596020221710205, "Full-pretrain/Loss (Raw)": 1.9978327751159668, "Full-pretrain/Step": 2289, "Full-pretrain/Step Time": 17.658350065350533} +{"Full-pretrain/Learning Rate": 4.442953957661167e-05, "Full-pretrain/Loss": 2.0547001361846924, "Full-pretrain/Loss (Raw)": 1.91519033908844, "Full-pretrain/Step": 2290, "Full-pretrain/Step Time": 17.65539601072669} +{"Full-pretrain/Learning Rate": 4.4424195401757776e-05, "Full-pretrain/Loss": 2.0470032691955566, "Full-pretrain/Loss (Raw)": 1.8994982242584229, "Full-pretrain/Step": 2291, "Full-pretrain/Step Time": 17.662361280992627} +{"Full-pretrain/Learning Rate": 4.441884898632977e-05, "Full-pretrain/Loss": 2.0470545291900635, "Full-pretrain/Loss (Raw)": 2.1015896797180176, "Full-pretrain/Step": 2292, "Full-pretrain/Step Time": 17.656878100708127} +{"Full-pretrain/Learning Rate": 4.441350033094437e-05, "Full-pretrain/Loss": 2.043210029602051, "Full-pretrain/Loss (Raw)": 1.9143508672714233, "Full-pretrain/Step": 2293, "Full-pretrain/Step Time": 17.656791165471077} +{"Full-pretrain/Learning Rate": 4.440814943621852e-05, "Full-pretrain/Loss": 2.048783540725708, "Full-pretrain/Loss (Raw)": 2.1294336318969727, "Full-pretrain/Step": 2294, "Full-pretrain/Step Time": 17.6585673969239} +{"Full-pretrain/Learning Rate": 4.440279630276946e-05, "Full-pretrain/Loss": 2.04793643951416, "Full-pretrain/Loss (Raw)": 2.018669605255127, "Full-pretrain/Step": 2295, "Full-pretrain/Step Time": 17.669332422316074} +{"Full-pretrain/Learning Rate": 4.439744093121465e-05, "Full-pretrain/Loss": 2.0491549968719482, "Full-pretrain/Loss (Raw)": 2.03652024269104, "Full-pretrain/Step": 2296, "Full-pretrain/Step Time": 17.66549379006028} +{"Full-pretrain/Learning Rate": 4.439208332217186e-05, "Full-pretrain/Loss": 2.0450987815856934, "Full-pretrain/Loss (Raw)": 1.87796950340271, "Full-pretrain/Step": 2297, "Full-pretrain/Step Time": 17.670379880815744} +{"Full-pretrain/Learning Rate": 4.438672347625907e-05, "Full-pretrain/Loss": 2.039081335067749, "Full-pretrain/Loss (Raw)": 2.0031685829162598, "Full-pretrain/Step": 2298, "Full-pretrain/Step Time": 17.66376342996955} +{"Full-pretrain/Learning Rate": 4.4381361394094535e-05, "Full-pretrain/Loss": 2.0395877361297607, "Full-pretrain/Loss (Raw)": 2.2209949493408203, "Full-pretrain/Step": 2299, "Full-pretrain/Step Time": 17.667892053723335} +{"Full-pretrain/Learning Rate": 4.437599707629678e-05, "Full-pretrain/Loss": 2.036163568496704, "Full-pretrain/Loss (Raw)": 1.9923653602600098, "Full-pretrain/Step": 2300, "Full-pretrain/Step Time": 17.665294751524925} +{"Full-pretrain/Learning Rate": 4.437063052348457e-05, "Full-pretrain/Loss": 2.0366668701171875, "Full-pretrain/Loss (Raw)": 2.030662775039673, "Full-pretrain/Step": 2301, "Full-pretrain/Step Time": 17.664209689944983} +{"Full-pretrain/Learning Rate": 4.436526173627693e-05, "Full-pretrain/Loss": 2.025081157684326, "Full-pretrain/Loss (Raw)": 1.9417930841445923, "Full-pretrain/Step": 2302, "Full-pretrain/Step Time": 17.667514303699136} +{"Full-pretrain/Learning Rate": 4.435989071529316e-05, "Full-pretrain/Loss": 2.0230154991149902, "Full-pretrain/Loss (Raw)": 2.099853992462158, "Full-pretrain/Step": 2303, "Full-pretrain/Step Time": 17.67469915188849} +{"Full-pretrain/Learning Rate": 4.43545174611528e-05, "Full-pretrain/Loss": 2.0189690589904785, "Full-pretrain/Loss (Raw)": 1.9769551753997803, "Full-pretrain/Step": 2304, "Full-pretrain/Step Time": 17.6712698135525} +{"Full-pretrain/Learning Rate": 4.434914197447565e-05, "Full-pretrain/Loss": 2.0234556198120117, "Full-pretrain/Loss (Raw)": 1.9947268962860107, "Full-pretrain/Step": 2305, "Full-pretrain/Step Time": 17.67287871427834} +{"Full-pretrain/Learning Rate": 4.4343764255881784e-05, "Full-pretrain/Loss": 2.0237512588500977, "Full-pretrain/Loss (Raw)": 2.021458625793457, "Full-pretrain/Step": 2306, "Full-pretrain/Step Time": 17.671002384275198} +{"Full-pretrain/Learning Rate": 4.433838430599149e-05, "Full-pretrain/Loss": 2.01401948928833, "Full-pretrain/Loss (Raw)": 1.8494634628295898, "Full-pretrain/Step": 2307, "Full-pretrain/Step Time": 17.67249070852995} +{"Full-pretrain/Learning Rate": 4.433300212542537e-05, "Full-pretrain/Loss": 2.013154983520508, "Full-pretrain/Loss (Raw)": 1.638235092163086, "Full-pretrain/Step": 2308, "Full-pretrain/Step Time": 17.66988653689623} +{"Full-pretrain/Learning Rate": 4.432761771480426e-05, "Full-pretrain/Loss": 2.014247417449951, "Full-pretrain/Loss (Raw)": 2.1136953830718994, "Full-pretrain/Step": 2309, "Full-pretrain/Step Time": 17.67750750295818} +{"Full-pretrain/Learning Rate": 4.4322231074749227e-05, "Full-pretrain/Loss": 2.0198159217834473, "Full-pretrain/Loss (Raw)": 2.2145328521728516, "Full-pretrain/Step": 2310, "Full-pretrain/Step Time": 17.672750111669302} +{"Full-pretrain/Learning Rate": 4.431684220588163e-05, "Full-pretrain/Loss": 2.020444869995117, "Full-pretrain/Loss (Raw)": 2.3031387329101562, "Full-pretrain/Step": 2311, "Full-pretrain/Step Time": 17.67504519596696} +{"Full-pretrain/Learning Rate": 4.4311451108823076e-05, "Full-pretrain/Loss": 2.0123064517974854, "Full-pretrain/Loss (Raw)": 1.928266167640686, "Full-pretrain/Step": 2312, "Full-pretrain/Step Time": 17.673936519771814} +{"Full-pretrain/Learning Rate": 4.4306057784195423e-05, "Full-pretrain/Loss": 2.015742540359497, "Full-pretrain/Loss (Raw)": 2.033953905105591, "Full-pretrain/Step": 2313, "Full-pretrain/Step Time": 17.675696402788162} +{"Full-pretrain/Learning Rate": 4.430066223262079e-05, "Full-pretrain/Loss": 2.0252366065979004, "Full-pretrain/Loss (Raw)": 2.2836949825286865, "Full-pretrain/Step": 2314, "Full-pretrain/Step Time": 17.680179780349135} +{"Full-pretrain/Learning Rate": 4.4295264454721544e-05, "Full-pretrain/Loss": 2.024348735809326, "Full-pretrain/Loss (Raw)": 2.005338191986084, "Full-pretrain/Step": 2315, "Full-pretrain/Step Time": 17.673562424257398} +{"Full-pretrain/Learning Rate": 4.4289864451120335e-05, "Full-pretrain/Loss": 2.0212278366088867, "Full-pretrain/Loss (Raw)": 1.8382689952850342, "Full-pretrain/Step": 2316, "Full-pretrain/Step Time": 17.673162903636694} +{"Full-pretrain/Learning Rate": 4.4284462222440036e-05, "Full-pretrain/Loss": 2.022214412689209, "Full-pretrain/Loss (Raw)": 2.0884270668029785, "Full-pretrain/Step": 2317, "Full-pretrain/Step Time": 17.676989363506436} +{"Full-pretrain/Learning Rate": 4.427905776930379e-05, "Full-pretrain/Loss": 2.0065622329711914, "Full-pretrain/Loss (Raw)": 2.0495409965515137, "Full-pretrain/Step": 2318, "Full-pretrain/Step Time": 17.6701039634645} +{"Full-pretrain/Learning Rate": 4.4273651092335016e-05, "Full-pretrain/Loss": 2.0103728771209717, "Full-pretrain/Loss (Raw)": 2.073276996612549, "Full-pretrain/Step": 2319, "Full-pretrain/Step Time": 17.674108857288957} +{"Full-pretrain/Learning Rate": 4.426824219215736e-05, "Full-pretrain/Loss": 2.017308473587036, "Full-pretrain/Loss (Raw)": 1.9609990119934082, "Full-pretrain/Step": 2320, "Full-pretrain/Step Time": 17.676979713141918} +{"Full-pretrain/Learning Rate": 4.426283106939474e-05, "Full-pretrain/Loss": 2.0196948051452637, "Full-pretrain/Loss (Raw)": 2.074202537536621, "Full-pretrain/Step": 2321, "Full-pretrain/Step Time": 17.68152728304267} +{"Full-pretrain/Learning Rate": 4.4257417724671314e-05, "Full-pretrain/Loss": 2.0217432975769043, "Full-pretrain/Loss (Raw)": 1.9807378053665161, "Full-pretrain/Step": 2322, "Full-pretrain/Step Time": 17.677503429353237} +{"Full-pretrain/Learning Rate": 4.425200215861153e-05, "Full-pretrain/Loss": 2.019423007965088, "Full-pretrain/Loss (Raw)": 1.8252466917037964, "Full-pretrain/Step": 2323, "Full-pretrain/Step Time": 17.67571296170354} +{"Full-pretrain/Learning Rate": 4.424658437184006e-05, "Full-pretrain/Loss": 2.015383005142212, "Full-pretrain/Loss (Raw)": 1.9723122119903564, "Full-pretrain/Step": 2324, "Full-pretrain/Step Time": 17.682152215391397} +{"Full-pretrain/Learning Rate": 4.424116436498185e-05, "Full-pretrain/Loss": 2.016879081726074, "Full-pretrain/Loss (Raw)": 1.9622317552566528, "Full-pretrain/Step": 2325, "Full-pretrain/Step Time": 17.682700909674168} +{"Full-pretrain/Learning Rate": 4.423574213866208e-05, "Full-pretrain/Loss": 2.0148093700408936, "Full-pretrain/Loss (Raw)": 2.063194751739502, "Full-pretrain/Step": 2326, "Full-pretrain/Step Time": 17.677941370755434} +{"Full-pretrain/Learning Rate": 4.423031769350623e-05, "Full-pretrain/Loss": 2.0143990516662598, "Full-pretrain/Loss (Raw)": 2.005545139312744, "Full-pretrain/Step": 2327, "Full-pretrain/Step Time": 17.67477273195982} +{"Full-pretrain/Learning Rate": 4.4224891030139986e-05, "Full-pretrain/Loss": 2.0134339332580566, "Full-pretrain/Loss (Raw)": 2.0056347846984863, "Full-pretrain/Step": 2328, "Full-pretrain/Step Time": 17.673783188685775} +{"Full-pretrain/Learning Rate": 4.421946214918932e-05, "Full-pretrain/Loss": 2.006680727005005, "Full-pretrain/Loss (Raw)": 1.6618671417236328, "Full-pretrain/Step": 2329, "Full-pretrain/Step Time": 17.677574226632714} +{"Full-pretrain/Learning Rate": 4.4214031051280444e-05, "Full-pretrain/Loss": 2.0109708309173584, "Full-pretrain/Loss (Raw)": 2.140446662902832, "Full-pretrain/Step": 2330, "Full-pretrain/Step Time": 17.672875678166747} +{"Full-pretrain/Learning Rate": 4.4208597737039845e-05, "Full-pretrain/Loss": 2.0037028789520264, "Full-pretrain/Loss (Raw)": 1.9884216785430908, "Full-pretrain/Step": 2331, "Full-pretrain/Step Time": 17.66995500586927} +{"Full-pretrain/Learning Rate": 4.420316220709424e-05, "Full-pretrain/Loss": 1.9968721866607666, "Full-pretrain/Loss (Raw)": 1.7737840414047241, "Full-pretrain/Step": 2332, "Full-pretrain/Step Time": 17.66682681813836} +{"Full-pretrain/Learning Rate": 4.419772446207063e-05, "Full-pretrain/Loss": 1.9882855415344238, "Full-pretrain/Loss (Raw)": 1.755894422531128, "Full-pretrain/Step": 2333, "Full-pretrain/Step Time": 17.669099347665906} +{"Full-pretrain/Learning Rate": 4.4192284502596245e-05, "Full-pretrain/Loss": 1.992088794708252, "Full-pretrain/Loss (Raw)": 2.0634918212890625, "Full-pretrain/Step": 2334, "Full-pretrain/Step Time": 17.66804563254118} +{"Full-pretrain/Learning Rate": 4.41868423292986e-05, "Full-pretrain/Loss": 1.9879080057144165, "Full-pretrain/Loss (Raw)": 1.9660714864730835, "Full-pretrain/Step": 2335, "Full-pretrain/Step Time": 17.671835768967867} +{"Full-pretrain/Learning Rate": 4.418139794280541e-05, "Full-pretrain/Loss": 1.9931414127349854, "Full-pretrain/Loss (Raw)": 2.1444239616394043, "Full-pretrain/Step": 2336, "Full-pretrain/Step Time": 17.66766571626067} +{"Full-pretrain/Learning Rate": 4.4175951343744725e-05, "Full-pretrain/Loss": 1.9956672191619873, "Full-pretrain/Loss (Raw)": 2.0755529403686523, "Full-pretrain/Step": 2337, "Full-pretrain/Step Time": 17.678870420902967} +{"Full-pretrain/Learning Rate": 4.417050253274479e-05, "Full-pretrain/Loss": 1.993710994720459, "Full-pretrain/Loss (Raw)": 1.958857774734497, "Full-pretrain/Step": 2338, "Full-pretrain/Step Time": 17.67736637406051} +{"Full-pretrain/Learning Rate": 4.4165051510434124e-05, "Full-pretrain/Loss": 2.001436710357666, "Full-pretrain/Loss (Raw)": 2.0966901779174805, "Full-pretrain/Step": 2339, "Full-pretrain/Step Time": 17.67368347942829} +{"Full-pretrain/Learning Rate": 4.41595982774415e-05, "Full-pretrain/Loss": 2.0157341957092285, "Full-pretrain/Loss (Raw)": 2.095754623413086, "Full-pretrain/Step": 2340, "Full-pretrain/Step Time": 17.670624354854226} +{"Full-pretrain/Learning Rate": 4.4154142834395954e-05, "Full-pretrain/Loss": 2.0102152824401855, "Full-pretrain/Loss (Raw)": 1.937085747718811, "Full-pretrain/Step": 2341, "Full-pretrain/Step Time": 17.677008885890245} +{"Full-pretrain/Learning Rate": 4.414868518192675e-05, "Full-pretrain/Loss": 2.0138354301452637, "Full-pretrain/Loss (Raw)": 2.330378293991089, "Full-pretrain/Step": 2342, "Full-pretrain/Step Time": 17.678836973384023} +{"Full-pretrain/Learning Rate": 4.414322532066345e-05, "Full-pretrain/Loss": 1.999495029449463, "Full-pretrain/Loss (Raw)": 1.8442425727844238, "Full-pretrain/Step": 2343, "Full-pretrain/Step Time": 17.679041726514697} +{"Full-pretrain/Learning Rate": 4.4137763251235835e-05, "Full-pretrain/Loss": 1.991746187210083, "Full-pretrain/Loss (Raw)": 1.6803075075149536, "Full-pretrain/Step": 2344, "Full-pretrain/Step Time": 17.674780743196607} +{"Full-pretrain/Learning Rate": 4.413229897427396e-05, "Full-pretrain/Loss": 1.9874001741409302, "Full-pretrain/Loss (Raw)": 1.894882082939148, "Full-pretrain/Step": 2345, "Full-pretrain/Step Time": 17.684335865080357} +{"Full-pretrain/Learning Rate": 4.412683249040811e-05, "Full-pretrain/Loss": 1.9882969856262207, "Full-pretrain/Loss (Raw)": 2.312392234802246, "Full-pretrain/Step": 2346, "Full-pretrain/Step Time": 17.67852633446455} +{"Full-pretrain/Learning Rate": 4.4121363800268854e-05, "Full-pretrain/Loss": 1.9952962398529053, "Full-pretrain/Loss (Raw)": 2.229311466217041, "Full-pretrain/Step": 2347, "Full-pretrain/Step Time": 17.682646790519357} +{"Full-pretrain/Learning Rate": 4.411589290448701e-05, "Full-pretrain/Loss": 1.9956564903259277, "Full-pretrain/Loss (Raw)": 1.8497976064682007, "Full-pretrain/Step": 2348, "Full-pretrain/Step Time": 17.681215258315206} +{"Full-pretrain/Learning Rate": 4.4110419803693635e-05, "Full-pretrain/Loss": 1.9885462522506714, "Full-pretrain/Loss (Raw)": 1.860903263092041, "Full-pretrain/Step": 2349, "Full-pretrain/Step Time": 17.687779784202576} +{"Full-pretrain/Learning Rate": 4.4104944498520054e-05, "Full-pretrain/Loss": 1.9898823499679565, "Full-pretrain/Loss (Raw)": 2.092296600341797, "Full-pretrain/Step": 2350, "Full-pretrain/Step Time": 17.682241577655077} +{"Full-pretrain/Learning Rate": 4.4099466989597836e-05, "Full-pretrain/Loss": 1.9905219078063965, "Full-pretrain/Loss (Raw)": 2.093743324279785, "Full-pretrain/Step": 2351, "Full-pretrain/Step Time": 17.68472490645945} +{"Full-pretrain/Learning Rate": 4.409398727755882e-05, "Full-pretrain/Loss": 1.997637391090393, "Full-pretrain/Loss (Raw)": 2.1886940002441406, "Full-pretrain/Step": 2352, "Full-pretrain/Step Time": 17.678523326292634} +{"Full-pretrain/Learning Rate": 4.408850536303507e-05, "Full-pretrain/Loss": 1.992748498916626, "Full-pretrain/Loss (Raw)": 1.9177556037902832, "Full-pretrain/Step": 2353, "Full-pretrain/Step Time": 17.679978977888823} +{"Full-pretrain/Learning Rate": 4.4083021246658944e-05, "Full-pretrain/Loss": 1.9914511442184448, "Full-pretrain/Loss (Raw)": 1.93922758102417, "Full-pretrain/Step": 2354, "Full-pretrain/Step Time": 17.67284954339266} +{"Full-pretrain/Learning Rate": 4.4077534929063025e-05, "Full-pretrain/Loss": 1.9838016033172607, "Full-pretrain/Loss (Raw)": 1.580458164215088, "Full-pretrain/Step": 2355, "Full-pretrain/Step Time": 17.671660624444485} +{"Full-pretrain/Learning Rate": 4.4072046410880145e-05, "Full-pretrain/Loss": 1.9851605892181396, "Full-pretrain/Loss (Raw)": 2.015803813934326, "Full-pretrain/Step": 2356, "Full-pretrain/Step Time": 17.669151527807117} +{"Full-pretrain/Learning Rate": 4.406655569274342e-05, "Full-pretrain/Loss": 1.9884518384933472, "Full-pretrain/Loss (Raw)": 2.067547082901001, "Full-pretrain/Step": 2357, "Full-pretrain/Step Time": 17.6680867690593} +{"Full-pretrain/Learning Rate": 4.40610627752862e-05, "Full-pretrain/Loss": 1.9881179332733154, "Full-pretrain/Loss (Raw)": 2.05250883102417, "Full-pretrain/Step": 2358, "Full-pretrain/Step Time": 17.66656212694943} +{"Full-pretrain/Learning Rate": 4.405556765914208e-05, "Full-pretrain/Loss": 1.990400791168213, "Full-pretrain/Loss (Raw)": 2.0785980224609375, "Full-pretrain/Step": 2359, "Full-pretrain/Step Time": 17.670809926465154} +{"Full-pretrain/Learning Rate": 4.405007034494494e-05, "Full-pretrain/Loss": 1.9949369430541992, "Full-pretrain/Loss (Raw)": 2.1507906913757324, "Full-pretrain/Step": 2360, "Full-pretrain/Step Time": 17.674380026757717} +{"Full-pretrain/Learning Rate": 4.404457083332886e-05, "Full-pretrain/Loss": 2.0036420822143555, "Full-pretrain/Loss (Raw)": 1.9404377937316895, "Full-pretrain/Step": 2361, "Full-pretrain/Step Time": 17.675304763019085} +{"Full-pretrain/Learning Rate": 4.4039069124928244e-05, "Full-pretrain/Loss": 2.004059314727783, "Full-pretrain/Loss (Raw)": 2.15378999710083, "Full-pretrain/Step": 2362, "Full-pretrain/Step Time": 17.676732188090682} +{"Full-pretrain/Learning Rate": 4.4033565220377694e-05, "Full-pretrain/Loss": 2.001328945159912, "Full-pretrain/Loss (Raw)": 1.901058554649353, "Full-pretrain/Step": 2363, "Full-pretrain/Step Time": 17.668312456458807} +{"Full-pretrain/Learning Rate": 4.402805912031208e-05, "Full-pretrain/Loss": 2.016143321990967, "Full-pretrain/Loss (Raw)": 2.247838258743286, "Full-pretrain/Step": 2364, "Full-pretrain/Step Time": 17.67096154205501} +{"Full-pretrain/Learning Rate": 4.4022550825366526e-05, "Full-pretrain/Loss": 2.021742820739746, "Full-pretrain/Loss (Raw)": 1.935082197189331, "Full-pretrain/Step": 2365, "Full-pretrain/Step Time": 17.66898100450635} +{"Full-pretrain/Learning Rate": 4.401704033617643e-05, "Full-pretrain/Loss": 2.0298209190368652, "Full-pretrain/Loss (Raw)": 2.3219921588897705, "Full-pretrain/Step": 2366, "Full-pretrain/Step Time": 17.672931343317032} +{"Full-pretrain/Learning Rate": 4.4011527653377415e-05, "Full-pretrain/Loss": 2.0351648330688477, "Full-pretrain/Loss (Raw)": 2.137070655822754, "Full-pretrain/Step": 2367, "Full-pretrain/Step Time": 17.672378607094288} +{"Full-pretrain/Learning Rate": 4.400601277760536e-05, "Full-pretrain/Loss": 2.031071662902832, "Full-pretrain/Loss (Raw)": 2.013439893722534, "Full-pretrain/Step": 2368, "Full-pretrain/Step Time": 17.664433693513274} +{"Full-pretrain/Learning Rate": 4.400049570949641e-05, "Full-pretrain/Loss": 2.029212474822998, "Full-pretrain/Loss (Raw)": 2.016062021255493, "Full-pretrain/Step": 2369, "Full-pretrain/Step Time": 17.66694810986519} +{"Full-pretrain/Learning Rate": 4.399497644968696e-05, "Full-pretrain/Loss": 2.0429086685180664, "Full-pretrain/Loss (Raw)": 2.3971402645111084, "Full-pretrain/Step": 2370, "Full-pretrain/Step Time": 17.67093899101019} +{"Full-pretrain/Learning Rate": 4.398945499881366e-05, "Full-pretrain/Loss": 2.0392332077026367, "Full-pretrain/Loss (Raw)": 1.9790745973587036, "Full-pretrain/Step": 2371, "Full-pretrain/Step Time": 17.67449831403792} +{"Full-pretrain/Learning Rate": 4.3983931357513385e-05, "Full-pretrain/Loss": 2.040212631225586, "Full-pretrain/Loss (Raw)": 2.1270956993103027, "Full-pretrain/Step": 2372, "Full-pretrain/Step Time": 17.671878492459655} +{"Full-pretrain/Learning Rate": 4.3978405526423305e-05, "Full-pretrain/Loss": 2.046755790710449, "Full-pretrain/Loss (Raw)": 2.146470069885254, "Full-pretrain/Step": 2373, "Full-pretrain/Step Time": 17.666102956980467} +{"Full-pretrain/Learning Rate": 4.397287750618082e-05, "Full-pretrain/Loss": 2.0438222885131836, "Full-pretrain/Loss (Raw)": 2.236501932144165, "Full-pretrain/Step": 2374, "Full-pretrain/Step Time": 17.662043061107397} +{"Full-pretrain/Learning Rate": 4.3967347297423575e-05, "Full-pretrain/Loss": 2.0502266883850098, "Full-pretrain/Loss (Raw)": 2.0491762161254883, "Full-pretrain/Step": 2375, "Full-pretrain/Step Time": 17.66311872191727} +{"Full-pretrain/Learning Rate": 4.3961814900789495e-05, "Full-pretrain/Loss": 2.0585403442382812, "Full-pretrain/Loss (Raw)": 1.9463493824005127, "Full-pretrain/Step": 2376, "Full-pretrain/Step Time": 17.669638130813837} +{"Full-pretrain/Learning Rate": 4.395628031691672e-05, "Full-pretrain/Loss": 2.068366527557373, "Full-pretrain/Loss (Raw)": 2.2093207836151123, "Full-pretrain/Step": 2377, "Full-pretrain/Step Time": 17.66243868507445} +{"Full-pretrain/Learning Rate": 4.395074354644368e-05, "Full-pretrain/Loss": 2.065321207046509, "Full-pretrain/Loss (Raw)": 2.214944362640381, "Full-pretrain/Step": 2378, "Full-pretrain/Step Time": 17.667997295036912} +{"Full-pretrain/Learning Rate": 4.3945204590009024e-05, "Full-pretrain/Loss": 2.0600645542144775, "Full-pretrain/Loss (Raw)": 2.061094045639038, "Full-pretrain/Step": 2379, "Full-pretrain/Step Time": 17.665121791884303} +{"Full-pretrain/Learning Rate": 4.3939663448251687e-05, "Full-pretrain/Loss": 2.0695197582244873, "Full-pretrain/Loss (Raw)": 2.1523642539978027, "Full-pretrain/Step": 2380, "Full-pretrain/Step Time": 17.662474401295185} +{"Full-pretrain/Learning Rate": 4.393412012181082e-05, "Full-pretrain/Loss": 2.083125591278076, "Full-pretrain/Loss (Raw)": 2.296292304992676, "Full-pretrain/Step": 2381, "Full-pretrain/Step Time": 17.653003960847855} +{"Full-pretrain/Learning Rate": 4.3928574611325844e-05, "Full-pretrain/Loss": 2.0818185806274414, "Full-pretrain/Loss (Raw)": 2.0504753589630127, "Full-pretrain/Step": 2382, "Full-pretrain/Step Time": 17.653945740312338} +{"Full-pretrain/Learning Rate": 4.392302691743645e-05, "Full-pretrain/Loss": 2.0758767127990723, "Full-pretrain/Loss (Raw)": 1.9035998582839966, "Full-pretrain/Step": 2383, "Full-pretrain/Step Time": 17.657479040324688} +{"Full-pretrain/Learning Rate": 4.3917477040782554e-05, "Full-pretrain/Loss": 2.062537670135498, "Full-pretrain/Loss (Raw)": 1.761847734451294, "Full-pretrain/Step": 2384, "Full-pretrain/Step Time": 17.656214617192745} +{"Full-pretrain/Learning Rate": 4.3911924982004315e-05, "Full-pretrain/Loss": 2.067363739013672, "Full-pretrain/Loss (Raw)": 2.0721840858459473, "Full-pretrain/Step": 2385, "Full-pretrain/Step Time": 17.648128755390644} +{"Full-pretrain/Learning Rate": 4.3906370741742186e-05, "Full-pretrain/Loss": 2.065049171447754, "Full-pretrain/Loss (Raw)": 1.8651667833328247, "Full-pretrain/Step": 2386, "Full-pretrain/Step Time": 17.652151074260473} +{"Full-pretrain/Learning Rate": 4.390081432063683e-05, "Full-pretrain/Loss": 2.079845905303955, "Full-pretrain/Loss (Raw)": 2.053950071334839, "Full-pretrain/Step": 2387, "Full-pretrain/Step Time": 17.656061308458447} +{"Full-pretrain/Learning Rate": 4.389525571932919e-05, "Full-pretrain/Loss": 2.0768768787384033, "Full-pretrain/Loss (Raw)": 1.92079496383667, "Full-pretrain/Step": 2388, "Full-pretrain/Step Time": 17.653251763433218} +{"Full-pretrain/Learning Rate": 4.388969493846044e-05, "Full-pretrain/Loss": 2.0718202590942383, "Full-pretrain/Loss (Raw)": 1.9057366847991943, "Full-pretrain/Step": 2389, "Full-pretrain/Step Time": 17.64880720153451} +{"Full-pretrain/Learning Rate": 4.388413197867202e-05, "Full-pretrain/Loss": 2.066694498062134, "Full-pretrain/Loss (Raw)": 1.8884800672531128, "Full-pretrain/Step": 2390, "Full-pretrain/Step Time": 17.648567320778966} +{"Full-pretrain/Learning Rate": 4.3878566840605604e-05, "Full-pretrain/Loss": 2.0600075721740723, "Full-pretrain/Loss (Raw)": 1.8646214008331299, "Full-pretrain/Step": 2391, "Full-pretrain/Step Time": 17.648433655500412} +{"Full-pretrain/Learning Rate": 4.387299952490315e-05, "Full-pretrain/Loss": 2.054086208343506, "Full-pretrain/Loss (Raw)": 1.9613091945648193, "Full-pretrain/Step": 2392, "Full-pretrain/Step Time": 17.64631556160748} +{"Full-pretrain/Learning Rate": 4.3867430032206823e-05, "Full-pretrain/Loss": 2.0585875511169434, "Full-pretrain/Loss (Raw)": 2.0844688415527344, "Full-pretrain/Step": 2393, "Full-pretrain/Step Time": 17.639904079958797} +{"Full-pretrain/Learning Rate": 4.386185836315908e-05, "Full-pretrain/Loss": 2.0439531803131104, "Full-pretrain/Loss (Raw)": 1.6854963302612305, "Full-pretrain/Step": 2394, "Full-pretrain/Step Time": 17.63833268545568} +{"Full-pretrain/Learning Rate": 4.3856284518402594e-05, "Full-pretrain/Loss": 2.0342233180999756, "Full-pretrain/Loss (Raw)": 1.5897033214569092, "Full-pretrain/Step": 2395, "Full-pretrain/Step Time": 17.6415221337229} +{"Full-pretrain/Learning Rate": 4.385070849858033e-05, "Full-pretrain/Loss": 2.031653881072998, "Full-pretrain/Loss (Raw)": 2.165611982345581, "Full-pretrain/Step": 2396, "Full-pretrain/Step Time": 17.63698186725378} +{"Full-pretrain/Learning Rate": 4.3845130304335455e-05, "Full-pretrain/Loss": 2.0349488258361816, "Full-pretrain/Loss (Raw)": 2.0405287742614746, "Full-pretrain/Step": 2397, "Full-pretrain/Step Time": 17.635569859296083} +{"Full-pretrain/Learning Rate": 4.383954993631142e-05, "Full-pretrain/Loss": 2.0203394889831543, "Full-pretrain/Loss (Raw)": 1.8544890880584717, "Full-pretrain/Step": 2398, "Full-pretrain/Step Time": 17.62638962455094} +{"Full-pretrain/Learning Rate": 4.383396739515192e-05, "Full-pretrain/Loss": 2.0188710689544678, "Full-pretrain/Loss (Raw)": 2.0900843143463135, "Full-pretrain/Step": 2399, "Full-pretrain/Step Time": 17.625256951898336} +{"Full-pretrain/Learning Rate": 4.382838268150091e-05, "Full-pretrain/Loss": 2.018129348754883, "Full-pretrain/Loss (Raw)": 1.989697813987732, "Full-pretrain/Step": 2400, "Full-pretrain/Step Time": 17.627762023359537} +{"Full-pretrain/Learning Rate": 4.382279579600256e-05, "Full-pretrain/Loss": 2.0208382606506348, "Full-pretrain/Loss (Raw)": 2.1027605533599854, "Full-pretrain/Step": 2401, "Full-pretrain/Step Time": 17.62659828364849} +{"Full-pretrain/Learning Rate": 4.381720673930134e-05, "Full-pretrain/Loss": 2.0098068714141846, "Full-pretrain/Loss (Raw)": 2.044123888015747, "Full-pretrain/Step": 2402, "Full-pretrain/Step Time": 17.6240375302732} +{"Full-pretrain/Learning Rate": 4.381161551204194e-05, "Full-pretrain/Loss": 2.0058059692382812, "Full-pretrain/Loss (Raw)": 1.8510488271713257, "Full-pretrain/Step": 2403, "Full-pretrain/Step Time": 17.62590771354735} +{"Full-pretrain/Learning Rate": 4.3806022114869296e-05, "Full-pretrain/Loss": 2.0132036209106445, "Full-pretrain/Loss (Raw)": 2.363821506500244, "Full-pretrain/Step": 2404, "Full-pretrain/Step Time": 17.618995152413845} +{"Full-pretrain/Learning Rate": 4.3800426548428605e-05, "Full-pretrain/Loss": 2.0112435817718506, "Full-pretrain/Loss (Raw)": 2.083754062652588, "Full-pretrain/Step": 2405, "Full-pretrain/Step Time": 17.61794901266694} +{"Full-pretrain/Learning Rate": 4.379482881336532e-05, "Full-pretrain/Loss": 2.007291793823242, "Full-pretrain/Loss (Raw)": 2.110037326812744, "Full-pretrain/Step": 2406, "Full-pretrain/Step Time": 17.61934581398964} +{"Full-pretrain/Learning Rate": 4.3789228910325134e-05, "Full-pretrain/Loss": 2.0061845779418945, "Full-pretrain/Loss (Raw)": 2.0137548446655273, "Full-pretrain/Step": 2407, "Full-pretrain/Step Time": 17.61563828960061} +{"Full-pretrain/Learning Rate": 4.3783626839954005e-05, "Full-pretrain/Loss": 2.0071120262145996, "Full-pretrain/Loss (Raw)": 1.976026177406311, "Full-pretrain/Step": 2408, "Full-pretrain/Step Time": 17.622415935620666} +{"Full-pretrain/Learning Rate": 4.3778022602898116e-05, "Full-pretrain/Loss": 2.0023181438446045, "Full-pretrain/Loss (Raw)": 2.055917978286743, "Full-pretrain/Step": 2409, "Full-pretrain/Step Time": 17.622223243117332} +{"Full-pretrain/Learning Rate": 4.3772416199803924e-05, "Full-pretrain/Loss": 1.996841311454773, "Full-pretrain/Loss (Raw)": 2.0396785736083984, "Full-pretrain/Step": 2410, "Full-pretrain/Step Time": 17.618426205590367} +{"Full-pretrain/Learning Rate": 4.3766807631318106e-05, "Full-pretrain/Loss": 1.9929249286651611, "Full-pretrain/Loss (Raw)": 1.9357750415802002, "Full-pretrain/Step": 2411, "Full-pretrain/Step Time": 17.618884585797787} +{"Full-pretrain/Learning Rate": 4.376119689808764e-05, "Full-pretrain/Loss": 1.9903550148010254, "Full-pretrain/Loss (Raw)": 2.070124626159668, "Full-pretrain/Step": 2412, "Full-pretrain/Step Time": 17.620264997705817} +{"Full-pretrain/Learning Rate": 4.3755584000759695e-05, "Full-pretrain/Loss": 1.9885592460632324, "Full-pretrain/Loss (Raw)": 2.2388291358947754, "Full-pretrain/Step": 2413, "Full-pretrain/Step Time": 17.6209072265774} +{"Full-pretrain/Learning Rate": 4.3749968939981734e-05, "Full-pretrain/Loss": 1.990747332572937, "Full-pretrain/Loss (Raw)": 2.1204910278320312, "Full-pretrain/Step": 2414, "Full-pretrain/Step Time": 17.62589932233095} +{"Full-pretrain/Learning Rate": 4.374435171640144e-05, "Full-pretrain/Loss": 1.9902210235595703, "Full-pretrain/Loss (Raw)": 1.8867554664611816, "Full-pretrain/Step": 2415, "Full-pretrain/Step Time": 17.621259830892086} +{"Full-pretrain/Learning Rate": 4.373873233066676e-05, "Full-pretrain/Loss": 1.9889837503433228, "Full-pretrain/Loss (Raw)": 1.7222567796707153, "Full-pretrain/Step": 2416, "Full-pretrain/Step Time": 17.625037098303437} +{"Full-pretrain/Learning Rate": 4.373311078342589e-05, "Full-pretrain/Loss": 1.9819560050964355, "Full-pretrain/Loss (Raw)": 1.8472957611083984, "Full-pretrain/Step": 2417, "Full-pretrain/Step Time": 17.619947873055935} +{"Full-pretrain/Learning Rate": 4.3727487075327286e-05, "Full-pretrain/Loss": 1.9886574745178223, "Full-pretrain/Loss (Raw)": 2.079613447189331, "Full-pretrain/Step": 2418, "Full-pretrain/Step Time": 17.626278473064303} +{"Full-pretrain/Learning Rate": 4.372186120701962e-05, "Full-pretrain/Loss": 1.996751070022583, "Full-pretrain/Loss (Raw)": 2.312943935394287, "Full-pretrain/Step": 2419, "Full-pretrain/Step Time": 17.61997915431857} +{"Full-pretrain/Learning Rate": 4.371623317915184e-05, "Full-pretrain/Loss": 2.0057456493377686, "Full-pretrain/Loss (Raw)": 2.2086243629455566, "Full-pretrain/Step": 2420, "Full-pretrain/Step Time": 17.629392018541694} +{"Full-pretrain/Learning Rate": 4.371060299237315e-05, "Full-pretrain/Loss": 2.0135316848754883, "Full-pretrain/Loss (Raw)": 2.1548900604248047, "Full-pretrain/Step": 2421, "Full-pretrain/Step Time": 17.62203318439424} +{"Full-pretrain/Learning Rate": 4.370497064733298e-05, "Full-pretrain/Loss": 2.020859479904175, "Full-pretrain/Loss (Raw)": 2.122971534729004, "Full-pretrain/Step": 2422, "Full-pretrain/Step Time": 17.62443894892931} +{"Full-pretrain/Learning Rate": 4.369933614468101e-05, "Full-pretrain/Loss": 2.0216739177703857, "Full-pretrain/Loss (Raw)": 1.890679955482483, "Full-pretrain/Step": 2423, "Full-pretrain/Step Time": 17.618046468123794} +{"Full-pretrain/Learning Rate": 4.369369948506719e-05, "Full-pretrain/Loss": 2.0222973823547363, "Full-pretrain/Loss (Raw)": 1.981258749961853, "Full-pretrain/Step": 2424, "Full-pretrain/Step Time": 17.620739426463842} +{"Full-pretrain/Learning Rate": 4.368806066914171e-05, "Full-pretrain/Loss": 2.0185999870300293, "Full-pretrain/Loss (Raw)": 1.9661551713943481, "Full-pretrain/Step": 2425, "Full-pretrain/Step Time": 17.61717526242137} +{"Full-pretrain/Learning Rate": 4.368241969755499e-05, "Full-pretrain/Loss": 2.0252926349639893, "Full-pretrain/Loss (Raw)": 1.899662733078003, "Full-pretrain/Step": 2426, "Full-pretrain/Step Time": 17.618223883211613} +{"Full-pretrain/Learning Rate": 4.3676776570957726e-05, "Full-pretrain/Loss": 2.038651943206787, "Full-pretrain/Loss (Raw)": 2.0172038078308105, "Full-pretrain/Step": 2427, "Full-pretrain/Step Time": 17.6175399068743} +{"Full-pretrain/Learning Rate": 4.367113129000085e-05, "Full-pretrain/Loss": 2.038301944732666, "Full-pretrain/Loss (Raw)": 2.154411554336548, "Full-pretrain/Step": 2428, "Full-pretrain/Step Time": 17.62337521649897} +{"Full-pretrain/Learning Rate": 4.366548385533554e-05, "Full-pretrain/Loss": 2.036998748779297, "Full-pretrain/Loss (Raw)": 1.9988253116607666, "Full-pretrain/Step": 2429, "Full-pretrain/Step Time": 17.629284279420972} +{"Full-pretrain/Learning Rate": 4.3659834267613234e-05, "Full-pretrain/Loss": 2.0365161895751953, "Full-pretrain/Loss (Raw)": 1.8390439748764038, "Full-pretrain/Step": 2430, "Full-pretrain/Step Time": 17.620362108573318} +{"Full-pretrain/Learning Rate": 4.365418252748559e-05, "Full-pretrain/Loss": 2.0252833366394043, "Full-pretrain/Loss (Raw)": 1.73063063621521, "Full-pretrain/Step": 2431, "Full-pretrain/Step Time": 17.615541441366076} +{"Full-pretrain/Learning Rate": 4.3648528635604556e-05, "Full-pretrain/Loss": 2.0251638889312744, "Full-pretrain/Loss (Raw)": 1.9858808517456055, "Full-pretrain/Step": 2432, "Full-pretrain/Step Time": 17.61153361387551} +{"Full-pretrain/Learning Rate": 4.36428725926223e-05, "Full-pretrain/Loss": 2.0159506797790527, "Full-pretrain/Loss (Raw)": 1.8079354763031006, "Full-pretrain/Step": 2433, "Full-pretrain/Step Time": 17.614868249744177} +{"Full-pretrain/Learning Rate": 4.3637214399191234e-05, "Full-pretrain/Loss": 2.013122081756592, "Full-pretrain/Loss (Raw)": 1.9536136388778687, "Full-pretrain/Step": 2434, "Full-pretrain/Step Time": 17.61033544689417} +{"Full-pretrain/Learning Rate": 4.363155405596404e-05, "Full-pretrain/Loss": 2.0148234367370605, "Full-pretrain/Loss (Raw)": 1.9054886102676392, "Full-pretrain/Step": 2435, "Full-pretrain/Step Time": 17.609081843867898} +{"Full-pretrain/Learning Rate": 4.3625891563593626e-05, "Full-pretrain/Loss": 2.0026063919067383, "Full-pretrain/Loss (Raw)": 1.9728734493255615, "Full-pretrain/Step": 2436, "Full-pretrain/Step Time": 17.612024350091815} +{"Full-pretrain/Learning Rate": 4.3620226922733174e-05, "Full-pretrain/Loss": 1.9933547973632812, "Full-pretrain/Loss (Raw)": 1.7877068519592285, "Full-pretrain/Step": 2437, "Full-pretrain/Step Time": 17.608562346547842} +{"Full-pretrain/Learning Rate": 4.361456013403609e-05, "Full-pretrain/Loss": 1.9986152648925781, "Full-pretrain/Loss (Raw)": 2.278367042541504, "Full-pretrain/Step": 2438, "Full-pretrain/Step Time": 17.606037789955735} +{"Full-pretrain/Learning Rate": 4.360889119815604e-05, "Full-pretrain/Loss": 2.0043540000915527, "Full-pretrain/Loss (Raw)": 2.1973931789398193, "Full-pretrain/Step": 2439, "Full-pretrain/Step Time": 17.60673107020557} +{"Full-pretrain/Learning Rate": 4.360322011574692e-05, "Full-pretrain/Loss": 2.0120952129364014, "Full-pretrain/Loss (Raw)": 2.223748207092285, "Full-pretrain/Step": 2440, "Full-pretrain/Step Time": 17.60682867281139} +{"Full-pretrain/Learning Rate": 4.3597546887462904e-05, "Full-pretrain/Loss": 2.0089902877807617, "Full-pretrain/Loss (Raw)": 1.9565598964691162, "Full-pretrain/Step": 2441, "Full-pretrain/Step Time": 17.607389751821756} +{"Full-pretrain/Learning Rate": 4.3591871513958395e-05, "Full-pretrain/Loss": 2.004138946533203, "Full-pretrain/Loss (Raw)": 1.8844332695007324, "Full-pretrain/Step": 2442, "Full-pretrain/Step Time": 17.604464448988438} +{"Full-pretrain/Learning Rate": 4.3586193995888024e-05, "Full-pretrain/Loss": 2.0090513229370117, "Full-pretrain/Loss (Raw)": 2.0929768085479736, "Full-pretrain/Step": 2443, "Full-pretrain/Step Time": 17.608733467757702} +{"Full-pretrain/Learning Rate": 4.3580514333906716e-05, "Full-pretrain/Loss": 2.0084333419799805, "Full-pretrain/Loss (Raw)": 2.0503487586975098, "Full-pretrain/Step": 2444, "Full-pretrain/Step Time": 17.601545674726367} +{"Full-pretrain/Learning Rate": 4.357483252866961e-05, "Full-pretrain/Loss": 1.9990077018737793, "Full-pretrain/Loss (Raw)": 1.9372007846832275, "Full-pretrain/Step": 2445, "Full-pretrain/Step Time": 17.600718518719077} +{"Full-pretrain/Learning Rate": 4.356914858083211e-05, "Full-pretrain/Loss": 1.9944279193878174, "Full-pretrain/Loss (Raw)": 1.9739421606063843, "Full-pretrain/Step": 2446, "Full-pretrain/Step Time": 17.605578074231744} +{"Full-pretrain/Learning Rate": 4.3563462491049834e-05, "Full-pretrain/Loss": 2.0108275413513184, "Full-pretrain/Loss (Raw)": 2.4115490913391113, "Full-pretrain/Step": 2447, "Full-pretrain/Step Time": 17.602607138454914} +{"Full-pretrain/Learning Rate": 4.3557774259978685e-05, "Full-pretrain/Loss": 2.0228545665740967, "Full-pretrain/Loss (Raw)": 2.1071176528930664, "Full-pretrain/Step": 2448, "Full-pretrain/Step Time": 17.595039946958423} +{"Full-pretrain/Learning Rate": 4.35520838882748e-05, "Full-pretrain/Loss": 2.021214485168457, "Full-pretrain/Loss (Raw)": 1.79481041431427, "Full-pretrain/Step": 2449, "Full-pretrain/Step Time": 17.59277397952974} +{"Full-pretrain/Learning Rate": 4.354639137659455e-05, "Full-pretrain/Loss": 2.0226433277130127, "Full-pretrain/Loss (Raw)": 2.125338554382324, "Full-pretrain/Step": 2450, "Full-pretrain/Step Time": 17.591878773644567} +{"Full-pretrain/Learning Rate": 4.354069672559458e-05, "Full-pretrain/Loss": 2.009913444519043, "Full-pretrain/Loss (Raw)": 1.9055876731872559, "Full-pretrain/Step": 2451, "Full-pretrain/Step Time": 17.588811671361327} +{"Full-pretrain/Learning Rate": 4.353499993593176e-05, "Full-pretrain/Loss": 2.000523328781128, "Full-pretrain/Loss (Raw)": 1.908140778541565, "Full-pretrain/Step": 2452, "Full-pretrain/Step Time": 17.583166997879744} +{"Full-pretrain/Learning Rate": 4.35293010082632e-05, "Full-pretrain/Loss": 1.9926395416259766, "Full-pretrain/Loss (Raw)": 1.9026108980178833, "Full-pretrain/Step": 2453, "Full-pretrain/Step Time": 17.580955946817994} +{"Full-pretrain/Learning Rate": 4.35235999432463e-05, "Full-pretrain/Loss": 1.996335506439209, "Full-pretrain/Loss (Raw)": 2.241239070892334, "Full-pretrain/Step": 2454, "Full-pretrain/Step Time": 17.58903742209077} +{"Full-pretrain/Learning Rate": 4.3517896741538634e-05, "Full-pretrain/Loss": 2.0046184062957764, "Full-pretrain/Loss (Raw)": 2.155731678009033, "Full-pretrain/Step": 2455, "Full-pretrain/Step Time": 17.58504942059517} +{"Full-pretrain/Learning Rate": 4.35121914037981e-05, "Full-pretrain/Loss": 1.9986562728881836, "Full-pretrain/Loss (Raw)": 1.7904762029647827, "Full-pretrain/Step": 2456, "Full-pretrain/Step Time": 17.58584624901414} +{"Full-pretrain/Learning Rate": 4.3506483930682785e-05, "Full-pretrain/Loss": 1.993138313293457, "Full-pretrain/Loss (Raw)": 1.7895779609680176, "Full-pretrain/Step": 2457, "Full-pretrain/Step Time": 17.587332628667355} +{"Full-pretrain/Learning Rate": 4.3500774322851064e-05, "Full-pretrain/Loss": 2.0026192665100098, "Full-pretrain/Loss (Raw)": 2.203052043914795, "Full-pretrain/Step": 2458, "Full-pretrain/Step Time": 17.59089420363307} +{"Full-pretrain/Learning Rate": 4.349506258096152e-05, "Full-pretrain/Loss": 1.9996432065963745, "Full-pretrain/Loss (Raw)": 1.9219696521759033, "Full-pretrain/Step": 2459, "Full-pretrain/Step Time": 17.59326976723969} +{"Full-pretrain/Learning Rate": 4.3489348705673e-05, "Full-pretrain/Loss": 1.9955555200576782, "Full-pretrain/Loss (Raw)": 2.0236096382141113, "Full-pretrain/Step": 2460, "Full-pretrain/Step Time": 17.59183633327484} +{"Full-pretrain/Learning Rate": 4.348363269764462e-05, "Full-pretrain/Loss": 1.9937500953674316, "Full-pretrain/Loss (Raw)": 1.9410500526428223, "Full-pretrain/Step": 2461, "Full-pretrain/Step Time": 17.590051038190722} +{"Full-pretrain/Learning Rate": 4.3477914557535684e-05, "Full-pretrain/Loss": 2.00032114982605, "Full-pretrain/Loss (Raw)": 2.0493199825286865, "Full-pretrain/Step": 2462, "Full-pretrain/Step Time": 17.593605883419514} +{"Full-pretrain/Learning Rate": 4.3472194286005815e-05, "Full-pretrain/Loss": 2.0103838443756104, "Full-pretrain/Loss (Raw)": 2.0526323318481445, "Full-pretrain/Step": 2463, "Full-pretrain/Step Time": 17.592651652172208} +{"Full-pretrain/Learning Rate": 4.346647188371482e-05, "Full-pretrain/Loss": 2.0131523609161377, "Full-pretrain/Loss (Raw)": 2.074474811553955, "Full-pretrain/Step": 2464, "Full-pretrain/Step Time": 17.59137075394392} +{"Full-pretrain/Learning Rate": 4.346074735132278e-05, "Full-pretrain/Loss": 2.0174953937530518, "Full-pretrain/Loss (Raw)": 1.9469108581542969, "Full-pretrain/Step": 2465, "Full-pretrain/Step Time": 17.584171440452337} +{"Full-pretrain/Learning Rate": 4.345502068949002e-05, "Full-pretrain/Loss": 2.0154263973236084, "Full-pretrain/Loss (Raw)": 1.8874040842056274, "Full-pretrain/Step": 2466, "Full-pretrain/Step Time": 17.583990735933185} +{"Full-pretrain/Learning Rate": 4.344929189887712e-05, "Full-pretrain/Loss": 2.0191235542297363, "Full-pretrain/Loss (Raw)": 2.023803472518921, "Full-pretrain/Step": 2467, "Full-pretrain/Step Time": 17.58548668026924} +{"Full-pretrain/Learning Rate": 4.344356098014487e-05, "Full-pretrain/Loss": 2.0067331790924072, "Full-pretrain/Loss (Raw)": 1.5763778686523438, "Full-pretrain/Step": 2468, "Full-pretrain/Step Time": 17.59078347682953} +{"Full-pretrain/Learning Rate": 4.343782793395435e-05, "Full-pretrain/Loss": 2.012827157974243, "Full-pretrain/Loss (Raw)": 1.9827110767364502, "Full-pretrain/Step": 2469, "Full-pretrain/Step Time": 17.584216341376305} +{"Full-pretrain/Learning Rate": 4.3432092760966856e-05, "Full-pretrain/Loss": 2.0067198276519775, "Full-pretrain/Loss (Raw)": 2.082933187484741, "Full-pretrain/Step": 2470, "Full-pretrain/Step Time": 17.58488920889795} +{"Full-pretrain/Learning Rate": 4.342635546184394e-05, "Full-pretrain/Loss": 2.003448486328125, "Full-pretrain/Loss (Raw)": 2.092712163925171, "Full-pretrain/Step": 2471, "Full-pretrain/Step Time": 17.58287137746811} +{"Full-pretrain/Learning Rate": 4.34206160372474e-05, "Full-pretrain/Loss": 1.996019959449768, "Full-pretrain/Loss (Raw)": 1.9860366582870483, "Full-pretrain/Step": 2472, "Full-pretrain/Step Time": 17.58368506655097} +{"Full-pretrain/Learning Rate": 4.341487448783926e-05, "Full-pretrain/Loss": 1.9967904090881348, "Full-pretrain/Loss (Raw)": 1.9812102317810059, "Full-pretrain/Step": 2473, "Full-pretrain/Step Time": 17.575191596522927} +{"Full-pretrain/Learning Rate": 4.340913081428183e-05, "Full-pretrain/Loss": 2.0014238357543945, "Full-pretrain/Loss (Raw)": 2.0327067375183105, "Full-pretrain/Step": 2474, "Full-pretrain/Step Time": 17.581056479364634} +{"Full-pretrain/Learning Rate": 4.340338501723763e-05, "Full-pretrain/Loss": 2.0015759468078613, "Full-pretrain/Loss (Raw)": 2.0978400707244873, "Full-pretrain/Step": 2475, "Full-pretrain/Step Time": 17.57316697575152} +{"Full-pretrain/Learning Rate": 4.339763709736944e-05, "Full-pretrain/Loss": 1.9918360710144043, "Full-pretrain/Loss (Raw)": 1.7386765480041504, "Full-pretrain/Step": 2476, "Full-pretrain/Step Time": 17.57867898605764} +{"Full-pretrain/Learning Rate": 4.3391887055340266e-05, "Full-pretrain/Loss": 2.001100540161133, "Full-pretrain/Loss (Raw)": 2.23366379737854, "Full-pretrain/Step": 2477, "Full-pretrain/Step Time": 17.569046584889293} +{"Full-pretrain/Learning Rate": 4.3386134891813385e-05, "Full-pretrain/Loss": 1.998117208480835, "Full-pretrain/Loss (Raw)": 1.878477931022644, "Full-pretrain/Step": 2478, "Full-pretrain/Step Time": 17.576350005343556} +{"Full-pretrain/Learning Rate": 4.338038060745231e-05, "Full-pretrain/Loss": 1.9852550029754639, "Full-pretrain/Loss (Raw)": 1.999955654144287, "Full-pretrain/Step": 2479, "Full-pretrain/Step Time": 17.579341057687998} +{"Full-pretrain/Learning Rate": 4.3374624202920785e-05, "Full-pretrain/Loss": 1.9853185415267944, "Full-pretrain/Loss (Raw)": 2.109151840209961, "Full-pretrain/Step": 2480, "Full-pretrain/Step Time": 17.577511863783002} +{"Full-pretrain/Learning Rate": 4.336886567888283e-05, "Full-pretrain/Loss": 1.9874227046966553, "Full-pretrain/Loss (Raw)": 1.8621476888656616, "Full-pretrain/Step": 2481, "Full-pretrain/Step Time": 17.57573340460658} +{"Full-pretrain/Learning Rate": 4.336310503600266e-05, "Full-pretrain/Loss": 1.9852356910705566, "Full-pretrain/Loss (Raw)": 2.055351734161377, "Full-pretrain/Step": 2482, "Full-pretrain/Step Time": 17.57475358247757} +{"Full-pretrain/Learning Rate": 4.335734227494478e-05, "Full-pretrain/Loss": 1.9914758205413818, "Full-pretrain/Loss (Raw)": 2.1052722930908203, "Full-pretrain/Step": 2483, "Full-pretrain/Step Time": 17.57262560725212} +{"Full-pretrain/Learning Rate": 4.3351577396373923e-05, "Full-pretrain/Loss": 1.9946949481964111, "Full-pretrain/Loss (Raw)": 2.0111498832702637, "Full-pretrain/Step": 2484, "Full-pretrain/Step Time": 17.57559704221785} +{"Full-pretrain/Learning Rate": 4.334581040095506e-05, "Full-pretrain/Loss": 1.9979277849197388, "Full-pretrain/Loss (Raw)": 2.0060644149780273, "Full-pretrain/Step": 2485, "Full-pretrain/Step Time": 17.57537512294948} +{"Full-pretrain/Learning Rate": 4.3340041289353415e-05, "Full-pretrain/Loss": 2.000875473022461, "Full-pretrain/Loss (Raw)": 2.335564136505127, "Full-pretrain/Step": 2486, "Full-pretrain/Step Time": 17.57238456234336} +{"Full-pretrain/Learning Rate": 4.333427006223445e-05, "Full-pretrain/Loss": 1.9942392110824585, "Full-pretrain/Loss (Raw)": 1.9433735609054565, "Full-pretrain/Step": 2487, "Full-pretrain/Step Time": 17.5694897249341} +{"Full-pretrain/Learning Rate": 4.332849672026388e-05, "Full-pretrain/Loss": 2.001065731048584, "Full-pretrain/Loss (Raw)": 2.0089221000671387, "Full-pretrain/Step": 2488, "Full-pretrain/Step Time": 17.57364590279758} +{"Full-pretrain/Learning Rate": 4.332272126410766e-05, "Full-pretrain/Loss": 2.009000539779663, "Full-pretrain/Loss (Raw)": 2.0434951782226562, "Full-pretrain/Step": 2489, "Full-pretrain/Step Time": 17.566505325958133} +{"Full-pretrain/Learning Rate": 4.331694369443197e-05, "Full-pretrain/Loss": 2.0041160583496094, "Full-pretrain/Loss (Raw)": 2.0467400550842285, "Full-pretrain/Step": 2490, "Full-pretrain/Step Time": 17.56666026636958} +{"Full-pretrain/Learning Rate": 4.3311164011903274e-05, "Full-pretrain/Loss": 2.0059731006622314, "Full-pretrain/Loss (Raw)": 1.981403112411499, "Full-pretrain/Step": 2491, "Full-pretrain/Step Time": 17.57028090581298} +{"Full-pretrain/Learning Rate": 4.330538221718823e-05, "Full-pretrain/Loss": 2.0043532848358154, "Full-pretrain/Loss (Raw)": 1.9717750549316406, "Full-pretrain/Step": 2492, "Full-pretrain/Step Time": 17.57418063469231} +{"Full-pretrain/Learning Rate": 4.3299598310953793e-05, "Full-pretrain/Loss": 2.000391960144043, "Full-pretrain/Loss (Raw)": 1.8142820596694946, "Full-pretrain/Step": 2493, "Full-pretrain/Step Time": 17.577091444283724} +{"Full-pretrain/Learning Rate": 4.329381229386711e-05, "Full-pretrain/Loss": 1.9960980415344238, "Full-pretrain/Loss (Raw)": 1.9119174480438232, "Full-pretrain/Step": 2494, "Full-pretrain/Step Time": 17.570845616981387} +{"Full-pretrain/Learning Rate": 4.3288024166595614e-05, "Full-pretrain/Loss": 1.9976084232330322, "Full-pretrain/Loss (Raw)": 2.100963592529297, "Full-pretrain/Step": 2495, "Full-pretrain/Step Time": 17.575092231854796} +{"Full-pretrain/Learning Rate": 4.328223392980696e-05, "Full-pretrain/Loss": 1.995320200920105, "Full-pretrain/Loss (Raw)": 2.0012521743774414, "Full-pretrain/Step": 2496, "Full-pretrain/Step Time": 17.581426341086626} +{"Full-pretrain/Learning Rate": 4.327644158416905e-05, "Full-pretrain/Loss": 1.9943867921829224, "Full-pretrain/Loss (Raw)": 1.917039155960083, "Full-pretrain/Step": 2497, "Full-pretrain/Step Time": 17.578688263893127} +{"Full-pretrain/Learning Rate": 4.3270647130350016e-05, "Full-pretrain/Loss": 1.9955428838729858, "Full-pretrain/Loss (Raw)": 1.9244037866592407, "Full-pretrain/Step": 2498, "Full-pretrain/Step Time": 17.574570693075657} +{"Full-pretrain/Learning Rate": 4.326485056901826e-05, "Full-pretrain/Loss": 1.9920787811279297, "Full-pretrain/Loss (Raw)": 1.9129489660263062, "Full-pretrain/Step": 2499, "Full-pretrain/Step Time": 17.56997406668961} +{"Full-pretrain/Learning Rate": 4.325905190084241e-05, "Full-pretrain/Loss": 2.001164674758911, "Full-pretrain/Loss (Raw)": 1.8671298027038574, "Full-pretrain/Step": 2500, "Full-pretrain/Step Time": 17.576122330501676} +{"Full-pretrain/Learning Rate": 4.325325112649134e-05, "Full-pretrain/Loss": 2.0027971267700195, "Full-pretrain/Loss (Raw)": 2.0349478721618652, "Full-pretrain/Step": 2501, "Full-pretrain/Step Time": 17.58000890351832} +{"Full-pretrain/Learning Rate": 4.324744824663417e-05, "Full-pretrain/Loss": 2.0048937797546387, "Full-pretrain/Loss (Raw)": 2.1500227451324463, "Full-pretrain/Step": 2502, "Full-pretrain/Step Time": 17.578823758289218} +{"Full-pretrain/Learning Rate": 4.3241643261940243e-05, "Full-pretrain/Loss": 2.0050911903381348, "Full-pretrain/Loss (Raw)": 2.0990328788757324, "Full-pretrain/Step": 2503, "Full-pretrain/Step Time": 17.584690771996975} +{"Full-pretrain/Learning Rate": 4.323583617307919e-05, "Full-pretrain/Loss": 2.007925033569336, "Full-pretrain/Loss (Raw)": 2.0767135620117188, "Full-pretrain/Step": 2504, "Full-pretrain/Step Time": 17.577089726924896} +{"Full-pretrain/Learning Rate": 4.323002698072085e-05, "Full-pretrain/Loss": 2.0111632347106934, "Full-pretrain/Loss (Raw)": 2.0848388671875, "Full-pretrain/Step": 2505, "Full-pretrain/Step Time": 17.584033926948905} +{"Full-pretrain/Learning Rate": 4.3224215685535294e-05, "Full-pretrain/Loss": 2.017345905303955, "Full-pretrain/Loss (Raw)": 2.230543851852417, "Full-pretrain/Step": 2506, "Full-pretrain/Step Time": 17.57297821715474} +{"Full-pretrain/Learning Rate": 4.321840228819286e-05, "Full-pretrain/Loss": 2.017725944519043, "Full-pretrain/Loss (Raw)": 2.110001564025879, "Full-pretrain/Step": 2507, "Full-pretrain/Step Time": 17.572516253218055} +{"Full-pretrain/Learning Rate": 4.321258678936413e-05, "Full-pretrain/Loss": 2.015524387359619, "Full-pretrain/Loss (Raw)": 1.6682353019714355, "Full-pretrain/Step": 2508, "Full-pretrain/Step Time": 17.57683801651001} +{"Full-pretrain/Learning Rate": 4.3206769189719906e-05, "Full-pretrain/Loss": 2.013369083404541, "Full-pretrain/Loss (Raw)": 2.1646888256073, "Full-pretrain/Step": 2509, "Full-pretrain/Step Time": 17.58034148812294} +{"Full-pretrain/Learning Rate": 4.320094948993127e-05, "Full-pretrain/Loss": 2.0158677101135254, "Full-pretrain/Loss (Raw)": 1.9584317207336426, "Full-pretrain/Step": 2510, "Full-pretrain/Step Time": 17.582539094612002} +{"Full-pretrain/Learning Rate": 4.319512769066949e-05, "Full-pretrain/Loss": 2.008317708969116, "Full-pretrain/Loss (Raw)": 1.7583601474761963, "Full-pretrain/Step": 2511, "Full-pretrain/Step Time": 17.58146489970386} +{"Full-pretrain/Learning Rate": 4.318930379260614e-05, "Full-pretrain/Loss": 2.0088400840759277, "Full-pretrain/Loss (Raw)": 2.1258721351623535, "Full-pretrain/Step": 2512, "Full-pretrain/Step Time": 17.580433178693056} +{"Full-pretrain/Learning Rate": 4.318347779641298e-05, "Full-pretrain/Loss": 2.017677068710327, "Full-pretrain/Loss (Raw)": 2.1449294090270996, "Full-pretrain/Step": 2513, "Full-pretrain/Step Time": 17.582332778722048} +{"Full-pretrain/Learning Rate": 4.3177649702762046e-05, "Full-pretrain/Loss": 2.0126819610595703, "Full-pretrain/Loss (Raw)": 1.8955031633377075, "Full-pretrain/Step": 2514, "Full-pretrain/Step Time": 17.576791113242507} +{"Full-pretrain/Learning Rate": 4.317181951232562e-05, "Full-pretrain/Loss": 2.0084612369537354, "Full-pretrain/Loss (Raw)": 1.9702131748199463, "Full-pretrain/Step": 2515, "Full-pretrain/Step Time": 17.579628106206656} +{"Full-pretrain/Learning Rate": 4.316598722577618e-05, "Full-pretrain/Loss": 2.0099918842315674, "Full-pretrain/Loss (Raw)": 2.0601296424865723, "Full-pretrain/Step": 2516, "Full-pretrain/Step Time": 17.57769086956978} +{"Full-pretrain/Learning Rate": 4.31601528437865e-05, "Full-pretrain/Loss": 2.007476806640625, "Full-pretrain/Loss (Raw)": 1.9255822896957397, "Full-pretrain/Step": 2517, "Full-pretrain/Step Time": 17.58015946112573} +{"Full-pretrain/Learning Rate": 4.315431636702959e-05, "Full-pretrain/Loss": 1.9937334060668945, "Full-pretrain/Loss (Raw)": 1.8957719802856445, "Full-pretrain/Step": 2518, "Full-pretrain/Step Time": 17.579848803579807} +{"Full-pretrain/Learning Rate": 4.3148477796178653e-05, "Full-pretrain/Loss": 1.9950648546218872, "Full-pretrain/Loss (Raw)": 1.9859815835952759, "Full-pretrain/Step": 2519, "Full-pretrain/Step Time": 17.57950229756534} +{"Full-pretrain/Learning Rate": 4.3142637131907184e-05, "Full-pretrain/Loss": 1.990798830986023, "Full-pretrain/Loss (Raw)": 1.872412085533142, "Full-pretrain/Step": 2520, "Full-pretrain/Step Time": 17.58033650368452} +{"Full-pretrain/Learning Rate": 4.313679437488889e-05, "Full-pretrain/Loss": 1.9907748699188232, "Full-pretrain/Loss (Raw)": 2.042726993560791, "Full-pretrain/Step": 2521, "Full-pretrain/Step Time": 17.581215426325798} +{"Full-pretrain/Learning Rate": 4.3130949525797746e-05, "Full-pretrain/Loss": 1.9867022037506104, "Full-pretrain/Loss (Raw)": 1.9164156913757324, "Full-pretrain/Step": 2522, "Full-pretrain/Step Time": 17.57628800906241} +{"Full-pretrain/Learning Rate": 4.312510258530794e-05, "Full-pretrain/Loss": 1.9873948097229004, "Full-pretrain/Loss (Raw)": 2.0035645961761475, "Full-pretrain/Step": 2523, "Full-pretrain/Step Time": 17.57535343617201} +{"Full-pretrain/Learning Rate": 4.311925355409393e-05, "Full-pretrain/Loss": 1.989740014076233, "Full-pretrain/Loss (Raw)": 2.0468225479125977, "Full-pretrain/Step": 2524, "Full-pretrain/Step Time": 17.57976058498025} +{"Full-pretrain/Learning Rate": 4.311340243283038e-05, "Full-pretrain/Loss": 1.991729974746704, "Full-pretrain/Loss (Raw)": 1.8779618740081787, "Full-pretrain/Step": 2525, "Full-pretrain/Step Time": 17.580306442454457} +{"Full-pretrain/Learning Rate": 4.3107549222192234e-05, "Full-pretrain/Loss": 2.002244234085083, "Full-pretrain/Loss (Raw)": 2.2483694553375244, "Full-pretrain/Step": 2526, "Full-pretrain/Step Time": 17.580215943977237} +{"Full-pretrain/Learning Rate": 4.310169392285464e-05, "Full-pretrain/Loss": 2.0029306411743164, "Full-pretrain/Loss (Raw)": 2.1229279041290283, "Full-pretrain/Step": 2527, "Full-pretrain/Step Time": 17.58491188287735} +{"Full-pretrain/Learning Rate": 4.3095836535493016e-05, "Full-pretrain/Loss": 2.0067732334136963, "Full-pretrain/Loss (Raw)": 2.1242170333862305, "Full-pretrain/Step": 2528, "Full-pretrain/Step Time": 17.587619476020336} +{"Full-pretrain/Learning Rate": 4.308997706078301e-05, "Full-pretrain/Loss": 2.0069055557250977, "Full-pretrain/Loss (Raw)": 1.9212716817855835, "Full-pretrain/Step": 2529, "Full-pretrain/Step Time": 17.582170352339745} +{"Full-pretrain/Learning Rate": 4.3084115499400506e-05, "Full-pretrain/Loss": 2.008422374725342, "Full-pretrain/Loss (Raw)": 1.9729421138763428, "Full-pretrain/Step": 2530, "Full-pretrain/Step Time": 17.582864858210087} +{"Full-pretrain/Learning Rate": 4.3078251852021636e-05, "Full-pretrain/Loss": 2.0115528106689453, "Full-pretrain/Loss (Raw)": 2.0131242275238037, "Full-pretrain/Step": 2531, "Full-pretrain/Step Time": 17.583270024508238} +{"Full-pretrain/Learning Rate": 4.3072386119322764e-05, "Full-pretrain/Loss": 2.016035556793213, "Full-pretrain/Loss (Raw)": 2.01058292388916, "Full-pretrain/Step": 2532, "Full-pretrain/Step Time": 17.585872288793325} +{"Full-pretrain/Learning Rate": 4.306651830198051e-05, "Full-pretrain/Loss": 2.012270450592041, "Full-pretrain/Loss (Raw)": 1.914466142654419, "Full-pretrain/Step": 2533, "Full-pretrain/Step Time": 17.586290139704943} +{"Full-pretrain/Learning Rate": 4.306064840067171e-05, "Full-pretrain/Loss": 2.010178327560425, "Full-pretrain/Loss (Raw)": 2.083070755004883, "Full-pretrain/Step": 2534, "Full-pretrain/Step Time": 17.583887988701463} +{"Full-pretrain/Learning Rate": 4.3054776416073474e-05, "Full-pretrain/Loss": 2.0100550651550293, "Full-pretrain/Loss (Raw)": 2.095088005065918, "Full-pretrain/Step": 2535, "Full-pretrain/Step Time": 17.58970676548779} +{"Full-pretrain/Learning Rate": 4.3048902348863116e-05, "Full-pretrain/Loss": 2.017815589904785, "Full-pretrain/Loss (Raw)": 2.3250484466552734, "Full-pretrain/Step": 2536, "Full-pretrain/Step Time": 17.585390634834766} +{"Full-pretrain/Learning Rate": 4.304302619971822e-05, "Full-pretrain/Loss": 2.019035577774048, "Full-pretrain/Loss (Raw)": 2.123879909515381, "Full-pretrain/Step": 2537, "Full-pretrain/Step Time": 17.584289578720927} +{"Full-pretrain/Learning Rate": 4.3037147969316583e-05, "Full-pretrain/Loss": 2.008206844329834, "Full-pretrain/Loss (Raw)": 1.8840211629867554, "Full-pretrain/Step": 2538, "Full-pretrain/Step Time": 17.58546116016805} +{"Full-pretrain/Learning Rate": 4.303126765833628e-05, "Full-pretrain/Loss": 2.0070807933807373, "Full-pretrain/Loss (Raw)": 2.073972463607788, "Full-pretrain/Step": 2539, "Full-pretrain/Step Time": 17.57878801226616} +{"Full-pretrain/Learning Rate": 4.3025385267455575e-05, "Full-pretrain/Loss": 2.0218544006347656, "Full-pretrain/Loss (Raw)": 2.140993118286133, "Full-pretrain/Step": 2540, "Full-pretrain/Step Time": 17.578389333561063} +{"Full-pretrain/Learning Rate": 4.3019500797353025e-05, "Full-pretrain/Loss": 2.0179080963134766, "Full-pretrain/Loss (Raw)": 2.038398265838623, "Full-pretrain/Step": 2541, "Full-pretrain/Step Time": 17.57755828462541} +{"Full-pretrain/Learning Rate": 4.301361424870739e-05, "Full-pretrain/Loss": 2.021714448928833, "Full-pretrain/Loss (Raw)": 2.080239772796631, "Full-pretrain/Step": 2542, "Full-pretrain/Step Time": 17.58108041062951} +{"Full-pretrain/Learning Rate": 4.3007725622197674e-05, "Full-pretrain/Loss": 2.0349740982055664, "Full-pretrain/Loss (Raw)": 2.182666301727295, "Full-pretrain/Step": 2543, "Full-pretrain/Step Time": 17.577997732907534} +{"Full-pretrain/Learning Rate": 4.300183491850314e-05, "Full-pretrain/Loss": 2.026322364807129, "Full-pretrain/Loss (Raw)": 1.8490188121795654, "Full-pretrain/Step": 2544, "Full-pretrain/Step Time": 17.576129380613565} +{"Full-pretrain/Learning Rate": 4.2995942138303276e-05, "Full-pretrain/Loss": 2.023085117340088, "Full-pretrain/Loss (Raw)": 2.04133677482605, "Full-pretrain/Step": 2545, "Full-pretrain/Step Time": 17.581347100436687} +{"Full-pretrain/Learning Rate": 4.299004728227781e-05, "Full-pretrain/Loss": 2.0294549465179443, "Full-pretrain/Loss (Raw)": 2.0993378162384033, "Full-pretrain/Step": 2546, "Full-pretrain/Step Time": 17.5736085139215} +{"Full-pretrain/Learning Rate": 4.2984150351106714e-05, "Full-pretrain/Loss": 2.0264551639556885, "Full-pretrain/Loss (Raw)": 1.8742212057113647, "Full-pretrain/Step": 2547, "Full-pretrain/Step Time": 17.574778005480766} +{"Full-pretrain/Learning Rate": 4.297825134547019e-05, "Full-pretrain/Loss": 2.026092052459717, "Full-pretrain/Loss (Raw)": 2.048508882522583, "Full-pretrain/Step": 2548, "Full-pretrain/Step Time": 17.562621481716633} +{"Full-pretrain/Learning Rate": 4.29723502660487e-05, "Full-pretrain/Loss": 2.03145694732666, "Full-pretrain/Loss (Raw)": 2.0972630977630615, "Full-pretrain/Step": 2549, "Full-pretrain/Step Time": 17.573024448007345} +{"Full-pretrain/Learning Rate": 4.296644711352291e-05, "Full-pretrain/Loss": 2.025331497192383, "Full-pretrain/Loss (Raw)": 1.6997464895248413, "Full-pretrain/Step": 2550, "Full-pretrain/Step Time": 17.577883334830403} +{"Full-pretrain/Learning Rate": 4.296054188857377e-05, "Full-pretrain/Loss": 2.025125026702881, "Full-pretrain/Loss (Raw)": 1.979380488395691, "Full-pretrain/Step": 2551, "Full-pretrain/Step Time": 17.573522737249732} +{"Full-pretrain/Learning Rate": 4.295463459188243e-05, "Full-pretrain/Loss": 2.018120288848877, "Full-pretrain/Loss (Raw)": 1.6482632160186768, "Full-pretrain/Step": 2552, "Full-pretrain/Step Time": 17.579752065241337} +{"Full-pretrain/Learning Rate": 4.29487252241303e-05, "Full-pretrain/Loss": 2.0171432495117188, "Full-pretrain/Loss (Raw)": 2.011462688446045, "Full-pretrain/Step": 2553, "Full-pretrain/Step Time": 17.582097874954343} +{"Full-pretrain/Learning Rate": 4.2942813785999026e-05, "Full-pretrain/Loss": 2.0303797721862793, "Full-pretrain/Loss (Raw)": 2.339977741241455, "Full-pretrain/Step": 2554, "Full-pretrain/Step Time": 17.58778800815344} +{"Full-pretrain/Learning Rate": 4.2936900278170484e-05, "Full-pretrain/Loss": 2.0300183296203613, "Full-pretrain/Loss (Raw)": 1.9919991493225098, "Full-pretrain/Step": 2555, "Full-pretrain/Step Time": 17.584846226498485} +{"Full-pretrain/Learning Rate": 4.2930984701326796e-05, "Full-pretrain/Loss": 2.029231071472168, "Full-pretrain/Loss (Raw)": 2.0216331481933594, "Full-pretrain/Step": 2556, "Full-pretrain/Step Time": 17.586479043588042} +{"Full-pretrain/Learning Rate": 4.2925067056150325e-05, "Full-pretrain/Loss": 2.0393171310424805, "Full-pretrain/Loss (Raw)": 2.2007179260253906, "Full-pretrain/Step": 2557, "Full-pretrain/Step Time": 17.584993183612823} +{"Full-pretrain/Learning Rate": 4.291914734332367e-05, "Full-pretrain/Loss": 2.0303244590759277, "Full-pretrain/Loss (Raw)": 1.9606008529663086, "Full-pretrain/Step": 2558, "Full-pretrain/Step Time": 17.585843162611127} +{"Full-pretrain/Learning Rate": 4.2913225563529674e-05, "Full-pretrain/Loss": 2.027009963989258, "Full-pretrain/Loss (Raw)": 2.0168633460998535, "Full-pretrain/Step": 2559, "Full-pretrain/Step Time": 17.585440123453736} +{"Full-pretrain/Learning Rate": 4.29073017174514e-05, "Full-pretrain/Loss": 2.020270586013794, "Full-pretrain/Loss (Raw)": 1.9085594415664673, "Full-pretrain/Step": 2560, "Full-pretrain/Step Time": 17.589130936190486} +{"Full-pretrain/Learning Rate": 4.290137580577216e-05, "Full-pretrain/Loss": 2.016842842102051, "Full-pretrain/Loss (Raw)": 1.8115893602371216, "Full-pretrain/Step": 2561, "Full-pretrain/Step Time": 17.586944695562124} +{"Full-pretrain/Learning Rate": 4.289544782917552e-05, "Full-pretrain/Loss": 2.017594337463379, "Full-pretrain/Loss (Raw)": 1.9969842433929443, "Full-pretrain/Step": 2562, "Full-pretrain/Step Time": 17.588228350505233} +{"Full-pretrain/Learning Rate": 4.288951778834525e-05, "Full-pretrain/Loss": 2.018649101257324, "Full-pretrain/Loss (Raw)": 2.0468783378601074, "Full-pretrain/Step": 2563, "Full-pretrain/Step Time": 17.593472396954894} +{"Full-pretrain/Learning Rate": 4.28835856839654e-05, "Full-pretrain/Loss": 2.0147509574890137, "Full-pretrain/Loss (Raw)": 1.8858466148376465, "Full-pretrain/Step": 2564, "Full-pretrain/Step Time": 17.59166368842125} +{"Full-pretrain/Learning Rate": 4.2877651516720215e-05, "Full-pretrain/Loss": 2.0318338871002197, "Full-pretrain/Loss (Raw)": 2.4611144065856934, "Full-pretrain/Step": 2565, "Full-pretrain/Step Time": 17.585204850882292} +{"Full-pretrain/Learning Rate": 4.287171528729422e-05, "Full-pretrain/Loss": 2.026350498199463, "Full-pretrain/Loss (Raw)": 1.9076011180877686, "Full-pretrain/Step": 2566, "Full-pretrain/Step Time": 17.59233582019806} +{"Full-pretrain/Learning Rate": 4.286577699637215e-05, "Full-pretrain/Loss": 2.0215353965759277, "Full-pretrain/Loss (Raw)": 1.9410115480422974, "Full-pretrain/Step": 2567, "Full-pretrain/Step Time": 17.592361446470022} +{"Full-pretrain/Learning Rate": 4.2859836644638976e-05, "Full-pretrain/Loss": 2.0138978958129883, "Full-pretrain/Loss (Raw)": 2.0806446075439453, "Full-pretrain/Step": 2568, "Full-pretrain/Step Time": 17.597285022959113} +{"Full-pretrain/Learning Rate": 4.2853894232779924e-05, "Full-pretrain/Loss": 2.0116217136383057, "Full-pretrain/Loss (Raw)": 2.0510385036468506, "Full-pretrain/Step": 2569, "Full-pretrain/Step Time": 17.588756300508976} +{"Full-pretrain/Learning Rate": 4.2847949761480445e-05, "Full-pretrain/Loss": 2.009840250015259, "Full-pretrain/Loss (Raw)": 1.8270167112350464, "Full-pretrain/Step": 2570, "Full-pretrain/Step Time": 17.58739043585956} +{"Full-pretrain/Learning Rate": 4.284200323142623e-05, "Full-pretrain/Loss": 2.0153775215148926, "Full-pretrain/Loss (Raw)": 2.2511630058288574, "Full-pretrain/Step": 2571, "Full-pretrain/Step Time": 17.59085115790367} +{"Full-pretrain/Learning Rate": 4.283605464330322e-05, "Full-pretrain/Loss": 2.0091230869293213, "Full-pretrain/Loss (Raw)": 1.9408526420593262, "Full-pretrain/Step": 2572, "Full-pretrain/Step Time": 17.601793253794312} +{"Full-pretrain/Learning Rate": 4.283010399779757e-05, "Full-pretrain/Loss": 2.0051844120025635, "Full-pretrain/Loss (Raw)": 1.9123600721359253, "Full-pretrain/Step": 2573, "Full-pretrain/Step Time": 17.593790039420128} +{"Full-pretrain/Learning Rate": 4.2824151295595696e-05, "Full-pretrain/Loss": 1.9980249404907227, "Full-pretrain/Loss (Raw)": 1.8511358499526978, "Full-pretrain/Step": 2574, "Full-pretrain/Step Time": 17.590793576091528} +{"Full-pretrain/Learning Rate": 4.281819653738422e-05, "Full-pretrain/Loss": 1.9980274438858032, "Full-pretrain/Loss (Raw)": 2.182748556137085, "Full-pretrain/Step": 2575, "Full-pretrain/Step Time": 17.595864046365023} +{"Full-pretrain/Learning Rate": 4.281223972385005e-05, "Full-pretrain/Loss": 2.00175142288208, "Full-pretrain/Loss (Raw)": 1.9681808948516846, "Full-pretrain/Step": 2576, "Full-pretrain/Step Time": 17.602006630972028} +{"Full-pretrain/Learning Rate": 4.280628085568028e-05, "Full-pretrain/Loss": 1.987647533416748, "Full-pretrain/Loss (Raw)": 1.5900156497955322, "Full-pretrain/Step": 2577, "Full-pretrain/Step Time": 17.603242138400674} +{"Full-pretrain/Learning Rate": 4.280031993356227e-05, "Full-pretrain/Loss": 1.9844744205474854, "Full-pretrain/Loss (Raw)": 1.9977991580963135, "Full-pretrain/Step": 2578, "Full-pretrain/Step Time": 17.605637557804585} +{"Full-pretrain/Learning Rate": 4.279435695818361e-05, "Full-pretrain/Loss": 1.9817662239074707, "Full-pretrain/Loss (Raw)": 1.7875566482543945, "Full-pretrain/Step": 2579, "Full-pretrain/Step Time": 17.609386704862118} +{"Full-pretrain/Learning Rate": 4.278839193023214e-05, "Full-pretrain/Loss": 1.982975959777832, "Full-pretrain/Loss (Raw)": 2.0872206687927246, "Full-pretrain/Step": 2580, "Full-pretrain/Step Time": 17.606997963041067} +{"Full-pretrain/Learning Rate": 4.2782424850395896e-05, "Full-pretrain/Loss": 1.986458420753479, "Full-pretrain/Loss (Raw)": 2.2087042331695557, "Full-pretrain/Step": 2581, "Full-pretrain/Step Time": 17.61037520878017} +{"Full-pretrain/Learning Rate": 4.2776455719363205e-05, "Full-pretrain/Loss": 1.9926847219467163, "Full-pretrain/Loss (Raw)": 1.8989894390106201, "Full-pretrain/Step": 2582, "Full-pretrain/Step Time": 17.60344995930791} +{"Full-pretrain/Learning Rate": 4.277048453782259e-05, "Full-pretrain/Loss": 1.9874780178070068, "Full-pretrain/Loss (Raw)": 1.8127645254135132, "Full-pretrain/Step": 2583, "Full-pretrain/Step Time": 17.60474607720971} +{"Full-pretrain/Learning Rate": 4.2764511306462826e-05, "Full-pretrain/Loss": 1.9929252862930298, "Full-pretrain/Loss (Raw)": 1.8225754499435425, "Full-pretrain/Step": 2584, "Full-pretrain/Step Time": 17.609813628718257} +{"Full-pretrain/Learning Rate": 4.2758536025972936e-05, "Full-pretrain/Loss": 1.988143801689148, "Full-pretrain/Loss (Raw)": 1.8584561347961426, "Full-pretrain/Step": 2585, "Full-pretrain/Step Time": 17.60743192024529} +{"Full-pretrain/Learning Rate": 4.275255869704214e-05, "Full-pretrain/Loss": 1.9759509563446045, "Full-pretrain/Loss (Raw)": 1.9498047828674316, "Full-pretrain/Step": 2586, "Full-pretrain/Step Time": 17.603580933064222} +{"Full-pretrain/Learning Rate": 4.274657932035996e-05, "Full-pretrain/Loss": 1.9772510528564453, "Full-pretrain/Loss (Raw)": 2.033604621887207, "Full-pretrain/Step": 2587, "Full-pretrain/Step Time": 17.603249989449978} +{"Full-pretrain/Learning Rate": 4.2740597896616075e-05, "Full-pretrain/Loss": 1.980363130569458, "Full-pretrain/Loss (Raw)": 2.1212151050567627, "Full-pretrain/Step": 2588, "Full-pretrain/Step Time": 17.6117174718529} +{"Full-pretrain/Learning Rate": 4.273461442650046e-05, "Full-pretrain/Loss": 1.9755076169967651, "Full-pretrain/Loss (Raw)": 2.0453438758850098, "Full-pretrain/Step": 2589, "Full-pretrain/Step Time": 17.612269282341003} +{"Full-pretrain/Learning Rate": 4.272862891070331e-05, "Full-pretrain/Loss": 1.9767651557922363, "Full-pretrain/Loss (Raw)": 2.0008456707000732, "Full-pretrain/Step": 2590, "Full-pretrain/Step Time": 17.609531331807375} +{"Full-pretrain/Learning Rate": 4.272264134991503e-05, "Full-pretrain/Loss": 1.9782016277313232, "Full-pretrain/Loss (Raw)": 2.0628275871276855, "Full-pretrain/Step": 2591, "Full-pretrain/Step Time": 17.60911968536675} +{"Full-pretrain/Learning Rate": 4.271665174482631e-05, "Full-pretrain/Loss": 1.9731545448303223, "Full-pretrain/Loss (Raw)": 1.7470526695251465, "Full-pretrain/Step": 2592, "Full-pretrain/Step Time": 17.61134879477322} +{"Full-pretrain/Learning Rate": 4.271066009612804e-05, "Full-pretrain/Loss": 1.9834538698196411, "Full-pretrain/Loss (Raw)": 2.1411690711975098, "Full-pretrain/Step": 2593, "Full-pretrain/Step Time": 17.611937137320638} +{"Full-pretrain/Learning Rate": 4.270466640451134e-05, "Full-pretrain/Loss": 1.9785913228988647, "Full-pretrain/Loss (Raw)": 1.8413822650909424, "Full-pretrain/Step": 2594, "Full-pretrain/Step Time": 17.610466120764613} +{"Full-pretrain/Learning Rate": 4.26986706706676e-05, "Full-pretrain/Loss": 1.9698834419250488, "Full-pretrain/Loss (Raw)": 1.7682260274887085, "Full-pretrain/Step": 2595, "Full-pretrain/Step Time": 17.616126799955964} +{"Full-pretrain/Learning Rate": 4.269267289528842e-05, "Full-pretrain/Loss": 1.9765620231628418, "Full-pretrain/Loss (Raw)": 2.099565029144287, "Full-pretrain/Step": 2596, "Full-pretrain/Step Time": 17.614771815016866} +{"Full-pretrain/Learning Rate": 4.268667307906564e-05, "Full-pretrain/Loss": 1.9632387161254883, "Full-pretrain/Loss (Raw)": 2.0347702503204346, "Full-pretrain/Step": 2597, "Full-pretrain/Step Time": 17.617867443710566} +{"Full-pretrain/Learning Rate": 4.2680671222691325e-05, "Full-pretrain/Loss": 1.9684923887252808, "Full-pretrain/Loss (Raw)": 2.0757148265838623, "Full-pretrain/Step": 2598, "Full-pretrain/Step Time": 17.61186001636088} +{"Full-pretrain/Learning Rate": 4.2674667326857807e-05, "Full-pretrain/Loss": 1.9709073305130005, "Full-pretrain/Loss (Raw)": 2.01829195022583, "Full-pretrain/Step": 2599, "Full-pretrain/Step Time": 17.61503241956234} +{"Full-pretrain/Learning Rate": 4.2668661392257624e-05, "Full-pretrain/Loss": 1.967877745628357, "Full-pretrain/Loss (Raw)": 1.9836976528167725, "Full-pretrain/Step": 2600, "Full-pretrain/Step Time": 17.617648985236883} +{"Full-pretrain/Learning Rate": 4.2662653419583556e-05, "Full-pretrain/Loss": 1.9646921157836914, "Full-pretrain/Loss (Raw)": 1.9490966796875, "Full-pretrain/Step": 2601, "Full-pretrain/Step Time": 17.621465515345335} +{"Full-pretrain/Learning Rate": 4.2656643409528624e-05, "Full-pretrain/Loss": 1.9790003299713135, "Full-pretrain/Loss (Raw)": 2.2848827838897705, "Full-pretrain/Step": 2602, "Full-pretrain/Step Time": 17.613272549584508} +{"Full-pretrain/Learning Rate": 4.265063136278608e-05, "Full-pretrain/Loss": 1.973710060119629, "Full-pretrain/Loss (Raw)": 2.0818722248077393, "Full-pretrain/Step": 2603, "Full-pretrain/Step Time": 17.619002610445023} +{"Full-pretrain/Learning Rate": 4.264461728004941e-05, "Full-pretrain/Loss": 1.9741076231002808, "Full-pretrain/Loss (Raw)": 1.9535741806030273, "Full-pretrain/Step": 2604, "Full-pretrain/Step Time": 17.618819650262594} +{"Full-pretrain/Learning Rate": 4.2638601162012335e-05, "Full-pretrain/Loss": 1.9789202213287354, "Full-pretrain/Loss (Raw)": 2.0663628578186035, "Full-pretrain/Step": 2605, "Full-pretrain/Step Time": 17.621642546728253} +{"Full-pretrain/Learning Rate": 4.263258300936882e-05, "Full-pretrain/Loss": 1.9945576190948486, "Full-pretrain/Loss (Raw)": 2.3515326976776123, "Full-pretrain/Step": 2606, "Full-pretrain/Step Time": 17.615528225898743} +{"Full-pretrain/Learning Rate": 4.262656282281305e-05, "Full-pretrain/Loss": 1.988034725189209, "Full-pretrain/Loss (Raw)": 1.97401762008667, "Full-pretrain/Step": 2607, "Full-pretrain/Step Time": 17.610894517973065} +{"Full-pretrain/Learning Rate": 4.262054060303945e-05, "Full-pretrain/Loss": 1.9930020570755005, "Full-pretrain/Loss (Raw)": 2.127136468887329, "Full-pretrain/Step": 2608, "Full-pretrain/Step Time": 17.615170147269964} +{"Full-pretrain/Learning Rate": 4.261451635074269e-05, "Full-pretrain/Loss": 2.0156335830688477, "Full-pretrain/Loss (Raw)": 2.3142170906066895, "Full-pretrain/Step": 2609, "Full-pretrain/Step Time": 17.619864897802472} +{"Full-pretrain/Learning Rate": 4.2608490066617654e-05, "Full-pretrain/Loss": 2.015928268432617, "Full-pretrain/Loss (Raw)": 2.0072364807128906, "Full-pretrain/Step": 2610, "Full-pretrain/Step Time": 17.62021985836327} +{"Full-pretrain/Learning Rate": 4.260246175135948e-05, "Full-pretrain/Loss": 2.0310158729553223, "Full-pretrain/Loss (Raw)": 2.270355701446533, "Full-pretrain/Step": 2611, "Full-pretrain/Step Time": 17.626090059056878} +{"Full-pretrain/Learning Rate": 4.259643140566352e-05, "Full-pretrain/Loss": 2.039085865020752, "Full-pretrain/Loss (Raw)": 2.3454644680023193, "Full-pretrain/Step": 2612, "Full-pretrain/Step Time": 17.61930751055479} +{"Full-pretrain/Learning Rate": 4.259039903022539e-05, "Full-pretrain/Loss": 2.0330991744995117, "Full-pretrain/Loss (Raw)": 2.017129421234131, "Full-pretrain/Step": 2613, "Full-pretrain/Step Time": 17.62711543403566} +{"Full-pretrain/Learning Rate": 4.2584364625740914e-05, "Full-pretrain/Loss": 2.0344719886779785, "Full-pretrain/Loss (Raw)": 1.9429203271865845, "Full-pretrain/Step": 2614, "Full-pretrain/Step Time": 17.62724810652435} +{"Full-pretrain/Learning Rate": 4.257832819290615e-05, "Full-pretrain/Loss": 2.0360617637634277, "Full-pretrain/Loss (Raw)": 1.86363685131073, "Full-pretrain/Step": 2615, "Full-pretrain/Step Time": 17.624147411435843} +{"Full-pretrain/Learning Rate": 4.257228973241741e-05, "Full-pretrain/Loss": 2.0348410606384277, "Full-pretrain/Loss (Raw)": 1.783515453338623, "Full-pretrain/Step": 2616, "Full-pretrain/Step Time": 17.621855782344937} +{"Full-pretrain/Learning Rate": 4.256624924497123e-05, "Full-pretrain/Loss": 2.044989585876465, "Full-pretrain/Loss (Raw)": 2.183198928833008, "Full-pretrain/Step": 2617, "Full-pretrain/Step Time": 17.62358570098877} +{"Full-pretrain/Learning Rate": 4.2560206731264376e-05, "Full-pretrain/Loss": 2.049865484237671, "Full-pretrain/Loss (Raw)": 2.105839252471924, "Full-pretrain/Step": 2618, "Full-pretrain/Step Time": 17.624601002782583} +{"Full-pretrain/Learning Rate": 4.2554162191993844e-05, "Full-pretrain/Loss": 2.0507919788360596, "Full-pretrain/Loss (Raw)": 2.0632500648498535, "Full-pretrain/Step": 2619, "Full-pretrain/Step Time": 17.622138310223818} +{"Full-pretrain/Learning Rate": 4.254811562785686e-05, "Full-pretrain/Loss": 2.0465080738067627, "Full-pretrain/Loss (Raw)": 1.9841339588165283, "Full-pretrain/Step": 2620, "Full-pretrain/Step Time": 17.620214706286788} +{"Full-pretrain/Learning Rate": 4.254206703955091e-05, "Full-pretrain/Loss": 2.0435357093811035, "Full-pretrain/Loss (Raw)": 1.9502289295196533, "Full-pretrain/Step": 2621, "Full-pretrain/Step Time": 17.619414599612355} +{"Full-pretrain/Learning Rate": 4.25360164277737e-05, "Full-pretrain/Loss": 2.040794610977173, "Full-pretrain/Loss (Raw)": 1.913126826286316, "Full-pretrain/Step": 2622, "Full-pretrain/Step Time": 17.620103841647506} +{"Full-pretrain/Learning Rate": 4.2529963793223146e-05, "Full-pretrain/Loss": 2.0351743698120117, "Full-pretrain/Loss (Raw)": 1.882982611656189, "Full-pretrain/Step": 2623, "Full-pretrain/Step Time": 17.617455443367362} +{"Full-pretrain/Learning Rate": 4.252390913659744e-05, "Full-pretrain/Loss": 2.046279191970825, "Full-pretrain/Loss (Raw)": 2.1024069786071777, "Full-pretrain/Step": 2624, "Full-pretrain/Step Time": 17.618323450908065} +{"Full-pretrain/Learning Rate": 4.251785245859497e-05, "Full-pretrain/Loss": 2.031353712081909, "Full-pretrain/Loss (Raw)": 1.6635491847991943, "Full-pretrain/Step": 2625, "Full-pretrain/Step Time": 17.61985102854669} +{"Full-pretrain/Learning Rate": 4.251179375991438e-05, "Full-pretrain/Loss": 2.039172649383545, "Full-pretrain/Loss (Raw)": 2.091588258743286, "Full-pretrain/Step": 2626, "Full-pretrain/Step Time": 17.61799664236605} +{"Full-pretrain/Learning Rate": 4.250573304125453e-05, "Full-pretrain/Loss": 2.0489397048950195, "Full-pretrain/Loss (Raw)": 2.080770492553711, "Full-pretrain/Step": 2627, "Full-pretrain/Step Time": 17.625452673062682} +{"Full-pretrain/Learning Rate": 4.2499670303314516e-05, "Full-pretrain/Loss": 2.050752639770508, "Full-pretrain/Loss (Raw)": 2.1575827598571777, "Full-pretrain/Step": 2628, "Full-pretrain/Step Time": 17.62451737932861} +{"Full-pretrain/Learning Rate": 4.249360554679369e-05, "Full-pretrain/Loss": 2.053975820541382, "Full-pretrain/Loss (Raw)": 2.137908935546875, "Full-pretrain/Step": 2629, "Full-pretrain/Step Time": 17.61895356886089} +{"Full-pretrain/Learning Rate": 4.248753877239161e-05, "Full-pretrain/Loss": 2.0554676055908203, "Full-pretrain/Loss (Raw)": 2.1234564781188965, "Full-pretrain/Step": 2630, "Full-pretrain/Step Time": 17.61893029138446} +{"Full-pretrain/Learning Rate": 4.248146998080808e-05, "Full-pretrain/Loss": 2.054358959197998, "Full-pretrain/Loss (Raw)": 1.9828163385391235, "Full-pretrain/Step": 2631, "Full-pretrain/Step Time": 17.617716748267412} +{"Full-pretrain/Learning Rate": 4.2475399172743134e-05, "Full-pretrain/Loss": 2.059873104095459, "Full-pretrain/Loss (Raw)": 2.160147190093994, "Full-pretrain/Step": 2632, "Full-pretrain/Step Time": 17.62526036053896} +{"Full-pretrain/Learning Rate": 4.246932634889703e-05, "Full-pretrain/Loss": 2.0576400756835938, "Full-pretrain/Loss (Raw)": 1.8776429891586304, "Full-pretrain/Step": 2633, "Full-pretrain/Step Time": 17.619245022535324} +{"Full-pretrain/Learning Rate": 4.246325150997027e-05, "Full-pretrain/Loss": 2.055354595184326, "Full-pretrain/Loss (Raw)": 2.2117481231689453, "Full-pretrain/Step": 2634, "Full-pretrain/Step Time": 17.62228830717504} +{"Full-pretrain/Learning Rate": 4.245717465666359e-05, "Full-pretrain/Loss": 2.054305076599121, "Full-pretrain/Loss (Raw)": 2.0482828617095947, "Full-pretrain/Step": 2635, "Full-pretrain/Step Time": 17.6175118368119} +{"Full-pretrain/Learning Rate": 4.2451095789677945e-05, "Full-pretrain/Loss": 2.057110071182251, "Full-pretrain/Loss (Raw)": 2.0433349609375, "Full-pretrain/Step": 2636, "Full-pretrain/Step Time": 17.623442817479372} +{"Full-pretrain/Learning Rate": 4.244501490971454e-05, "Full-pretrain/Loss": 2.0514960289001465, "Full-pretrain/Loss (Raw)": 1.8867120742797852, "Full-pretrain/Step": 2637, "Full-pretrain/Step Time": 17.624322220683098} +{"Full-pretrain/Learning Rate": 4.243893201747478e-05, "Full-pretrain/Loss": 2.0343403816223145, "Full-pretrain/Loss (Raw)": 1.8025532960891724, "Full-pretrain/Step": 2638, "Full-pretrain/Step Time": 17.616176111623645} +{"Full-pretrain/Learning Rate": 4.2432847113660356e-05, "Full-pretrain/Loss": 2.03446364402771, "Full-pretrain/Loss (Raw)": 1.9779618978500366, "Full-pretrain/Step": 2639, "Full-pretrain/Step Time": 17.615625401958823} +{"Full-pretrain/Learning Rate": 4.242676019897314e-05, "Full-pretrain/Loss": 2.034158229827881, "Full-pretrain/Loss (Raw)": 2.1173667907714844, "Full-pretrain/Step": 2640, "Full-pretrain/Step Time": 17.619198225438595} +{"Full-pretrain/Learning Rate": 4.242067127411526e-05, "Full-pretrain/Loss": 2.017932653427124, "Full-pretrain/Loss (Raw)": 1.794995903968811, "Full-pretrain/Step": 2641, "Full-pretrain/Step Time": 17.62755194865167} +{"Full-pretrain/Learning Rate": 4.241458033978907e-05, "Full-pretrain/Loss": 2.0203919410705566, "Full-pretrain/Loss (Raw)": 2.085937261581421, "Full-pretrain/Step": 2642, "Full-pretrain/Step Time": 17.62771395035088} +{"Full-pretrain/Learning Rate": 4.240848739669715e-05, "Full-pretrain/Loss": 2.015709400177002, "Full-pretrain/Loss (Raw)": 2.1205055713653564, "Full-pretrain/Step": 2643, "Full-pretrain/Step Time": 17.625070121139288} +{"Full-pretrain/Learning Rate": 4.240239244554233e-05, "Full-pretrain/Loss": 2.0043716430664062, "Full-pretrain/Loss (Raw)": 1.982663631439209, "Full-pretrain/Step": 2644, "Full-pretrain/Step Time": 17.627279225736856} +{"Full-pretrain/Learning Rate": 4.239629548702767e-05, "Full-pretrain/Loss": 1.9924378395080566, "Full-pretrain/Loss (Raw)": 1.635244607925415, "Full-pretrain/Step": 2645, "Full-pretrain/Step Time": 17.628906462341547} +{"Full-pretrain/Learning Rate": 4.239019652185642e-05, "Full-pretrain/Loss": 1.9966689348220825, "Full-pretrain/Loss (Raw)": 2.078315496444702, "Full-pretrain/Step": 2646, "Full-pretrain/Step Time": 17.627493623644114} +{"Full-pretrain/Learning Rate": 4.238409555073212e-05, "Full-pretrain/Loss": 2.0023324489593506, "Full-pretrain/Loss (Raw)": 2.044870615005493, "Full-pretrain/Step": 2647, "Full-pretrain/Step Time": 17.62658661417663} +{"Full-pretrain/Learning Rate": 4.237799257435852e-05, "Full-pretrain/Loss": 2.015523672103882, "Full-pretrain/Loss (Raw)": 2.2056305408477783, "Full-pretrain/Step": 2648, "Full-pretrain/Step Time": 17.63194296322763} +{"Full-pretrain/Learning Rate": 4.237188759343956e-05, "Full-pretrain/Loss": 2.013228416442871, "Full-pretrain/Loss (Raw)": 2.109750509262085, "Full-pretrain/Step": 2649, "Full-pretrain/Step Time": 17.634775273501873} +{"Full-pretrain/Learning Rate": 4.236578060867949e-05, "Full-pretrain/Loss": 2.003567695617676, "Full-pretrain/Loss (Raw)": 1.7967009544372559, "Full-pretrain/Step": 2650, "Full-pretrain/Step Time": 17.63750785589218} +{"Full-pretrain/Learning Rate": 4.235967162078272e-05, "Full-pretrain/Loss": 2.0102806091308594, "Full-pretrain/Loss (Raw)": 2.278062105178833, "Full-pretrain/Step": 2651, "Full-pretrain/Step Time": 17.634946098551154} +{"Full-pretrain/Learning Rate": 4.235356063045393e-05, "Full-pretrain/Loss": 2.011164665222168, "Full-pretrain/Loss (Raw)": 2.0124218463897705, "Full-pretrain/Step": 2652, "Full-pretrain/Step Time": 17.633521994575858} +{"Full-pretrain/Learning Rate": 4.234744763839802e-05, "Full-pretrain/Loss": 2.0120766162872314, "Full-pretrain/Loss (Raw)": 1.9794143438339233, "Full-pretrain/Step": 2653, "Full-pretrain/Step Time": 17.634501004591584} +{"Full-pretrain/Learning Rate": 4.234133264532012e-05, "Full-pretrain/Loss": 2.0194175243377686, "Full-pretrain/Loss (Raw)": 2.1480355262756348, "Full-pretrain/Step": 2654, "Full-pretrain/Step Time": 17.63457883708179} +{"Full-pretrain/Learning Rate": 4.2335215651925605e-05, "Full-pretrain/Loss": 2.019188642501831, "Full-pretrain/Loss (Raw)": 1.8756569623947144, "Full-pretrain/Step": 2655, "Full-pretrain/Step Time": 17.633481487631798} +{"Full-pretrain/Learning Rate": 4.2329096658920045e-05, "Full-pretrain/Loss": 2.016663074493408, "Full-pretrain/Loss (Raw)": 2.0215883255004883, "Full-pretrain/Step": 2656, "Full-pretrain/Step Time": 17.632153540849686} +{"Full-pretrain/Learning Rate": 4.232297566700928e-05, "Full-pretrain/Loss": 2.0289340019226074, "Full-pretrain/Loss (Raw)": 2.05621600151062, "Full-pretrain/Step": 2657, "Full-pretrain/Step Time": 17.633026614785194} +{"Full-pretrain/Learning Rate": 4.2316852676899356e-05, "Full-pretrain/Loss": 2.0119173526763916, "Full-pretrain/Loss (Raw)": 1.5470595359802246, "Full-pretrain/Step": 2658, "Full-pretrain/Step Time": 17.633839974179864} +{"Full-pretrain/Learning Rate": 4.231072768929656e-05, "Full-pretrain/Loss": 2.022735118865967, "Full-pretrain/Loss (Raw)": 2.426936149597168, "Full-pretrain/Step": 2659, "Full-pretrain/Step Time": 17.630363104864955} +{"Full-pretrain/Learning Rate": 4.2304600704907414e-05, "Full-pretrain/Loss": 2.0196852684020996, "Full-pretrain/Loss (Raw)": 2.059988498687744, "Full-pretrain/Step": 2660, "Full-pretrain/Step Time": 17.63482043519616} +{"Full-pretrain/Learning Rate": 4.229847172443866e-05, "Full-pretrain/Loss": 2.0097436904907227, "Full-pretrain/Loss (Raw)": 1.8197779655456543, "Full-pretrain/Step": 2661, "Full-pretrain/Step Time": 17.629925835877657} +{"Full-pretrain/Learning Rate": 4.229234074859727e-05, "Full-pretrain/Loss": 2.0072717666625977, "Full-pretrain/Loss (Raw)": 2.0443568229675293, "Full-pretrain/Step": 2662, "Full-pretrain/Step Time": 17.63411009684205} +{"Full-pretrain/Learning Rate": 4.228620777809045e-05, "Full-pretrain/Loss": 2.014350414276123, "Full-pretrain/Loss (Raw)": 2.2093281745910645, "Full-pretrain/Step": 2663, "Full-pretrain/Step Time": 17.629592653363943} +{"Full-pretrain/Learning Rate": 4.2280072813625634e-05, "Full-pretrain/Loss": 2.0086755752563477, "Full-pretrain/Loss (Raw)": 1.9785531759262085, "Full-pretrain/Step": 2664, "Full-pretrain/Step Time": 17.625801671296358} +{"Full-pretrain/Learning Rate": 4.227393585591049e-05, "Full-pretrain/Loss": 2.004434823989868, "Full-pretrain/Loss (Raw)": 1.7419397830963135, "Full-pretrain/Step": 2665, "Full-pretrain/Step Time": 17.623847030103207} +{"Full-pretrain/Learning Rate": 4.2267796905652924e-05, "Full-pretrain/Loss": 1.9992107152938843, "Full-pretrain/Loss (Raw)": 2.0445761680603027, "Full-pretrain/Step": 2666, "Full-pretrain/Step Time": 17.622310480102897} +{"Full-pretrain/Learning Rate": 4.2261655963561044e-05, "Full-pretrain/Loss": 1.9961506128311157, "Full-pretrain/Loss (Raw)": 1.9503626823425293, "Full-pretrain/Step": 2667, "Full-pretrain/Step Time": 17.632339062169194} +{"Full-pretrain/Learning Rate": 4.225551303034322e-05, "Full-pretrain/Loss": 2.001483917236328, "Full-pretrain/Loss (Raw)": 2.2139978408813477, "Full-pretrain/Step": 2668, "Full-pretrain/Step Time": 17.626113967970014} +{"Full-pretrain/Learning Rate": 4.224936810670803e-05, "Full-pretrain/Loss": 2.0102171897888184, "Full-pretrain/Loss (Raw)": 2.1661794185638428, "Full-pretrain/Step": 2669, "Full-pretrain/Step Time": 17.627002956345677} +{"Full-pretrain/Learning Rate": 4.224322119336429e-05, "Full-pretrain/Loss": 2.0042083263397217, "Full-pretrain/Loss (Raw)": 1.6102678775787354, "Full-pretrain/Step": 2670, "Full-pretrain/Step Time": 17.622047528624535} +{"Full-pretrain/Learning Rate": 4.223707229102105e-05, "Full-pretrain/Loss": 2.0042572021484375, "Full-pretrain/Loss (Raw)": 1.979527473449707, "Full-pretrain/Step": 2671, "Full-pretrain/Step Time": 17.62064602598548} +{"Full-pretrain/Learning Rate": 4.223092140038758e-05, "Full-pretrain/Loss": 2.004080295562744, "Full-pretrain/Loss (Raw)": 2.1117124557495117, "Full-pretrain/Step": 2672, "Full-pretrain/Step Time": 17.61851075850427} +{"Full-pretrain/Learning Rate": 4.222476852217338e-05, "Full-pretrain/Loss": 2.0065927505493164, "Full-pretrain/Loss (Raw)": 1.8753931522369385, "Full-pretrain/Step": 2673, "Full-pretrain/Step Time": 17.620718244463205} +{"Full-pretrain/Learning Rate": 4.221861365708818e-05, "Full-pretrain/Loss": 1.9981271028518677, "Full-pretrain/Loss (Raw)": 1.8150337934494019, "Full-pretrain/Step": 2674, "Full-pretrain/Step Time": 17.624831724911928} +{"Full-pretrain/Learning Rate": 4.221245680584194e-05, "Full-pretrain/Loss": 1.9880481958389282, "Full-pretrain/Loss (Raw)": 1.797982096672058, "Full-pretrain/Step": 2675, "Full-pretrain/Step Time": 17.62543674185872} +{"Full-pretrain/Learning Rate": 4.220629796914487e-05, "Full-pretrain/Loss": 1.9847242832183838, "Full-pretrain/Loss (Raw)": 1.8763006925582886, "Full-pretrain/Step": 2676, "Full-pretrain/Step Time": 17.63137307204306} +{"Full-pretrain/Learning Rate": 4.220013714770737e-05, "Full-pretrain/Loss": 1.9934319257736206, "Full-pretrain/Loss (Raw)": 1.9138842821121216, "Full-pretrain/Step": 2677, "Full-pretrain/Step Time": 17.626558551564813} +{"Full-pretrain/Learning Rate": 4.2193974342240096e-05, "Full-pretrain/Loss": 1.9909559488296509, "Full-pretrain/Loss (Raw)": 1.9990862607955933, "Full-pretrain/Step": 2678, "Full-pretrain/Step Time": 17.620589323341846} +{"Full-pretrain/Learning Rate": 4.2187809553453924e-05, "Full-pretrain/Loss": 1.9917137622833252, "Full-pretrain/Loss (Raw)": 2.069120407104492, "Full-pretrain/Step": 2679, "Full-pretrain/Step Time": 17.62435561977327} +{"Full-pretrain/Learning Rate": 4.2181642782059955e-05, "Full-pretrain/Loss": 1.983365535736084, "Full-pretrain/Loss (Raw)": 1.9384852647781372, "Full-pretrain/Step": 2680, "Full-pretrain/Step Time": 17.61652926914394} +{"Full-pretrain/Learning Rate": 4.2175474028769534e-05, "Full-pretrain/Loss": 1.9820308685302734, "Full-pretrain/Loss (Raw)": 2.0670418739318848, "Full-pretrain/Step": 2681, "Full-pretrain/Step Time": 17.618300314992666} +{"Full-pretrain/Learning Rate": 4.2169303294294216e-05, "Full-pretrain/Loss": 1.9834239482879639, "Full-pretrain/Loss (Raw)": 1.841280221939087, "Full-pretrain/Step": 2682, "Full-pretrain/Step Time": 17.61951951868832} +{"Full-pretrain/Learning Rate": 4.21631305793458e-05, "Full-pretrain/Loss": 1.971662998199463, "Full-pretrain/Loss (Raw)": 1.9017095565795898, "Full-pretrain/Step": 2683, "Full-pretrain/Step Time": 17.61575461551547} +{"Full-pretrain/Learning Rate": 4.2156955884636304e-05, "Full-pretrain/Loss": 1.9694238901138306, "Full-pretrain/Loss (Raw)": 1.9407728910446167, "Full-pretrain/Step": 2684, "Full-pretrain/Step Time": 17.61162517219782} +{"Full-pretrain/Learning Rate": 4.215077921087798e-05, "Full-pretrain/Loss": 1.9742940664291382, "Full-pretrain/Loss (Raw)": 2.1352591514587402, "Full-pretrain/Step": 2685, "Full-pretrain/Step Time": 17.61078580096364} +{"Full-pretrain/Learning Rate": 4.214460055878329e-05, "Full-pretrain/Loss": 1.968477487564087, "Full-pretrain/Loss (Raw)": 1.9619081020355225, "Full-pretrain/Step": 2686, "Full-pretrain/Step Time": 17.61150638014078} +{"Full-pretrain/Learning Rate": 4.213841992906496e-05, "Full-pretrain/Loss": 1.973572015762329, "Full-pretrain/Loss (Raw)": 2.038682222366333, "Full-pretrain/Step": 2687, "Full-pretrain/Step Time": 17.610595703125} +{"Full-pretrain/Learning Rate": 4.213223732243591e-05, "Full-pretrain/Loss": 1.977479100227356, "Full-pretrain/Loss (Raw)": 2.146611213684082, "Full-pretrain/Step": 2688, "Full-pretrain/Step Time": 17.61039394699037} +{"Full-pretrain/Learning Rate": 4.21260527396093e-05, "Full-pretrain/Loss": 1.9778692722320557, "Full-pretrain/Loss (Raw)": 2.06870436668396, "Full-pretrain/Step": 2689, "Full-pretrain/Step Time": 17.614221826195717} +{"Full-pretrain/Learning Rate": 4.211986618129854e-05, "Full-pretrain/Loss": 1.9865303039550781, "Full-pretrain/Loss (Raw)": 1.824209213256836, "Full-pretrain/Step": 2690, "Full-pretrain/Step Time": 17.613141991198063} +{"Full-pretrain/Learning Rate": 4.211367764821722e-05, "Full-pretrain/Loss": 1.9670296907424927, "Full-pretrain/Loss (Raw)": 1.8029184341430664, "Full-pretrain/Step": 2691, "Full-pretrain/Step Time": 17.611657243221998} +{"Full-pretrain/Learning Rate": 4.2107487141079206e-05, "Full-pretrain/Loss": 1.962109088897705, "Full-pretrain/Loss (Raw)": 1.9025243520736694, "Full-pretrain/Step": 2692, "Full-pretrain/Step Time": 17.610146053135395} +{"Full-pretrain/Learning Rate": 4.2101294660598556e-05, "Full-pretrain/Loss": 1.9608025550842285, "Full-pretrain/Loss (Raw)": 1.7779756784439087, "Full-pretrain/Step": 2693, "Full-pretrain/Step Time": 17.61954451724887} +{"Full-pretrain/Learning Rate": 4.209510020748957e-05, "Full-pretrain/Loss": 1.9704513549804688, "Full-pretrain/Loss (Raw)": 2.353113889694214, "Full-pretrain/Step": 2694, "Full-pretrain/Step Time": 17.611263254657388} +{"Full-pretrain/Learning Rate": 4.2088903782466795e-05, "Full-pretrain/Loss": 1.9591070413589478, "Full-pretrain/Loss (Raw)": 1.846313238143921, "Full-pretrain/Step": 2695, "Full-pretrain/Step Time": 17.605877056717873} +{"Full-pretrain/Learning Rate": 4.208270538624497e-05, "Full-pretrain/Loss": 1.9625823497772217, "Full-pretrain/Loss (Raw)": 2.0897634029388428, "Full-pretrain/Step": 2696, "Full-pretrain/Step Time": 17.60642060637474} +{"Full-pretrain/Learning Rate": 4.207650501953908e-05, "Full-pretrain/Loss": 1.9706685543060303, "Full-pretrain/Loss (Raw)": 2.0006954669952393, "Full-pretrain/Step": 2697, "Full-pretrain/Step Time": 17.612090418115258} +{"Full-pretrain/Learning Rate": 4.2070302683064345e-05, "Full-pretrain/Loss": 1.9598236083984375, "Full-pretrain/Loss (Raw)": 1.697540044784546, "Full-pretrain/Step": 2698, "Full-pretrain/Step Time": 17.611121136695147} +{"Full-pretrain/Learning Rate": 4.206409837753618e-05, "Full-pretrain/Loss": 1.961097002029419, "Full-pretrain/Loss (Raw)": 1.9911086559295654, "Full-pretrain/Step": 2699, "Full-pretrain/Step Time": 17.60635097324848} +{"Full-pretrain/Learning Rate": 4.2057892103670274e-05, "Full-pretrain/Loss": 1.9530751705169678, "Full-pretrain/Loss (Raw)": 1.957301139831543, "Full-pretrain/Step": 2700, "Full-pretrain/Step Time": 17.595862479880452} +{"Full-pretrain/Learning Rate": 4.205168386218251e-05, "Full-pretrain/Loss": 1.9474241733551025, "Full-pretrain/Loss (Raw)": 1.9853465557098389, "Full-pretrain/Step": 2701, "Full-pretrain/Step Time": 17.60383239760995} +{"Full-pretrain/Learning Rate": 4.2045473653789e-05, "Full-pretrain/Loss": 1.950226068496704, "Full-pretrain/Loss (Raw)": 1.6999268531799316, "Full-pretrain/Step": 2702, "Full-pretrain/Step Time": 17.60622907988727} +{"Full-pretrain/Learning Rate": 4.2039261479206094e-05, "Full-pretrain/Loss": 1.9524916410446167, "Full-pretrain/Loss (Raw)": 2.05202579498291, "Full-pretrain/Step": 2703, "Full-pretrain/Step Time": 17.602410594001412} +{"Full-pretrain/Learning Rate": 4.203304733915036e-05, "Full-pretrain/Loss": 1.9514776468276978, "Full-pretrain/Loss (Raw)": 2.079266309738159, "Full-pretrain/Step": 2704, "Full-pretrain/Step Time": 17.59437165223062} +{"Full-pretrain/Learning Rate": 4.202683123433862e-05, "Full-pretrain/Loss": 1.9476733207702637, "Full-pretrain/Loss (Raw)": 1.753652811050415, "Full-pretrain/Step": 2705, "Full-pretrain/Step Time": 17.59065555036068} +{"Full-pretrain/Learning Rate": 4.202061316548787e-05, "Full-pretrain/Loss": 1.9629414081573486, "Full-pretrain/Loss (Raw)": 2.303609848022461, "Full-pretrain/Step": 2706, "Full-pretrain/Step Time": 17.592714376747608} +{"Full-pretrain/Learning Rate": 4.2014393133315366e-05, "Full-pretrain/Loss": 1.9658268690109253, "Full-pretrain/Loss (Raw)": 1.8903226852416992, "Full-pretrain/Step": 2707, "Full-pretrain/Step Time": 17.590224971994758} +{"Full-pretrain/Learning Rate": 4.20081711385386e-05, "Full-pretrain/Loss": 1.972350835800171, "Full-pretrain/Loss (Raw)": 2.0850658416748047, "Full-pretrain/Step": 2708, "Full-pretrain/Step Time": 17.587395491078496} +{"Full-pretrain/Learning Rate": 4.200194718187527e-05, "Full-pretrain/Loss": 1.9758285284042358, "Full-pretrain/Loss (Raw)": 2.0251712799072266, "Full-pretrain/Step": 2709, "Full-pretrain/Step Time": 17.588235553354025} +{"Full-pretrain/Learning Rate": 4.1995721264043296e-05, "Full-pretrain/Loss": 1.9762568473815918, "Full-pretrain/Loss (Raw)": 2.012788772583008, "Full-pretrain/Step": 2710, "Full-pretrain/Step Time": 17.590524796396494} +{"Full-pretrain/Learning Rate": 4.1989493385760864e-05, "Full-pretrain/Loss": 1.9709895849227905, "Full-pretrain/Loss (Raw)": 1.9005712270736694, "Full-pretrain/Step": 2711, "Full-pretrain/Step Time": 17.592249061912298} +{"Full-pretrain/Learning Rate": 4.198326354774633e-05, "Full-pretrain/Loss": 1.970027208328247, "Full-pretrain/Loss (Raw)": 1.907686710357666, "Full-pretrain/Step": 2712, "Full-pretrain/Step Time": 17.584147298708558} +{"Full-pretrain/Learning Rate": 4.197703175071832e-05, "Full-pretrain/Loss": 1.9691202640533447, "Full-pretrain/Loss (Raw)": 2.038022994995117, "Full-pretrain/Step": 2713, "Full-pretrain/Step Time": 17.586438093334436} +{"Full-pretrain/Learning Rate": 4.197079799539566e-05, "Full-pretrain/Loss": 1.9710254669189453, "Full-pretrain/Loss (Raw)": 1.9022473096847534, "Full-pretrain/Step": 2714, "Full-pretrain/Step Time": 17.588314574211836} +{"Full-pretrain/Learning Rate": 4.196456228249742e-05, "Full-pretrain/Loss": 1.9693961143493652, "Full-pretrain/Loss (Raw)": 1.8495689630508423, "Full-pretrain/Step": 2715, "Full-pretrain/Step Time": 17.586990743875504} +{"Full-pretrain/Learning Rate": 4.1958324612742875e-05, "Full-pretrain/Loss": 1.9719698429107666, "Full-pretrain/Loss (Raw)": 2.023131847381592, "Full-pretrain/Step": 2716, "Full-pretrain/Step Time": 17.58679967932403} +{"Full-pretrain/Learning Rate": 4.195208498685155e-05, "Full-pretrain/Loss": 1.9619733095169067, "Full-pretrain/Loss (Raw)": 1.81536865234375, "Full-pretrain/Step": 2717, "Full-pretrain/Step Time": 17.586089538410306} +{"Full-pretrain/Learning Rate": 4.194584340554318e-05, "Full-pretrain/Loss": 1.945910096168518, "Full-pretrain/Loss (Raw)": 1.44788658618927, "Full-pretrain/Step": 2718, "Full-pretrain/Step Time": 17.58796378597617} +{"Full-pretrain/Learning Rate": 4.193959986953773e-05, "Full-pretrain/Loss": 1.9423571825027466, "Full-pretrain/Loss (Raw)": 1.9249894618988037, "Full-pretrain/Step": 2719, "Full-pretrain/Step Time": 17.583701567724347} +{"Full-pretrain/Learning Rate": 4.193335437955538e-05, "Full-pretrain/Loss": 1.9217514991760254, "Full-pretrain/Loss (Raw)": 1.4872299432754517, "Full-pretrain/Step": 2720, "Full-pretrain/Step Time": 17.59120345674455} +{"Full-pretrain/Learning Rate": 4.192710693631656e-05, "Full-pretrain/Loss": 1.9252853393554688, "Full-pretrain/Loss (Raw)": 2.181788206100464, "Full-pretrain/Step": 2721, "Full-pretrain/Step Time": 17.589079905301332} +{"Full-pretrain/Learning Rate": 4.1920857540541905e-05, "Full-pretrain/Loss": 1.9326450824737549, "Full-pretrain/Loss (Raw)": 2.0597195625305176, "Full-pretrain/Step": 2722, "Full-pretrain/Step Time": 17.596446089446545} +{"Full-pretrain/Learning Rate": 4.191460619295227e-05, "Full-pretrain/Loss": 1.9382351636886597, "Full-pretrain/Loss (Raw)": 1.9818007946014404, "Full-pretrain/Step": 2723, "Full-pretrain/Step Time": 17.58924276009202} +{"Full-pretrain/Learning Rate": 4.1908352894268765e-05, "Full-pretrain/Loss": 1.9472731351852417, "Full-pretrain/Loss (Raw)": 2.191739559173584, "Full-pretrain/Step": 2724, "Full-pretrain/Step Time": 17.58883536607027} +{"Full-pretrain/Learning Rate": 4.190209764521269e-05, "Full-pretrain/Loss": 1.9576890468597412, "Full-pretrain/Loss (Raw)": 2.1112871170043945, "Full-pretrain/Step": 2725, "Full-pretrain/Step Time": 17.589200172573328} +{"Full-pretrain/Learning Rate": 4.1895840446505594e-05, "Full-pretrain/Loss": 1.9506983757019043, "Full-pretrain/Loss (Raw)": 2.1294097900390625, "Full-pretrain/Step": 2726, "Full-pretrain/Step Time": 17.59928110986948} +{"Full-pretrain/Learning Rate": 4.188958129886924e-05, "Full-pretrain/Loss": 1.9484822750091553, "Full-pretrain/Loss (Raw)": 1.7753970623016357, "Full-pretrain/Step": 2727, "Full-pretrain/Step Time": 17.597675194963813} +{"Full-pretrain/Learning Rate": 4.188332020302561e-05, "Full-pretrain/Loss": 1.9325482845306396, "Full-pretrain/Loss (Raw)": 1.579874038696289, "Full-pretrain/Step": 2728, "Full-pretrain/Step Time": 17.598592277616262} +{"Full-pretrain/Learning Rate": 4.1877057159696944e-05, "Full-pretrain/Loss": 1.934038758277893, "Full-pretrain/Loss (Raw)": 2.0483922958374023, "Full-pretrain/Step": 2729, "Full-pretrain/Step Time": 17.598249385133386} +{"Full-pretrain/Learning Rate": 4.187079216960565e-05, "Full-pretrain/Loss": 1.949096441268921, "Full-pretrain/Loss (Raw)": 2.179385185241699, "Full-pretrain/Step": 2730, "Full-pretrain/Step Time": 17.601411117240787} +{"Full-pretrain/Learning Rate": 4.1864525233474414e-05, "Full-pretrain/Loss": 1.9491535425186157, "Full-pretrain/Loss (Raw)": 1.992938756942749, "Full-pretrain/Step": 2731, "Full-pretrain/Step Time": 17.60277619212866} +{"Full-pretrain/Learning Rate": 4.1858256352026125e-05, "Full-pretrain/Loss": 1.950758934020996, "Full-pretrain/Loss (Raw)": 2.0086729526519775, "Full-pretrain/Step": 2732, "Full-pretrain/Step Time": 17.59608587808907} +{"Full-pretrain/Learning Rate": 4.185198552598388e-05, "Full-pretrain/Loss": 1.9491056203842163, "Full-pretrain/Loss (Raw)": 1.932442545890808, "Full-pretrain/Step": 2733, "Full-pretrain/Step Time": 17.597585881128907} +{"Full-pretrain/Learning Rate": 4.184571275607103e-05, "Full-pretrain/Loss": 1.9606614112854004, "Full-pretrain/Loss (Raw)": 2.069709300994873, "Full-pretrain/Step": 2734, "Full-pretrain/Step Time": 17.59904768317938} +{"Full-pretrain/Learning Rate": 4.183943804301114e-05, "Full-pretrain/Loss": 1.9577195644378662, "Full-pretrain/Loss (Raw)": 1.9578903913497925, "Full-pretrain/Step": 2735, "Full-pretrain/Step Time": 17.606476921588182} +{"Full-pretrain/Learning Rate": 4.1833161387527986e-05, "Full-pretrain/Loss": 1.9595367908477783, "Full-pretrain/Loss (Raw)": 2.1374173164367676, "Full-pretrain/Step": 2736, "Full-pretrain/Step Time": 17.60351803712547} +{"Full-pretrain/Learning Rate": 4.182688279034558e-05, "Full-pretrain/Loss": 1.9682745933532715, "Full-pretrain/Loss (Raw)": 2.033264636993408, "Full-pretrain/Step": 2737, "Full-pretrain/Step Time": 17.598320761695504} +{"Full-pretrain/Learning Rate": 4.182060225218816e-05, "Full-pretrain/Loss": 1.9618384838104248, "Full-pretrain/Loss (Raw)": 2.0976476669311523, "Full-pretrain/Step": 2738, "Full-pretrain/Step Time": 17.59943726286292} +{"Full-pretrain/Learning Rate": 4.181431977378018e-05, "Full-pretrain/Loss": 1.9663335084915161, "Full-pretrain/Loss (Raw)": 2.0341649055480957, "Full-pretrain/Step": 2739, "Full-pretrain/Step Time": 17.593480590730906} +{"Full-pretrain/Learning Rate": 4.180803535584632e-05, "Full-pretrain/Loss": 1.955547571182251, "Full-pretrain/Loss (Raw)": 1.7399169206619263, "Full-pretrain/Step": 2740, "Full-pretrain/Step Time": 17.59789370931685} +{"Full-pretrain/Learning Rate": 4.180174899911149e-05, "Full-pretrain/Loss": 1.9599368572235107, "Full-pretrain/Loss (Raw)": 2.165625810623169, "Full-pretrain/Step": 2741, "Full-pretrain/Step Time": 17.594010055065155} +{"Full-pretrain/Learning Rate": 4.179546070430082e-05, "Full-pretrain/Loss": 1.9639430046081543, "Full-pretrain/Loss (Raw)": 2.140984535217285, "Full-pretrain/Step": 2742, "Full-pretrain/Step Time": 17.592706372961402} +{"Full-pretrain/Learning Rate": 4.1789170472139655e-05, "Full-pretrain/Loss": 1.9566690921783447, "Full-pretrain/Loss (Raw)": 1.6678098440170288, "Full-pretrain/Step": 2743, "Full-pretrain/Step Time": 17.594062194228172} +{"Full-pretrain/Learning Rate": 4.178287830335358e-05, "Full-pretrain/Loss": 1.9601494073867798, "Full-pretrain/Loss (Raw)": 2.0190553665161133, "Full-pretrain/Step": 2744, "Full-pretrain/Step Time": 17.59505197778344} +{"Full-pretrain/Learning Rate": 4.177658419866839e-05, "Full-pretrain/Loss": 1.962953805923462, "Full-pretrain/Loss (Raw)": 2.1277647018432617, "Full-pretrain/Step": 2745, "Full-pretrain/Step Time": 17.600130703300238} +{"Full-pretrain/Learning Rate": 4.177028815881011e-05, "Full-pretrain/Loss": 1.9735386371612549, "Full-pretrain/Loss (Raw)": 2.240960121154785, "Full-pretrain/Step": 2746, "Full-pretrain/Step Time": 17.597181636840105} +{"Full-pretrain/Learning Rate": 4.176399018450499e-05, "Full-pretrain/Loss": 1.9673998355865479, "Full-pretrain/Loss (Raw)": 1.6531271934509277, "Full-pretrain/Step": 2747, "Full-pretrain/Step Time": 17.602984711527824} +{"Full-pretrain/Learning Rate": 4.1757690276479476e-05, "Full-pretrain/Loss": 1.9765160083770752, "Full-pretrain/Loss (Raw)": 2.314852714538574, "Full-pretrain/Step": 2748, "Full-pretrain/Step Time": 17.599749583750963} +{"Full-pretrain/Learning Rate": 4.175138843546029e-05, "Full-pretrain/Loss": 1.9824544191360474, "Full-pretrain/Loss (Raw)": 2.0053932666778564, "Full-pretrain/Step": 2749, "Full-pretrain/Step Time": 17.60304538346827} +{"Full-pretrain/Learning Rate": 4.174508466217434e-05, "Full-pretrain/Loss": 1.9981149435043335, "Full-pretrain/Loss (Raw)": 1.9490270614624023, "Full-pretrain/Step": 2750, "Full-pretrain/Step Time": 17.605989703908563} +{"Full-pretrain/Learning Rate": 4.1738778957348744e-05, "Full-pretrain/Loss": 2.001117706298828, "Full-pretrain/Loss (Raw)": 2.021074056625366, "Full-pretrain/Step": 2751, "Full-pretrain/Step Time": 17.604050444439054} +{"Full-pretrain/Learning Rate": 4.173247132171089e-05, "Full-pretrain/Loss": 2.0171751976013184, "Full-pretrain/Loss (Raw)": 2.001070976257324, "Full-pretrain/Step": 2752, "Full-pretrain/Step Time": 17.607878176495433} +{"Full-pretrain/Learning Rate": 4.1726161755988344e-05, "Full-pretrain/Loss": 2.0143284797668457, "Full-pretrain/Loss (Raw)": 2.090696334838867, "Full-pretrain/Step": 2753, "Full-pretrain/Step Time": 17.610552037134767} +{"Full-pretrain/Learning Rate": 4.171985026090892e-05, "Full-pretrain/Loss": 2.012373447418213, "Full-pretrain/Loss (Raw)": 1.9971588850021362, "Full-pretrain/Step": 2754, "Full-pretrain/Step Time": 17.61076195910573} +{"Full-pretrain/Learning Rate": 4.171353683720064e-05, "Full-pretrain/Loss": 2.0170235633850098, "Full-pretrain/Loss (Raw)": 2.1306071281433105, "Full-pretrain/Step": 2755, "Full-pretrain/Step Time": 17.603039637207985} +{"Full-pretrain/Learning Rate": 4.170722148559176e-05, "Full-pretrain/Loss": 2.011162519454956, "Full-pretrain/Loss (Raw)": 2.0041801929473877, "Full-pretrain/Step": 2756, "Full-pretrain/Step Time": 17.608746564015746} +{"Full-pretrain/Learning Rate": 4.1700904206810755e-05, "Full-pretrain/Loss": 1.9986037015914917, "Full-pretrain/Loss (Raw)": 1.7094063758850098, "Full-pretrain/Step": 2757, "Full-pretrain/Step Time": 17.609864197671413} +{"Full-pretrain/Learning Rate": 4.169458500158632e-05, "Full-pretrain/Loss": 1.9895195960998535, "Full-pretrain/Loss (Raw)": 1.838719367980957, "Full-pretrain/Step": 2758, "Full-pretrain/Step Time": 17.612161869183183} +{"Full-pretrain/Learning Rate": 4.168826387064737e-05, "Full-pretrain/Loss": 2.0009889602661133, "Full-pretrain/Loss (Raw)": 2.1424131393432617, "Full-pretrain/Step": 2759, "Full-pretrain/Step Time": 17.604436235502362} +{"Full-pretrain/Learning Rate": 4.168194081472305e-05, "Full-pretrain/Loss": 2.021350622177124, "Full-pretrain/Loss (Raw)": 2.231451988220215, "Full-pretrain/Step": 2760, "Full-pretrain/Step Time": 17.60401718877256} +{"Full-pretrain/Learning Rate": 4.167561583454272e-05, "Full-pretrain/Loss": 2.0296573638916016, "Full-pretrain/Loss (Raw)": 2.314207077026367, "Full-pretrain/Step": 2761, "Full-pretrain/Step Time": 17.60855658352375} +{"Full-pretrain/Learning Rate": 4.166928893083596e-05, "Full-pretrain/Loss": 2.0212655067443848, "Full-pretrain/Loss (Raw)": 1.9108400344848633, "Full-pretrain/Step": 2762, "Full-pretrain/Step Time": 17.609591403976083} +{"Full-pretrain/Learning Rate": 4.166296010433258e-05, "Full-pretrain/Loss": 2.0167319774627686, "Full-pretrain/Loss (Raw)": 1.847869634628296, "Full-pretrain/Step": 2763, "Full-pretrain/Step Time": 17.612969240173697} +{"Full-pretrain/Learning Rate": 4.16566293557626e-05, "Full-pretrain/Loss": 2.0140879154205322, "Full-pretrain/Loss (Raw)": 1.9240667819976807, "Full-pretrain/Step": 2764, "Full-pretrain/Step Time": 17.60955374315381} +{"Full-pretrain/Learning Rate": 4.165029668585629e-05, "Full-pretrain/Loss": 2.016831874847412, "Full-pretrain/Loss (Raw)": 2.02024507522583, "Full-pretrain/Step": 2765, "Full-pretrain/Step Time": 17.610192589461803} +{"Full-pretrain/Learning Rate": 4.164396209534411e-05, "Full-pretrain/Loss": 2.0177979469299316, "Full-pretrain/Loss (Raw)": 2.1006267070770264, "Full-pretrain/Step": 2766, "Full-pretrain/Step Time": 17.609855884686112} +{"Full-pretrain/Learning Rate": 4.163762558495674e-05, "Full-pretrain/Loss": 2.028076171875, "Full-pretrain/Loss (Raw)": 2.2867937088012695, "Full-pretrain/Step": 2767, "Full-pretrain/Step Time": 17.61335190758109} +{"Full-pretrain/Learning Rate": 4.163128715542511e-05, "Full-pretrain/Loss": 2.0241966247558594, "Full-pretrain/Loss (Raw)": 2.0132718086242676, "Full-pretrain/Step": 2768, "Full-pretrain/Step Time": 17.61070016026497} +{"Full-pretrain/Learning Rate": 4.162494680748036e-05, "Full-pretrain/Loss": 2.024026393890381, "Full-pretrain/Loss (Raw)": 2.0278162956237793, "Full-pretrain/Step": 2769, "Full-pretrain/Step Time": 17.60820957645774} +{"Full-pretrain/Learning Rate": 4.1618604541853826e-05, "Full-pretrain/Loss": 2.016995668411255, "Full-pretrain/Loss (Raw)": 1.8726609945297241, "Full-pretrain/Step": 2770, "Full-pretrain/Step Time": 17.61194771155715} +{"Full-pretrain/Learning Rate": 4.1612260359277114e-05, "Full-pretrain/Loss": 2.0212976932525635, "Full-pretrain/Loss (Raw)": 2.171832323074341, "Full-pretrain/Step": 2771, "Full-pretrain/Step Time": 17.6104595400393} +{"Full-pretrain/Learning Rate": 4.160591426048199e-05, "Full-pretrain/Loss": 2.0188674926757812, "Full-pretrain/Loss (Raw)": 1.6621513366699219, "Full-pretrain/Step": 2772, "Full-pretrain/Step Time": 17.610621253028512} +{"Full-pretrain/Learning Rate": 4.1599566246200495e-05, "Full-pretrain/Loss": 2.0092196464538574, "Full-pretrain/Loss (Raw)": 1.8568912744522095, "Full-pretrain/Step": 2773, "Full-pretrain/Step Time": 17.605863012373447} +{"Full-pretrain/Learning Rate": 4.159321631716487e-05, "Full-pretrain/Loss": 2.0019145011901855, "Full-pretrain/Loss (Raw)": 1.9072253704071045, "Full-pretrain/Step": 2774, "Full-pretrain/Step Time": 17.60716519318521} +{"Full-pretrain/Learning Rate": 4.158686447410758e-05, "Full-pretrain/Loss": 2.013162851333618, "Full-pretrain/Loss (Raw)": 2.0277514457702637, "Full-pretrain/Step": 2775, "Full-pretrain/Step Time": 17.606964364647865} +{"Full-pretrain/Learning Rate": 4.158051071776129e-05, "Full-pretrain/Loss": 2.017256259918213, "Full-pretrain/Loss (Raw)": 2.1500449180603027, "Full-pretrain/Step": 2776, "Full-pretrain/Step Time": 17.602422542870045} +{"Full-pretrain/Learning Rate": 4.157415504885893e-05, "Full-pretrain/Loss": 2.016672372817993, "Full-pretrain/Loss (Raw)": 2.109084129333496, "Full-pretrain/Step": 2777, "Full-pretrain/Step Time": 17.60657245479524} +{"Full-pretrain/Learning Rate": 4.156779746813359e-05, "Full-pretrain/Loss": 2.005709409713745, "Full-pretrain/Loss (Raw)": 1.8901437520980835, "Full-pretrain/Step": 2778, "Full-pretrain/Step Time": 17.60246328264475} +{"Full-pretrain/Learning Rate": 4.1561437976318655e-05, "Full-pretrain/Loss": 2.0191738605499268, "Full-pretrain/Loss (Raw)": 2.083987236022949, "Full-pretrain/Step": 2779, "Full-pretrain/Step Time": 17.604354348033667} +{"Full-pretrain/Learning Rate": 4.155507657414766e-05, "Full-pretrain/Loss": 2.008671760559082, "Full-pretrain/Loss (Raw)": 1.9787859916687012, "Full-pretrain/Step": 2780, "Full-pretrain/Step Time": 17.604651981964707} +{"Full-pretrain/Learning Rate": 4.15487132623544e-05, "Full-pretrain/Loss": 2.0077342987060547, "Full-pretrain/Loss (Raw)": 1.9753990173339844, "Full-pretrain/Step": 2781, "Full-pretrain/Step Time": 17.60233366675675} +{"Full-pretrain/Learning Rate": 4.1542348041672884e-05, "Full-pretrain/Loss": 2.007490634918213, "Full-pretrain/Loss (Raw)": 1.9412301778793335, "Full-pretrain/Step": 2782, "Full-pretrain/Step Time": 17.601188607513905} +{"Full-pretrain/Learning Rate": 4.153598091283733e-05, "Full-pretrain/Loss": 2.002260208129883, "Full-pretrain/Loss (Raw)": 1.8537009954452515, "Full-pretrain/Step": 2783, "Full-pretrain/Step Time": 17.60076405853033} +{"Full-pretrain/Learning Rate": 4.15296118765822e-05, "Full-pretrain/Loss": 2.001587390899658, "Full-pretrain/Loss (Raw)": 1.9795349836349487, "Full-pretrain/Step": 2784, "Full-pretrain/Step Time": 17.6028244625777} +{"Full-pretrain/Learning Rate": 4.152324093364213e-05, "Full-pretrain/Loss": 1.9988386631011963, "Full-pretrain/Loss (Raw)": 2.002741813659668, "Full-pretrain/Step": 2785, "Full-pretrain/Step Time": 17.607516018673778} +{"Full-pretrain/Learning Rate": 4.151686808475204e-05, "Full-pretrain/Loss": 1.9968959093093872, "Full-pretrain/Loss (Raw)": 1.9349851608276367, "Full-pretrain/Step": 2786, "Full-pretrain/Step Time": 17.60599630139768} +{"Full-pretrain/Learning Rate": 4.151049333064702e-05, "Full-pretrain/Loss": 1.989296317100525, "Full-pretrain/Loss (Raw)": 1.8874201774597168, "Full-pretrain/Step": 2787, "Full-pretrain/Step Time": 17.60846850462258} +{"Full-pretrain/Learning Rate": 4.1504116672062386e-05, "Full-pretrain/Loss": 1.994450569152832, "Full-pretrain/Loss (Raw)": 2.1691155433654785, "Full-pretrain/Step": 2788, "Full-pretrain/Step Time": 17.60792836174369} +{"Full-pretrain/Learning Rate": 4.14977381097337e-05, "Full-pretrain/Loss": 2.0047085285186768, "Full-pretrain/Loss (Raw)": 2.037667751312256, "Full-pretrain/Step": 2789, "Full-pretrain/Step Time": 17.6069010309875} +{"Full-pretrain/Learning Rate": 4.149135764439672e-05, "Full-pretrain/Loss": 2.005894184112549, "Full-pretrain/Loss (Raw)": 1.876651406288147, "Full-pretrain/Step": 2790, "Full-pretrain/Step Time": 17.606657899916172} +{"Full-pretrain/Learning Rate": 4.1484975276787435e-05, "Full-pretrain/Loss": 1.9960575103759766, "Full-pretrain/Loss (Raw)": 1.8276402950286865, "Full-pretrain/Step": 2791, "Full-pretrain/Step Time": 17.603902600705624} +{"Full-pretrain/Learning Rate": 4.147859100764204e-05, "Full-pretrain/Loss": 1.9989805221557617, "Full-pretrain/Loss (Raw)": 2.324993133544922, "Full-pretrain/Step": 2792, "Full-pretrain/Step Time": 17.607668532058597} +{"Full-pretrain/Learning Rate": 4.1472204837696974e-05, "Full-pretrain/Loss": 1.993520736694336, "Full-pretrain/Loss (Raw)": 2.1394925117492676, "Full-pretrain/Step": 2793, "Full-pretrain/Step Time": 17.61124314367771} +{"Full-pretrain/Learning Rate": 4.146581676768885e-05, "Full-pretrain/Loss": 1.9951115846633911, "Full-pretrain/Loss (Raw)": 1.9617470502853394, "Full-pretrain/Step": 2794, "Full-pretrain/Step Time": 17.612709909677505} +{"Full-pretrain/Learning Rate": 4.145942679835456e-05, "Full-pretrain/Loss": 1.9880545139312744, "Full-pretrain/Loss (Raw)": 1.6220436096191406, "Full-pretrain/Step": 2795, "Full-pretrain/Step Time": 17.60561736486852} +{"Full-pretrain/Learning Rate": 4.145303493043118e-05, "Full-pretrain/Loss": 1.9928513765335083, "Full-pretrain/Loss (Raw)": 2.0775675773620605, "Full-pretrain/Step": 2796, "Full-pretrain/Step Time": 17.610727628692985} +{"Full-pretrain/Learning Rate": 4.1446641164655984e-05, "Full-pretrain/Loss": 1.9942554235458374, "Full-pretrain/Loss (Raw)": 2.065174102783203, "Full-pretrain/Step": 2797, "Full-pretrain/Step Time": 17.61119586415589} +{"Full-pretrain/Learning Rate": 4.144024550176653e-05, "Full-pretrain/Loss": 1.991953730583191, "Full-pretrain/Loss (Raw)": 2.0269699096679688, "Full-pretrain/Step": 2798, "Full-pretrain/Step Time": 17.615291249006987} +{"Full-pretrain/Learning Rate": 4.143384794250052e-05, "Full-pretrain/Loss": 1.9834651947021484, "Full-pretrain/Loss (Raw)": 2.0151658058166504, "Full-pretrain/Step": 2799, "Full-pretrain/Step Time": 17.61793464049697} +{"Full-pretrain/Learning Rate": 4.142744848759593e-05, "Full-pretrain/Loss": 1.9899475574493408, "Full-pretrain/Loss (Raw)": 2.2207064628601074, "Full-pretrain/Step": 2800, "Full-pretrain/Step Time": 17.62290431559086} +{"Full-pretrain/Learning Rate": 4.142104713779093e-05, "Full-pretrain/Loss": 1.9904191493988037, "Full-pretrain/Loss (Raw)": 2.042902708053589, "Full-pretrain/Step": 2801, "Full-pretrain/Step Time": 17.625154362991452} +{"Full-pretrain/Learning Rate": 4.1414643893823914e-05, "Full-pretrain/Loss": 1.9952316284179688, "Full-pretrain/Loss (Raw)": 2.0266623497009277, "Full-pretrain/Step": 2802, "Full-pretrain/Step Time": 17.618280792608857} +{"Full-pretrain/Learning Rate": 4.1408238756433495e-05, "Full-pretrain/Loss": 1.9877835512161255, "Full-pretrain/Loss (Raw)": 1.9334964752197266, "Full-pretrain/Step": 2803, "Full-pretrain/Step Time": 17.619874771684408} +{"Full-pretrain/Learning Rate": 4.14018317263585e-05, "Full-pretrain/Loss": 1.9967738389968872, "Full-pretrain/Loss (Raw)": 1.9498403072357178, "Full-pretrain/Step": 2804, "Full-pretrain/Step Time": 17.619460241869092} +{"Full-pretrain/Learning Rate": 4.1395422804337974e-05, "Full-pretrain/Loss": 2.005197525024414, "Full-pretrain/Loss (Raw)": 2.1264495849609375, "Full-pretrain/Step": 2805, "Full-pretrain/Step Time": 17.622062807902694} +{"Full-pretrain/Learning Rate": 4.1389011991111195e-05, "Full-pretrain/Loss": 1.9996806383132935, "Full-pretrain/Loss (Raw)": 1.7306854724884033, "Full-pretrain/Step": 2806, "Full-pretrain/Step Time": 17.617075568065047} +{"Full-pretrain/Learning Rate": 4.138259928741764e-05, "Full-pretrain/Loss": 1.999864101409912, "Full-pretrain/Loss (Raw)": 2.033618927001953, "Full-pretrain/Step": 2807, "Full-pretrain/Step Time": 17.61687334254384} +{"Full-pretrain/Learning Rate": 4.137618469399702e-05, "Full-pretrain/Loss": 1.9952192306518555, "Full-pretrain/Loss (Raw)": 2.001411199569702, "Full-pretrain/Step": 2808, "Full-pretrain/Step Time": 17.615556394681334} +{"Full-pretrain/Learning Rate": 4.136976821158924e-05, "Full-pretrain/Loss": 1.9986637830734253, "Full-pretrain/Loss (Raw)": 2.2193076610565186, "Full-pretrain/Step": 2809, "Full-pretrain/Step Time": 17.6157659124583} +{"Full-pretrain/Learning Rate": 4.1363349840934464e-05, "Full-pretrain/Loss": 1.9984220266342163, "Full-pretrain/Loss (Raw)": 1.8824118375778198, "Full-pretrain/Step": 2810, "Full-pretrain/Step Time": 17.60960776358843} +{"Full-pretrain/Learning Rate": 4.135692958277302e-05, "Full-pretrain/Loss": 1.995105266571045, "Full-pretrain/Loss (Raw)": 1.9778461456298828, "Full-pretrain/Step": 2811, "Full-pretrain/Step Time": 17.613692827522755} +{"Full-pretrain/Learning Rate": 4.13505074378455e-05, "Full-pretrain/Loss": 2.0001466274261475, "Full-pretrain/Loss (Raw)": 2.1401100158691406, "Full-pretrain/Step": 2812, "Full-pretrain/Step Time": 17.612036814913154} +{"Full-pretrain/Learning Rate": 4.13440834068927e-05, "Full-pretrain/Loss": 1.995347499847412, "Full-pretrain/Loss (Raw)": 1.8218283653259277, "Full-pretrain/Step": 2813, "Full-pretrain/Step Time": 17.61539184115827} +{"Full-pretrain/Learning Rate": 4.133765749065562e-05, "Full-pretrain/Loss": 1.9968286752700806, "Full-pretrain/Loss (Raw)": 1.9886283874511719, "Full-pretrain/Step": 2814, "Full-pretrain/Step Time": 17.618187088519335} +{"Full-pretrain/Learning Rate": 4.133122968987549e-05, "Full-pretrain/Loss": 2.000063896179199, "Full-pretrain/Loss (Raw)": 1.9572312831878662, "Full-pretrain/Step": 2815, "Full-pretrain/Step Time": 17.615084301680326} +{"Full-pretrain/Learning Rate": 4.1324800005293754e-05, "Full-pretrain/Loss": 1.9996669292449951, "Full-pretrain/Loss (Raw)": 1.9668257236480713, "Full-pretrain/Step": 2816, "Full-pretrain/Step Time": 17.618079498410225} +{"Full-pretrain/Learning Rate": 4.131836843765207e-05, "Full-pretrain/Loss": 2.0010530948638916, "Full-pretrain/Loss (Raw)": 2.0471012592315674, "Full-pretrain/Step": 2817, "Full-pretrain/Step Time": 17.6209654584527} +{"Full-pretrain/Learning Rate": 4.131193498769232e-05, "Full-pretrain/Loss": 2.012350082397461, "Full-pretrain/Loss (Raw)": 2.296490430831909, "Full-pretrain/Step": 2818, "Full-pretrain/Step Time": 17.620268082246184} +{"Full-pretrain/Learning Rate": 4.130549965615662e-05, "Full-pretrain/Loss": 2.014457941055298, "Full-pretrain/Loss (Raw)": 1.9548709392547607, "Full-pretrain/Step": 2819, "Full-pretrain/Step Time": 17.614159086719155} +{"Full-pretrain/Learning Rate": 4.129906244378724e-05, "Full-pretrain/Loss": 2.010511636734009, "Full-pretrain/Loss (Raw)": 2.0428342819213867, "Full-pretrain/Step": 2820, "Full-pretrain/Step Time": 17.613786105066538} +{"Full-pretrain/Learning Rate": 4.129262335132675e-05, "Full-pretrain/Loss": 2.001199960708618, "Full-pretrain/Loss (Raw)": 1.739693522453308, "Full-pretrain/Step": 2821, "Full-pretrain/Step Time": 17.61610764823854} +{"Full-pretrain/Learning Rate": 4.128618237951788e-05, "Full-pretrain/Loss": 2.0018417835235596, "Full-pretrain/Loss (Raw)": 1.897192358970642, "Full-pretrain/Step": 2822, "Full-pretrain/Step Time": 17.61892074160278} +{"Full-pretrain/Learning Rate": 4.1279739529103586e-05, "Full-pretrain/Loss": 2.0183277130126953, "Full-pretrain/Loss (Raw)": 2.3551924228668213, "Full-pretrain/Step": 2823, "Full-pretrain/Step Time": 17.615195084363222} +{"Full-pretrain/Learning Rate": 4.127329480082708e-05, "Full-pretrain/Loss": 2.0130796432495117, "Full-pretrain/Loss (Raw)": 2.1570539474487305, "Full-pretrain/Step": 2824, "Full-pretrain/Step Time": 17.61257185973227} +{"Full-pretrain/Learning Rate": 4.126684819543172e-05, "Full-pretrain/Loss": 2.006042242050171, "Full-pretrain/Loss (Raw)": 1.914291262626648, "Full-pretrain/Step": 2825, "Full-pretrain/Step Time": 17.61059719324112} +{"Full-pretrain/Learning Rate": 4.126039971366114e-05, "Full-pretrain/Loss": 2.008342981338501, "Full-pretrain/Loss (Raw)": 2.0353715419769287, "Full-pretrain/Step": 2826, "Full-pretrain/Step Time": 17.612787483260036} +{"Full-pretrain/Learning Rate": 4.1253949356259166e-05, "Full-pretrain/Loss": 2.015666961669922, "Full-pretrain/Loss (Raw)": 1.856416940689087, "Full-pretrain/Step": 2827, "Full-pretrain/Step Time": 17.606468411162496} +{"Full-pretrain/Learning Rate": 4.1247497123969844e-05, "Full-pretrain/Loss": 2.021728992462158, "Full-pretrain/Loss (Raw)": 2.27154803276062, "Full-pretrain/Step": 2828, "Full-pretrain/Step Time": 17.60602475889027} +{"Full-pretrain/Learning Rate": 4.124104301753745e-05, "Full-pretrain/Loss": 2.018237352371216, "Full-pretrain/Loss (Raw)": 1.953439712524414, "Full-pretrain/Step": 2829, "Full-pretrain/Step Time": 17.601736407727003} +{"Full-pretrain/Learning Rate": 4.123458703770645e-05, "Full-pretrain/Loss": 2.0095372200012207, "Full-pretrain/Loss (Raw)": 1.7485604286193848, "Full-pretrain/Step": 2830, "Full-pretrain/Step Time": 17.6055427826941} +{"Full-pretrain/Learning Rate": 4.122812918522153e-05, "Full-pretrain/Loss": 2.0090723037719727, "Full-pretrain/Loss (Raw)": 2.0002989768981934, "Full-pretrain/Step": 2831, "Full-pretrain/Step Time": 17.59855636022985} +{"Full-pretrain/Learning Rate": 4.122166946082762e-05, "Full-pretrain/Loss": 2.0077433586120605, "Full-pretrain/Loss (Raw)": 2.178170680999756, "Full-pretrain/Step": 2832, "Full-pretrain/Step Time": 17.60238029435277} +{"Full-pretrain/Learning Rate": 4.1215207865269835e-05, "Full-pretrain/Loss": 2.005077838897705, "Full-pretrain/Loss (Raw)": 1.9576082229614258, "Full-pretrain/Step": 2833, "Full-pretrain/Step Time": 17.604639168828726} +{"Full-pretrain/Learning Rate": 4.120874439929352e-05, "Full-pretrain/Loss": 2.007564067840576, "Full-pretrain/Loss (Raw)": 2.106226921081543, "Full-pretrain/Step": 2834, "Full-pretrain/Step Time": 17.604044549167156} +{"Full-pretrain/Learning Rate": 4.120227906364423e-05, "Full-pretrain/Loss": 2.023670196533203, "Full-pretrain/Loss (Raw)": 2.4488906860351562, "Full-pretrain/Step": 2835, "Full-pretrain/Step Time": 17.599160028621554} +{"Full-pretrain/Learning Rate": 4.1195811859067754e-05, "Full-pretrain/Loss": 2.022282600402832, "Full-pretrain/Loss (Raw)": 1.9054335355758667, "Full-pretrain/Step": 2836, "Full-pretrain/Step Time": 17.603901118040085} +{"Full-pretrain/Learning Rate": 4.118934278631007e-05, "Full-pretrain/Loss": 2.014552593231201, "Full-pretrain/Loss (Raw)": 1.8790949583053589, "Full-pretrain/Step": 2837, "Full-pretrain/Step Time": 17.604740388691425} +{"Full-pretrain/Learning Rate": 4.1182871846117375e-05, "Full-pretrain/Loss": 2.030956506729126, "Full-pretrain/Loss (Raw)": 2.2556090354919434, "Full-pretrain/Step": 2838, "Full-pretrain/Step Time": 17.60382964089513} +{"Full-pretrain/Learning Rate": 4.1176399039236116e-05, "Full-pretrain/Loss": 2.035431146621704, "Full-pretrain/Loss (Raw)": 2.1768076419830322, "Full-pretrain/Step": 2839, "Full-pretrain/Step Time": 17.603911800310016} +{"Full-pretrain/Learning Rate": 4.11699243664129e-05, "Full-pretrain/Loss": 2.0318403244018555, "Full-pretrain/Loss (Raw)": 1.8865070343017578, "Full-pretrain/Step": 2840, "Full-pretrain/Step Time": 17.60047190450132} +{"Full-pretrain/Learning Rate": 4.116344782839459e-05, "Full-pretrain/Loss": 2.025752305984497, "Full-pretrain/Loss (Raw)": 2.024489164352417, "Full-pretrain/Step": 2841, "Full-pretrain/Step Time": 17.602867051959038} +{"Full-pretrain/Learning Rate": 4.115696942592826e-05, "Full-pretrain/Loss": 2.0283126831054688, "Full-pretrain/Loss (Raw)": 1.964339017868042, "Full-pretrain/Step": 2842, "Full-pretrain/Step Time": 17.605908872559667} +{"Full-pretrain/Learning Rate": 4.115048915976118e-05, "Full-pretrain/Loss": 2.0236573219299316, "Full-pretrain/Loss (Raw)": 1.828873872756958, "Full-pretrain/Step": 2843, "Full-pretrain/Step Time": 17.606810504570603} +{"Full-pretrain/Learning Rate": 4.114400703064085e-05, "Full-pretrain/Loss": 2.018688201904297, "Full-pretrain/Loss (Raw)": 1.9811022281646729, "Full-pretrain/Step": 2844, "Full-pretrain/Step Time": 17.59621648862958} +{"Full-pretrain/Learning Rate": 4.1137523039314994e-05, "Full-pretrain/Loss": 2.024226427078247, "Full-pretrain/Loss (Raw)": 1.9990510940551758, "Full-pretrain/Step": 2845, "Full-pretrain/Step Time": 17.599042842164636} +{"Full-pretrain/Learning Rate": 4.113103718653152e-05, "Full-pretrain/Loss": 2.025800943374634, "Full-pretrain/Loss (Raw)": 2.0390124320983887, "Full-pretrain/Step": 2846, "Full-pretrain/Step Time": 17.598610546439886} +{"Full-pretrain/Learning Rate": 4.112454947303856e-05, "Full-pretrain/Loss": 2.025848865509033, "Full-pretrain/Loss (Raw)": 1.9587624073028564, "Full-pretrain/Step": 2847, "Full-pretrain/Step Time": 17.603076998144388} +{"Full-pretrain/Learning Rate": 4.111805989958451e-05, "Full-pretrain/Loss": 2.024355888366699, "Full-pretrain/Loss (Raw)": 1.919055700302124, "Full-pretrain/Step": 2848, "Full-pretrain/Step Time": 17.594989977777004} +{"Full-pretrain/Learning Rate": 4.11115684669179e-05, "Full-pretrain/Loss": 2.0221364498138428, "Full-pretrain/Loss (Raw)": 1.9760725498199463, "Full-pretrain/Step": 2849, "Full-pretrain/Step Time": 17.591785233467817} +{"Full-pretrain/Learning Rate": 4.110507517578753e-05, "Full-pretrain/Loss": 2.0182671546936035, "Full-pretrain/Loss (Raw)": 2.1726837158203125, "Full-pretrain/Step": 2850, "Full-pretrain/Step Time": 17.58796489611268} +{"Full-pretrain/Learning Rate": 4.10985800269424e-05, "Full-pretrain/Loss": 2.0185060501098633, "Full-pretrain/Loss (Raw)": 1.9625118970870972, "Full-pretrain/Step": 2851, "Full-pretrain/Step Time": 17.590031884610653} +{"Full-pretrain/Learning Rate": 4.109208302113173e-05, "Full-pretrain/Loss": 2.0176262855529785, "Full-pretrain/Loss (Raw)": 2.014683723449707, "Full-pretrain/Step": 2852, "Full-pretrain/Step Time": 17.584726724773645} +{"Full-pretrain/Learning Rate": 4.108558415910493e-05, "Full-pretrain/Loss": 2.0307705402374268, "Full-pretrain/Loss (Raw)": 2.160301685333252, "Full-pretrain/Step": 2853, "Full-pretrain/Step Time": 17.58230678923428} +{"Full-pretrain/Learning Rate": 4.107908344161165e-05, "Full-pretrain/Loss": 2.0389389991760254, "Full-pretrain/Loss (Raw)": 2.1585893630981445, "Full-pretrain/Step": 2854, "Full-pretrain/Step Time": 17.579089649021626} +{"Full-pretrain/Learning Rate": 4.107258086940174e-05, "Full-pretrain/Loss": 2.0282678604125977, "Full-pretrain/Loss (Raw)": 2.0137150287628174, "Full-pretrain/Step": 2855, "Full-pretrain/Step Time": 17.576967876404524} +{"Full-pretrain/Learning Rate": 4.106607644322529e-05, "Full-pretrain/Loss": 2.029088020324707, "Full-pretrain/Loss (Raw)": 2.1833038330078125, "Full-pretrain/Step": 2856, "Full-pretrain/Step Time": 17.574570581316948} +{"Full-pretrain/Learning Rate": 4.105957016383256e-05, "Full-pretrain/Loss": 2.0307586193084717, "Full-pretrain/Loss (Raw)": 1.9677385091781616, "Full-pretrain/Step": 2857, "Full-pretrain/Step Time": 17.571198949590325} +{"Full-pretrain/Learning Rate": 4.1053062031974055e-05, "Full-pretrain/Loss": 2.0253238677978516, "Full-pretrain/Loss (Raw)": 1.8614615201950073, "Full-pretrain/Step": 2858, "Full-pretrain/Step Time": 17.578767837956548} +{"Full-pretrain/Learning Rate": 4.104655204840048e-05, "Full-pretrain/Loss": 2.0316848754882812, "Full-pretrain/Loss (Raw)": 2.059965133666992, "Full-pretrain/Step": 2859, "Full-pretrain/Step Time": 17.579220842570066} +{"Full-pretrain/Learning Rate": 4.104004021386277e-05, "Full-pretrain/Loss": 2.0196492671966553, "Full-pretrain/Loss (Raw)": 1.8864142894744873, "Full-pretrain/Step": 2860, "Full-pretrain/Step Time": 17.581843899562955} +{"Full-pretrain/Learning Rate": 4.1033526529112064e-05, "Full-pretrain/Loss": 2.0234274864196777, "Full-pretrain/Loss (Raw)": 2.074340343475342, "Full-pretrain/Step": 2861, "Full-pretrain/Step Time": 17.58290956541896} +{"Full-pretrain/Learning Rate": 4.1027010994899705e-05, "Full-pretrain/Loss": 2.026315689086914, "Full-pretrain/Loss (Raw)": 1.84098219871521, "Full-pretrain/Step": 2862, "Full-pretrain/Step Time": 17.583578119054437} +{"Full-pretrain/Learning Rate": 4.1020493611977265e-05, "Full-pretrain/Loss": 2.024473190307617, "Full-pretrain/Loss (Raw)": 1.9413423538208008, "Full-pretrain/Step": 2863, "Full-pretrain/Step Time": 17.57800423167646} +{"Full-pretrain/Learning Rate": 4.10139743810965e-05, "Full-pretrain/Loss": 2.0208311080932617, "Full-pretrain/Loss (Raw)": 2.0616254806518555, "Full-pretrain/Step": 2864, "Full-pretrain/Step Time": 17.577191503718495} +{"Full-pretrain/Learning Rate": 4.100745330300943e-05, "Full-pretrain/Loss": 2.012434720993042, "Full-pretrain/Loss (Raw)": 1.6889240741729736, "Full-pretrain/Step": 2865, "Full-pretrain/Step Time": 17.58119356445968} +{"Full-pretrain/Learning Rate": 4.100093037846825e-05, "Full-pretrain/Loss": 2.0144572257995605, "Full-pretrain/Loss (Raw)": 2.1709494590759277, "Full-pretrain/Step": 2866, "Full-pretrain/Step Time": 17.580798571929336} +{"Full-pretrain/Learning Rate": 4.099440560822536e-05, "Full-pretrain/Loss": 2.0113353729248047, "Full-pretrain/Loss (Raw)": 2.348987340927124, "Full-pretrain/Step": 2867, "Full-pretrain/Step Time": 17.58297067321837} +{"Full-pretrain/Learning Rate": 4.0987878993033415e-05, "Full-pretrain/Loss": 2.011043071746826, "Full-pretrain/Loss (Raw)": 1.8960766792297363, "Full-pretrain/Step": 2868, "Full-pretrain/Step Time": 17.579460214823484} +{"Full-pretrain/Learning Rate": 4.098135053364525e-05, "Full-pretrain/Loss": 2.0171995162963867, "Full-pretrain/Loss (Raw)": 2.0761022567749023, "Full-pretrain/Step": 2869, "Full-pretrain/Step Time": 17.580561321228743} +{"Full-pretrain/Learning Rate": 4.097482023081391e-05, "Full-pretrain/Loss": 2.011800527572632, "Full-pretrain/Loss (Raw)": 2.0828447341918945, "Full-pretrain/Step": 2870, "Full-pretrain/Step Time": 17.588667321950197} +{"Full-pretrain/Learning Rate": 4.096828808529267e-05, "Full-pretrain/Loss": 2.0090184211730957, "Full-pretrain/Loss (Raw)": 2.0877842903137207, "Full-pretrain/Step": 2871, "Full-pretrain/Step Time": 17.58856094069779} +{"Full-pretrain/Learning Rate": 4.0961754097835015e-05, "Full-pretrain/Loss": 2.0132393836975098, "Full-pretrain/Loss (Raw)": 2.0215721130371094, "Full-pretrain/Step": 2872, "Full-pretrain/Step Time": 17.58513300307095} +{"Full-pretrain/Learning Rate": 4.0955218269194626e-05, "Full-pretrain/Loss": 2.0095107555389404, "Full-pretrain/Loss (Raw)": 1.905174970626831, "Full-pretrain/Step": 2873, "Full-pretrain/Step Time": 17.58419211022556} +{"Full-pretrain/Learning Rate": 4.0948680600125433e-05, "Full-pretrain/Loss": 2.0197954177856445, "Full-pretrain/Loss (Raw)": 2.293447971343994, "Full-pretrain/Step": 2874, "Full-pretrain/Step Time": 17.587562683969736} +{"Full-pretrain/Learning Rate": 4.094214109138153e-05, "Full-pretrain/Loss": 2.0295493602752686, "Full-pretrain/Loss (Raw)": 2.1409974098205566, "Full-pretrain/Step": 2875, "Full-pretrain/Step Time": 17.584157343953848} +{"Full-pretrain/Learning Rate": 4.093559974371725e-05, "Full-pretrain/Loss": 2.0245206356048584, "Full-pretrain/Loss (Raw)": 1.8201878070831299, "Full-pretrain/Step": 2876, "Full-pretrain/Step Time": 17.58504919707775} +{"Full-pretrain/Learning Rate": 4.092905655788714e-05, "Full-pretrain/Loss": 2.020069122314453, "Full-pretrain/Loss (Raw)": 1.856600284576416, "Full-pretrain/Step": 2877, "Full-pretrain/Step Time": 17.57741385139525} +{"Full-pretrain/Learning Rate": 4.092251153464595e-05, "Full-pretrain/Loss": 2.0164523124694824, "Full-pretrain/Loss (Raw)": 1.923269510269165, "Full-pretrain/Step": 2878, "Full-pretrain/Step Time": 17.579320169985294} +{"Full-pretrain/Learning Rate": 4.091596467474866e-05, "Full-pretrain/Loss": 2.014492988586426, "Full-pretrain/Loss (Raw)": 1.8960692882537842, "Full-pretrain/Step": 2879, "Full-pretrain/Step Time": 17.580752139911056} +{"Full-pretrain/Learning Rate": 4.0909415978950434e-05, "Full-pretrain/Loss": 2.016509532928467, "Full-pretrain/Loss (Raw)": 1.9835851192474365, "Full-pretrain/Step": 2880, "Full-pretrain/Step Time": 17.576023070141673} +{"Full-pretrain/Learning Rate": 4.0902865448006665e-05, "Full-pretrain/Loss": 2.0180890560150146, "Full-pretrain/Loss (Raw)": 2.0266127586364746, "Full-pretrain/Step": 2881, "Full-pretrain/Step Time": 17.57459664903581} +{"Full-pretrain/Learning Rate": 4.0896313082672956e-05, "Full-pretrain/Loss": 2.0082621574401855, "Full-pretrain/Loss (Raw)": 1.85822331905365, "Full-pretrain/Step": 2882, "Full-pretrain/Step Time": 17.579597963020205} +{"Full-pretrain/Learning Rate": 4.088975888370512e-05, "Full-pretrain/Loss": 2.010039806365967, "Full-pretrain/Loss (Raw)": 2.0194027423858643, "Full-pretrain/Step": 2883, "Full-pretrain/Step Time": 17.576903400942683} +{"Full-pretrain/Learning Rate": 4.088320285185918e-05, "Full-pretrain/Loss": 2.025531053543091, "Full-pretrain/Loss (Raw)": 2.5104031562805176, "Full-pretrain/Step": 2884, "Full-pretrain/Step Time": 17.566406592726707} +{"Full-pretrain/Learning Rate": 4.087664498789137e-05, "Full-pretrain/Loss": 2.0165295600891113, "Full-pretrain/Loss (Raw)": 1.8722517490386963, "Full-pretrain/Step": 2885, "Full-pretrain/Step Time": 17.572798194363713} +{"Full-pretrain/Learning Rate": 4.0870085292558145e-05, "Full-pretrain/Loss": 2.010366439819336, "Full-pretrain/Loss (Raw)": 1.9613745212554932, "Full-pretrain/Step": 2886, "Full-pretrain/Step Time": 17.57584731094539} +{"Full-pretrain/Learning Rate": 4.0863523766616157e-05, "Full-pretrain/Loss": 2.017432689666748, "Full-pretrain/Loss (Raw)": 2.239833116531372, "Full-pretrain/Step": 2887, "Full-pretrain/Step Time": 17.577462643384933} +{"Full-pretrain/Learning Rate": 4.085696041082228e-05, "Full-pretrain/Loss": 2.026130199432373, "Full-pretrain/Loss (Raw)": 2.4616243839263916, "Full-pretrain/Step": 2888, "Full-pretrain/Step Time": 17.57257517799735} +{"Full-pretrain/Learning Rate": 4.085039522593358e-05, "Full-pretrain/Loss": 2.0357513427734375, "Full-pretrain/Loss (Raw)": 2.275618076324463, "Full-pretrain/Step": 2889, "Full-pretrain/Step Time": 17.571375904604793} +{"Full-pretrain/Learning Rate": 4.084382821270737e-05, "Full-pretrain/Loss": 2.04190731048584, "Full-pretrain/Loss (Raw)": 2.058445453643799, "Full-pretrain/Step": 2890, "Full-pretrain/Step Time": 17.577759757637978} +{"Full-pretrain/Learning Rate": 4.083725937190115e-05, "Full-pretrain/Loss": 2.0389838218688965, "Full-pretrain/Loss (Raw)": 1.9664173126220703, "Full-pretrain/Step": 2891, "Full-pretrain/Step Time": 17.578197229653597} +{"Full-pretrain/Learning Rate": 4.083068870427262e-05, "Full-pretrain/Loss": 2.047891616821289, "Full-pretrain/Loss (Raw)": 2.1714601516723633, "Full-pretrain/Step": 2892, "Full-pretrain/Step Time": 17.571814998984337} +{"Full-pretrain/Learning Rate": 4.082411621057971e-05, "Full-pretrain/Loss": 2.0498476028442383, "Full-pretrain/Loss (Raw)": 2.136930465698242, "Full-pretrain/Step": 2893, "Full-pretrain/Step Time": 17.571365494281054} +{"Full-pretrain/Learning Rate": 4.081754189158056e-05, "Full-pretrain/Loss": 2.0548338890075684, "Full-pretrain/Loss (Raw)": 2.00054669380188, "Full-pretrain/Step": 2894, "Full-pretrain/Step Time": 17.57920570485294} +{"Full-pretrain/Learning Rate": 4.081096574803351e-05, "Full-pretrain/Loss": 2.06270432472229, "Full-pretrain/Loss (Raw)": 2.193194627761841, "Full-pretrain/Step": 2895, "Full-pretrain/Step Time": 17.578946985304356} +{"Full-pretrain/Learning Rate": 4.080438778069711e-05, "Full-pretrain/Loss": 2.0665459632873535, "Full-pretrain/Loss (Raw)": 2.184560775756836, "Full-pretrain/Step": 2896, "Full-pretrain/Step Time": 17.572597285732627} +{"Full-pretrain/Learning Rate": 4.0797807990330136e-05, "Full-pretrain/Loss": 2.0732131004333496, "Full-pretrain/Loss (Raw)": 1.902266502380371, "Full-pretrain/Step": 2897, "Full-pretrain/Step Time": 17.574066001921892} +{"Full-pretrain/Learning Rate": 4.079122637769157e-05, "Full-pretrain/Loss": 2.068582057952881, "Full-pretrain/Loss (Raw)": 2.0227608680725098, "Full-pretrain/Step": 2898, "Full-pretrain/Step Time": 17.577730055898428} +{"Full-pretrain/Learning Rate": 4.078464294354059e-05, "Full-pretrain/Loss": 2.0537467002868652, "Full-pretrain/Loss (Raw)": 1.874251365661621, "Full-pretrain/Step": 2899, "Full-pretrain/Step Time": 17.583094388246536} +{"Full-pretrain/Learning Rate": 4.07780576886366e-05, "Full-pretrain/Loss": 2.051992416381836, "Full-pretrain/Loss (Raw)": 1.8399442434310913, "Full-pretrain/Step": 2900, "Full-pretrain/Step Time": 17.580118127167225} +{"Full-pretrain/Learning Rate": 4.077147061373918e-05, "Full-pretrain/Loss": 2.0468506813049316, "Full-pretrain/Loss (Raw)": 1.9115709066390991, "Full-pretrain/Step": 2901, "Full-pretrain/Step Time": 17.57913699001074} +{"Full-pretrain/Learning Rate": 4.0764881719608185e-05, "Full-pretrain/Loss": 2.043274402618408, "Full-pretrain/Loss (Raw)": 1.9683979749679565, "Full-pretrain/Step": 2902, "Full-pretrain/Step Time": 17.587963227182627} +{"Full-pretrain/Learning Rate": 4.0758291007003615e-05, "Full-pretrain/Loss": 2.0326545238494873, "Full-pretrain/Loss (Raw)": 1.7479503154754639, "Full-pretrain/Step": 2903, "Full-pretrain/Step Time": 17.587477320805192} +{"Full-pretrain/Learning Rate": 4.075169847668572e-05, "Full-pretrain/Loss": 2.0357282161712646, "Full-pretrain/Loss (Raw)": 2.1199264526367188, "Full-pretrain/Step": 2904, "Full-pretrain/Step Time": 17.589557433500886} +{"Full-pretrain/Learning Rate": 4.074510412941493e-05, "Full-pretrain/Loss": 2.0367488861083984, "Full-pretrain/Loss (Raw)": 1.9378366470336914, "Full-pretrain/Step": 2905, "Full-pretrain/Step Time": 17.580626813694835} +{"Full-pretrain/Learning Rate": 4.073850796595192e-05, "Full-pretrain/Loss": 2.0244123935699463, "Full-pretrain/Loss (Raw)": 1.8986836671829224, "Full-pretrain/Step": 2906, "Full-pretrain/Step Time": 17.586082354187965} +{"Full-pretrain/Learning Rate": 4.073190998705755e-05, "Full-pretrain/Loss": 2.021362543106079, "Full-pretrain/Loss (Raw)": 2.0434021949768066, "Full-pretrain/Step": 2907, "Full-pretrain/Step Time": 17.588504143059254} +{"Full-pretrain/Learning Rate": 4.0725310193492895e-05, "Full-pretrain/Loss": 2.0315780639648438, "Full-pretrain/Loss (Raw)": 2.1470837593078613, "Full-pretrain/Step": 2908, "Full-pretrain/Step Time": 17.586599493399262} +{"Full-pretrain/Learning Rate": 4.0718708586019225e-05, "Full-pretrain/Loss": 2.037393569946289, "Full-pretrain/Loss (Raw)": 2.042698860168457, "Full-pretrain/Step": 2909, "Full-pretrain/Step Time": 17.58923148550093} +{"Full-pretrain/Learning Rate": 4.071210516539804e-05, "Full-pretrain/Loss": 2.0510895252227783, "Full-pretrain/Loss (Raw)": 2.361539363861084, "Full-pretrain/Step": 2910, "Full-pretrain/Step Time": 17.593708900734782} +{"Full-pretrain/Learning Rate": 4.070549993239106e-05, "Full-pretrain/Loss": 2.0428740978240967, "Full-pretrain/Loss (Raw)": 1.6331732273101807, "Full-pretrain/Step": 2911, "Full-pretrain/Step Time": 17.597281532362103} +{"Full-pretrain/Learning Rate": 4.069889288776018e-05, "Full-pretrain/Loss": 2.042553424835205, "Full-pretrain/Loss (Raw)": 1.973329782485962, "Full-pretrain/Step": 2912, "Full-pretrain/Step Time": 17.598256638273597} +{"Full-pretrain/Learning Rate": 4.0692284032267516e-05, "Full-pretrain/Loss": 2.032949209213257, "Full-pretrain/Loss (Raw)": 1.719268798828125, "Full-pretrain/Step": 2913, "Full-pretrain/Step Time": 17.58658318594098} +{"Full-pretrain/Learning Rate": 4.06856733666754e-05, "Full-pretrain/Loss": 2.054020404815674, "Full-pretrain/Loss (Raw)": 2.532501697540283, "Full-pretrain/Step": 2914, "Full-pretrain/Step Time": 17.591487424448133} +{"Full-pretrain/Learning Rate": 4.0679060891746386e-05, "Full-pretrain/Loss": 2.0528717041015625, "Full-pretrain/Loss (Raw)": 1.9826496839523315, "Full-pretrain/Step": 2915, "Full-pretrain/Step Time": 17.600084306672215} +{"Full-pretrain/Learning Rate": 4.06724466082432e-05, "Full-pretrain/Loss": 2.035043716430664, "Full-pretrain/Loss (Raw)": 1.939910888671875, "Full-pretrain/Step": 2916, "Full-pretrain/Step Time": 17.597902996465564} +{"Full-pretrain/Learning Rate": 4.066583051692881e-05, "Full-pretrain/Loss": 2.0393950939178467, "Full-pretrain/Loss (Raw)": 2.011486530303955, "Full-pretrain/Step": 2917, "Full-pretrain/Step Time": 17.596214463934302} +{"Full-pretrain/Learning Rate": 4.065921261856637e-05, "Full-pretrain/Loss": 2.044574737548828, "Full-pretrain/Loss (Raw)": 2.127133369445801, "Full-pretrain/Step": 2918, "Full-pretrain/Step Time": 17.59353361837566} +{"Full-pretrain/Learning Rate": 4.065259291391926e-05, "Full-pretrain/Loss": 2.036768913269043, "Full-pretrain/Loss (Raw)": 1.990038275718689, "Full-pretrain/Step": 2919, "Full-pretrain/Step Time": 17.599285822361708} +{"Full-pretrain/Learning Rate": 4.064597140375105e-05, "Full-pretrain/Loss": 2.0238373279571533, "Full-pretrain/Loss (Raw)": 2.047821044921875, "Full-pretrain/Step": 2920, "Full-pretrain/Step Time": 17.605149703100324} +{"Full-pretrain/Learning Rate": 4.0639348088825554e-05, "Full-pretrain/Loss": 2.0170536041259766, "Full-pretrain/Loss (Raw)": 2.0585269927978516, "Full-pretrain/Step": 2921, "Full-pretrain/Step Time": 17.60242691449821} +{"Full-pretrain/Learning Rate": 4.063272296990674e-05, "Full-pretrain/Loss": 2.015674114227295, "Full-pretrain/Loss (Raw)": 2.0143113136291504, "Full-pretrain/Step": 2922, "Full-pretrain/Step Time": 17.60229028388858} +{"Full-pretrain/Learning Rate": 4.0626096047758824e-05, "Full-pretrain/Loss": 2.009251832962036, "Full-pretrain/Loss (Raw)": 1.7609026432037354, "Full-pretrain/Step": 2923, "Full-pretrain/Step Time": 17.605074098333716} +{"Full-pretrain/Learning Rate": 4.061946732314622e-05, "Full-pretrain/Loss": 2.0030994415283203, "Full-pretrain/Loss (Raw)": 1.9745889902114868, "Full-pretrain/Step": 2924, "Full-pretrain/Step Time": 17.60700094886124} +{"Full-pretrain/Learning Rate": 4.061283679683356e-05, "Full-pretrain/Loss": 1.9998220205307007, "Full-pretrain/Loss (Raw)": 2.032043933868408, "Full-pretrain/Step": 2925, "Full-pretrain/Step Time": 17.600678898394108} +{"Full-pretrain/Learning Rate": 4.060620446958565e-05, "Full-pretrain/Loss": 1.9921517372131348, "Full-pretrain/Loss (Raw)": 1.7550996541976929, "Full-pretrain/Step": 2926, "Full-pretrain/Step Time": 17.59826746955514} +{"Full-pretrain/Learning Rate": 4.0599570342167546e-05, "Full-pretrain/Loss": 1.988911747932434, "Full-pretrain/Loss (Raw)": 2.0895159244537354, "Full-pretrain/Step": 2927, "Full-pretrain/Step Time": 17.60129364952445} +{"Full-pretrain/Learning Rate": 4.0592934415344485e-05, "Full-pretrain/Loss": 1.990855097770691, "Full-pretrain/Loss (Raw)": 2.246748208999634, "Full-pretrain/Step": 2928, "Full-pretrain/Step Time": 17.598588090389967} +{"Full-pretrain/Learning Rate": 4.058629668988192e-05, "Full-pretrain/Loss": 1.9858760833740234, "Full-pretrain/Loss (Raw)": 1.7429335117340088, "Full-pretrain/Step": 2929, "Full-pretrain/Step Time": 17.593575470149517} +{"Full-pretrain/Learning Rate": 4.0579657166545505e-05, "Full-pretrain/Loss": 1.980681300163269, "Full-pretrain/Loss (Raw)": 1.856530785560608, "Full-pretrain/Step": 2930, "Full-pretrain/Step Time": 17.600066885352135} +{"Full-pretrain/Learning Rate": 4.0573015846101117e-05, "Full-pretrain/Loss": 1.989772915840149, "Full-pretrain/Loss (Raw)": 2.1651828289031982, "Full-pretrain/Step": 2931, "Full-pretrain/Step Time": 17.59791599214077} +{"Full-pretrain/Learning Rate": 4.056637272931482e-05, "Full-pretrain/Loss": 1.993697166442871, "Full-pretrain/Loss (Raw)": 1.965524673461914, "Full-pretrain/Step": 2932, "Full-pretrain/Step Time": 17.60302077792585} +{"Full-pretrain/Learning Rate": 4.0559727816952894e-05, "Full-pretrain/Loss": 1.9974377155303955, "Full-pretrain/Loss (Raw)": 2.0312654972076416, "Full-pretrain/Step": 2933, "Full-pretrain/Step Time": 17.597801657393575} +{"Full-pretrain/Learning Rate": 4.0553081109781844e-05, "Full-pretrain/Loss": 1.9923175573349, "Full-pretrain/Loss (Raw)": 1.804551124572754, "Full-pretrain/Step": 2934, "Full-pretrain/Step Time": 17.605236034840345} +{"Full-pretrain/Learning Rate": 4.054643260856834e-05, "Full-pretrain/Loss": 1.9993095397949219, "Full-pretrain/Loss (Raw)": 1.971695899963379, "Full-pretrain/Step": 2935, "Full-pretrain/Step Time": 17.608331758528948} +{"Full-pretrain/Learning Rate": 4.053978231407931e-05, "Full-pretrain/Loss": 1.9928345680236816, "Full-pretrain/Loss (Raw)": 1.9127252101898193, "Full-pretrain/Step": 2936, "Full-pretrain/Step Time": 17.614179581403732} +{"Full-pretrain/Learning Rate": 4.053313022708184e-05, "Full-pretrain/Loss": 2.000356912612915, "Full-pretrain/Loss (Raw)": 2.178550958633423, "Full-pretrain/Step": 2937, "Full-pretrain/Step Time": 17.611291566863656} +{"Full-pretrain/Learning Rate": 4.052647634834327e-05, "Full-pretrain/Loss": 2.0072903633117676, "Full-pretrain/Loss (Raw)": 2.1205544471740723, "Full-pretrain/Step": 2938, "Full-pretrain/Step Time": 17.613933738321066} +{"Full-pretrain/Learning Rate": 4.0519820678631094e-05, "Full-pretrain/Loss": 2.007362127304077, "Full-pretrain/Loss (Raw)": 2.045698404312134, "Full-pretrain/Step": 2939, "Full-pretrain/Step Time": 17.61443488486111} +{"Full-pretrain/Learning Rate": 4.051316321871307e-05, "Full-pretrain/Loss": 2.005005359649658, "Full-pretrain/Loss (Raw)": 2.0716731548309326, "Full-pretrain/Step": 2940, "Full-pretrain/Step Time": 17.61260249093175} +{"Full-pretrain/Learning Rate": 4.050650396935711e-05, "Full-pretrain/Loss": 1.9969699382781982, "Full-pretrain/Loss (Raw)": 1.7855596542358398, "Full-pretrain/Step": 2941, "Full-pretrain/Step Time": 17.60806817188859} +{"Full-pretrain/Learning Rate": 4.049984293133138e-05, "Full-pretrain/Loss": 1.9885146617889404, "Full-pretrain/Loss (Raw)": 2.0909736156463623, "Full-pretrain/Step": 2942, "Full-pretrain/Step Time": 17.607795171439648} +{"Full-pretrain/Learning Rate": 4.04931801054042e-05, "Full-pretrain/Loss": 1.9945274591445923, "Full-pretrain/Loss (Raw)": 1.8255772590637207, "Full-pretrain/Step": 2943, "Full-pretrain/Step Time": 17.613590616732836} +{"Full-pretrain/Learning Rate": 4.048651549234415e-05, "Full-pretrain/Loss": 1.9940177202224731, "Full-pretrain/Loss (Raw)": 1.9570214748382568, "Full-pretrain/Step": 2944, "Full-pretrain/Step Time": 17.605611361563206} +{"Full-pretrain/Learning Rate": 4.0479849092919974e-05, "Full-pretrain/Loss": 2.0012779235839844, "Full-pretrain/Loss (Raw)": 1.9515985250473022, "Full-pretrain/Step": 2945, "Full-pretrain/Step Time": 17.599905859678984} +{"Full-pretrain/Learning Rate": 4.047318090790065e-05, "Full-pretrain/Loss": 1.9805283546447754, "Full-pretrain/Loss (Raw)": 1.8685153722763062, "Full-pretrain/Step": 2946, "Full-pretrain/Step Time": 17.600211076438427} +{"Full-pretrain/Learning Rate": 4.046651093805534e-05, "Full-pretrain/Loss": 1.980050802230835, "Full-pretrain/Loss (Raw)": 1.9673609733581543, "Full-pretrain/Step": 2947, "Full-pretrain/Step Time": 17.599995573982596} +{"Full-pretrain/Learning Rate": 4.0459839184153435e-05, "Full-pretrain/Loss": 1.98145592212677, "Full-pretrain/Loss (Raw)": 1.9848779439926147, "Full-pretrain/Step": 2948, "Full-pretrain/Step Time": 17.597866743803024} +{"Full-pretrain/Learning Rate": 4.045316564696451e-05, "Full-pretrain/Loss": 1.9769457578659058, "Full-pretrain/Loss (Raw)": 1.8671629428863525, "Full-pretrain/Step": 2949, "Full-pretrain/Step Time": 17.58996651135385} +{"Full-pretrain/Learning Rate": 4.044649032725836e-05, "Full-pretrain/Loss": 1.9747446775436401, "Full-pretrain/Loss (Raw)": 2.0566976070404053, "Full-pretrain/Step": 2950, "Full-pretrain/Step Time": 17.591333959251642} +{"Full-pretrain/Learning Rate": 4.043981322580498e-05, "Full-pretrain/Loss": 1.9817653894424438, "Full-pretrain/Loss (Raw)": 2.214700222015381, "Full-pretrain/Step": 2951, "Full-pretrain/Step Time": 17.597075702622533} +{"Full-pretrain/Learning Rate": 4.043313434337457e-05, "Full-pretrain/Loss": 1.9782365560531616, "Full-pretrain/Loss (Raw)": 1.9348978996276855, "Full-pretrain/Step": 2952, "Full-pretrain/Step Time": 17.597979836165905} +{"Full-pretrain/Learning Rate": 4.042645368073754e-05, "Full-pretrain/Loss": 1.9629676342010498, "Full-pretrain/Loss (Raw)": 1.5699217319488525, "Full-pretrain/Step": 2953, "Full-pretrain/Step Time": 17.598657477647066} +{"Full-pretrain/Learning Rate": 4.0419771238664485e-05, "Full-pretrain/Loss": 1.9632749557495117, "Full-pretrain/Loss (Raw)": 2.0241446495056152, "Full-pretrain/Step": 2954, "Full-pretrain/Step Time": 17.596522860229015} +{"Full-pretrain/Learning Rate": 4.041308701792625e-05, "Full-pretrain/Loss": 1.9692169427871704, "Full-pretrain/Loss (Raw)": 1.9510480165481567, "Full-pretrain/Step": 2955, "Full-pretrain/Step Time": 17.600095357745886} +{"Full-pretrain/Learning Rate": 4.040640101929384e-05, "Full-pretrain/Loss": 1.9708421230316162, "Full-pretrain/Loss (Raw)": 2.0265955924987793, "Full-pretrain/Step": 2956, "Full-pretrain/Step Time": 17.606855919584632} +{"Full-pretrain/Learning Rate": 4.039971324353849e-05, "Full-pretrain/Loss": 1.969382643699646, "Full-pretrain/Loss (Raw)": 1.9853390455245972, "Full-pretrain/Step": 2957, "Full-pretrain/Step Time": 17.608712166547775} +{"Full-pretrain/Learning Rate": 4.039302369143162e-05, "Full-pretrain/Loss": 1.9822323322296143, "Full-pretrain/Loss (Raw)": 2.166290283203125, "Full-pretrain/Step": 2958, "Full-pretrain/Step Time": 17.60260497778654} +{"Full-pretrain/Learning Rate": 4.0386332363744886e-05, "Full-pretrain/Loss": 1.975907802581787, "Full-pretrain/Loss (Raw)": 1.88712739944458, "Full-pretrain/Step": 2959, "Full-pretrain/Step Time": 17.60783384181559} +{"Full-pretrain/Learning Rate": 4.037963926125011e-05, "Full-pretrain/Loss": 1.9671941995620728, "Full-pretrain/Loss (Raw)": 1.9679157733917236, "Full-pretrain/Step": 2960, "Full-pretrain/Step Time": 17.608616422861814} +{"Full-pretrain/Learning Rate": 4.0372944384719364e-05, "Full-pretrain/Loss": 1.973724365234375, "Full-pretrain/Loss (Raw)": 1.9519014358520508, "Full-pretrain/Step": 2961, "Full-pretrain/Step Time": 17.607691114768386} +{"Full-pretrain/Learning Rate": 4.036624773492488e-05, "Full-pretrain/Loss": 1.9769980907440186, "Full-pretrain/Loss (Raw)": 1.9612908363342285, "Full-pretrain/Step": 2962, "Full-pretrain/Step Time": 17.61045155674219} +{"Full-pretrain/Learning Rate": 4.035954931263912e-05, "Full-pretrain/Loss": 1.9609466791152954, "Full-pretrain/Loss (Raw)": 1.6515337228775024, "Full-pretrain/Step": 2963, "Full-pretrain/Step Time": 17.611569372937083} +{"Full-pretrain/Learning Rate": 4.035284911863474e-05, "Full-pretrain/Loss": 1.9656567573547363, "Full-pretrain/Loss (Raw)": 2.1162467002868652, "Full-pretrain/Step": 2964, "Full-pretrain/Step Time": 17.609859032556415} +{"Full-pretrain/Learning Rate": 4.034614715368461e-05, "Full-pretrain/Loss": 1.9643785953521729, "Full-pretrain/Loss (Raw)": 1.990368366241455, "Full-pretrain/Step": 2965, "Full-pretrain/Step Time": 17.60973848029971} +{"Full-pretrain/Learning Rate": 4.0339443418561805e-05, "Full-pretrain/Loss": 1.971423625946045, "Full-pretrain/Loss (Raw)": 2.02999210357666, "Full-pretrain/Step": 2966, "Full-pretrain/Step Time": 17.6155704613775} +{"Full-pretrain/Learning Rate": 4.0332737914039585e-05, "Full-pretrain/Loss": 1.9720203876495361, "Full-pretrain/Loss (Raw)": 1.9907920360565186, "Full-pretrain/Step": 2967, "Full-pretrain/Step Time": 17.613539149984717} +{"Full-pretrain/Learning Rate": 4.032603064089144e-05, "Full-pretrain/Loss": 1.9747231006622314, "Full-pretrain/Loss (Raw)": 1.9992103576660156, "Full-pretrain/Step": 2968, "Full-pretrain/Step Time": 17.616082407534122} +{"Full-pretrain/Learning Rate": 4.0319321599891044e-05, "Full-pretrain/Loss": 1.9687294960021973, "Full-pretrain/Loss (Raw)": 1.986760139465332, "Full-pretrain/Step": 2969, "Full-pretrain/Step Time": 17.61346662417054} +{"Full-pretrain/Learning Rate": 4.0312610791812286e-05, "Full-pretrain/Loss": 1.9657686948776245, "Full-pretrain/Loss (Raw)": 2.0258049964904785, "Full-pretrain/Step": 2970, "Full-pretrain/Step Time": 17.614858757704496} +{"Full-pretrain/Learning Rate": 4.030589821742926e-05, "Full-pretrain/Loss": 1.956142544746399, "Full-pretrain/Loss (Raw)": 1.7376630306243896, "Full-pretrain/Step": 2971, "Full-pretrain/Step Time": 17.609594859182835} +{"Full-pretrain/Learning Rate": 4.029918387751625e-05, "Full-pretrain/Loss": 1.950493574142456, "Full-pretrain/Loss (Raw)": 1.890904188156128, "Full-pretrain/Step": 2972, "Full-pretrain/Step Time": 17.612524773925543} +{"Full-pretrain/Learning Rate": 4.029246777284775e-05, "Full-pretrain/Loss": 1.9666743278503418, "Full-pretrain/Loss (Raw)": 2.303344249725342, "Full-pretrain/Step": 2973, "Full-pretrain/Step Time": 17.614537548273802} +{"Full-pretrain/Learning Rate": 4.0285749904198476e-05, "Full-pretrain/Loss": 1.9678412675857544, "Full-pretrain/Loss (Raw)": 2.1283159255981445, "Full-pretrain/Step": 2974, "Full-pretrain/Step Time": 17.61417601443827} +{"Full-pretrain/Learning Rate": 4.027903027234332e-05, "Full-pretrain/Loss": 1.981507658958435, "Full-pretrain/Loss (Raw)": 2.2629029750823975, "Full-pretrain/Step": 2975, "Full-pretrain/Step Time": 17.614828802645206} +{"Full-pretrain/Learning Rate": 4.0272308878057385e-05, "Full-pretrain/Loss": 1.9884226322174072, "Full-pretrain/Loss (Raw)": 2.1782963275909424, "Full-pretrain/Step": 2976, "Full-pretrain/Step Time": 17.618132261559367} +{"Full-pretrain/Learning Rate": 4.026558572211599e-05, "Full-pretrain/Loss": 1.992815375328064, "Full-pretrain/Loss (Raw)": 2.0921688079833984, "Full-pretrain/Step": 2977, "Full-pretrain/Step Time": 17.621892362833023} +{"Full-pretrain/Learning Rate": 4.025886080529465e-05, "Full-pretrain/Loss": 1.9998222589492798, "Full-pretrain/Loss (Raw)": 2.092738628387451, "Full-pretrain/Step": 2978, "Full-pretrain/Step Time": 17.61669747531414} +{"Full-pretrain/Learning Rate": 4.025213412836908e-05, "Full-pretrain/Loss": 2.004682779312134, "Full-pretrain/Loss (Raw)": 2.1228981018066406, "Full-pretrain/Step": 2979, "Full-pretrain/Step Time": 17.622002175077796} +{"Full-pretrain/Learning Rate": 4.0245405692115195e-05, "Full-pretrain/Loss": 2.0084612369537354, "Full-pretrain/Loss (Raw)": 2.105781078338623, "Full-pretrain/Step": 2980, "Full-pretrain/Step Time": 17.620667707175016} +{"Full-pretrain/Learning Rate": 4.023867549730912e-05, "Full-pretrain/Loss": 2.0094828605651855, "Full-pretrain/Loss (Raw)": 1.8998582363128662, "Full-pretrain/Step": 2981, "Full-pretrain/Step Time": 17.62449956126511} +{"Full-pretrain/Learning Rate": 4.023194354472719e-05, "Full-pretrain/Loss": 2.005889892578125, "Full-pretrain/Loss (Raw)": 1.941725492477417, "Full-pretrain/Step": 2982, "Full-pretrain/Step Time": 17.62881626933813} +{"Full-pretrain/Learning Rate": 4.022520983514592e-05, "Full-pretrain/Loss": 2.0022995471954346, "Full-pretrain/Loss (Raw)": 2.0998146533966064, "Full-pretrain/Step": 2983, "Full-pretrain/Step Time": 17.631550401449203} +{"Full-pretrain/Learning Rate": 4.021847436934204e-05, "Full-pretrain/Loss": 1.9962577819824219, "Full-pretrain/Loss (Raw)": 1.741553783416748, "Full-pretrain/Step": 2984, "Full-pretrain/Step Time": 17.630155755206943} +{"Full-pretrain/Learning Rate": 4.021173714809249e-05, "Full-pretrain/Loss": 2.0065526962280273, "Full-pretrain/Loss (Raw)": 1.8993628025054932, "Full-pretrain/Step": 2985, "Full-pretrain/Step Time": 17.63464715331793} +{"Full-pretrain/Learning Rate": 4.0204998172174415e-05, "Full-pretrain/Loss": 2.0048470497131348, "Full-pretrain/Loss (Raw)": 1.9695580005645752, "Full-pretrain/Step": 2986, "Full-pretrain/Step Time": 17.631338223814964} +{"Full-pretrain/Learning Rate": 4.019825744236514e-05, "Full-pretrain/Loss": 2.000363349914551, "Full-pretrain/Loss (Raw)": 1.807573676109314, "Full-pretrain/Step": 2987, "Full-pretrain/Step Time": 17.628601441159844} +{"Full-pretrain/Learning Rate": 4.01915149594422e-05, "Full-pretrain/Loss": 1.9955096244812012, "Full-pretrain/Loss (Raw)": 1.8712739944458008, "Full-pretrain/Step": 2988, "Full-pretrain/Step Time": 17.625523574650288} +{"Full-pretrain/Learning Rate": 4.018477072418336e-05, "Full-pretrain/Loss": 1.988808035850525, "Full-pretrain/Loss (Raw)": 1.7708921432495117, "Full-pretrain/Step": 2989, "Full-pretrain/Step Time": 17.62097721733153} +{"Full-pretrain/Learning Rate": 4.0178024737366554e-05, "Full-pretrain/Loss": 1.989426612854004, "Full-pretrain/Loss (Raw)": 2.1860804557800293, "Full-pretrain/Step": 2990, "Full-pretrain/Step Time": 17.619234526529908} +{"Full-pretrain/Learning Rate": 4.017127699976992e-05, "Full-pretrain/Loss": 1.997807264328003, "Full-pretrain/Loss (Raw)": 2.155308723449707, "Full-pretrain/Step": 2991, "Full-pretrain/Step Time": 17.61517032980919} +{"Full-pretrain/Learning Rate": 4.0164527512171826e-05, "Full-pretrain/Loss": 1.999579906463623, "Full-pretrain/Loss (Raw)": 2.0246410369873047, "Full-pretrain/Step": 2992, "Full-pretrain/Step Time": 17.617081394419074} +{"Full-pretrain/Learning Rate": 4.0157776275350805e-05, "Full-pretrain/Loss": 2.004190444946289, "Full-pretrain/Loss (Raw)": 2.099440574645996, "Full-pretrain/Step": 2993, "Full-pretrain/Step Time": 17.61528622545302} +{"Full-pretrain/Learning Rate": 4.015102329008562e-05, "Full-pretrain/Loss": 2.013151168823242, "Full-pretrain/Loss (Raw)": 2.2480266094207764, "Full-pretrain/Step": 2994, "Full-pretrain/Step Time": 17.61077539809048} +{"Full-pretrain/Learning Rate": 4.014426855715523e-05, "Full-pretrain/Loss": 2.0208659172058105, "Full-pretrain/Loss (Raw)": 1.8984098434448242, "Full-pretrain/Step": 2995, "Full-pretrain/Step Time": 17.611694552004337} +{"Full-pretrain/Learning Rate": 4.013751207733877e-05, "Full-pretrain/Loss": 2.0210819244384766, "Full-pretrain/Loss (Raw)": 2.123157262802124, "Full-pretrain/Step": 2996, "Full-pretrain/Step Time": 17.614164035767317} +{"Full-pretrain/Learning Rate": 4.0130753851415614e-05, "Full-pretrain/Loss": 2.016803741455078, "Full-pretrain/Loss (Raw)": 1.8534677028656006, "Full-pretrain/Step": 2997, "Full-pretrain/Step Time": 17.614220537245274} +{"Full-pretrain/Learning Rate": 4.012399388016533e-05, "Full-pretrain/Loss": 2.0208680629730225, "Full-pretrain/Loss (Raw)": 2.160052537918091, "Full-pretrain/Step": 2998, "Full-pretrain/Step Time": 17.607293162494898} +{"Full-pretrain/Learning Rate": 4.0117232164367655e-05, "Full-pretrain/Loss": 2.016047477722168, "Full-pretrain/Loss (Raw)": 1.8365356922149658, "Full-pretrain/Step": 2999, "Full-pretrain/Step Time": 17.605248982086778} +{"Full-pretrain/Learning Rate": 4.011046870480257e-05, "Full-pretrain/Loss": 2.0184504985809326, "Full-pretrain/Loss (Raw)": 2.076107978820801, "Full-pretrain/Step": 3000, "Full-pretrain/Step Time": 17.60753552429378} +{"Full-pretrain/Learning Rate": 4.010370350225022e-05, "Full-pretrain/Loss": 2.015188455581665, "Full-pretrain/Loss (Raw)": 1.8823686838150024, "Full-pretrain/Step": 3001, "Full-pretrain/Step Time": 17.603163501247764} +{"Full-pretrain/Learning Rate": 4.0096936557490995e-05, "Full-pretrain/Loss": 2.017733573913574, "Full-pretrain/Loss (Raw)": 2.1072471141815186, "Full-pretrain/Step": 3002, "Full-pretrain/Step Time": 17.601574821397662} +{"Full-pretrain/Learning Rate": 4.009016787130543e-05, "Full-pretrain/Loss": 2.0261173248291016, "Full-pretrain/Loss (Raw)": 2.0059494972229004, "Full-pretrain/Step": 3003, "Full-pretrain/Step Time": 17.60151563026011} +{"Full-pretrain/Learning Rate": 4.008339744447431e-05, "Full-pretrain/Loss": 2.0306880474090576, "Full-pretrain/Loss (Raw)": 2.0371670722961426, "Full-pretrain/Step": 3004, "Full-pretrain/Step Time": 17.60070614889264} +{"Full-pretrain/Learning Rate": 4.00766252777786e-05, "Full-pretrain/Loss": 2.025866985321045, "Full-pretrain/Loss (Raw)": 2.149068593978882, "Full-pretrain/Step": 3005, "Full-pretrain/Step Time": 17.60288280621171} +{"Full-pretrain/Learning Rate": 4.006985137199945e-05, "Full-pretrain/Loss": 2.0270578861236572, "Full-pretrain/Loss (Raw)": 2.1664204597473145, "Full-pretrain/Step": 3006, "Full-pretrain/Step Time": 17.600420778617263} +{"Full-pretrain/Learning Rate": 4.0063075727918245e-05, "Full-pretrain/Loss": 2.021294355392456, "Full-pretrain/Loss (Raw)": 2.078474998474121, "Full-pretrain/Step": 3007, "Full-pretrain/Step Time": 17.600073374807835} +{"Full-pretrain/Learning Rate": 4.0056298346316555e-05, "Full-pretrain/Loss": 2.013613700866699, "Full-pretrain/Loss (Raw)": 1.9325190782546997, "Full-pretrain/Step": 3008, "Full-pretrain/Step Time": 17.600526174530387} +{"Full-pretrain/Learning Rate": 4.0049519227976135e-05, "Full-pretrain/Loss": 2.0100836753845215, "Full-pretrain/Loss (Raw)": 1.9792070388793945, "Full-pretrain/Step": 3009, "Full-pretrain/Step Time": 17.599631395190954} +{"Full-pretrain/Learning Rate": 4.004273837367896e-05, "Full-pretrain/Loss": 2.0034523010253906, "Full-pretrain/Loss (Raw)": 1.8805333375930786, "Full-pretrain/Step": 3010, "Full-pretrain/Step Time": 17.596350206062198} +{"Full-pretrain/Learning Rate": 4.0035955784207203e-05, "Full-pretrain/Loss": 2.00101375579834, "Full-pretrain/Loss (Raw)": 2.0448689460754395, "Full-pretrain/Step": 3011, "Full-pretrain/Step Time": 17.6000549569726} +{"Full-pretrain/Learning Rate": 4.002917146034323e-05, "Full-pretrain/Loss": 1.997161626815796, "Full-pretrain/Loss (Raw)": 1.982507586479187, "Full-pretrain/Step": 3012, "Full-pretrain/Step Time": 17.604969637468457} +{"Full-pretrain/Learning Rate": 4.002238540286961e-05, "Full-pretrain/Loss": 2.004460334777832, "Full-pretrain/Loss (Raw)": 2.133420705795288, "Full-pretrain/Step": 3013, "Full-pretrain/Step Time": 17.60481259226799} +{"Full-pretrain/Learning Rate": 4.0015597612569113e-05, "Full-pretrain/Loss": 2.007045269012451, "Full-pretrain/Loss (Raw)": 2.024440050125122, "Full-pretrain/Step": 3014, "Full-pretrain/Step Time": 17.598581612110138} +{"Full-pretrain/Learning Rate": 4.0008808090224714e-05, "Full-pretrain/Loss": 2.001498222351074, "Full-pretrain/Loss (Raw)": 1.9223135709762573, "Full-pretrain/Step": 3015, "Full-pretrain/Step Time": 17.597238225862384} +{"Full-pretrain/Learning Rate": 4.000201683661957e-05, "Full-pretrain/Loss": 2.00563383102417, "Full-pretrain/Loss (Raw)": 1.8738895654678345, "Full-pretrain/Step": 3016, "Full-pretrain/Step Time": 17.601762387901545} +{"Full-pretrain/Learning Rate": 3.999522385253706e-05, "Full-pretrain/Loss": 2.0132083892822266, "Full-pretrain/Loss (Raw)": 2.1417479515075684, "Full-pretrain/Step": 3017, "Full-pretrain/Step Time": 17.603084571659565} +{"Full-pretrain/Learning Rate": 3.998842913876074e-05, "Full-pretrain/Loss": 2.0074009895324707, "Full-pretrain/Loss (Raw)": 1.783722162246704, "Full-pretrain/Step": 3018, "Full-pretrain/Step Time": 17.595701521262527} +{"Full-pretrain/Learning Rate": 3.9981632696074394e-05, "Full-pretrain/Loss": 2.015672206878662, "Full-pretrain/Loss (Raw)": 2.07224702835083, "Full-pretrain/Step": 3019, "Full-pretrain/Step Time": 17.59403771907091} +{"Full-pretrain/Learning Rate": 3.997483452526198e-05, "Full-pretrain/Loss": 2.021872043609619, "Full-pretrain/Loss (Raw)": 2.0696754455566406, "Full-pretrain/Step": 3020, "Full-pretrain/Step Time": 17.597456492483616} +{"Full-pretrain/Learning Rate": 3.996803462710767e-05, "Full-pretrain/Loss": 2.0282254219055176, "Full-pretrain/Loss (Raw)": 1.9741945266723633, "Full-pretrain/Step": 3021, "Full-pretrain/Step Time": 17.59665479697287} +{"Full-pretrain/Learning Rate": 3.996123300239581e-05, "Full-pretrain/Loss": 2.021169662475586, "Full-pretrain/Loss (Raw)": 1.9602960348129272, "Full-pretrain/Step": 3022, "Full-pretrain/Step Time": 17.596723878756166} +{"Full-pretrain/Learning Rate": 3.9954429651911e-05, "Full-pretrain/Loss": 2.00848388671875, "Full-pretrain/Loss (Raw)": 1.7493705749511719, "Full-pretrain/Step": 3023, "Full-pretrain/Step Time": 17.59142655879259} +{"Full-pretrain/Learning Rate": 3.9947624576437975e-05, "Full-pretrain/Loss": 2.0154621601104736, "Full-pretrain/Loss (Raw)": 2.247938632965088, "Full-pretrain/Step": 3024, "Full-pretrain/Step Time": 17.60423008725047} +{"Full-pretrain/Learning Rate": 3.994081777676171e-05, "Full-pretrain/Loss": 2.0085222721099854, "Full-pretrain/Loss (Raw)": 1.877368450164795, "Full-pretrain/Step": 3025, "Full-pretrain/Step Time": 17.595598401501775} +{"Full-pretrain/Learning Rate": 3.993400925366736e-05, "Full-pretrain/Loss": 2.003708839416504, "Full-pretrain/Loss (Raw)": 2.0939927101135254, "Full-pretrain/Step": 3026, "Full-pretrain/Step Time": 17.592910578474402} +{"Full-pretrain/Learning Rate": 3.9927199007940294e-05, "Full-pretrain/Loss": 2.0086891651153564, "Full-pretrain/Loss (Raw)": 2.057783842086792, "Full-pretrain/Step": 3027, "Full-pretrain/Step Time": 17.58765628375113} +{"Full-pretrain/Learning Rate": 3.9920387040366076e-05, "Full-pretrain/Loss": 2.0047364234924316, "Full-pretrain/Loss (Raw)": 1.9966681003570557, "Full-pretrain/Step": 3028, "Full-pretrain/Step Time": 17.59246020950377} +{"Full-pretrain/Learning Rate": 3.9913573351730455e-05, "Full-pretrain/Loss": 2.012951135635376, "Full-pretrain/Loss (Raw)": 2.116342067718506, "Full-pretrain/Step": 3029, "Full-pretrain/Step Time": 17.59127363935113} +{"Full-pretrain/Learning Rate": 3.990675794281938e-05, "Full-pretrain/Loss": 2.0202736854553223, "Full-pretrain/Loss (Raw)": 2.3943724632263184, "Full-pretrain/Step": 3030, "Full-pretrain/Step Time": 17.587498381733894} +{"Full-pretrain/Learning Rate": 3.989994081441902e-05, "Full-pretrain/Loss": 2.0319833755493164, "Full-pretrain/Loss (Raw)": 2.21124529838562, "Full-pretrain/Step": 3031, "Full-pretrain/Step Time": 17.587998243048787} +{"Full-pretrain/Learning Rate": 3.989312196731572e-05, "Full-pretrain/Loss": 2.0348782539367676, "Full-pretrain/Loss (Raw)": 2.1687474250793457, "Full-pretrain/Step": 3032, "Full-pretrain/Step Time": 17.588305769488215} +{"Full-pretrain/Learning Rate": 3.9886301402296036e-05, "Full-pretrain/Loss": 2.0398504734039307, "Full-pretrain/Loss (Raw)": 2.041475772857666, "Full-pretrain/Step": 3033, "Full-pretrain/Step Time": 17.58999770320952} +{"Full-pretrain/Learning Rate": 3.9879479120146723e-05, "Full-pretrain/Loss": 2.0321264266967773, "Full-pretrain/Loss (Raw)": 1.8600795269012451, "Full-pretrain/Step": 3034, "Full-pretrain/Step Time": 17.589194174855947} +{"Full-pretrain/Learning Rate": 3.987265512165471e-05, "Full-pretrain/Loss": 2.035351276397705, "Full-pretrain/Loss (Raw)": 2.1091368198394775, "Full-pretrain/Step": 3035, "Full-pretrain/Step Time": 17.586736707016826} +{"Full-pretrain/Learning Rate": 3.986582940760717e-05, "Full-pretrain/Loss": 2.0328614711761475, "Full-pretrain/Loss (Raw)": 1.9574992656707764, "Full-pretrain/Step": 3036, "Full-pretrain/Step Time": 17.58715184777975} +{"Full-pretrain/Learning Rate": 3.9859001978791424e-05, "Full-pretrain/Loss": 2.0319433212280273, "Full-pretrain/Loss (Raw)": 2.1196858882904053, "Full-pretrain/Step": 3037, "Full-pretrain/Step Time": 17.585029697045684} +{"Full-pretrain/Learning Rate": 3.9852172835995025e-05, "Full-pretrain/Loss": 2.0235912799835205, "Full-pretrain/Loss (Raw)": 1.8991577625274658, "Full-pretrain/Step": 3038, "Full-pretrain/Step Time": 17.581889228895307} +{"Full-pretrain/Learning Rate": 3.9845341980005704e-05, "Full-pretrain/Loss": 2.018646717071533, "Full-pretrain/Loss (Raw)": 1.920243740081787, "Full-pretrain/Step": 3039, "Full-pretrain/Step Time": 17.57726743631065} +{"Full-pretrain/Learning Rate": 3.9838509411611405e-05, "Full-pretrain/Loss": 2.0181126594543457, "Full-pretrain/Loss (Raw)": 1.9154341220855713, "Full-pretrain/Step": 3040, "Full-pretrain/Step Time": 17.576688639819622} +{"Full-pretrain/Learning Rate": 3.9831675131600255e-05, "Full-pretrain/Loss": 2.0188937187194824, "Full-pretrain/Loss (Raw)": 2.004204273223877, "Full-pretrain/Step": 3041, "Full-pretrain/Step Time": 17.581010596826673} +{"Full-pretrain/Learning Rate": 3.98248391407606e-05, "Full-pretrain/Loss": 2.0153307914733887, "Full-pretrain/Loss (Raw)": 1.7665156126022339, "Full-pretrain/Step": 3042, "Full-pretrain/Step Time": 17.583357851952314} +{"Full-pretrain/Learning Rate": 3.9818001439880954e-05, "Full-pretrain/Loss": 2.015774965286255, "Full-pretrain/Loss (Raw)": 2.0590786933898926, "Full-pretrain/Step": 3043, "Full-pretrain/Step Time": 17.569678781554103} +{"Full-pretrain/Learning Rate": 3.9811162029750045e-05, "Full-pretrain/Loss": 2.0118844509124756, "Full-pretrain/Loss (Raw)": 1.8580200672149658, "Full-pretrain/Step": 3044, "Full-pretrain/Step Time": 17.572700234130025} +{"Full-pretrain/Learning Rate": 3.980432091115681e-05, "Full-pretrain/Loss": 1.9985973834991455, "Full-pretrain/Loss (Raw)": 1.708233118057251, "Full-pretrain/Step": 3045, "Full-pretrain/Step Time": 17.57307732477784} +{"Full-pretrain/Learning Rate": 3.979747808489036e-05, "Full-pretrain/Loss": 2.003215789794922, "Full-pretrain/Loss (Raw)": 2.1722309589385986, "Full-pretrain/Step": 3046, "Full-pretrain/Step Time": 17.576881553977728} +{"Full-pretrain/Learning Rate": 3.979063355174001e-05, "Full-pretrain/Loss": 2.0053188800811768, "Full-pretrain/Loss (Raw)": 1.9896061420440674, "Full-pretrain/Step": 3047, "Full-pretrain/Step Time": 17.574940090999007} +{"Full-pretrain/Learning Rate": 3.978378731249528e-05, "Full-pretrain/Loss": 2.0071825981140137, "Full-pretrain/Loss (Raw)": 1.9335277080535889, "Full-pretrain/Step": 3048, "Full-pretrain/Step Time": 17.567493146285415} +{"Full-pretrain/Learning Rate": 3.9776939367945876e-05, "Full-pretrain/Loss": 2.0028655529022217, "Full-pretrain/Loss (Raw)": 2.003600597381592, "Full-pretrain/Step": 3049, "Full-pretrain/Step Time": 17.5672878716141} +{"Full-pretrain/Learning Rate": 3.977008971888171e-05, "Full-pretrain/Loss": 2.0096025466918945, "Full-pretrain/Loss (Raw)": 1.999305009841919, "Full-pretrain/Step": 3050, "Full-pretrain/Step Time": 17.56545295007527} +{"Full-pretrain/Learning Rate": 3.976323836609288e-05, "Full-pretrain/Loss": 2.00407075881958, "Full-pretrain/Loss (Raw)": 1.8952358961105347, "Full-pretrain/Step": 3051, "Full-pretrain/Step Time": 17.566263707354665} +{"Full-pretrain/Learning Rate": 3.97563853103697e-05, "Full-pretrain/Loss": 1.9903935194015503, "Full-pretrain/Loss (Raw)": 1.6319993734359741, "Full-pretrain/Step": 3052, "Full-pretrain/Step Time": 17.56223543919623} +{"Full-pretrain/Learning Rate": 3.9749530552502656e-05, "Full-pretrain/Loss": 1.9805576801300049, "Full-pretrain/Loss (Raw)": 1.659448504447937, "Full-pretrain/Step": 3053, "Full-pretrain/Step Time": 17.57172444090247} +{"Full-pretrain/Learning Rate": 3.974267409328245e-05, "Full-pretrain/Loss": 1.9849116802215576, "Full-pretrain/Loss (Raw)": 2.099623680114746, "Full-pretrain/Step": 3054, "Full-pretrain/Step Time": 17.56873330846429} +{"Full-pretrain/Learning Rate": 3.973581593349997e-05, "Full-pretrain/Loss": 1.9937424659729004, "Full-pretrain/Loss (Raw)": 2.0319557189941406, "Full-pretrain/Step": 3055, "Full-pretrain/Step Time": 17.569234929978848} +{"Full-pretrain/Learning Rate": 3.97289560739463e-05, "Full-pretrain/Loss": 1.9833394289016724, "Full-pretrain/Loss (Raw)": 1.9150440692901611, "Full-pretrain/Step": 3056, "Full-pretrain/Step Time": 17.565346587449312} +{"Full-pretrain/Learning Rate": 3.972209451541272e-05, "Full-pretrain/Loss": 1.9860498905181885, "Full-pretrain/Loss (Raw)": 1.9641039371490479, "Full-pretrain/Step": 3057, "Full-pretrain/Step Time": 17.56832497008145} +{"Full-pretrain/Learning Rate": 3.971523125869071e-05, "Full-pretrain/Loss": 1.9825539588928223, "Full-pretrain/Loss (Raw)": 1.9821230173110962, "Full-pretrain/Step": 3058, "Full-pretrain/Step Time": 17.563490241765976} +{"Full-pretrain/Learning Rate": 3.970836630457194e-05, "Full-pretrain/Loss": 1.981420874595642, "Full-pretrain/Loss (Raw)": 2.0215189456939697, "Full-pretrain/Step": 3059, "Full-pretrain/Step Time": 17.56327836215496} +{"Full-pretrain/Learning Rate": 3.9701499653848296e-05, "Full-pretrain/Loss": 1.982550859451294, "Full-pretrain/Loss (Raw)": 2.032832622528076, "Full-pretrain/Step": 3060, "Full-pretrain/Step Time": 17.555926440283656} +{"Full-pretrain/Learning Rate": 3.969463130731183e-05, "Full-pretrain/Loss": 1.973125696182251, "Full-pretrain/Loss (Raw)": 1.8147339820861816, "Full-pretrain/Step": 3061, "Full-pretrain/Step Time": 17.562124559655786} +{"Full-pretrain/Learning Rate": 3.968776126575481e-05, "Full-pretrain/Loss": 1.9556257724761963, "Full-pretrain/Loss (Raw)": 1.834375262260437, "Full-pretrain/Step": 3062, "Full-pretrain/Step Time": 17.55473074875772} +{"Full-pretrain/Learning Rate": 3.968088952996969e-05, "Full-pretrain/Loss": 1.9466965198516846, "Full-pretrain/Loss (Raw)": 1.9255105257034302, "Full-pretrain/Step": 3063, "Full-pretrain/Step Time": 17.5516299251467} +{"Full-pretrain/Learning Rate": 3.967401610074911e-05, "Full-pretrain/Loss": 1.9445743560791016, "Full-pretrain/Loss (Raw)": 2.100841522216797, "Full-pretrain/Step": 3064, "Full-pretrain/Step Time": 17.549112232401967} +{"Full-pretrain/Learning Rate": 3.966714097888594e-05, "Full-pretrain/Loss": 1.9457695484161377, "Full-pretrain/Loss (Raw)": 2.0797197818756104, "Full-pretrain/Step": 3065, "Full-pretrain/Step Time": 17.54977230168879} +{"Full-pretrain/Learning Rate": 3.966026416517321e-05, "Full-pretrain/Loss": 1.9492015838623047, "Full-pretrain/Loss (Raw)": 1.969907283782959, "Full-pretrain/Step": 3066, "Full-pretrain/Step Time": 17.549698105081916} +{"Full-pretrain/Learning Rate": 3.965338566040416e-05, "Full-pretrain/Loss": 1.9472637176513672, "Full-pretrain/Loss (Raw)": 2.047123670578003, "Full-pretrain/Step": 3067, "Full-pretrain/Step Time": 17.545258602127433} +{"Full-pretrain/Learning Rate": 3.964650546537222e-05, "Full-pretrain/Loss": 1.9464809894561768, "Full-pretrain/Loss (Raw)": 1.932450294494629, "Full-pretrain/Step": 3068, "Full-pretrain/Step Time": 17.555092461407185} +{"Full-pretrain/Learning Rate": 3.963962358087103e-05, "Full-pretrain/Loss": 1.9554128646850586, "Full-pretrain/Loss (Raw)": 2.4055063724517822, "Full-pretrain/Step": 3069, "Full-pretrain/Step Time": 17.5527324937284} +{"Full-pretrain/Learning Rate": 3.96327400076944e-05, "Full-pretrain/Loss": 1.9497532844543457, "Full-pretrain/Loss (Raw)": 1.718050479888916, "Full-pretrain/Step": 3070, "Full-pretrain/Step Time": 17.554665934294462} +{"Full-pretrain/Learning Rate": 3.962585474663636e-05, "Full-pretrain/Loss": 1.9489895105361938, "Full-pretrain/Loss (Raw)": 1.8958033323287964, "Full-pretrain/Step": 3071, "Full-pretrain/Step Time": 17.54746261611581} +{"Full-pretrain/Learning Rate": 3.96189677984911e-05, "Full-pretrain/Loss": 1.9543999433517456, "Full-pretrain/Loss (Raw)": 2.0885701179504395, "Full-pretrain/Step": 3072, "Full-pretrain/Step Time": 17.55536781810224} +{"Full-pretrain/Learning Rate": 3.961207916405305e-05, "Full-pretrain/Loss": 1.9559242725372314, "Full-pretrain/Loss (Raw)": 2.0529801845550537, "Full-pretrain/Step": 3073, "Full-pretrain/Step Time": 17.550149377435446} +{"Full-pretrain/Learning Rate": 3.9605188844116815e-05, "Full-pretrain/Loss": 1.965518832206726, "Full-pretrain/Loss (Raw)": 2.0735440254211426, "Full-pretrain/Step": 3074, "Full-pretrain/Step Time": 17.551139501854777} +{"Full-pretrain/Learning Rate": 3.959829683947717e-05, "Full-pretrain/Loss": 1.9666852951049805, "Full-pretrain/Loss (Raw)": 2.096405029296875, "Full-pretrain/Step": 3075, "Full-pretrain/Step Time": 17.557691695168614} +{"Full-pretrain/Learning Rate": 3.9591403150929104e-05, "Full-pretrain/Loss": 1.967095971107483, "Full-pretrain/Loss (Raw)": 1.8711607456207275, "Full-pretrain/Step": 3076, "Full-pretrain/Step Time": 17.55943901836872} +{"Full-pretrain/Learning Rate": 3.9584507779267824e-05, "Full-pretrain/Loss": 1.9788987636566162, "Full-pretrain/Loss (Raw)": 2.085918664932251, "Full-pretrain/Step": 3077, "Full-pretrain/Step Time": 17.56444662809372} +{"Full-pretrain/Learning Rate": 3.957761072528869e-05, "Full-pretrain/Loss": 1.969041347503662, "Full-pretrain/Loss (Raw)": 1.8567978143692017, "Full-pretrain/Step": 3078, "Full-pretrain/Step Time": 17.56008877977729} +{"Full-pretrain/Learning Rate": 3.957071198978729e-05, "Full-pretrain/Loss": 1.9613009691238403, "Full-pretrain/Loss (Raw)": 1.7419147491455078, "Full-pretrain/Step": 3079, "Full-pretrain/Step Time": 17.558937275782228} +{"Full-pretrain/Learning Rate": 3.956381157355938e-05, "Full-pretrain/Loss": 1.961885690689087, "Full-pretrain/Loss (Raw)": 1.9522356986999512, "Full-pretrain/Step": 3080, "Full-pretrain/Step Time": 17.56230722181499} +{"Full-pretrain/Learning Rate": 3.9556909477400914e-05, "Full-pretrain/Loss": 1.9611225128173828, "Full-pretrain/Loss (Raw)": 1.9791814088821411, "Full-pretrain/Step": 3081, "Full-pretrain/Step Time": 17.564372096210718} +{"Full-pretrain/Learning Rate": 3.9550005702108076e-05, "Full-pretrain/Loss": 1.9612609148025513, "Full-pretrain/Loss (Raw)": 2.003732919692993, "Full-pretrain/Step": 3082, "Full-pretrain/Step Time": 17.566689094528556} +{"Full-pretrain/Learning Rate": 3.9543100248477174e-05, "Full-pretrain/Loss": 1.9698289632797241, "Full-pretrain/Loss (Raw)": 2.169416904449463, "Full-pretrain/Step": 3083, "Full-pretrain/Step Time": 17.561672423034906} +{"Full-pretrain/Learning Rate": 3.9536193117304777e-05, "Full-pretrain/Loss": 1.9820291996002197, "Full-pretrain/Loss (Raw)": 2.0224034786224365, "Full-pretrain/Step": 3084, "Full-pretrain/Step Time": 17.56476636044681} +{"Full-pretrain/Learning Rate": 3.952928430938761e-05, "Full-pretrain/Loss": 1.9853838682174683, "Full-pretrain/Loss (Raw)": 1.7667993307113647, "Full-pretrain/Step": 3085, "Full-pretrain/Step Time": 17.567237347364426} +{"Full-pretrain/Learning Rate": 3.95223738255226e-05, "Full-pretrain/Loss": 1.9837180376052856, "Full-pretrain/Loss (Raw)": 2.0463194847106934, "Full-pretrain/Step": 3086, "Full-pretrain/Step Time": 17.572193330153823} +{"Full-pretrain/Learning Rate": 3.951546166650688e-05, "Full-pretrain/Loss": 1.981459617614746, "Full-pretrain/Loss (Raw)": 1.9596880674362183, "Full-pretrain/Step": 3087, "Full-pretrain/Step Time": 17.569966606795788} +{"Full-pretrain/Learning Rate": 3.9508547833137756e-05, "Full-pretrain/Loss": 1.978879451751709, "Full-pretrain/Loss (Raw)": 1.8324750661849976, "Full-pretrain/Step": 3088, "Full-pretrain/Step Time": 17.56905870139599} +{"Full-pretrain/Learning Rate": 3.950163232621273e-05, "Full-pretrain/Loss": 1.980129361152649, "Full-pretrain/Loss (Raw)": 2.004098653793335, "Full-pretrain/Step": 3089, "Full-pretrain/Step Time": 17.573751755058765} +{"Full-pretrain/Learning Rate": 3.9494715146529525e-05, "Full-pretrain/Loss": 1.982420802116394, "Full-pretrain/Loss (Raw)": 2.0554537773132324, "Full-pretrain/Step": 3090, "Full-pretrain/Step Time": 17.580386087298393} +{"Full-pretrain/Learning Rate": 3.948779629488602e-05, "Full-pretrain/Loss": 1.986886739730835, "Full-pretrain/Loss (Raw)": 2.1644251346588135, "Full-pretrain/Step": 3091, "Full-pretrain/Step Time": 17.58005108870566} +{"Full-pretrain/Learning Rate": 3.94808757720803e-05, "Full-pretrain/Loss": 1.984078288078308, "Full-pretrain/Loss (Raw)": 1.9429599046707153, "Full-pretrain/Step": 3092, "Full-pretrain/Step Time": 17.58461968973279} +{"Full-pretrain/Learning Rate": 3.9473953578910644e-05, "Full-pretrain/Loss": 1.9910410642623901, "Full-pretrain/Loss (Raw)": 2.037545680999756, "Full-pretrain/Step": 3093, "Full-pretrain/Step Time": 17.584313111379743} +{"Full-pretrain/Learning Rate": 3.946702971617553e-05, "Full-pretrain/Loss": 1.9935561418533325, "Full-pretrain/Loss (Raw)": 1.9148591756820679, "Full-pretrain/Step": 3094, "Full-pretrain/Step Time": 17.585262017324567} +{"Full-pretrain/Learning Rate": 3.946010418467363e-05, "Full-pretrain/Loss": 1.994242787361145, "Full-pretrain/Loss (Raw)": 1.947481393814087, "Full-pretrain/Step": 3095, "Full-pretrain/Step Time": 17.58457162976265} +{"Full-pretrain/Learning Rate": 3.9453176985203785e-05, "Full-pretrain/Loss": 1.983135461807251, "Full-pretrain/Loss (Raw)": 1.745406150817871, "Full-pretrain/Step": 3096, "Full-pretrain/Step Time": 17.58894931897521} +{"Full-pretrain/Learning Rate": 3.944624811856506e-05, "Full-pretrain/Loss": 1.9734967947006226, "Full-pretrain/Loss (Raw)": 1.7712825536727905, "Full-pretrain/Step": 3097, "Full-pretrain/Step Time": 17.589362043887377} +{"Full-pretrain/Learning Rate": 3.943931758555669e-05, "Full-pretrain/Loss": 1.9751720428466797, "Full-pretrain/Loss (Raw)": 2.0235185623168945, "Full-pretrain/Step": 3098, "Full-pretrain/Step Time": 17.58700712583959} +{"Full-pretrain/Learning Rate": 3.943238538697811e-05, "Full-pretrain/Loss": 1.9718961715698242, "Full-pretrain/Loss (Raw)": 1.9422956705093384, "Full-pretrain/Step": 3099, "Full-pretrain/Step Time": 17.59529618360102} +{"Full-pretrain/Learning Rate": 3.9425451523628954e-05, "Full-pretrain/Loss": 1.9810819625854492, "Full-pretrain/Loss (Raw)": 2.226395606994629, "Full-pretrain/Step": 3100, "Full-pretrain/Step Time": 17.594380024820566} +{"Full-pretrain/Learning Rate": 3.941851599630902e-05, "Full-pretrain/Loss": 1.9722884893417358, "Full-pretrain/Loss (Raw)": 2.1241087913513184, "Full-pretrain/Step": 3101, "Full-pretrain/Step Time": 17.5945593919605} +{"Full-pretrain/Learning Rate": 3.9411578805818344e-05, "Full-pretrain/Loss": 1.9800951480865479, "Full-pretrain/Loss (Raw)": 1.9678677320480347, "Full-pretrain/Step": 3102, "Full-pretrain/Step Time": 17.601007860153913} +{"Full-pretrain/Learning Rate": 3.940463995295712e-05, "Full-pretrain/Loss": 1.9861440658569336, "Full-pretrain/Loss (Raw)": 2.089365243911743, "Full-pretrain/Step": 3103, "Full-pretrain/Step Time": 17.595838567242026} +{"Full-pretrain/Learning Rate": 3.939769943852573e-05, "Full-pretrain/Loss": 1.9824175834655762, "Full-pretrain/Loss (Raw)": 1.9693279266357422, "Full-pretrain/Step": 3104, "Full-pretrain/Step Time": 17.591672165319324} +{"Full-pretrain/Learning Rate": 3.9390757263324774e-05, "Full-pretrain/Loss": 1.980292797088623, "Full-pretrain/Loss (Raw)": 1.9849803447723389, "Full-pretrain/Step": 3105, "Full-pretrain/Step Time": 17.60054619051516} +{"Full-pretrain/Learning Rate": 3.9383813428155025e-05, "Full-pretrain/Loss": 1.9802049398422241, "Full-pretrain/Loss (Raw)": 2.070735216140747, "Full-pretrain/Step": 3106, "Full-pretrain/Step Time": 17.61090323701501} +{"Full-pretrain/Learning Rate": 3.937686793381745e-05, "Full-pretrain/Loss": 1.9801464080810547, "Full-pretrain/Loss (Raw)": 2.0945327281951904, "Full-pretrain/Step": 3107, "Full-pretrain/Step Time": 17.60284954868257} +{"Full-pretrain/Learning Rate": 3.936992078111321e-05, "Full-pretrain/Loss": 1.978684425354004, "Full-pretrain/Loss (Raw)": 1.8243820667266846, "Full-pretrain/Step": 3108, "Full-pretrain/Step Time": 17.609977601096034} +{"Full-pretrain/Learning Rate": 3.936297197084367e-05, "Full-pretrain/Loss": 1.9755406379699707, "Full-pretrain/Loss (Raw)": 1.9853103160858154, "Full-pretrain/Step": 3109, "Full-pretrain/Step Time": 17.607342332601547} +{"Full-pretrain/Learning Rate": 3.935602150381034e-05, "Full-pretrain/Loss": 1.9746572971343994, "Full-pretrain/Loss (Raw)": 1.828534483909607, "Full-pretrain/Step": 3110, "Full-pretrain/Step Time": 17.60683311149478} +{"Full-pretrain/Learning Rate": 3.934906938081499e-05, "Full-pretrain/Loss": 1.995792269706726, "Full-pretrain/Loss (Raw)": 2.4182329177856445, "Full-pretrain/Step": 3111, "Full-pretrain/Step Time": 17.604376001283526} +{"Full-pretrain/Learning Rate": 3.934211560265952e-05, "Full-pretrain/Loss": 1.9963300228118896, "Full-pretrain/Loss (Raw)": 1.969443678855896, "Full-pretrain/Step": 3112, "Full-pretrain/Step Time": 17.605999132618308} +{"Full-pretrain/Learning Rate": 3.933516017014607e-05, "Full-pretrain/Loss": 1.9987895488739014, "Full-pretrain/Loss (Raw)": 2.057884454727173, "Full-pretrain/Step": 3113, "Full-pretrain/Step Time": 17.606794342398643} +{"Full-pretrain/Learning Rate": 3.932820308407692e-05, "Full-pretrain/Loss": 2.0005526542663574, "Full-pretrain/Loss (Raw)": 2.0601515769958496, "Full-pretrain/Step": 3114, "Full-pretrain/Step Time": 17.607168534770608} +{"Full-pretrain/Learning Rate": 3.932124434525458e-05, "Full-pretrain/Loss": 1.9949783086776733, "Full-pretrain/Loss (Raw)": 1.9910404682159424, "Full-pretrain/Step": 3115, "Full-pretrain/Step Time": 17.607716785743833} +{"Full-pretrain/Learning Rate": 3.931428395448174e-05, "Full-pretrain/Loss": 1.9938757419586182, "Full-pretrain/Loss (Raw)": 1.9871220588684082, "Full-pretrain/Step": 3116, "Full-pretrain/Step Time": 17.61161307245493} +{"Full-pretrain/Learning Rate": 3.930732191256128e-05, "Full-pretrain/Loss": 2.003915309906006, "Full-pretrain/Loss (Raw)": 2.088068962097168, "Full-pretrain/Step": 3117, "Full-pretrain/Step Time": 17.61705232411623} +{"Full-pretrain/Learning Rate": 3.930035822029626e-05, "Full-pretrain/Loss": 2.0031380653381348, "Full-pretrain/Loss (Raw)": 2.0214414596557617, "Full-pretrain/Step": 3118, "Full-pretrain/Step Time": 17.619251407682896} +{"Full-pretrain/Learning Rate": 3.9293392878489945e-05, "Full-pretrain/Loss": 2.0091609954833984, "Full-pretrain/Loss (Raw)": 2.15242338180542, "Full-pretrain/Step": 3119, "Full-pretrain/Step Time": 17.626194475218654} +{"Full-pretrain/Learning Rate": 3.928642588794579e-05, "Full-pretrain/Loss": 2.0144524574279785, "Full-pretrain/Loss (Raw)": 2.001807689666748, "Full-pretrain/Step": 3120, "Full-pretrain/Step Time": 17.625668650493026} +{"Full-pretrain/Learning Rate": 3.927945724946742e-05, "Full-pretrain/Loss": 2.0136826038360596, "Full-pretrain/Loss (Raw)": 1.9794583320617676, "Full-pretrain/Step": 3121, "Full-pretrain/Step Time": 17.62853747420013} +{"Full-pretrain/Learning Rate": 3.927248696385868e-05, "Full-pretrain/Loss": 2.0123767852783203, "Full-pretrain/Loss (Raw)": 2.0136656761169434, "Full-pretrain/Step": 3122, "Full-pretrain/Step Time": 17.638238871470094} +{"Full-pretrain/Learning Rate": 3.926551503192358e-05, "Full-pretrain/Loss": 2.0052685737609863, "Full-pretrain/Loss (Raw)": 1.93696129322052, "Full-pretrain/Step": 3123, "Full-pretrain/Step Time": 17.64577541127801} +{"Full-pretrain/Learning Rate": 3.925854145446635e-05, "Full-pretrain/Loss": 2.006866693496704, "Full-pretrain/Loss (Raw)": 1.9941062927246094, "Full-pretrain/Step": 3124, "Full-pretrain/Step Time": 17.64758089184761} +{"Full-pretrain/Learning Rate": 3.925156623229136e-05, "Full-pretrain/Loss": 2.0141587257385254, "Full-pretrain/Loss (Raw)": 2.2708911895751953, "Full-pretrain/Step": 3125, "Full-pretrain/Step Time": 17.648020403459668} +{"Full-pretrain/Learning Rate": 3.924458936620321e-05, "Full-pretrain/Loss": 2.0163846015930176, "Full-pretrain/Loss (Raw)": 1.986080288887024, "Full-pretrain/Step": 3126, "Full-pretrain/Step Time": 17.654970725998282} +{"Full-pretrain/Learning Rate": 3.923761085700669e-05, "Full-pretrain/Loss": 2.0161962509155273, "Full-pretrain/Loss (Raw)": 1.9414584636688232, "Full-pretrain/Step": 3127, "Full-pretrain/Step Time": 17.65974915213883} +{"Full-pretrain/Learning Rate": 3.923063070550676e-05, "Full-pretrain/Loss": 2.0347564220428467, "Full-pretrain/Loss (Raw)": 2.3393287658691406, "Full-pretrain/Step": 3128, "Full-pretrain/Step Time": 17.658496098592877} +{"Full-pretrain/Learning Rate": 3.922364891250857e-05, "Full-pretrain/Loss": 2.0360445976257324, "Full-pretrain/Loss (Raw)": 1.8125110864639282, "Full-pretrain/Step": 3129, "Full-pretrain/Step Time": 17.66479648090899} +{"Full-pretrain/Learning Rate": 3.921666547881749e-05, "Full-pretrain/Loss": 2.035708427429199, "Full-pretrain/Loss (Raw)": 2.0127463340759277, "Full-pretrain/Step": 3130, "Full-pretrain/Step Time": 17.668491626158357} +{"Full-pretrain/Learning Rate": 3.920968040523904e-05, "Full-pretrain/Loss": 2.0310816764831543, "Full-pretrain/Loss (Raw)": 1.7942519187927246, "Full-pretrain/Step": 3131, "Full-pretrain/Step Time": 17.669559309259057} +{"Full-pretrain/Learning Rate": 3.920269369257895e-05, "Full-pretrain/Loss": 2.0255069732666016, "Full-pretrain/Loss (Raw)": 2.0480029582977295, "Full-pretrain/Step": 3132, "Full-pretrain/Step Time": 17.66970205307007} +{"Full-pretrain/Learning Rate": 3.919570534164313e-05, "Full-pretrain/Loss": 2.0250444412231445, "Full-pretrain/Loss (Raw)": 2.1093058586120605, "Full-pretrain/Step": 3133, "Full-pretrain/Step Time": 17.675583750009537} +{"Full-pretrain/Learning Rate": 3.918871535323769e-05, "Full-pretrain/Loss": 2.031705379486084, "Full-pretrain/Loss (Raw)": 2.1810085773468018, "Full-pretrain/Step": 3134, "Full-pretrain/Step Time": 17.67613486945629} +{"Full-pretrain/Learning Rate": 3.9181723728168916e-05, "Full-pretrain/Loss": 2.0309906005859375, "Full-pretrain/Loss (Raw)": 2.066504955291748, "Full-pretrain/Step": 3135, "Full-pretrain/Step Time": 17.679646147415042} +{"Full-pretrain/Learning Rate": 3.9174730467243294e-05, "Full-pretrain/Loss": 2.027714729309082, "Full-pretrain/Loss (Raw)": 1.8644938468933105, "Full-pretrain/Step": 3136, "Full-pretrain/Step Time": 17.679356770589948} +{"Full-pretrain/Learning Rate": 3.91677355712675e-05, "Full-pretrain/Loss": 2.025009870529175, "Full-pretrain/Loss (Raw)": 1.898431420326233, "Full-pretrain/Step": 3137, "Full-pretrain/Step Time": 17.680354891344905} +{"Full-pretrain/Learning Rate": 3.9160739041048375e-05, "Full-pretrain/Loss": 2.018423080444336, "Full-pretrain/Loss (Raw)": 1.85995614528656, "Full-pretrain/Step": 3138, "Full-pretrain/Step Time": 17.681598715484142} +{"Full-pretrain/Learning Rate": 3.915374087739299e-05, "Full-pretrain/Loss": 2.0133020877838135, "Full-pretrain/Loss (Raw)": 1.9306632280349731, "Full-pretrain/Step": 3139, "Full-pretrain/Step Time": 17.688386771827936} +{"Full-pretrain/Learning Rate": 3.914674108110857e-05, "Full-pretrain/Loss": 2.0097620487213135, "Full-pretrain/Loss (Raw)": 1.711097240447998, "Full-pretrain/Step": 3140, "Full-pretrain/Step Time": 17.68758494220674} +{"Full-pretrain/Learning Rate": 3.913973965300253e-05, "Full-pretrain/Loss": 2.009732723236084, "Full-pretrain/Loss (Raw)": 1.9843708276748657, "Full-pretrain/Step": 3141, "Full-pretrain/Step Time": 17.68452476710081} +{"Full-pretrain/Learning Rate": 3.913273659388249e-05, "Full-pretrain/Loss": 2.016709804534912, "Full-pretrain/Loss (Raw)": 2.0518031120300293, "Full-pretrain/Step": 3142, "Full-pretrain/Step Time": 17.69106474891305} +{"Full-pretrain/Learning Rate": 3.912573190455626e-05, "Full-pretrain/Loss": 2.005039930343628, "Full-pretrain/Loss (Raw)": 2.0447933673858643, "Full-pretrain/Step": 3143, "Full-pretrain/Step Time": 17.698841024190187} +{"Full-pretrain/Learning Rate": 3.911872558583181e-05, "Full-pretrain/Loss": 2.014293670654297, "Full-pretrain/Loss (Raw)": 2.2655656337738037, "Full-pretrain/Step": 3144, "Full-pretrain/Step Time": 17.69981617666781} +{"Full-pretrain/Learning Rate": 3.911171763851733e-05, "Full-pretrain/Loss": 2.0156426429748535, "Full-pretrain/Loss (Raw)": 2.101048469543457, "Full-pretrain/Step": 3145, "Full-pretrain/Step Time": 17.696170315146446} +{"Full-pretrain/Learning Rate": 3.910470806342117e-05, "Full-pretrain/Loss": 2.0193231105804443, "Full-pretrain/Loss (Raw)": 2.1779305934906006, "Full-pretrain/Step": 3146, "Full-pretrain/Step Time": 17.70334721915424} +{"Full-pretrain/Learning Rate": 3.9097696861351896e-05, "Full-pretrain/Loss": 2.026533842086792, "Full-pretrain/Loss (Raw)": 2.2217817306518555, "Full-pretrain/Step": 3147, "Full-pretrain/Step Time": 17.712385142222047} +{"Full-pretrain/Learning Rate": 3.9090684033118254e-05, "Full-pretrain/Loss": 2.024597406387329, "Full-pretrain/Loss (Raw)": 1.9251564741134644, "Full-pretrain/Step": 3148, "Full-pretrain/Step Time": 17.719835996627808} +{"Full-pretrain/Learning Rate": 3.908366957952915e-05, "Full-pretrain/Loss": 2.01370906829834, "Full-pretrain/Loss (Raw)": 1.7396447658538818, "Full-pretrain/Step": 3149, "Full-pretrain/Step Time": 17.724335027858615} +{"Full-pretrain/Learning Rate": 3.907665350139371e-05, "Full-pretrain/Loss": 2.0124008655548096, "Full-pretrain/Loss (Raw)": 1.979575753211975, "Full-pretrain/Step": 3150, "Full-pretrain/Step Time": 17.72499698586762} +{"Full-pretrain/Learning Rate": 3.906963579952124e-05, "Full-pretrain/Loss": 1.9975382089614868, "Full-pretrain/Loss (Raw)": 1.6768213510513306, "Full-pretrain/Step": 3151, "Full-pretrain/Step Time": 17.73617099225521} +{"Full-pretrain/Learning Rate": 3.906261647472122e-05, "Full-pretrain/Loss": 1.9885296821594238, "Full-pretrain/Loss (Raw)": 1.7135359048843384, "Full-pretrain/Step": 3152, "Full-pretrain/Step Time": 17.732740119099617} +{"Full-pretrain/Learning Rate": 3.905559552780333e-05, "Full-pretrain/Loss": 1.9799950122833252, "Full-pretrain/Loss (Raw)": 1.7063474655151367, "Full-pretrain/Step": 3153, "Full-pretrain/Step Time": 17.738240307196975} +{"Full-pretrain/Learning Rate": 3.904857295957744e-05, "Full-pretrain/Loss": 1.9813024997711182, "Full-pretrain/Loss (Raw)": 2.0555052757263184, "Full-pretrain/Step": 3154, "Full-pretrain/Step Time": 17.742115458473563} +{"Full-pretrain/Learning Rate": 3.90415487708536e-05, "Full-pretrain/Loss": 1.9797487258911133, "Full-pretrain/Loss (Raw)": 1.8872407674789429, "Full-pretrain/Step": 3155, "Full-pretrain/Step Time": 17.746150648221374} +{"Full-pretrain/Learning Rate": 3.903452296244204e-05, "Full-pretrain/Loss": 1.9799033403396606, "Full-pretrain/Loss (Raw)": 1.9990530014038086, "Full-pretrain/Step": 3156, "Full-pretrain/Step Time": 17.753013690933585} +{"Full-pretrain/Learning Rate": 3.9027495535153185e-05, "Full-pretrain/Loss": 1.9712527990341187, "Full-pretrain/Loss (Raw)": 1.994077205657959, "Full-pretrain/Step": 3157, "Full-pretrain/Step Time": 17.761739222332835} +{"Full-pretrain/Learning Rate": 3.902046648979766e-05, "Full-pretrain/Loss": 1.9625099897384644, "Full-pretrain/Loss (Raw)": 1.7063062191009521, "Full-pretrain/Step": 3158, "Full-pretrain/Step Time": 17.76348370499909} +{"Full-pretrain/Learning Rate": 3.901343582718624e-05, "Full-pretrain/Loss": 1.9745941162109375, "Full-pretrain/Loss (Raw)": 2.3281543254852295, "Full-pretrain/Step": 3159, "Full-pretrain/Step Time": 17.768609277904034} +{"Full-pretrain/Learning Rate": 3.900640354812992e-05, "Full-pretrain/Loss": 1.9628623723983765, "Full-pretrain/Loss (Raw)": 1.9639108180999756, "Full-pretrain/Step": 3160, "Full-pretrain/Step Time": 17.771659718826413} +{"Full-pretrain/Learning Rate": 3.899936965343989e-05, "Full-pretrain/Loss": 1.971936821937561, "Full-pretrain/Loss (Raw)": 2.1028947830200195, "Full-pretrain/Step": 3161, "Full-pretrain/Step Time": 17.775139262899756} +{"Full-pretrain/Learning Rate": 3.8992334143927475e-05, "Full-pretrain/Loss": 1.982812762260437, "Full-pretrain/Loss (Raw)": 2.360776901245117, "Full-pretrain/Step": 3162, "Full-pretrain/Step Time": 17.78237716667354} +{"Full-pretrain/Learning Rate": 3.8985297020404244e-05, "Full-pretrain/Loss": 1.9963717460632324, "Full-pretrain/Loss (Raw)": 2.228137493133545, "Full-pretrain/Step": 3163, "Full-pretrain/Step Time": 17.789653120562434} +{"Full-pretrain/Learning Rate": 3.897825828368191e-05, "Full-pretrain/Loss": 1.9998351335525513, "Full-pretrain/Loss (Raw)": 2.1588306427001953, "Full-pretrain/Step": 3164, "Full-pretrain/Step Time": 17.79246680624783} +{"Full-pretrain/Learning Rate": 3.897121793457239e-05, "Full-pretrain/Loss": 1.9922159910202026, "Full-pretrain/Loss (Raw)": 1.8654954433441162, "Full-pretrain/Step": 3165, "Full-pretrain/Step Time": 17.8029467407614} +{"Full-pretrain/Learning Rate": 3.896417597388781e-05, "Full-pretrain/Loss": 1.9795000553131104, "Full-pretrain/Loss (Raw)": 1.7740986347198486, "Full-pretrain/Step": 3166, "Full-pretrain/Step Time": 17.813114201650023} +{"Full-pretrain/Learning Rate": 3.8957132402440425e-05, "Full-pretrain/Loss": 1.96843683719635, "Full-pretrain/Loss (Raw)": 1.7124812602996826, "Full-pretrain/Step": 3167, "Full-pretrain/Step Time": 17.823742074891925} +{"Full-pretrain/Learning Rate": 3.895008722104272e-05, "Full-pretrain/Loss": 1.9712388515472412, "Full-pretrain/Loss (Raw)": 1.9541544914245605, "Full-pretrain/Step": 3168, "Full-pretrain/Step Time": 17.826062934473157} +{"Full-pretrain/Learning Rate": 3.894304043050736e-05, "Full-pretrain/Loss": 1.9762461185455322, "Full-pretrain/Loss (Raw)": 2.0586681365966797, "Full-pretrain/Step": 3169, "Full-pretrain/Step Time": 17.836808862164617} +{"Full-pretrain/Learning Rate": 3.893599203164718e-05, "Full-pretrain/Loss": 1.9710633754730225, "Full-pretrain/Loss (Raw)": 1.6941064596176147, "Full-pretrain/Step": 3170, "Full-pretrain/Step Time": 17.835348304361105} +{"Full-pretrain/Learning Rate": 3.892894202527523e-05, "Full-pretrain/Loss": 1.9741626977920532, "Full-pretrain/Loss (Raw)": 2.0298421382904053, "Full-pretrain/Step": 3171, "Full-pretrain/Step Time": 17.84663396142423} +{"Full-pretrain/Learning Rate": 3.8921890412204705e-05, "Full-pretrain/Loss": 1.985106110572815, "Full-pretrain/Loss (Raw)": 2.061281681060791, "Full-pretrain/Step": 3172, "Full-pretrain/Step Time": 17.849616277962923} +{"Full-pretrain/Learning Rate": 3.891483719324901e-05, "Full-pretrain/Loss": 1.9820491075515747, "Full-pretrain/Loss (Raw)": 1.8865488767623901, "Full-pretrain/Step": 3173, "Full-pretrain/Step Time": 17.863282730802894} +{"Full-pretrain/Learning Rate": 3.890778236922174e-05, "Full-pretrain/Loss": 1.9777414798736572, "Full-pretrain/Loss (Raw)": 1.9139595031738281, "Full-pretrain/Step": 3174, "Full-pretrain/Step Time": 17.86807106807828} +{"Full-pretrain/Learning Rate": 3.890072594093666e-05, "Full-pretrain/Loss": 1.9682339429855347, "Full-pretrain/Loss (Raw)": 1.740553379058838, "Full-pretrain/Step": 3175, "Full-pretrain/Step Time": 17.880843875929713} +{"Full-pretrain/Learning Rate": 3.8893667909207734e-05, "Full-pretrain/Loss": 1.9559346437454224, "Full-pretrain/Loss (Raw)": 1.8719854354858398, "Full-pretrain/Step": 3176, "Full-pretrain/Step Time": 17.88607496768236} +{"Full-pretrain/Learning Rate": 3.888660827484908e-05, "Full-pretrain/Loss": 1.9596751928329468, "Full-pretrain/Loss (Raw)": 2.2207469940185547, "Full-pretrain/Step": 3177, "Full-pretrain/Step Time": 17.890125857666135} +{"Full-pretrain/Learning Rate": 3.887954703867506e-05, "Full-pretrain/Loss": 1.958787202835083, "Full-pretrain/Loss (Raw)": 2.149513006210327, "Full-pretrain/Step": 3178, "Full-pretrain/Step Time": 17.899616930633783} +{"Full-pretrain/Learning Rate": 3.887248420150016e-05, "Full-pretrain/Loss": 1.9518944025039673, "Full-pretrain/Loss (Raw)": 2.0012145042419434, "Full-pretrain/Step": 3179, "Full-pretrain/Step Time": 17.90825548581779} +{"Full-pretrain/Learning Rate": 3.886541976413908e-05, "Full-pretrain/Loss": 1.956600546836853, "Full-pretrain/Loss (Raw)": 2.075754165649414, "Full-pretrain/Step": 3180, "Full-pretrain/Step Time": 17.91965977847576} +{"Full-pretrain/Learning Rate": 3.88583537274067e-05, "Full-pretrain/Loss": 1.9601292610168457, "Full-pretrain/Loss (Raw)": 1.852563738822937, "Full-pretrain/Step": 3181, "Full-pretrain/Step Time": 17.920002235099673} +{"Full-pretrain/Learning Rate": 3.885128609211809e-05, "Full-pretrain/Loss": 1.9622350931167603, "Full-pretrain/Loss (Raw)": 2.0469627380371094, "Full-pretrain/Step": 3182, "Full-pretrain/Step Time": 17.929264897480607} +{"Full-pretrain/Learning Rate": 3.88442168590885e-05, "Full-pretrain/Loss": 1.9645581245422363, "Full-pretrain/Loss (Raw)": 1.7511570453643799, "Full-pretrain/Step": 3183, "Full-pretrain/Step Time": 17.938947539776564} +{"Full-pretrain/Learning Rate": 3.8837146029133367e-05, "Full-pretrain/Loss": 1.9743022918701172, "Full-pretrain/Loss (Raw)": 2.025351047515869, "Full-pretrain/Step": 3184, "Full-pretrain/Step Time": 17.95997789502144} +{"Full-pretrain/Learning Rate": 3.8830073603068294e-05, "Full-pretrain/Loss": 1.9826712608337402, "Full-pretrain/Loss (Raw)": 1.9741523265838623, "Full-pretrain/Step": 3185, "Full-pretrain/Step Time": 17.963846007362008} +{"Full-pretrain/Learning Rate": 3.882299958170909e-05, "Full-pretrain/Loss": 1.9813469648361206, "Full-pretrain/Loss (Raw)": 2.0131306648254395, "Full-pretrain/Step": 3186, "Full-pretrain/Step Time": 17.979643700644374} +{"Full-pretrain/Learning Rate": 3.881592396587175e-05, "Full-pretrain/Loss": 1.984337568283081, "Full-pretrain/Loss (Raw)": 1.9829410314559937, "Full-pretrain/Step": 3187, "Full-pretrain/Step Time": 17.989895474165678} +{"Full-pretrain/Learning Rate": 3.880884675637242e-05, "Full-pretrain/Loss": 1.9889706373214722, "Full-pretrain/Loss (Raw)": 2.147310256958008, "Full-pretrain/Step": 3188, "Full-pretrain/Step Time": 18.011261822655797} +{"Full-pretrain/Learning Rate": 3.880176795402748e-05, "Full-pretrain/Loss": 1.982429027557373, "Full-pretrain/Loss (Raw)": 1.7847411632537842, "Full-pretrain/Step": 3189, "Full-pretrain/Step Time": 18.01887915469706} +{"Full-pretrain/Learning Rate": 3.879468755965346e-05, "Full-pretrain/Loss": 1.9902249574661255, "Full-pretrain/Loss (Raw)": 1.9557795524597168, "Full-pretrain/Step": 3190, "Full-pretrain/Step Time": 18.03454609401524} +{"Full-pretrain/Learning Rate": 3.8787605574067074e-05, "Full-pretrain/Loss": 1.9788110256195068, "Full-pretrain/Loss (Raw)": 1.962910771369934, "Full-pretrain/Step": 3191, "Full-pretrain/Step Time": 18.056694412603974} +{"Full-pretrain/Learning Rate": 3.878052199808523e-05, "Full-pretrain/Loss": 1.9776840209960938, "Full-pretrain/Loss (Raw)": 1.9278427362442017, "Full-pretrain/Step": 3192, "Full-pretrain/Step Time": 18.072659850120544} +{"Full-pretrain/Learning Rate": 3.877343683252501e-05, "Full-pretrain/Loss": 1.9811707735061646, "Full-pretrain/Loss (Raw)": 2.214470863342285, "Full-pretrain/Step": 3193, "Full-pretrain/Step Time": 18.083891270682216} +{"Full-pretrain/Learning Rate": 3.87663500782037e-05, "Full-pretrain/Loss": 1.9700000286102295, "Full-pretrain/Loss (Raw)": 2.003312587738037, "Full-pretrain/Step": 3194, "Full-pretrain/Step Time": 18.09820364974439} +{"Full-pretrain/Learning Rate": 3.875926173593875e-05, "Full-pretrain/Loss": 1.9616941213607788, "Full-pretrain/Loss (Raw)": 1.96234929561615, "Full-pretrain/Step": 3195, "Full-pretrain/Step Time": 18.123761244118214} +{"Full-pretrain/Learning Rate": 3.8752171806547787e-05, "Full-pretrain/Loss": 1.9600245952606201, "Full-pretrain/Loss (Raw)": 2.1054062843322754, "Full-pretrain/Step": 3196, "Full-pretrain/Step Time": 18.13114488311112} +{"Full-pretrain/Learning Rate": 3.874508029084863e-05, "Full-pretrain/Loss": 1.9673783779144287, "Full-pretrain/Loss (Raw)": 2.100818157196045, "Full-pretrain/Step": 3197, "Full-pretrain/Step Time": 18.14453962817788} +{"Full-pretrain/Learning Rate": 3.8737987189659315e-05, "Full-pretrain/Loss": 1.9700201749801636, "Full-pretrain/Loss (Raw)": 1.8586333990097046, "Full-pretrain/Step": 3198, "Full-pretrain/Step Time": 18.152384486049414} +{"Full-pretrain/Learning Rate": 3.873089250379799e-05, "Full-pretrain/Loss": 1.9709947109222412, "Full-pretrain/Loss (Raw)": 1.7436678409576416, "Full-pretrain/Step": 3199, "Full-pretrain/Step Time": 18.17475849762559} +{"Full-pretrain/Learning Rate": 3.872379623408304e-05, "Full-pretrain/Loss": 1.967556118965149, "Full-pretrain/Loss (Raw)": 1.844117283821106, "Full-pretrain/Step": 3200, "Full-pretrain/Step Time": 18.188263934105635} +{"Full-pretrain/Learning Rate": 3.871669838133303e-05, "Full-pretrain/Loss": 1.973633885383606, "Full-pretrain/Loss (Raw)": 2.253159999847412, "Full-pretrain/Step": 3201, "Full-pretrain/Step Time": 18.203768534585834} +{"Full-pretrain/Learning Rate": 3.870959894636666e-05, "Full-pretrain/Loss": 1.9733504056930542, "Full-pretrain/Loss (Raw)": 1.6850333213806152, "Full-pretrain/Step": 3202, "Full-pretrain/Step Time": 18.219172144308686} +{"Full-pretrain/Learning Rate": 3.870249793000289e-05, "Full-pretrain/Loss": 1.974825143814087, "Full-pretrain/Loss (Raw)": 2.077033758163452, "Full-pretrain/Step": 3203, "Full-pretrain/Step Time": 18.235325824469328} +{"Full-pretrain/Learning Rate": 3.869539533306079e-05, "Full-pretrain/Loss": 1.9654573202133179, "Full-pretrain/Loss (Raw)": 1.7615113258361816, "Full-pretrain/Step": 3204, "Full-pretrain/Step Time": 18.265881061553955} +{"Full-pretrain/Learning Rate": 3.8688291156359655e-05, "Full-pretrain/Loss": 1.9624732732772827, "Full-pretrain/Loss (Raw)": 1.7910597324371338, "Full-pretrain/Step": 3205, "Full-pretrain/Step Time": 18.28375532478094} +{"Full-pretrain/Learning Rate": 3.868118540071894e-05, "Full-pretrain/Loss": 1.9554940462112427, "Full-pretrain/Loss (Raw)": 1.6906242370605469, "Full-pretrain/Step": 3206, "Full-pretrain/Step Time": 18.309698851779103} +{"Full-pretrain/Learning Rate": 3.8674078066958296e-05, "Full-pretrain/Loss": 1.96820068359375, "Full-pretrain/Loss (Raw)": 2.1471669673919678, "Full-pretrain/Step": 3207, "Full-pretrain/Step Time": 18.3338073939085} +{"Full-pretrain/Learning Rate": 3.866696915589756e-05, "Full-pretrain/Loss": 1.9715139865875244, "Full-pretrain/Loss (Raw)": 1.9780114889144897, "Full-pretrain/Step": 3208, "Full-pretrain/Step Time": 18.359277300536633} +{"Full-pretrain/Learning Rate": 3.865985866835673e-05, "Full-pretrain/Loss": 1.9618275165557861, "Full-pretrain/Loss (Raw)": 1.9107773303985596, "Full-pretrain/Step": 3209, "Full-pretrain/Step Time": 18.377063490450382} +{"Full-pretrain/Learning Rate": 3.8652746605156e-05, "Full-pretrain/Loss": 1.957519769668579, "Full-pretrain/Loss (Raw)": 2.011664867401123, "Full-pretrain/Step": 3210, "Full-pretrain/Step Time": 18.398213820531964} +{"Full-pretrain/Learning Rate": 3.8645632967115753e-05, "Full-pretrain/Loss": 1.95601487159729, "Full-pretrain/Loss (Raw)": 1.9530630111694336, "Full-pretrain/Step": 3211, "Full-pretrain/Step Time": 18.427404139190912} +{"Full-pretrain/Learning Rate": 3.863851775505654e-05, "Full-pretrain/Loss": 1.9558137655258179, "Full-pretrain/Loss (Raw)": 2.06931734085083, "Full-pretrain/Step": 3212, "Full-pretrain/Step Time": 18.443166244775057} +{"Full-pretrain/Learning Rate": 3.8631400969799095e-05, "Full-pretrain/Loss": 1.9585933685302734, "Full-pretrain/Loss (Raw)": 1.9415115118026733, "Full-pretrain/Step": 3213, "Full-pretrain/Step Time": 18.462593622505665} +{"Full-pretrain/Learning Rate": 3.862428261216433e-05, "Full-pretrain/Loss": 1.962958812713623, "Full-pretrain/Loss (Raw)": 2.1866559982299805, "Full-pretrain/Step": 3214, "Full-pretrain/Step Time": 18.483074499294162} +{"Full-pretrain/Learning Rate": 3.861716268297336e-05, "Full-pretrain/Loss": 1.967698335647583, "Full-pretrain/Loss (Raw)": 1.902820110321045, "Full-pretrain/Step": 3215, "Full-pretrain/Step Time": 18.501324271783233} +{"Full-pretrain/Learning Rate": 3.861004118304746e-05, "Full-pretrain/Loss": 1.9625859260559082, "Full-pretrain/Loss (Raw)": 1.8617521524429321, "Full-pretrain/Step": 3216, "Full-pretrain/Step Time": 18.5318149831146} +{"Full-pretrain/Learning Rate": 3.86029181132081e-05, "Full-pretrain/Loss": 1.9637622833251953, "Full-pretrain/Loss (Raw)": 2.011794090270996, "Full-pretrain/Step": 3217, "Full-pretrain/Step Time": 18.54185164347291} +{"Full-pretrain/Learning Rate": 3.85957934742769e-05, "Full-pretrain/Loss": 1.970512866973877, "Full-pretrain/Loss (Raw)": 2.229151964187622, "Full-pretrain/Step": 3218, "Full-pretrain/Step Time": 18.55213731341064} +{"Full-pretrain/Learning Rate": 3.858866726707572e-05, "Full-pretrain/Loss": 1.9690935611724854, "Full-pretrain/Loss (Raw)": 1.9375232458114624, "Full-pretrain/Step": 3219, "Full-pretrain/Step Time": 18.578353440389037} +{"Full-pretrain/Learning Rate": 3.858153949242653e-05, "Full-pretrain/Loss": 1.9640259742736816, "Full-pretrain/Loss (Raw)": 1.985144853591919, "Full-pretrain/Step": 3220, "Full-pretrain/Step Time": 18.596329575404525} +{"Full-pretrain/Learning Rate": 3.857441015115154e-05, "Full-pretrain/Loss": 1.9765937328338623, "Full-pretrain/Loss (Raw)": 2.186908483505249, "Full-pretrain/Step": 3221, "Full-pretrain/Step Time": 18.62382081709802} +{"Full-pretrain/Learning Rate": 3.856727924407311e-05, "Full-pretrain/Loss": 1.9769748449325562, "Full-pretrain/Loss (Raw)": 1.9679782390594482, "Full-pretrain/Step": 3222, "Full-pretrain/Step Time": 18.648781713098288} +{"Full-pretrain/Learning Rate": 3.856014677201378e-05, "Full-pretrain/Loss": 1.9767518043518066, "Full-pretrain/Loss (Raw)": 1.9557760953903198, "Full-pretrain/Step": 3223, "Full-pretrain/Step Time": 18.683378336951137} +{"Full-pretrain/Learning Rate": 3.855301273579629e-05, "Full-pretrain/Loss": 1.9828855991363525, "Full-pretrain/Loss (Raw)": 2.124119758605957, "Full-pretrain/Step": 3224, "Full-pretrain/Step Time": 18.708727622404695} +{"Full-pretrain/Learning Rate": 3.8545877136243545e-05, "Full-pretrain/Loss": 1.9772045612335205, "Full-pretrain/Loss (Raw)": 2.032680034637451, "Full-pretrain/Step": 3225, "Full-pretrain/Step Time": 18.737734152004123} +{"Full-pretrain/Learning Rate": 3.8538739974178635e-05, "Full-pretrain/Loss": 1.9757136106491089, "Full-pretrain/Loss (Raw)": 1.9556019306182861, "Full-pretrain/Step": 3226, "Full-pretrain/Step Time": 18.7718543484807} +{"Full-pretrain/Learning Rate": 3.853160125042482e-05, "Full-pretrain/Loss": 1.9717631340026855, "Full-pretrain/Loss (Raw)": 1.835934042930603, "Full-pretrain/Step": 3227, "Full-pretrain/Step Time": 18.806106628850102} +{"Full-pretrain/Learning Rate": 3.852446096580556e-05, "Full-pretrain/Loss": 1.9618244171142578, "Full-pretrain/Loss (Raw)": 1.7873680591583252, "Full-pretrain/Step": 3228, "Full-pretrain/Step Time": 18.83217289671302} +{"Full-pretrain/Learning Rate": 3.851731912114448e-05, "Full-pretrain/Loss": 1.956148624420166, "Full-pretrain/Loss (Raw)": 1.9191900491714478, "Full-pretrain/Step": 3229, "Full-pretrain/Step Time": 18.871996693313122} +{"Full-pretrain/Learning Rate": 3.8510175717265387e-05, "Full-pretrain/Loss": 1.9530837535858154, "Full-pretrain/Loss (Raw)": 1.7605600357055664, "Full-pretrain/Step": 3230, "Full-pretrain/Step Time": 18.904956743121147} +{"Full-pretrain/Learning Rate": 3.8503030754992276e-05, "Full-pretrain/Loss": 1.9557151794433594, "Full-pretrain/Loss (Raw)": 1.8278717994689941, "Full-pretrain/Step": 3231, "Full-pretrain/Step Time": 18.929722340777516} +{"Full-pretrain/Learning Rate": 3.849588423514932e-05, "Full-pretrain/Loss": 1.9476763010025024, "Full-pretrain/Loss (Raw)": 1.5868735313415527, "Full-pretrain/Step": 3232, "Full-pretrain/Step Time": 18.96098681166768} +{"Full-pretrain/Learning Rate": 3.848873615856084e-05, "Full-pretrain/Loss": 1.9390426874160767, "Full-pretrain/Loss (Raw)": 1.9768871068954468, "Full-pretrain/Step": 3233, "Full-pretrain/Step Time": 18.99048923701048} +{"Full-pretrain/Learning Rate": 3.848158652605141e-05, "Full-pretrain/Loss": 1.9516229629516602, "Full-pretrain/Loss (Raw)": 2.08760404586792, "Full-pretrain/Step": 3234, "Full-pretrain/Step Time": 19.018038691952825} +{"Full-pretrain/Learning Rate": 3.847443533844569e-05, "Full-pretrain/Loss": 1.9466142654418945, "Full-pretrain/Loss (Raw)": 1.9167520999908447, "Full-pretrain/Step": 3235, "Full-pretrain/Step Time": 19.053385170176625} +{"Full-pretrain/Learning Rate": 3.84672825965686e-05, "Full-pretrain/Loss": 1.9569541215896606, "Full-pretrain/Loss (Raw)": 2.0923898220062256, "Full-pretrain/Step": 3236, "Full-pretrain/Step Time": 19.085714608430862} +{"Full-pretrain/Learning Rate": 3.846012830124519e-05, "Full-pretrain/Loss": 1.9654309749603271, "Full-pretrain/Loss (Raw)": 2.0623180866241455, "Full-pretrain/Step": 3237, "Full-pretrain/Step Time": 19.13228972814977} +{"Full-pretrain/Learning Rate": 3.845297245330071e-05, "Full-pretrain/Loss": 1.9763468503952026, "Full-pretrain/Loss (Raw)": 2.039933681488037, "Full-pretrain/Step": 3238, "Full-pretrain/Step Time": 19.164068520069122} +{"Full-pretrain/Learning Rate": 3.8445815053560595e-05, "Full-pretrain/Loss": 1.9708881378173828, "Full-pretrain/Loss (Raw)": 1.972486138343811, "Full-pretrain/Step": 3239, "Full-pretrain/Step Time": 19.200482711195946} +{"Full-pretrain/Learning Rate": 3.8438656102850435e-05, "Full-pretrain/Loss": 1.9678088426589966, "Full-pretrain/Loss (Raw)": 1.879476547241211, "Full-pretrain/Step": 3240, "Full-pretrain/Step Time": 19.232317315414548} +{"Full-pretrain/Learning Rate": 3.843149560199601e-05, "Full-pretrain/Loss": 1.9752670526504517, "Full-pretrain/Loss (Raw)": 2.1494357585906982, "Full-pretrain/Step": 3241, "Full-pretrain/Step Time": 19.26488297060132} +{"Full-pretrain/Learning Rate": 3.842433355182329e-05, "Full-pretrain/Loss": 1.9779354333877563, "Full-pretrain/Loss (Raw)": 2.0970566272735596, "Full-pretrain/Step": 3242, "Full-pretrain/Step Time": 19.3060441352427} +{"Full-pretrain/Learning Rate": 3.8417169953158414e-05, "Full-pretrain/Loss": 1.9841701984405518, "Full-pretrain/Loss (Raw)": 2.152575969696045, "Full-pretrain/Step": 3243, "Full-pretrain/Step Time": 19.343655940145254} +{"Full-pretrain/Learning Rate": 3.841000480682769e-05, "Full-pretrain/Loss": 1.9773589372634888, "Full-pretrain/Loss (Raw)": 1.8513555526733398, "Full-pretrain/Step": 3244, "Full-pretrain/Step Time": 19.387903176248074} +{"Full-pretrain/Learning Rate": 3.840283811365764e-05, "Full-pretrain/Loss": 1.9759480953216553, "Full-pretrain/Loss (Raw)": 1.8963645696640015, "Full-pretrain/Step": 3245, "Full-pretrain/Step Time": 19.43777360767126} +{"Full-pretrain/Learning Rate": 3.8395669874474915e-05, "Full-pretrain/Loss": 1.9736690521240234, "Full-pretrain/Loss (Raw)": 2.1137266159057617, "Full-pretrain/Step": 3246, "Full-pretrain/Step Time": 19.47223717905581} +{"Full-pretrain/Learning Rate": 3.838850009010638e-05, "Full-pretrain/Loss": 1.971658706665039, "Full-pretrain/Loss (Raw)": 1.8384891748428345, "Full-pretrain/Step": 3247, "Full-pretrain/Step Time": 19.508938862010837} +{"Full-pretrain/Learning Rate": 3.8381328761379066e-05, "Full-pretrain/Loss": 1.9678330421447754, "Full-pretrain/Loss (Raw)": 1.739328384399414, "Full-pretrain/Step": 3248, "Full-pretrain/Step Time": 19.55765121243894} +{"Full-pretrain/Learning Rate": 3.837415588912018e-05, "Full-pretrain/Loss": 1.9669618606567383, "Full-pretrain/Loss (Raw)": 1.983920693397522, "Full-pretrain/Step": 3249, "Full-pretrain/Step Time": 19.60406905412674} +{"Full-pretrain/Learning Rate": 3.836698147415711e-05, "Full-pretrain/Loss": 1.9608184099197388, "Full-pretrain/Loss (Raw)": 2.0325565338134766, "Full-pretrain/Step": 3250, "Full-pretrain/Step Time": 19.635600613430142} +{"Full-pretrain/Learning Rate": 3.835980551731743e-05, "Full-pretrain/Loss": 1.9631321430206299, "Full-pretrain/Loss (Raw)": 2.0115630626678467, "Full-pretrain/Step": 3251, "Full-pretrain/Step Time": 19.65279678441584} +{"Full-pretrain/Learning Rate": 3.835262801942887e-05, "Full-pretrain/Loss": 1.9666045904159546, "Full-pretrain/Loss (Raw)": 2.0962653160095215, "Full-pretrain/Step": 3252, "Full-pretrain/Step Time": 19.69488773867488} +{"Full-pretrain/Learning Rate": 3.834544898131937e-05, "Full-pretrain/Loss": 1.9642986059188843, "Full-pretrain/Loss (Raw)": 2.1131176948547363, "Full-pretrain/Step": 3253, "Full-pretrain/Step Time": 19.733091339468956} +{"Full-pretrain/Learning Rate": 3.833826840381701e-05, "Full-pretrain/Loss": 1.9628831148147583, "Full-pretrain/Loss (Raw)": 1.922680139541626, "Full-pretrain/Step": 3254, "Full-pretrain/Step Time": 19.755094865337014} +{"Full-pretrain/Learning Rate": 3.833108628775009e-05, "Full-pretrain/Loss": 1.9655447006225586, "Full-pretrain/Loss (Raw)": 2.040945291519165, "Full-pretrain/Step": 3255, "Full-pretrain/Step Time": 19.786282958462834} +{"Full-pretrain/Learning Rate": 3.832390263394704e-05, "Full-pretrain/Loss": 1.9561467170715332, "Full-pretrain/Loss (Raw)": 1.8233916759490967, "Full-pretrain/Step": 3256, "Full-pretrain/Step Time": 19.81829564087093} +{"Full-pretrain/Learning Rate": 3.8316717443236504e-05, "Full-pretrain/Loss": 1.9558759927749634, "Full-pretrain/Loss (Raw)": 2.0240139961242676, "Full-pretrain/Step": 3257, "Full-pretrain/Step Time": 19.843581400811672} +{"Full-pretrain/Learning Rate": 3.830953071644729e-05, "Full-pretrain/Loss": 1.968858242034912, "Full-pretrain/Loss (Raw)": 2.371032238006592, "Full-pretrain/Step": 3258, "Full-pretrain/Step Time": 19.87861638329923} +{"Full-pretrain/Learning Rate": 3.830234245440839e-05, "Full-pretrain/Loss": 1.9778332710266113, "Full-pretrain/Loss (Raw)": 2.123137950897217, "Full-pretrain/Step": 3259, "Full-pretrain/Step Time": 19.91355556063354} +{"Full-pretrain/Learning Rate": 3.8295152657948963e-05, "Full-pretrain/Loss": 1.9794747829437256, "Full-pretrain/Loss (Raw)": 1.8398947715759277, "Full-pretrain/Step": 3260, "Full-pretrain/Step Time": 19.942630166187882} +{"Full-pretrain/Learning Rate": 3.828796132789835e-05, "Full-pretrain/Loss": 1.9759975671768188, "Full-pretrain/Loss (Raw)": 1.8079164028167725, "Full-pretrain/Step": 3261, "Full-pretrain/Step Time": 19.966576239094138} +{"Full-pretrain/Learning Rate": 3.8280768465086066e-05, "Full-pretrain/Loss": 1.9801278114318848, "Full-pretrain/Loss (Raw)": 1.8927260637283325, "Full-pretrain/Step": 3262, "Full-pretrain/Step Time": 19.996919505298138} +{"Full-pretrain/Learning Rate": 3.827357407034181e-05, "Full-pretrain/Loss": 1.980170726776123, "Full-pretrain/Loss (Raw)": 1.829249382019043, "Full-pretrain/Step": 3263, "Full-pretrain/Step Time": 20.02056834846735} +{"Full-pretrain/Learning Rate": 3.826637814449544e-05, "Full-pretrain/Loss": 1.9941400289535522, "Full-pretrain/Loss (Raw)": 2.0338892936706543, "Full-pretrain/Step": 3264, "Full-pretrain/Step Time": 20.05239707417786} +{"Full-pretrain/Learning Rate": 3.825918068837702e-05, "Full-pretrain/Loss": 1.9930355548858643, "Full-pretrain/Loss (Raw)": 1.9415425062179565, "Full-pretrain/Step": 3265, "Full-pretrain/Step Time": 20.075564961880445} +{"Full-pretrain/Learning Rate": 3.825198170281677e-05, "Full-pretrain/Loss": 1.9919099807739258, "Full-pretrain/Loss (Raw)": 2.051588296890259, "Full-pretrain/Step": 3266, "Full-pretrain/Step Time": 20.11169664375484} +{"Full-pretrain/Learning Rate": 3.8244781188645084e-05, "Full-pretrain/Loss": 1.9992425441741943, "Full-pretrain/Loss (Raw)": 2.1513895988464355, "Full-pretrain/Step": 3267, "Full-pretrain/Step Time": 20.131741151213646} +{"Full-pretrain/Learning Rate": 3.823757914669254e-05, "Full-pretrain/Loss": 1.996825933456421, "Full-pretrain/Loss (Raw)": 2.015063524246216, "Full-pretrain/Step": 3268, "Full-pretrain/Step Time": 20.157142125070095} +{"Full-pretrain/Learning Rate": 3.8230375577789895e-05, "Full-pretrain/Loss": 1.9994690418243408, "Full-pretrain/Loss (Raw)": 2.1468920707702637, "Full-pretrain/Step": 3269, "Full-pretrain/Step Time": 20.191725037992} +{"Full-pretrain/Learning Rate": 3.8223170482768076e-05, "Full-pretrain/Loss": 1.9967278242111206, "Full-pretrain/Loss (Raw)": 1.9522180557250977, "Full-pretrain/Step": 3270, "Full-pretrain/Step Time": 20.21256659179926} +{"Full-pretrain/Learning Rate": 3.821596386245819e-05, "Full-pretrain/Loss": 1.992846131324768, "Full-pretrain/Loss (Raw)": 1.8482688665390015, "Full-pretrain/Step": 3271, "Full-pretrain/Step Time": 20.231627508997917} +{"Full-pretrain/Learning Rate": 3.8208755717691514e-05, "Full-pretrain/Loss": 1.9938602447509766, "Full-pretrain/Loss (Raw)": 1.9119330644607544, "Full-pretrain/Step": 3272, "Full-pretrain/Step Time": 20.251939672976732} +{"Full-pretrain/Learning Rate": 3.820154604929952e-05, "Full-pretrain/Loss": 1.98453950881958, "Full-pretrain/Loss (Raw)": 1.8511662483215332, "Full-pretrain/Step": 3273, "Full-pretrain/Step Time": 20.283404177054763} +{"Full-pretrain/Learning Rate": 3.819433485811382e-05, "Full-pretrain/Loss": 1.9796849489212036, "Full-pretrain/Loss (Raw)": 1.941715955734253, "Full-pretrain/Step": 3274, "Full-pretrain/Step Time": 20.309043485671282} +{"Full-pretrain/Learning Rate": 3.8187122144966225e-05, "Full-pretrain/Loss": 1.9785963296890259, "Full-pretrain/Loss (Raw)": 2.1177401542663574, "Full-pretrain/Step": 3275, "Full-pretrain/Step Time": 20.331292264163494} +{"Full-pretrain/Learning Rate": 3.8179907910688736e-05, "Full-pretrain/Loss": 1.9831279516220093, "Full-pretrain/Loss (Raw)": 1.9963653087615967, "Full-pretrain/Step": 3276, "Full-pretrain/Step Time": 20.347340473905206} +{"Full-pretrain/Learning Rate": 3.817269215611349e-05, "Full-pretrain/Loss": 1.9859793186187744, "Full-pretrain/Loss (Raw)": 1.9876104593276978, "Full-pretrain/Step": 3277, "Full-pretrain/Step Time": 20.36620336957276} +{"Full-pretrain/Learning Rate": 3.816547488207284e-05, "Full-pretrain/Loss": 1.9791228771209717, "Full-pretrain/Loss (Raw)": 1.8943167924880981, "Full-pretrain/Step": 3278, "Full-pretrain/Step Time": 20.386175151914358} +{"Full-pretrain/Learning Rate": 3.815825608939928e-05, "Full-pretrain/Loss": 1.9846023321151733, "Full-pretrain/Loss (Raw)": 2.0138349533081055, "Full-pretrain/Step": 3279, "Full-pretrain/Step Time": 20.396285727620125} +{"Full-pretrain/Learning Rate": 3.815103577892551e-05, "Full-pretrain/Loss": 1.9830198287963867, "Full-pretrain/Loss (Raw)": 1.688685417175293, "Full-pretrain/Step": 3280, "Full-pretrain/Step Time": 20.41268397308886} +{"Full-pretrain/Learning Rate": 3.8143813951484396e-05, "Full-pretrain/Loss": 1.990570068359375, "Full-pretrain/Loss (Raw)": 2.225532054901123, "Full-pretrain/Step": 3281, "Full-pretrain/Step Time": 20.43771816790104} +{"Full-pretrain/Learning Rate": 3.813659060790895e-05, "Full-pretrain/Loss": 1.982038140296936, "Full-pretrain/Loss (Raw)": 1.7595322132110596, "Full-pretrain/Step": 3282, "Full-pretrain/Step Time": 20.451182501390576} +{"Full-pretrain/Learning Rate": 3.81293657490324e-05, "Full-pretrain/Loss": 1.9762144088745117, "Full-pretrain/Loss (Raw)": 1.8252086639404297, "Full-pretrain/Step": 3283, "Full-pretrain/Step Time": 20.468407303094864} +{"Full-pretrain/Learning Rate": 3.812213937568811e-05, "Full-pretrain/Loss": 1.9724847078323364, "Full-pretrain/Loss (Raw)": 1.976910948753357, "Full-pretrain/Step": 3284, "Full-pretrain/Step Time": 20.474329732358456} +{"Full-pretrain/Learning Rate": 3.811491148870967e-05, "Full-pretrain/Loss": 1.958756923675537, "Full-pretrain/Loss (Raw)": 1.6738313436508179, "Full-pretrain/Step": 3285, "Full-pretrain/Step Time": 20.48617247864604} +{"Full-pretrain/Learning Rate": 3.8107682088930794e-05, "Full-pretrain/Loss": 1.9565117359161377, "Full-pretrain/Loss (Raw)": 1.850832223892212, "Full-pretrain/Step": 3286, "Full-pretrain/Step Time": 20.51192133501172} +{"Full-pretrain/Learning Rate": 3.81004511771854e-05, "Full-pretrain/Loss": 1.956658124923706, "Full-pretrain/Loss (Raw)": 2.04563045501709, "Full-pretrain/Step": 3287, "Full-pretrain/Step Time": 20.545828180387616} +{"Full-pretrain/Learning Rate": 3.809321875430756e-05, "Full-pretrain/Loss": 1.9673435688018799, "Full-pretrain/Loss (Raw)": 2.1653270721435547, "Full-pretrain/Step": 3288, "Full-pretrain/Step Time": 20.59737559594214} +{"Full-pretrain/Learning Rate": 3.808598482113154e-05, "Full-pretrain/Loss": 1.9600108861923218, "Full-pretrain/Loss (Raw)": 1.789368987083435, "Full-pretrain/Step": 3289, "Full-pretrain/Step Time": 20.629561237990856} +{"Full-pretrain/Learning Rate": 3.8078749378491766e-05, "Full-pretrain/Loss": 1.9458117485046387, "Full-pretrain/Loss (Raw)": 1.9166582822799683, "Full-pretrain/Step": 3290, "Full-pretrain/Step Time": 20.65814331918955} +{"Full-pretrain/Learning Rate": 3.8071512427222855e-05, "Full-pretrain/Loss": 1.9536904096603394, "Full-pretrain/Loss (Raw)": 2.3752553462982178, "Full-pretrain/Step": 3291, "Full-pretrain/Step Time": 20.697975378483534} +{"Full-pretrain/Learning Rate": 3.8064273968159574e-05, "Full-pretrain/Loss": 1.9535105228424072, "Full-pretrain/Loss (Raw)": 1.834136962890625, "Full-pretrain/Step": 3292, "Full-pretrain/Step Time": 20.73647110722959} +{"Full-pretrain/Learning Rate": 3.805703400213688e-05, "Full-pretrain/Loss": 1.9641414880752563, "Full-pretrain/Loss (Raw)": 2.1481080055236816, "Full-pretrain/Step": 3293, "Full-pretrain/Step Time": 20.76501953229308} +{"Full-pretrain/Learning Rate": 3.8049792529989905e-05, "Full-pretrain/Loss": 1.9767837524414062, "Full-pretrain/Loss (Raw)": 2.29727840423584, "Full-pretrain/Step": 3294, "Full-pretrain/Step Time": 20.79627557657659} +{"Full-pretrain/Learning Rate": 3.8042549552553955e-05, "Full-pretrain/Loss": 1.9827475547790527, "Full-pretrain/Loss (Raw)": 2.0200905799865723, "Full-pretrain/Step": 3295, "Full-pretrain/Step Time": 20.819808026775718} +{"Full-pretrain/Learning Rate": 3.803530507066448e-05, "Full-pretrain/Loss": 1.9908249378204346, "Full-pretrain/Loss (Raw)": 2.292365789413452, "Full-pretrain/Step": 3296, "Full-pretrain/Step Time": 20.849571293219924} +{"Full-pretrain/Learning Rate": 3.8028059085157166e-05, "Full-pretrain/Loss": 1.9931044578552246, "Full-pretrain/Loss (Raw)": 2.0144858360290527, "Full-pretrain/Step": 3297, "Full-pretrain/Step Time": 20.87796421162784} +{"Full-pretrain/Learning Rate": 3.80208115968678e-05, "Full-pretrain/Loss": 1.9859685897827148, "Full-pretrain/Loss (Raw)": 1.8232421875, "Full-pretrain/Step": 3298, "Full-pretrain/Step Time": 20.91423873603344} +{"Full-pretrain/Learning Rate": 3.8013562606632394e-05, "Full-pretrain/Loss": 1.9804024696350098, "Full-pretrain/Loss (Raw)": 1.9732704162597656, "Full-pretrain/Step": 3299, "Full-pretrain/Step Time": 20.947052827104926} +{"Full-pretrain/Learning Rate": 3.800631211528712e-05, "Full-pretrain/Loss": 1.9730656147003174, "Full-pretrain/Loss (Raw)": 1.7802839279174805, "Full-pretrain/Step": 3300, "Full-pretrain/Step Time": 20.9767611566931} +{"Full-pretrain/Learning Rate": 3.799906012366832e-05, "Full-pretrain/Loss": 1.9632320404052734, "Full-pretrain/Loss (Raw)": 1.8322179317474365, "Full-pretrain/Step": 3301, "Full-pretrain/Step Time": 21.003033926710486} +{"Full-pretrain/Learning Rate": 3.799180663261249e-05, "Full-pretrain/Loss": 1.9604321718215942, "Full-pretrain/Loss (Raw)": 1.8626222610473633, "Full-pretrain/Step": 3302, "Full-pretrain/Step Time": 21.03340708464384} +{"Full-pretrain/Learning Rate": 3.798455164295633e-05, "Full-pretrain/Loss": 1.9619593620300293, "Full-pretrain/Loss (Raw)": 1.8971397876739502, "Full-pretrain/Step": 3303, "Full-pretrain/Step Time": 21.04935763962567} +{"Full-pretrain/Learning Rate": 3.797729515553671e-05, "Full-pretrain/Loss": 1.9626518487930298, "Full-pretrain/Loss (Raw)": 1.934093952178955, "Full-pretrain/Step": 3304, "Full-pretrain/Step Time": 21.092716140672565} +{"Full-pretrain/Learning Rate": 3.7970037171190656e-05, "Full-pretrain/Loss": 1.9625903367996216, "Full-pretrain/Loss (Raw)": 1.849198579788208, "Full-pretrain/Step": 3305, "Full-pretrain/Step Time": 21.123997393995523} +{"Full-pretrain/Learning Rate": 3.796277769075536e-05, "Full-pretrain/Loss": 1.9630820751190186, "Full-pretrain/Loss (Raw)": 1.95745050907135, "Full-pretrain/Step": 3306, "Full-pretrain/Step Time": 21.144814217463136} +{"Full-pretrain/Learning Rate": 3.7955516715068226e-05, "Full-pretrain/Loss": 1.9544790983200073, "Full-pretrain/Loss (Raw)": 1.8424465656280518, "Full-pretrain/Step": 3307, "Full-pretrain/Step Time": 21.161794843152165} +{"Full-pretrain/Learning Rate": 3.7948254244966785e-05, "Full-pretrain/Loss": 1.956133246421814, "Full-pretrain/Loss (Raw)": 2.0492968559265137, "Full-pretrain/Step": 3308, "Full-pretrain/Step Time": 21.173793299123645} +{"Full-pretrain/Learning Rate": 3.794099028128877e-05, "Full-pretrain/Loss": 1.956917643547058, "Full-pretrain/Loss (Raw)": 2.0127124786376953, "Full-pretrain/Step": 3309, "Full-pretrain/Step Time": 21.19947157613933} +{"Full-pretrain/Learning Rate": 3.793372482487207e-05, "Full-pretrain/Loss": 1.9565962553024292, "Full-pretrain/Loss (Raw)": 1.8840333223342896, "Full-pretrain/Step": 3310, "Full-pretrain/Step Time": 21.217716122046113} +{"Full-pretrain/Learning Rate": 3.792645787655476e-05, "Full-pretrain/Loss": 1.958204984664917, "Full-pretrain/Loss (Raw)": 2.065314292907715, "Full-pretrain/Step": 3311, "Full-pretrain/Step Time": 21.229674631729722} +{"Full-pretrain/Learning Rate": 3.7919189437175074e-05, "Full-pretrain/Loss": 1.967970848083496, "Full-pretrain/Loss (Raw)": 2.0011892318725586, "Full-pretrain/Step": 3312, "Full-pretrain/Step Time": 21.238495966419578} +{"Full-pretrain/Learning Rate": 3.791191950757143e-05, "Full-pretrain/Loss": 1.957253336906433, "Full-pretrain/Loss (Raw)": 1.8825733661651611, "Full-pretrain/Step": 3313, "Full-pretrain/Step Time": 21.2505321521312} +{"Full-pretrain/Learning Rate": 3.790464808858241e-05, "Full-pretrain/Loss": 1.9718258380889893, "Full-pretrain/Loss (Raw)": 2.225850820541382, "Full-pretrain/Step": 3314, "Full-pretrain/Step Time": 21.259814420714974} +{"Full-pretrain/Learning Rate": 3.7897375181046766e-05, "Full-pretrain/Loss": 1.9796245098114014, "Full-pretrain/Loss (Raw)": 2.074770212173462, "Full-pretrain/Step": 3315, "Full-pretrain/Step Time": 21.262560039758682} +{"Full-pretrain/Learning Rate": 3.789010078580342e-05, "Full-pretrain/Loss": 1.9818320274353027, "Full-pretrain/Loss (Raw)": 2.0475478172302246, "Full-pretrain/Step": 3316, "Full-pretrain/Step Time": 21.265196351334453} +{"Full-pretrain/Learning Rate": 3.7882824903691484e-05, "Full-pretrain/Loss": 1.9816718101501465, "Full-pretrain/Loss (Raw)": 1.6687073707580566, "Full-pretrain/Step": 3317, "Full-pretrain/Step Time": 21.266522873193026} +{"Full-pretrain/Learning Rate": 3.7875547535550224e-05, "Full-pretrain/Loss": 1.986591100692749, "Full-pretrain/Loss (Raw)": 2.008246421813965, "Full-pretrain/Step": 3318, "Full-pretrain/Step Time": 21.267444614320993} +{"Full-pretrain/Learning Rate": 3.7868268682219076e-05, "Full-pretrain/Loss": 1.9837417602539062, "Full-pretrain/Loss (Raw)": 1.9544528722763062, "Full-pretrain/Step": 3319, "Full-pretrain/Step Time": 21.26210826076567} +{"Full-pretrain/Learning Rate": 3.786098834453766e-05, "Full-pretrain/Loss": 1.9774212837219238, "Full-pretrain/Loss (Raw)": 1.9630719423294067, "Full-pretrain/Step": 3320, "Full-pretrain/Step Time": 21.256981693208218} +{"Full-pretrain/Learning Rate": 3.785370652334577e-05, "Full-pretrain/Loss": 1.9639854431152344, "Full-pretrain/Loss (Raw)": 1.3594244718551636, "Full-pretrain/Step": 3321, "Full-pretrain/Step Time": 21.262980794534087} +{"Full-pretrain/Learning Rate": 3.784642321948333e-05, "Full-pretrain/Loss": 1.9773368835449219, "Full-pretrain/Loss (Raw)": 2.343903064727783, "Full-pretrain/Step": 3322, "Full-pretrain/Step Time": 21.260469557717443} +{"Full-pretrain/Learning Rate": 3.78391384337905e-05, "Full-pretrain/Loss": 1.9660840034484863, "Full-pretrain/Loss (Raw)": 2.015160083770752, "Full-pretrain/Step": 3323, "Full-pretrain/Step Time": 21.255205972120166} +{"Full-pretrain/Learning Rate": 3.783185216710756e-05, "Full-pretrain/Loss": 1.9656167030334473, "Full-pretrain/Loss (Raw)": 1.819183349609375, "Full-pretrain/Step": 3324, "Full-pretrain/Step Time": 21.264911007136106} +{"Full-pretrain/Learning Rate": 3.782456442027498e-05, "Full-pretrain/Loss": 1.951326847076416, "Full-pretrain/Loss (Raw)": 1.6908328533172607, "Full-pretrain/Step": 3325, "Full-pretrain/Step Time": 21.270696798339486} +{"Full-pretrain/Learning Rate": 3.78172751941334e-05, "Full-pretrain/Loss": 1.9376418590545654, "Full-pretrain/Loss (Raw)": 1.8593593835830688, "Full-pretrain/Step": 3326, "Full-pretrain/Step Time": 21.279706314206123} +{"Full-pretrain/Learning Rate": 3.780998448952363e-05, "Full-pretrain/Loss": 1.9463860988616943, "Full-pretrain/Loss (Raw)": 2.2999095916748047, "Full-pretrain/Step": 3327, "Full-pretrain/Step Time": 21.2763657476753} +{"Full-pretrain/Learning Rate": 3.7802692307286654e-05, "Full-pretrain/Loss": 1.9349684715270996, "Full-pretrain/Loss (Raw)": 1.9270001649856567, "Full-pretrain/Step": 3328, "Full-pretrain/Step Time": 21.28092517144978} +{"Full-pretrain/Learning Rate": 3.779539864826362e-05, "Full-pretrain/Loss": 1.9404921531677246, "Full-pretrain/Loss (Raw)": 2.1912424564361572, "Full-pretrain/Step": 3329, "Full-pretrain/Step Time": 21.28450951911509} +{"Full-pretrain/Learning Rate": 3.778810351329585e-05, "Full-pretrain/Loss": 1.9463437795639038, "Full-pretrain/Loss (Raw)": 2.0104942321777344, "Full-pretrain/Step": 3330, "Full-pretrain/Step Time": 21.28385705500841} +{"Full-pretrain/Learning Rate": 3.778080690322483e-05, "Full-pretrain/Loss": 1.9466724395751953, "Full-pretrain/Loss (Raw)": 1.983790397644043, "Full-pretrain/Step": 3331, "Full-pretrain/Step Time": 21.278753995895386} +{"Full-pretrain/Learning Rate": 3.7773508818892224e-05, "Full-pretrain/Loss": 1.9473886489868164, "Full-pretrain/Loss (Raw)": 1.8031978607177734, "Full-pretrain/Step": 3332, "Full-pretrain/Step Time": 21.263949137181044} +{"Full-pretrain/Learning Rate": 3.776620926113986e-05, "Full-pretrain/Loss": 1.9515409469604492, "Full-pretrain/Loss (Raw)": 1.9650930166244507, "Full-pretrain/Step": 3333, "Full-pretrain/Step Time": 21.251795718446374} +{"Full-pretrain/Learning Rate": 3.775890823080976e-05, "Full-pretrain/Loss": 1.9563359022140503, "Full-pretrain/Loss (Raw)": 2.016061782836914, "Full-pretrain/Step": 3334, "Full-pretrain/Step Time": 21.243972098454833} +{"Full-pretrain/Learning Rate": 3.7751605728744064e-05, "Full-pretrain/Loss": 1.9495244026184082, "Full-pretrain/Loss (Raw)": 1.6791709661483765, "Full-pretrain/Step": 3335, "Full-pretrain/Step Time": 21.23251200839877} +{"Full-pretrain/Learning Rate": 3.774430175578514e-05, "Full-pretrain/Loss": 1.9526782035827637, "Full-pretrain/Loss (Raw)": 2.0350191593170166, "Full-pretrain/Step": 3336, "Full-pretrain/Step Time": 21.21551650390029} +{"Full-pretrain/Learning Rate": 3.773699631277548e-05, "Full-pretrain/Loss": 1.9566880464553833, "Full-pretrain/Loss (Raw)": 1.9775105714797974, "Full-pretrain/Step": 3337, "Full-pretrain/Step Time": 21.205254400148988} +{"Full-pretrain/Learning Rate": 3.772968940055777e-05, "Full-pretrain/Loss": 1.9601088762283325, "Full-pretrain/Loss (Raw)": 2.0669145584106445, "Full-pretrain/Step": 3338, "Full-pretrain/Step Time": 21.200698420405388} +{"Full-pretrain/Learning Rate": 3.7722381019974864e-05, "Full-pretrain/Loss": 1.9569168090820312, "Full-pretrain/Loss (Raw)": 1.7403013706207275, "Full-pretrain/Step": 3339, "Full-pretrain/Step Time": 21.18853146955371} +{"Full-pretrain/Learning Rate": 3.771507117186978e-05, "Full-pretrain/Loss": 1.9472548961639404, "Full-pretrain/Loss (Raw)": 1.7401171922683716, "Full-pretrain/Step": 3340, "Full-pretrain/Step Time": 21.18769215606153} +{"Full-pretrain/Learning Rate": 3.77077598570857e-05, "Full-pretrain/Loss": 1.9410104751586914, "Full-pretrain/Loss (Raw)": 1.8128888607025146, "Full-pretrain/Step": 3341, "Full-pretrain/Step Time": 21.173648675903678} +{"Full-pretrain/Learning Rate": 3.770044707646599e-05, "Full-pretrain/Loss": 1.9448521137237549, "Full-pretrain/Loss (Raw)": 2.006965160369873, "Full-pretrain/Step": 3342, "Full-pretrain/Step Time": 21.169005304574966} +{"Full-pretrain/Learning Rate": 3.7693132830854185e-05, "Full-pretrain/Loss": 1.9486792087554932, "Full-pretrain/Loss (Raw)": 2.1877827644348145, "Full-pretrain/Step": 3343, "Full-pretrain/Step Time": 21.162887908518314} +{"Full-pretrain/Learning Rate": 3.768581712109395e-05, "Full-pretrain/Loss": 1.9441509246826172, "Full-pretrain/Loss (Raw)": 1.856284737586975, "Full-pretrain/Step": 3344, "Full-pretrain/Step Time": 21.150211669504642} +{"Full-pretrain/Learning Rate": 3.767849994802918e-05, "Full-pretrain/Loss": 1.9547679424285889, "Full-pretrain/Loss (Raw)": 2.2223153114318848, "Full-pretrain/Step": 3345, "Full-pretrain/Step Time": 21.147007567808032} +{"Full-pretrain/Learning Rate": 3.767118131250388e-05, "Full-pretrain/Loss": 1.9512395858764648, "Full-pretrain/Loss (Raw)": 2.112948417663574, "Full-pretrain/Step": 3346, "Full-pretrain/Step Time": 21.138946687802672} +{"Full-pretrain/Learning Rate": 3.7663861215362284e-05, "Full-pretrain/Loss": 1.9567551612854004, "Full-pretrain/Loss (Raw)": 2.2512705326080322, "Full-pretrain/Step": 3347, "Full-pretrain/Step Time": 21.12513430789113} +{"Full-pretrain/Learning Rate": 3.765653965744874e-05, "Full-pretrain/Loss": 1.9511711597442627, "Full-pretrain/Loss (Raw)": 1.8688561916351318, "Full-pretrain/Step": 3348, "Full-pretrain/Step Time": 21.11036578938365} +{"Full-pretrain/Learning Rate": 3.76492166396078e-05, "Full-pretrain/Loss": 1.9649794101715088, "Full-pretrain/Loss (Raw)": 2.1105732917785645, "Full-pretrain/Step": 3349, "Full-pretrain/Step Time": 21.09148557111621} +{"Full-pretrain/Learning Rate": 3.7641892162684164e-05, "Full-pretrain/Loss": 1.962633728981018, "Full-pretrain/Loss (Raw)": 1.93318510055542, "Full-pretrain/Step": 3350, "Full-pretrain/Step Time": 21.063185576349497} +{"Full-pretrain/Learning Rate": 3.7634566227522713e-05, "Full-pretrain/Loss": 1.9671423435211182, "Full-pretrain/Loss (Raw)": 2.0987253189086914, "Full-pretrain/Step": 3351, "Full-pretrain/Step Time": 21.03738790564239} +{"Full-pretrain/Learning Rate": 3.762723883496848e-05, "Full-pretrain/Loss": 1.9656058549880981, "Full-pretrain/Loss (Raw)": 1.913906216621399, "Full-pretrain/Step": 3352, "Full-pretrain/Step Time": 21.014442985877395} +{"Full-pretrain/Learning Rate": 3.761990998586669e-05, "Full-pretrain/Loss": 1.987807035446167, "Full-pretrain/Loss (Raw)": 2.0698611736297607, "Full-pretrain/Step": 3353, "Full-pretrain/Step Time": 20.992465391755104} +{"Full-pretrain/Learning Rate": 3.761257968106271e-05, "Full-pretrain/Loss": 1.982014536857605, "Full-pretrain/Loss (Raw)": 2.158541202545166, "Full-pretrain/Step": 3354, "Full-pretrain/Step Time": 20.96429923735559} +{"Full-pretrain/Learning Rate": 3.760524792140211e-05, "Full-pretrain/Loss": 1.983551025390625, "Full-pretrain/Loss (Raw)": 2.064326763153076, "Full-pretrain/Step": 3355, "Full-pretrain/Step Time": 20.93800327554345} +{"Full-pretrain/Learning Rate": 3.759791470773058e-05, "Full-pretrain/Loss": 1.9922499656677246, "Full-pretrain/Loss (Raw)": 2.097550392150879, "Full-pretrain/Step": 3356, "Full-pretrain/Step Time": 20.913876766338944} +{"Full-pretrain/Learning Rate": 3.759058004089402e-05, "Full-pretrain/Loss": 2.0006957054138184, "Full-pretrain/Loss (Raw)": 1.9610955715179443, "Full-pretrain/Step": 3357, "Full-pretrain/Step Time": 20.878608383238316} +{"Full-pretrain/Learning Rate": 3.758324392173849e-05, "Full-pretrain/Loss": 2.0114758014678955, "Full-pretrain/Loss (Raw)": 2.20432710647583, "Full-pretrain/Step": 3358, "Full-pretrain/Step Time": 20.846987234428525} +{"Full-pretrain/Learning Rate": 3.7575906351110176e-05, "Full-pretrain/Loss": 2.001800537109375, "Full-pretrain/Loss (Raw)": 1.9903042316436768, "Full-pretrain/Step": 3359, "Full-pretrain/Step Time": 20.830273889005184} +{"Full-pretrain/Learning Rate": 3.756856732985549e-05, "Full-pretrain/Loss": 2.0134434700012207, "Full-pretrain/Loss (Raw)": 2.2995710372924805, "Full-pretrain/Step": 3360, "Full-pretrain/Step Time": 20.802274223417044} +{"Full-pretrain/Learning Rate": 3.756122685882098e-05, "Full-pretrain/Loss": 2.004124164581299, "Full-pretrain/Loss (Raw)": 1.8930225372314453, "Full-pretrain/Step": 3361, "Full-pretrain/Step Time": 20.767815869301558} +{"Full-pretrain/Learning Rate": 3.755388493885337e-05, "Full-pretrain/Loss": 2.0073776245117188, "Full-pretrain/Loss (Raw)": 2.1146035194396973, "Full-pretrain/Step": 3362, "Full-pretrain/Step Time": 20.737899873405695} +{"Full-pretrain/Learning Rate": 3.7546541570799534e-05, "Full-pretrain/Loss": 2.002920627593994, "Full-pretrain/Loss (Raw)": 1.8411738872528076, "Full-pretrain/Step": 3363, "Full-pretrain/Step Time": 20.713141079992056} +{"Full-pretrain/Learning Rate": 3.753919675550654e-05, "Full-pretrain/Loss": 2.0134596824645996, "Full-pretrain/Loss (Raw)": 2.140446662902832, "Full-pretrain/Step": 3364, "Full-pretrain/Step Time": 20.675016118213534} +{"Full-pretrain/Learning Rate": 3.753185049382162e-05, "Full-pretrain/Loss": 2.0158162117004395, "Full-pretrain/Loss (Raw)": 2.040498733520508, "Full-pretrain/Step": 3365, "Full-pretrain/Step Time": 20.629893397912383} +{"Full-pretrain/Learning Rate": 3.752450278659214e-05, "Full-pretrain/Loss": 2.021111011505127, "Full-pretrain/Loss (Raw)": 2.185492515563965, "Full-pretrain/Step": 3366, "Full-pretrain/Step Time": 20.596175380051136} +{"Full-pretrain/Learning Rate": 3.7517153634665665e-05, "Full-pretrain/Loss": 2.0295286178588867, "Full-pretrain/Loss (Raw)": 1.948537826538086, "Full-pretrain/Step": 3367, "Full-pretrain/Step Time": 20.56523821502924} +{"Full-pretrain/Learning Rate": 3.750980303888991e-05, "Full-pretrain/Loss": 2.036648988723755, "Full-pretrain/Loss (Raw)": 2.262866973876953, "Full-pretrain/Step": 3368, "Full-pretrain/Step Time": 20.538094924762845} +{"Full-pretrain/Learning Rate": 3.750245100011278e-05, "Full-pretrain/Loss": 2.040963649749756, "Full-pretrain/Loss (Raw)": 2.1155788898468018, "Full-pretrain/Step": 3369, "Full-pretrain/Step Time": 20.500617753714323} +{"Full-pretrain/Learning Rate": 3.749509751918232e-05, "Full-pretrain/Loss": 2.036318063735962, "Full-pretrain/Loss (Raw)": 1.9182546138763428, "Full-pretrain/Step": 3370, "Full-pretrain/Step Time": 20.46436433121562} +{"Full-pretrain/Learning Rate": 3.748774259694675e-05, "Full-pretrain/Loss": 2.0449328422546387, "Full-pretrain/Loss (Raw)": 2.0159780979156494, "Full-pretrain/Step": 3371, "Full-pretrain/Step Time": 20.426601514220238} +{"Full-pretrain/Learning Rate": 3.748038623425446e-05, "Full-pretrain/Loss": 2.052828311920166, "Full-pretrain/Loss (Raw)": 1.9927653074264526, "Full-pretrain/Step": 3372, "Full-pretrain/Step Time": 20.386818036437035} +{"Full-pretrain/Learning Rate": 3.747302843195401e-05, "Full-pretrain/Loss": 2.063450574874878, "Full-pretrain/Loss (Raw)": 2.1528050899505615, "Full-pretrain/Step": 3373, "Full-pretrain/Step Time": 20.334641667082906} +{"Full-pretrain/Learning Rate": 3.746566919089411e-05, "Full-pretrain/Loss": 2.0657787322998047, "Full-pretrain/Loss (Raw)": 2.0814707279205322, "Full-pretrain/Step": 3374, "Full-pretrain/Step Time": 20.304917238652706} +{"Full-pretrain/Learning Rate": 3.745830851192364e-05, "Full-pretrain/Loss": 2.0577261447906494, "Full-pretrain/Loss (Raw)": 1.930100440979004, "Full-pretrain/Step": 3375, "Full-pretrain/Step Time": 20.2608094625175} +{"Full-pretrain/Learning Rate": 3.745094639589167e-05, "Full-pretrain/Loss": 2.065168857574463, "Full-pretrain/Loss (Raw)": 2.0944504737854004, "Full-pretrain/Step": 3376, "Full-pretrain/Step Time": 20.22657591663301} +{"Full-pretrain/Learning Rate": 3.744358284364741e-05, "Full-pretrain/Loss": 2.0596156120300293, "Full-pretrain/Loss (Raw)": 2.0446043014526367, "Full-pretrain/Step": 3377, "Full-pretrain/Step Time": 20.176085049286485} +{"Full-pretrain/Learning Rate": 3.743621785604024e-05, "Full-pretrain/Loss": 2.063220262527466, "Full-pretrain/Loss (Raw)": 2.2282981872558594, "Full-pretrain/Step": 3378, "Full-pretrain/Step Time": 20.143334727734327} +{"Full-pretrain/Learning Rate": 3.742885143391971e-05, "Full-pretrain/Loss": 2.0545654296875, "Full-pretrain/Loss (Raw)": 1.974319577217102, "Full-pretrain/Step": 3379, "Full-pretrain/Step Time": 20.118656277656555} +{"Full-pretrain/Learning Rate": 3.7421483578135536e-05, "Full-pretrain/Loss": 2.0585670471191406, "Full-pretrain/Loss (Raw)": 1.996908187866211, "Full-pretrain/Step": 3380, "Full-pretrain/Step Time": 20.08065523393452} +{"Full-pretrain/Learning Rate": 3.7414114289537596e-05, "Full-pretrain/Loss": 2.0577902793884277, "Full-pretrain/Loss (Raw)": 2.0857181549072266, "Full-pretrain/Step": 3381, "Full-pretrain/Step Time": 20.039282394573092} +{"Full-pretrain/Learning Rate": 3.740674356897593e-05, "Full-pretrain/Loss": 2.0580785274505615, "Full-pretrain/Loss (Raw)": 1.942402958869934, "Full-pretrain/Step": 3382, "Full-pretrain/Step Time": 20.013205701485276} +{"Full-pretrain/Learning Rate": 3.739937141730076e-05, "Full-pretrain/Loss": 2.0524518489837646, "Full-pretrain/Loss (Raw)": 1.9186716079711914, "Full-pretrain/Step": 3383, "Full-pretrain/Step Time": 19.98257951810956} +{"Full-pretrain/Learning Rate": 3.7391997835362455e-05, "Full-pretrain/Loss": 2.0567283630371094, "Full-pretrain/Loss (Raw)": 2.0507540702819824, "Full-pretrain/Step": 3384, "Full-pretrain/Step Time": 19.95239770039916} +{"Full-pretrain/Learning Rate": 3.7384622824011555e-05, "Full-pretrain/Loss": 2.0564355850219727, "Full-pretrain/Loss (Raw)": 2.060497999191284, "Full-pretrain/Step": 3385, "Full-pretrain/Step Time": 19.924949863925576} +{"Full-pretrain/Learning Rate": 3.737724638409876e-05, "Full-pretrain/Loss": 2.051189661026001, "Full-pretrain/Loss (Raw)": 1.9906673431396484, "Full-pretrain/Step": 3386, "Full-pretrain/Step Time": 19.88734987936914} +{"Full-pretrain/Learning Rate": 3.736986851647495e-05, "Full-pretrain/Loss": 2.044614791870117, "Full-pretrain/Loss (Raw)": 1.8539326190948486, "Full-pretrain/Step": 3387, "Full-pretrain/Step Time": 19.856548415496945} +{"Full-pretrain/Learning Rate": 3.736248922199115e-05, "Full-pretrain/Loss": 2.0408287048339844, "Full-pretrain/Loss (Raw)": 1.9763919115066528, "Full-pretrain/Step": 3388, "Full-pretrain/Step Time": 19.826521368697286} +{"Full-pretrain/Learning Rate": 3.735510850149856e-05, "Full-pretrain/Loss": 2.040438175201416, "Full-pretrain/Loss (Raw)": 1.948608160018921, "Full-pretrain/Step": 3389, "Full-pretrain/Step Time": 19.802232805639505} +{"Full-pretrain/Learning Rate": 3.734772635584855e-05, "Full-pretrain/Loss": 2.0334341526031494, "Full-pretrain/Loss (Raw)": 1.9801915884017944, "Full-pretrain/Step": 3390, "Full-pretrain/Step Time": 19.773653019219637} +{"Full-pretrain/Learning Rate": 3.7340342785892646e-05, "Full-pretrain/Loss": 2.0339252948760986, "Full-pretrain/Loss (Raw)": 2.006024122238159, "Full-pretrain/Step": 3391, "Full-pretrain/Step Time": 19.75024509243667} +{"Full-pretrain/Learning Rate": 3.7332957792482534e-05, "Full-pretrain/Loss": 2.0170273780822754, "Full-pretrain/Loss (Raw)": 1.7588365077972412, "Full-pretrain/Step": 3392, "Full-pretrain/Step Time": 19.715564792975783} +{"Full-pretrain/Learning Rate": 3.7325571376470076e-05, "Full-pretrain/Loss": 2.0262393951416016, "Full-pretrain/Loss (Raw)": 2.187809705734253, "Full-pretrain/Step": 3393, "Full-pretrain/Step Time": 19.697686694562435} +{"Full-pretrain/Learning Rate": 3.731818353870729e-05, "Full-pretrain/Loss": 2.0194644927978516, "Full-pretrain/Loss (Raw)": 1.897809386253357, "Full-pretrain/Step": 3394, "Full-pretrain/Step Time": 19.661644991487265} +{"Full-pretrain/Learning Rate": 3.731079428004637e-05, "Full-pretrain/Loss": 2.0157713890075684, "Full-pretrain/Loss (Raw)": 1.7229962348937988, "Full-pretrain/Step": 3395, "Full-pretrain/Step Time": 19.636660363525152} +{"Full-pretrain/Learning Rate": 3.7303403601339644e-05, "Full-pretrain/Loss": 2.0071380138397217, "Full-pretrain/Loss (Raw)": 1.8641715049743652, "Full-pretrain/Step": 3396, "Full-pretrain/Step Time": 19.611077478155494} +{"Full-pretrain/Learning Rate": 3.729601150343964e-05, "Full-pretrain/Loss": 1.9990532398223877, "Full-pretrain/Loss (Raw)": 1.78178870677948, "Full-pretrain/Step": 3397, "Full-pretrain/Step Time": 19.575879568234086} +{"Full-pretrain/Learning Rate": 3.728861798719903e-05, "Full-pretrain/Loss": 1.9992597103118896, "Full-pretrain/Loss (Raw)": 2.1921005249023438, "Full-pretrain/Step": 3398, "Full-pretrain/Step Time": 19.552268486469984} +{"Full-pretrain/Learning Rate": 3.728122305347066e-05, "Full-pretrain/Loss": 2.0004940032958984, "Full-pretrain/Loss (Raw)": 1.9880350828170776, "Full-pretrain/Step": 3399, "Full-pretrain/Step Time": 19.533077942207456} +{"Full-pretrain/Learning Rate": 3.727382670310753e-05, "Full-pretrain/Loss": 2.003121852874756, "Full-pretrain/Loss (Raw)": 2.3469555377960205, "Full-pretrain/Step": 3400, "Full-pretrain/Step Time": 19.50613364763558} +{"Full-pretrain/Learning Rate": 3.726642893696279e-05, "Full-pretrain/Loss": 1.998744010925293, "Full-pretrain/Loss (Raw)": 1.975488305091858, "Full-pretrain/Step": 3401, "Full-pretrain/Step Time": 19.481394816190004} +{"Full-pretrain/Learning Rate": 3.7259029755889786e-05, "Full-pretrain/Loss": 2.001382350921631, "Full-pretrain/Loss (Raw)": 2.002680778503418, "Full-pretrain/Step": 3402, "Full-pretrain/Step Time": 19.449523095041513} +{"Full-pretrain/Learning Rate": 3.725162916074201e-05, "Full-pretrain/Loss": 1.9985209703445435, "Full-pretrain/Loss (Raw)": 1.9244182109832764, "Full-pretrain/Step": 3403, "Full-pretrain/Step Time": 19.42074334435165} +{"Full-pretrain/Learning Rate": 3.7244227152373115e-05, "Full-pretrain/Loss": 2.0028152465820312, "Full-pretrain/Loss (Raw)": 2.130178451538086, "Full-pretrain/Step": 3404, "Full-pretrain/Step Time": 19.396611804142594} +{"Full-pretrain/Learning Rate": 3.7236823731636924e-05, "Full-pretrain/Loss": 1.9956090450286865, "Full-pretrain/Loss (Raw)": 1.922206163406372, "Full-pretrain/Step": 3405, "Full-pretrain/Step Time": 19.377486780285835} +{"Full-pretrain/Learning Rate": 3.722941889938741e-05, "Full-pretrain/Loss": 1.9826292991638184, "Full-pretrain/Loss (Raw)": 1.6661231517791748, "Full-pretrain/Step": 3406, "Full-pretrain/Step Time": 19.357705334201455} +{"Full-pretrain/Learning Rate": 3.7222012656478733e-05, "Full-pretrain/Loss": 1.9901034832000732, "Full-pretrain/Loss (Raw)": 2.169273853302002, "Full-pretrain/Step": 3407, "Full-pretrain/Step Time": 19.335120368748903} +{"Full-pretrain/Learning Rate": 3.7214605003765185e-05, "Full-pretrain/Loss": 1.9888343811035156, "Full-pretrain/Loss (Raw)": 2.0538370609283447, "Full-pretrain/Step": 3408, "Full-pretrain/Step Time": 19.321099501103163} +{"Full-pretrain/Learning Rate": 3.720719594210124e-05, "Full-pretrain/Loss": 1.9825043678283691, "Full-pretrain/Loss (Raw)": 1.842046856880188, "Full-pretrain/Step": 3409, "Full-pretrain/Step Time": 19.296746846288443} +{"Full-pretrain/Learning Rate": 3.7199785472341535e-05, "Full-pretrain/Loss": 1.9715927839279175, "Full-pretrain/Loss (Raw)": 1.8791261911392212, "Full-pretrain/Step": 3410, "Full-pretrain/Step Time": 19.277477966621518} +{"Full-pretrain/Learning Rate": 3.719237359534087e-05, "Full-pretrain/Loss": 1.9666870832443237, "Full-pretrain/Loss (Raw)": 1.8173357248306274, "Full-pretrain/Step": 3411, "Full-pretrain/Step Time": 19.254848515614867} +{"Full-pretrain/Learning Rate": 3.7184960311954185e-05, "Full-pretrain/Loss": 1.9738092422485352, "Full-pretrain/Loss (Raw)": 2.2248196601867676, "Full-pretrain/Step": 3412, "Full-pretrain/Step Time": 19.241910519078374} +{"Full-pretrain/Learning Rate": 3.717754562303661e-05, "Full-pretrain/Loss": 1.98276948928833, "Full-pretrain/Loss (Raw)": 2.3724448680877686, "Full-pretrain/Step": 3413, "Full-pretrain/Step Time": 19.228903179988265} +{"Full-pretrain/Learning Rate": 3.717012952944344e-05, "Full-pretrain/Loss": 1.983059287071228, "Full-pretrain/Loss (Raw)": 1.9516792297363281, "Full-pretrain/Step": 3414, "Full-pretrain/Step Time": 19.201023746281862} +{"Full-pretrain/Learning Rate": 3.716271203203009e-05, "Full-pretrain/Loss": 1.9926087856292725, "Full-pretrain/Loss (Raw)": 2.224252939224243, "Full-pretrain/Step": 3415, "Full-pretrain/Step Time": 19.15898028574884} +{"Full-pretrain/Learning Rate": 3.71552931316522e-05, "Full-pretrain/Loss": 1.9961495399475098, "Full-pretrain/Loss (Raw)": 2.164058208465576, "Full-pretrain/Step": 3416, "Full-pretrain/Step Time": 19.106491638347507} +{"Full-pretrain/Learning Rate": 3.71478728291655e-05, "Full-pretrain/Loss": 1.988104224205017, "Full-pretrain/Loss (Raw)": 1.8030498027801514, "Full-pretrain/Step": 3417, "Full-pretrain/Step Time": 19.070296052843332} +{"Full-pretrain/Learning Rate": 3.714045112542594e-05, "Full-pretrain/Loss": 1.9940766096115112, "Full-pretrain/Loss (Raw)": 2.181783676147461, "Full-pretrain/Step": 3418, "Full-pretrain/Step Time": 19.03578702919185} +{"Full-pretrain/Learning Rate": 3.7133028021289626e-05, "Full-pretrain/Loss": 1.9984235763549805, "Full-pretrain/Loss (Raw)": 1.9930325746536255, "Full-pretrain/Step": 3419, "Full-pretrain/Step Time": 18.989082658663392} +{"Full-pretrain/Learning Rate": 3.712560351761277e-05, "Full-pretrain/Loss": 1.9863901138305664, "Full-pretrain/Loss (Raw)": 1.591325044631958, "Full-pretrain/Step": 3420, "Full-pretrain/Step Time": 18.944547783583403} +{"Full-pretrain/Learning Rate": 3.711817761525183e-05, "Full-pretrain/Loss": 1.980772852897644, "Full-pretrain/Loss (Raw)": 1.7688541412353516, "Full-pretrain/Step": 3421, "Full-pretrain/Step Time": 18.908751407638192} +{"Full-pretrain/Learning Rate": 3.7110750315063344e-05, "Full-pretrain/Loss": 1.981002688407898, "Full-pretrain/Loss (Raw)": 1.9875431060791016, "Full-pretrain/Step": 3422, "Full-pretrain/Step Time": 18.87225835211575} +{"Full-pretrain/Learning Rate": 3.7103321617904076e-05, "Full-pretrain/Loss": 1.9823250770568848, "Full-pretrain/Loss (Raw)": 2.048340082168579, "Full-pretrain/Step": 3423, "Full-pretrain/Step Time": 18.840413101017475} +{"Full-pretrain/Learning Rate": 3.709589152463092e-05, "Full-pretrain/Loss": 1.997318983078003, "Full-pretrain/Loss (Raw)": 2.238640785217285, "Full-pretrain/Step": 3424, "Full-pretrain/Step Time": 18.803212082013488} +{"Full-pretrain/Learning Rate": 3.7088460036100917e-05, "Full-pretrain/Loss": 1.9886274337768555, "Full-pretrain/Loss (Raw)": 1.9096839427947998, "Full-pretrain/Step": 3425, "Full-pretrain/Step Time": 18.767519861459732} +{"Full-pretrain/Learning Rate": 3.70810271531713e-05, "Full-pretrain/Loss": 2.0006003379821777, "Full-pretrain/Loss (Raw)": 2.280937433242798, "Full-pretrain/Step": 3426, "Full-pretrain/Step Time": 18.727791983634233} +{"Full-pretrain/Learning Rate": 3.7073592876699444e-05, "Full-pretrain/Loss": 2.0108089447021484, "Full-pretrain/Loss (Raw)": 2.0496697425842285, "Full-pretrain/Step": 3427, "Full-pretrain/Step Time": 18.686390589922667} +{"Full-pretrain/Learning Rate": 3.706615720754288e-05, "Full-pretrain/Loss": 2.0174107551574707, "Full-pretrain/Loss (Raw)": 2.075437545776367, "Full-pretrain/Step": 3428, "Full-pretrain/Step Time": 18.647261779755354} +{"Full-pretrain/Learning Rate": 3.7058720146559346e-05, "Full-pretrain/Loss": 2.016629457473755, "Full-pretrain/Loss (Raw)": 1.7567861080169678, "Full-pretrain/Step": 3429, "Full-pretrain/Step Time": 18.613130658864975} +{"Full-pretrain/Learning Rate": 3.705128169460667e-05, "Full-pretrain/Loss": 2.0106542110443115, "Full-pretrain/Loss (Raw)": 2.0008888244628906, "Full-pretrain/Step": 3430, "Full-pretrain/Step Time": 18.572602918371558} +{"Full-pretrain/Learning Rate": 3.704384185254288e-05, "Full-pretrain/Loss": 2.0213468074798584, "Full-pretrain/Loss (Raw)": 2.3301992416381836, "Full-pretrain/Step": 3431, "Full-pretrain/Step Time": 18.546873891726136} +{"Full-pretrain/Learning Rate": 3.703640062122618e-05, "Full-pretrain/Loss": 2.0028300285339355, "Full-pretrain/Loss (Raw)": 1.7544264793395996, "Full-pretrain/Step": 3432, "Full-pretrain/Step Time": 18.49563856422901} +{"Full-pretrain/Learning Rate": 3.702895800151489e-05, "Full-pretrain/Loss": 2.0026354789733887, "Full-pretrain/Loss (Raw)": 1.9692565202713013, "Full-pretrain/Step": 3433, "Full-pretrain/Step Time": 18.460123045369983} +{"Full-pretrain/Learning Rate": 3.702151399426752e-05, "Full-pretrain/Loss": 1.9995198249816895, "Full-pretrain/Loss (Raw)": 1.9029812812805176, "Full-pretrain/Step": 3434, "Full-pretrain/Step Time": 18.434327924624085} +{"Full-pretrain/Learning Rate": 3.7014068600342734e-05, "Full-pretrain/Loss": 1.9994984865188599, "Full-pretrain/Loss (Raw)": 1.9237349033355713, "Full-pretrain/Step": 3435, "Full-pretrain/Step Time": 18.41148915886879} +{"Full-pretrain/Learning Rate": 3.7006621820599356e-05, "Full-pretrain/Loss": 1.9969226121902466, "Full-pretrain/Loss (Raw)": 2.0477490425109863, "Full-pretrain/Step": 3436, "Full-pretrain/Step Time": 18.38923537917435} +{"Full-pretrain/Learning Rate": 3.6999173655896374e-05, "Full-pretrain/Loss": 1.9953291416168213, "Full-pretrain/Loss (Raw)": 1.8712197542190552, "Full-pretrain/Step": 3437, "Full-pretrain/Step Time": 18.358381746336818} +{"Full-pretrain/Learning Rate": 3.699172410709293e-05, "Full-pretrain/Loss": 2.0056984424591064, "Full-pretrain/Loss (Raw)": 1.997936487197876, "Full-pretrain/Step": 3438, "Full-pretrain/Step Time": 18.33452838473022} +{"Full-pretrain/Learning Rate": 3.698427317504832e-05, "Full-pretrain/Loss": 2.0097408294677734, "Full-pretrain/Loss (Raw)": 2.298633575439453, "Full-pretrain/Step": 3439, "Full-pretrain/Step Time": 18.31066393852234} +{"Full-pretrain/Learning Rate": 3.697682086062201e-05, "Full-pretrain/Loss": 2.0077033042907715, "Full-pretrain/Loss (Raw)": 1.9886322021484375, "Full-pretrain/Step": 3440, "Full-pretrain/Step Time": 18.281591759994626} +{"Full-pretrain/Learning Rate": 3.696936716467363e-05, "Full-pretrain/Loss": 2.0117082595825195, "Full-pretrain/Loss (Raw)": 1.9702026844024658, "Full-pretrain/Step": 3441, "Full-pretrain/Step Time": 18.258282773196697} +{"Full-pretrain/Learning Rate": 3.696191208806295e-05, "Full-pretrain/Loss": 2.0147292613983154, "Full-pretrain/Loss (Raw)": 1.9757976531982422, "Full-pretrain/Step": 3442, "Full-pretrain/Step Time": 18.24306042306125} +{"Full-pretrain/Learning Rate": 3.695445563164991e-05, "Full-pretrain/Loss": 2.020669937133789, "Full-pretrain/Loss (Raw)": 2.007441520690918, "Full-pretrain/Step": 3443, "Full-pretrain/Step Time": 18.227667221799493} +{"Full-pretrain/Learning Rate": 3.694699779629461e-05, "Full-pretrain/Loss": 2.0196666717529297, "Full-pretrain/Loss (Raw)": 2.1927127838134766, "Full-pretrain/Step": 3444, "Full-pretrain/Step Time": 18.20725885592401} +{"Full-pretrain/Learning Rate": 3.693953858285733e-05, "Full-pretrain/Loss": 2.0051016807556152, "Full-pretrain/Loss (Raw)": 1.9063656330108643, "Full-pretrain/Step": 3445, "Full-pretrain/Step Time": 18.194473281502724} +{"Full-pretrain/Learning Rate": 3.693207799219845e-05, "Full-pretrain/Loss": 2.008584499359131, "Full-pretrain/Loss (Raw)": 2.063129425048828, "Full-pretrain/Step": 3446, "Full-pretrain/Step Time": 18.186495020985603} +{"Full-pretrain/Learning Rate": 3.692461602517859e-05, "Full-pretrain/Loss": 2.002619504928589, "Full-pretrain/Loss (Raw)": 2.0333752632141113, "Full-pretrain/Step": 3447, "Full-pretrain/Step Time": 18.170684196054935} +{"Full-pretrain/Learning Rate": 3.691715268265844e-05, "Full-pretrain/Loss": 1.9926178455352783, "Full-pretrain/Loss (Raw)": 1.843999981880188, "Full-pretrain/Step": 3448, "Full-pretrain/Step Time": 18.158956555649638} +{"Full-pretrain/Learning Rate": 3.690968796549893e-05, "Full-pretrain/Loss": 1.9970667362213135, "Full-pretrain/Loss (Raw)": 1.9454154968261719, "Full-pretrain/Step": 3449, "Full-pretrain/Step Time": 18.144229006022215} +{"Full-pretrain/Learning Rate": 3.69022218745611e-05, "Full-pretrain/Loss": 1.9742112159729004, "Full-pretrain/Loss (Raw)": 1.450408697128296, "Full-pretrain/Step": 3450, "Full-pretrain/Step Time": 18.134174624457955} +{"Full-pretrain/Learning Rate": 3.689475441070615e-05, "Full-pretrain/Loss": 1.980320692062378, "Full-pretrain/Loss (Raw)": 2.188535690307617, "Full-pretrain/Step": 3451, "Full-pretrain/Step Time": 18.120015125721693} +{"Full-pretrain/Learning Rate": 3.688728557479546e-05, "Full-pretrain/Loss": 1.9927031993865967, "Full-pretrain/Loss (Raw)": 1.9875659942626953, "Full-pretrain/Step": 3452, "Full-pretrain/Step Time": 18.096525616943836} +{"Full-pretrain/Learning Rate": 3.6879815367690565e-05, "Full-pretrain/Loss": 2.009860038757324, "Full-pretrain/Loss (Raw)": 2.3178791999816895, "Full-pretrain/Step": 3453, "Full-pretrain/Step Time": 18.07436660118401} +{"Full-pretrain/Learning Rate": 3.687234379025313e-05, "Full-pretrain/Loss": 2.015867233276367, "Full-pretrain/Loss (Raw)": 2.1797680854797363, "Full-pretrain/Step": 3454, "Full-pretrain/Step Time": 18.059426182880998} +{"Full-pretrain/Learning Rate": 3.686487084334502e-05, "Full-pretrain/Loss": 2.0151867866516113, "Full-pretrain/Loss (Raw)": 2.0265631675720215, "Full-pretrain/Step": 3455, "Full-pretrain/Step Time": 18.040063865482807} +{"Full-pretrain/Learning Rate": 3.685739652782822e-05, "Full-pretrain/Loss": 2.0154306888580322, "Full-pretrain/Loss (Raw)": 2.2464468479156494, "Full-pretrain/Step": 3456, "Full-pretrain/Step Time": 18.02030031569302} +{"Full-pretrain/Learning Rate": 3.6849920844564906e-05, "Full-pretrain/Loss": 2.026172161102295, "Full-pretrain/Loss (Raw)": 2.253417730331421, "Full-pretrain/Step": 3457, "Full-pretrain/Step Time": 18.00492273271084} +{"Full-pretrain/Learning Rate": 3.6842443794417384e-05, "Full-pretrain/Loss": 2.0200881958007812, "Full-pretrain/Loss (Raw)": 2.086244583129883, "Full-pretrain/Step": 3458, "Full-pretrain/Step Time": 17.98838809877634} +{"Full-pretrain/Learning Rate": 3.683496537824813e-05, "Full-pretrain/Loss": 2.0114877223968506, "Full-pretrain/Loss (Raw)": 1.7744555473327637, "Full-pretrain/Step": 3459, "Full-pretrain/Step Time": 17.973504040390253} +{"Full-pretrain/Learning Rate": 3.6827485596919776e-05, "Full-pretrain/Loss": 2.0121803283691406, "Full-pretrain/Loss (Raw)": 2.0976009368896484, "Full-pretrain/Step": 3460, "Full-pretrain/Step Time": 17.959887644276023} +{"Full-pretrain/Learning Rate": 3.682000445129512e-05, "Full-pretrain/Loss": 2.0316386222839355, "Full-pretrain/Loss (Raw)": 2.3794572353363037, "Full-pretrain/Step": 3461, "Full-pretrain/Step Time": 17.951238576322794} +{"Full-pretrain/Learning Rate": 3.6812521942237104e-05, "Full-pretrain/Loss": 2.0401992797851562, "Full-pretrain/Loss (Raw)": 2.274829387664795, "Full-pretrain/Step": 3462, "Full-pretrain/Step Time": 17.937221655622125} +{"Full-pretrain/Learning Rate": 3.680503807060883e-05, "Full-pretrain/Loss": 2.0306122303009033, "Full-pretrain/Loss (Raw)": 2.0234107971191406, "Full-pretrain/Step": 3463, "Full-pretrain/Step Time": 17.92303943261504} +{"Full-pretrain/Learning Rate": 3.6797552837273566e-05, "Full-pretrain/Loss": 2.0442588329315186, "Full-pretrain/Loss (Raw)": 2.1911182403564453, "Full-pretrain/Step": 3464, "Full-pretrain/Step Time": 17.906852532178164} +{"Full-pretrain/Learning Rate": 3.679006624309472e-05, "Full-pretrain/Loss": 2.0490362644195557, "Full-pretrain/Loss (Raw)": 2.122134208679199, "Full-pretrain/Step": 3465, "Full-pretrain/Step Time": 17.89487948268652} +{"Full-pretrain/Learning Rate": 3.678257828893589e-05, "Full-pretrain/Loss": 2.0499818325042725, "Full-pretrain/Loss (Raw)": 1.9332352876663208, "Full-pretrain/Step": 3466, "Full-pretrain/Step Time": 17.880141757428646} +{"Full-pretrain/Learning Rate": 3.6775088975660796e-05, "Full-pretrain/Loss": 2.0457329750061035, "Full-pretrain/Loss (Raw)": 1.7877719402313232, "Full-pretrain/Step": 3467, "Full-pretrain/Step Time": 17.870790280401707} +{"Full-pretrain/Learning Rate": 3.6767598304133324e-05, "Full-pretrain/Loss": 2.0361993312835693, "Full-pretrain/Loss (Raw)": 1.7426725625991821, "Full-pretrain/Step": 3468, "Full-pretrain/Step Time": 17.847003404051065} +{"Full-pretrain/Learning Rate": 3.676010627521751e-05, "Full-pretrain/Loss": 2.04166841506958, "Full-pretrain/Loss (Raw)": 2.046238422393799, "Full-pretrain/Step": 3469, "Full-pretrain/Step Time": 17.837761487811804} +{"Full-pretrain/Learning Rate": 3.6752612889777574e-05, "Full-pretrain/Loss": 2.0338406562805176, "Full-pretrain/Loss (Raw)": 1.7474379539489746, "Full-pretrain/Step": 3470, "Full-pretrain/Step Time": 17.82347170636058} +{"Full-pretrain/Learning Rate": 3.674511814867788e-05, "Full-pretrain/Loss": 2.025054931640625, "Full-pretrain/Loss (Raw)": 2.017489194869995, "Full-pretrain/Step": 3471, "Full-pretrain/Step Time": 17.815911265090108} +{"Full-pretrain/Learning Rate": 3.673762205278293e-05, "Full-pretrain/Loss": 2.0230212211608887, "Full-pretrain/Loss (Raw)": 1.9235559701919556, "Full-pretrain/Step": 3472, "Full-pretrain/Step Time": 17.7972704898566} +{"Full-pretrain/Learning Rate": 3.6730124602957396e-05, "Full-pretrain/Loss": 2.021069049835205, "Full-pretrain/Loss (Raw)": 1.9077383279800415, "Full-pretrain/Step": 3473, "Full-pretrain/Step Time": 17.785796819254756} +{"Full-pretrain/Learning Rate": 3.6722625800066124e-05, "Full-pretrain/Loss": 2.0137646198272705, "Full-pretrain/Loss (Raw)": 1.742053508758545, "Full-pretrain/Step": 3474, "Full-pretrain/Step Time": 17.775418553501368} +{"Full-pretrain/Learning Rate": 3.671512564497408e-05, "Full-pretrain/Loss": 2.01473331451416, "Full-pretrain/Loss (Raw)": 2.0384366512298584, "Full-pretrain/Step": 3475, "Full-pretrain/Step Time": 17.764308312907815} +{"Full-pretrain/Learning Rate": 3.6707624138546414e-05, "Full-pretrain/Loss": 2.0060689449310303, "Full-pretrain/Loss (Raw)": 1.9154596328735352, "Full-pretrain/Step": 3476, "Full-pretrain/Step Time": 17.75524098984897} +{"Full-pretrain/Learning Rate": 3.670012128164841e-05, "Full-pretrain/Loss": 2.0116844177246094, "Full-pretrain/Loss (Raw)": 2.0860583782196045, "Full-pretrain/Step": 3477, "Full-pretrain/Step Time": 17.744545578956604} +{"Full-pretrain/Learning Rate": 3.669261707514553e-05, "Full-pretrain/Loss": 2.005190372467041, "Full-pretrain/Loss (Raw)": 1.8553212881088257, "Full-pretrain/Step": 3478, "Full-pretrain/Step Time": 17.74169421568513} +{"Full-pretrain/Learning Rate": 3.6685111519903384e-05, "Full-pretrain/Loss": 2.0049211978912354, "Full-pretrain/Loss (Raw)": 2.0247554779052734, "Full-pretrain/Step": 3479, "Full-pretrain/Step Time": 17.734596541151404} +{"Full-pretrain/Learning Rate": 3.667760461678772e-05, "Full-pretrain/Loss": 2.0080957412719727, "Full-pretrain/Loss (Raw)": 1.9455909729003906, "Full-pretrain/Step": 3480, "Full-pretrain/Step Time": 17.729083256796002} +{"Full-pretrain/Learning Rate": 3.667009636666447e-05, "Full-pretrain/Loss": 2.011512279510498, "Full-pretrain/Loss (Raw)": 2.0547423362731934, "Full-pretrain/Step": 3481, "Full-pretrain/Step Time": 17.719967879354954} +{"Full-pretrain/Learning Rate": 3.6662586770399714e-05, "Full-pretrain/Loss": 2.0328853130340576, "Full-pretrain/Loss (Raw)": 2.1343464851379395, "Full-pretrain/Step": 3482, "Full-pretrain/Step Time": 17.70941912010312} +{"Full-pretrain/Learning Rate": 3.665507582885968e-05, "Full-pretrain/Loss": 2.0204269886016846, "Full-pretrain/Loss (Raw)": 1.7898685932159424, "Full-pretrain/Step": 3483, "Full-pretrain/Step Time": 17.697418315336108} +{"Full-pretrain/Learning Rate": 3.664756354291073e-05, "Full-pretrain/Loss": 2.020538330078125, "Full-pretrain/Loss (Raw)": 1.991132378578186, "Full-pretrain/Step": 3484, "Full-pretrain/Step Time": 17.706133848056197} +{"Full-pretrain/Learning Rate": 3.6640049913419414e-05, "Full-pretrain/Loss": 2.0034427642822266, "Full-pretrain/Loss (Raw)": 1.7708173990249634, "Full-pretrain/Step": 3485, "Full-pretrain/Step Time": 17.69462346099317} +{"Full-pretrain/Learning Rate": 3.663253494125244e-05, "Full-pretrain/Loss": 1.997802734375, "Full-pretrain/Loss (Raw)": 1.9992859363555908, "Full-pretrain/Step": 3486, "Full-pretrain/Step Time": 17.68970586359501} +{"Full-pretrain/Learning Rate": 3.6625018627276644e-05, "Full-pretrain/Loss": 1.995236873626709, "Full-pretrain/Loss (Raw)": 1.9444522857666016, "Full-pretrain/Step": 3487, "Full-pretrain/Step Time": 17.6850460562855} +{"Full-pretrain/Learning Rate": 3.661750097235904e-05, "Full-pretrain/Loss": 1.9931330680847168, "Full-pretrain/Loss (Raw)": 2.179129123687744, "Full-pretrain/Step": 3488, "Full-pretrain/Step Time": 17.68375255726278} +{"Full-pretrain/Learning Rate": 3.660998197736677e-05, "Full-pretrain/Loss": 1.9784245491027832, "Full-pretrain/Loss (Raw)": 1.7827463150024414, "Full-pretrain/Step": 3489, "Full-pretrain/Step Time": 17.678646532818675} +{"Full-pretrain/Learning Rate": 3.6602461643167174e-05, "Full-pretrain/Loss": 1.9762743711471558, "Full-pretrain/Loss (Raw)": 2.0174381732940674, "Full-pretrain/Step": 3490, "Full-pretrain/Step Time": 17.68197680823505} +{"Full-pretrain/Learning Rate": 3.65949399706277e-05, "Full-pretrain/Loss": 1.9903230667114258, "Full-pretrain/Loss (Raw)": 2.2240149974823, "Full-pretrain/Step": 3491, "Full-pretrain/Step Time": 17.672568306326866} +{"Full-pretrain/Learning Rate": 3.6587416960615985e-05, "Full-pretrain/Loss": 1.9906599521636963, "Full-pretrain/Loss (Raw)": 2.10837984085083, "Full-pretrain/Step": 3492, "Full-pretrain/Step Time": 17.672927152365446} +{"Full-pretrain/Learning Rate": 3.657989261399978e-05, "Full-pretrain/Loss": 1.9780784845352173, "Full-pretrain/Loss (Raw)": 1.9768495559692383, "Full-pretrain/Step": 3493, "Full-pretrain/Step Time": 17.6700412184} +{"Full-pretrain/Learning Rate": 3.6572366931647035e-05, "Full-pretrain/Loss": 1.9715734720230103, "Full-pretrain/Loss (Raw)": 2.06666898727417, "Full-pretrain/Step": 3494, "Full-pretrain/Step Time": 17.66922613978386} +{"Full-pretrain/Learning Rate": 3.656483991442583e-05, "Full-pretrain/Loss": 1.9725658893585205, "Full-pretrain/Loss (Raw)": 2.0551681518554688, "Full-pretrain/Step": 3495, "Full-pretrain/Step Time": 17.663944341242313} +{"Full-pretrain/Learning Rate": 3.655731156320441e-05, "Full-pretrain/Loss": 1.9665099382400513, "Full-pretrain/Loss (Raw)": 1.9973275661468506, "Full-pretrain/Step": 3496, "Full-pretrain/Step Time": 17.660969518125057} +{"Full-pretrain/Learning Rate": 3.654978187885116e-05, "Full-pretrain/Loss": 1.959529995918274, "Full-pretrain/Loss (Raw)": 1.8987741470336914, "Full-pretrain/Step": 3497, "Full-pretrain/Step Time": 17.65983202122152} +{"Full-pretrain/Learning Rate": 3.654225086223463e-05, "Full-pretrain/Loss": 1.9670374393463135, "Full-pretrain/Loss (Raw)": 2.173473834991455, "Full-pretrain/Step": 3498, "Full-pretrain/Step Time": 17.653355030342937} +{"Full-pretrain/Learning Rate": 3.653471851422352e-05, "Full-pretrain/Loss": 1.9706463813781738, "Full-pretrain/Loss (Raw)": 1.9032599925994873, "Full-pretrain/Step": 3499, "Full-pretrain/Step Time": 17.656747665256262} +{"Full-pretrain/Learning Rate": 3.6527184835686685e-05, "Full-pretrain/Loss": 1.9823830127716064, "Full-pretrain/Loss (Raw)": 2.1182444095611572, "Full-pretrain/Step": 3500, "Full-pretrain/Step Time": 17.64960159547627} +{"Full-pretrain/Learning Rate": 3.651964982749312e-05, "Full-pretrain/Loss": 1.9784282445907593, "Full-pretrain/Loss (Raw)": 1.919684648513794, "Full-pretrain/Step": 3501, "Full-pretrain/Step Time": 17.650646310299635} +{"Full-pretrain/Learning Rate": 3.6512113490512004e-05, "Full-pretrain/Loss": 1.9878604412078857, "Full-pretrain/Loss (Raw)": 2.04927134513855, "Full-pretrain/Step": 3502, "Full-pretrain/Step Time": 17.642980728298426} +{"Full-pretrain/Learning Rate": 3.6504575825612644e-05, "Full-pretrain/Loss": 1.9865522384643555, "Full-pretrain/Loss (Raw)": 1.975622296333313, "Full-pretrain/Step": 3503, "Full-pretrain/Step Time": 17.64702440239489} +{"Full-pretrain/Learning Rate": 3.64970368336645e-05, "Full-pretrain/Loss": 1.990728497505188, "Full-pretrain/Loss (Raw)": 2.0571975708007812, "Full-pretrain/Step": 3504, "Full-pretrain/Step Time": 17.637976745143533} +{"Full-pretrain/Learning Rate": 3.6489496515537204e-05, "Full-pretrain/Loss": 1.9910293817520142, "Full-pretrain/Loss (Raw)": 1.9173663854599, "Full-pretrain/Step": 3505, "Full-pretrain/Step Time": 17.63245606608689} +{"Full-pretrain/Learning Rate": 3.648195487210051e-05, "Full-pretrain/Loss": 2.0044634342193604, "Full-pretrain/Loss (Raw)": 2.171943187713623, "Full-pretrain/Step": 3506, "Full-pretrain/Step Time": 17.629467368125916} +{"Full-pretrain/Learning Rate": 3.647441190422437e-05, "Full-pretrain/Loss": 2.006019353866577, "Full-pretrain/Loss (Raw)": 2.0882253646850586, "Full-pretrain/Step": 3507, "Full-pretrain/Step Time": 17.62984874844551} +{"Full-pretrain/Learning Rate": 3.646686761277884e-05, "Full-pretrain/Loss": 2.011164665222168, "Full-pretrain/Loss (Raw)": 2.0801076889038086, "Full-pretrain/Step": 3508, "Full-pretrain/Step Time": 17.62752073071897} +{"Full-pretrain/Learning Rate": 3.6459321998634175e-05, "Full-pretrain/Loss": 2.014645576477051, "Full-pretrain/Loss (Raw)": 2.197446584701538, "Full-pretrain/Step": 3509, "Full-pretrain/Step Time": 17.623634653165936} +{"Full-pretrain/Learning Rate": 3.6451775062660726e-05, "Full-pretrain/Loss": 2.0178747177124023, "Full-pretrain/Loss (Raw)": 1.9586646556854248, "Full-pretrain/Step": 3510, "Full-pretrain/Step Time": 17.62674592807889} +{"Full-pretrain/Learning Rate": 3.6444226805729056e-05, "Full-pretrain/Loss": 2.0155606269836426, "Full-pretrain/Loss (Raw)": 1.95069420337677, "Full-pretrain/Step": 3511, "Full-pretrain/Step Time": 17.624066611751914} +{"Full-pretrain/Learning Rate": 3.6436677228709846e-05, "Full-pretrain/Loss": 2.0172102451324463, "Full-pretrain/Loss (Raw)": 1.9983845949172974, "Full-pretrain/Step": 3512, "Full-pretrain/Step Time": 17.624053727835417} +{"Full-pretrain/Learning Rate": 3.642912633247394e-05, "Full-pretrain/Loss": 2.0245046615600586, "Full-pretrain/Loss (Raw)": 2.2881574630737305, "Full-pretrain/Step": 3513, "Full-pretrain/Step Time": 17.62026971951127} +{"Full-pretrain/Learning Rate": 3.642157411789233e-05, "Full-pretrain/Loss": 2.0223920345306396, "Full-pretrain/Loss (Raw)": 2.0667531490325928, "Full-pretrain/Step": 3514, "Full-pretrain/Step Time": 17.624731365591288} +{"Full-pretrain/Learning Rate": 3.641402058583615e-05, "Full-pretrain/Loss": 2.029695510864258, "Full-pretrain/Loss (Raw)": 2.023578643798828, "Full-pretrain/Step": 3515, "Full-pretrain/Step Time": 17.623362300917506} +{"Full-pretrain/Learning Rate": 3.6406465737176706e-05, "Full-pretrain/Loss": 2.026007652282715, "Full-pretrain/Loss (Raw)": 1.8731201887130737, "Full-pretrain/Step": 3516, "Full-pretrain/Step Time": 17.624261043965816} +{"Full-pretrain/Learning Rate": 3.6398909572785464e-05, "Full-pretrain/Loss": 2.036478042602539, "Full-pretrain/Loss (Raw)": 2.1058719158172607, "Full-pretrain/Step": 3517, "Full-pretrain/Step Time": 17.617737978696823} +{"Full-pretrain/Learning Rate": 3.6391352093534e-05, "Full-pretrain/Loss": 2.0232491493225098, "Full-pretrain/Loss (Raw)": 1.5759611129760742, "Full-pretrain/Step": 3518, "Full-pretrain/Step Time": 17.613862106576562} +{"Full-pretrain/Learning Rate": 3.638379330029407e-05, "Full-pretrain/Loss": 2.021170139312744, "Full-pretrain/Loss (Raw)": 1.8779172897338867, "Full-pretrain/Step": 3519, "Full-pretrain/Step Time": 17.612135723233223} +{"Full-pretrain/Learning Rate": 3.637623319393758e-05, "Full-pretrain/Loss": 2.0187721252441406, "Full-pretrain/Loss (Raw)": 2.1023924350738525, "Full-pretrain/Step": 3520, "Full-pretrain/Step Time": 17.61268717981875} +{"Full-pretrain/Learning Rate": 3.63686717753366e-05, "Full-pretrain/Loss": 2.0275685787200928, "Full-pretrain/Loss (Raw)": 2.064237117767334, "Full-pretrain/Step": 3521, "Full-pretrain/Step Time": 17.60837318189442} +{"Full-pretrain/Learning Rate": 3.6361109045363315e-05, "Full-pretrain/Loss": 2.025679349899292, "Full-pretrain/Loss (Raw)": 1.9569809436798096, "Full-pretrain/Step": 3522, "Full-pretrain/Step Time": 17.607214618474245} +{"Full-pretrain/Learning Rate": 3.63535450048901e-05, "Full-pretrain/Loss": 2.013751268386841, "Full-pretrain/Loss (Raw)": 1.8423174619674683, "Full-pretrain/Step": 3523, "Full-pretrain/Step Time": 17.605220371857285} +{"Full-pretrain/Learning Rate": 3.634597965478946e-05, "Full-pretrain/Loss": 2.0066447257995605, "Full-pretrain/Loss (Raw)": 1.8809661865234375, "Full-pretrain/Step": 3524, "Full-pretrain/Step Time": 17.60153528302908} +{"Full-pretrain/Learning Rate": 3.633841299593406e-05, "Full-pretrain/Loss": 2.0051651000976562, "Full-pretrain/Loss (Raw)": 1.9295077323913574, "Full-pretrain/Step": 3525, "Full-pretrain/Step Time": 17.602189354598522} +{"Full-pretrain/Learning Rate": 3.6330845029196695e-05, "Full-pretrain/Loss": 2.005652666091919, "Full-pretrain/Loss (Raw)": 2.082268714904785, "Full-pretrain/Step": 3526, "Full-pretrain/Step Time": 17.600389640778303} +{"Full-pretrain/Learning Rate": 3.632327575545034e-05, "Full-pretrain/Loss": 2.0082294940948486, "Full-pretrain/Loss (Raw)": 2.137622833251953, "Full-pretrain/Step": 3527, "Full-pretrain/Step Time": 17.59447582438588} +{"Full-pretrain/Learning Rate": 3.6315705175568106e-05, "Full-pretrain/Loss": 2.011355400085449, "Full-pretrain/Loss (Raw)": 2.097364902496338, "Full-pretrain/Step": 3528, "Full-pretrain/Step Time": 17.598490266129375} +{"Full-pretrain/Learning Rate": 3.630813329042326e-05, "Full-pretrain/Loss": 2.0182316303253174, "Full-pretrain/Loss (Raw)": 2.1188042163848877, "Full-pretrain/Step": 3529, "Full-pretrain/Step Time": 17.596209360286593} +{"Full-pretrain/Learning Rate": 3.6300560100889207e-05, "Full-pretrain/Loss": 2.0159196853637695, "Full-pretrain/Loss (Raw)": 2.0994935035705566, "Full-pretrain/Step": 3530, "Full-pretrain/Step Time": 17.596685433760285} +{"Full-pretrain/Learning Rate": 3.629298560783952e-05, "Full-pretrain/Loss": 2.0210018157958984, "Full-pretrain/Loss (Raw)": 2.0658860206604004, "Full-pretrain/Step": 3531, "Full-pretrain/Step Time": 17.592268127948046} +{"Full-pretrain/Learning Rate": 3.628540981214792e-05, "Full-pretrain/Loss": 2.0197315216064453, "Full-pretrain/Loss (Raw)": 2.0775983333587646, "Full-pretrain/Step": 3532, "Full-pretrain/Step Time": 17.59671893529594} +{"Full-pretrain/Learning Rate": 3.627783271468825e-05, "Full-pretrain/Loss": 2.0170137882232666, "Full-pretrain/Loss (Raw)": 1.8327120542526245, "Full-pretrain/Step": 3533, "Full-pretrain/Step Time": 17.59362049587071} +{"Full-pretrain/Learning Rate": 3.627025431633455e-05, "Full-pretrain/Loss": 2.0123860836029053, "Full-pretrain/Loss (Raw)": 1.9011882543563843, "Full-pretrain/Step": 3534, "Full-pretrain/Step Time": 17.5886391364038} +{"Full-pretrain/Learning Rate": 3.6262674617960974e-05, "Full-pretrain/Loss": 2.0190787315368652, "Full-pretrain/Loss (Raw)": 2.189791679382324, "Full-pretrain/Step": 3535, "Full-pretrain/Step Time": 17.591057419776917} +{"Full-pretrain/Learning Rate": 3.6255093620441834e-05, "Full-pretrain/Loss": 2.009805202484131, "Full-pretrain/Loss (Raw)": 1.7604362964630127, "Full-pretrain/Step": 3536, "Full-pretrain/Step Time": 17.589017651975155} +{"Full-pretrain/Learning Rate": 3.6247511324651606e-05, "Full-pretrain/Loss": 2.0125551223754883, "Full-pretrain/Loss (Raw)": 2.005368232727051, "Full-pretrain/Step": 3537, "Full-pretrain/Step Time": 17.585621578618884} +{"Full-pretrain/Learning Rate": 3.6239927731464896e-05, "Full-pretrain/Loss": 2.008173942565918, "Full-pretrain/Loss (Raw)": 2.0317447185516357, "Full-pretrain/Step": 3538, "Full-pretrain/Step Time": 17.59041124023497} +{"Full-pretrain/Learning Rate": 3.6232342841756464e-05, "Full-pretrain/Loss": 1.9977235794067383, "Full-pretrain/Loss (Raw)": 1.7538156509399414, "Full-pretrain/Step": 3539, "Full-pretrain/Step Time": 17.592804165557027} +{"Full-pretrain/Learning Rate": 3.622475665640125e-05, "Full-pretrain/Loss": 2.0041794776916504, "Full-pretrain/Loss (Raw)": 2.2866992950439453, "Full-pretrain/Step": 3540, "Full-pretrain/Step Time": 17.589193992316723} +{"Full-pretrain/Learning Rate": 3.621716917627429e-05, "Full-pretrain/Loss": 2.0007190704345703, "Full-pretrain/Loss (Raw)": 2.086709499359131, "Full-pretrain/Step": 3541, "Full-pretrain/Step Time": 17.5847321562469} +{"Full-pretrain/Learning Rate": 3.6209580402250815e-05, "Full-pretrain/Loss": 2.0034711360931396, "Full-pretrain/Loss (Raw)": 2.0467336177825928, "Full-pretrain/Step": 3542, "Full-pretrain/Step Time": 17.582786347717047} +{"Full-pretrain/Learning Rate": 3.620199033520617e-05, "Full-pretrain/Loss": 1.999078631401062, "Full-pretrain/Loss (Raw)": 1.810133695602417, "Full-pretrain/Step": 3543, "Full-pretrain/Step Time": 17.582274602726102} +{"Full-pretrain/Learning Rate": 3.619439897601587e-05, "Full-pretrain/Loss": 1.9998033046722412, "Full-pretrain/Loss (Raw)": 2.0215744972229004, "Full-pretrain/Step": 3544, "Full-pretrain/Step Time": 17.576643329113722} +{"Full-pretrain/Learning Rate": 3.61868063255556e-05, "Full-pretrain/Loss": 1.9880175590515137, "Full-pretrain/Loss (Raw)": 1.9110126495361328, "Full-pretrain/Step": 3545, "Full-pretrain/Step Time": 17.58124252781272} +{"Full-pretrain/Learning Rate": 3.617921238470114e-05, "Full-pretrain/Loss": 1.9805636405944824, "Full-pretrain/Loss (Raw)": 1.8282256126403809, "Full-pretrain/Step": 3546, "Full-pretrain/Step Time": 17.58299843966961} +{"Full-pretrain/Learning Rate": 3.617161715432847e-05, "Full-pretrain/Loss": 1.9694033861160278, "Full-pretrain/Loss (Raw)": 1.6664533615112305, "Full-pretrain/Step": 3547, "Full-pretrain/Step Time": 17.58514131605625} +{"Full-pretrain/Learning Rate": 3.616402063531368e-05, "Full-pretrain/Loss": 1.965592384338379, "Full-pretrain/Loss (Raw)": 1.7511664628982544, "Full-pretrain/Step": 3548, "Full-pretrain/Step Time": 17.58170404098928} +{"Full-pretrain/Learning Rate": 3.6156422828533035e-05, "Full-pretrain/Loss": 1.9648571014404297, "Full-pretrain/Loss (Raw)": 2.0823416709899902, "Full-pretrain/Step": 3549, "Full-pretrain/Step Time": 17.583858780562878} +{"Full-pretrain/Learning Rate": 3.6148823734862934e-05, "Full-pretrain/Loss": 1.9800183773040771, "Full-pretrain/Loss (Raw)": 2.0611214637756348, "Full-pretrain/Step": 3550, "Full-pretrain/Step Time": 17.5855957493186} +{"Full-pretrain/Learning Rate": 3.6141223355179944e-05, "Full-pretrain/Loss": 1.981909155845642, "Full-pretrain/Loss (Raw)": 1.9384257793426514, "Full-pretrain/Step": 3551, "Full-pretrain/Step Time": 17.5800911039114} +{"Full-pretrain/Learning Rate": 3.613362169036074e-05, "Full-pretrain/Loss": 1.983772873878479, "Full-pretrain/Loss (Raw)": 2.1620287895202637, "Full-pretrain/Step": 3552, "Full-pretrain/Step Time": 17.579663498327136} +{"Full-pretrain/Learning Rate": 3.61260187412822e-05, "Full-pretrain/Loss": 1.9797557592391968, "Full-pretrain/Loss (Raw)": 1.9356917142868042, "Full-pretrain/Step": 3553, "Full-pretrain/Step Time": 17.584299944341183} +{"Full-pretrain/Learning Rate": 3.61184145088213e-05, "Full-pretrain/Loss": 1.9781544208526611, "Full-pretrain/Loss (Raw)": 1.9057374000549316, "Full-pretrain/Step": 3554, "Full-pretrain/Step Time": 17.58436325378716} +{"Full-pretrain/Learning Rate": 3.6110808993855194e-05, "Full-pretrain/Loss": 1.9828968048095703, "Full-pretrain/Loss (Raw)": 1.9940739870071411, "Full-pretrain/Step": 3555, "Full-pretrain/Step Time": 17.585142463445663} +{"Full-pretrain/Learning Rate": 3.6103202197261175e-05, "Full-pretrain/Loss": 1.9973773956298828, "Full-pretrain/Loss (Raw)": 2.3443431854248047, "Full-pretrain/Step": 3556, "Full-pretrain/Step Time": 17.588817957788706} +{"Full-pretrain/Learning Rate": 3.609559411991669e-05, "Full-pretrain/Loss": 1.9982023239135742, "Full-pretrain/Loss (Raw)": 1.955909252166748, "Full-pretrain/Step": 3557, "Full-pretrain/Step Time": 17.58749395236373} +{"Full-pretrain/Learning Rate": 3.608798476269932e-05, "Full-pretrain/Loss": 1.993861436843872, "Full-pretrain/Loss (Raw)": 1.9433578252792358, "Full-pretrain/Step": 3558, "Full-pretrain/Step Time": 17.59662681259215} +{"Full-pretrain/Learning Rate": 3.60803741264868e-05, "Full-pretrain/Loss": 1.9902238845825195, "Full-pretrain/Loss (Raw)": 2.0212206840515137, "Full-pretrain/Step": 3559, "Full-pretrain/Step Time": 17.59169622696936} +{"Full-pretrain/Learning Rate": 3.607276221215703e-05, "Full-pretrain/Loss": 1.9881830215454102, "Full-pretrain/Loss (Raw)": 2.032055616378784, "Full-pretrain/Step": 3560, "Full-pretrain/Step Time": 17.59553600102663} +{"Full-pretrain/Learning Rate": 3.606514902058802e-05, "Full-pretrain/Loss": 1.9877488613128662, "Full-pretrain/Loss (Raw)": 2.104910373687744, "Full-pretrain/Step": 3561, "Full-pretrain/Step Time": 17.59764571301639} +{"Full-pretrain/Learning Rate": 3.6057534552657954e-05, "Full-pretrain/Loss": 1.9909758567810059, "Full-pretrain/Loss (Raw)": 2.2027626037597656, "Full-pretrain/Step": 3562, "Full-pretrain/Step Time": 17.59803231433034} +{"Full-pretrain/Learning Rate": 3.604991880924518e-05, "Full-pretrain/Loss": 1.9919557571411133, "Full-pretrain/Loss (Raw)": 2.0972397327423096, "Full-pretrain/Step": 3563, "Full-pretrain/Step Time": 17.595081752166152} +{"Full-pretrain/Learning Rate": 3.604230179122814e-05, "Full-pretrain/Loss": 1.9826536178588867, "Full-pretrain/Loss (Raw)": 1.7799288034439087, "Full-pretrain/Step": 3564, "Full-pretrain/Step Time": 17.59905810467899} +{"Full-pretrain/Learning Rate": 3.6034683499485465e-05, "Full-pretrain/Loss": 1.9862251281738281, "Full-pretrain/Loss (Raw)": 1.9470012187957764, "Full-pretrain/Step": 3565, "Full-pretrain/Step Time": 17.60274195857346} +{"Full-pretrain/Learning Rate": 3.602706393489594e-05, "Full-pretrain/Loss": 1.9928276538848877, "Full-pretrain/Loss (Raw)": 2.1124720573425293, "Full-pretrain/Step": 3566, "Full-pretrain/Step Time": 17.601772671565413} +{"Full-pretrain/Learning Rate": 3.6019443098338466e-05, "Full-pretrain/Loss": 1.9831337928771973, "Full-pretrain/Loss (Raw)": 1.8795819282531738, "Full-pretrain/Step": 3567, "Full-pretrain/Step Time": 17.59913855046034} +{"Full-pretrain/Learning Rate": 3.6011820990692094e-05, "Full-pretrain/Loss": 1.9883627891540527, "Full-pretrain/Loss (Raw)": 1.927768349647522, "Full-pretrain/Step": 3568, "Full-pretrain/Step Time": 17.601540382951498} +{"Full-pretrain/Learning Rate": 3.6004197612836044e-05, "Full-pretrain/Loss": 1.9894723892211914, "Full-pretrain/Loss (Raw)": 2.0408730506896973, "Full-pretrain/Step": 3569, "Full-pretrain/Step Time": 17.606427989900112} +{"Full-pretrain/Learning Rate": 3.599657296564966e-05, "Full-pretrain/Loss": 1.9872262477874756, "Full-pretrain/Loss (Raw)": 1.9598685503005981, "Full-pretrain/Step": 3570, "Full-pretrain/Step Time": 17.599383307620883} +{"Full-pretrain/Learning Rate": 3.598894705001246e-05, "Full-pretrain/Loss": 2.004840850830078, "Full-pretrain/Loss (Raw)": 2.3174843788146973, "Full-pretrain/Step": 3571, "Full-pretrain/Step Time": 17.60038487613201} +{"Full-pretrain/Learning Rate": 3.598131986680408e-05, "Full-pretrain/Loss": 1.995152473449707, "Full-pretrain/Loss (Raw)": 1.976670503616333, "Full-pretrain/Step": 3572, "Full-pretrain/Step Time": 17.599504759535193} +{"Full-pretrain/Learning Rate": 3.59736914169043e-05, "Full-pretrain/Loss": 1.9883804321289062, "Full-pretrain/Loss (Raw)": 1.8700048923492432, "Full-pretrain/Step": 3573, "Full-pretrain/Step Time": 17.59752669557929} +{"Full-pretrain/Learning Rate": 3.596606170119308e-05, "Full-pretrain/Loss": 1.9853301048278809, "Full-pretrain/Loss (Raw)": 1.9491215944290161, "Full-pretrain/Step": 3574, "Full-pretrain/Step Time": 17.595568930730224} +{"Full-pretrain/Learning Rate": 3.59584307205505e-05, "Full-pretrain/Loss": 1.9879145622253418, "Full-pretrain/Loss (Raw)": 1.8928356170654297, "Full-pretrain/Step": 3575, "Full-pretrain/Step Time": 17.59820343181491} +{"Full-pretrain/Learning Rate": 3.5950798475856783e-05, "Full-pretrain/Loss": 1.9814311265945435, "Full-pretrain/Loss (Raw)": 1.8141053915023804, "Full-pretrain/Step": 3576, "Full-pretrain/Step Time": 17.59543294273317} +{"Full-pretrain/Learning Rate": 3.59431649679923e-05, "Full-pretrain/Loss": 1.988739252090454, "Full-pretrain/Loss (Raw)": 2.1448755264282227, "Full-pretrain/Step": 3577, "Full-pretrain/Step Time": 17.58990229666233} +{"Full-pretrain/Learning Rate": 3.59355301978376e-05, "Full-pretrain/Loss": 2.00296688079834, "Full-pretrain/Loss (Raw)": 2.283511161804199, "Full-pretrain/Step": 3578, "Full-pretrain/Step Time": 17.587372563779354} +{"Full-pretrain/Learning Rate": 3.592789416627332e-05, "Full-pretrain/Loss": 2.005131959915161, "Full-pretrain/Loss (Raw)": 1.7357356548309326, "Full-pretrain/Step": 3579, "Full-pretrain/Step Time": 17.592163057997823} +{"Full-pretrain/Learning Rate": 3.59202568741803e-05, "Full-pretrain/Loss": 2.012275218963623, "Full-pretrain/Loss (Raw)": 1.9797489643096924, "Full-pretrain/Step": 3580, "Full-pretrain/Step Time": 17.583954380825162} +{"Full-pretrain/Learning Rate": 3.5912618322439485e-05, "Full-pretrain/Loss": 2.004635810852051, "Full-pretrain/Loss (Raw)": 1.837878942489624, "Full-pretrain/Step": 3581, "Full-pretrain/Step Time": 17.592298425734043} +{"Full-pretrain/Learning Rate": 3.590497851193198e-05, "Full-pretrain/Loss": 2.0058610439300537, "Full-pretrain/Loss (Raw)": 2.100327730178833, "Full-pretrain/Step": 3582, "Full-pretrain/Step Time": 17.5869048461318} +{"Full-pretrain/Learning Rate": 3.589733744353904e-05, "Full-pretrain/Loss": 2.016796112060547, "Full-pretrain/Loss (Raw)": 2.2883551120758057, "Full-pretrain/Step": 3583, "Full-pretrain/Step Time": 17.592142563313246} +{"Full-pretrain/Learning Rate": 3.588969511814205e-05, "Full-pretrain/Loss": 2.003230571746826, "Full-pretrain/Loss (Raw)": 1.7279272079467773, "Full-pretrain/Step": 3584, "Full-pretrain/Step Time": 17.596121286973357} +{"Full-pretrain/Learning Rate": 3.588205153662256e-05, "Full-pretrain/Loss": 2.0016846656799316, "Full-pretrain/Loss (Raw)": 1.88621985912323, "Full-pretrain/Step": 3585, "Full-pretrain/Step Time": 17.594309501349926} +{"Full-pretrain/Learning Rate": 3.587440669986224e-05, "Full-pretrain/Loss": 2.002195358276367, "Full-pretrain/Loss (Raw)": 1.922074556350708, "Full-pretrain/Step": 3586, "Full-pretrain/Step Time": 17.592885425314307} +{"Full-pretrain/Learning Rate": 3.586676060874293e-05, "Full-pretrain/Loss": 2.002997875213623, "Full-pretrain/Loss (Raw)": 2.0197675228118896, "Full-pretrain/Step": 3587, "Full-pretrain/Step Time": 17.59537380002439} +{"Full-pretrain/Learning Rate": 3.585911326414661e-05, "Full-pretrain/Loss": 1.9910417795181274, "Full-pretrain/Loss (Raw)": 1.9617418050765991, "Full-pretrain/Step": 3588, "Full-pretrain/Step Time": 17.594817493110895} +{"Full-pretrain/Learning Rate": 3.5851464666955385e-05, "Full-pretrain/Loss": 1.9816721677780151, "Full-pretrain/Loss (Raw)": 1.6560832262039185, "Full-pretrain/Step": 3589, "Full-pretrain/Step Time": 17.590992879122496} +{"Full-pretrain/Learning Rate": 3.5843814818051534e-05, "Full-pretrain/Loss": 1.9865049123764038, "Full-pretrain/Loss (Raw)": 2.098001718521118, "Full-pretrain/Step": 3590, "Full-pretrain/Step Time": 17.595095360651612} +{"Full-pretrain/Learning Rate": 3.583616371831745e-05, "Full-pretrain/Loss": 1.9845540523529053, "Full-pretrain/Loss (Raw)": 1.9588007926940918, "Full-pretrain/Step": 3591, "Full-pretrain/Step Time": 17.597267361357808} +{"Full-pretrain/Learning Rate": 3.5828511368635685e-05, "Full-pretrain/Loss": 1.9782763719558716, "Full-pretrain/Loss (Raw)": 1.8311634063720703, "Full-pretrain/Step": 3592, "Full-pretrain/Step Time": 17.606523158028722} +{"Full-pretrain/Learning Rate": 3.5820857769888944e-05, "Full-pretrain/Loss": 1.9674081802368164, "Full-pretrain/Loss (Raw)": 1.7571295499801636, "Full-pretrain/Step": 3593, "Full-pretrain/Step Time": 17.60292582027614} +{"Full-pretrain/Learning Rate": 3.5813202922960056e-05, "Full-pretrain/Loss": 1.9502911567687988, "Full-pretrain/Loss (Raw)": 1.6550171375274658, "Full-pretrain/Step": 3594, "Full-pretrain/Step Time": 17.601917922496796} +{"Full-pretrain/Learning Rate": 3.5805546828732015e-05, "Full-pretrain/Loss": 1.9518439769744873, "Full-pretrain/Loss (Raw)": 2.1469311714172363, "Full-pretrain/Step": 3595, "Full-pretrain/Step Time": 17.598147958517075} +{"Full-pretrain/Learning Rate": 3.5797889488087945e-05, "Full-pretrain/Loss": 1.9620990753173828, "Full-pretrain/Loss (Raw)": 2.1080894470214844, "Full-pretrain/Step": 3596, "Full-pretrain/Step Time": 17.608204163610935} +{"Full-pretrain/Learning Rate": 3.579023090191112e-05, "Full-pretrain/Loss": 1.9623066186904907, "Full-pretrain/Loss (Raw)": 1.9536463022232056, "Full-pretrain/Step": 3597, "Full-pretrain/Step Time": 17.607735786587} +{"Full-pretrain/Learning Rate": 3.578257107108494e-05, "Full-pretrain/Loss": 1.955167293548584, "Full-pretrain/Loss (Raw)": 1.884013056755066, "Full-pretrain/Step": 3598, "Full-pretrain/Step Time": 17.600948248058558} +{"Full-pretrain/Learning Rate": 3.577490999649298e-05, "Full-pretrain/Loss": 1.9570865631103516, "Full-pretrain/Loss (Raw)": 1.9409992694854736, "Full-pretrain/Step": 3599, "Full-pretrain/Step Time": 17.600615676492453} +{"Full-pretrain/Learning Rate": 3.576724767901895e-05, "Full-pretrain/Loss": 1.960767149925232, "Full-pretrain/Loss (Raw)": 2.0455429553985596, "Full-pretrain/Step": 3600, "Full-pretrain/Step Time": 17.604407515376806} +{"Full-pretrain/Learning Rate": 3.575958411954668e-05, "Full-pretrain/Loss": 1.9661109447479248, "Full-pretrain/Loss (Raw)": 2.2118756771087646, "Full-pretrain/Step": 3601, "Full-pretrain/Step Time": 17.60016394034028} +{"Full-pretrain/Learning Rate": 3.575191931896016e-05, "Full-pretrain/Loss": 1.9679735898971558, "Full-pretrain/Loss (Raw)": 2.0194737911224365, "Full-pretrain/Step": 3602, "Full-pretrain/Step Time": 17.594461910426617} +{"Full-pretrain/Learning Rate": 3.574425327814352e-05, "Full-pretrain/Loss": 1.9610589742660522, "Full-pretrain/Loss (Raw)": 2.096219062805176, "Full-pretrain/Step": 3603, "Full-pretrain/Step Time": 17.601240498945117} +{"Full-pretrain/Learning Rate": 3.573658599798105e-05, "Full-pretrain/Loss": 1.9627147912979126, "Full-pretrain/Loss (Raw)": 2.0296554565429688, "Full-pretrain/Step": 3604, "Full-pretrain/Step Time": 17.60317644290626} +{"Full-pretrain/Learning Rate": 3.572891747935716e-05, "Full-pretrain/Loss": 1.970858097076416, "Full-pretrain/Loss (Raw)": 2.1305899620056152, "Full-pretrain/Step": 3605, "Full-pretrain/Step Time": 17.60054382868111} +{"Full-pretrain/Learning Rate": 3.572124772315639e-05, "Full-pretrain/Loss": 1.9662920236587524, "Full-pretrain/Loss (Raw)": 1.8030086755752563, "Full-pretrain/Step": 3606, "Full-pretrain/Step Time": 17.602674717083573} +{"Full-pretrain/Learning Rate": 3.5713576730263476e-05, "Full-pretrain/Loss": 1.9720079898834229, "Full-pretrain/Loss (Raw)": 2.075747489929199, "Full-pretrain/Step": 3607, "Full-pretrain/Step Time": 17.605665067210793} +{"Full-pretrain/Learning Rate": 3.570590450156325e-05, "Full-pretrain/Loss": 1.969871997833252, "Full-pretrain/Loss (Raw)": 1.7457548379898071, "Full-pretrain/Step": 3608, "Full-pretrain/Step Time": 17.60540514998138} +{"Full-pretrain/Learning Rate": 3.569823103794071e-05, "Full-pretrain/Loss": 1.9649298191070557, "Full-pretrain/Loss (Raw)": 1.9867249727249146, "Full-pretrain/Step": 3609, "Full-pretrain/Step Time": 17.60478206910193} +{"Full-pretrain/Learning Rate": 3.5690556340280965e-05, "Full-pretrain/Loss": 1.9575412273406982, "Full-pretrain/Loss (Raw)": 2.0470728874206543, "Full-pretrain/Step": 3610, "Full-pretrain/Step Time": 17.606321757659316} +{"Full-pretrain/Learning Rate": 3.5682880409469315e-05, "Full-pretrain/Loss": 1.9595372676849365, "Full-pretrain/Loss (Raw)": 1.7996132373809814, "Full-pretrain/Step": 3611, "Full-pretrain/Step Time": 17.609338361769915} +{"Full-pretrain/Learning Rate": 3.567520324639116e-05, "Full-pretrain/Loss": 1.9586883783340454, "Full-pretrain/Loss (Raw)": 1.9525831937789917, "Full-pretrain/Step": 3612, "Full-pretrain/Step Time": 17.598018733784556} +{"Full-pretrain/Learning Rate": 3.5667524851932066e-05, "Full-pretrain/Loss": 1.9601821899414062, "Full-pretrain/Loss (Raw)": 1.8856807947158813, "Full-pretrain/Step": 3613, "Full-pretrain/Step Time": 17.60165799036622} +{"Full-pretrain/Learning Rate": 3.5659845226977715e-05, "Full-pretrain/Loss": 1.9639533758163452, "Full-pretrain/Loss (Raw)": 2.2210025787353516, "Full-pretrain/Step": 3614, "Full-pretrain/Step Time": 17.598533302545547} +{"Full-pretrain/Learning Rate": 3.565216437241398e-05, "Full-pretrain/Loss": 1.9638562202453613, "Full-pretrain/Loss (Raw)": 2.2852487564086914, "Full-pretrain/Step": 3615, "Full-pretrain/Step Time": 17.595873897895217} +{"Full-pretrain/Learning Rate": 3.564448228912682e-05, "Full-pretrain/Loss": 1.9628219604492188, "Full-pretrain/Loss (Raw)": 1.694830060005188, "Full-pretrain/Step": 3616, "Full-pretrain/Step Time": 17.599282909184694} +{"Full-pretrain/Learning Rate": 3.563679897800237e-05, "Full-pretrain/Loss": 1.9579377174377441, "Full-pretrain/Loss (Raw)": 1.7299220561981201, "Full-pretrain/Step": 3617, "Full-pretrain/Step Time": 17.60042509995401} +{"Full-pretrain/Learning Rate": 3.5629114439926896e-05, "Full-pretrain/Loss": 1.9593983888626099, "Full-pretrain/Loss (Raw)": 1.9688185453414917, "Full-pretrain/Step": 3618, "Full-pretrain/Step Time": 17.594684276729822} +{"Full-pretrain/Learning Rate": 3.5621428675786806e-05, "Full-pretrain/Loss": 1.9556021690368652, "Full-pretrain/Loss (Raw)": 1.8982863426208496, "Full-pretrain/Step": 3619, "Full-pretrain/Step Time": 17.59452644176781} +{"Full-pretrain/Learning Rate": 3.561374168646865e-05, "Full-pretrain/Loss": 1.957059383392334, "Full-pretrain/Loss (Raw)": 2.008375406265259, "Full-pretrain/Step": 3620, "Full-pretrain/Step Time": 17.598045829683542} +{"Full-pretrain/Learning Rate": 3.560605347285913e-05, "Full-pretrain/Loss": 1.9657824039459229, "Full-pretrain/Loss (Raw)": 1.9352188110351562, "Full-pretrain/Step": 3621, "Full-pretrain/Step Time": 17.59770553931594} +{"Full-pretrain/Learning Rate": 3.559836403584505e-05, "Full-pretrain/Loss": 1.9639118909835815, "Full-pretrain/Loss (Raw)": 2.038147449493408, "Full-pretrain/Step": 3622, "Full-pretrain/Step Time": 17.598160644993186} +{"Full-pretrain/Learning Rate": 3.559067337631341e-05, "Full-pretrain/Loss": 1.966296911239624, "Full-pretrain/Loss (Raw)": 2.0351176261901855, "Full-pretrain/Step": 3623, "Full-pretrain/Step Time": 17.59920441545546} +{"Full-pretrain/Learning Rate": 3.558298149515133e-05, "Full-pretrain/Loss": 1.9743610620498657, "Full-pretrain/Loss (Raw)": 2.089221239089966, "Full-pretrain/Step": 3624, "Full-pretrain/Step Time": 17.593832712620497} +{"Full-pretrain/Learning Rate": 3.557528839324604e-05, "Full-pretrain/Loss": 1.9856607913970947, "Full-pretrain/Loss (Raw)": 2.1187222003936768, "Full-pretrain/Step": 3625, "Full-pretrain/Step Time": 17.599543856456876} +{"Full-pretrain/Learning Rate": 3.556759407148496e-05, "Full-pretrain/Loss": 1.9939615726470947, "Full-pretrain/Loss (Raw)": 1.9206407070159912, "Full-pretrain/Step": 3626, "Full-pretrain/Step Time": 17.5983365457505} +{"Full-pretrain/Learning Rate": 3.555989853075561e-05, "Full-pretrain/Loss": 1.9817163944244385, "Full-pretrain/Loss (Raw)": 1.755081295967102, "Full-pretrain/Step": 3627, "Full-pretrain/Step Time": 17.59574244916439} +{"Full-pretrain/Learning Rate": 3.5552201771945676e-05, "Full-pretrain/Loss": 1.9890191555023193, "Full-pretrain/Loss (Raw)": 2.3417820930480957, "Full-pretrain/Step": 3628, "Full-pretrain/Step Time": 17.593726525083184} +{"Full-pretrain/Learning Rate": 3.554450379594298e-05, "Full-pretrain/Loss": 1.994794487953186, "Full-pretrain/Loss (Raw)": 2.1384572982788086, "Full-pretrain/Step": 3629, "Full-pretrain/Step Time": 17.595274152234197} +{"Full-pretrain/Learning Rate": 3.5536804603635474e-05, "Full-pretrain/Loss": 1.995922565460205, "Full-pretrain/Loss (Raw)": 1.920108675956726, "Full-pretrain/Step": 3630, "Full-pretrain/Step Time": 17.59798738360405} +{"Full-pretrain/Learning Rate": 3.5529104195911256e-05, "Full-pretrain/Loss": 1.99422287940979, "Full-pretrain/Loss (Raw)": 1.8866108655929565, "Full-pretrain/Step": 3631, "Full-pretrain/Step Time": 17.59839392825961} +{"Full-pretrain/Learning Rate": 3.552140257365858e-05, "Full-pretrain/Loss": 1.9892399311065674, "Full-pretrain/Loss (Raw)": 1.8860865831375122, "Full-pretrain/Step": 3632, "Full-pretrain/Step Time": 17.590562535449862} +{"Full-pretrain/Learning Rate": 3.551369973776581e-05, "Full-pretrain/Loss": 1.9786018133163452, "Full-pretrain/Loss (Raw)": 1.8714563846588135, "Full-pretrain/Step": 3633, "Full-pretrain/Step Time": 17.59324269928038} +{"Full-pretrain/Learning Rate": 3.550599568912148e-05, "Full-pretrain/Loss": 1.9864215850830078, "Full-pretrain/Loss (Raw)": 2.2697064876556396, "Full-pretrain/Step": 3634, "Full-pretrain/Step Time": 17.595020089298487} +{"Full-pretrain/Learning Rate": 3.5498290428614214e-05, "Full-pretrain/Loss": 1.9796885251998901, "Full-pretrain/Loss (Raw)": 1.8807616233825684, "Full-pretrain/Step": 3635, "Full-pretrain/Step Time": 17.59870418906212} +{"Full-pretrain/Learning Rate": 3.549058395713285e-05, "Full-pretrain/Loss": 1.9736661911010742, "Full-pretrain/Loss (Raw)": 1.8369382619857788, "Full-pretrain/Step": 3636, "Full-pretrain/Step Time": 17.592270901426673} +{"Full-pretrain/Learning Rate": 3.548287627556632e-05, "Full-pretrain/Loss": 1.9719374179840088, "Full-pretrain/Loss (Raw)": 2.0752711296081543, "Full-pretrain/Step": 3637, "Full-pretrain/Step Time": 17.599428080022335} +{"Full-pretrain/Learning Rate": 3.5475167384803685e-05, "Full-pretrain/Loss": 1.9841463565826416, "Full-pretrain/Loss (Raw)": 2.193695545196533, "Full-pretrain/Step": 3638, "Full-pretrain/Step Time": 17.597745837643743} +{"Full-pretrain/Learning Rate": 3.546745728573418e-05, "Full-pretrain/Loss": 1.9778162240982056, "Full-pretrain/Loss (Raw)": 1.873178482055664, "Full-pretrain/Step": 3639, "Full-pretrain/Step Time": 17.60067167505622} +{"Full-pretrain/Learning Rate": 3.545974597924715e-05, "Full-pretrain/Loss": 1.9839838743209839, "Full-pretrain/Loss (Raw)": 1.9431241750717163, "Full-pretrain/Step": 3640, "Full-pretrain/Step Time": 17.597477715462446} +{"Full-pretrain/Learning Rate": 3.54520334662321e-05, "Full-pretrain/Loss": 1.9788800477981567, "Full-pretrain/Loss (Raw)": 1.8233996629714966, "Full-pretrain/Step": 3641, "Full-pretrain/Step Time": 17.598215125501156} +{"Full-pretrain/Learning Rate": 3.544431974757866e-05, "Full-pretrain/Loss": 1.9737571477890015, "Full-pretrain/Loss (Raw)": 1.8831405639648438, "Full-pretrain/Step": 3642, "Full-pretrain/Step Time": 17.595240959897637} +{"Full-pretrain/Learning Rate": 3.543660482417662e-05, "Full-pretrain/Loss": 1.9832279682159424, "Full-pretrain/Loss (Raw)": 2.1026768684387207, "Full-pretrain/Step": 3643, "Full-pretrain/Step Time": 17.587708262726665} +{"Full-pretrain/Learning Rate": 3.542888869691586e-05, "Full-pretrain/Loss": 1.9871597290039062, "Full-pretrain/Loss (Raw)": 2.078401803970337, "Full-pretrain/Step": 3644, "Full-pretrain/Step Time": 17.58979855850339} +{"Full-pretrain/Learning Rate": 3.542117136668647e-05, "Full-pretrain/Loss": 1.979745626449585, "Full-pretrain/Loss (Raw)": 1.6484273672103882, "Full-pretrain/Step": 3645, "Full-pretrain/Step Time": 17.593080163002014} +{"Full-pretrain/Learning Rate": 3.5413452834378625e-05, "Full-pretrain/Loss": 1.9668855667114258, "Full-pretrain/Loss (Raw)": 1.8094816207885742, "Full-pretrain/Step": 3646, "Full-pretrain/Step Time": 17.59129604883492} +{"Full-pretrain/Learning Rate": 3.5405733100882657e-05, "Full-pretrain/Loss": 1.9593403339385986, "Full-pretrain/Loss (Raw)": 2.04380464553833, "Full-pretrain/Step": 3647, "Full-pretrain/Step Time": 17.595376858487725} +{"Full-pretrain/Learning Rate": 3.5398012167089014e-05, "Full-pretrain/Loss": 1.9617197513580322, "Full-pretrain/Loss (Raw)": 1.7709710597991943, "Full-pretrain/Step": 3648, "Full-pretrain/Step Time": 17.598535165190697} +{"Full-pretrain/Learning Rate": 3.5390290033888336e-05, "Full-pretrain/Loss": 1.9763247966766357, "Full-pretrain/Loss (Raw)": 2.1972811222076416, "Full-pretrain/Step": 3649, "Full-pretrain/Step Time": 17.59236839413643} +{"Full-pretrain/Learning Rate": 3.5382566702171356e-05, "Full-pretrain/Loss": 1.9858105182647705, "Full-pretrain/Loss (Raw)": 2.2723655700683594, "Full-pretrain/Step": 3650, "Full-pretrain/Step Time": 17.596661610528827} +{"Full-pretrain/Learning Rate": 3.5374842172828955e-05, "Full-pretrain/Loss": 1.983371376991272, "Full-pretrain/Loss (Raw)": 1.8202321529388428, "Full-pretrain/Step": 3651, "Full-pretrain/Step Time": 17.59807302057743} +{"Full-pretrain/Learning Rate": 3.5367116446752145e-05, "Full-pretrain/Loss": 1.9813841581344604, "Full-pretrain/Loss (Raw)": 1.9447848796844482, "Full-pretrain/Step": 3652, "Full-pretrain/Step Time": 17.605283584445715} +{"Full-pretrain/Learning Rate": 3.535938952483211e-05, "Full-pretrain/Loss": 1.9887540340423584, "Full-pretrain/Loss (Raw)": 2.1710526943206787, "Full-pretrain/Step": 3653, "Full-pretrain/Step Time": 17.602530578151345} +{"Full-pretrain/Learning Rate": 3.5351661407960126e-05, "Full-pretrain/Loss": 1.9871881008148193, "Full-pretrain/Loss (Raw)": 1.988037109375, "Full-pretrain/Step": 3654, "Full-pretrain/Step Time": 17.60576487518847} +{"Full-pretrain/Learning Rate": 3.534393209702764e-05, "Full-pretrain/Loss": 1.9765249490737915, "Full-pretrain/Loss (Raw)": 1.6938990354537964, "Full-pretrain/Step": 3655, "Full-pretrain/Step Time": 17.60727916844189} +{"Full-pretrain/Learning Rate": 3.533620159292621e-05, "Full-pretrain/Loss": 1.9809319972991943, "Full-pretrain/Loss (Raw)": 2.2302472591400146, "Full-pretrain/Step": 3656, "Full-pretrain/Step Time": 17.611712550744414} +{"Full-pretrain/Learning Rate": 3.532846989654757e-05, "Full-pretrain/Loss": 1.971923828125, "Full-pretrain/Loss (Raw)": 1.830458402633667, "Full-pretrain/Step": 3657, "Full-pretrain/Step Time": 17.60778704471886} +{"Full-pretrain/Learning Rate": 3.532073700878355e-05, "Full-pretrain/Loss": 1.975274920463562, "Full-pretrain/Loss (Raw)": 2.0278737545013428, "Full-pretrain/Step": 3658, "Full-pretrain/Step Time": 17.607584670186043} +{"Full-pretrain/Learning Rate": 3.5313002930526155e-05, "Full-pretrain/Loss": 1.9743057489395142, "Full-pretrain/Loss (Raw)": 1.724071979522705, "Full-pretrain/Step": 3659, "Full-pretrain/Step Time": 17.614506667479873} +{"Full-pretrain/Learning Rate": 3.5305267662667484e-05, "Full-pretrain/Loss": 1.96295166015625, "Full-pretrain/Loss (Raw)": 1.9784517288208008, "Full-pretrain/Step": 3660, "Full-pretrain/Step Time": 17.61240189895034} +{"Full-pretrain/Learning Rate": 3.529753120609982e-05, "Full-pretrain/Loss": 1.9672755002975464, "Full-pretrain/Loss (Raw)": 2.276818037033081, "Full-pretrain/Step": 3661, "Full-pretrain/Step Time": 17.612735772505403} +{"Full-pretrain/Learning Rate": 3.528979356171555e-05, "Full-pretrain/Loss": 1.9702074527740479, "Full-pretrain/Loss (Raw)": 2.013932228088379, "Full-pretrain/Step": 3662, "Full-pretrain/Step Time": 17.607690580189228} +{"Full-pretrain/Learning Rate": 3.5282054730407196e-05, "Full-pretrain/Loss": 1.9781105518341064, "Full-pretrain/Loss (Raw)": 2.1395068168640137, "Full-pretrain/Step": 3663, "Full-pretrain/Step Time": 17.616631995886564} +{"Full-pretrain/Learning Rate": 3.527431471306745e-05, "Full-pretrain/Loss": 1.9782211780548096, "Full-pretrain/Loss (Raw)": 1.889626383781433, "Full-pretrain/Step": 3664, "Full-pretrain/Step Time": 17.613937186077237} +{"Full-pretrain/Learning Rate": 3.5266573510589114e-05, "Full-pretrain/Loss": 1.9785246849060059, "Full-pretrain/Loss (Raw)": 1.8811711072921753, "Full-pretrain/Step": 3665, "Full-pretrain/Step Time": 17.615119544789195} +{"Full-pretrain/Learning Rate": 3.525883112386513e-05, "Full-pretrain/Loss": 1.9693608283996582, "Full-pretrain/Loss (Raw)": 1.9764641523361206, "Full-pretrain/Step": 3666, "Full-pretrain/Step Time": 17.60800044052303} +{"Full-pretrain/Learning Rate": 3.5251087553788586e-05, "Full-pretrain/Loss": 1.9697070121765137, "Full-pretrain/Loss (Raw)": 1.891836404800415, "Full-pretrain/Step": 3667, "Full-pretrain/Step Time": 17.611886715516448} +{"Full-pretrain/Learning Rate": 3.524334280125269e-05, "Full-pretrain/Loss": 1.9727492332458496, "Full-pretrain/Loss (Raw)": 1.934289574623108, "Full-pretrain/Step": 3668, "Full-pretrain/Step Time": 17.610127978026867} +{"Full-pretrain/Learning Rate": 3.52355968671508e-05, "Full-pretrain/Loss": 1.9595005512237549, "Full-pretrain/Loss (Raw)": 1.6513147354125977, "Full-pretrain/Step": 3669, "Full-pretrain/Step Time": 17.61467053554952} +{"Full-pretrain/Learning Rate": 3.522784975237641e-05, "Full-pretrain/Loss": 1.9553800821304321, "Full-pretrain/Loss (Raw)": 2.0618395805358887, "Full-pretrain/Step": 3670, "Full-pretrain/Step Time": 17.61949289776385} +{"Full-pretrain/Learning Rate": 3.5220101457823146e-05, "Full-pretrain/Loss": 1.9553941488265991, "Full-pretrain/Loss (Raw)": 1.873626470565796, "Full-pretrain/Step": 3671, "Full-pretrain/Step Time": 17.620847713202238} +{"Full-pretrain/Learning Rate": 3.521235198438477e-05, "Full-pretrain/Loss": 1.9626182317733765, "Full-pretrain/Loss (Raw)": 2.1742959022521973, "Full-pretrain/Step": 3672, "Full-pretrain/Step Time": 17.61817497573793} +{"Full-pretrain/Learning Rate": 3.520460133295518e-05, "Full-pretrain/Loss": 1.97080659866333, "Full-pretrain/Loss (Raw)": 2.085428237915039, "Full-pretrain/Step": 3673, "Full-pretrain/Step Time": 17.619959583505988} +{"Full-pretrain/Learning Rate": 3.519684950442841e-05, "Full-pretrain/Loss": 1.9743833541870117, "Full-pretrain/Loss (Raw)": 1.9975980520248413, "Full-pretrain/Step": 3674, "Full-pretrain/Step Time": 17.617149002850056} +{"Full-pretrain/Learning Rate": 3.5189096499698645e-05, "Full-pretrain/Loss": 1.9702255725860596, "Full-pretrain/Loss (Raw)": 1.9696277379989624, "Full-pretrain/Step": 3675, "Full-pretrain/Step Time": 17.610513485968113} +{"Full-pretrain/Learning Rate": 3.518134231966017e-05, "Full-pretrain/Loss": 1.9661457538604736, "Full-pretrain/Loss (Raw)": 1.947847843170166, "Full-pretrain/Step": 3676, "Full-pretrain/Step Time": 17.619208127260208} +{"Full-pretrain/Learning Rate": 3.517358696520744e-05, "Full-pretrain/Loss": 1.9812345504760742, "Full-pretrain/Loss (Raw)": 2.1312661170959473, "Full-pretrain/Step": 3677, "Full-pretrain/Step Time": 17.61716710962355} +{"Full-pretrain/Learning Rate": 3.516583043723502e-05, "Full-pretrain/Loss": 1.9889276027679443, "Full-pretrain/Loss (Raw)": 2.055666446685791, "Full-pretrain/Step": 3678, "Full-pretrain/Step Time": 17.614979101344943} +{"Full-pretrain/Learning Rate": 3.515807273663764e-05, "Full-pretrain/Loss": 1.9921748638153076, "Full-pretrain/Loss (Raw)": 2.1477150917053223, "Full-pretrain/Step": 3679, "Full-pretrain/Step Time": 17.615452332422137} +{"Full-pretrain/Learning Rate": 3.515031386431014e-05, "Full-pretrain/Loss": 1.9977436065673828, "Full-pretrain/Loss (Raw)": 1.9491697549819946, "Full-pretrain/Step": 3680, "Full-pretrain/Step Time": 17.618607008829713} +{"Full-pretrain/Learning Rate": 3.5142553821147494e-05, "Full-pretrain/Loss": 1.995171308517456, "Full-pretrain/Loss (Raw)": 2.1149682998657227, "Full-pretrain/Step": 3681, "Full-pretrain/Step Time": 17.62125193886459} +{"Full-pretrain/Learning Rate": 3.513479260804484e-05, "Full-pretrain/Loss": 1.9844026565551758, "Full-pretrain/Loss (Raw)": 1.9277682304382324, "Full-pretrain/Step": 3682, "Full-pretrain/Step Time": 17.62317741289735} +{"Full-pretrain/Learning Rate": 3.512703022589741e-05, "Full-pretrain/Loss": 1.9856717586517334, "Full-pretrain/Loss (Raw)": 1.8608412742614746, "Full-pretrain/Step": 3683, "Full-pretrain/Step Time": 17.626032639294863} +{"Full-pretrain/Learning Rate": 3.5119266675600615e-05, "Full-pretrain/Loss": 1.9898959398269653, "Full-pretrain/Loss (Raw)": 2.0799591541290283, "Full-pretrain/Step": 3684, "Full-pretrain/Step Time": 17.62037735246122} +{"Full-pretrain/Learning Rate": 3.511150195804996e-05, "Full-pretrain/Loss": 1.9731478691101074, "Full-pretrain/Loss (Raw)": 1.635116457939148, "Full-pretrain/Step": 3685, "Full-pretrain/Step Time": 17.62965644709766} +{"Full-pretrain/Learning Rate": 3.5103736074141105e-05, "Full-pretrain/Loss": 1.9731800556182861, "Full-pretrain/Loss (Raw)": 1.9890632629394531, "Full-pretrain/Step": 3686, "Full-pretrain/Step Time": 17.620465291664004} +{"Full-pretrain/Learning Rate": 3.5095969024769845e-05, "Full-pretrain/Loss": 1.97992742061615, "Full-pretrain/Loss (Raw)": 1.909815788269043, "Full-pretrain/Step": 3687, "Full-pretrain/Step Time": 17.61857285350561} +{"Full-pretrain/Learning Rate": 3.508820081083211e-05, "Full-pretrain/Loss": 1.9731305837631226, "Full-pretrain/Loss (Raw)": 2.0127475261688232, "Full-pretrain/Step": 3688, "Full-pretrain/Step Time": 17.61373119801283} +{"Full-pretrain/Learning Rate": 3.508043143322395e-05, "Full-pretrain/Loss": 1.977563500404358, "Full-pretrain/Loss (Raw)": 1.9723122119903564, "Full-pretrain/Step": 3689, "Full-pretrain/Step Time": 17.618006952106953} +{"Full-pretrain/Learning Rate": 3.507266089284157e-05, "Full-pretrain/Loss": 1.9745299816131592, "Full-pretrain/Loss (Raw)": 1.9308007955551147, "Full-pretrain/Step": 3690, "Full-pretrain/Step Time": 17.617555553093553} +{"Full-pretrain/Learning Rate": 3.506488919058129e-05, "Full-pretrain/Loss": 1.9888532161712646, "Full-pretrain/Loss (Raw)": 2.1824162006378174, "Full-pretrain/Step": 3691, "Full-pretrain/Step Time": 17.612000036984682} +{"Full-pretrain/Learning Rate": 3.505711632733959e-05, "Full-pretrain/Loss": 1.9808404445648193, "Full-pretrain/Loss (Raw)": 1.7220460176467896, "Full-pretrain/Step": 3692, "Full-pretrain/Step Time": 17.608226282522082} +{"Full-pretrain/Learning Rate": 3.504934230401305e-05, "Full-pretrain/Loss": 1.9699640274047852, "Full-pretrain/Loss (Raw)": 1.928770661354065, "Full-pretrain/Step": 3693, "Full-pretrain/Step Time": 17.60506551153958} +{"Full-pretrain/Learning Rate": 3.504156712149841e-05, "Full-pretrain/Loss": 1.969794750213623, "Full-pretrain/Loss (Raw)": 2.008516550064087, "Full-pretrain/Step": 3694, "Full-pretrain/Step Time": 17.605489348992705} +{"Full-pretrain/Learning Rate": 3.503379078069253e-05, "Full-pretrain/Loss": 1.96187424659729, "Full-pretrain/Loss (Raw)": 1.8860527276992798, "Full-pretrain/Step": 3695, "Full-pretrain/Step Time": 17.607990335673094} +{"Full-pretrain/Learning Rate": 3.50260132824924e-05, "Full-pretrain/Loss": 1.970017671585083, "Full-pretrain/Loss (Raw)": 2.150209903717041, "Full-pretrain/Step": 3696, "Full-pretrain/Step Time": 17.60393470339477} +{"Full-pretrain/Learning Rate": 3.5018234627795175e-05, "Full-pretrain/Loss": 1.9680627584457397, "Full-pretrain/Loss (Raw)": 1.8186190128326416, "Full-pretrain/Step": 3697, "Full-pretrain/Step Time": 17.605851002037525} +{"Full-pretrain/Learning Rate": 3.50104548174981e-05, "Full-pretrain/Loss": 1.9662597179412842, "Full-pretrain/Loss (Raw)": 1.9187610149383545, "Full-pretrain/Step": 3698, "Full-pretrain/Step Time": 17.60785538330674} +{"Full-pretrain/Learning Rate": 3.500267385249858e-05, "Full-pretrain/Loss": 1.9629532098770142, "Full-pretrain/Loss (Raw)": 1.7860333919525146, "Full-pretrain/Step": 3699, "Full-pretrain/Step Time": 17.606316417455673} +{"Full-pretrain/Learning Rate": 3.4994891733694147e-05, "Full-pretrain/Loss": 1.9651925563812256, "Full-pretrain/Loss (Raw)": 2.005943536758423, "Full-pretrain/Step": 3700, "Full-pretrain/Step Time": 17.60814535059035} +{"Full-pretrain/Learning Rate": 3.4987108461982474e-05, "Full-pretrain/Loss": 1.9688985347747803, "Full-pretrain/Loss (Raw)": 1.769914150238037, "Full-pretrain/Step": 3701, "Full-pretrain/Step Time": 17.608548747375607} +{"Full-pretrain/Learning Rate": 3.497932403826133e-05, "Full-pretrain/Loss": 1.9748644828796387, "Full-pretrain/Loss (Raw)": 2.252741575241089, "Full-pretrain/Step": 3702, "Full-pretrain/Step Time": 17.605222560465336} +{"Full-pretrain/Learning Rate": 3.497153846342868e-05, "Full-pretrain/Loss": 1.9842517375946045, "Full-pretrain/Loss (Raw)": 2.1740245819091797, "Full-pretrain/Step": 3703, "Full-pretrain/Step Time": 17.599739896133542} +{"Full-pretrain/Learning Rate": 3.4963751738382566e-05, "Full-pretrain/Loss": 1.9801911115646362, "Full-pretrain/Loss (Raw)": 2.0443530082702637, "Full-pretrain/Step": 3704, "Full-pretrain/Step Time": 17.601978950202465} +{"Full-pretrain/Learning Rate": 3.49559638640212e-05, "Full-pretrain/Loss": 1.9742786884307861, "Full-pretrain/Loss (Raw)": 1.896233320236206, "Full-pretrain/Step": 3705, "Full-pretrain/Step Time": 17.6058615334332} +{"Full-pretrain/Learning Rate": 3.494817484124289e-05, "Full-pretrain/Loss": 1.9708678722381592, "Full-pretrain/Loss (Raw)": 1.8884475231170654, "Full-pretrain/Step": 3706, "Full-pretrain/Step Time": 17.601950719952583} +{"Full-pretrain/Learning Rate": 3.4940384670946105e-05, "Full-pretrain/Loss": 1.9729957580566406, "Full-pretrain/Loss (Raw)": 2.0377254486083984, "Full-pretrain/Step": 3707, "Full-pretrain/Step Time": 17.593494130298495} +{"Full-pretrain/Learning Rate": 3.4932593354029454e-05, "Full-pretrain/Loss": 1.973780632019043, "Full-pretrain/Loss (Raw)": 1.9729640483856201, "Full-pretrain/Step": 3708, "Full-pretrain/Step Time": 17.603526113554835} +{"Full-pretrain/Learning Rate": 3.4924800891391644e-05, "Full-pretrain/Loss": 1.9679561853408813, "Full-pretrain/Loss (Raw)": 1.9448792934417725, "Full-pretrain/Step": 3709, "Full-pretrain/Step Time": 17.60074833407998} +{"Full-pretrain/Learning Rate": 3.491700728393154e-05, "Full-pretrain/Loss": 1.9713706970214844, "Full-pretrain/Loss (Raw)": 2.1649317741394043, "Full-pretrain/Step": 3710, "Full-pretrain/Step Time": 17.597316805273294} +{"Full-pretrain/Learning Rate": 3.490921253254813e-05, "Full-pretrain/Loss": 1.9674994945526123, "Full-pretrain/Loss (Raw)": 2.023834228515625, "Full-pretrain/Step": 3711, "Full-pretrain/Step Time": 17.59602899849415} +{"Full-pretrain/Learning Rate": 3.4901416638140536e-05, "Full-pretrain/Loss": 1.9692331552505493, "Full-pretrain/Loss (Raw)": 2.0046494007110596, "Full-pretrain/Step": 3712, "Full-pretrain/Step Time": 17.596178341656923} +{"Full-pretrain/Learning Rate": 3.4893619601608017e-05, "Full-pretrain/Loss": 1.9637947082519531, "Full-pretrain/Loss (Raw)": 1.9409377574920654, "Full-pretrain/Step": 3713, "Full-pretrain/Step Time": 17.59567454084754} +{"Full-pretrain/Learning Rate": 3.488582142384995e-05, "Full-pretrain/Loss": 1.9632728099822998, "Full-pretrain/Loss (Raw)": 1.9110698699951172, "Full-pretrain/Step": 3714, "Full-pretrain/Step Time": 17.60008630156517} +{"Full-pretrain/Learning Rate": 3.4878022105765854e-05, "Full-pretrain/Loss": 1.9639763832092285, "Full-pretrain/Loss (Raw)": 1.883353352546692, "Full-pretrain/Step": 3715, "Full-pretrain/Step Time": 17.59387960098684} +{"Full-pretrain/Learning Rate": 3.487022164825538e-05, "Full-pretrain/Loss": 1.961327314376831, "Full-pretrain/Loss (Raw)": 1.995187759399414, "Full-pretrain/Step": 3716, "Full-pretrain/Step Time": 17.594786325469613} +{"Full-pretrain/Learning Rate": 3.4862420052218316e-05, "Full-pretrain/Loss": 1.9764968156814575, "Full-pretrain/Loss (Raw)": 2.120542287826538, "Full-pretrain/Step": 3717, "Full-pretrain/Step Time": 17.592602914199233} +{"Full-pretrain/Learning Rate": 3.485461731855456e-05, "Full-pretrain/Loss": 1.9666094779968262, "Full-pretrain/Loss (Raw)": 1.6726694107055664, "Full-pretrain/Step": 3718, "Full-pretrain/Step Time": 17.59160267189145} +{"Full-pretrain/Learning Rate": 3.484681344816416e-05, "Full-pretrain/Loss": 1.9627223014831543, "Full-pretrain/Loss (Raw)": 1.7854269742965698, "Full-pretrain/Step": 3719, "Full-pretrain/Step Time": 17.59450620599091} +{"Full-pretrain/Learning Rate": 3.483900844194728e-05, "Full-pretrain/Loss": 1.9595714807510376, "Full-pretrain/Loss (Raw)": 1.9119186401367188, "Full-pretrain/Step": 3720, "Full-pretrain/Step Time": 17.590095730498433} +{"Full-pretrain/Learning Rate": 3.483120230080425e-05, "Full-pretrain/Loss": 1.9543241262435913, "Full-pretrain/Loss (Raw)": 1.8043959140777588, "Full-pretrain/Step": 3721, "Full-pretrain/Step Time": 17.59169897250831} +{"Full-pretrain/Learning Rate": 3.482339502563547e-05, "Full-pretrain/Loss": 1.959374189376831, "Full-pretrain/Loss (Raw)": 2.092404365539551, "Full-pretrain/Step": 3722, "Full-pretrain/Step Time": 17.593577545136213} +{"Full-pretrain/Learning Rate": 3.481558661734153e-05, "Full-pretrain/Loss": 1.958388328552246, "Full-pretrain/Loss (Raw)": 2.1508660316467285, "Full-pretrain/Step": 3723, "Full-pretrain/Step Time": 17.59800899773836} +{"Full-pretrain/Learning Rate": 3.4807777076823137e-05, "Full-pretrain/Loss": 1.967214584350586, "Full-pretrain/Loss (Raw)": 2.004485845565796, "Full-pretrain/Step": 3724, "Full-pretrain/Step Time": 17.59203039482236} +{"Full-pretrain/Learning Rate": 3.4799966404981095e-05, "Full-pretrain/Loss": 1.96962571144104, "Full-pretrain/Loss (Raw)": 2.0059289932250977, "Full-pretrain/Step": 3725, "Full-pretrain/Step Time": 17.58948642015457} +{"Full-pretrain/Learning Rate": 3.479215460271637e-05, "Full-pretrain/Loss": 1.9634124040603638, "Full-pretrain/Loss (Raw)": 1.8096911907196045, "Full-pretrain/Step": 3726, "Full-pretrain/Step Time": 17.59403664059937} +{"Full-pretrain/Learning Rate": 3.4784341670930065e-05, "Full-pretrain/Loss": 1.9644254446029663, "Full-pretrain/Loss (Raw)": 1.9184703826904297, "Full-pretrain/Step": 3727, "Full-pretrain/Step Time": 17.589234145358205} +{"Full-pretrain/Learning Rate": 3.477652761052338e-05, "Full-pretrain/Loss": 1.9577805995941162, "Full-pretrain/Loss (Raw)": 1.9375767707824707, "Full-pretrain/Step": 3728, "Full-pretrain/Step Time": 17.5903063621372} +{"Full-pretrain/Learning Rate": 3.476871242239767e-05, "Full-pretrain/Loss": 1.9589418172836304, "Full-pretrain/Loss (Raw)": 1.8557770252227783, "Full-pretrain/Step": 3729, "Full-pretrain/Step Time": 17.5889329072088} +{"Full-pretrain/Learning Rate": 3.4760896107454414e-05, "Full-pretrain/Loss": 1.9530287981033325, "Full-pretrain/Loss (Raw)": 1.7295430898666382, "Full-pretrain/Step": 3730, "Full-pretrain/Step Time": 17.59380493685603} +{"Full-pretrain/Learning Rate": 3.4753078666595215e-05, "Full-pretrain/Loss": 1.9567770957946777, "Full-pretrain/Loss (Raw)": 1.9059813022613525, "Full-pretrain/Step": 3731, "Full-pretrain/Step Time": 17.58906150609255} +{"Full-pretrain/Learning Rate": 3.474526010072183e-05, "Full-pretrain/Loss": 1.9613453149795532, "Full-pretrain/Loss (Raw)": 2.152122974395752, "Full-pretrain/Step": 3732, "Full-pretrain/Step Time": 17.59282346814871} +{"Full-pretrain/Learning Rate": 3.473744041073611e-05, "Full-pretrain/Loss": 1.9826011657714844, "Full-pretrain/Loss (Raw)": 2.450101375579834, "Full-pretrain/Step": 3733, "Full-pretrain/Step Time": 17.595197658985853} +{"Full-pretrain/Learning Rate": 3.472961959754007e-05, "Full-pretrain/Loss": 1.9760020971298218, "Full-pretrain/Loss (Raw)": 2.0415728092193604, "Full-pretrain/Step": 3734, "Full-pretrain/Step Time": 17.59195340052247} +{"Full-pretrain/Learning Rate": 3.4721797662035824e-05, "Full-pretrain/Loss": 1.968560814857483, "Full-pretrain/Loss (Raw)": 1.9359043836593628, "Full-pretrain/Step": 3735, "Full-pretrain/Step Time": 17.591525856405497} +{"Full-pretrain/Learning Rate": 3.471397460512563e-05, "Full-pretrain/Loss": 1.962334156036377, "Full-pretrain/Loss (Raw)": 1.8451001644134521, "Full-pretrain/Step": 3736, "Full-pretrain/Step Time": 17.592111131176353} +{"Full-pretrain/Learning Rate": 3.4706150427711895e-05, "Full-pretrain/Loss": 1.9627853631973267, "Full-pretrain/Loss (Raw)": 1.9106694459915161, "Full-pretrain/Step": 3737, "Full-pretrain/Step Time": 17.594841500744224} +{"Full-pretrain/Learning Rate": 3.4698325130697104e-05, "Full-pretrain/Loss": 1.9675637483596802, "Full-pretrain/Loss (Raw)": 2.041358470916748, "Full-pretrain/Step": 3738, "Full-pretrain/Step Time": 17.590328752994537} +{"Full-pretrain/Learning Rate": 3.469049871498392e-05, "Full-pretrain/Loss": 1.9675004482269287, "Full-pretrain/Loss (Raw)": 2.035696506500244, "Full-pretrain/Step": 3739, "Full-pretrain/Step Time": 17.59052255190909} +{"Full-pretrain/Learning Rate": 3.4682671181475115e-05, "Full-pretrain/Loss": 1.9640109539031982, "Full-pretrain/Loss (Raw)": 1.8613059520721436, "Full-pretrain/Step": 3740, "Full-pretrain/Step Time": 17.598949747160077} +{"Full-pretrain/Learning Rate": 3.467484253107359e-05, "Full-pretrain/Loss": 1.9575029611587524, "Full-pretrain/Loss (Raw)": 1.736619234085083, "Full-pretrain/Step": 3741, "Full-pretrain/Step Time": 17.594559263437986} +{"Full-pretrain/Learning Rate": 3.466701276468238e-05, "Full-pretrain/Loss": 1.9496021270751953, "Full-pretrain/Loss (Raw)": 1.9121041297912598, "Full-pretrain/Step": 3742, "Full-pretrain/Step Time": 17.593915404751897} +{"Full-pretrain/Learning Rate": 3.465918188320465e-05, "Full-pretrain/Loss": 1.9530330896377563, "Full-pretrain/Loss (Raw)": 2.1336276531219482, "Full-pretrain/Step": 3743, "Full-pretrain/Step Time": 17.596031723544} +{"Full-pretrain/Learning Rate": 3.465134988754368e-05, "Full-pretrain/Loss": 1.9529027938842773, "Full-pretrain/Loss (Raw)": 2.0004801750183105, "Full-pretrain/Step": 3744, "Full-pretrain/Step Time": 17.595015358179808} +{"Full-pretrain/Learning Rate": 3.464351677860289e-05, "Full-pretrain/Loss": 1.955339789390564, "Full-pretrain/Loss (Raw)": 2.0189194679260254, "Full-pretrain/Step": 3745, "Full-pretrain/Step Time": 17.594513481482863} +{"Full-pretrain/Learning Rate": 3.4635682557285834e-05, "Full-pretrain/Loss": 1.955122947692871, "Full-pretrain/Loss (Raw)": 1.9041318893432617, "Full-pretrain/Step": 3746, "Full-pretrain/Step Time": 17.592439364641905} +{"Full-pretrain/Learning Rate": 3.462784722449617e-05, "Full-pretrain/Loss": 1.9543073177337646, "Full-pretrain/Loss (Raw)": 1.857254981994629, "Full-pretrain/Step": 3747, "Full-pretrain/Step Time": 17.592528449371457} +{"Full-pretrain/Learning Rate": 3.4620010781137726e-05, "Full-pretrain/Loss": 1.9551031589508057, "Full-pretrain/Loss (Raw)": 2.020653486251831, "Full-pretrain/Step": 3748, "Full-pretrain/Step Time": 17.59558708779514} +{"Full-pretrain/Learning Rate": 3.461217322811441e-05, "Full-pretrain/Loss": 1.9485461711883545, "Full-pretrain/Loss (Raw)": 1.9107187986373901, "Full-pretrain/Step": 3749, "Full-pretrain/Step Time": 17.59266434237361} +{"Full-pretrain/Learning Rate": 3.460433456633029e-05, "Full-pretrain/Loss": 1.9572583436965942, "Full-pretrain/Loss (Raw)": 1.9514559507369995, "Full-pretrain/Step": 3750, "Full-pretrain/Step Time": 17.58732113055885} +{"Full-pretrain/Learning Rate": 3.459649479668956e-05, "Full-pretrain/Loss": 1.9623751640319824, "Full-pretrain/Loss (Raw)": 1.9491684436798096, "Full-pretrain/Step": 3751, "Full-pretrain/Step Time": 17.58722907677293} +{"Full-pretrain/Learning Rate": 3.4588653920096526e-05, "Full-pretrain/Loss": 1.970107078552246, "Full-pretrain/Loss (Raw)": 2.159339427947998, "Full-pretrain/Step": 3752, "Full-pretrain/Step Time": 17.591986371204257} +{"Full-pretrain/Learning Rate": 3.4580811937455635e-05, "Full-pretrain/Loss": 1.9826345443725586, "Full-pretrain/Loss (Raw)": 2.205275535583496, "Full-pretrain/Step": 3753, "Full-pretrain/Step Time": 17.58553735911846} +{"Full-pretrain/Learning Rate": 3.457296884967144e-05, "Full-pretrain/Loss": 1.983109712600708, "Full-pretrain/Loss (Raw)": 2.1076087951660156, "Full-pretrain/Step": 3754, "Full-pretrain/Step Time": 17.588242933154106} +{"Full-pretrain/Learning Rate": 3.456512465764867e-05, "Full-pretrain/Loss": 1.9785325527191162, "Full-pretrain/Loss (Raw)": 2.0043997764587402, "Full-pretrain/Step": 3755, "Full-pretrain/Step Time": 17.581581311300397} +{"Full-pretrain/Learning Rate": 3.455727936229212e-05, "Full-pretrain/Loss": 1.9778931140899658, "Full-pretrain/Loss (Raw)": 1.9840185642242432, "Full-pretrain/Step": 3756, "Full-pretrain/Step Time": 17.583288721740246} +{"Full-pretrain/Learning Rate": 3.454943296450675e-05, "Full-pretrain/Loss": 1.9770313501358032, "Full-pretrain/Loss (Raw)": 1.978353500366211, "Full-pretrain/Step": 3757, "Full-pretrain/Step Time": 17.58481839671731} +{"Full-pretrain/Learning Rate": 3.454158546519766e-05, "Full-pretrain/Loss": 1.9771838188171387, "Full-pretrain/Loss (Raw)": 1.8145744800567627, "Full-pretrain/Step": 3758, "Full-pretrain/Step Time": 17.5853886641562} +{"Full-pretrain/Learning Rate": 3.453373686527003e-05, "Full-pretrain/Loss": 1.9798657894134521, "Full-pretrain/Loss (Raw)": 2.004291534423828, "Full-pretrain/Step": 3759, "Full-pretrain/Step Time": 17.578516390174627} +{"Full-pretrain/Learning Rate": 3.45258871656292e-05, "Full-pretrain/Loss": 1.9822909832000732, "Full-pretrain/Loss (Raw)": 2.0151846408843994, "Full-pretrain/Step": 3760, "Full-pretrain/Step Time": 17.583144841715693} +{"Full-pretrain/Learning Rate": 3.451803636718064e-05, "Full-pretrain/Loss": 1.9942139387130737, "Full-pretrain/Loss (Raw)": 2.2373077869415283, "Full-pretrain/Step": 3761, "Full-pretrain/Step Time": 17.584663225337863} +{"Full-pretrain/Learning Rate": 3.451018447082993e-05, "Full-pretrain/Loss": 2.0018162727355957, "Full-pretrain/Loss (Raw)": 1.9728169441223145, "Full-pretrain/Step": 3762, "Full-pretrain/Step Time": 17.582810247316957} +{"Full-pretrain/Learning Rate": 3.450233147748278e-05, "Full-pretrain/Loss": 1.9989819526672363, "Full-pretrain/Loss (Raw)": 1.8152873516082764, "Full-pretrain/Step": 3763, "Full-pretrain/Step Time": 17.575725842267275} +{"Full-pretrain/Learning Rate": 3.4494477388045035e-05, "Full-pretrain/Loss": 1.9942905902862549, "Full-pretrain/Loss (Raw)": 2.002002239227295, "Full-pretrain/Step": 3764, "Full-pretrain/Step Time": 17.578393392264843} +{"Full-pretrain/Learning Rate": 3.448662220342265e-05, "Full-pretrain/Loss": 1.9875729084014893, "Full-pretrain/Loss (Raw)": 2.2351346015930176, "Full-pretrain/Step": 3765, "Full-pretrain/Step Time": 17.57622329890728} +{"Full-pretrain/Learning Rate": 3.447876592452174e-05, "Full-pretrain/Loss": 1.980299472808838, "Full-pretrain/Loss (Raw)": 1.808819055557251, "Full-pretrain/Step": 3766, "Full-pretrain/Step Time": 17.574315689504147} +{"Full-pretrain/Learning Rate": 3.4470908552248504e-05, "Full-pretrain/Loss": 1.9838184118270874, "Full-pretrain/Loss (Raw)": 2.0485129356384277, "Full-pretrain/Step": 3767, "Full-pretrain/Step Time": 17.566643623635173} +{"Full-pretrain/Learning Rate": 3.44630500875093e-05, "Full-pretrain/Loss": 1.98838472366333, "Full-pretrain/Loss (Raw)": 1.9912195205688477, "Full-pretrain/Step": 3768, "Full-pretrain/Step Time": 17.570203026756644} +{"Full-pretrain/Learning Rate": 3.4455190531210595e-05, "Full-pretrain/Loss": 2.0016233921051025, "Full-pretrain/Loss (Raw)": 2.3343076705932617, "Full-pretrain/Step": 3769, "Full-pretrain/Step Time": 17.568985560908914} +{"Full-pretrain/Learning Rate": 3.4447329884258985e-05, "Full-pretrain/Loss": 1.9962162971496582, "Full-pretrain/Loss (Raw)": 1.868333101272583, "Full-pretrain/Step": 3770, "Full-pretrain/Step Time": 17.569533709436655} +{"Full-pretrain/Learning Rate": 3.44394681475612e-05, "Full-pretrain/Loss": 1.9914261102676392, "Full-pretrain/Loss (Raw)": 1.88240647315979, "Full-pretrain/Step": 3771, "Full-pretrain/Step Time": 17.573724368587136} +{"Full-pretrain/Learning Rate": 3.443160532202406e-05, "Full-pretrain/Loss": 1.995030164718628, "Full-pretrain/Loss (Raw)": 1.9766377210617065, "Full-pretrain/Step": 3772, "Full-pretrain/Step Time": 17.568889547139406} +{"Full-pretrain/Learning Rate": 3.442374140855457e-05, "Full-pretrain/Loss": 2.0001420974731445, "Full-pretrain/Loss (Raw)": 1.9001998901367188, "Full-pretrain/Step": 3773, "Full-pretrain/Step Time": 17.569518806412816} +{"Full-pretrain/Learning Rate": 3.441587640805983e-05, "Full-pretrain/Loss": 1.9978548288345337, "Full-pretrain/Loss (Raw)": 1.838914155960083, "Full-pretrain/Step": 3774, "Full-pretrain/Step Time": 17.57739282399416} +{"Full-pretrain/Learning Rate": 3.4408010321447046e-05, "Full-pretrain/Loss": 1.989820122718811, "Full-pretrain/Loss (Raw)": 1.8765122890472412, "Full-pretrain/Step": 3775, "Full-pretrain/Step Time": 17.57175429351628} +{"Full-pretrain/Learning Rate": 3.440014314962357e-05, "Full-pretrain/Loss": 1.9865002632141113, "Full-pretrain/Loss (Raw)": 1.8942495584487915, "Full-pretrain/Step": 3776, "Full-pretrain/Step Time": 17.567405082285404} +{"Full-pretrain/Learning Rate": 3.439227489349691e-05, "Full-pretrain/Loss": 1.9927723407745361, "Full-pretrain/Loss (Raw)": 2.21962308883667, "Full-pretrain/Step": 3777, "Full-pretrain/Step Time": 17.572338746860623} +{"Full-pretrain/Learning Rate": 3.438440555397462e-05, "Full-pretrain/Loss": 1.9958981275558472, "Full-pretrain/Loss (Raw)": 2.004155397415161, "Full-pretrain/Step": 3778, "Full-pretrain/Step Time": 17.571466393768787} +{"Full-pretrain/Learning Rate": 3.437653513196446e-05, "Full-pretrain/Loss": 2.0014452934265137, "Full-pretrain/Loss (Raw)": 2.034766674041748, "Full-pretrain/Step": 3779, "Full-pretrain/Step Time": 17.572121523320675} +{"Full-pretrain/Learning Rate": 3.436866362837425e-05, "Full-pretrain/Loss": 2.0059235095977783, "Full-pretrain/Loss (Raw)": 2.163954734802246, "Full-pretrain/Step": 3780, "Full-pretrain/Step Time": 17.568247916176915} +{"Full-pretrain/Learning Rate": 3.436079104411199e-05, "Full-pretrain/Loss": 2.012946605682373, "Full-pretrain/Loss (Raw)": 2.13545560836792, "Full-pretrain/Step": 3781, "Full-pretrain/Step Time": 17.567085087299347} +{"Full-pretrain/Learning Rate": 3.435291738008579e-05, "Full-pretrain/Loss": 2.0182578563690186, "Full-pretrain/Loss (Raw)": 2.1214146614074707, "Full-pretrain/Step": 3782, "Full-pretrain/Step Time": 17.57137073390186} +{"Full-pretrain/Learning Rate": 3.434504263720384e-05, "Full-pretrain/Loss": 2.0214226245880127, "Full-pretrain/Loss (Raw)": 2.0504441261291504, "Full-pretrain/Step": 3783, "Full-pretrain/Step Time": 17.568795580416918} +{"Full-pretrain/Learning Rate": 3.433716681637451e-05, "Full-pretrain/Loss": 2.0212931632995605, "Full-pretrain/Loss (Raw)": 2.155190944671631, "Full-pretrain/Step": 3784, "Full-pretrain/Step Time": 17.565471559762955} +{"Full-pretrain/Learning Rate": 3.432928991850627e-05, "Full-pretrain/Loss": 2.0192956924438477, "Full-pretrain/Loss (Raw)": 2.1413674354553223, "Full-pretrain/Step": 3785, "Full-pretrain/Step Time": 17.561424450948834} +{"Full-pretrain/Learning Rate": 3.432141194450772e-05, "Full-pretrain/Loss": 2.0065689086914062, "Full-pretrain/Loss (Raw)": 1.700348973274231, "Full-pretrain/Step": 3786, "Full-pretrain/Step Time": 17.566324841231108} +{"Full-pretrain/Learning Rate": 3.431353289528758e-05, "Full-pretrain/Loss": 1.9984369277954102, "Full-pretrain/Loss (Raw)": 1.7441775798797607, "Full-pretrain/Step": 3787, "Full-pretrain/Step Time": 17.562253823503852} +{"Full-pretrain/Learning Rate": 3.4305652771754684e-05, "Full-pretrain/Loss": 1.999079704284668, "Full-pretrain/Loss (Raw)": 2.0045838356018066, "Full-pretrain/Step": 3788, "Full-pretrain/Step Time": 17.56197115406394} +{"Full-pretrain/Learning Rate": 3.429777157481801e-05, "Full-pretrain/Loss": 2.0004875659942627, "Full-pretrain/Loss (Raw)": 2.023408889770508, "Full-pretrain/Step": 3789, "Full-pretrain/Step Time": 17.557226864621043} +{"Full-pretrain/Learning Rate": 3.428988930538666e-05, "Full-pretrain/Loss": 2.0101401805877686, "Full-pretrain/Loss (Raw)": 2.123457431793213, "Full-pretrain/Step": 3790, "Full-pretrain/Step Time": 17.568686055019498} +{"Full-pretrain/Learning Rate": 3.4282005964369835e-05, "Full-pretrain/Loss": 1.9998977184295654, "Full-pretrain/Loss (Raw)": 1.6765315532684326, "Full-pretrain/Step": 3791, "Full-pretrain/Step Time": 17.558822190389037} +{"Full-pretrain/Learning Rate": 3.4274121552676884e-05, "Full-pretrain/Loss": 1.9983940124511719, "Full-pretrain/Loss (Raw)": 1.9670650959014893, "Full-pretrain/Step": 3792, "Full-pretrain/Step Time": 17.557456459850073} +{"Full-pretrain/Learning Rate": 3.426623607121728e-05, "Full-pretrain/Loss": 1.994048833847046, "Full-pretrain/Loss (Raw)": 2.098263740539551, "Full-pretrain/Step": 3793, "Full-pretrain/Step Time": 17.556262519210577} +{"Full-pretrain/Learning Rate": 3.4258349520900595e-05, "Full-pretrain/Loss": 1.999323844909668, "Full-pretrain/Loss (Raw)": 2.141613006591797, "Full-pretrain/Step": 3794, "Full-pretrain/Step Time": 17.563306896016} +{"Full-pretrain/Learning Rate": 3.4250461902636554e-05, "Full-pretrain/Loss": 2.0030417442321777, "Full-pretrain/Loss (Raw)": 1.9342564344406128, "Full-pretrain/Step": 3795, "Full-pretrain/Step Time": 17.562101759016514} +{"Full-pretrain/Learning Rate": 3.4242573217334976e-05, "Full-pretrain/Loss": 2.0031847953796387, "Full-pretrain/Loss (Raw)": 2.0065879821777344, "Full-pretrain/Step": 3796, "Full-pretrain/Step Time": 17.566252421587706} +{"Full-pretrain/Learning Rate": 3.423468346590583e-05, "Full-pretrain/Loss": 1.9968422651290894, "Full-pretrain/Loss (Raw)": 2.032172203063965, "Full-pretrain/Step": 3797, "Full-pretrain/Step Time": 17.563723638653755} +{"Full-pretrain/Learning Rate": 3.4226792649259184e-05, "Full-pretrain/Loss": 2.001556873321533, "Full-pretrain/Loss (Raw)": 1.9596846103668213, "Full-pretrain/Step": 3798, "Full-pretrain/Step Time": 17.56276668421924} +{"Full-pretrain/Learning Rate": 3.421890076830525e-05, "Full-pretrain/Loss": 2.002718448638916, "Full-pretrain/Loss (Raw)": 2.085681676864624, "Full-pretrain/Step": 3799, "Full-pretrain/Step Time": 17.56215139478445} +{"Full-pretrain/Learning Rate": 3.421100782395436e-05, "Full-pretrain/Loss": 2.0056679248809814, "Full-pretrain/Loss (Raw)": 2.085602283477783, "Full-pretrain/Step": 3800, "Full-pretrain/Step Time": 17.566518565639853} +{"Full-pretrain/Learning Rate": 3.4203113817116957e-05, "Full-pretrain/Loss": 1.988945484161377, "Full-pretrain/Loss (Raw)": 1.7991960048675537, "Full-pretrain/Step": 3801, "Full-pretrain/Step Time": 17.561548424884677} +{"Full-pretrain/Learning Rate": 3.419521874870359e-05, "Full-pretrain/Loss": 1.9912725687026978, "Full-pretrain/Loss (Raw)": 1.942795753479004, "Full-pretrain/Step": 3802, "Full-pretrain/Step Time": 17.562660355120897} +{"Full-pretrain/Learning Rate": 3.4187322619624995e-05, "Full-pretrain/Loss": 1.998113989830017, "Full-pretrain/Loss (Raw)": 2.1013383865356445, "Full-pretrain/Step": 3803, "Full-pretrain/Step Time": 17.56453189998865} +{"Full-pretrain/Learning Rate": 3.417942543079195e-05, "Full-pretrain/Loss": 1.9977480173110962, "Full-pretrain/Loss (Raw)": 1.9649217128753662, "Full-pretrain/Step": 3804, "Full-pretrain/Step Time": 17.56516094133258} +{"Full-pretrain/Learning Rate": 3.4171527183115415e-05, "Full-pretrain/Loss": 2.0028586387634277, "Full-pretrain/Loss (Raw)": 2.063743829727173, "Full-pretrain/Step": 3805, "Full-pretrain/Step Time": 17.559579335153103} +{"Full-pretrain/Learning Rate": 3.4163627877506435e-05, "Full-pretrain/Loss": 2.010953903198242, "Full-pretrain/Loss (Raw)": 2.0979647636413574, "Full-pretrain/Step": 3806, "Full-pretrain/Step Time": 17.56039898842573} +{"Full-pretrain/Learning Rate": 3.41557275148762e-05, "Full-pretrain/Loss": 2.012467622756958, "Full-pretrain/Loss (Raw)": 1.9249467849731445, "Full-pretrain/Step": 3807, "Full-pretrain/Step Time": 17.56278402172029} +{"Full-pretrain/Learning Rate": 3.414782609613602e-05, "Full-pretrain/Loss": 2.0223236083984375, "Full-pretrain/Loss (Raw)": 2.209639072418213, "Full-pretrain/Step": 3808, "Full-pretrain/Step Time": 17.559000516310334} +{"Full-pretrain/Learning Rate": 3.413992362219731e-05, "Full-pretrain/Loss": 2.0141124725341797, "Full-pretrain/Loss (Raw)": 1.9568676948547363, "Full-pretrain/Step": 3809, "Full-pretrain/Step Time": 17.5473360568285} +{"Full-pretrain/Learning Rate": 3.413202009397163e-05, "Full-pretrain/Loss": 2.0202295780181885, "Full-pretrain/Loss (Raw)": 2.1999077796936035, "Full-pretrain/Step": 3810, "Full-pretrain/Step Time": 17.547098798677325} +{"Full-pretrain/Learning Rate": 3.412411551237064e-05, "Full-pretrain/Loss": 2.021756649017334, "Full-pretrain/Loss (Raw)": 2.0836269855499268, "Full-pretrain/Step": 3811, "Full-pretrain/Step Time": 17.54227458126843} +{"Full-pretrain/Learning Rate": 3.411620987830612e-05, "Full-pretrain/Loss": 2.0170297622680664, "Full-pretrain/Loss (Raw)": 2.012694835662842, "Full-pretrain/Step": 3812, "Full-pretrain/Step Time": 17.551253566518426} +{"Full-pretrain/Learning Rate": 3.410830319269e-05, "Full-pretrain/Loss": 2.0064280033111572, "Full-pretrain/Loss (Raw)": 1.796199917793274, "Full-pretrain/Step": 3813, "Full-pretrain/Step Time": 17.543115673586726} +{"Full-pretrain/Learning Rate": 3.410039545643431e-05, "Full-pretrain/Loss": 2.006600856781006, "Full-pretrain/Loss (Raw)": 2.1269490718841553, "Full-pretrain/Step": 3814, "Full-pretrain/Step Time": 17.5459217838943} +{"Full-pretrain/Learning Rate": 3.40924866704512e-05, "Full-pretrain/Loss": 2.003692150115967, "Full-pretrain/Loss (Raw)": 1.9573594331741333, "Full-pretrain/Step": 3815, "Full-pretrain/Step Time": 17.54838122613728} +{"Full-pretrain/Learning Rate": 3.408457683565295e-05, "Full-pretrain/Loss": 2.00016188621521, "Full-pretrain/Loss (Raw)": 2.042226552963257, "Full-pretrain/Step": 3816, "Full-pretrain/Step Time": 17.553279070183635} +{"Full-pretrain/Learning Rate": 3.407666595295195e-05, "Full-pretrain/Loss": 1.9931762218475342, "Full-pretrain/Loss (Raw)": 1.9178211688995361, "Full-pretrain/Step": 3817, "Full-pretrain/Step Time": 17.548160603269935} +{"Full-pretrain/Learning Rate": 3.4068754023260726e-05, "Full-pretrain/Loss": 2.0032522678375244, "Full-pretrain/Loss (Raw)": 2.0227866172790527, "Full-pretrain/Step": 3818, "Full-pretrain/Step Time": 17.54566813632846} +{"Full-pretrain/Learning Rate": 3.406084104749192e-05, "Full-pretrain/Loss": 2.0113861560821533, "Full-pretrain/Loss (Raw)": 2.0044636726379395, "Full-pretrain/Step": 3819, "Full-pretrain/Step Time": 17.549367817118764} +{"Full-pretrain/Learning Rate": 3.4052927026558265e-05, "Full-pretrain/Loss": 2.0098876953125, "Full-pretrain/Loss (Raw)": 1.9566344022750854, "Full-pretrain/Step": 3820, "Full-pretrain/Step Time": 17.552777199074626} +{"Full-pretrain/Learning Rate": 3.404501196137267e-05, "Full-pretrain/Loss": 2.0075368881225586, "Full-pretrain/Loss (Raw)": 1.9481744766235352, "Full-pretrain/Step": 3821, "Full-pretrain/Step Time": 17.556275384500623} +{"Full-pretrain/Learning Rate": 3.4037095852848126e-05, "Full-pretrain/Loss": 2.0000996589660645, "Full-pretrain/Loss (Raw)": 1.885472059249878, "Full-pretrain/Step": 3822, "Full-pretrain/Step Time": 17.5531837772578} +{"Full-pretrain/Learning Rate": 3.4029178701897744e-05, "Full-pretrain/Loss": 2.011169910430908, "Full-pretrain/Loss (Raw)": 2.030776262283325, "Full-pretrain/Step": 3823, "Full-pretrain/Step Time": 17.553973319008946} +{"Full-pretrain/Learning Rate": 3.402126050943478e-05, "Full-pretrain/Loss": 2.00515079498291, "Full-pretrain/Loss (Raw)": 1.7744615077972412, "Full-pretrain/Step": 3824, "Full-pretrain/Step Time": 17.553855750709772} +{"Full-pretrain/Learning Rate": 3.401334127637259e-05, "Full-pretrain/Loss": 1.9927802085876465, "Full-pretrain/Loss (Raw)": 1.7023957967758179, "Full-pretrain/Step": 3825, "Full-pretrain/Step Time": 17.55387992784381} +{"Full-pretrain/Learning Rate": 3.400542100362464e-05, "Full-pretrain/Loss": 1.991227388381958, "Full-pretrain/Loss (Raw)": 2.0919265747070312, "Full-pretrain/Step": 3826, "Full-pretrain/Step Time": 17.554398087784648} +{"Full-pretrain/Learning Rate": 3.399749969210455e-05, "Full-pretrain/Loss": 2.0043187141418457, "Full-pretrain/Loss (Raw)": 2.353178024291992, "Full-pretrain/Step": 3827, "Full-pretrain/Step Time": 17.552526779472828} +{"Full-pretrain/Learning Rate": 3.3989577342726025e-05, "Full-pretrain/Loss": 1.9995193481445312, "Full-pretrain/Loss (Raw)": 1.8530094623565674, "Full-pretrain/Step": 3828, "Full-pretrain/Step Time": 17.5579473990947} +{"Full-pretrain/Learning Rate": 3.398165395640292e-05, "Full-pretrain/Loss": 1.9958209991455078, "Full-pretrain/Loss (Raw)": 1.9138256311416626, "Full-pretrain/Step": 3829, "Full-pretrain/Step Time": 17.554739395156503} +{"Full-pretrain/Learning Rate": 3.397372953404918e-05, "Full-pretrain/Loss": 1.990524172782898, "Full-pretrain/Loss (Raw)": 1.7901843786239624, "Full-pretrain/Step": 3830, "Full-pretrain/Step Time": 17.555365040898323} +{"Full-pretrain/Learning Rate": 3.39658040765789e-05, "Full-pretrain/Loss": 1.9870787858963013, "Full-pretrain/Loss (Raw)": 1.9754325151443481, "Full-pretrain/Step": 3831, "Full-pretrain/Step Time": 17.559024777263403} +{"Full-pretrain/Learning Rate": 3.395787758490626e-05, "Full-pretrain/Loss": 1.9998728036880493, "Full-pretrain/Loss (Raw)": 2.4950039386749268, "Full-pretrain/Step": 3832, "Full-pretrain/Step Time": 17.560948414728045} +{"Full-pretrain/Learning Rate": 3.3949950059945594e-05, "Full-pretrain/Loss": 2.007237434387207, "Full-pretrain/Loss (Raw)": 2.034865140914917, "Full-pretrain/Step": 3833, "Full-pretrain/Step Time": 17.559924380853772} +{"Full-pretrain/Learning Rate": 3.394202150261134e-05, "Full-pretrain/Loss": 2.005390167236328, "Full-pretrain/Loss (Raw)": 1.8836867809295654, "Full-pretrain/Step": 3834, "Full-pretrain/Step Time": 17.55993734113872} +{"Full-pretrain/Learning Rate": 3.3934091913818046e-05, "Full-pretrain/Loss": 1.9959838390350342, "Full-pretrain/Loss (Raw)": 1.8003361225128174, "Full-pretrain/Step": 3835, "Full-pretrain/Step Time": 17.56890582665801} +{"Full-pretrain/Learning Rate": 3.392616129448038e-05, "Full-pretrain/Loss": 1.998974323272705, "Full-pretrain/Loss (Raw)": 2.0606131553649902, "Full-pretrain/Step": 3836, "Full-pretrain/Step Time": 17.566922813653946} +{"Full-pretrain/Learning Rate": 3.391822964551315e-05, "Full-pretrain/Loss": 1.992228388786316, "Full-pretrain/Loss (Raw)": 1.8478775024414062, "Full-pretrain/Step": 3837, "Full-pretrain/Step Time": 17.566333040595055} +{"Full-pretrain/Learning Rate": 3.3910296967831266e-05, "Full-pretrain/Loss": 1.9808053970336914, "Full-pretrain/Loss (Raw)": 1.7324296236038208, "Full-pretrain/Step": 3838, "Full-pretrain/Step Time": 17.571292268112302} +{"Full-pretrain/Learning Rate": 3.390236326234977e-05, "Full-pretrain/Loss": 1.9762898683547974, "Full-pretrain/Loss (Raw)": 1.7804501056671143, "Full-pretrain/Step": 3839, "Full-pretrain/Step Time": 17.574955282732844} +{"Full-pretrain/Learning Rate": 3.389442852998378e-05, "Full-pretrain/Loss": 1.9669768810272217, "Full-pretrain/Loss (Raw)": 1.9116228818893433, "Full-pretrain/Step": 3840, "Full-pretrain/Step Time": 17.5692104883492} +{"Full-pretrain/Learning Rate": 3.3886492771648593e-05, "Full-pretrain/Loss": 1.9615734815597534, "Full-pretrain/Loss (Raw)": 1.7839579582214355, "Full-pretrain/Step": 3841, "Full-pretrain/Step Time": 17.573017813265324} +{"Full-pretrain/Learning Rate": 3.3878555988259585e-05, "Full-pretrain/Loss": 1.963338017463684, "Full-pretrain/Loss (Raw)": 2.25637149810791, "Full-pretrain/Step": 3842, "Full-pretrain/Step Time": 17.570757266134024} +{"Full-pretrain/Learning Rate": 3.387061818073227e-05, "Full-pretrain/Loss": 1.9582762718200684, "Full-pretrain/Loss (Raw)": 1.9216541051864624, "Full-pretrain/Step": 3843, "Full-pretrain/Step Time": 17.577315770089626} +{"Full-pretrain/Learning Rate": 3.386267934998226e-05, "Full-pretrain/Loss": 1.9571373462677002, "Full-pretrain/Loss (Raw)": 1.9762496948242188, "Full-pretrain/Step": 3844, "Full-pretrain/Step Time": 17.577872393652797} +{"Full-pretrain/Learning Rate": 3.385473949692531e-05, "Full-pretrain/Loss": 1.9592111110687256, "Full-pretrain/Loss (Raw)": 1.8625587224960327, "Full-pretrain/Step": 3845, "Full-pretrain/Step Time": 17.580827228724957} +{"Full-pretrain/Learning Rate": 3.384679862247726e-05, "Full-pretrain/Loss": 1.9581069946289062, "Full-pretrain/Loss (Raw)": 2.091615676879883, "Full-pretrain/Step": 3846, "Full-pretrain/Step Time": 17.57305788807571} +{"Full-pretrain/Learning Rate": 3.383885672755411e-05, "Full-pretrain/Loss": 1.9691617488861084, "Full-pretrain/Loss (Raw)": 2.311112880706787, "Full-pretrain/Step": 3847, "Full-pretrain/Step Time": 17.570882128551602} +{"Full-pretrain/Learning Rate": 3.383091381307193e-05, "Full-pretrain/Loss": 1.9636964797973633, "Full-pretrain/Loss (Raw)": 1.8673380613327026, "Full-pretrain/Step": 3848, "Full-pretrain/Step Time": 17.573544135317206} +{"Full-pretrain/Learning Rate": 3.3822969879946947e-05, "Full-pretrain/Loss": 1.9655814170837402, "Full-pretrain/Loss (Raw)": 1.9781373739242554, "Full-pretrain/Step": 3849, "Full-pretrain/Step Time": 17.574160404503345} +{"Full-pretrain/Learning Rate": 3.38150249290955e-05, "Full-pretrain/Loss": 1.9684092998504639, "Full-pretrain/Loss (Raw)": 2.113280773162842, "Full-pretrain/Step": 3850, "Full-pretrain/Step Time": 17.57425076700747} +{"Full-pretrain/Learning Rate": 3.3807078961434013e-05, "Full-pretrain/Loss": 1.9633996486663818, "Full-pretrain/Loss (Raw)": 1.844152569770813, "Full-pretrain/Step": 3851, "Full-pretrain/Step Time": 17.569551220163703} +{"Full-pretrain/Learning Rate": 3.3799131977879064e-05, "Full-pretrain/Loss": 1.9644086360931396, "Full-pretrain/Loss (Raw)": 1.988925576210022, "Full-pretrain/Step": 3852, "Full-pretrain/Step Time": 17.57196626998484} +{"Full-pretrain/Learning Rate": 3.379118397934734e-05, "Full-pretrain/Loss": 1.9699153900146484, "Full-pretrain/Loss (Raw)": 2.1243927478790283, "Full-pretrain/Step": 3853, "Full-pretrain/Step Time": 17.57631368562579} +{"Full-pretrain/Learning Rate": 3.3783234966755625e-05, "Full-pretrain/Loss": 1.976549744606018, "Full-pretrain/Loss (Raw)": 2.0977697372436523, "Full-pretrain/Step": 3854, "Full-pretrain/Step Time": 17.57530109025538} +{"Full-pretrain/Learning Rate": 3.377528494102086e-05, "Full-pretrain/Loss": 1.9699407815933228, "Full-pretrain/Loss (Raw)": 1.8192883729934692, "Full-pretrain/Step": 3855, "Full-pretrain/Step Time": 17.578383373096585} +{"Full-pretrain/Learning Rate": 3.376733390306004e-05, "Full-pretrain/Loss": 1.9755311012268066, "Full-pretrain/Loss (Raw)": 1.9533536434173584, "Full-pretrain/Step": 3856, "Full-pretrain/Step Time": 17.58054980635643} +{"Full-pretrain/Learning Rate": 3.375938185379035e-05, "Full-pretrain/Loss": 1.9932961463928223, "Full-pretrain/Loss (Raw)": 2.270874500274658, "Full-pretrain/Step": 3857, "Full-pretrain/Step Time": 17.580382419750094} +{"Full-pretrain/Learning Rate": 3.375142879412903e-05, "Full-pretrain/Loss": 1.9879419803619385, "Full-pretrain/Loss (Raw)": 1.9205973148345947, "Full-pretrain/Step": 3858, "Full-pretrain/Step Time": 17.58219864591956} +{"Full-pretrain/Learning Rate": 3.374347472499348e-05, "Full-pretrain/Loss": 1.9815621376037598, "Full-pretrain/Loss (Raw)": 2.149019956588745, "Full-pretrain/Step": 3859, "Full-pretrain/Step Time": 17.58391660451889} +{"Full-pretrain/Learning Rate": 3.37355196473012e-05, "Full-pretrain/Loss": 1.9869115352630615, "Full-pretrain/Loss (Raw)": 2.0241899490356445, "Full-pretrain/Step": 3860, "Full-pretrain/Step Time": 17.580580066889524} +{"Full-pretrain/Learning Rate": 3.3727563561969787e-05, "Full-pretrain/Loss": 1.9929426908493042, "Full-pretrain/Loss (Raw)": 2.1068220138549805, "Full-pretrain/Step": 3861, "Full-pretrain/Step Time": 17.581445140764117} +{"Full-pretrain/Learning Rate": 3.3719606469916984e-05, "Full-pretrain/Loss": 1.9954699277877808, "Full-pretrain/Loss (Raw)": 1.8710570335388184, "Full-pretrain/Step": 3862, "Full-pretrain/Step Time": 17.583344945684075} +{"Full-pretrain/Learning Rate": 3.371164837206065e-05, "Full-pretrain/Loss": 1.994950294494629, "Full-pretrain/Loss (Raw)": 1.9588077068328857, "Full-pretrain/Step": 3863, "Full-pretrain/Step Time": 17.581084564328194} +{"Full-pretrain/Learning Rate": 3.370368926931873e-05, "Full-pretrain/Loss": 1.977114200592041, "Full-pretrain/Loss (Raw)": 1.924243688583374, "Full-pretrain/Step": 3864, "Full-pretrain/Step Time": 17.582598105072975} +{"Full-pretrain/Learning Rate": 3.3695729162609315e-05, "Full-pretrain/Loss": 1.9727572202682495, "Full-pretrain/Loss (Raw)": 1.8954437971115112, "Full-pretrain/Step": 3865, "Full-pretrain/Step Time": 17.580104995518923} +{"Full-pretrain/Learning Rate": 3.368776805285059e-05, "Full-pretrain/Loss": 1.9770411252975464, "Full-pretrain/Loss (Raw)": 2.020772695541382, "Full-pretrain/Step": 3866, "Full-pretrain/Step Time": 17.5825387686491} +{"Full-pretrain/Learning Rate": 3.367980594096088e-05, "Full-pretrain/Loss": 1.9789353609085083, "Full-pretrain/Loss (Raw)": 1.8609520196914673, "Full-pretrain/Step": 3867, "Full-pretrain/Step Time": 17.58405709080398} +{"Full-pretrain/Learning Rate": 3.367184282785861e-05, "Full-pretrain/Loss": 1.9703952074050903, "Full-pretrain/Loss (Raw)": 1.787325382232666, "Full-pretrain/Step": 3868, "Full-pretrain/Step Time": 17.584969710558653} +{"Full-pretrain/Learning Rate": 3.366387871446231e-05, "Full-pretrain/Loss": 1.9691768884658813, "Full-pretrain/Loss (Raw)": 1.8088957071304321, "Full-pretrain/Step": 3869, "Full-pretrain/Step Time": 17.584645207971334} +{"Full-pretrain/Learning Rate": 3.365591360169064e-05, "Full-pretrain/Loss": 1.9739621877670288, "Full-pretrain/Loss (Raw)": 1.8855578899383545, "Full-pretrain/Step": 3870, "Full-pretrain/Step Time": 17.583439018577337} +{"Full-pretrain/Learning Rate": 3.364794749046239e-05, "Full-pretrain/Loss": 1.9774553775787354, "Full-pretrain/Loss (Raw)": 1.8922326564788818, "Full-pretrain/Step": 3871, "Full-pretrain/Step Time": 17.584772307425737} +{"Full-pretrain/Learning Rate": 3.3639980381696426e-05, "Full-pretrain/Loss": 1.9763554334640503, "Full-pretrain/Loss (Raw)": 1.8764245510101318, "Full-pretrain/Step": 3872, "Full-pretrain/Step Time": 17.586249256506562} +{"Full-pretrain/Learning Rate": 3.363201227631176e-05, "Full-pretrain/Loss": 1.9896869659423828, "Full-pretrain/Loss (Raw)": 2.210569381713867, "Full-pretrain/Step": 3873, "Full-pretrain/Step Time": 17.582684874534607} +{"Full-pretrain/Learning Rate": 3.362404317522752e-05, "Full-pretrain/Loss": 1.979972243309021, "Full-pretrain/Loss (Raw)": 1.9454951286315918, "Full-pretrain/Step": 3874, "Full-pretrain/Step Time": 17.583651423454285} +{"Full-pretrain/Learning Rate": 3.3616073079362926e-05, "Full-pretrain/Loss": 1.9832041263580322, "Full-pretrain/Loss (Raw)": 2.025075912475586, "Full-pretrain/Step": 3875, "Full-pretrain/Step Time": 17.58773858845234} +{"Full-pretrain/Learning Rate": 3.360810198963733e-05, "Full-pretrain/Loss": 1.9716358184814453, "Full-pretrain/Loss (Raw)": 1.6060631275177002, "Full-pretrain/Step": 3876, "Full-pretrain/Step Time": 17.589205756783485} +{"Full-pretrain/Learning Rate": 3.36001299069702e-05, "Full-pretrain/Loss": 1.975468397140503, "Full-pretrain/Loss (Raw)": 1.985203742980957, "Full-pretrain/Step": 3877, "Full-pretrain/Step Time": 17.590576542541385} +{"Full-pretrain/Learning Rate": 3.35921568322811e-05, "Full-pretrain/Loss": 1.9741601943969727, "Full-pretrain/Loss (Raw)": 2.0497477054595947, "Full-pretrain/Step": 3878, "Full-pretrain/Step Time": 17.589162031188607} +{"Full-pretrain/Learning Rate": 3.3584182766489736e-05, "Full-pretrain/Loss": 1.9694111347198486, "Full-pretrain/Loss (Raw)": 2.159144878387451, "Full-pretrain/Step": 3879, "Full-pretrain/Step Time": 17.597278989851475} +{"Full-pretrain/Learning Rate": 3.35762077105159e-05, "Full-pretrain/Loss": 1.9773437976837158, "Full-pretrain/Loss (Raw)": 2.1211836338043213, "Full-pretrain/Step": 3880, "Full-pretrain/Step Time": 17.594654908403754} +{"Full-pretrain/Learning Rate": 3.356823166527952e-05, "Full-pretrain/Loss": 1.9848099946975708, "Full-pretrain/Loss (Raw)": 2.2170543670654297, "Full-pretrain/Step": 3881, "Full-pretrain/Step Time": 17.598201602697372} +{"Full-pretrain/Learning Rate": 3.356025463170063e-05, "Full-pretrain/Loss": 1.9858840703964233, "Full-pretrain/Loss (Raw)": 2.147648811340332, "Full-pretrain/Step": 3882, "Full-pretrain/Step Time": 17.59235990047455} +{"Full-pretrain/Learning Rate": 3.355227661069937e-05, "Full-pretrain/Loss": 1.9949475526809692, "Full-pretrain/Loss (Raw)": 2.134187936782837, "Full-pretrain/Step": 3883, "Full-pretrain/Step Time": 17.59629741869867} +{"Full-pretrain/Learning Rate": 3.354429760319602e-05, "Full-pretrain/Loss": 2.004420757293701, "Full-pretrain/Loss (Raw)": 2.292069911956787, "Full-pretrain/Step": 3884, "Full-pretrain/Step Time": 17.601278003305197} +{"Full-pretrain/Learning Rate": 3.3536317610110946e-05, "Full-pretrain/Loss": 2.0059359073638916, "Full-pretrain/Loss (Raw)": 2.1728756427764893, "Full-pretrain/Step": 3885, "Full-pretrain/Step Time": 17.595622956752777} +{"Full-pretrain/Learning Rate": 3.3528336632364624e-05, "Full-pretrain/Loss": 2.002025604248047, "Full-pretrain/Loss (Raw)": 1.972636103630066, "Full-pretrain/Step": 3886, "Full-pretrain/Step Time": 17.590793192386627} +{"Full-pretrain/Learning Rate": 3.352035467087767e-05, "Full-pretrain/Loss": 2.0136730670928955, "Full-pretrain/Loss (Raw)": 2.192009925842285, "Full-pretrain/Step": 3887, "Full-pretrain/Step Time": 17.590587170794606} +{"Full-pretrain/Learning Rate": 3.351237172657081e-05, "Full-pretrain/Loss": 2.0127146244049072, "Full-pretrain/Loss (Raw)": 1.9226856231689453, "Full-pretrain/Step": 3888, "Full-pretrain/Step Time": 17.593106150627136} +{"Full-pretrain/Learning Rate": 3.3504387800364856e-05, "Full-pretrain/Loss": 2.002192497253418, "Full-pretrain/Loss (Raw)": 1.9341635704040527, "Full-pretrain/Step": 3889, "Full-pretrain/Step Time": 17.594874339178205} +{"Full-pretrain/Learning Rate": 3.349640289318075e-05, "Full-pretrain/Loss": 1.9901652336120605, "Full-pretrain/Loss (Raw)": 1.5357283353805542, "Full-pretrain/Step": 3890, "Full-pretrain/Step Time": 17.59260641410947} +{"Full-pretrain/Learning Rate": 3.348841700593956e-05, "Full-pretrain/Loss": 1.980804681777954, "Full-pretrain/Loss (Raw)": 1.8494811058044434, "Full-pretrain/Step": 3891, "Full-pretrain/Step Time": 17.595711650326848} +{"Full-pretrain/Learning Rate": 3.3480430139562455e-05, "Full-pretrain/Loss": 1.9782378673553467, "Full-pretrain/Loss (Raw)": 1.9420498609542847, "Full-pretrain/Step": 3892, "Full-pretrain/Step Time": 17.59652010537684} +{"Full-pretrain/Learning Rate": 3.3472442294970716e-05, "Full-pretrain/Loss": 1.9744503498077393, "Full-pretrain/Loss (Raw)": 1.9856228828430176, "Full-pretrain/Step": 3893, "Full-pretrain/Step Time": 17.596899557858706} +{"Full-pretrain/Learning Rate": 3.346445347308573e-05, "Full-pretrain/Loss": 1.9810527563095093, "Full-pretrain/Loss (Raw)": 2.0823330879211426, "Full-pretrain/Step": 3894, "Full-pretrain/Step Time": 17.594282111153007} +{"Full-pretrain/Learning Rate": 3.345646367482902e-05, "Full-pretrain/Loss": 1.9807274341583252, "Full-pretrain/Loss (Raw)": 1.948397159576416, "Full-pretrain/Step": 3895, "Full-pretrain/Step Time": 17.59765962138772} +{"Full-pretrain/Learning Rate": 3.344847290112219e-05, "Full-pretrain/Loss": 1.9808707237243652, "Full-pretrain/Loss (Raw)": 1.9288318157196045, "Full-pretrain/Step": 3896, "Full-pretrain/Step Time": 17.598744774237275} +{"Full-pretrain/Learning Rate": 3.3440481152886974e-05, "Full-pretrain/Loss": 1.9879767894744873, "Full-pretrain/Loss (Raw)": 2.1228384971618652, "Full-pretrain/Step": 3897, "Full-pretrain/Step Time": 17.604846637696028} +{"Full-pretrain/Learning Rate": 3.343248843104523e-05, "Full-pretrain/Loss": 1.990663766860962, "Full-pretrain/Loss (Raw)": 2.1067538261413574, "Full-pretrain/Step": 3898, "Full-pretrain/Step Time": 17.604792455211282} +{"Full-pretrain/Learning Rate": 3.34244947365189e-05, "Full-pretrain/Loss": 1.9946280717849731, "Full-pretrain/Loss (Raw)": 1.9878123998641968, "Full-pretrain/Step": 3899, "Full-pretrain/Step Time": 17.603564020246267} +{"Full-pretrain/Learning Rate": 3.341650007023008e-05, "Full-pretrain/Loss": 1.9896185398101807, "Full-pretrain/Loss (Raw)": 1.6270179748535156, "Full-pretrain/Step": 3900, "Full-pretrain/Step Time": 17.608772251755} +{"Full-pretrain/Learning Rate": 3.340850443310092e-05, "Full-pretrain/Loss": 2.0001020431518555, "Full-pretrain/Loss (Raw)": 2.1443729400634766, "Full-pretrain/Step": 3901, "Full-pretrain/Step Time": 17.61326922662556} +{"Full-pretrain/Learning Rate": 3.3400507826053736e-05, "Full-pretrain/Loss": 2.0009284019470215, "Full-pretrain/Loss (Raw)": 1.9119980335235596, "Full-pretrain/Step": 3902, "Full-pretrain/Step Time": 17.60496312752366} +{"Full-pretrain/Learning Rate": 3.3392510250010926e-05, "Full-pretrain/Loss": 2.009859323501587, "Full-pretrain/Loss (Raw)": 2.1780223846435547, "Full-pretrain/Step": 3903, "Full-pretrain/Step Time": 17.601104585453868} +{"Full-pretrain/Learning Rate": 3.338451170589501e-05, "Full-pretrain/Loss": 2.00533390045166, "Full-pretrain/Loss (Raw)": 1.7316060066223145, "Full-pretrain/Step": 3904, "Full-pretrain/Step Time": 17.604380236938596} +{"Full-pretrain/Learning Rate": 3.337651219462861e-05, "Full-pretrain/Loss": 2.004201650619507, "Full-pretrain/Loss (Raw)": 2.1743412017822266, "Full-pretrain/Step": 3905, "Full-pretrain/Step Time": 17.60767188668251} +{"Full-pretrain/Learning Rate": 3.336851171713447e-05, "Full-pretrain/Loss": 2.001779556274414, "Full-pretrain/Loss (Raw)": 1.8679845333099365, "Full-pretrain/Step": 3906, "Full-pretrain/Step Time": 17.604840490967035} +{"Full-pretrain/Learning Rate": 3.3360510274335446e-05, "Full-pretrain/Loss": 1.9961140155792236, "Full-pretrain/Loss (Raw)": 1.843778371810913, "Full-pretrain/Step": 3907, "Full-pretrain/Step Time": 17.60180422104895} +{"Full-pretrain/Learning Rate": 3.33525078671545e-05, "Full-pretrain/Loss": 2.0020692348480225, "Full-pretrain/Loss (Raw)": 1.796634554862976, "Full-pretrain/Step": 3908, "Full-pretrain/Step Time": 17.605641273781657} +{"Full-pretrain/Learning Rate": 3.3344504496514705e-05, "Full-pretrain/Loss": 1.991161584854126, "Full-pretrain/Loss (Raw)": 1.636155605316162, "Full-pretrain/Step": 3909, "Full-pretrain/Step Time": 17.607137007638812} +{"Full-pretrain/Learning Rate": 3.333650016333926e-05, "Full-pretrain/Loss": 1.9910446405410767, "Full-pretrain/Loss (Raw)": 2.0460081100463867, "Full-pretrain/Step": 3910, "Full-pretrain/Step Time": 17.603921504691243} +{"Full-pretrain/Learning Rate": 3.332849486855144e-05, "Full-pretrain/Loss": 1.982053518295288, "Full-pretrain/Loss (Raw)": 1.8714280128479004, "Full-pretrain/Step": 3911, "Full-pretrain/Step Time": 17.601826252415776} +{"Full-pretrain/Learning Rate": 3.332048861307467e-05, "Full-pretrain/Loss": 1.9597063064575195, "Full-pretrain/Loss (Raw)": 1.4060726165771484, "Full-pretrain/Step": 3912, "Full-pretrain/Step Time": 17.603324370458722} +{"Full-pretrain/Learning Rate": 3.331248139783246e-05, "Full-pretrain/Loss": 1.9498701095581055, "Full-pretrain/Loss (Raw)": 1.9022948741912842, "Full-pretrain/Step": 3913, "Full-pretrain/Step Time": 17.609497640281916} +{"Full-pretrain/Learning Rate": 3.330447322374844e-05, "Full-pretrain/Loss": 1.9404525756835938, "Full-pretrain/Loss (Raw)": 1.8462886810302734, "Full-pretrain/Step": 3914, "Full-pretrain/Step Time": 17.60585024766624} +{"Full-pretrain/Learning Rate": 3.329646409174635e-05, "Full-pretrain/Loss": 1.9235763549804688, "Full-pretrain/Loss (Raw)": 1.5941463708877563, "Full-pretrain/Step": 3915, "Full-pretrain/Step Time": 17.604196744039655} +{"Full-pretrain/Learning Rate": 3.3288454002750044e-05, "Full-pretrain/Loss": 1.888738989830017, "Full-pretrain/Loss (Raw)": 1.1772770881652832, "Full-pretrain/Step": 3916, "Full-pretrain/Step Time": 17.602433303371072} +{"Full-pretrain/Learning Rate": 3.3280442957683486e-05, "Full-pretrain/Loss": 1.8790135383605957, "Full-pretrain/Loss (Raw)": 1.8616591691970825, "Full-pretrain/Step": 3917, "Full-pretrain/Step Time": 17.61100640334189} +{"Full-pretrain/Learning Rate": 3.327243095747075e-05, "Full-pretrain/Loss": 1.879612922668457, "Full-pretrain/Loss (Raw)": 1.9918186664581299, "Full-pretrain/Step": 3918, "Full-pretrain/Step Time": 17.600668845698237} +{"Full-pretrain/Learning Rate": 3.3264418003036e-05, "Full-pretrain/Loss": 1.876136064529419, "Full-pretrain/Loss (Raw)": 2.0807528495788574, "Full-pretrain/Step": 3919, "Full-pretrain/Step Time": 17.598360801115632} +{"Full-pretrain/Learning Rate": 3.3256404095303526e-05, "Full-pretrain/Loss": 1.8810551166534424, "Full-pretrain/Loss (Raw)": 2.0800952911376953, "Full-pretrain/Step": 3920, "Full-pretrain/Step Time": 17.603838577866554} +{"Full-pretrain/Learning Rate": 3.324838923519776e-05, "Full-pretrain/Loss": 1.8792016506195068, "Full-pretrain/Loss (Raw)": 1.8748482465744019, "Full-pretrain/Step": 3921, "Full-pretrain/Step Time": 17.609383329749107} +{"Full-pretrain/Learning Rate": 3.324037342364319e-05, "Full-pretrain/Loss": 1.8935340642929077, "Full-pretrain/Loss (Raw)": 1.9943695068359375, "Full-pretrain/Step": 3922, "Full-pretrain/Step Time": 17.600865714251995} +{"Full-pretrain/Learning Rate": 3.3232356661564435e-05, "Full-pretrain/Loss": 1.9013628959655762, "Full-pretrain/Loss (Raw)": 2.1000008583068848, "Full-pretrain/Step": 3923, "Full-pretrain/Step Time": 17.596715753898025} +{"Full-pretrain/Learning Rate": 3.322433894988624e-05, "Full-pretrain/Loss": 1.9111089706420898, "Full-pretrain/Loss (Raw)": 2.253927230834961, "Full-pretrain/Step": 3924, "Full-pretrain/Step Time": 17.596680434420705} +{"Full-pretrain/Learning Rate": 3.321632028953343e-05, "Full-pretrain/Loss": 1.9209883213043213, "Full-pretrain/Loss (Raw)": 2.301760196685791, "Full-pretrain/Step": 3925, "Full-pretrain/Step Time": 17.597287517040968} +{"Full-pretrain/Learning Rate": 3.3208300681430964e-05, "Full-pretrain/Loss": 1.9159936904907227, "Full-pretrain/Loss (Raw)": 1.9225075244903564, "Full-pretrain/Step": 3926, "Full-pretrain/Step Time": 17.595442689955235} +{"Full-pretrain/Learning Rate": 3.320028012650391e-05, "Full-pretrain/Loss": 1.9138468503952026, "Full-pretrain/Loss (Raw)": 1.879693865776062, "Full-pretrain/Step": 3927, "Full-pretrain/Step Time": 17.598928609862924} +{"Full-pretrain/Learning Rate": 3.319225862567741e-05, "Full-pretrain/Loss": 1.9214133024215698, "Full-pretrain/Loss (Raw)": 2.1709609031677246, "Full-pretrain/Step": 3928, "Full-pretrain/Step Time": 17.595805779099464} +{"Full-pretrain/Learning Rate": 3.318423617987676e-05, "Full-pretrain/Loss": 1.9194844961166382, "Full-pretrain/Loss (Raw)": 2.0611162185668945, "Full-pretrain/Step": 3929, "Full-pretrain/Step Time": 17.59861160069704} +{"Full-pretrain/Learning Rate": 3.317621279002735e-05, "Full-pretrain/Loss": 1.9163397550582886, "Full-pretrain/Loss (Raw)": 2.006121873855591, "Full-pretrain/Step": 3930, "Full-pretrain/Step Time": 17.59593763947487} +{"Full-pretrain/Learning Rate": 3.3168188457054654e-05, "Full-pretrain/Loss": 1.9234426021575928, "Full-pretrain/Loss (Raw)": 2.2151038646698, "Full-pretrain/Step": 3931, "Full-pretrain/Step Time": 17.59969161450863} +{"Full-pretrain/Learning Rate": 3.3160163181884307e-05, "Full-pretrain/Loss": 1.935538411140442, "Full-pretrain/Loss (Raw)": 2.014082193374634, "Full-pretrain/Step": 3932, "Full-pretrain/Step Time": 17.599347565323114} +{"Full-pretrain/Learning Rate": 3.3152136965441996e-05, "Full-pretrain/Loss": 1.937675952911377, "Full-pretrain/Loss (Raw)": 2.212775707244873, "Full-pretrain/Step": 3933, "Full-pretrain/Step Time": 17.604225669056177} +{"Full-pretrain/Learning Rate": 3.314410980865355e-05, "Full-pretrain/Loss": 1.9376935958862305, "Full-pretrain/Loss (Raw)": 1.9125615358352661, "Full-pretrain/Step": 3934, "Full-pretrain/Step Time": 17.60616383701563} +{"Full-pretrain/Learning Rate": 3.3136081712444905e-05, "Full-pretrain/Loss": 1.93708336353302, "Full-pretrain/Loss (Raw)": 2.158494472503662, "Full-pretrain/Step": 3935, "Full-pretrain/Step Time": 17.606115771457553} +{"Full-pretrain/Learning Rate": 3.312805267774209e-05, "Full-pretrain/Loss": 1.9439538717269897, "Full-pretrain/Loss (Raw)": 1.951463222503662, "Full-pretrain/Step": 3936, "Full-pretrain/Step Time": 17.60628097690642} +{"Full-pretrain/Learning Rate": 3.312002270547125e-05, "Full-pretrain/Loss": 1.936075210571289, "Full-pretrain/Loss (Raw)": 1.9222254753112793, "Full-pretrain/Step": 3937, "Full-pretrain/Step Time": 17.611513821408153} +{"Full-pretrain/Learning Rate": 3.311199179655865e-05, "Full-pretrain/Loss": 1.9345455169677734, "Full-pretrain/Loss (Raw)": 1.8190348148345947, "Full-pretrain/Step": 3938, "Full-pretrain/Step Time": 17.614446407184005} +{"Full-pretrain/Learning Rate": 3.3103959951930654e-05, "Full-pretrain/Loss": 1.9227991104125977, "Full-pretrain/Loss (Raw)": 1.4678915739059448, "Full-pretrain/Step": 3939, "Full-pretrain/Step Time": 17.611134195700288} +{"Full-pretrain/Learning Rate": 3.309592717251371e-05, "Full-pretrain/Loss": 1.9252293109893799, "Full-pretrain/Loss (Raw)": 1.8744020462036133, "Full-pretrain/Step": 3940, "Full-pretrain/Step Time": 17.60833109728992} +{"Full-pretrain/Learning Rate": 3.308789345923442e-05, "Full-pretrain/Loss": 1.9441741704940796, "Full-pretrain/Loss (Raw)": 2.2423911094665527, "Full-pretrain/Step": 3941, "Full-pretrain/Step Time": 17.605963515117764} +{"Full-pretrain/Learning Rate": 3.3079858813019465e-05, "Full-pretrain/Loss": 1.9452813863754272, "Full-pretrain/Loss (Raw)": 2.0814380645751953, "Full-pretrain/Step": 3942, "Full-pretrain/Step Time": 17.606934716925025} +{"Full-pretrain/Learning Rate": 3.307182323479563e-05, "Full-pretrain/Loss": 1.9495787620544434, "Full-pretrain/Loss (Raw)": 2.008944511413574, "Full-pretrain/Step": 3943, "Full-pretrain/Step Time": 17.605293441563845} +{"Full-pretrain/Learning Rate": 3.306378672548982e-05, "Full-pretrain/Loss": 1.969141960144043, "Full-pretrain/Loss (Raw)": 2.0320944786071777, "Full-pretrain/Step": 3944, "Full-pretrain/Step Time": 17.60180643759668} +{"Full-pretrain/Learning Rate": 3.305574928602905e-05, "Full-pretrain/Loss": 1.963228702545166, "Full-pretrain/Loss (Raw)": 1.713073968887329, "Full-pretrain/Step": 3945, "Full-pretrain/Step Time": 17.60103450715542} +{"Full-pretrain/Learning Rate": 3.304771091734043e-05, "Full-pretrain/Loss": 1.9688268899917603, "Full-pretrain/Loss (Raw)": 2.025428295135498, "Full-pretrain/Step": 3946, "Full-pretrain/Step Time": 17.605503855273128} +{"Full-pretrain/Learning Rate": 3.3039671620351185e-05, "Full-pretrain/Loss": 1.975055456161499, "Full-pretrain/Loss (Raw)": 1.7934577465057373, "Full-pretrain/Step": 3947, "Full-pretrain/Step Time": 17.60170228779316} +{"Full-pretrain/Learning Rate": 3.3031631395988644e-05, "Full-pretrain/Loss": 2.0020956993103027, "Full-pretrain/Loss (Raw)": 2.042570114135742, "Full-pretrain/Step": 3948, "Full-pretrain/Step Time": 17.596759270876646} +{"Full-pretrain/Learning Rate": 3.302359024518024e-05, "Full-pretrain/Loss": 2.0112316608428955, "Full-pretrain/Loss (Raw)": 2.154008150100708, "Full-pretrain/Step": 3949, "Full-pretrain/Step Time": 17.59438810683787} +{"Full-pretrain/Learning Rate": 3.3015548168853525e-05, "Full-pretrain/Loss": 2.0090808868408203, "Full-pretrain/Loss (Raw)": 1.9229960441589355, "Full-pretrain/Step": 3950, "Full-pretrain/Step Time": 17.59812312759459} +{"Full-pretrain/Learning Rate": 3.300750516793614e-05, "Full-pretrain/Loss": 2.004354238510132, "Full-pretrain/Loss (Raw)": 1.9294955730438232, "Full-pretrain/Step": 3951, "Full-pretrain/Step Time": 17.59810083732009} +{"Full-pretrain/Learning Rate": 3.2999461243355854e-05, "Full-pretrain/Loss": 2.008350372314453, "Full-pretrain/Loss (Raw)": 2.2079780101776123, "Full-pretrain/Step": 3952, "Full-pretrain/Step Time": 17.59781420044601} +{"Full-pretrain/Learning Rate": 3.299141639604053e-05, "Full-pretrain/Loss": 2.013925790786743, "Full-pretrain/Loss (Raw)": 2.0532546043395996, "Full-pretrain/Step": 3953, "Full-pretrain/Step Time": 17.59463626332581} +{"Full-pretrain/Learning Rate": 3.298337062691812e-05, "Full-pretrain/Loss": 2.0100467205047607, "Full-pretrain/Loss (Raw)": 1.8702380657196045, "Full-pretrain/Step": 3954, "Full-pretrain/Step Time": 17.598399309441447} +{"Full-pretrain/Learning Rate": 3.297532393691672e-05, "Full-pretrain/Loss": 2.0076985359191895, "Full-pretrain/Loss (Raw)": 2.0248641967773438, "Full-pretrain/Step": 3955, "Full-pretrain/Step Time": 17.60461523756385} +{"Full-pretrain/Learning Rate": 3.29672763269645e-05, "Full-pretrain/Loss": 1.9953081607818604, "Full-pretrain/Loss (Raw)": 1.8574316501617432, "Full-pretrain/Step": 3956, "Full-pretrain/Step Time": 17.594971038401127} +{"Full-pretrain/Learning Rate": 3.295922779798976e-05, "Full-pretrain/Loss": 1.97995924949646, "Full-pretrain/Loss (Raw)": 1.8105952739715576, "Full-pretrain/Step": 3957, "Full-pretrain/Step Time": 17.6015204153955} +{"Full-pretrain/Learning Rate": 3.2951178350920895e-05, "Full-pretrain/Loss": 1.986737847328186, "Full-pretrain/Loss (Raw)": 2.1394238471984863, "Full-pretrain/Step": 3958, "Full-pretrain/Step Time": 17.601001223549247} +{"Full-pretrain/Learning Rate": 3.2943127986686393e-05, "Full-pretrain/Loss": 1.9881592988967896, "Full-pretrain/Loss (Raw)": 1.9251787662506104, "Full-pretrain/Step": 3959, "Full-pretrain/Step Time": 17.600543869659305} +{"Full-pretrain/Learning Rate": 3.293507670621488e-05, "Full-pretrain/Loss": 1.9860496520996094, "Full-pretrain/Loss (Raw)": 2.103454351425171, "Full-pretrain/Step": 3960, "Full-pretrain/Step Time": 17.59112479351461} +{"Full-pretrain/Learning Rate": 3.2927024510435055e-05, "Full-pretrain/Loss": 1.990344762802124, "Full-pretrain/Loss (Raw)": 2.1985583305358887, "Full-pretrain/Step": 3961, "Full-pretrain/Step Time": 17.58985654078424} +{"Full-pretrain/Learning Rate": 3.2918971400275734e-05, "Full-pretrain/Loss": 1.9877228736877441, "Full-pretrain/Loss (Raw)": 1.9222180843353271, "Full-pretrain/Step": 3962, "Full-pretrain/Step Time": 17.594877038151026} +{"Full-pretrain/Learning Rate": 3.2910917376665845e-05, "Full-pretrain/Loss": 1.9749610424041748, "Full-pretrain/Loss (Raw)": 1.8067278861999512, "Full-pretrain/Step": 3963, "Full-pretrain/Step Time": 17.587330793961883} +{"Full-pretrain/Learning Rate": 3.290286244053442e-05, "Full-pretrain/Loss": 1.9780992269515991, "Full-pretrain/Loss (Raw)": 2.1145057678222656, "Full-pretrain/Step": 3964, "Full-pretrain/Step Time": 17.587503725662827} +{"Full-pretrain/Learning Rate": 3.289480659281058e-05, "Full-pretrain/Loss": 1.9661306142807007, "Full-pretrain/Loss (Raw)": 1.8297789096832275, "Full-pretrain/Step": 3965, "Full-pretrain/Step Time": 17.584088729694486} +{"Full-pretrain/Learning Rate": 3.288674983442359e-05, "Full-pretrain/Loss": 1.9762383699417114, "Full-pretrain/Loss (Raw)": 2.2360081672668457, "Full-pretrain/Step": 3966, "Full-pretrain/Step Time": 17.583371566608548} +{"Full-pretrain/Learning Rate": 3.287869216630277e-05, "Full-pretrain/Loss": 1.9794414043426514, "Full-pretrain/Loss (Raw)": 2.2609925270080566, "Full-pretrain/Step": 3967, "Full-pretrain/Step Time": 17.582190364599228} +{"Full-pretrain/Learning Rate": 3.287063358937757e-05, "Full-pretrain/Loss": 1.9830570220947266, "Full-pretrain/Loss (Raw)": 2.0671651363372803, "Full-pretrain/Step": 3968, "Full-pretrain/Step Time": 17.583701446652412} +{"Full-pretrain/Learning Rate": 3.286257410457756e-05, "Full-pretrain/Loss": 1.9872349500656128, "Full-pretrain/Loss (Raw)": 2.0559191703796387, "Full-pretrain/Step": 3969, "Full-pretrain/Step Time": 17.5760463681072} +{"Full-pretrain/Learning Rate": 3.285451371283239e-05, "Full-pretrain/Loss": 1.991622805595398, "Full-pretrain/Loss (Raw)": 1.9594449996948242, "Full-pretrain/Step": 3970, "Full-pretrain/Step Time": 17.574590107426047} +{"Full-pretrain/Learning Rate": 3.2846452415071826e-05, "Full-pretrain/Loss": 2.009585380554199, "Full-pretrain/Loss (Raw)": 2.0426931381225586, "Full-pretrain/Step": 3971, "Full-pretrain/Step Time": 17.581694971770048} +{"Full-pretrain/Learning Rate": 3.283839021222573e-05, "Full-pretrain/Loss": 2.014892339706421, "Full-pretrain/Loss (Raw)": 2.0442280769348145, "Full-pretrain/Step": 3972, "Full-pretrain/Step Time": 17.57423562183976} +{"Full-pretrain/Learning Rate": 3.2830327105224074e-05, "Full-pretrain/Loss": 2.0012755393981934, "Full-pretrain/Loss (Raw)": 1.8066496849060059, "Full-pretrain/Step": 3973, "Full-pretrain/Step Time": 17.57446056045592} +{"Full-pretrain/Learning Rate": 3.282226309499694e-05, "Full-pretrain/Loss": 2.0000991821289062, "Full-pretrain/Loss (Raw)": 2.043795108795166, "Full-pretrain/Step": 3974, "Full-pretrain/Step Time": 17.576317079365253} +{"Full-pretrain/Learning Rate": 3.281419818247451e-05, "Full-pretrain/Loss": 1.994802713394165, "Full-pretrain/Loss (Raw)": 1.8394603729248047, "Full-pretrain/Step": 3975, "Full-pretrain/Step Time": 17.58590385131538} +{"Full-pretrain/Learning Rate": 3.280613236858707e-05, "Full-pretrain/Loss": 1.9903223514556885, "Full-pretrain/Loss (Raw)": 1.8887240886688232, "Full-pretrain/Step": 3976, "Full-pretrain/Step Time": 17.58022357709706} +{"Full-pretrain/Learning Rate": 3.2798065654265e-05, "Full-pretrain/Loss": 1.9917466640472412, "Full-pretrain/Loss (Raw)": 1.7586517333984375, "Full-pretrain/Step": 3977, "Full-pretrain/Step Time": 17.581003850325942} +{"Full-pretrain/Learning Rate": 3.2789998040438794e-05, "Full-pretrain/Loss": 1.9912242889404297, "Full-pretrain/Loss (Raw)": 2.0087080001831055, "Full-pretrain/Step": 3978, "Full-pretrain/Step Time": 17.582499738782644} +{"Full-pretrain/Learning Rate": 3.278192952803905e-05, "Full-pretrain/Loss": 1.9975392818450928, "Full-pretrain/Loss (Raw)": 1.9955374002456665, "Full-pretrain/Step": 3979, "Full-pretrain/Step Time": 17.590105621144176} +{"Full-pretrain/Learning Rate": 3.277386011799647e-05, "Full-pretrain/Loss": 1.9902163743972778, "Full-pretrain/Loss (Raw)": 1.8082410097122192, "Full-pretrain/Step": 3980, "Full-pretrain/Step Time": 17.58933520503342} +{"Full-pretrain/Learning Rate": 3.276578981124186e-05, "Full-pretrain/Loss": 1.9787871837615967, "Full-pretrain/Loss (Raw)": 1.7882733345031738, "Full-pretrain/Step": 3981, "Full-pretrain/Step Time": 17.582762407138944} +{"Full-pretrain/Learning Rate": 3.275771860870613e-05, "Full-pretrain/Loss": 1.9790887832641602, "Full-pretrain/Loss (Raw)": 1.9326480627059937, "Full-pretrain/Step": 3982, "Full-pretrain/Step Time": 17.58255704678595} +{"Full-pretrain/Learning Rate": 3.2749646511320276e-05, "Full-pretrain/Loss": 1.9857511520385742, "Full-pretrain/Loss (Raw)": 2.142693042755127, "Full-pretrain/Step": 3983, "Full-pretrain/Step Time": 17.58260622434318} +{"Full-pretrain/Learning Rate": 3.2741573520015425e-05, "Full-pretrain/Loss": 1.975865364074707, "Full-pretrain/Loss (Raw)": 1.8916274309158325, "Full-pretrain/Step": 3984, "Full-pretrain/Step Time": 17.582505386322737} +{"Full-pretrain/Learning Rate": 3.273349963572279e-05, "Full-pretrain/Loss": 1.973484992980957, "Full-pretrain/Loss (Raw)": 1.9770843982696533, "Full-pretrain/Step": 3985, "Full-pretrain/Step Time": 17.58224048279226} +{"Full-pretrain/Learning Rate": 3.272542485937369e-05, "Full-pretrain/Loss": 1.9797921180725098, "Full-pretrain/Loss (Raw)": 2.07206392288208, "Full-pretrain/Step": 3986, "Full-pretrain/Step Time": 17.581699086353183} +{"Full-pretrain/Learning Rate": 3.271734919189955e-05, "Full-pretrain/Loss": 1.9783916473388672, "Full-pretrain/Loss (Raw)": 1.9800539016723633, "Full-pretrain/Step": 3987, "Full-pretrain/Step Time": 17.578593514859676} +{"Full-pretrain/Learning Rate": 3.270927263423188e-05, "Full-pretrain/Loss": 1.9700238704681396, "Full-pretrain/Loss (Raw)": 1.5896574258804321, "Full-pretrain/Step": 3988, "Full-pretrain/Step Time": 17.577128069475293} +{"Full-pretrain/Learning Rate": 3.270119518730233e-05, "Full-pretrain/Loss": 1.9714415073394775, "Full-pretrain/Loss (Raw)": 1.8559651374816895, "Full-pretrain/Step": 3989, "Full-pretrain/Step Time": 17.57966350018978} +{"Full-pretrain/Learning Rate": 3.269311685204262e-05, "Full-pretrain/Loss": 1.9693998098373413, "Full-pretrain/Loss (Raw)": 2.074087142944336, "Full-pretrain/Step": 3990, "Full-pretrain/Step Time": 17.577277440577745} +{"Full-pretrain/Learning Rate": 3.268503762938458e-05, "Full-pretrain/Loss": 1.9704604148864746, "Full-pretrain/Loss (Raw)": 1.9591180086135864, "Full-pretrain/Step": 3991, "Full-pretrain/Step Time": 17.576915288344026} +{"Full-pretrain/Learning Rate": 3.267695752026016e-05, "Full-pretrain/Loss": 1.958676815032959, "Full-pretrain/Loss (Raw)": 1.7263789176940918, "Full-pretrain/Step": 3992, "Full-pretrain/Step Time": 17.578772194683552} +{"Full-pretrain/Learning Rate": 3.266887652560138e-05, "Full-pretrain/Loss": 1.9475864171981812, "Full-pretrain/Loss (Raw)": 1.843664526939392, "Full-pretrain/Step": 3993, "Full-pretrain/Step Time": 17.580990076065063} +{"Full-pretrain/Learning Rate": 3.26607946463404e-05, "Full-pretrain/Loss": 1.9513920545578003, "Full-pretrain/Loss (Raw)": 2.0440011024475098, "Full-pretrain/Step": 3994, "Full-pretrain/Step Time": 17.58094206266105} +{"Full-pretrain/Learning Rate": 3.265271188340944e-05, "Full-pretrain/Loss": 1.9577244520187378, "Full-pretrain/Loss (Raw)": 2.0093631744384766, "Full-pretrain/Step": 3995, "Full-pretrain/Step Time": 17.582333674654365} +{"Full-pretrain/Learning Rate": 3.264462823774085e-05, "Full-pretrain/Loss": 1.9566490650177002, "Full-pretrain/Loss (Raw)": 2.080096483230591, "Full-pretrain/Step": 3996, "Full-pretrain/Step Time": 17.57664305716753} +{"Full-pretrain/Learning Rate": 3.263654371026709e-05, "Full-pretrain/Loss": 1.960111379623413, "Full-pretrain/Loss (Raw)": 1.940567970275879, "Full-pretrain/Step": 3997, "Full-pretrain/Step Time": 17.576146695762873} +{"Full-pretrain/Learning Rate": 3.2628458301920685e-05, "Full-pretrain/Loss": 1.9457778930664062, "Full-pretrain/Loss (Raw)": 1.777341604232788, "Full-pretrain/Step": 3998, "Full-pretrain/Step Time": 17.5842762067914} +{"Full-pretrain/Learning Rate": 3.26203720136343e-05, "Full-pretrain/Loss": 1.9405068159103394, "Full-pretrain/Loss (Raw)": 2.092315912246704, "Full-pretrain/Step": 3999, "Full-pretrain/Step Time": 17.58200767636299} +{"Full-pretrain/Learning Rate": 3.2612284846340687e-05, "Full-pretrain/Loss": 1.938307523727417, "Full-pretrain/Loss (Raw)": 1.996789574623108, "Full-pretrain/Step": 4000, "Full-pretrain/Step Time": 17.5777688883245} +{"Full-pretrain/Learning Rate": 3.260419680097268e-05, "Full-pretrain/Loss": 1.9441261291503906, "Full-pretrain/Loss (Raw)": 2.24211049079895, "Full-pretrain/Step": 4001, "Full-pretrain/Step Time": 17.578776532784104} +{"Full-pretrain/Learning Rate": 3.2596107878463254e-05, "Full-pretrain/Loss": 1.9506137371063232, "Full-pretrain/Loss (Raw)": 2.16705322265625, "Full-pretrain/Step": 4002, "Full-pretrain/Step Time": 17.588872557505965} +{"Full-pretrain/Learning Rate": 3.258801807974545e-05, "Full-pretrain/Loss": 1.9500558376312256, "Full-pretrain/Loss (Raw)": 2.0248379707336426, "Full-pretrain/Step": 4003, "Full-pretrain/Step Time": 17.58149684406817} +{"Full-pretrain/Learning Rate": 3.257992740575243e-05, "Full-pretrain/Loss": 1.9478635787963867, "Full-pretrain/Loss (Raw)": 1.9740749597549438, "Full-pretrain/Step": 4004, "Full-pretrain/Step Time": 17.577673383057117} +{"Full-pretrain/Learning Rate": 3.257183585741745e-05, "Full-pretrain/Loss": 1.9543659687042236, "Full-pretrain/Loss (Raw)": 2.0147223472595215, "Full-pretrain/Step": 4005, "Full-pretrain/Step Time": 17.581796497106552} +{"Full-pretrain/Learning Rate": 3.2563743435673855e-05, "Full-pretrain/Loss": 1.960913062095642, "Full-pretrain/Loss (Raw)": 2.253305435180664, "Full-pretrain/Step": 4006, "Full-pretrain/Step Time": 17.584196301177144} +{"Full-pretrain/Learning Rate": 3.255565014145512e-05, "Full-pretrain/Loss": 1.968109369277954, "Full-pretrain/Loss (Raw)": 2.0697388648986816, "Full-pretrain/Step": 4007, "Full-pretrain/Step Time": 17.578602673485875} +{"Full-pretrain/Learning Rate": 3.2547555975694796e-05, "Full-pretrain/Loss": 1.967583417892456, "Full-pretrain/Loss (Raw)": 1.8718982934951782, "Full-pretrain/Step": 4008, "Full-pretrain/Step Time": 17.57899153791368} +{"Full-pretrain/Learning Rate": 3.253946093932654e-05, "Full-pretrain/Loss": 1.9825351238250732, "Full-pretrain/Loss (Raw)": 2.2371020317077637, "Full-pretrain/Step": 4009, "Full-pretrain/Step Time": 17.584517393261194} +{"Full-pretrain/Learning Rate": 3.2531365033284115e-05, "Full-pretrain/Loss": 1.977602481842041, "Full-pretrain/Loss (Raw)": 1.8508647680282593, "Full-pretrain/Step": 4010, "Full-pretrain/Step Time": 17.588190581649542} +{"Full-pretrain/Learning Rate": 3.252326825850139e-05, "Full-pretrain/Loss": 1.9783140420913696, "Full-pretrain/Loss (Raw)": 2.018307685852051, "Full-pretrain/Step": 4011, "Full-pretrain/Step Time": 17.58897497691214} +{"Full-pretrain/Learning Rate": 3.25151706159123e-05, "Full-pretrain/Loss": 1.9811830520629883, "Full-pretrain/Loss (Raw)": 1.9000496864318848, "Full-pretrain/Step": 4012, "Full-pretrain/Step Time": 17.587866697460413} +{"Full-pretrain/Learning Rate": 3.250707210645093e-05, "Full-pretrain/Loss": 1.9904930591583252, "Full-pretrain/Loss (Raw)": 2.0861940383911133, "Full-pretrain/Step": 4013, "Full-pretrain/Step Time": 17.595672108232975} +{"Full-pretrain/Learning Rate": 3.249897273105143e-05, "Full-pretrain/Loss": 1.9895107746124268, "Full-pretrain/Loss (Raw)": 1.901216983795166, "Full-pretrain/Step": 4014, "Full-pretrain/Step Time": 17.59946541674435} +{"Full-pretrain/Learning Rate": 3.249087249064805e-05, "Full-pretrain/Loss": 1.9829654693603516, "Full-pretrain/Loss (Raw)": 1.9332425594329834, "Full-pretrain/Step": 4015, "Full-pretrain/Step Time": 17.60571231506765} +{"Full-pretrain/Learning Rate": 3.248277138617517e-05, "Full-pretrain/Loss": 1.9871671199798584, "Full-pretrain/Loss (Raw)": 2.0260822772979736, "Full-pretrain/Step": 4016, "Full-pretrain/Step Time": 17.601302184164524} +{"Full-pretrain/Learning Rate": 3.247466941856724e-05, "Full-pretrain/Loss": 1.992459774017334, "Full-pretrain/Loss (Raw)": 2.1464483737945557, "Full-pretrain/Step": 4017, "Full-pretrain/Step Time": 17.604992497712374} +{"Full-pretrain/Learning Rate": 3.246656658875882e-05, "Full-pretrain/Loss": 1.9901788234710693, "Full-pretrain/Loss (Raw)": 1.9990696907043457, "Full-pretrain/Step": 4018, "Full-pretrain/Step Time": 17.60341641679406} +{"Full-pretrain/Learning Rate": 3.2458462897684566e-05, "Full-pretrain/Loss": 1.9908459186553955, "Full-pretrain/Loss (Raw)": 2.001403331756592, "Full-pretrain/Step": 4019, "Full-pretrain/Step Time": 17.599851839244366} +{"Full-pretrain/Learning Rate": 3.2450358346279234e-05, "Full-pretrain/Loss": 1.9989972114562988, "Full-pretrain/Loss (Raw)": 1.8504973649978638, "Full-pretrain/Step": 4020, "Full-pretrain/Step Time": 17.60315041616559} +{"Full-pretrain/Learning Rate": 3.2442252935477696e-05, "Full-pretrain/Loss": 1.9989597797393799, "Full-pretrain/Loss (Raw)": 1.8547700643539429, "Full-pretrain/Step": 4021, "Full-pretrain/Step Time": 17.60274694673717} +{"Full-pretrain/Learning Rate": 3.243414666621489e-05, "Full-pretrain/Loss": 1.9916715621948242, "Full-pretrain/Loss (Raw)": 1.8408637046813965, "Full-pretrain/Step": 4022, "Full-pretrain/Step Time": 17.608842618763447} +{"Full-pretrain/Learning Rate": 3.2426039539425876e-05, "Full-pretrain/Loss": 1.987508773803711, "Full-pretrain/Loss (Raw)": 1.8259071111679077, "Full-pretrain/Step": 4023, "Full-pretrain/Step Time": 17.609711572527885} +{"Full-pretrain/Learning Rate": 3.241793155604581e-05, "Full-pretrain/Loss": 1.9923555850982666, "Full-pretrain/Loss (Raw)": 1.8814775943756104, "Full-pretrain/Step": 4024, "Full-pretrain/Step Time": 17.60802522301674} +{"Full-pretrain/Learning Rate": 3.240982271700995e-05, "Full-pretrain/Loss": 1.9988694190979004, "Full-pretrain/Loss (Raw)": 2.0521080493927, "Full-pretrain/Step": 4025, "Full-pretrain/Step Time": 17.605270240455866} +{"Full-pretrain/Learning Rate": 3.2401713023253644e-05, "Full-pretrain/Loss": 1.996483325958252, "Full-pretrain/Loss (Raw)": 1.967648983001709, "Full-pretrain/Step": 4026, "Full-pretrain/Step Time": 17.60417964681983} +{"Full-pretrain/Learning Rate": 3.2393602475712344e-05, "Full-pretrain/Loss": 1.9941377639770508, "Full-pretrain/Loss (Raw)": 1.9342992305755615, "Full-pretrain/Step": 4027, "Full-pretrain/Step Time": 17.60421670228243} +{"Full-pretrain/Learning Rate": 3.23854910753216e-05, "Full-pretrain/Loss": 1.987497091293335, "Full-pretrain/Loss (Raw)": 1.8675947189331055, "Full-pretrain/Step": 4028, "Full-pretrain/Step Time": 17.604422563686967} +{"Full-pretrain/Learning Rate": 3.237737882301705e-05, "Full-pretrain/Loss": 1.9762144088745117, "Full-pretrain/Loss (Raw)": 1.579525351524353, "Full-pretrain/Step": 4029, "Full-pretrain/Step Time": 17.595704030245543} +{"Full-pretrain/Learning Rate": 3.236926571973444e-05, "Full-pretrain/Loss": 1.9795210361480713, "Full-pretrain/Loss (Raw)": 1.8831571340560913, "Full-pretrain/Step": 4030, "Full-pretrain/Step Time": 17.600742164999247} +{"Full-pretrain/Learning Rate": 3.2361151766409624e-05, "Full-pretrain/Loss": 1.986943006515503, "Full-pretrain/Loss (Raw)": 2.3298110961914062, "Full-pretrain/Step": 4031, "Full-pretrain/Step Time": 17.60587635450065} +{"Full-pretrain/Learning Rate": 3.2353036963978536e-05, "Full-pretrain/Loss": 1.9877679347991943, "Full-pretrain/Loss (Raw)": 2.0231895446777344, "Full-pretrain/Step": 4032, "Full-pretrain/Step Time": 17.604756209999323} +{"Full-pretrain/Learning Rate": 3.234492131337722e-05, "Full-pretrain/Loss": 1.9826793670654297, "Full-pretrain/Loss (Raw)": 2.0792794227600098, "Full-pretrain/Step": 4033, "Full-pretrain/Step Time": 17.59899189695716} +{"Full-pretrain/Learning Rate": 3.233680481554182e-05, "Full-pretrain/Loss": 1.9762537479400635, "Full-pretrain/Loss (Raw)": 1.9614304304122925, "Full-pretrain/Step": 4034, "Full-pretrain/Step Time": 17.60090520232916} +{"Full-pretrain/Learning Rate": 3.232868747140855e-05, "Full-pretrain/Loss": 1.9787218570709229, "Full-pretrain/Loss (Raw)": 2.1038150787353516, "Full-pretrain/Step": 4035, "Full-pretrain/Step Time": 17.603947581723332} +{"Full-pretrain/Learning Rate": 3.232056928191376e-05, "Full-pretrain/Loss": 1.9730961322784424, "Full-pretrain/Loss (Raw)": 1.794058084487915, "Full-pretrain/Step": 4036, "Full-pretrain/Step Time": 17.602495742961764} +{"Full-pretrain/Learning Rate": 3.231245024799388e-05, "Full-pretrain/Loss": 1.9639564752578735, "Full-pretrain/Loss (Raw)": 1.7222493886947632, "Full-pretrain/Step": 4037, "Full-pretrain/Step Time": 17.59875124692917} +{"Full-pretrain/Learning Rate": 3.2304330370585436e-05, "Full-pretrain/Loss": 1.955479383468628, "Full-pretrain/Loss (Raw)": 1.982038140296936, "Full-pretrain/Step": 4038, "Full-pretrain/Step Time": 17.593115340918303} +{"Full-pretrain/Learning Rate": 3.2296209650625044e-05, "Full-pretrain/Loss": 1.9569553136825562, "Full-pretrain/Loss (Raw)": 2.11696720123291, "Full-pretrain/Step": 4039, "Full-pretrain/Step Time": 17.596816316246986} +{"Full-pretrain/Learning Rate": 3.228808808904943e-05, "Full-pretrain/Loss": 1.9622368812561035, "Full-pretrain/Loss (Raw)": 2.040910482406616, "Full-pretrain/Step": 4040, "Full-pretrain/Step Time": 17.59701319411397} +{"Full-pretrain/Learning Rate": 3.227996568679542e-05, "Full-pretrain/Loss": 1.9575194120407104, "Full-pretrain/Loss (Raw)": 2.0861403942108154, "Full-pretrain/Step": 4041, "Full-pretrain/Step Time": 17.59204263612628} +{"Full-pretrain/Learning Rate": 3.2271842444799925e-05, "Full-pretrain/Loss": 1.9569497108459473, "Full-pretrain/Loss (Raw)": 1.8326367139816284, "Full-pretrain/Step": 4042, "Full-pretrain/Step Time": 17.591848796233535} +{"Full-pretrain/Learning Rate": 3.2263718363999964e-05, "Full-pretrain/Loss": 1.959201455116272, "Full-pretrain/Loss (Raw)": 2.090365409851074, "Full-pretrain/Step": 4043, "Full-pretrain/Step Time": 17.596035728231072} +{"Full-pretrain/Learning Rate": 3.2255593445332645e-05, "Full-pretrain/Loss": 1.9593307971954346, "Full-pretrain/Loss (Raw)": 1.9041874408721924, "Full-pretrain/Step": 4044, "Full-pretrain/Step Time": 17.59761267900467} +{"Full-pretrain/Learning Rate": 3.2247467689735164e-05, "Full-pretrain/Loss": 1.9421250820159912, "Full-pretrain/Loss (Raw)": 1.5356087684631348, "Full-pretrain/Step": 4045, "Full-pretrain/Step Time": 17.58738297969103} +{"Full-pretrain/Learning Rate": 3.2239341098144834e-05, "Full-pretrain/Loss": 1.9476115703582764, "Full-pretrain/Loss (Raw)": 2.076788902282715, "Full-pretrain/Step": 4046, "Full-pretrain/Step Time": 17.593370262533426} +{"Full-pretrain/Learning Rate": 3.2231213671499057e-05, "Full-pretrain/Loss": 1.938416600227356, "Full-pretrain/Loss (Raw)": 1.6390032768249512, "Full-pretrain/Step": 4047, "Full-pretrain/Step Time": 17.60266263410449} +{"Full-pretrain/Learning Rate": 3.2223085410735314e-05, "Full-pretrain/Loss": 1.9403647184371948, "Full-pretrain/Loss (Raw)": 2.0884206295013428, "Full-pretrain/Step": 4048, "Full-pretrain/Step Time": 17.59334180317819} +{"Full-pretrain/Learning Rate": 3.221495631679121e-05, "Full-pretrain/Loss": 1.9349696636199951, "Full-pretrain/Loss (Raw)": 1.973808765411377, "Full-pretrain/Step": 4049, "Full-pretrain/Step Time": 17.588825596496463} +{"Full-pretrain/Learning Rate": 3.220682639060444e-05, "Full-pretrain/Loss": 1.9382436275482178, "Full-pretrain/Loss (Raw)": 2.1038360595703125, "Full-pretrain/Step": 4050, "Full-pretrain/Step Time": 17.588945373892784} +{"Full-pretrain/Learning Rate": 3.219869563311277e-05, "Full-pretrain/Loss": 1.927444577217102, "Full-pretrain/Loss (Raw)": 1.655830979347229, "Full-pretrain/Step": 4051, "Full-pretrain/Step Time": 17.595645086839795} +{"Full-pretrain/Learning Rate": 3.219056404525409e-05, "Full-pretrain/Loss": 1.9237734079360962, "Full-pretrain/Loss (Raw)": 1.733020544052124, "Full-pretrain/Step": 4052, "Full-pretrain/Step Time": 17.594219028949738} +{"Full-pretrain/Learning Rate": 3.218243162796638e-05, "Full-pretrain/Loss": 1.9250431060791016, "Full-pretrain/Loss (Raw)": 1.895402193069458, "Full-pretrain/Step": 4053, "Full-pretrain/Step Time": 17.59285388700664} +{"Full-pretrain/Learning Rate": 3.217429838218769e-05, "Full-pretrain/Loss": 1.9314367771148682, "Full-pretrain/Loss (Raw)": 2.0454604625701904, "Full-pretrain/Step": 4054, "Full-pretrain/Step Time": 17.588340245187283} +{"Full-pretrain/Learning Rate": 3.2166164308856224e-05, "Full-pretrain/Loss": 1.9323201179504395, "Full-pretrain/Loss (Raw)": 1.8541717529296875, "Full-pretrain/Step": 4055, "Full-pretrain/Step Time": 17.60002326592803} +{"Full-pretrain/Learning Rate": 3.215802940891021e-05, "Full-pretrain/Loss": 1.9289207458496094, "Full-pretrain/Loss (Raw)": 1.772700309753418, "Full-pretrain/Step": 4056, "Full-pretrain/Step Time": 17.59812980145216} +{"Full-pretrain/Learning Rate": 3.2149893683288024e-05, "Full-pretrain/Loss": 1.9360487461090088, "Full-pretrain/Loss (Raw)": 2.280202865600586, "Full-pretrain/Step": 4057, "Full-pretrain/Step Time": 17.59927000105381} +{"Full-pretrain/Learning Rate": 3.214175713292811e-05, "Full-pretrain/Loss": 1.946716547012329, "Full-pretrain/Loss (Raw)": 2.3090176582336426, "Full-pretrain/Step": 4058, "Full-pretrain/Step Time": 17.600519627332687} +{"Full-pretrain/Learning Rate": 3.213361975876902e-05, "Full-pretrain/Loss": 1.9473390579223633, "Full-pretrain/Loss (Raw)": 1.9542202949523926, "Full-pretrain/Step": 4059, "Full-pretrain/Step Time": 17.60256893746555} +{"Full-pretrain/Learning Rate": 3.21254815617494e-05, "Full-pretrain/Loss": 1.9476698637008667, "Full-pretrain/Loss (Raw)": 1.8781816959381104, "Full-pretrain/Step": 4060, "Full-pretrain/Step Time": 17.595682149752975} +{"Full-pretrain/Learning Rate": 3.211734254280799e-05, "Full-pretrain/Loss": 1.9591212272644043, "Full-pretrain/Loss (Raw)": 1.9459675550460815, "Full-pretrain/Step": 4061, "Full-pretrain/Step Time": 17.597954446449876} +{"Full-pretrain/Learning Rate": 3.210920270288362e-05, "Full-pretrain/Loss": 1.9612761735916138, "Full-pretrain/Loss (Raw)": 1.9521141052246094, "Full-pretrain/Step": 4062, "Full-pretrain/Step Time": 17.593884704634547} +{"Full-pretrain/Learning Rate": 3.2101062042915215e-05, "Full-pretrain/Loss": 1.9470102787017822, "Full-pretrain/Loss (Raw)": 1.8733044862747192, "Full-pretrain/Step": 4063, "Full-pretrain/Step Time": 17.594737824052572} +{"Full-pretrain/Learning Rate": 3.209292056384179e-05, "Full-pretrain/Loss": 1.9458246231079102, "Full-pretrain/Loss (Raw)": 1.9852490425109863, "Full-pretrain/Step": 4064, "Full-pretrain/Step Time": 17.597800171002746} +{"Full-pretrain/Learning Rate": 3.2084778266602476e-05, "Full-pretrain/Loss": 1.9469645023345947, "Full-pretrain/Loss (Raw)": 2.115753650665283, "Full-pretrain/Step": 4065, "Full-pretrain/Step Time": 17.59553817100823} +{"Full-pretrain/Learning Rate": 3.207663515213648e-05, "Full-pretrain/Loss": 1.9418469667434692, "Full-pretrain/Loss (Raw)": 1.7976692914962769, "Full-pretrain/Step": 4066, "Full-pretrain/Step Time": 17.590073032304645} +{"Full-pretrain/Learning Rate": 3.206849122138311e-05, "Full-pretrain/Loss": 1.9350295066833496, "Full-pretrain/Loss (Raw)": 1.885655164718628, "Full-pretrain/Step": 4067, "Full-pretrain/Step Time": 17.592806523665786} +{"Full-pretrain/Learning Rate": 3.2060346475281755e-05, "Full-pretrain/Loss": 1.9455044269561768, "Full-pretrain/Loss (Raw)": 2.1292600631713867, "Full-pretrain/Step": 4068, "Full-pretrain/Step Time": 17.599298717454076} +{"Full-pretrain/Learning Rate": 3.205220091477191e-05, "Full-pretrain/Loss": 1.956898808479309, "Full-pretrain/Loss (Raw)": 2.0868682861328125, "Full-pretrain/Step": 4069, "Full-pretrain/Step Time": 17.60042213462293} +{"Full-pretrain/Learning Rate": 3.204405454079318e-05, "Full-pretrain/Loss": 1.9605584144592285, "Full-pretrain/Loss (Raw)": 2.099144458770752, "Full-pretrain/Step": 4070, "Full-pretrain/Step Time": 17.598093697801232} +{"Full-pretrain/Learning Rate": 3.2035907354285234e-05, "Full-pretrain/Loss": 1.9456431865692139, "Full-pretrain/Loss (Raw)": 1.639681339263916, "Full-pretrain/Step": 4071, "Full-pretrain/Step Time": 17.60190466232598} +{"Full-pretrain/Learning Rate": 3.2027759356187844e-05, "Full-pretrain/Loss": 1.9430485963821411, "Full-pretrain/Loss (Raw)": 1.9578845500946045, "Full-pretrain/Step": 4072, "Full-pretrain/Step Time": 17.6061257943511} +{"Full-pretrain/Learning Rate": 3.201961054744088e-05, "Full-pretrain/Loss": 1.93544602394104, "Full-pretrain/Loss (Raw)": 1.8428558111190796, "Full-pretrain/Step": 4073, "Full-pretrain/Step Time": 17.605728236958385} +{"Full-pretrain/Learning Rate": 3.201146092898431e-05, "Full-pretrain/Loss": 1.9462566375732422, "Full-pretrain/Loss (Raw)": 2.1785738468170166, "Full-pretrain/Step": 4074, "Full-pretrain/Step Time": 17.59879857674241} +{"Full-pretrain/Learning Rate": 3.2003310501758174e-05, "Full-pretrain/Loss": 1.9434694051742554, "Full-pretrain/Loss (Raw)": 2.0011777877807617, "Full-pretrain/Step": 4075, "Full-pretrain/Step Time": 17.60410082899034} +{"Full-pretrain/Learning Rate": 3.1995159266702644e-05, "Full-pretrain/Loss": 1.9397251605987549, "Full-pretrain/Loss (Raw)": 1.7843726873397827, "Full-pretrain/Step": 4076, "Full-pretrain/Step Time": 17.612514197826385} +{"Full-pretrain/Learning Rate": 3.1987007224757946e-05, "Full-pretrain/Loss": 1.9506572484970093, "Full-pretrain/Loss (Raw)": 1.885434627532959, "Full-pretrain/Step": 4077, "Full-pretrain/Step Time": 17.609693877398968} +{"Full-pretrain/Learning Rate": 3.197885437686443e-05, "Full-pretrain/Loss": 1.9525146484375, "Full-pretrain/Loss (Raw)": 2.1362223625183105, "Full-pretrain/Step": 4078, "Full-pretrain/Step Time": 17.60298838093877} +{"Full-pretrain/Learning Rate": 3.1970700723962504e-05, "Full-pretrain/Loss": 1.9667153358459473, "Full-pretrain/Loss (Raw)": 2.093430995941162, "Full-pretrain/Step": 4079, "Full-pretrain/Step Time": 17.602426003664732} +{"Full-pretrain/Learning Rate": 3.1962546266992696e-05, "Full-pretrain/Loss": 1.9665334224700928, "Full-pretrain/Loss (Raw)": 2.082596778869629, "Full-pretrain/Step": 4080, "Full-pretrain/Step Time": 17.606291556730866} +{"Full-pretrain/Learning Rate": 3.1954391006895637e-05, "Full-pretrain/Loss": 1.9689993858337402, "Full-pretrain/Loss (Raw)": 2.0527195930480957, "Full-pretrain/Step": 4081, "Full-pretrain/Step Time": 17.60511029884219} +{"Full-pretrain/Learning Rate": 3.1946234944612006e-05, "Full-pretrain/Loss": 1.9676446914672852, "Full-pretrain/Loss (Raw)": 2.0604872703552246, "Full-pretrain/Step": 4082, "Full-pretrain/Step Time": 17.59758217073977} +{"Full-pretrain/Learning Rate": 3.193807808108262e-05, "Full-pretrain/Loss": 1.9836382865905762, "Full-pretrain/Loss (Raw)": 2.167625904083252, "Full-pretrain/Step": 4083, "Full-pretrain/Step Time": 17.59768201597035} +{"Full-pretrain/Learning Rate": 3.1929920417248364e-05, "Full-pretrain/Loss": 1.9890881776809692, "Full-pretrain/Loss (Raw)": 1.907414197921753, "Full-pretrain/Step": 4084, "Full-pretrain/Step Time": 17.597726041451097} +{"Full-pretrain/Learning Rate": 3.192176195405023e-05, "Full-pretrain/Loss": 1.992793321609497, "Full-pretrain/Loss (Raw)": 2.0139687061309814, "Full-pretrain/Step": 4085, "Full-pretrain/Step Time": 17.597566675394773} +{"Full-pretrain/Learning Rate": 3.191360269242928e-05, "Full-pretrain/Loss": 1.9944082498550415, "Full-pretrain/Loss (Raw)": 2.097136974334717, "Full-pretrain/Step": 4086, "Full-pretrain/Step Time": 17.59476781450212} +{"Full-pretrain/Learning Rate": 3.190544263332669e-05, "Full-pretrain/Loss": 1.9955979585647583, "Full-pretrain/Loss (Raw)": 1.8922420740127563, "Full-pretrain/Step": 4087, "Full-pretrain/Step Time": 17.59660050086677} +{"Full-pretrain/Learning Rate": 3.1897281777683715e-05, "Full-pretrain/Loss": 2.009312391281128, "Full-pretrain/Loss (Raw)": 2.2115635871887207, "Full-pretrain/Step": 4088, "Full-pretrain/Step Time": 17.603486040607095} +{"Full-pretrain/Learning Rate": 3.1889120126441725e-05, "Full-pretrain/Loss": 2.0106825828552246, "Full-pretrain/Loss (Raw)": 2.3240480422973633, "Full-pretrain/Step": 4089, "Full-pretrain/Step Time": 17.608401745557785} +{"Full-pretrain/Learning Rate": 3.188095768054214e-05, "Full-pretrain/Loss": 1.9996440410614014, "Full-pretrain/Loss (Raw)": 1.9557840824127197, "Full-pretrain/Step": 4090, "Full-pretrain/Step Time": 17.60391066595912} +{"Full-pretrain/Learning Rate": 3.18727944409265e-05, "Full-pretrain/Loss": 1.9993408918380737, "Full-pretrain/Loss (Raw)": 1.9445221424102783, "Full-pretrain/Step": 4091, "Full-pretrain/Step Time": 17.605022184550762} +{"Full-pretrain/Learning Rate": 3.186463040853645e-05, "Full-pretrain/Loss": 1.9927252531051636, "Full-pretrain/Loss (Raw)": 1.6664780378341675, "Full-pretrain/Step": 4092, "Full-pretrain/Step Time": 17.60920038074255} +{"Full-pretrain/Learning Rate": 3.185646558431368e-05, "Full-pretrain/Loss": 1.9882709980010986, "Full-pretrain/Loss (Raw)": 1.8034327030181885, "Full-pretrain/Step": 4093, "Full-pretrain/Step Time": 17.611169207841158} +{"Full-pretrain/Learning Rate": 3.184829996920002e-05, "Full-pretrain/Loss": 1.9880032539367676, "Full-pretrain/Loss (Raw)": 1.9435505867004395, "Full-pretrain/Step": 4094, "Full-pretrain/Step Time": 17.60570266842842} +{"Full-pretrain/Learning Rate": 3.184013356413737e-05, "Full-pretrain/Loss": 1.9989573955535889, "Full-pretrain/Loss (Raw)": 2.223834991455078, "Full-pretrain/Step": 4095, "Full-pretrain/Step Time": 17.60421585291624} +{"Full-pretrain/Learning Rate": 3.183196637006771e-05, "Full-pretrain/Loss": 2.0005033016204834, "Full-pretrain/Loss (Raw)": 2.0347142219543457, "Full-pretrain/Step": 4096, "Full-pretrain/Step Time": 17.60595614090562} +{"Full-pretrain/Learning Rate": 3.1823798387933134e-05, "Full-pretrain/Loss": 1.9992384910583496, "Full-pretrain/Loss (Raw)": 2.0752804279327393, "Full-pretrain/Step": 4097, "Full-pretrain/Step Time": 17.610551945865154} +{"Full-pretrain/Learning Rate": 3.181562961867581e-05, "Full-pretrain/Loss": 2.006659746170044, "Full-pretrain/Loss (Raw)": 2.0351479053497314, "Full-pretrain/Step": 4098, "Full-pretrain/Step Time": 17.6095247939229} +{"Full-pretrain/Learning Rate": 3.1807460063238e-05, "Full-pretrain/Loss": 2.0047998428344727, "Full-pretrain/Loss (Raw)": 1.8261364698410034, "Full-pretrain/Step": 4099, "Full-pretrain/Step Time": 17.599875938147306} +{"Full-pretrain/Learning Rate": 3.1799289722562075e-05, "Full-pretrain/Loss": 2.00640869140625, "Full-pretrain/Loss (Raw)": 2.1807470321655273, "Full-pretrain/Step": 4100, "Full-pretrain/Step Time": 17.60568996705115} +{"Full-pretrain/Learning Rate": 3.179111859759046e-05, "Full-pretrain/Loss": 2.00524640083313, "Full-pretrain/Loss (Raw)": 2.049675226211548, "Full-pretrain/Step": 4101, "Full-pretrain/Step Time": 17.607293711975217} +{"Full-pretrain/Learning Rate": 3.178294668926571e-05, "Full-pretrain/Loss": 1.994192361831665, "Full-pretrain/Loss (Raw)": 1.7454110383987427, "Full-pretrain/Step": 4102, "Full-pretrain/Step Time": 17.61053631082177} +{"Full-pretrain/Learning Rate": 3.177477399853045e-05, "Full-pretrain/Loss": 2.009732723236084, "Full-pretrain/Loss (Raw)": 2.1369807720184326, "Full-pretrain/Step": 4103, "Full-pretrain/Step Time": 17.603158075362444} +{"Full-pretrain/Learning Rate": 3.176660052632737e-05, "Full-pretrain/Loss": 2.00016713142395, "Full-pretrain/Loss (Raw)": 1.6517823934555054, "Full-pretrain/Step": 4104, "Full-pretrain/Step Time": 17.60028793103993} +{"Full-pretrain/Learning Rate": 3.1758426273599315e-05, "Full-pretrain/Loss": 1.99380362033844, "Full-pretrain/Loss (Raw)": 1.6392195224761963, "Full-pretrain/Step": 4105, "Full-pretrain/Step Time": 17.60205029323697} +{"Full-pretrain/Learning Rate": 3.1750251241289145e-05, "Full-pretrain/Loss": 1.9831032752990723, "Full-pretrain/Loss (Raw)": 1.8361647129058838, "Full-pretrain/Step": 4106, "Full-pretrain/Step Time": 17.60194693878293} +{"Full-pretrain/Learning Rate": 3.174207543033988e-05, "Full-pretrain/Loss": 1.9823681116104126, "Full-pretrain/Loss (Raw)": 1.9776521921157837, "Full-pretrain/Step": 4107, "Full-pretrain/Step Time": 17.59666564501822} +{"Full-pretrain/Learning Rate": 3.173389884169458e-05, "Full-pretrain/Loss": 1.986422061920166, "Full-pretrain/Loss (Raw)": 1.914102554321289, "Full-pretrain/Step": 4108, "Full-pretrain/Step Time": 17.59158606082201} +{"Full-pretrain/Learning Rate": 3.1725721476296416e-05, "Full-pretrain/Loss": 1.9866852760314941, "Full-pretrain/Loss (Raw)": 1.8938534259796143, "Full-pretrain/Step": 4109, "Full-pretrain/Step Time": 17.601456206291914} +{"Full-pretrain/Learning Rate": 3.1717543335088646e-05, "Full-pretrain/Loss": 1.9736545085906982, "Full-pretrain/Loss (Raw)": 1.7192425727844238, "Full-pretrain/Step": 4110, "Full-pretrain/Step Time": 17.59553986415267} +{"Full-pretrain/Learning Rate": 3.1709364419014615e-05, "Full-pretrain/Loss": 1.9645836353302002, "Full-pretrain/Loss (Raw)": 1.8031599521636963, "Full-pretrain/Step": 4111, "Full-pretrain/Step Time": 17.598324835300446} +{"Full-pretrain/Learning Rate": 3.170118472901775e-05, "Full-pretrain/Loss": 1.9551341533660889, "Full-pretrain/Loss (Raw)": 1.780212163925171, "Full-pretrain/Step": 4112, "Full-pretrain/Step Time": 17.5933137871325} +{"Full-pretrain/Learning Rate": 3.1693004266041584e-05, "Full-pretrain/Loss": 1.9442625045776367, "Full-pretrain/Loss (Raw)": 1.7048254013061523, "Full-pretrain/Step": 4113, "Full-pretrain/Step Time": 17.602530863136053} +{"Full-pretrain/Learning Rate": 3.168482303102972e-05, "Full-pretrain/Loss": 1.9446338415145874, "Full-pretrain/Loss (Raw)": 2.072370767593384, "Full-pretrain/Step": 4114, "Full-pretrain/Step Time": 17.595107294619083} +{"Full-pretrain/Learning Rate": 3.1676641024925875e-05, "Full-pretrain/Loss": 1.9381120204925537, "Full-pretrain/Loss (Raw)": 1.9589303731918335, "Full-pretrain/Step": 4115, "Full-pretrain/Step Time": 17.600239161401987} +{"Full-pretrain/Learning Rate": 3.166845824867384e-05, "Full-pretrain/Loss": 1.9370064735412598, "Full-pretrain/Loss (Raw)": 1.8720341920852661, "Full-pretrain/Step": 4116, "Full-pretrain/Step Time": 17.59766503237188} +{"Full-pretrain/Learning Rate": 3.166027470321748e-05, "Full-pretrain/Loss": 1.9308736324310303, "Full-pretrain/Loss (Raw)": 1.8177216053009033, "Full-pretrain/Step": 4117, "Full-pretrain/Step Time": 17.598203813657165} +{"Full-pretrain/Learning Rate": 3.1652090389500776e-05, "Full-pretrain/Loss": 1.9254952669143677, "Full-pretrain/Loss (Raw)": 1.9250255823135376, "Full-pretrain/Step": 4118, "Full-pretrain/Step Time": 17.60040322691202} +{"Full-pretrain/Learning Rate": 3.164390530846779e-05, "Full-pretrain/Loss": 1.9283027648925781, "Full-pretrain/Loss (Raw)": 1.9820809364318848, "Full-pretrain/Step": 4119, "Full-pretrain/Step Time": 17.60181526467204} +{"Full-pretrain/Learning Rate": 3.163571946106265e-05, "Full-pretrain/Loss": 1.9235643148422241, "Full-pretrain/Loss (Raw)": 2.0599350929260254, "Full-pretrain/Step": 4120, "Full-pretrain/Step Time": 17.601026410236955} +{"Full-pretrain/Learning Rate": 3.162753284822962e-05, "Full-pretrain/Loss": 1.9132434129714966, "Full-pretrain/Loss (Raw)": 1.9937818050384521, "Full-pretrain/Step": 4121, "Full-pretrain/Step Time": 17.597742930054665} +{"Full-pretrain/Learning Rate": 3.161934547091299e-05, "Full-pretrain/Loss": 1.9130284786224365, "Full-pretrain/Loss (Raw)": 1.9489054679870605, "Full-pretrain/Step": 4122, "Full-pretrain/Step Time": 17.599299922585487} +{"Full-pretrain/Learning Rate": 3.1611157330057185e-05, "Full-pretrain/Loss": 1.9159108400344849, "Full-pretrain/Loss (Raw)": 2.036756753921509, "Full-pretrain/Step": 4123, "Full-pretrain/Step Time": 17.59766684472561} +{"Full-pretrain/Learning Rate": 3.160296842660671e-05, "Full-pretrain/Loss": 1.925502061843872, "Full-pretrain/Loss (Raw)": 1.9733965396881104, "Full-pretrain/Step": 4124, "Full-pretrain/Step Time": 17.599053367972374} +{"Full-pretrain/Learning Rate": 3.159477876150615e-05, "Full-pretrain/Loss": 1.9332369565963745, "Full-pretrain/Loss (Raw)": 2.0509510040283203, "Full-pretrain/Step": 4125, "Full-pretrain/Step Time": 17.601696083322167} +{"Full-pretrain/Learning Rate": 3.158658833570017e-05, "Full-pretrain/Loss": 1.9353207349777222, "Full-pretrain/Loss (Raw)": 2.0102293491363525, "Full-pretrain/Step": 4126, "Full-pretrain/Step Time": 17.59622191824019} +{"Full-pretrain/Learning Rate": 3.157839715013355e-05, "Full-pretrain/Loss": 1.9244279861450195, "Full-pretrain/Loss (Raw)": 1.8752686977386475, "Full-pretrain/Step": 4127, "Full-pretrain/Step Time": 17.59885785356164} +{"Full-pretrain/Learning Rate": 3.1570205205751125e-05, "Full-pretrain/Loss": 1.9216655492782593, "Full-pretrain/Loss (Raw)": 1.9463144540786743, "Full-pretrain/Step": 4128, "Full-pretrain/Step Time": 17.600015211850405} +{"Full-pretrain/Learning Rate": 3.156201250349784e-05, "Full-pretrain/Loss": 1.9243903160095215, "Full-pretrain/Loss (Raw)": 2.162475347518921, "Full-pretrain/Step": 4129, "Full-pretrain/Step Time": 17.602110769599676} +{"Full-pretrain/Learning Rate": 3.155381904431872e-05, "Full-pretrain/Loss": 1.9224048852920532, "Full-pretrain/Loss (Raw)": 1.9716145992279053, "Full-pretrain/Step": 4130, "Full-pretrain/Step Time": 17.59112622961402} +{"Full-pretrain/Learning Rate": 3.154562482915887e-05, "Full-pretrain/Loss": 1.9283323287963867, "Full-pretrain/Loss (Raw)": 2.0158140659332275, "Full-pretrain/Step": 4131, "Full-pretrain/Step Time": 17.59710907191038} +{"Full-pretrain/Learning Rate": 3.15374298589635e-05, "Full-pretrain/Loss": 1.9188141822814941, "Full-pretrain/Loss (Raw)": 1.8761651515960693, "Full-pretrain/Step": 4132, "Full-pretrain/Step Time": 17.596510741859674} +{"Full-pretrain/Learning Rate": 3.1529234134677896e-05, "Full-pretrain/Loss": 1.9133858680725098, "Full-pretrain/Loss (Raw)": 1.8759713172912598, "Full-pretrain/Step": 4133, "Full-pretrain/Step Time": 17.598379952833056} +{"Full-pretrain/Learning Rate": 3.152103765724743e-05, "Full-pretrain/Loss": 1.918768048286438, "Full-pretrain/Loss (Raw)": 1.917639970779419, "Full-pretrain/Step": 4134, "Full-pretrain/Step Time": 17.597493708133698} +{"Full-pretrain/Learning Rate": 3.151284042761755e-05, "Full-pretrain/Loss": 1.9223122596740723, "Full-pretrain/Loss (Raw)": 2.2503936290740967, "Full-pretrain/Step": 4135, "Full-pretrain/Step Time": 17.591801211237907} +{"Full-pretrain/Learning Rate": 3.150464244673383e-05, "Full-pretrain/Loss": 1.928511619567871, "Full-pretrain/Loss (Raw)": 1.8501662015914917, "Full-pretrain/Step": 4136, "Full-pretrain/Step Time": 17.597531074658036} +{"Full-pretrain/Learning Rate": 3.149644371554189e-05, "Full-pretrain/Loss": 1.9337239265441895, "Full-pretrain/Loss (Raw)": 1.8060072660446167, "Full-pretrain/Step": 4137, "Full-pretrain/Step Time": 17.590656535699964} +{"Full-pretrain/Learning Rate": 3.148824423498744e-05, "Full-pretrain/Loss": 1.946317195892334, "Full-pretrain/Loss (Raw)": 2.239149332046509, "Full-pretrain/Step": 4138, "Full-pretrain/Step Time": 17.58621021732688} +{"Full-pretrain/Learning Rate": 3.14800440060163e-05, "Full-pretrain/Loss": 1.9439303874969482, "Full-pretrain/Loss (Raw)": 1.9012763500213623, "Full-pretrain/Step": 4139, "Full-pretrain/Step Time": 17.585780581459403} +{"Full-pretrain/Learning Rate": 3.147184302957436e-05, "Full-pretrain/Loss": 1.938948392868042, "Full-pretrain/Loss (Raw)": 1.7546782493591309, "Full-pretrain/Step": 4140, "Full-pretrain/Step Time": 17.59101228788495} +{"Full-pretrain/Learning Rate": 3.1463641306607604e-05, "Full-pretrain/Loss": 1.9475197792053223, "Full-pretrain/Loss (Raw)": 2.1681413650512695, "Full-pretrain/Step": 4141, "Full-pretrain/Step Time": 17.587812328711152} +{"Full-pretrain/Learning Rate": 3.14554388380621e-05, "Full-pretrain/Loss": 1.954863429069519, "Full-pretrain/Loss (Raw)": 1.9542371034622192, "Full-pretrain/Step": 4142, "Full-pretrain/Step Time": 17.582245726138353} +{"Full-pretrain/Learning Rate": 3.144723562488398e-05, "Full-pretrain/Loss": 1.9595988988876343, "Full-pretrain/Loss (Raw)": 1.9546961784362793, "Full-pretrain/Step": 4143, "Full-pretrain/Step Time": 17.58068729005754} +{"Full-pretrain/Learning Rate": 3.143903166801951e-05, "Full-pretrain/Loss": 1.9642584323883057, "Full-pretrain/Loss (Raw)": 1.929318904876709, "Full-pretrain/Step": 4144, "Full-pretrain/Step Time": 17.583492951467633} +{"Full-pretrain/Learning Rate": 3.1430826968415e-05, "Full-pretrain/Loss": 1.9701671600341797, "Full-pretrain/Loss (Raw)": 1.893899917602539, "Full-pretrain/Step": 4145, "Full-pretrain/Step Time": 17.57863483019173} +{"Full-pretrain/Learning Rate": 3.142262152701685e-05, "Full-pretrain/Loss": 1.9606963396072388, "Full-pretrain/Loss (Raw)": 1.7693073749542236, "Full-pretrain/Step": 4146, "Full-pretrain/Step Time": 17.583040580153465} +{"Full-pretrain/Learning Rate": 3.141441534477158e-05, "Full-pretrain/Loss": 1.966376543045044, "Full-pretrain/Loss (Raw)": 2.1406984329223633, "Full-pretrain/Step": 4147, "Full-pretrain/Step Time": 17.586542846634984} +{"Full-pretrain/Learning Rate": 3.140620842262573e-05, "Full-pretrain/Loss": 1.967878818511963, "Full-pretrain/Loss (Raw)": 1.9201076030731201, "Full-pretrain/Step": 4148, "Full-pretrain/Step Time": 17.582642575725913} +{"Full-pretrain/Learning Rate": 3.1398000761526e-05, "Full-pretrain/Loss": 1.9763448238372803, "Full-pretrain/Loss (Raw)": 2.0886306762695312, "Full-pretrain/Step": 4149, "Full-pretrain/Step Time": 17.580726392567158} +{"Full-pretrain/Learning Rate": 3.138979236241914e-05, "Full-pretrain/Loss": 1.9823594093322754, "Full-pretrain/Loss (Raw)": 2.1174962520599365, "Full-pretrain/Step": 4150, "Full-pretrain/Step Time": 17.573907434940338} +{"Full-pretrain/Learning Rate": 3.1381583226251965e-05, "Full-pretrain/Loss": 1.9837429523468018, "Full-pretrain/Loss (Raw)": 2.0263478755950928, "Full-pretrain/Step": 4151, "Full-pretrain/Step Time": 17.569278221577406} +{"Full-pretrain/Learning Rate": 3.1373373353971416e-05, "Full-pretrain/Loss": 1.9818106889724731, "Full-pretrain/Loss (Raw)": 1.9981082677841187, "Full-pretrain/Step": 4152, "Full-pretrain/Step Time": 17.570263855159283} +{"Full-pretrain/Learning Rate": 3.136516274652449e-05, "Full-pretrain/Loss": 1.985547423362732, "Full-pretrain/Loss (Raw)": 2.1133532524108887, "Full-pretrain/Step": 4153, "Full-pretrain/Step Time": 17.564974803477526} +{"Full-pretrain/Learning Rate": 3.135695140485827e-05, "Full-pretrain/Loss": 1.9811687469482422, "Full-pretrain/Loss (Raw)": 1.808788776397705, "Full-pretrain/Step": 4154, "Full-pretrain/Step Time": 17.562234718352556} +{"Full-pretrain/Learning Rate": 3.134873932991995e-05, "Full-pretrain/Loss": 1.9841760396957397, "Full-pretrain/Loss (Raw)": 2.1329894065856934, "Full-pretrain/Step": 4155, "Full-pretrain/Step Time": 17.56157765723765} +{"Full-pretrain/Learning Rate": 3.134052652265677e-05, "Full-pretrain/Loss": 1.9780471324920654, "Full-pretrain/Loss (Raw)": 1.7772767543792725, "Full-pretrain/Step": 4156, "Full-pretrain/Step Time": 17.560439996421337} +{"Full-pretrain/Learning Rate": 3.133231298401608e-05, "Full-pretrain/Loss": 1.9715458154678345, "Full-pretrain/Loss (Raw)": 1.8429009914398193, "Full-pretrain/Step": 4157, "Full-pretrain/Step Time": 17.561665501445532} +{"Full-pretrain/Learning Rate": 3.132409871494533e-05, "Full-pretrain/Loss": 1.9668241739273071, "Full-pretrain/Loss (Raw)": 1.8591383695602417, "Full-pretrain/Step": 4158, "Full-pretrain/Step Time": 17.558914717286825} +{"Full-pretrain/Learning Rate": 3.1315883716392e-05, "Full-pretrain/Loss": 1.969272494316101, "Full-pretrain/Loss (Raw)": 1.9536149501800537, "Full-pretrain/Step": 4159, "Full-pretrain/Step Time": 17.556489314883947} +{"Full-pretrain/Learning Rate": 3.130766798930371e-05, "Full-pretrain/Loss": 1.9673173427581787, "Full-pretrain/Loss (Raw)": 1.8837498426437378, "Full-pretrain/Step": 4160, "Full-pretrain/Step Time": 17.559321554377675} +{"Full-pretrain/Learning Rate": 3.1299451534628135e-05, "Full-pretrain/Loss": 1.963021993637085, "Full-pretrain/Loss (Raw)": 2.0250234603881836, "Full-pretrain/Step": 4161, "Full-pretrain/Step Time": 17.562131129205227} +{"Full-pretrain/Learning Rate": 3.129123435331304e-05, "Full-pretrain/Loss": 1.9503767490386963, "Full-pretrain/Loss (Raw)": 1.5669682025909424, "Full-pretrain/Step": 4162, "Full-pretrain/Step Time": 17.558234859257936} +{"Full-pretrain/Learning Rate": 3.128301644630627e-05, "Full-pretrain/Loss": 1.9425369501113892, "Full-pretrain/Loss (Raw)": 1.7649396657943726, "Full-pretrain/Step": 4163, "Full-pretrain/Step Time": 17.559070961549878} +{"Full-pretrain/Learning Rate": 3.127479781455576e-05, "Full-pretrain/Loss": 1.946616530418396, "Full-pretrain/Loss (Raw)": 2.0067129135131836, "Full-pretrain/Step": 4164, "Full-pretrain/Step Time": 17.558874836191535} +{"Full-pretrain/Learning Rate": 3.126657845900952e-05, "Full-pretrain/Loss": 1.956244707107544, "Full-pretrain/Loss (Raw)": 2.1840715408325195, "Full-pretrain/Step": 4165, "Full-pretrain/Step Time": 17.56266726180911} +{"Full-pretrain/Learning Rate": 3.125835838061567e-05, "Full-pretrain/Loss": 1.954495906829834, "Full-pretrain/Loss (Raw)": 1.8616799116134644, "Full-pretrain/Step": 4166, "Full-pretrain/Step Time": 17.56305560655892} +{"Full-pretrain/Learning Rate": 3.125013758032237e-05, "Full-pretrain/Loss": 1.944986343383789, "Full-pretrain/Loss (Raw)": 1.9460852146148682, "Full-pretrain/Step": 4167, "Full-pretrain/Step Time": 17.568779096007347} +{"Full-pretrain/Learning Rate": 3.1241916059077906e-05, "Full-pretrain/Loss": 1.9389376640319824, "Full-pretrain/Loss (Raw)": 1.6566095352172852, "Full-pretrain/Step": 4168, "Full-pretrain/Step Time": 17.56326642818749} +{"Full-pretrain/Learning Rate": 3.123369381783061e-05, "Full-pretrain/Loss": 1.945158839225769, "Full-pretrain/Loss (Raw)": 2.0050864219665527, "Full-pretrain/Step": 4169, "Full-pretrain/Step Time": 17.57069337926805} +{"Full-pretrain/Learning Rate": 3.122547085752893e-05, "Full-pretrain/Loss": 1.9362765550613403, "Full-pretrain/Loss (Raw)": 1.9549158811569214, "Full-pretrain/Step": 4170, "Full-pretrain/Step Time": 17.567897532135248} +{"Full-pretrain/Learning Rate": 3.121724717912138e-05, "Full-pretrain/Loss": 1.930944561958313, "Full-pretrain/Loss (Raw)": 1.730652093887329, "Full-pretrain/Step": 4171, "Full-pretrain/Step Time": 17.5688025765121} +{"Full-pretrain/Learning Rate": 3.1209022783556534e-05, "Full-pretrain/Loss": 1.9372563362121582, "Full-pretrain/Loss (Raw)": 1.9566569328308105, "Full-pretrain/Step": 4172, "Full-pretrain/Step Time": 17.57259139046073} +{"Full-pretrain/Learning Rate": 3.12007976717831e-05, "Full-pretrain/Loss": 1.9313507080078125, "Full-pretrain/Loss (Raw)": 1.9791595935821533, "Full-pretrain/Step": 4173, "Full-pretrain/Step Time": 17.57847456075251} +{"Full-pretrain/Learning Rate": 3.119257184474984e-05, "Full-pretrain/Loss": 1.935393214225769, "Full-pretrain/Loss (Raw)": 2.0835959911346436, "Full-pretrain/Step": 4174, "Full-pretrain/Step Time": 17.576382467523217} +{"Full-pretrain/Learning Rate": 3.118434530340559e-05, "Full-pretrain/Loss": 1.9422446489334106, "Full-pretrain/Loss (Raw)": 2.1739447116851807, "Full-pretrain/Step": 4175, "Full-pretrain/Step Time": 17.572327805683017} +{"Full-pretrain/Learning Rate": 3.117611804869928e-05, "Full-pretrain/Loss": 1.9388353824615479, "Full-pretrain/Loss (Raw)": 1.8202183246612549, "Full-pretrain/Step": 4176, "Full-pretrain/Step Time": 17.574769411236048} +{"Full-pretrain/Learning Rate": 3.116789008157993e-05, "Full-pretrain/Loss": 1.9416205883026123, "Full-pretrain/Loss (Raw)": 1.9830267429351807, "Full-pretrain/Step": 4177, "Full-pretrain/Step Time": 17.581438906490803} +{"Full-pretrain/Learning Rate": 3.115966140299662e-05, "Full-pretrain/Loss": 1.9579167366027832, "Full-pretrain/Loss (Raw)": 2.2907872200012207, "Full-pretrain/Step": 4178, "Full-pretrain/Step Time": 17.585456488654017} +{"Full-pretrain/Learning Rate": 3.115143201389853e-05, "Full-pretrain/Loss": 1.942510724067688, "Full-pretrain/Loss (Raw)": 1.6477059125900269, "Full-pretrain/Step": 4179, "Full-pretrain/Step Time": 17.584632312878966} +{"Full-pretrain/Learning Rate": 3.114320191523493e-05, "Full-pretrain/Loss": 1.9376755952835083, "Full-pretrain/Loss (Raw)": 1.7653822898864746, "Full-pretrain/Step": 4180, "Full-pretrain/Step Time": 17.587642837315798} +{"Full-pretrain/Learning Rate": 3.113497110795514e-05, "Full-pretrain/Loss": 1.9380929470062256, "Full-pretrain/Loss (Raw)": 2.1019833087921143, "Full-pretrain/Step": 4181, "Full-pretrain/Step Time": 17.591074420139194} +{"Full-pretrain/Learning Rate": 3.112673959300859e-05, "Full-pretrain/Loss": 1.9332140684127808, "Full-pretrain/Loss (Raw)": 1.9613776206970215, "Full-pretrain/Step": 4182, "Full-pretrain/Step Time": 17.59175806865096} +{"Full-pretrain/Learning Rate": 3.1118507371344776e-05, "Full-pretrain/Loss": 1.93415105342865, "Full-pretrain/Loss (Raw)": 2.056328296661377, "Full-pretrain/Step": 4183, "Full-pretrain/Step Time": 17.581874553114176} +{"Full-pretrain/Learning Rate": 3.111027444391329e-05, "Full-pretrain/Loss": 1.9293403625488281, "Full-pretrain/Loss (Raw)": 1.844167709350586, "Full-pretrain/Step": 4184, "Full-pretrain/Step Time": 17.58503008633852} +{"Full-pretrain/Learning Rate": 3.1102040811663796e-05, "Full-pretrain/Loss": 1.9306004047393799, "Full-pretrain/Loss (Raw)": 2.1536765098571777, "Full-pretrain/Step": 4185, "Full-pretrain/Step Time": 17.583612693473697} +{"Full-pretrain/Learning Rate": 3.109380647554604e-05, "Full-pretrain/Loss": 1.935231328010559, "Full-pretrain/Loss (Raw)": 1.9569776058197021, "Full-pretrain/Step": 4186, "Full-pretrain/Step Time": 17.582095040008426} +{"Full-pretrain/Learning Rate": 3.108557143650985e-05, "Full-pretrain/Loss": 1.9286744594573975, "Full-pretrain/Loss (Raw)": 1.9231672286987305, "Full-pretrain/Step": 4187, "Full-pretrain/Step Time": 17.574210841208696} +{"Full-pretrain/Learning Rate": 3.1077335695505127e-05, "Full-pretrain/Loss": 1.9372135400772095, "Full-pretrain/Loss (Raw)": 2.0505270957946777, "Full-pretrain/Step": 4188, "Full-pretrain/Step Time": 17.57733814418316} +{"Full-pretrain/Learning Rate": 3.1069099253481875e-05, "Full-pretrain/Loss": 1.9335124492645264, "Full-pretrain/Loss (Raw)": 1.724468469619751, "Full-pretrain/Step": 4189, "Full-pretrain/Step Time": 17.576709046959877} +{"Full-pretrain/Learning Rate": 3.1060862111390154e-05, "Full-pretrain/Loss": 1.935701847076416, "Full-pretrain/Loss (Raw)": 1.929199457168579, "Full-pretrain/Step": 4190, "Full-pretrain/Step Time": 17.576056534424424} +{"Full-pretrain/Learning Rate": 3.105262427018011e-05, "Full-pretrain/Loss": 1.9356368780136108, "Full-pretrain/Loss (Raw)": 1.9515328407287598, "Full-pretrain/Step": 4191, "Full-pretrain/Step Time": 17.56899009272456} +{"Full-pretrain/Learning Rate": 3.1044385730802e-05, "Full-pretrain/Loss": 1.9407106637954712, "Full-pretrain/Loss (Raw)": 2.0461111068725586, "Full-pretrain/Step": 4192, "Full-pretrain/Step Time": 17.567849779501557} +{"Full-pretrain/Learning Rate": 3.10361464942061e-05, "Full-pretrain/Loss": 1.9416922330856323, "Full-pretrain/Loss (Raw)": 2.056434154510498, "Full-pretrain/Step": 4193, "Full-pretrain/Step Time": 17.57075091637671} +{"Full-pretrain/Learning Rate": 3.102790656134284e-05, "Full-pretrain/Loss": 1.953364610671997, "Full-pretrain/Loss (Raw)": 1.940483570098877, "Full-pretrain/Step": 4194, "Full-pretrain/Step Time": 17.573431419208646} +{"Full-pretrain/Learning Rate": 3.1019665933162674e-05, "Full-pretrain/Loss": 1.964523196220398, "Full-pretrain/Loss (Raw)": 2.122014284133911, "Full-pretrain/Step": 4195, "Full-pretrain/Step Time": 17.568718133494258} +{"Full-pretrain/Learning Rate": 3.101142461061615e-05, "Full-pretrain/Loss": 1.9605371952056885, "Full-pretrain/Loss (Raw)": 1.8791625499725342, "Full-pretrain/Step": 4196, "Full-pretrain/Step Time": 17.561881883069873} +{"Full-pretrain/Learning Rate": 3.1003182594653916e-05, "Full-pretrain/Loss": 1.9589619636535645, "Full-pretrain/Loss (Raw)": 2.1336612701416016, "Full-pretrain/Step": 4197, "Full-pretrain/Step Time": 17.562632951885462} +{"Full-pretrain/Learning Rate": 3.0994939886226677e-05, "Full-pretrain/Loss": 1.9683424234390259, "Full-pretrain/Loss (Raw)": 2.161856174468994, "Full-pretrain/Step": 4198, "Full-pretrain/Step Time": 17.563110353425145} +{"Full-pretrain/Learning Rate": 3.098669648628523e-05, "Full-pretrain/Loss": 1.9692206382751465, "Full-pretrain/Loss (Raw)": 1.9741920232772827, "Full-pretrain/Step": 4199, "Full-pretrain/Step Time": 17.558421283960342} +{"Full-pretrain/Learning Rate": 3.0978452395780444e-05, "Full-pretrain/Loss": 1.9791405200958252, "Full-pretrain/Loss (Raw)": 1.9740428924560547, "Full-pretrain/Step": 4200, "Full-pretrain/Step Time": 17.555412711575627} +{"Full-pretrain/Learning Rate": 3.097020761566328e-05, "Full-pretrain/Loss": 1.9775645732879639, "Full-pretrain/Loss (Raw)": 1.95465886592865, "Full-pretrain/Step": 4201, "Full-pretrain/Step Time": 17.555846137925982} +{"Full-pretrain/Learning Rate": 3.0961962146884765e-05, "Full-pretrain/Loss": 1.962559700012207, "Full-pretrain/Loss (Raw)": 1.4747569561004639, "Full-pretrain/Step": 4202, "Full-pretrain/Step Time": 17.560492428019643} +{"Full-pretrain/Learning Rate": 3.095371599039601e-05, "Full-pretrain/Loss": 1.9605412483215332, "Full-pretrain/Loss (Raw)": 1.666062831878662, "Full-pretrain/Step": 4203, "Full-pretrain/Step Time": 17.560185253620148} +{"Full-pretrain/Learning Rate": 3.094546914714821e-05, "Full-pretrain/Loss": 1.9652365446090698, "Full-pretrain/Loss (Raw)": 2.106903314590454, "Full-pretrain/Step": 4204, "Full-pretrain/Step Time": 17.550980666652322} +{"Full-pretrain/Learning Rate": 3.093722161809263e-05, "Full-pretrain/Loss": 1.9639391899108887, "Full-pretrain/Loss (Raw)": 1.9376475811004639, "Full-pretrain/Step": 4205, "Full-pretrain/Step Time": 17.549863193184137} +{"Full-pretrain/Learning Rate": 3.092897340418062e-05, "Full-pretrain/Loss": 1.960373878479004, "Full-pretrain/Loss (Raw)": 1.9695024490356445, "Full-pretrain/Step": 4206, "Full-pretrain/Step Time": 17.559373535215855} +{"Full-pretrain/Learning Rate": 3.092072450636361e-05, "Full-pretrain/Loss": 1.956528902053833, "Full-pretrain/Loss (Raw)": 2.0509040355682373, "Full-pretrain/Step": 4207, "Full-pretrain/Step Time": 17.558080911636353} +{"Full-pretrain/Learning Rate": 3.091247492559312e-05, "Full-pretrain/Loss": 1.9584378004074097, "Full-pretrain/Loss (Raw)": 1.8813036680221558, "Full-pretrain/Step": 4208, "Full-pretrain/Step Time": 17.557979116216302} +{"Full-pretrain/Learning Rate": 3.090422466282072e-05, "Full-pretrain/Loss": 1.961949110031128, "Full-pretrain/Loss (Raw)": 2.095393419265747, "Full-pretrain/Step": 4209, "Full-pretrain/Step Time": 17.557813784107566} +{"Full-pretrain/Learning Rate": 3.089597371899808e-05, "Full-pretrain/Loss": 1.957497477531433, "Full-pretrain/Loss (Raw)": 2.1483328342437744, "Full-pretrain/Step": 4210, "Full-pretrain/Step Time": 17.565178364515305} +{"Full-pretrain/Learning Rate": 3.088772209507694e-05, "Full-pretrain/Loss": 1.9700826406478882, "Full-pretrain/Loss (Raw)": 2.0504307746887207, "Full-pretrain/Step": 4211, "Full-pretrain/Step Time": 17.560163581743836} +{"Full-pretrain/Learning Rate": 3.087946979200913e-05, "Full-pretrain/Loss": 1.9651693105697632, "Full-pretrain/Loss (Raw)": 1.608156442642212, "Full-pretrain/Step": 4212, "Full-pretrain/Step Time": 17.564881091937423} +{"Full-pretrain/Learning Rate": 3.0871216810746544e-05, "Full-pretrain/Loss": 1.9595746994018555, "Full-pretrain/Loss (Raw)": 1.922958493232727, "Full-pretrain/Step": 4213, "Full-pretrain/Step Time": 17.56045305915177} +{"Full-pretrain/Learning Rate": 3.0862963152241166e-05, "Full-pretrain/Loss": 1.9617490768432617, "Full-pretrain/Loss (Raw)": 2.0309581756591797, "Full-pretrain/Step": 4214, "Full-pretrain/Step Time": 17.565780702978373} +{"Full-pretrain/Learning Rate": 3.085470881744504e-05, "Full-pretrain/Loss": 1.952629804611206, "Full-pretrain/Loss (Raw)": 1.7645087242126465, "Full-pretrain/Step": 4215, "Full-pretrain/Step Time": 17.56199559941888} +{"Full-pretrain/Learning Rate": 3.0846453807310316e-05, "Full-pretrain/Loss": 1.949070930480957, "Full-pretrain/Loss (Raw)": 1.7302846908569336, "Full-pretrain/Step": 4216, "Full-pretrain/Step Time": 17.559933992102742} +{"Full-pretrain/Learning Rate": 3.0838198122789196e-05, "Full-pretrain/Loss": 1.9456833600997925, "Full-pretrain/Loss (Raw)": 2.045276165008545, "Full-pretrain/Step": 4217, "Full-pretrain/Step Time": 17.556942930445075} +{"Full-pretrain/Learning Rate": 3.082994176483398e-05, "Full-pretrain/Loss": 1.950819730758667, "Full-pretrain/Loss (Raw)": 2.121339797973633, "Full-pretrain/Step": 4218, "Full-pretrain/Step Time": 17.560536421835423} +{"Full-pretrain/Learning Rate": 3.082168473439702e-05, "Full-pretrain/Loss": 1.9496419429779053, "Full-pretrain/Loss (Raw)": 1.8854780197143555, "Full-pretrain/Step": 4219, "Full-pretrain/Step Time": 17.559302350506186} +{"Full-pretrain/Learning Rate": 3.0813427032430783e-05, "Full-pretrain/Loss": 1.9504108428955078, "Full-pretrain/Loss (Raw)": 2.075129985809326, "Full-pretrain/Step": 4220, "Full-pretrain/Step Time": 17.555761652067304} +{"Full-pretrain/Learning Rate": 3.080516865988778e-05, "Full-pretrain/Loss": 1.953330159187317, "Full-pretrain/Loss (Raw)": 1.8178892135620117, "Full-pretrain/Step": 4221, "Full-pretrain/Step Time": 17.552562886849046} +{"Full-pretrain/Learning Rate": 3.0796909617720604e-05, "Full-pretrain/Loss": 1.9583195447921753, "Full-pretrain/Loss (Raw)": 2.088858127593994, "Full-pretrain/Step": 4222, "Full-pretrain/Step Time": 17.559407072141767} +{"Full-pretrain/Learning Rate": 3.078864990688194e-05, "Full-pretrain/Loss": 1.9609687328338623, "Full-pretrain/Loss (Raw)": 2.036306858062744, "Full-pretrain/Step": 4223, "Full-pretrain/Step Time": 17.558783032000065} +{"Full-pretrain/Learning Rate": 3.0780389528324554e-05, "Full-pretrain/Loss": 1.9592037200927734, "Full-pretrain/Loss (Raw)": 1.9896281957626343, "Full-pretrain/Step": 4224, "Full-pretrain/Step Time": 17.553558506071568} +{"Full-pretrain/Learning Rate": 3.077212848300126e-05, "Full-pretrain/Loss": 1.9565761089324951, "Full-pretrain/Loss (Raw)": 1.9723535776138306, "Full-pretrain/Step": 4225, "Full-pretrain/Step Time": 17.55306188762188} +{"Full-pretrain/Learning Rate": 3.076386677186498e-05, "Full-pretrain/Loss": 1.9642994403839111, "Full-pretrain/Loss (Raw)": 2.187631845474243, "Full-pretrain/Step": 4226, "Full-pretrain/Step Time": 17.55876230634749} +{"Full-pretrain/Learning Rate": 3.0755604395868686e-05, "Full-pretrain/Loss": 1.9680222272872925, "Full-pretrain/Loss (Raw)": 2.2411398887634277, "Full-pretrain/Step": 4227, "Full-pretrain/Step Time": 17.558343928307295} +{"Full-pretrain/Learning Rate": 3.0747341355965455e-05, "Full-pretrain/Loss": 1.975778341293335, "Full-pretrain/Loss (Raw)": 2.12736177444458, "Full-pretrain/Step": 4228, "Full-pretrain/Step Time": 17.559524776414037} +{"Full-pretrain/Learning Rate": 3.073907765310841e-05, "Full-pretrain/Loss": 1.9552326202392578, "Full-pretrain/Loss (Raw)": 1.4761948585510254, "Full-pretrain/Step": 4229, "Full-pretrain/Step Time": 17.558525320142508} +{"Full-pretrain/Learning Rate": 3.073081328825078e-05, "Full-pretrain/Loss": 1.9469667673110962, "Full-pretrain/Loss (Raw)": 1.8973509073257446, "Full-pretrain/Step": 4230, "Full-pretrain/Step Time": 17.558540731668472} +{"Full-pretrain/Learning Rate": 3.072254826234585e-05, "Full-pretrain/Loss": 1.94864821434021, "Full-pretrain/Loss (Raw)": 2.0279979705810547, "Full-pretrain/Step": 4231, "Full-pretrain/Step Time": 17.552948724478483} +{"Full-pretrain/Learning Rate": 3.071428257634699e-05, "Full-pretrain/Loss": 1.955489993095398, "Full-pretrain/Loss (Raw)": 2.192978858947754, "Full-pretrain/Step": 4232, "Full-pretrain/Step Time": 17.55698230303824} +{"Full-pretrain/Learning Rate": 3.0706016231207635e-05, "Full-pretrain/Loss": 1.9529767036437988, "Full-pretrain/Loss (Raw)": 1.8742344379425049, "Full-pretrain/Step": 4233, "Full-pretrain/Step Time": 17.553904553875327} +{"Full-pretrain/Learning Rate": 3.069774922788132e-05, "Full-pretrain/Loss": 1.9689630270004272, "Full-pretrain/Loss (Raw)": 1.9863201379776, "Full-pretrain/Step": 4234, "Full-pretrain/Step Time": 17.55246203765273} +{"Full-pretrain/Learning Rate": 3.0689481567321634e-05, "Full-pretrain/Loss": 1.9674960374832153, "Full-pretrain/Loss (Raw)": 1.6191165447235107, "Full-pretrain/Step": 4235, "Full-pretrain/Step Time": 17.548457564786077} +{"Full-pretrain/Learning Rate": 3.0681213250482255e-05, "Full-pretrain/Loss": 1.9613738059997559, "Full-pretrain/Loss (Raw)": 1.910993218421936, "Full-pretrain/Step": 4236, "Full-pretrain/Step Time": 17.551744924858212} +{"Full-pretrain/Learning Rate": 3.0672944278316916e-05, "Full-pretrain/Loss": 1.9630404710769653, "Full-pretrain/Loss (Raw)": 1.990980625152588, "Full-pretrain/Step": 4237, "Full-pretrain/Step Time": 17.551137248054147} +{"Full-pretrain/Learning Rate": 3.066467465177945e-05, "Full-pretrain/Loss": 1.9736416339874268, "Full-pretrain/Loss (Raw)": 2.3087401390075684, "Full-pretrain/Step": 4238, "Full-pretrain/Step Time": 17.557543396949768} +{"Full-pretrain/Learning Rate": 3.065640437182376e-05, "Full-pretrain/Loss": 1.9578770399093628, "Full-pretrain/Loss (Raw)": 1.5464348793029785, "Full-pretrain/Step": 4239, "Full-pretrain/Step Time": 17.555708583444357} +{"Full-pretrain/Learning Rate": 3.0648133439403795e-05, "Full-pretrain/Loss": 1.9684096574783325, "Full-pretrain/Loss (Raw)": 2.218348503112793, "Full-pretrain/Step": 4240, "Full-pretrain/Step Time": 17.5600350741297} +{"Full-pretrain/Learning Rate": 3.0639861855473635e-05, "Full-pretrain/Loss": 1.968860387802124, "Full-pretrain/Loss (Raw)": 2.1098134517669678, "Full-pretrain/Step": 4241, "Full-pretrain/Step Time": 17.556984670460224} +{"Full-pretrain/Learning Rate": 3.0631589620987396e-05, "Full-pretrain/Loss": 1.9577105045318604, "Full-pretrain/Loss (Raw)": 1.7915403842926025, "Full-pretrain/Step": 4242, "Full-pretrain/Step Time": 17.556388879194856} +{"Full-pretrain/Learning Rate": 3.062331673689926e-05, "Full-pretrain/Loss": 1.958022117614746, "Full-pretrain/Loss (Raw)": 2.0604023933410645, "Full-pretrain/Step": 4243, "Full-pretrain/Step Time": 17.55564351938665} +{"Full-pretrain/Learning Rate": 3.0615043204163524e-05, "Full-pretrain/Loss": 1.9693734645843506, "Full-pretrain/Loss (Raw)": 1.971399188041687, "Full-pretrain/Step": 4244, "Full-pretrain/Step Time": 17.562049116939306} +{"Full-pretrain/Learning Rate": 3.0606769023734536e-05, "Full-pretrain/Loss": 1.9724547863006592, "Full-pretrain/Loss (Raw)": 2.0215561389923096, "Full-pretrain/Step": 4245, "Full-pretrain/Step Time": 17.557349808514118} +{"Full-pretrain/Learning Rate": 3.05984941965667e-05, "Full-pretrain/Loss": 1.9705541133880615, "Full-pretrain/Loss (Raw)": 1.9701380729675293, "Full-pretrain/Step": 4246, "Full-pretrain/Step Time": 17.557818554341793} +{"Full-pretrain/Learning Rate": 3.059021872361453e-05, "Full-pretrain/Loss": 1.9756356477737427, "Full-pretrain/Loss (Raw)": 1.9271217584609985, "Full-pretrain/Step": 4247, "Full-pretrain/Step Time": 17.55353290773928} +{"Full-pretrain/Learning Rate": 3.058194260583259e-05, "Full-pretrain/Loss": 1.9822278022766113, "Full-pretrain/Loss (Raw)": 1.9412298202514648, "Full-pretrain/Step": 4248, "Full-pretrain/Step Time": 17.55706538632512} +{"Full-pretrain/Learning Rate": 3.057366584417553e-05, "Full-pretrain/Loss": 1.9874463081359863, "Full-pretrain/Loss (Raw)": 2.2122693061828613, "Full-pretrain/Step": 4249, "Full-pretrain/Step Time": 17.55591331794858} +{"Full-pretrain/Learning Rate": 3.056538843959808e-05, "Full-pretrain/Loss": 1.9836013317108154, "Full-pretrain/Loss (Raw)": 1.998300313949585, "Full-pretrain/Step": 4250, "Full-pretrain/Step Time": 17.555667754262686} +{"Full-pretrain/Learning Rate": 3.055711039305503e-05, "Full-pretrain/Loss": 1.9842859506607056, "Full-pretrain/Loss (Raw)": 1.907386064529419, "Full-pretrain/Step": 4251, "Full-pretrain/Step Time": 17.55354568362236} +{"Full-pretrain/Learning Rate": 3.054883170550125e-05, "Full-pretrain/Loss": 1.980309247970581, "Full-pretrain/Loss (Raw)": 1.9478795528411865, "Full-pretrain/Step": 4252, "Full-pretrain/Step Time": 17.55327620357275} +{"Full-pretrain/Learning Rate": 3.054055237789167e-05, "Full-pretrain/Loss": 1.9908288717269897, "Full-pretrain/Loss (Raw)": 2.1545166969299316, "Full-pretrain/Step": 4253, "Full-pretrain/Step Time": 17.55250394716859} +{"Full-pretrain/Learning Rate": 3.053227241118134e-05, "Full-pretrain/Loss": 1.9882686138153076, "Full-pretrain/Loss (Raw)": 2.0069284439086914, "Full-pretrain/Step": 4254, "Full-pretrain/Step Time": 17.55206647142768} +{"Full-pretrain/Learning Rate": 3.0523991806325326e-05, "Full-pretrain/Loss": 1.9853618144989014, "Full-pretrain/Loss (Raw)": 1.9432885646820068, "Full-pretrain/Step": 4255, "Full-pretrain/Step Time": 17.549963638186455} +{"Full-pretrain/Learning Rate": 3.0515710564278788e-05, "Full-pretrain/Loss": 1.9927647113800049, "Full-pretrain/Loss (Raw)": 2.2265219688415527, "Full-pretrain/Step": 4256, "Full-pretrain/Step Time": 17.55079911649227} +{"Full-pretrain/Learning Rate": 3.050742868599698e-05, "Full-pretrain/Loss": 1.996910810470581, "Full-pretrain/Loss (Raw)": 2.1050291061401367, "Full-pretrain/Step": 4257, "Full-pretrain/Step Time": 17.557388911023736} +{"Full-pretrain/Learning Rate": 3.049914617243521e-05, "Full-pretrain/Loss": 1.980787754058838, "Full-pretrain/Loss (Raw)": 1.6716959476470947, "Full-pretrain/Step": 4258, "Full-pretrain/Step Time": 17.560821568593383} +{"Full-pretrain/Learning Rate": 3.049086302454886e-05, "Full-pretrain/Loss": 1.9658477306365967, "Full-pretrain/Loss (Raw)": 1.7630585432052612, "Full-pretrain/Step": 4259, "Full-pretrain/Step Time": 17.554570281878114} +{"Full-pretrain/Learning Rate": 3.048257924329339e-05, "Full-pretrain/Loss": 1.9614231586456299, "Full-pretrain/Loss (Raw)": 1.9857726097106934, "Full-pretrain/Step": 4260, "Full-pretrain/Step Time": 17.55346821807325} +{"Full-pretrain/Learning Rate": 3.0474294829624327e-05, "Full-pretrain/Loss": 1.9798091650009155, "Full-pretrain/Loss (Raw)": 2.064547300338745, "Full-pretrain/Step": 4261, "Full-pretrain/Step Time": 17.557596610859036} +{"Full-pretrain/Learning Rate": 3.046600978449729e-05, "Full-pretrain/Loss": 1.9815409183502197, "Full-pretrain/Loss (Raw)": 1.952770709991455, "Full-pretrain/Step": 4262, "Full-pretrain/Step Time": 17.5596233420074} +{"Full-pretrain/Learning Rate": 3.0457724108867942e-05, "Full-pretrain/Loss": 1.9840035438537598, "Full-pretrain/Loss (Raw)": 2.106801986694336, "Full-pretrain/Step": 4263, "Full-pretrain/Step Time": 17.56221480295062} +{"Full-pretrain/Learning Rate": 3.044943780369203e-05, "Full-pretrain/Loss": 1.9924076795578003, "Full-pretrain/Loss (Raw)": 2.4619083404541016, "Full-pretrain/Step": 4264, "Full-pretrain/Step Time": 17.554774107411504} +{"Full-pretrain/Learning Rate": 3.0441150869925384e-05, "Full-pretrain/Loss": 1.9949039220809937, "Full-pretrain/Loss (Raw)": 1.954114317893982, "Full-pretrain/Step": 4265, "Full-pretrain/Step Time": 17.56165226176381} +{"Full-pretrain/Learning Rate": 3.04328633085239e-05, "Full-pretrain/Loss": 2.0043063163757324, "Full-pretrain/Loss (Raw)": 2.287200927734375, "Full-pretrain/Step": 4266, "Full-pretrain/Step Time": 17.563089422881603} +{"Full-pretrain/Learning Rate": 3.0424575120443537e-05, "Full-pretrain/Loss": 2.014843225479126, "Full-pretrain/Loss (Raw)": 1.956292748451233, "Full-pretrain/Step": 4267, "Full-pretrain/Step Time": 17.561138393357396} +{"Full-pretrain/Learning Rate": 3.041628630664035e-05, "Full-pretrain/Loss": 2.0094971656799316, "Full-pretrain/Loss (Raw)": 1.739919900894165, "Full-pretrain/Step": 4268, "Full-pretrain/Step Time": 17.555373026058078} +{"Full-pretrain/Learning Rate": 3.0407996868070433e-05, "Full-pretrain/Loss": 2.018268585205078, "Full-pretrain/Loss (Raw)": 2.271662712097168, "Full-pretrain/Step": 4269, "Full-pretrain/Step Time": 17.558469304814935} +{"Full-pretrain/Learning Rate": 3.039970680568998e-05, "Full-pretrain/Loss": 2.013983726501465, "Full-pretrain/Loss (Raw)": 2.1716320514678955, "Full-pretrain/Step": 4270, "Full-pretrain/Step Time": 17.559177661314607} +{"Full-pretrain/Learning Rate": 3.0391416120455253e-05, "Full-pretrain/Loss": 2.031102180480957, "Full-pretrain/Loss (Raw)": 2.094228744506836, "Full-pretrain/Step": 4271, "Full-pretrain/Step Time": 17.561154881492257} +{"Full-pretrain/Learning Rate": 3.0383124813322557e-05, "Full-pretrain/Loss": 2.0192575454711914, "Full-pretrain/Loss (Raw)": 1.8393160104751587, "Full-pretrain/Step": 4272, "Full-pretrain/Step Time": 17.554868910461664} +{"Full-pretrain/Learning Rate": 3.0374832885248313e-05, "Full-pretrain/Loss": 2.0143566131591797, "Full-pretrain/Loss (Raw)": 1.952984094619751, "Full-pretrain/Step": 4273, "Full-pretrain/Step Time": 17.564772117882967} +{"Full-pretrain/Learning Rate": 3.036654033718898e-05, "Full-pretrain/Loss": 2.0162456035614014, "Full-pretrain/Loss (Raw)": 1.8519847393035889, "Full-pretrain/Step": 4274, "Full-pretrain/Step Time": 17.564120709896088} +{"Full-pretrain/Learning Rate": 3.0358247170101108e-05, "Full-pretrain/Loss": 2.01920747756958, "Full-pretrain/Loss (Raw)": 2.1551871299743652, "Full-pretrain/Step": 4275, "Full-pretrain/Step Time": 17.559267442673445} +{"Full-pretrain/Learning Rate": 3.034995338494131e-05, "Full-pretrain/Loss": 2.0169177055358887, "Full-pretrain/Loss (Raw)": 1.8981258869171143, "Full-pretrain/Step": 4276, "Full-pretrain/Step Time": 17.554171627387404} +{"Full-pretrain/Learning Rate": 3.0341658982666266e-05, "Full-pretrain/Loss": 1.998153567314148, "Full-pretrain/Loss (Raw)": 1.4211039543151855, "Full-pretrain/Step": 4277, "Full-pretrain/Step Time": 17.56312365271151} +{"Full-pretrain/Learning Rate": 3.0333363964232738e-05, "Full-pretrain/Loss": 1.9955615997314453, "Full-pretrain/Loss (Raw)": 1.8871896266937256, "Full-pretrain/Step": 4278, "Full-pretrain/Step Time": 17.56803940050304} +{"Full-pretrain/Learning Rate": 3.032506833059755e-05, "Full-pretrain/Loss": 1.9987260103225708, "Full-pretrain/Loss (Raw)": 2.028388500213623, "Full-pretrain/Step": 4279, "Full-pretrain/Step Time": 17.57059551216662} +{"Full-pretrain/Learning Rate": 3.0316772082717603e-05, "Full-pretrain/Loss": 2.0026025772094727, "Full-pretrain/Loss (Raw)": 2.0652782917022705, "Full-pretrain/Step": 4280, "Full-pretrain/Step Time": 17.561931677162647} +{"Full-pretrain/Learning Rate": 3.0308475221549864e-05, "Full-pretrain/Loss": 1.993139624595642, "Full-pretrain/Loss (Raw)": 1.90945303440094, "Full-pretrain/Step": 4281, "Full-pretrain/Step Time": 17.570547569543123} +{"Full-pretrain/Learning Rate": 3.0300177748051373e-05, "Full-pretrain/Loss": 1.9928553104400635, "Full-pretrain/Loss (Raw)": 1.9892032146453857, "Full-pretrain/Step": 4282, "Full-pretrain/Step Time": 17.575991412624717} +{"Full-pretrain/Learning Rate": 3.0291879663179235e-05, "Full-pretrain/Loss": 1.9987399578094482, "Full-pretrain/Loss (Raw)": 2.095693826675415, "Full-pretrain/Step": 4283, "Full-pretrain/Step Time": 17.576982522383332} +{"Full-pretrain/Learning Rate": 3.0283580967890645e-05, "Full-pretrain/Loss": 2.0019052028656006, "Full-pretrain/Loss (Raw)": 2.049165725708008, "Full-pretrain/Step": 4284, "Full-pretrain/Step Time": 17.572444770485163} +{"Full-pretrain/Learning Rate": 3.0275281663142846e-05, "Full-pretrain/Loss": 1.9972295761108398, "Full-pretrain/Loss (Raw)": 2.0049004554748535, "Full-pretrain/Step": 4285, "Full-pretrain/Step Time": 17.57762780599296} +{"Full-pretrain/Learning Rate": 3.0266981749893157e-05, "Full-pretrain/Loss": 1.9984705448150635, "Full-pretrain/Loss (Raw)": 2.0466372966766357, "Full-pretrain/Step": 4286, "Full-pretrain/Step Time": 17.58098486997187} +{"Full-pretrain/Learning Rate": 3.025868122909898e-05, "Full-pretrain/Loss": 2.0030434131622314, "Full-pretrain/Loss (Raw)": 2.0896201133728027, "Full-pretrain/Step": 4287, "Full-pretrain/Step Time": 17.58044771105051} +{"Full-pretrain/Learning Rate": 3.0250380101717774e-05, "Full-pretrain/Loss": 1.9896080493927002, "Full-pretrain/Loss (Raw)": 1.7965922355651855, "Full-pretrain/Step": 4288, "Full-pretrain/Step Time": 17.57358743622899} +{"Full-pretrain/Learning Rate": 3.024207836870706e-05, "Full-pretrain/Loss": 1.990046739578247, "Full-pretrain/Loss (Raw)": 2.11906361579895, "Full-pretrain/Step": 4289, "Full-pretrain/Step Time": 17.571784041821957} +{"Full-pretrain/Learning Rate": 3.023377603102445e-05, "Full-pretrain/Loss": 2.0064806938171387, "Full-pretrain/Loss (Raw)": 2.1975858211517334, "Full-pretrain/Step": 4290, "Full-pretrain/Step Time": 17.57702376320958} +{"Full-pretrain/Learning Rate": 3.0225473089627616e-05, "Full-pretrain/Loss": 2.0094211101531982, "Full-pretrain/Loss (Raw)": 1.8571525812149048, "Full-pretrain/Step": 4291, "Full-pretrain/Step Time": 17.57622718811035} +{"Full-pretrain/Learning Rate": 3.02171695454743e-05, "Full-pretrain/Loss": 2.0098352432250977, "Full-pretrain/Loss (Raw)": 1.9990177154541016, "Full-pretrain/Step": 4292, "Full-pretrain/Step Time": 17.569883527234197} +{"Full-pretrain/Learning Rate": 3.0208865399522306e-05, "Full-pretrain/Loss": 2.0056838989257812, "Full-pretrain/Loss (Raw)": 1.9317097663879395, "Full-pretrain/Step": 4293, "Full-pretrain/Step Time": 17.570899944752455} +{"Full-pretrain/Learning Rate": 3.0200560652729516e-05, "Full-pretrain/Loss": 2.0112948417663574, "Full-pretrain/Loss (Raw)": 2.1323273181915283, "Full-pretrain/Step": 4294, "Full-pretrain/Step Time": 17.573775343596935} +{"Full-pretrain/Learning Rate": 3.019225530605389e-05, "Full-pretrain/Loss": 2.010085105895996, "Full-pretrain/Loss (Raw)": 2.0680880546569824, "Full-pretrain/Step": 4295, "Full-pretrain/Step Time": 17.568698232993484} +{"Full-pretrain/Learning Rate": 3.018394936045344e-05, "Full-pretrain/Loss": 1.997281789779663, "Full-pretrain/Loss (Raw)": 2.052194595336914, "Full-pretrain/Step": 4296, "Full-pretrain/Step Time": 17.57121804729104} +{"Full-pretrain/Learning Rate": 3.0175642816886253e-05, "Full-pretrain/Loss": 2.0014142990112305, "Full-pretrain/Loss (Raw)": 2.086353302001953, "Full-pretrain/Step": 4297, "Full-pretrain/Step Time": 17.56531298533082} +{"Full-pretrain/Learning Rate": 3.0167335676310476e-05, "Full-pretrain/Loss": 1.9872699975967407, "Full-pretrain/Loss (Raw)": 1.8345885276794434, "Full-pretrain/Step": 4298, "Full-pretrain/Step Time": 17.56656400114298} +{"Full-pretrain/Learning Rate": 3.015902793968435e-05, "Full-pretrain/Loss": 1.9962786436080933, "Full-pretrain/Loss (Raw)": 2.244570016860962, "Full-pretrain/Step": 4299, "Full-pretrain/Step Time": 17.563307352364063} +{"Full-pretrain/Learning Rate": 3.0150719607966166e-05, "Full-pretrain/Loss": 2.002828598022461, "Full-pretrain/Loss (Raw)": 1.9495153427124023, "Full-pretrain/Step": 4300, "Full-pretrain/Step Time": 17.556535637006164} +{"Full-pretrain/Learning Rate": 3.014241068211428e-05, "Full-pretrain/Loss": 1.9896320104599, "Full-pretrain/Loss (Raw)": 1.8493729829788208, "Full-pretrain/Step": 4301, "Full-pretrain/Step Time": 17.555971775203943} +{"Full-pretrain/Learning Rate": 3.0134101163087137e-05, "Full-pretrain/Loss": 1.9693498611450195, "Full-pretrain/Loss (Raw)": 1.5226041078567505, "Full-pretrain/Step": 4302, "Full-pretrain/Step Time": 17.555599752813578} +{"Full-pretrain/Learning Rate": 3.012579105184322e-05, "Full-pretrain/Loss": 1.9603010416030884, "Full-pretrain/Loss (Raw)": 1.8046679496765137, "Full-pretrain/Step": 4303, "Full-pretrain/Step Time": 17.557241635397077} +{"Full-pretrain/Learning Rate": 3.0117480349341114e-05, "Full-pretrain/Loss": 1.9645464420318604, "Full-pretrain/Loss (Raw)": 1.97516930103302, "Full-pretrain/Step": 4304, "Full-pretrain/Step Time": 17.560295462608337} +{"Full-pretrain/Learning Rate": 3.010916905653945e-05, "Full-pretrain/Loss": 1.9643744230270386, "Full-pretrain/Loss (Raw)": 1.9474766254425049, "Full-pretrain/Step": 4305, "Full-pretrain/Step Time": 17.55528563633561} +{"Full-pretrain/Learning Rate": 3.0100857174396922e-05, "Full-pretrain/Loss": 1.9633866548538208, "Full-pretrain/Loss (Raw)": 1.8203774690628052, "Full-pretrain/Step": 4306, "Full-pretrain/Step Time": 17.549829859286547} +{"Full-pretrain/Learning Rate": 3.0092544703872315e-05, "Full-pretrain/Loss": 1.968919277191162, "Full-pretrain/Loss (Raw)": 2.332228660583496, "Full-pretrain/Step": 4307, "Full-pretrain/Step Time": 17.54816723614931} +{"Full-pretrain/Learning Rate": 3.008423164592447e-05, "Full-pretrain/Loss": 1.9726462364196777, "Full-pretrain/Loss (Raw)": 2.017392158508301, "Full-pretrain/Step": 4308, "Full-pretrain/Step Time": 17.547685507684946} +{"Full-pretrain/Learning Rate": 3.0075918001512286e-05, "Full-pretrain/Loss": 1.982171893119812, "Full-pretrain/Loss (Raw)": 1.7259197235107422, "Full-pretrain/Step": 4309, "Full-pretrain/Step Time": 17.542603278532624} +{"Full-pretrain/Learning Rate": 3.0067603771594748e-05, "Full-pretrain/Loss": 1.9815126657485962, "Full-pretrain/Loss (Raw)": 1.8660967350006104, "Full-pretrain/Step": 4310, "Full-pretrain/Step Time": 17.541127622127533} +{"Full-pretrain/Learning Rate": 3.0059288957130892e-05, "Full-pretrain/Loss": 1.986242651939392, "Full-pretrain/Loss (Raw)": 2.179745674133301, "Full-pretrain/Step": 4311, "Full-pretrain/Step Time": 17.535054102540016} +{"Full-pretrain/Learning Rate": 3.005097355907984e-05, "Full-pretrain/Loss": 1.97885000705719, "Full-pretrain/Loss (Raw)": 1.8287153244018555, "Full-pretrain/Step": 4312, "Full-pretrain/Step Time": 17.535344058647752} +{"Full-pretrain/Learning Rate": 3.0042657578400763e-05, "Full-pretrain/Loss": 1.9855539798736572, "Full-pretrain/Loss (Raw)": 2.123976945877075, "Full-pretrain/Step": 4313, "Full-pretrain/Step Time": 17.534874320030212} +{"Full-pretrain/Learning Rate": 3.0034341016052897e-05, "Full-pretrain/Loss": 1.9844486713409424, "Full-pretrain/Loss (Raw)": 1.9538328647613525, "Full-pretrain/Step": 4314, "Full-pretrain/Step Time": 17.54065065830946} +{"Full-pretrain/Learning Rate": 3.0026023872995567e-05, "Full-pretrain/Loss": 1.981335163116455, "Full-pretrain/Loss (Raw)": 1.9960660934448242, "Full-pretrain/Step": 4315, "Full-pretrain/Step Time": 17.544185046106577} +{"Full-pretrain/Learning Rate": 3.0017706150188153e-05, "Full-pretrain/Loss": 1.9767318964004517, "Full-pretrain/Loss (Raw)": 1.9018588066101074, "Full-pretrain/Step": 4316, "Full-pretrain/Step Time": 17.547539457678795} +{"Full-pretrain/Learning Rate": 3.0009387848590094e-05, "Full-pretrain/Loss": 1.9763603210449219, "Full-pretrain/Loss (Raw)": 1.9930098056793213, "Full-pretrain/Step": 4317, "Full-pretrain/Step Time": 17.544305816292763} +{"Full-pretrain/Learning Rate": 3.000106896916091e-05, "Full-pretrain/Loss": 1.9783589839935303, "Full-pretrain/Loss (Raw)": 2.1105947494506836, "Full-pretrain/Step": 4318, "Full-pretrain/Step Time": 17.543560028076172} +{"Full-pretrain/Learning Rate": 2.9992749512860173e-05, "Full-pretrain/Loss": 1.9762539863586426, "Full-pretrain/Loss (Raw)": 2.0222630500793457, "Full-pretrain/Step": 4319, "Full-pretrain/Step Time": 17.55182963423431} +{"Full-pretrain/Learning Rate": 2.9984429480647548e-05, "Full-pretrain/Loss": 1.9813733100891113, "Full-pretrain/Loss (Raw)": 1.960410714149475, "Full-pretrain/Step": 4320, "Full-pretrain/Step Time": 17.550842301920056} +{"Full-pretrain/Learning Rate": 2.997610887348272e-05, "Full-pretrain/Loss": 1.9806181192398071, "Full-pretrain/Loss (Raw)": 2.0948967933654785, "Full-pretrain/Step": 4321, "Full-pretrain/Step Time": 17.54987070709467} +{"Full-pretrain/Learning Rate": 2.996778769232549e-05, "Full-pretrain/Loss": 1.9699053764343262, "Full-pretrain/Loss (Raw)": 1.8547773361206055, "Full-pretrain/Step": 4322, "Full-pretrain/Step Time": 17.54647494852543} +{"Full-pretrain/Learning Rate": 2.995946593813569e-05, "Full-pretrain/Loss": 1.9744184017181396, "Full-pretrain/Loss (Raw)": 2.001570463180542, "Full-pretrain/Step": 4323, "Full-pretrain/Step Time": 17.556884843856096} +{"Full-pretrain/Learning Rate": 2.995114361187324e-05, "Full-pretrain/Loss": 1.9728798866271973, "Full-pretrain/Loss (Raw)": 1.9497877359390259, "Full-pretrain/Step": 4324, "Full-pretrain/Step Time": 17.55787425301969} +{"Full-pretrain/Learning Rate": 2.994282071449811e-05, "Full-pretrain/Loss": 1.970384120941162, "Full-pretrain/Loss (Raw)": 1.8518457412719727, "Full-pretrain/Step": 4325, "Full-pretrain/Step Time": 17.55983685515821} +{"Full-pretrain/Learning Rate": 2.9934497246970357e-05, "Full-pretrain/Loss": 1.972817063331604, "Full-pretrain/Loss (Raw)": 2.210177421569824, "Full-pretrain/Step": 4326, "Full-pretrain/Step Time": 17.558543641120195} +{"Full-pretrain/Learning Rate": 2.992617321025007e-05, "Full-pretrain/Loss": 1.9729959964752197, "Full-pretrain/Loss (Raw)": 2.0738162994384766, "Full-pretrain/Step": 4327, "Full-pretrain/Step Time": 17.559779098257422} +{"Full-pretrain/Learning Rate": 2.9917848605297437e-05, "Full-pretrain/Loss": 1.9674925804138184, "Full-pretrain/Loss (Raw)": 1.8760825395584106, "Full-pretrain/Step": 4328, "Full-pretrain/Step Time": 17.56283761933446} +{"Full-pretrain/Learning Rate": 2.99095234330727e-05, "Full-pretrain/Loss": 1.9627745151519775, "Full-pretrain/Loss (Raw)": 1.9353801012039185, "Full-pretrain/Step": 4329, "Full-pretrain/Step Time": 17.557391203939915} +{"Full-pretrain/Learning Rate": 2.990119769453616e-05, "Full-pretrain/Loss": 1.965635895729065, "Full-pretrain/Loss (Raw)": 1.9261486530303955, "Full-pretrain/Step": 4330, "Full-pretrain/Step Time": 17.556988960132003} +{"Full-pretrain/Learning Rate": 2.989287139064819e-05, "Full-pretrain/Loss": 1.9562166929244995, "Full-pretrain/Loss (Raw)": 1.9431569576263428, "Full-pretrain/Step": 4331, "Full-pretrain/Step Time": 17.558787625283003} +{"Full-pretrain/Learning Rate": 2.988454452236922e-05, "Full-pretrain/Loss": 1.9561843872070312, "Full-pretrain/Loss (Raw)": 1.9484806060791016, "Full-pretrain/Step": 4332, "Full-pretrain/Step Time": 17.556911593303084} +{"Full-pretrain/Learning Rate": 2.9876217090659753e-05, "Full-pretrain/Loss": 1.9519340991973877, "Full-pretrain/Loss (Raw)": 1.7133643627166748, "Full-pretrain/Step": 4333, "Full-pretrain/Step Time": 17.560423389077187} +{"Full-pretrain/Learning Rate": 2.9867889096480362e-05, "Full-pretrain/Loss": 1.970095157623291, "Full-pretrain/Loss (Raw)": 2.1037535667419434, "Full-pretrain/Step": 4334, "Full-pretrain/Step Time": 17.556223621591926} +{"Full-pretrain/Learning Rate": 2.985956054079167e-05, "Full-pretrain/Loss": 1.9742932319641113, "Full-pretrain/Loss (Raw)": 1.9390116930007935, "Full-pretrain/Step": 4335, "Full-pretrain/Step Time": 17.55991361103952} +{"Full-pretrain/Learning Rate": 2.985123142455438e-05, "Full-pretrain/Loss": 1.9697704315185547, "Full-pretrain/Loss (Raw)": 1.8304373025894165, "Full-pretrain/Step": 4336, "Full-pretrain/Step Time": 17.56335205771029} +{"Full-pretrain/Learning Rate": 2.9842901748729256e-05, "Full-pretrain/Loss": 1.9705028533935547, "Full-pretrain/Loss (Raw)": 1.9709175825119019, "Full-pretrain/Step": 4337, "Full-pretrain/Step Time": 17.56137734465301} +{"Full-pretrain/Learning Rate": 2.9834571514277116e-05, "Full-pretrain/Loss": 1.9788458347320557, "Full-pretrain/Loss (Raw)": 2.087352752685547, "Full-pretrain/Step": 4338, "Full-pretrain/Step Time": 17.562138866633177} +{"Full-pretrain/Learning Rate": 2.982624072215885e-05, "Full-pretrain/Loss": 1.9729098081588745, "Full-pretrain/Loss (Raw)": 2.142274856567383, "Full-pretrain/Step": 4339, "Full-pretrain/Step Time": 17.56188715621829} +{"Full-pretrain/Learning Rate": 2.9817909373335405e-05, "Full-pretrain/Loss": 1.9797148704528809, "Full-pretrain/Loss (Raw)": 2.23515248298645, "Full-pretrain/Step": 4340, "Full-pretrain/Step Time": 17.563388470560312} +{"Full-pretrain/Learning Rate": 2.9809577468767813e-05, "Full-pretrain/Loss": 1.9891383647918701, "Full-pretrain/Loss (Raw)": 2.0274736881256104, "Full-pretrain/Step": 4341, "Full-pretrain/Step Time": 17.56809308193624} +{"Full-pretrain/Learning Rate": 2.9801245009417155e-05, "Full-pretrain/Loss": 1.987243413925171, "Full-pretrain/Loss (Raw)": 1.8054574728012085, "Full-pretrain/Step": 4342, "Full-pretrain/Step Time": 17.56973156146705} +{"Full-pretrain/Learning Rate": 2.979291199624456e-05, "Full-pretrain/Loss": 1.9795653820037842, "Full-pretrain/Loss (Raw)": 1.934047818183899, "Full-pretrain/Step": 4343, "Full-pretrain/Step Time": 17.571624720469117} +{"Full-pretrain/Learning Rate": 2.978457843021126e-05, "Full-pretrain/Loss": 1.9836000204086304, "Full-pretrain/Loss (Raw)": 1.9578226804733276, "Full-pretrain/Step": 4344, "Full-pretrain/Step Time": 17.574304219335318} +{"Full-pretrain/Learning Rate": 2.9776244312278518e-05, "Full-pretrain/Loss": 1.9782997369766235, "Full-pretrain/Loss (Raw)": 1.954367756843567, "Full-pretrain/Step": 4345, "Full-pretrain/Step Time": 17.57105758599937} +{"Full-pretrain/Learning Rate": 2.9767909643407675e-05, "Full-pretrain/Loss": 1.9855201244354248, "Full-pretrain/Loss (Raw)": 2.1848855018615723, "Full-pretrain/Step": 4346, "Full-pretrain/Step Time": 17.57021783106029} +{"Full-pretrain/Learning Rate": 2.975957442456013e-05, "Full-pretrain/Loss": 1.9820997714996338, "Full-pretrain/Loss (Raw)": 1.886613368988037, "Full-pretrain/Step": 4347, "Full-pretrain/Step Time": 17.571575459092855} +{"Full-pretrain/Learning Rate": 2.9751238656697344e-05, "Full-pretrain/Loss": 1.982140302658081, "Full-pretrain/Loss (Raw)": 1.9031577110290527, "Full-pretrain/Step": 4348, "Full-pretrain/Step Time": 17.576104637235403} +{"Full-pretrain/Learning Rate": 2.9742902340780848e-05, "Full-pretrain/Loss": 1.9858551025390625, "Full-pretrain/Loss (Raw)": 2.1118857860565186, "Full-pretrain/Step": 4349, "Full-pretrain/Step Time": 17.574316672980785} +{"Full-pretrain/Learning Rate": 2.9734565477772236e-05, "Full-pretrain/Loss": 1.9766061305999756, "Full-pretrain/Loss (Raw)": 1.8146235942840576, "Full-pretrain/Step": 4350, "Full-pretrain/Step Time": 17.57277404330671} +{"Full-pretrain/Learning Rate": 2.9726228068633155e-05, "Full-pretrain/Loss": 1.976039171218872, "Full-pretrain/Loss (Raw)": 2.004124641418457, "Full-pretrain/Step": 4351, "Full-pretrain/Step Time": 17.5766574293375} +{"Full-pretrain/Learning Rate": 2.9717890114325336e-05, "Full-pretrain/Loss": 1.9747852087020874, "Full-pretrain/Loss (Raw)": 1.9202816486358643, "Full-pretrain/Step": 4352, "Full-pretrain/Step Time": 17.58150092512369} +{"Full-pretrain/Learning Rate": 2.9709551615810544e-05, "Full-pretrain/Loss": 1.9664030075073242, "Full-pretrain/Loss (Raw)": 1.826664686203003, "Full-pretrain/Step": 4353, "Full-pretrain/Step Time": 17.580689769238234} +{"Full-pretrain/Learning Rate": 2.9701212574050636e-05, "Full-pretrain/Loss": 1.9655942916870117, "Full-pretrain/Loss (Raw)": 1.8289004564285278, "Full-pretrain/Step": 4354, "Full-pretrain/Step Time": 17.576815988868475} +{"Full-pretrain/Learning Rate": 2.9692872990007503e-05, "Full-pretrain/Loss": 1.9734184741973877, "Full-pretrain/Loss (Raw)": 2.251943588256836, "Full-pretrain/Step": 4355, "Full-pretrain/Step Time": 17.575859727337956} +{"Full-pretrain/Learning Rate": 2.9684532864643122e-05, "Full-pretrain/Loss": 1.9724199771881104, "Full-pretrain/Loss (Raw)": 1.9178340435028076, "Full-pretrain/Step": 4356, "Full-pretrain/Step Time": 17.57627266831696} +{"Full-pretrain/Learning Rate": 2.9676192198919518e-05, "Full-pretrain/Loss": 1.9855122566223145, "Full-pretrain/Loss (Raw)": 2.2708003520965576, "Full-pretrain/Step": 4357, "Full-pretrain/Step Time": 17.57529044151306} +{"Full-pretrain/Learning Rate": 2.966785099379879e-05, "Full-pretrain/Loss": 1.9772759675979614, "Full-pretrain/Loss (Raw)": 1.9466150999069214, "Full-pretrain/Step": 4358, "Full-pretrain/Step Time": 17.58141453191638} +{"Full-pretrain/Learning Rate": 2.9659509250243085e-05, "Full-pretrain/Loss": 1.9852209091186523, "Full-pretrain/Loss (Raw)": 2.328056573867798, "Full-pretrain/Step": 4359, "Full-pretrain/Step Time": 17.579597923904657} +{"Full-pretrain/Learning Rate": 2.9651166969214633e-05, "Full-pretrain/Loss": 1.9906373023986816, "Full-pretrain/Loss (Raw)": 2.049407482147217, "Full-pretrain/Step": 4360, "Full-pretrain/Step Time": 17.584669835865498} +{"Full-pretrain/Learning Rate": 2.9642824151675702e-05, "Full-pretrain/Loss": 1.9985055923461914, "Full-pretrain/Loss (Raw)": 2.1871635913848877, "Full-pretrain/Step": 4361, "Full-pretrain/Step Time": 17.5840206425637} +{"Full-pretrain/Learning Rate": 2.9634480798588637e-05, "Full-pretrain/Loss": 1.9980570077896118, "Full-pretrain/Loss (Raw)": 1.9117916822433472, "Full-pretrain/Step": 4362, "Full-pretrain/Step Time": 17.583185203373432} +{"Full-pretrain/Learning Rate": 2.9626136910915846e-05, "Full-pretrain/Loss": 1.9903638362884521, "Full-pretrain/Loss (Raw)": 1.6969807147979736, "Full-pretrain/Step": 4363, "Full-pretrain/Step Time": 17.58767482638359} +{"Full-pretrain/Learning Rate": 2.9617792489619776e-05, "Full-pretrain/Loss": 1.9884692430496216, "Full-pretrain/Loss (Raw)": 1.8878517150878906, "Full-pretrain/Step": 4364, "Full-pretrain/Step Time": 17.585749357938766} +{"Full-pretrain/Learning Rate": 2.9609447535662972e-05, "Full-pretrain/Loss": 1.9977517127990723, "Full-pretrain/Loss (Raw)": 2.0104007720947266, "Full-pretrain/Step": 4365, "Full-pretrain/Step Time": 17.580806639045477} +{"Full-pretrain/Learning Rate": 2.9601102050008018e-05, "Full-pretrain/Loss": 1.9862468242645264, "Full-pretrain/Loss (Raw)": 1.7355999946594238, "Full-pretrain/Step": 4366, "Full-pretrain/Step Time": 17.58240409195423} +{"Full-pretrain/Learning Rate": 2.9592756033617554e-05, "Full-pretrain/Loss": 1.9796077013015747, "Full-pretrain/Loss (Raw)": 1.7265598773956299, "Full-pretrain/Step": 4367, "Full-pretrain/Step Time": 17.580724695697427} +{"Full-pretrain/Learning Rate": 2.95844094874543e-05, "Full-pretrain/Loss": 1.9779245853424072, "Full-pretrain/Loss (Raw)": 1.7765789031982422, "Full-pretrain/Step": 4368, "Full-pretrain/Step Time": 17.576569320634007} +{"Full-pretrain/Learning Rate": 2.957606241248102e-05, "Full-pretrain/Loss": 1.9756364822387695, "Full-pretrain/Loss (Raw)": 1.8976953029632568, "Full-pretrain/Step": 4369, "Full-pretrain/Step Time": 17.576827878132463} +{"Full-pretrain/Learning Rate": 2.9567714809660552e-05, "Full-pretrain/Loss": 1.9744999408721924, "Full-pretrain/Loss (Raw)": 2.050985813140869, "Full-pretrain/Step": 4370, "Full-pretrain/Step Time": 17.583436746150255} +{"Full-pretrain/Learning Rate": 2.955936667995578e-05, "Full-pretrain/Loss": 1.9625258445739746, "Full-pretrain/Loss (Raw)": 1.759103536605835, "Full-pretrain/Step": 4371, "Full-pretrain/Step Time": 17.578532995656133} +{"Full-pretrain/Learning Rate": 2.9551018024329668e-05, "Full-pretrain/Loss": 1.944166898727417, "Full-pretrain/Loss (Raw)": 1.6476647853851318, "Full-pretrain/Step": 4372, "Full-pretrain/Step Time": 17.571272429078817} +{"Full-pretrain/Learning Rate": 2.954266884374523e-05, "Full-pretrain/Loss": 1.9541621208190918, "Full-pretrain/Loss (Raw)": 2.3473188877105713, "Full-pretrain/Step": 4373, "Full-pretrain/Step Time": 17.574724808335304} +{"Full-pretrain/Learning Rate": 2.953431913916553e-05, "Full-pretrain/Loss": 1.9649760723114014, "Full-pretrain/Loss (Raw)": 2.1515049934387207, "Full-pretrain/Step": 4374, "Full-pretrain/Step Time": 17.57752464711666} +{"Full-pretrain/Learning Rate": 2.9525968911553707e-05, "Full-pretrain/Loss": 1.9669692516326904, "Full-pretrain/Loss (Raw)": 1.9978300333023071, "Full-pretrain/Step": 4375, "Full-pretrain/Step Time": 17.58049438893795} +{"Full-pretrain/Learning Rate": 2.9517618161872973e-05, "Full-pretrain/Loss": 1.9679102897644043, "Full-pretrain/Loss (Raw)": 1.9879353046417236, "Full-pretrain/Step": 4376, "Full-pretrain/Step Time": 17.575011184439063} +{"Full-pretrain/Learning Rate": 2.950926689108656e-05, "Full-pretrain/Loss": 1.9636294841766357, "Full-pretrain/Loss (Raw)": 1.8173811435699463, "Full-pretrain/Step": 4377, "Full-pretrain/Step Time": 17.58121678046882} +{"Full-pretrain/Learning Rate": 2.95009151001578e-05, "Full-pretrain/Loss": 1.9556519985198975, "Full-pretrain/Loss (Raw)": 1.9296070337295532, "Full-pretrain/Step": 4378, "Full-pretrain/Step Time": 17.584001583978534} +{"Full-pretrain/Learning Rate": 2.9492562790050072e-05, "Full-pretrain/Loss": 1.965796709060669, "Full-pretrain/Loss (Raw)": 2.211247682571411, "Full-pretrain/Step": 4379, "Full-pretrain/Step Time": 17.58715914748609} +{"Full-pretrain/Learning Rate": 2.9484209961726798e-05, "Full-pretrain/Loss": 1.9692091941833496, "Full-pretrain/Loss (Raw)": 2.012355327606201, "Full-pretrain/Step": 4380, "Full-pretrain/Step Time": 17.585495932027698} +{"Full-pretrain/Learning Rate": 2.9475856616151488e-05, "Full-pretrain/Loss": 1.958464503288269, "Full-pretrain/Loss (Raw)": 1.7680537700653076, "Full-pretrain/Step": 4381, "Full-pretrain/Step Time": 17.591977825388312} +{"Full-pretrain/Learning Rate": 2.946750275428768e-05, "Full-pretrain/Loss": 1.9670116901397705, "Full-pretrain/Loss (Raw)": 2.0881361961364746, "Full-pretrain/Step": 4382, "Full-pretrain/Step Time": 17.59043743647635} +{"Full-pretrain/Learning Rate": 2.9459148377099e-05, "Full-pretrain/Loss": 1.9625701904296875, "Full-pretrain/Loss (Raw)": 1.8619953393936157, "Full-pretrain/Step": 4383, "Full-pretrain/Step Time": 17.592132981866598} +{"Full-pretrain/Learning Rate": 2.9450793485549128e-05, "Full-pretrain/Loss": 1.964827060699463, "Full-pretrain/Loss (Raw)": 1.9925010204315186, "Full-pretrain/Step": 4384, "Full-pretrain/Step Time": 17.59290638193488} +{"Full-pretrain/Learning Rate": 2.9442438080601787e-05, "Full-pretrain/Loss": 1.9688732624053955, "Full-pretrain/Loss (Raw)": 1.9561426639556885, "Full-pretrain/Step": 4385, "Full-pretrain/Step Time": 17.589912448078394} +{"Full-pretrain/Learning Rate": 2.9434082163220773e-05, "Full-pretrain/Loss": 1.9709866046905518, "Full-pretrain/Loss (Raw)": 1.8965250253677368, "Full-pretrain/Step": 4386, "Full-pretrain/Step Time": 17.58479392901063} +{"Full-pretrain/Learning Rate": 2.9425725734369946e-05, "Full-pretrain/Loss": 1.9646834135055542, "Full-pretrain/Loss (Raw)": 2.050243377685547, "Full-pretrain/Step": 4387, "Full-pretrain/Step Time": 17.59452036395669} +{"Full-pretrain/Learning Rate": 2.941736879501321e-05, "Full-pretrain/Loss": 1.9692351818084717, "Full-pretrain/Loss (Raw)": 2.0634899139404297, "Full-pretrain/Step": 4388, "Full-pretrain/Step Time": 17.59809142164886} +{"Full-pretrain/Learning Rate": 2.940901134611454e-05, "Full-pretrain/Loss": 1.9538028240203857, "Full-pretrain/Loss (Raw)": 1.7769638299942017, "Full-pretrain/Step": 4389, "Full-pretrain/Step Time": 17.58938323520124} +{"Full-pretrain/Learning Rate": 2.940065338863795e-05, "Full-pretrain/Loss": 1.9553337097167969, "Full-pretrain/Loss (Raw)": 1.9956010580062866, "Full-pretrain/Step": 4390, "Full-pretrain/Step Time": 17.587750731036067} +{"Full-pretrain/Learning Rate": 2.939229492354754e-05, "Full-pretrain/Loss": 1.9410876035690308, "Full-pretrain/Loss (Raw)": 1.8721849918365479, "Full-pretrain/Step": 4391, "Full-pretrain/Step Time": 17.591823866590858} +{"Full-pretrain/Learning Rate": 2.938393595180746e-05, "Full-pretrain/Loss": 1.9550057649612427, "Full-pretrain/Loss (Raw)": 2.4947872161865234, "Full-pretrain/Step": 4392, "Full-pretrain/Step Time": 17.591135784983635} +{"Full-pretrain/Learning Rate": 2.9375576474381905e-05, "Full-pretrain/Loss": 1.948517084121704, "Full-pretrain/Loss (Raw)": 1.9795290231704712, "Full-pretrain/Step": 4393, "Full-pretrain/Step Time": 17.594306010752916} +{"Full-pretrain/Learning Rate": 2.9367216492235138e-05, "Full-pretrain/Loss": 1.943403720855713, "Full-pretrain/Loss (Raw)": 1.7481629848480225, "Full-pretrain/Step": 4394, "Full-pretrain/Step Time": 17.598101260140538} +{"Full-pretrain/Learning Rate": 2.9358856006331487e-05, "Full-pretrain/Loss": 1.9377459287643433, "Full-pretrain/Loss (Raw)": 1.515929937362671, "Full-pretrain/Step": 4395, "Full-pretrain/Step Time": 17.600019324570894} +{"Full-pretrain/Learning Rate": 2.9350495017635334e-05, "Full-pretrain/Loss": 1.938981533050537, "Full-pretrain/Loss (Raw)": 1.9273886680603027, "Full-pretrain/Step": 4396, "Full-pretrain/Step Time": 17.5999976657331} +{"Full-pretrain/Learning Rate": 2.9342133527111105e-05, "Full-pretrain/Loss": 1.9359833002090454, "Full-pretrain/Loss (Raw)": 1.914461612701416, "Full-pretrain/Step": 4397, "Full-pretrain/Step Time": 17.594332493841648} +{"Full-pretrain/Learning Rate": 2.933377153572329e-05, "Full-pretrain/Loss": 1.9394404888153076, "Full-pretrain/Loss (Raw)": 1.8462305068969727, "Full-pretrain/Step": 4398, "Full-pretrain/Step Time": 17.599177587777376} +{"Full-pretrain/Learning Rate": 2.932540904443646e-05, "Full-pretrain/Loss": 1.95106041431427, "Full-pretrain/Loss (Raw)": 2.098395347595215, "Full-pretrain/Step": 4399, "Full-pretrain/Step Time": 17.597447166219354} +{"Full-pretrain/Learning Rate": 2.9317046054215218e-05, "Full-pretrain/Loss": 1.9529540538787842, "Full-pretrain/Loss (Raw)": 1.8371777534484863, "Full-pretrain/Step": 4400, "Full-pretrain/Step Time": 17.60313663445413} +{"Full-pretrain/Learning Rate": 2.9308682566024224e-05, "Full-pretrain/Loss": 1.9576835632324219, "Full-pretrain/Loss (Raw)": 2.0490384101867676, "Full-pretrain/Step": 4401, "Full-pretrain/Step Time": 17.595823507755995} +{"Full-pretrain/Learning Rate": 2.930031858082822e-05, "Full-pretrain/Loss": 1.9547178745269775, "Full-pretrain/Loss (Raw)": 1.956082820892334, "Full-pretrain/Step": 4402, "Full-pretrain/Step Time": 17.594579208642244} +{"Full-pretrain/Learning Rate": 2.9291954099591973e-05, "Full-pretrain/Loss": 1.964966058731079, "Full-pretrain/Loss (Raw)": 2.0870466232299805, "Full-pretrain/Step": 4403, "Full-pretrain/Step Time": 17.594030125066638} +{"Full-pretrain/Learning Rate": 2.928358912328033e-05, "Full-pretrain/Loss": 1.9699912071228027, "Full-pretrain/Loss (Raw)": 1.808469533920288, "Full-pretrain/Step": 4404, "Full-pretrain/Step Time": 17.602129662409425} +{"Full-pretrain/Learning Rate": 2.9275223652858193e-05, "Full-pretrain/Loss": 1.9578604698181152, "Full-pretrain/Loss (Raw)": 1.9591343402862549, "Full-pretrain/Step": 4405, "Full-pretrain/Step Time": 17.597727980464697} +{"Full-pretrain/Learning Rate": 2.92668576892905e-05, "Full-pretrain/Loss": 1.9604976177215576, "Full-pretrain/Loss (Raw)": 2.2358932495117188, "Full-pretrain/Step": 4406, "Full-pretrain/Step Time": 17.59265122190118} +{"Full-pretrain/Learning Rate": 2.9258491233542274e-05, "Full-pretrain/Loss": 1.9604461193084717, "Full-pretrain/Loss (Raw)": 1.9961854219436646, "Full-pretrain/Step": 4407, "Full-pretrain/Step Time": 17.59332912042737} +{"Full-pretrain/Learning Rate": 2.9250124286578584e-05, "Full-pretrain/Loss": 1.9561432600021362, "Full-pretrain/Loss (Raw)": 1.8502421379089355, "Full-pretrain/Step": 4408, "Full-pretrain/Step Time": 17.598380029201508} +{"Full-pretrain/Learning Rate": 2.9241756849364542e-05, "Full-pretrain/Loss": 1.968510627746582, "Full-pretrain/Loss (Raw)": 2.2131404876708984, "Full-pretrain/Step": 4409, "Full-pretrain/Step Time": 17.595888936892152} +{"Full-pretrain/Learning Rate": 2.923338892286535e-05, "Full-pretrain/Loss": 1.9723905324935913, "Full-pretrain/Loss (Raw)": 2.0537586212158203, "Full-pretrain/Step": 4410, "Full-pretrain/Step Time": 17.593969171866775} +{"Full-pretrain/Learning Rate": 2.9225020508046232e-05, "Full-pretrain/Loss": 1.9666122198104858, "Full-pretrain/Loss (Raw)": 2.0263442993164062, "Full-pretrain/Step": 4411, "Full-pretrain/Step Time": 17.59389721043408} +{"Full-pretrain/Learning Rate": 2.921665160587248e-05, "Full-pretrain/Loss": 1.9595146179199219, "Full-pretrain/Loss (Raw)": 1.7852331399917603, "Full-pretrain/Step": 4412, "Full-pretrain/Step Time": 17.594081113114953} +{"Full-pretrain/Learning Rate": 2.9208282217309447e-05, "Full-pretrain/Loss": 1.9585933685302734, "Full-pretrain/Loss (Raw)": 1.7385730743408203, "Full-pretrain/Step": 4413, "Full-pretrain/Step Time": 17.592860413715243} +{"Full-pretrain/Learning Rate": 2.919991234332254e-05, "Full-pretrain/Loss": 1.955709457397461, "Full-pretrain/Loss (Raw)": 1.9958503246307373, "Full-pretrain/Step": 4414, "Full-pretrain/Step Time": 17.59379881620407} +{"Full-pretrain/Learning Rate": 2.9191541984877218e-05, "Full-pretrain/Loss": 1.9560260772705078, "Full-pretrain/Loss (Raw)": 1.8721286058425903, "Full-pretrain/Step": 4415, "Full-pretrain/Step Time": 17.593672450631857} +{"Full-pretrain/Learning Rate": 2.9183171142939005e-05, "Full-pretrain/Loss": 1.9511027336120605, "Full-pretrain/Loss (Raw)": 1.8349549770355225, "Full-pretrain/Step": 4416, "Full-pretrain/Step Time": 17.596102299168706} +{"Full-pretrain/Learning Rate": 2.9174799818473464e-05, "Full-pretrain/Loss": 1.9542622566223145, "Full-pretrain/Loss (Raw)": 2.0572433471679688, "Full-pretrain/Step": 4417, "Full-pretrain/Step Time": 17.596968786790967} +{"Full-pretrain/Learning Rate": 2.916642801244624e-05, "Full-pretrain/Loss": 1.9545561075210571, "Full-pretrain/Loss (Raw)": 1.9059298038482666, "Full-pretrain/Step": 4418, "Full-pretrain/Step Time": 17.589461486786604} +{"Full-pretrain/Learning Rate": 2.9158055725823e-05, "Full-pretrain/Loss": 1.949021577835083, "Full-pretrain/Loss (Raw)": 1.8731374740600586, "Full-pretrain/Step": 4419, "Full-pretrain/Step Time": 17.594509407877922} +{"Full-pretrain/Learning Rate": 2.9149682959569498e-05, "Full-pretrain/Loss": 1.944448709487915, "Full-pretrain/Loss (Raw)": 1.9171597957611084, "Full-pretrain/Step": 4420, "Full-pretrain/Step Time": 17.60067579895258} +{"Full-pretrain/Learning Rate": 2.9141309714651526e-05, "Full-pretrain/Loss": 1.954921841621399, "Full-pretrain/Loss (Raw)": 2.1121020317077637, "Full-pretrain/Step": 4421, "Full-pretrain/Step Time": 17.60063479654491} +{"Full-pretrain/Learning Rate": 2.9132935992034938e-05, "Full-pretrain/Loss": 1.9482287168502808, "Full-pretrain/Loss (Raw)": 1.7814233303070068, "Full-pretrain/Step": 4422, "Full-pretrain/Step Time": 17.59604823961854} +{"Full-pretrain/Learning Rate": 2.912456179268563e-05, "Full-pretrain/Loss": 1.9547539949417114, "Full-pretrain/Loss (Raw)": 2.0809929370880127, "Full-pretrain/Step": 4423, "Full-pretrain/Step Time": 17.598693231120706} +{"Full-pretrain/Learning Rate": 2.9116187117569564e-05, "Full-pretrain/Loss": 1.9375677108764648, "Full-pretrain/Loss (Raw)": 1.9448294639587402, "Full-pretrain/Step": 4424, "Full-pretrain/Step Time": 17.598646707832813} +{"Full-pretrain/Learning Rate": 2.9107811967652766e-05, "Full-pretrain/Loss": 1.9348628520965576, "Full-pretrain/Loss (Raw)": 1.8929734230041504, "Full-pretrain/Step": 4425, "Full-pretrain/Step Time": 17.601108441129327} +{"Full-pretrain/Learning Rate": 2.9099436343901306e-05, "Full-pretrain/Loss": 1.9436650276184082, "Full-pretrain/Loss (Raw)": 2.029831886291504, "Full-pretrain/Step": 4426, "Full-pretrain/Step Time": 17.600835049524903} +{"Full-pretrain/Learning Rate": 2.909106024728129e-05, "Full-pretrain/Loss": 1.9528608322143555, "Full-pretrain/Loss (Raw)": 1.8101942539215088, "Full-pretrain/Step": 4427, "Full-pretrain/Step Time": 17.599285185337067} +{"Full-pretrain/Learning Rate": 2.908268367875892e-05, "Full-pretrain/Loss": 1.9550800323486328, "Full-pretrain/Loss (Raw)": 1.9984023571014404, "Full-pretrain/Step": 4428, "Full-pretrain/Step Time": 17.600488547235727} +{"Full-pretrain/Learning Rate": 2.9074306639300424e-05, "Full-pretrain/Loss": 1.957174301147461, "Full-pretrain/Loss (Raw)": 1.9814776182174683, "Full-pretrain/Step": 4429, "Full-pretrain/Step Time": 17.598503032699227} +{"Full-pretrain/Learning Rate": 2.9065929129872094e-05, "Full-pretrain/Loss": 1.9600569009780884, "Full-pretrain/Loss (Raw)": 1.9384727478027344, "Full-pretrain/Step": 4430, "Full-pretrain/Step Time": 17.597998585551977} +{"Full-pretrain/Learning Rate": 2.9057551151440265e-05, "Full-pretrain/Loss": 1.9544224739074707, "Full-pretrain/Loss (Raw)": 1.9180951118469238, "Full-pretrain/Step": 4431, "Full-pretrain/Step Time": 17.594776324927807} +{"Full-pretrain/Learning Rate": 2.9049172704971332e-05, "Full-pretrain/Loss": 1.9573404788970947, "Full-pretrain/Loss (Raw)": 1.930549144744873, "Full-pretrain/Step": 4432, "Full-pretrain/Step Time": 17.590613592416048} +{"Full-pretrain/Learning Rate": 2.904079379143175e-05, "Full-pretrain/Loss": 1.9481875896453857, "Full-pretrain/Loss (Raw)": 1.7561500072479248, "Full-pretrain/Step": 4433, "Full-pretrain/Step Time": 17.593052690848708} +{"Full-pretrain/Learning Rate": 2.9032414411788027e-05, "Full-pretrain/Loss": 1.9468750953674316, "Full-pretrain/Loss (Raw)": 1.9140803813934326, "Full-pretrain/Step": 4434, "Full-pretrain/Step Time": 17.597830211743712} +{"Full-pretrain/Learning Rate": 2.902403456700672e-05, "Full-pretrain/Loss": 1.937728762626648, "Full-pretrain/Loss (Raw)": 1.7943646907806396, "Full-pretrain/Step": 4435, "Full-pretrain/Step Time": 17.599255988374352} +{"Full-pretrain/Learning Rate": 2.901565425805443e-05, "Full-pretrain/Loss": 1.9431489706039429, "Full-pretrain/Loss (Raw)": 1.981918454170227, "Full-pretrain/Step": 4436, "Full-pretrain/Step Time": 17.594711085781455} +{"Full-pretrain/Learning Rate": 2.9007273485897847e-05, "Full-pretrain/Loss": 1.946652889251709, "Full-pretrain/Loss (Raw)": 2.071258068084717, "Full-pretrain/Step": 4437, "Full-pretrain/Step Time": 17.596936402842402} +{"Full-pretrain/Learning Rate": 2.8998892251503675e-05, "Full-pretrain/Loss": 1.9402334690093994, "Full-pretrain/Loss (Raw)": 2.030473232269287, "Full-pretrain/Step": 4438, "Full-pretrain/Step Time": 17.600273629650474} +{"Full-pretrain/Learning Rate": 2.899051055583868e-05, "Full-pretrain/Loss": 1.9393621683120728, "Full-pretrain/Loss (Raw)": 1.9683036804199219, "Full-pretrain/Step": 4439, "Full-pretrain/Step Time": 17.60942686535418} +{"Full-pretrain/Learning Rate": 2.898212839986969e-05, "Full-pretrain/Loss": 1.944474458694458, "Full-pretrain/Loss (Raw)": 2.0138392448425293, "Full-pretrain/Step": 4440, "Full-pretrain/Step Time": 17.608768997713923} +{"Full-pretrain/Learning Rate": 2.8973745784563593e-05, "Full-pretrain/Loss": 1.9359188079833984, "Full-pretrain/Loss (Raw)": 1.9393534660339355, "Full-pretrain/Step": 4441, "Full-pretrain/Step Time": 17.605361368507147} +{"Full-pretrain/Learning Rate": 2.8965362710887324e-05, "Full-pretrain/Loss": 1.9268364906311035, "Full-pretrain/Loss (Raw)": 1.7631306648254395, "Full-pretrain/Step": 4442, "Full-pretrain/Step Time": 17.601173039525747} +{"Full-pretrain/Learning Rate": 2.8956979179807846e-05, "Full-pretrain/Loss": 1.9292386770248413, "Full-pretrain/Loss (Raw)": 2.1032121181488037, "Full-pretrain/Step": 4443, "Full-pretrain/Step Time": 17.59924591332674} +{"Full-pretrain/Learning Rate": 2.8948595192292216e-05, "Full-pretrain/Loss": 1.9372496604919434, "Full-pretrain/Loss (Raw)": 2.041583776473999, "Full-pretrain/Step": 4444, "Full-pretrain/Step Time": 17.604657862335443} +{"Full-pretrain/Learning Rate": 2.8940210749307522e-05, "Full-pretrain/Loss": 1.9463493824005127, "Full-pretrain/Loss (Raw)": 2.0297648906707764, "Full-pretrain/Step": 4445, "Full-pretrain/Step Time": 17.60335949808359} +{"Full-pretrain/Learning Rate": 2.8931825851820904e-05, "Full-pretrain/Loss": 1.9415161609649658, "Full-pretrain/Loss (Raw)": 1.841184139251709, "Full-pretrain/Step": 4446, "Full-pretrain/Step Time": 17.60937392897904} +{"Full-pretrain/Learning Rate": 2.8923440500799557e-05, "Full-pretrain/Loss": 1.9365806579589844, "Full-pretrain/Loss (Raw)": 1.7141960859298706, "Full-pretrain/Step": 4447, "Full-pretrain/Step Time": 17.606299912557006} +{"Full-pretrain/Learning Rate": 2.891505469721072e-05, "Full-pretrain/Loss": 1.9446182250976562, "Full-pretrain/Loss (Raw)": 2.0921578407287598, "Full-pretrain/Step": 4448, "Full-pretrain/Step Time": 17.613707633689046} +{"Full-pretrain/Learning Rate": 2.8906668442021702e-05, "Full-pretrain/Loss": 1.9449063539505005, "Full-pretrain/Loss (Raw)": 2.066460132598877, "Full-pretrain/Step": 4449, "Full-pretrain/Step Time": 17.60760878585279} +{"Full-pretrain/Learning Rate": 2.889828173619985e-05, "Full-pretrain/Loss": 1.948947548866272, "Full-pretrain/Loss (Raw)": 2.0352489948272705, "Full-pretrain/Step": 4450, "Full-pretrain/Step Time": 17.610084416344762} +{"Full-pretrain/Learning Rate": 2.8889894580712574e-05, "Full-pretrain/Loss": 1.9622098207473755, "Full-pretrain/Loss (Raw)": 2.2975287437438965, "Full-pretrain/Step": 4451, "Full-pretrain/Step Time": 17.60190218128264} +{"Full-pretrain/Learning Rate": 2.888150697652732e-05, "Full-pretrain/Loss": 1.9733541011810303, "Full-pretrain/Loss (Raw)": 2.2737789154052734, "Full-pretrain/Step": 4452, "Full-pretrain/Step Time": 17.609726203605533} +{"Full-pretrain/Learning Rate": 2.8873118924611603e-05, "Full-pretrain/Loss": 1.969409465789795, "Full-pretrain/Loss (Raw)": 1.9858720302581787, "Full-pretrain/Step": 4453, "Full-pretrain/Step Time": 17.603564145043492} +{"Full-pretrain/Learning Rate": 2.8864730425932984e-05, "Full-pretrain/Loss": 1.9605883359909058, "Full-pretrain/Loss (Raw)": 1.4991493225097656, "Full-pretrain/Step": 4454, "Full-pretrain/Step Time": 17.60674886405468} +{"Full-pretrain/Learning Rate": 2.8856341481459066e-05, "Full-pretrain/Loss": 1.945221185684204, "Full-pretrain/Loss (Raw)": 1.5892415046691895, "Full-pretrain/Step": 4455, "Full-pretrain/Step Time": 17.60975673235953} +{"Full-pretrain/Learning Rate": 2.884795209215751e-05, "Full-pretrain/Loss": 1.9435476064682007, "Full-pretrain/Loss (Raw)": 1.891275405883789, "Full-pretrain/Step": 4456, "Full-pretrain/Step Time": 17.61307457461953} +{"Full-pretrain/Learning Rate": 2.8839562258996028e-05, "Full-pretrain/Loss": 1.9462504386901855, "Full-pretrain/Loss (Raw)": 1.979462742805481, "Full-pretrain/Step": 4457, "Full-pretrain/Step Time": 17.613484187051654} +{"Full-pretrain/Learning Rate": 2.8831171982942396e-05, "Full-pretrain/Loss": 1.9460535049438477, "Full-pretrain/Loss (Raw)": 2.0235323905944824, "Full-pretrain/Step": 4458, "Full-pretrain/Step Time": 17.61126844212413} +{"Full-pretrain/Learning Rate": 2.882278126496442e-05, "Full-pretrain/Loss": 1.9457628726959229, "Full-pretrain/Loss (Raw)": 1.8008966445922852, "Full-pretrain/Step": 4459, "Full-pretrain/Step Time": 17.60771546140313} +{"Full-pretrain/Learning Rate": 2.881439010602997e-05, "Full-pretrain/Loss": 1.9460254907608032, "Full-pretrain/Loss (Raw)": 2.0068001747131348, "Full-pretrain/Step": 4460, "Full-pretrain/Step Time": 17.61915090121329} +{"Full-pretrain/Learning Rate": 2.8805998507106956e-05, "Full-pretrain/Loss": 1.9485514163970947, "Full-pretrain/Loss (Raw)": 2.062307357788086, "Full-pretrain/Step": 4461, "Full-pretrain/Step Time": 17.613289285451174} +{"Full-pretrain/Learning Rate": 2.8797606469163357e-05, "Full-pretrain/Loss": 1.9554245471954346, "Full-pretrain/Loss (Raw)": 2.158413887023926, "Full-pretrain/Step": 4462, "Full-pretrain/Step Time": 17.611979246139526} +{"Full-pretrain/Learning Rate": 2.8789213993167192e-05, "Full-pretrain/Loss": 1.9389840364456177, "Full-pretrain/Loss (Raw)": 1.3920013904571533, "Full-pretrain/Step": 4463, "Full-pretrain/Step Time": 17.606656624004245} +{"Full-pretrain/Learning Rate": 2.8780821080086516e-05, "Full-pretrain/Loss": 1.94393789768219, "Full-pretrain/Loss (Raw)": 2.0890700817108154, "Full-pretrain/Step": 4464, "Full-pretrain/Step Time": 17.61099706031382} +{"Full-pretrain/Learning Rate": 2.8772427730889463e-05, "Full-pretrain/Loss": 1.9555728435516357, "Full-pretrain/Loss (Raw)": 2.1284704208374023, "Full-pretrain/Step": 4465, "Full-pretrain/Step Time": 17.6110423412174} +{"Full-pretrain/Learning Rate": 2.8764033946544195e-05, "Full-pretrain/Loss": 1.94493567943573, "Full-pretrain/Loss (Raw)": 1.57369065284729, "Full-pretrain/Step": 4466, "Full-pretrain/Step Time": 17.606060789898038} +{"Full-pretrain/Learning Rate": 2.875563972801893e-05, "Full-pretrain/Loss": 1.9493314027786255, "Full-pretrain/Loss (Raw)": 1.9350279569625854, "Full-pretrain/Step": 4467, "Full-pretrain/Step Time": 17.606885485351086} +{"Full-pretrain/Learning Rate": 2.874724507628195e-05, "Full-pretrain/Loss": 1.9462970495224, "Full-pretrain/Loss (Raw)": 1.8848198652267456, "Full-pretrain/Step": 4468, "Full-pretrain/Step Time": 17.611024737358093} +{"Full-pretrain/Learning Rate": 2.873884999230155e-05, "Full-pretrain/Loss": 1.9429271221160889, "Full-pretrain/Loss (Raw)": 1.963423252105713, "Full-pretrain/Step": 4469, "Full-pretrain/Step Time": 17.608593048527837} +{"Full-pretrain/Learning Rate": 2.873045447704613e-05, "Full-pretrain/Loss": 1.9537419080734253, "Full-pretrain/Loss (Raw)": 2.3765459060668945, "Full-pretrain/Step": 4470, "Full-pretrain/Step Time": 17.60525810904801} +{"Full-pretrain/Learning Rate": 2.8722058531484103e-05, "Full-pretrain/Loss": 1.9494792222976685, "Full-pretrain/Loss (Raw)": 1.8318970203399658, "Full-pretrain/Step": 4471, "Full-pretrain/Step Time": 17.608808977529407} +{"Full-pretrain/Learning Rate": 2.8713662156583925e-05, "Full-pretrain/Loss": 1.9584870338439941, "Full-pretrain/Loss (Raw)": 2.302090644836426, "Full-pretrain/Step": 4472, "Full-pretrain/Step Time": 17.61065759882331} +{"Full-pretrain/Learning Rate": 2.8705265353314124e-05, "Full-pretrain/Loss": 1.9572923183441162, "Full-pretrain/Loss (Raw)": 1.901118278503418, "Full-pretrain/Step": 4473, "Full-pretrain/Step Time": 17.613967042416334} +{"Full-pretrain/Learning Rate": 2.8696868122643268e-05, "Full-pretrain/Loss": 1.9644560813903809, "Full-pretrain/Loss (Raw)": 1.9923738241195679, "Full-pretrain/Step": 4474, "Full-pretrain/Step Time": 17.613674115389585} +{"Full-pretrain/Learning Rate": 2.868847046553997e-05, "Full-pretrain/Loss": 1.9608252048492432, "Full-pretrain/Loss (Raw)": 1.987025260925293, "Full-pretrain/Step": 4475, "Full-pretrain/Step Time": 17.611129323020577} +{"Full-pretrain/Learning Rate": 2.86800723829729e-05, "Full-pretrain/Loss": 1.9566593170166016, "Full-pretrain/Loss (Raw)": 1.9082744121551514, "Full-pretrain/Step": 4476, "Full-pretrain/Step Time": 17.611995613202453} +{"Full-pretrain/Learning Rate": 2.8671673875910772e-05, "Full-pretrain/Loss": 1.9551782608032227, "Full-pretrain/Loss (Raw)": 1.9823654890060425, "Full-pretrain/Step": 4477, "Full-pretrain/Step Time": 17.616664400324225} +{"Full-pretrain/Learning Rate": 2.8663274945322355e-05, "Full-pretrain/Loss": 1.9586408138275146, "Full-pretrain/Loss (Raw)": 1.9519891738891602, "Full-pretrain/Step": 4478, "Full-pretrain/Step Time": 17.614569509401917} +{"Full-pretrain/Learning Rate": 2.8654875592176462e-05, "Full-pretrain/Loss": 1.9684200286865234, "Full-pretrain/Loss (Raw)": 2.027132034301758, "Full-pretrain/Step": 4479, "Full-pretrain/Step Time": 17.61005912721157} +{"Full-pretrain/Learning Rate": 2.8646475817441952e-05, "Full-pretrain/Loss": 1.9664647579193115, "Full-pretrain/Loss (Raw)": 2.0295891761779785, "Full-pretrain/Step": 4480, "Full-pretrain/Step Time": 17.61068090610206} +{"Full-pretrain/Learning Rate": 2.8638075622087747e-05, "Full-pretrain/Loss": 1.966280221939087, "Full-pretrain/Loss (Raw)": 2.060555934906006, "Full-pretrain/Step": 4481, "Full-pretrain/Step Time": 17.614248171448708} +{"Full-pretrain/Learning Rate": 2.8629675007082784e-05, "Full-pretrain/Loss": 1.9645310640335083, "Full-pretrain/Loss (Raw)": 1.9792733192443848, "Full-pretrain/Step": 4482, "Full-pretrain/Step Time": 17.615719160065055} +{"Full-pretrain/Learning Rate": 2.862127397339609e-05, "Full-pretrain/Loss": 1.9486215114593506, "Full-pretrain/Loss (Raw)": 1.788424015045166, "Full-pretrain/Step": 4483, "Full-pretrain/Step Time": 17.617436569184065} +{"Full-pretrain/Learning Rate": 2.8612872521996714e-05, "Full-pretrain/Loss": 1.9317971467971802, "Full-pretrain/Loss (Raw)": 1.7354017496109009, "Full-pretrain/Step": 4484, "Full-pretrain/Step Time": 17.613116651773453} +{"Full-pretrain/Learning Rate": 2.8604470653853766e-05, "Full-pretrain/Loss": 1.9399374723434448, "Full-pretrain/Loss (Raw)": 2.2463607788085938, "Full-pretrain/Step": 4485, "Full-pretrain/Step Time": 17.618838109076023} +{"Full-pretrain/Learning Rate": 2.8596068369936386e-05, "Full-pretrain/Loss": 1.9570269584655762, "Full-pretrain/Loss (Raw)": 2.046013832092285, "Full-pretrain/Step": 4486, "Full-pretrain/Step Time": 17.61207709647715} +{"Full-pretrain/Learning Rate": 2.858766567121379e-05, "Full-pretrain/Loss": 1.9592092037200928, "Full-pretrain/Loss (Raw)": 1.6590746641159058, "Full-pretrain/Step": 4487, "Full-pretrain/Step Time": 17.613658148795366} +{"Full-pretrain/Learning Rate": 2.857926255865523e-05, "Full-pretrain/Loss": 1.9599971771240234, "Full-pretrain/Loss (Raw)": 1.916490912437439, "Full-pretrain/Step": 4488, "Full-pretrain/Step Time": 17.613135386258364} +{"Full-pretrain/Learning Rate": 2.857085903322998e-05, "Full-pretrain/Loss": 1.9572196006774902, "Full-pretrain/Loss (Raw)": 1.8905752897262573, "Full-pretrain/Step": 4489, "Full-pretrain/Step Time": 17.61702475696802} +{"Full-pretrain/Learning Rate": 2.8562455095907392e-05, "Full-pretrain/Loss": 1.9595391750335693, "Full-pretrain/Loss (Raw)": 2.0977654457092285, "Full-pretrain/Step": 4490, "Full-pretrain/Step Time": 17.6176913138479} +{"Full-pretrain/Learning Rate": 2.855405074765686e-05, "Full-pretrain/Loss": 1.9766993522644043, "Full-pretrain/Loss (Raw)": 2.3500213623046875, "Full-pretrain/Step": 4491, "Full-pretrain/Step Time": 17.614392487332225} +{"Full-pretrain/Learning Rate": 2.8545645989447832e-05, "Full-pretrain/Loss": 1.9677692651748657, "Full-pretrain/Loss (Raw)": 1.721036672592163, "Full-pretrain/Step": 4492, "Full-pretrain/Step Time": 17.61793086491525} +{"Full-pretrain/Learning Rate": 2.8537240822249784e-05, "Full-pretrain/Loss": 1.9687347412109375, "Full-pretrain/Loss (Raw)": 2.093197822570801, "Full-pretrain/Step": 4493, "Full-pretrain/Step Time": 17.614309342578053} +{"Full-pretrain/Learning Rate": 2.8528835247032242e-05, "Full-pretrain/Loss": 1.9547126293182373, "Full-pretrain/Loss (Raw)": 1.709708571434021, "Full-pretrain/Step": 4494, "Full-pretrain/Step Time": 17.615944858640432} +{"Full-pretrain/Learning Rate": 2.8520429264764805e-05, "Full-pretrain/Loss": 1.9763637781143188, "Full-pretrain/Loss (Raw)": 2.084838390350342, "Full-pretrain/Step": 4495, "Full-pretrain/Step Time": 17.613706612959504} +{"Full-pretrain/Learning Rate": 2.8512022876417087e-05, "Full-pretrain/Loss": 1.9703881740570068, "Full-pretrain/Loss (Raw)": 1.8978534936904907, "Full-pretrain/Step": 4496, "Full-pretrain/Step Time": 17.620250057429075} +{"Full-pretrain/Learning Rate": 2.8503616082958766e-05, "Full-pretrain/Loss": 1.9669733047485352, "Full-pretrain/Loss (Raw)": 2.0191903114318848, "Full-pretrain/Step": 4497, "Full-pretrain/Step Time": 17.615961695089936} +{"Full-pretrain/Learning Rate": 2.8495208885359555e-05, "Full-pretrain/Loss": 1.9823994636535645, "Full-pretrain/Loss (Raw)": 2.0673298835754395, "Full-pretrain/Step": 4498, "Full-pretrain/Step Time": 17.616344025358558} +{"Full-pretrain/Learning Rate": 2.8486801284589225e-05, "Full-pretrain/Loss": 1.9914003610610962, "Full-pretrain/Loss (Raw)": 2.2230546474456787, "Full-pretrain/Step": 4499, "Full-pretrain/Step Time": 17.61869558133185} +{"Full-pretrain/Learning Rate": 2.84783932816176e-05, "Full-pretrain/Loss": 2.0035321712493896, "Full-pretrain/Loss (Raw)": 2.273038864135742, "Full-pretrain/Step": 4500, "Full-pretrain/Step Time": 17.620435481891036} +{"Full-pretrain/Learning Rate": 2.8469984877414525e-05, "Full-pretrain/Loss": 1.9999797344207764, "Full-pretrain/Loss (Raw)": 1.8497456312179565, "Full-pretrain/Step": 4501, "Full-pretrain/Step Time": 17.620274228975177} +{"Full-pretrain/Learning Rate": 2.8461576072949926e-05, "Full-pretrain/Loss": 1.9805738925933838, "Full-pretrain/Loss (Raw)": 1.7555592060089111, "Full-pretrain/Step": 4502, "Full-pretrain/Step Time": 17.615857418626547} +{"Full-pretrain/Learning Rate": 2.8453166869193725e-05, "Full-pretrain/Loss": 1.9826579093933105, "Full-pretrain/Loss (Raw)": 1.8985860347747803, "Full-pretrain/Step": 4503, "Full-pretrain/Step Time": 17.617714509367943} +{"Full-pretrain/Learning Rate": 2.844475726711595e-05, "Full-pretrain/Loss": 1.967634916305542, "Full-pretrain/Loss (Raw)": 1.8213542699813843, "Full-pretrain/Step": 4504, "Full-pretrain/Step Time": 17.61821257509291} +{"Full-pretrain/Learning Rate": 2.8436347267686636e-05, "Full-pretrain/Loss": 1.9726502895355225, "Full-pretrain/Loss (Raw)": 2.0616064071655273, "Full-pretrain/Step": 4505, "Full-pretrain/Step Time": 17.614141209051013} +{"Full-pretrain/Learning Rate": 2.8427936871875876e-05, "Full-pretrain/Loss": 1.9700522422790527, "Full-pretrain/Loss (Raw)": 1.909238338470459, "Full-pretrain/Step": 4506, "Full-pretrain/Step Time": 17.6110207028687} +{"Full-pretrain/Learning Rate": 2.8419526080653792e-05, "Full-pretrain/Loss": 1.9646426439285278, "Full-pretrain/Loss (Raw)": 1.8139184713363647, "Full-pretrain/Step": 4507, "Full-pretrain/Step Time": 17.607035806402564} +{"Full-pretrain/Learning Rate": 2.8411114894990585e-05, "Full-pretrain/Loss": 1.9737789630889893, "Full-pretrain/Loss (Raw)": 2.2006404399871826, "Full-pretrain/Step": 4508, "Full-pretrain/Step Time": 17.602972887456417} +{"Full-pretrain/Learning Rate": 2.8402703315856465e-05, "Full-pretrain/Loss": 1.9662771224975586, "Full-pretrain/Loss (Raw)": 1.7423033714294434, "Full-pretrain/Step": 4509, "Full-pretrain/Step Time": 17.60118437744677} +{"Full-pretrain/Learning Rate": 2.8394291344221724e-05, "Full-pretrain/Loss": 1.9703493118286133, "Full-pretrain/Loss (Raw)": 2.0822982788085938, "Full-pretrain/Step": 4510, "Full-pretrain/Step Time": 17.60456519573927} +{"Full-pretrain/Learning Rate": 2.8385878981056662e-05, "Full-pretrain/Loss": 1.9701054096221924, "Full-pretrain/Loss (Raw)": 2.019327163696289, "Full-pretrain/Step": 4511, "Full-pretrain/Step Time": 17.60003301501274} +{"Full-pretrain/Learning Rate": 2.837746622733165e-05, "Full-pretrain/Loss": 1.9694410562515259, "Full-pretrain/Loss (Raw)": 2.0083305835723877, "Full-pretrain/Step": 4512, "Full-pretrain/Step Time": 17.599040610715747} +{"Full-pretrain/Learning Rate": 2.8369053084017094e-05, "Full-pretrain/Loss": 1.9684962034225464, "Full-pretrain/Loss (Raw)": 2.030320167541504, "Full-pretrain/Step": 4513, "Full-pretrain/Step Time": 17.59361646696925} +{"Full-pretrain/Learning Rate": 2.8360639552083455e-05, "Full-pretrain/Loss": 1.9711683988571167, "Full-pretrain/Loss (Raw)": 2.0647835731506348, "Full-pretrain/Step": 4514, "Full-pretrain/Step Time": 17.596893856301904} +{"Full-pretrain/Learning Rate": 2.8352225632501224e-05, "Full-pretrain/Loss": 1.9792355298995972, "Full-pretrain/Loss (Raw)": 2.0465755462646484, "Full-pretrain/Step": 4515, "Full-pretrain/Step Time": 17.591044088825583} +{"Full-pretrain/Learning Rate": 2.8343811326240945e-05, "Full-pretrain/Loss": 1.9935706853866577, "Full-pretrain/Loss (Raw)": 2.1941232681274414, "Full-pretrain/Step": 4516, "Full-pretrain/Step Time": 17.584670724347234} +{"Full-pretrain/Learning Rate": 2.833539663427319e-05, "Full-pretrain/Loss": 1.992672085762024, "Full-pretrain/Loss (Raw)": 2.2176060676574707, "Full-pretrain/Step": 4517, "Full-pretrain/Step Time": 17.58983468450606} +{"Full-pretrain/Learning Rate": 2.8326981557568622e-05, "Full-pretrain/Loss": 1.980412244796753, "Full-pretrain/Loss (Raw)": 1.653698444366455, "Full-pretrain/Step": 4518, "Full-pretrain/Step Time": 17.594892954453826} +{"Full-pretrain/Learning Rate": 2.831856609709789e-05, "Full-pretrain/Loss": 1.986688494682312, "Full-pretrain/Loss (Raw)": 1.8599168062210083, "Full-pretrain/Step": 4519, "Full-pretrain/Step Time": 17.591552022844553} +{"Full-pretrain/Learning Rate": 2.831015025383173e-05, "Full-pretrain/Loss": 1.9877692461013794, "Full-pretrain/Loss (Raw)": 1.9510713815689087, "Full-pretrain/Step": 4520, "Full-pretrain/Step Time": 17.595351388677955} +{"Full-pretrain/Learning Rate": 2.8301734028740905e-05, "Full-pretrain/Loss": 1.9915529489517212, "Full-pretrain/Loss (Raw)": 2.011655330657959, "Full-pretrain/Step": 4521, "Full-pretrain/Step Time": 17.59272602945566} +{"Full-pretrain/Learning Rate": 2.8293317422796217e-05, "Full-pretrain/Loss": 1.9794365167617798, "Full-pretrain/Loss (Raw)": 1.7100374698638916, "Full-pretrain/Step": 4522, "Full-pretrain/Step Time": 17.58835695683956} +{"Full-pretrain/Learning Rate": 2.8284900436968527e-05, "Full-pretrain/Loss": 1.9701147079467773, "Full-pretrain/Loss (Raw)": 2.051724433898926, "Full-pretrain/Step": 4523, "Full-pretrain/Step Time": 17.589414957910776} +{"Full-pretrain/Learning Rate": 2.8276483072228715e-05, "Full-pretrain/Loss": 1.9750407934188843, "Full-pretrain/Loss (Raw)": 1.8786723613739014, "Full-pretrain/Step": 4524, "Full-pretrain/Step Time": 17.591825414448977} +{"Full-pretrain/Learning Rate": 2.826806532954773e-05, "Full-pretrain/Loss": 1.9741129875183105, "Full-pretrain/Loss (Raw)": 2.063507556915283, "Full-pretrain/Step": 4525, "Full-pretrain/Step Time": 17.59447307139635} +{"Full-pretrain/Learning Rate": 2.8259647209896572e-05, "Full-pretrain/Loss": 1.9783316850662231, "Full-pretrain/Loss (Raw)": 1.8447072505950928, "Full-pretrain/Step": 4526, "Full-pretrain/Step Time": 17.593030204996467} +{"Full-pretrain/Learning Rate": 2.8251228714246246e-05, "Full-pretrain/Loss": 1.9739048480987549, "Full-pretrain/Loss (Raw)": 1.9431785345077515, "Full-pretrain/Step": 4527, "Full-pretrain/Step Time": 17.59252586774528} +{"Full-pretrain/Learning Rate": 2.824280984356783e-05, "Full-pretrain/Loss": 1.9729338884353638, "Full-pretrain/Loss (Raw)": 1.8667845726013184, "Full-pretrain/Step": 4528, "Full-pretrain/Step Time": 17.58992604725063} +{"Full-pretrain/Learning Rate": 2.8234390598832437e-05, "Full-pretrain/Loss": 1.9616913795471191, "Full-pretrain/Loss (Raw)": 1.659427523612976, "Full-pretrain/Step": 4529, "Full-pretrain/Step Time": 17.59106378443539} +{"Full-pretrain/Learning Rate": 2.8225970981011233e-05, "Full-pretrain/Loss": 1.965683937072754, "Full-pretrain/Loss (Raw)": 2.1950926780700684, "Full-pretrain/Step": 4530, "Full-pretrain/Step Time": 17.591913798823953} +{"Full-pretrain/Learning Rate": 2.821755099107541e-05, "Full-pretrain/Loss": 1.9573776721954346, "Full-pretrain/Loss (Raw)": 1.9572558403015137, "Full-pretrain/Step": 4531, "Full-pretrain/Step Time": 17.59685475938022} +{"Full-pretrain/Learning Rate": 2.82091306299962e-05, "Full-pretrain/Loss": 1.9417521953582764, "Full-pretrain/Loss (Raw)": 1.7730205059051514, "Full-pretrain/Step": 4532, "Full-pretrain/Step Time": 17.593192860484123} +{"Full-pretrain/Learning Rate": 2.8200709898744902e-05, "Full-pretrain/Loss": 1.9452130794525146, "Full-pretrain/Loss (Raw)": 1.9604945182800293, "Full-pretrain/Step": 4533, "Full-pretrain/Step Time": 17.590253150090575} +{"Full-pretrain/Learning Rate": 2.8192288798292847e-05, "Full-pretrain/Loss": 1.9600660800933838, "Full-pretrain/Loss (Raw)": 2.2308545112609863, "Full-pretrain/Step": 4534, "Full-pretrain/Step Time": 17.597606724128127} +{"Full-pretrain/Learning Rate": 2.8183867329611395e-05, "Full-pretrain/Loss": 1.9513075351715088, "Full-pretrain/Loss (Raw)": 1.6183130741119385, "Full-pretrain/Step": 4535, "Full-pretrain/Step Time": 17.59713370539248} +{"Full-pretrain/Learning Rate": 2.8175445493671972e-05, "Full-pretrain/Loss": 1.959191083908081, "Full-pretrain/Loss (Raw)": 2.073627471923828, "Full-pretrain/Step": 4536, "Full-pretrain/Step Time": 17.593714566901326} +{"Full-pretrain/Learning Rate": 2.8167023291446022e-05, "Full-pretrain/Loss": 1.9556794166564941, "Full-pretrain/Loss (Raw)": 1.9492342472076416, "Full-pretrain/Step": 4537, "Full-pretrain/Step Time": 17.598109619691968} +{"Full-pretrain/Learning Rate": 2.8158600723905055e-05, "Full-pretrain/Loss": 1.9542648792266846, "Full-pretrain/Loss (Raw)": 1.8639739751815796, "Full-pretrain/Step": 4538, "Full-pretrain/Step Time": 17.5978617798537} +{"Full-pretrain/Learning Rate": 2.8150177792020604e-05, "Full-pretrain/Loss": 1.9639477729797363, "Full-pretrain/Loss (Raw)": 2.1237683296203613, "Full-pretrain/Step": 4539, "Full-pretrain/Step Time": 17.59749398380518} +{"Full-pretrain/Learning Rate": 2.8141754496764244e-05, "Full-pretrain/Loss": 1.952575922012329, "Full-pretrain/Loss (Raw)": 1.8367443084716797, "Full-pretrain/Step": 4540, "Full-pretrain/Step Time": 17.596306772902608} +{"Full-pretrain/Learning Rate": 2.8133330839107608e-05, "Full-pretrain/Loss": 1.9599260091781616, "Full-pretrain/Loss (Raw)": 1.9775053262710571, "Full-pretrain/Step": 4541, "Full-pretrain/Step Time": 17.594192024320364} +{"Full-pretrain/Learning Rate": 2.8124906820022366e-05, "Full-pretrain/Loss": 1.9635789394378662, "Full-pretrain/Loss (Raw)": 2.1991934776306152, "Full-pretrain/Step": 4542, "Full-pretrain/Step Time": 17.595297027379274} +{"Full-pretrain/Learning Rate": 2.8116482440480218e-05, "Full-pretrain/Loss": 1.9608399868011475, "Full-pretrain/Loss (Raw)": 1.9316798448562622, "Full-pretrain/Step": 4543, "Full-pretrain/Step Time": 17.603375120088458} +{"Full-pretrain/Learning Rate": 2.8108057701452915e-05, "Full-pretrain/Loss": 1.9597556591033936, "Full-pretrain/Loss (Raw)": 1.9736329317092896, "Full-pretrain/Step": 4544, "Full-pretrain/Step Time": 17.600176464766264} +{"Full-pretrain/Learning Rate": 2.8099632603912247e-05, "Full-pretrain/Loss": 1.9606339931488037, "Full-pretrain/Loss (Raw)": 2.0584239959716797, "Full-pretrain/Step": 4545, "Full-pretrain/Step Time": 17.600663824006915} +{"Full-pretrain/Learning Rate": 2.8091207148830044e-05, "Full-pretrain/Loss": 1.9442723989486694, "Full-pretrain/Loss (Raw)": 1.5412132740020752, "Full-pretrain/Step": 4546, "Full-pretrain/Step Time": 17.607626624405384} +{"Full-pretrain/Learning Rate": 2.8082781337178195e-05, "Full-pretrain/Loss": 1.9405109882354736, "Full-pretrain/Loss (Raw)": 1.9262131452560425, "Full-pretrain/Step": 4547, "Full-pretrain/Step Time": 17.60465227253735} +{"Full-pretrain/Learning Rate": 2.8074355169928603e-05, "Full-pretrain/Loss": 1.9305751323699951, "Full-pretrain/Loss (Raw)": 1.8761767148971558, "Full-pretrain/Step": 4548, "Full-pretrain/Step Time": 17.598039841279387} +{"Full-pretrain/Learning Rate": 2.8065928648053207e-05, "Full-pretrain/Loss": 1.917346477508545, "Full-pretrain/Loss (Raw)": 1.7942912578582764, "Full-pretrain/Step": 4549, "Full-pretrain/Step Time": 17.598695050925016} +{"Full-pretrain/Learning Rate": 2.805750177252403e-05, "Full-pretrain/Loss": 1.9330761432647705, "Full-pretrain/Loss (Raw)": 2.1570420265197754, "Full-pretrain/Step": 4550, "Full-pretrain/Step Time": 17.605167020112276} +{"Full-pretrain/Learning Rate": 2.8049074544313094e-05, "Full-pretrain/Loss": 1.9334876537322998, "Full-pretrain/Loss (Raw)": 1.8730881214141846, "Full-pretrain/Step": 4551, "Full-pretrain/Step Time": 17.606529561802745} +{"Full-pretrain/Learning Rate": 2.8040646964392482e-05, "Full-pretrain/Loss": 1.9323976039886475, "Full-pretrain/Loss (Raw)": 1.9161909818649292, "Full-pretrain/Step": 4552, "Full-pretrain/Step Time": 17.605084827169776} +{"Full-pretrain/Learning Rate": 2.8032219033734308e-05, "Full-pretrain/Loss": 1.92741060256958, "Full-pretrain/Loss (Raw)": 1.8520698547363281, "Full-pretrain/Step": 4553, "Full-pretrain/Step Time": 17.60290190577507} +{"Full-pretrain/Learning Rate": 2.8023790753310737e-05, "Full-pretrain/Loss": 1.9331945180892944, "Full-pretrain/Loss (Raw)": 1.8951225280761719, "Full-pretrain/Step": 4554, "Full-pretrain/Step Time": 17.609854200854897} +{"Full-pretrain/Learning Rate": 2.8015362124093968e-05, "Full-pretrain/Loss": 1.9364187717437744, "Full-pretrain/Loss (Raw)": 2.1548995971679688, "Full-pretrain/Step": 4555, "Full-pretrain/Step Time": 17.613253900781274} +{"Full-pretrain/Learning Rate": 2.8006933147056234e-05, "Full-pretrain/Loss": 1.934436559677124, "Full-pretrain/Loss (Raw)": 1.8152440786361694, "Full-pretrain/Step": 4556, "Full-pretrain/Step Time": 17.609719451516867} +{"Full-pretrain/Learning Rate": 2.7998503823169818e-05, "Full-pretrain/Loss": 1.9338901042938232, "Full-pretrain/Loss (Raw)": 2.046016216278076, "Full-pretrain/Step": 4557, "Full-pretrain/Step Time": 17.611402543261647} +{"Full-pretrain/Learning Rate": 2.799007415340705e-05, "Full-pretrain/Loss": 1.9386478662490845, "Full-pretrain/Loss (Raw)": 1.9969606399536133, "Full-pretrain/Step": 4558, "Full-pretrain/Step Time": 17.616602243855596} +{"Full-pretrain/Learning Rate": 2.7981644138740267e-05, "Full-pretrain/Loss": 1.9394550323486328, "Full-pretrain/Loss (Raw)": 1.9690077304840088, "Full-pretrain/Step": 4559, "Full-pretrain/Step Time": 17.616004057228565} +{"Full-pretrain/Learning Rate": 2.7973213780141882e-05, "Full-pretrain/Loss": 1.9380452632904053, "Full-pretrain/Loss (Raw)": 1.8216725587844849, "Full-pretrain/Step": 4560, "Full-pretrain/Step Time": 17.621062092483044} +{"Full-pretrain/Learning Rate": 2.7964783078584333e-05, "Full-pretrain/Loss": 1.9513037204742432, "Full-pretrain/Loss (Raw)": 2.0836949348449707, "Full-pretrain/Step": 4561, "Full-pretrain/Step Time": 17.61328344233334} +{"Full-pretrain/Learning Rate": 2.7956352035040094e-05, "Full-pretrain/Loss": 1.948457956314087, "Full-pretrain/Loss (Raw)": 2.1040291786193848, "Full-pretrain/Step": 4562, "Full-pretrain/Step Time": 17.61424971744418} +{"Full-pretrain/Learning Rate": 2.7947920650481695e-05, "Full-pretrain/Loss": 1.9546799659729004, "Full-pretrain/Loss (Raw)": 2.156362533569336, "Full-pretrain/Step": 4563, "Full-pretrain/Step Time": 17.614401130005717} +{"Full-pretrain/Learning Rate": 2.7939488925881685e-05, "Full-pretrain/Loss": 1.9591492414474487, "Full-pretrain/Loss (Raw)": 1.916034460067749, "Full-pretrain/Step": 4564, "Full-pretrain/Step Time": 17.616795130074024} +{"Full-pretrain/Learning Rate": 2.7931056862212652e-05, "Full-pretrain/Loss": 1.9679651260375977, "Full-pretrain/Loss (Raw)": 2.2426013946533203, "Full-pretrain/Step": 4565, "Full-pretrain/Step Time": 17.617128625512123} +{"Full-pretrain/Learning Rate": 2.792262446044725e-05, "Full-pretrain/Loss": 1.972088098526001, "Full-pretrain/Loss (Raw)": 2.362791061401367, "Full-pretrain/Step": 4566, "Full-pretrain/Step Time": 17.618453783914447} +{"Full-pretrain/Learning Rate": 2.7914191721558135e-05, "Full-pretrain/Loss": 1.980276346206665, "Full-pretrain/Loss (Raw)": 1.8803398609161377, "Full-pretrain/Step": 4567, "Full-pretrain/Step Time": 17.615912279114127} +{"Full-pretrain/Learning Rate": 2.790575864651803e-05, "Full-pretrain/Loss": 1.9756335020065308, "Full-pretrain/Loss (Raw)": 1.925053358078003, "Full-pretrain/Step": 4568, "Full-pretrain/Step Time": 17.614747416228056} +{"Full-pretrain/Learning Rate": 2.7897325236299688e-05, "Full-pretrain/Loss": 1.9710941314697266, "Full-pretrain/Loss (Raw)": 1.8039758205413818, "Full-pretrain/Step": 4569, "Full-pretrain/Step Time": 17.621501725167036} +{"Full-pretrain/Learning Rate": 2.7888891491875897e-05, "Full-pretrain/Loss": 1.9703407287597656, "Full-pretrain/Loss (Raw)": 1.839863657951355, "Full-pretrain/Step": 4570, "Full-pretrain/Step Time": 17.620220471173525} +{"Full-pretrain/Learning Rate": 2.788045741421949e-05, "Full-pretrain/Loss": 1.970726490020752, "Full-pretrain/Loss (Raw)": 2.13611102104187, "Full-pretrain/Step": 4571, "Full-pretrain/Step Time": 17.62676097266376} +{"Full-pretrain/Learning Rate": 2.7872023004303337e-05, "Full-pretrain/Loss": 1.9778190851211548, "Full-pretrain/Loss (Raw)": 2.0637073516845703, "Full-pretrain/Step": 4572, "Full-pretrain/Step Time": 17.614517917856574} +{"Full-pretrain/Learning Rate": 2.786358826310034e-05, "Full-pretrain/Loss": 1.9761154651641846, "Full-pretrain/Loss (Raw)": 1.9229910373687744, "Full-pretrain/Step": 4573, "Full-pretrain/Step Time": 17.616602797061205} +{"Full-pretrain/Learning Rate": 2.7855153191583432e-05, "Full-pretrain/Loss": 1.9736806154251099, "Full-pretrain/Loss (Raw)": 2.121277093887329, "Full-pretrain/Step": 4574, "Full-pretrain/Step Time": 17.613652486354113} +{"Full-pretrain/Learning Rate": 2.7846717790725614e-05, "Full-pretrain/Loss": 1.9752315282821655, "Full-pretrain/Loss (Raw)": 1.981308102607727, "Full-pretrain/Step": 4575, "Full-pretrain/Step Time": 17.61687128804624} +{"Full-pretrain/Learning Rate": 2.78382820614999e-05, "Full-pretrain/Loss": 1.9797861576080322, "Full-pretrain/Loss (Raw)": 2.1193811893463135, "Full-pretrain/Step": 4576, "Full-pretrain/Step Time": 17.61273330450058} +{"Full-pretrain/Learning Rate": 2.7829846004879338e-05, "Full-pretrain/Loss": 1.9742608070373535, "Full-pretrain/Loss (Raw)": 1.8816152811050415, "Full-pretrain/Step": 4577, "Full-pretrain/Step Time": 17.623839804902673} +{"Full-pretrain/Learning Rate": 2.782140962183704e-05, "Full-pretrain/Loss": 2.0025110244750977, "Full-pretrain/Loss (Raw)": 2.445220947265625, "Full-pretrain/Step": 4578, "Full-pretrain/Step Time": 17.622520031407475} +{"Full-pretrain/Learning Rate": 2.781297291334614e-05, "Full-pretrain/Loss": 2.0010147094726562, "Full-pretrain/Loss (Raw)": 1.87832510471344, "Full-pretrain/Step": 4579, "Full-pretrain/Step Time": 17.62646677903831} +{"Full-pretrain/Learning Rate": 2.78045358803798e-05, "Full-pretrain/Loss": 2.0087366104125977, "Full-pretrain/Loss (Raw)": 2.123281955718994, "Full-pretrain/Step": 4580, "Full-pretrain/Step Time": 17.61493975110352} +{"Full-pretrain/Learning Rate": 2.779609852391123e-05, "Full-pretrain/Loss": 2.0225744247436523, "Full-pretrain/Loss (Raw)": 2.23710036277771, "Full-pretrain/Step": 4581, "Full-pretrain/Step Time": 17.618392812088132} +{"Full-pretrain/Learning Rate": 2.7787660844913676e-05, "Full-pretrain/Loss": 2.003126382827759, "Full-pretrain/Loss (Raw)": 1.5347033739089966, "Full-pretrain/Step": 4582, "Full-pretrain/Step Time": 17.615441298112273} +{"Full-pretrain/Learning Rate": 2.7779222844360426e-05, "Full-pretrain/Loss": 2.0094308853149414, "Full-pretrain/Loss (Raw)": 2.0748367309570312, "Full-pretrain/Step": 4583, "Full-pretrain/Step Time": 17.61273704096675} +{"Full-pretrain/Learning Rate": 2.7770784523224796e-05, "Full-pretrain/Loss": 1.9978601932525635, "Full-pretrain/Loss (Raw)": 1.545929193496704, "Full-pretrain/Step": 4584, "Full-pretrain/Step Time": 17.60837603546679} +{"Full-pretrain/Learning Rate": 2.7762345882480144e-05, "Full-pretrain/Loss": 1.9970946311950684, "Full-pretrain/Loss (Raw)": 1.827566385269165, "Full-pretrain/Step": 4585, "Full-pretrain/Step Time": 17.616713032126427} +{"Full-pretrain/Learning Rate": 2.7753906923099865e-05, "Full-pretrain/Loss": 1.9954296350479126, "Full-pretrain/Loss (Raw)": 1.8418463468551636, "Full-pretrain/Step": 4586, "Full-pretrain/Step Time": 17.613623209297657} +{"Full-pretrain/Learning Rate": 2.7745467646057393e-05, "Full-pretrain/Loss": 1.9903252124786377, "Full-pretrain/Loss (Raw)": 1.9915610551834106, "Full-pretrain/Step": 4587, "Full-pretrain/Step Time": 17.61090106330812} +{"Full-pretrain/Learning Rate": 2.7737028052326188e-05, "Full-pretrain/Loss": 1.9956462383270264, "Full-pretrain/Loss (Raw)": 1.9855151176452637, "Full-pretrain/Step": 4588, "Full-pretrain/Step Time": 17.605668000876904} +{"Full-pretrain/Learning Rate": 2.7728588142879762e-05, "Full-pretrain/Loss": 1.997187852859497, "Full-pretrain/Loss (Raw)": 2.095350742340088, "Full-pretrain/Step": 4589, "Full-pretrain/Step Time": 17.612240443006158} +{"Full-pretrain/Learning Rate": 2.7720147918691658e-05, "Full-pretrain/Loss": 2.003523588180542, "Full-pretrain/Loss (Raw)": 2.1997036933898926, "Full-pretrain/Step": 4590, "Full-pretrain/Step Time": 17.61647681519389} +{"Full-pretrain/Learning Rate": 2.771170738073544e-05, "Full-pretrain/Loss": 2.001502752304077, "Full-pretrain/Loss (Raw)": 1.9043376445770264, "Full-pretrain/Step": 4591, "Full-pretrain/Step Time": 17.62016241811216} +{"Full-pretrain/Learning Rate": 2.7703266529984734e-05, "Full-pretrain/Loss": 2.005295753479004, "Full-pretrain/Loss (Raw)": 1.9430493116378784, "Full-pretrain/Step": 4592, "Full-pretrain/Step Time": 17.612272664904594} +{"Full-pretrain/Learning Rate": 2.7694825367413178e-05, "Full-pretrain/Loss": 2.0024497509002686, "Full-pretrain/Loss (Raw)": 1.992625117301941, "Full-pretrain/Step": 4593, "Full-pretrain/Step Time": 17.614664524793625} +{"Full-pretrain/Learning Rate": 2.7686383893994473e-05, "Full-pretrain/Loss": 2.0016069412231445, "Full-pretrain/Loss (Raw)": 2.0770604610443115, "Full-pretrain/Step": 4594, "Full-pretrain/Step Time": 17.615955682471395} +{"Full-pretrain/Learning Rate": 2.767794211070232e-05, "Full-pretrain/Loss": 1.9985387325286865, "Full-pretrain/Loss (Raw)": 2.058173656463623, "Full-pretrain/Step": 4595, "Full-pretrain/Step Time": 17.614696146920323} +{"Full-pretrain/Learning Rate": 2.7669500018510485e-05, "Full-pretrain/Loss": 2.0042037963867188, "Full-pretrain/Loss (Raw)": 2.0973196029663086, "Full-pretrain/Step": 4596, "Full-pretrain/Step Time": 17.607037149369717} +{"Full-pretrain/Learning Rate": 2.7661057618392765e-05, "Full-pretrain/Loss": 1.9933922290802002, "Full-pretrain/Loss (Raw)": 1.8966281414031982, "Full-pretrain/Step": 4597, "Full-pretrain/Step Time": 17.611694265156984} +{"Full-pretrain/Learning Rate": 2.7652614911322987e-05, "Full-pretrain/Loss": 1.9794191122055054, "Full-pretrain/Loss (Raw)": 1.9156485795974731, "Full-pretrain/Step": 4598, "Full-pretrain/Step Time": 17.606591364368796} +{"Full-pretrain/Learning Rate": 2.7644171898275008e-05, "Full-pretrain/Loss": 1.986096978187561, "Full-pretrain/Loss (Raw)": 2.0940346717834473, "Full-pretrain/Step": 4599, "Full-pretrain/Step Time": 17.605285458266735} +{"Full-pretrain/Learning Rate": 2.763572858022273e-05, "Full-pretrain/Loss": 1.9934557676315308, "Full-pretrain/Loss (Raw)": 2.160531997680664, "Full-pretrain/Step": 4600, "Full-pretrain/Step Time": 17.600597605109215} +{"Full-pretrain/Learning Rate": 2.762728495814008e-05, "Full-pretrain/Loss": 1.99335777759552, "Full-pretrain/Loss (Raw)": 1.800844669342041, "Full-pretrain/Step": 4601, "Full-pretrain/Step Time": 17.602696562185884} +{"Full-pretrain/Learning Rate": 2.7618841033001047e-05, "Full-pretrain/Loss": 1.986982822418213, "Full-pretrain/Loss (Raw)": 1.6358637809753418, "Full-pretrain/Step": 4602, "Full-pretrain/Step Time": 17.603674359619617} +{"Full-pretrain/Learning Rate": 2.761039680577961e-05, "Full-pretrain/Loss": 1.9840493202209473, "Full-pretrain/Loss (Raw)": 2.0422396659851074, "Full-pretrain/Step": 4603, "Full-pretrain/Step Time": 17.607273062691092} +{"Full-pretrain/Learning Rate": 2.7601952277449816e-05, "Full-pretrain/Loss": 1.9817460775375366, "Full-pretrain/Loss (Raw)": 1.9900025129318237, "Full-pretrain/Step": 4604, "Full-pretrain/Step Time": 17.598224014043808} +{"Full-pretrain/Learning Rate": 2.759350744898575e-05, "Full-pretrain/Loss": 1.9814953804016113, "Full-pretrain/Loss (Raw)": 1.9149694442749023, "Full-pretrain/Step": 4605, "Full-pretrain/Step Time": 17.60493959672749} +{"Full-pretrain/Learning Rate": 2.7585062321361516e-05, "Full-pretrain/Loss": 1.9803340435028076, "Full-pretrain/Loss (Raw)": 2.0841145515441895, "Full-pretrain/Step": 4606, "Full-pretrain/Step Time": 17.606684172526002} +{"Full-pretrain/Learning Rate": 2.757661689555124e-05, "Full-pretrain/Loss": 1.9806429147720337, "Full-pretrain/Loss (Raw)": 1.9911915063858032, "Full-pretrain/Step": 4607, "Full-pretrain/Step Time": 17.610172791406512} +{"Full-pretrain/Learning Rate": 2.7568171172529118e-05, "Full-pretrain/Loss": 1.9681570529937744, "Full-pretrain/Loss (Raw)": 1.7198328971862793, "Full-pretrain/Step": 4608, "Full-pretrain/Step Time": 17.60170992463827} +{"Full-pretrain/Learning Rate": 2.7559725153269346e-05, "Full-pretrain/Loss": 1.9756081104278564, "Full-pretrain/Loss (Raw)": 2.1200480461120605, "Full-pretrain/Step": 4609, "Full-pretrain/Step Time": 17.602662831544876} +{"Full-pretrain/Learning Rate": 2.7551278838746185e-05, "Full-pretrain/Loss": 1.9565534591674805, "Full-pretrain/Loss (Raw)": 1.8354723453521729, "Full-pretrain/Step": 4610, "Full-pretrain/Step Time": 17.609283147379756} +{"Full-pretrain/Learning Rate": 2.75428322299339e-05, "Full-pretrain/Loss": 1.9539299011230469, "Full-pretrain/Loss (Raw)": 1.7943694591522217, "Full-pretrain/Step": 4611, "Full-pretrain/Step Time": 17.611439015716314} +{"Full-pretrain/Learning Rate": 2.753438532780681e-05, "Full-pretrain/Loss": 1.955751895904541, "Full-pretrain/Loss (Raw)": 2.181586265563965, "Full-pretrain/Step": 4612, "Full-pretrain/Step Time": 17.610829062759876} +{"Full-pretrain/Learning Rate": 2.7525938133339273e-05, "Full-pretrain/Loss": 1.9527618885040283, "Full-pretrain/Loss (Raw)": 2.1414215564727783, "Full-pretrain/Step": 4613, "Full-pretrain/Step Time": 17.606936926022172} +{"Full-pretrain/Learning Rate": 2.7517490647505658e-05, "Full-pretrain/Loss": 1.9632562398910522, "Full-pretrain/Loss (Raw)": 1.8705240488052368, "Full-pretrain/Step": 4614, "Full-pretrain/Step Time": 17.609492691233754} +{"Full-pretrain/Learning Rate": 2.7509042871280372e-05, "Full-pretrain/Loss": 1.9649274349212646, "Full-pretrain/Loss (Raw)": 2.128312587738037, "Full-pretrain/Step": 4615, "Full-pretrain/Step Time": 17.616654694080353} +{"Full-pretrain/Learning Rate": 2.750059480563788e-05, "Full-pretrain/Loss": 1.9766757488250732, "Full-pretrain/Loss (Raw)": 1.9218779802322388, "Full-pretrain/Step": 4616, "Full-pretrain/Step Time": 17.61265305429697} +{"Full-pretrain/Learning Rate": 2.7492146451552654e-05, "Full-pretrain/Loss": 1.984876036643982, "Full-pretrain/Loss (Raw)": 2.0899744033813477, "Full-pretrain/Step": 4617, "Full-pretrain/Step Time": 17.613560227677226} +{"Full-pretrain/Learning Rate": 2.7483697809999214e-05, "Full-pretrain/Loss": 1.977599859237671, "Full-pretrain/Loss (Raw)": 1.6090073585510254, "Full-pretrain/Step": 4618, "Full-pretrain/Step Time": 17.61549772322178} +{"Full-pretrain/Learning Rate": 2.74752488819521e-05, "Full-pretrain/Loss": 1.9761130809783936, "Full-pretrain/Loss (Raw)": 1.9439847469329834, "Full-pretrain/Step": 4619, "Full-pretrain/Step Time": 17.622073605656624} +{"Full-pretrain/Learning Rate": 2.7466799668385896e-05, "Full-pretrain/Loss": 1.9613654613494873, "Full-pretrain/Loss (Raw)": 1.5135934352874756, "Full-pretrain/Step": 4620, "Full-pretrain/Step Time": 17.620399734005332} +{"Full-pretrain/Learning Rate": 2.745835017027522e-05, "Full-pretrain/Loss": 1.9634745121002197, "Full-pretrain/Loss (Raw)": 2.1628386974334717, "Full-pretrain/Step": 4621, "Full-pretrain/Step Time": 17.627113768830895} +{"Full-pretrain/Learning Rate": 2.7449900388594718e-05, "Full-pretrain/Loss": 1.9483017921447754, "Full-pretrain/Loss (Raw)": 1.7141791582107544, "Full-pretrain/Step": 4622, "Full-pretrain/Step Time": 17.623699586838484} +{"Full-pretrain/Learning Rate": 2.7441450324319068e-05, "Full-pretrain/Loss": 1.9541345834732056, "Full-pretrain/Loss (Raw)": 2.0909831523895264, "Full-pretrain/Step": 4623, "Full-pretrain/Step Time": 17.629637917503715} +{"Full-pretrain/Learning Rate": 2.7432999978422974e-05, "Full-pretrain/Loss": 1.9513218402862549, "Full-pretrain/Loss (Raw)": 1.8530446290969849, "Full-pretrain/Step": 4624, "Full-pretrain/Step Time": 17.62686601281166} +{"Full-pretrain/Learning Rate": 2.7424549351881192e-05, "Full-pretrain/Loss": 1.9525055885314941, "Full-pretrain/Loss (Raw)": 2.030503749847412, "Full-pretrain/Step": 4625, "Full-pretrain/Step Time": 17.628770364448428} +{"Full-pretrain/Learning Rate": 2.7416098445668497e-05, "Full-pretrain/Loss": 1.949385643005371, "Full-pretrain/Loss (Raw)": 1.9772239923477173, "Full-pretrain/Step": 4626, "Full-pretrain/Step Time": 17.628578413277864} +{"Full-pretrain/Learning Rate": 2.740764726075969e-05, "Full-pretrain/Loss": 1.964741587638855, "Full-pretrain/Loss (Raw)": 2.549560546875, "Full-pretrain/Step": 4627, "Full-pretrain/Step Time": 17.62466593645513} +{"Full-pretrain/Learning Rate": 2.739919579812961e-05, "Full-pretrain/Loss": 1.964951753616333, "Full-pretrain/Loss (Raw)": 2.1040472984313965, "Full-pretrain/Step": 4628, "Full-pretrain/Step Time": 17.62996551580727} +{"Full-pretrain/Learning Rate": 2.7390744058753155e-05, "Full-pretrain/Loss": 1.9579737186431885, "Full-pretrain/Loss (Raw)": 1.673330545425415, "Full-pretrain/Step": 4629, "Full-pretrain/Step Time": 17.63004326634109} +{"Full-pretrain/Learning Rate": 2.7382292043605207e-05, "Full-pretrain/Loss": 1.9608510732650757, "Full-pretrain/Loss (Raw)": 2.007725715637207, "Full-pretrain/Step": 4630, "Full-pretrain/Step Time": 17.632759042084217} +{"Full-pretrain/Learning Rate": 2.7373839753660706e-05, "Full-pretrain/Loss": 1.9493408203125, "Full-pretrain/Loss (Raw)": 1.7257046699523926, "Full-pretrain/Step": 4631, "Full-pretrain/Step Time": 17.629815576598048} +{"Full-pretrain/Learning Rate": 2.7365387189894624e-05, "Full-pretrain/Loss": 1.9501633644104004, "Full-pretrain/Loss (Raw)": 2.186856746673584, "Full-pretrain/Step": 4632, "Full-pretrain/Step Time": 17.62642795406282} +{"Full-pretrain/Learning Rate": 2.735693435328196e-05, "Full-pretrain/Loss": 1.9603124856948853, "Full-pretrain/Loss (Raw)": 2.1256155967712402, "Full-pretrain/Step": 4633, "Full-pretrain/Step Time": 17.62810873053968} +{"Full-pretrain/Learning Rate": 2.7348481244797752e-05, "Full-pretrain/Loss": 1.966038703918457, "Full-pretrain/Loss (Raw)": 1.8191020488739014, "Full-pretrain/Step": 4634, "Full-pretrain/Step Time": 17.637626372277737} +{"Full-pretrain/Learning Rate": 2.7340027865417055e-05, "Full-pretrain/Loss": 1.9664027690887451, "Full-pretrain/Loss (Raw)": 2.053892135620117, "Full-pretrain/Step": 4635, "Full-pretrain/Step Time": 17.63542240485549} +{"Full-pretrain/Learning Rate": 2.7331574216114964e-05, "Full-pretrain/Loss": 1.9560166597366333, "Full-pretrain/Loss (Raw)": 1.6576462984085083, "Full-pretrain/Step": 4636, "Full-pretrain/Step Time": 17.63619697280228} +{"Full-pretrain/Learning Rate": 2.7323120297866604e-05, "Full-pretrain/Loss": 1.9534671306610107, "Full-pretrain/Loss (Raw)": 1.8333806991577148, "Full-pretrain/Step": 4637, "Full-pretrain/Step Time": 17.63447513245046} +{"Full-pretrain/Learning Rate": 2.731466611164714e-05, "Full-pretrain/Loss": 1.949123740196228, "Full-pretrain/Loss (Raw)": 1.945129156112671, "Full-pretrain/Step": 4638, "Full-pretrain/Step Time": 17.635938240215182} +{"Full-pretrain/Learning Rate": 2.730621165843175e-05, "Full-pretrain/Loss": 1.949358344078064, "Full-pretrain/Loss (Raw)": 1.9986975193023682, "Full-pretrain/Step": 4639, "Full-pretrain/Step Time": 17.637707885354757} +{"Full-pretrain/Learning Rate": 2.7297756939195662e-05, "Full-pretrain/Loss": 1.9692327976226807, "Full-pretrain/Loss (Raw)": 2.3558130264282227, "Full-pretrain/Step": 4640, "Full-pretrain/Step Time": 17.633195020258427} +{"Full-pretrain/Learning Rate": 2.728930195491411e-05, "Full-pretrain/Loss": 1.9610834121704102, "Full-pretrain/Loss (Raw)": 1.859266996383667, "Full-pretrain/Step": 4641, "Full-pretrain/Step Time": 17.64420584216714} +{"Full-pretrain/Learning Rate": 2.728084670656239e-05, "Full-pretrain/Loss": 1.9627774953842163, "Full-pretrain/Loss (Raw)": 1.8896842002868652, "Full-pretrain/Step": 4642, "Full-pretrain/Step Time": 17.647240752354264} +{"Full-pretrain/Learning Rate": 2.72723911951158e-05, "Full-pretrain/Loss": 1.9685587882995605, "Full-pretrain/Loss (Raw)": 1.979367971420288, "Full-pretrain/Step": 4643, "Full-pretrain/Step Time": 17.653733666986227} +{"Full-pretrain/Learning Rate": 2.7263935421549684e-05, "Full-pretrain/Loss": 1.960289478302002, "Full-pretrain/Loss (Raw)": 1.9169719219207764, "Full-pretrain/Step": 4644, "Full-pretrain/Step Time": 17.653415402397513} +{"Full-pretrain/Learning Rate": 2.725547938683941e-05, "Full-pretrain/Loss": 1.955811619758606, "Full-pretrain/Loss (Raw)": 1.9981287717819214, "Full-pretrain/Step": 4645, "Full-pretrain/Step Time": 17.65229255333543} +{"Full-pretrain/Learning Rate": 2.7247023091960376e-05, "Full-pretrain/Loss": 1.9600830078125, "Full-pretrain/Loss (Raw)": 2.0072054862976074, "Full-pretrain/Step": 4646, "Full-pretrain/Step Time": 17.650451125577092} +{"Full-pretrain/Learning Rate": 2.7238566537888033e-05, "Full-pretrain/Loss": 1.9524767398834229, "Full-pretrain/Loss (Raw)": 1.8849139213562012, "Full-pretrain/Step": 4647, "Full-pretrain/Step Time": 17.650181291624904} +{"Full-pretrain/Learning Rate": 2.7230109725597825e-05, "Full-pretrain/Loss": 1.9506056308746338, "Full-pretrain/Loss (Raw)": 1.8620072603225708, "Full-pretrain/Step": 4648, "Full-pretrain/Step Time": 17.644237898290157} +{"Full-pretrain/Learning Rate": 2.722165265606523e-05, "Full-pretrain/Loss": 1.9455482959747314, "Full-pretrain/Loss (Raw)": 1.9281370639801025, "Full-pretrain/Step": 4649, "Full-pretrain/Step Time": 17.64142125286162} +{"Full-pretrain/Learning Rate": 2.7213195330265795e-05, "Full-pretrain/Loss": 1.9519281387329102, "Full-pretrain/Loss (Raw)": 1.8131661415100098, "Full-pretrain/Step": 4650, "Full-pretrain/Step Time": 17.641888484358788} +{"Full-pretrain/Learning Rate": 2.7204737749175046e-05, "Full-pretrain/Loss": 1.9607958793640137, "Full-pretrain/Loss (Raw)": 2.227750062942505, "Full-pretrain/Step": 4651, "Full-pretrain/Step Time": 17.64946883544326} +{"Full-pretrain/Learning Rate": 2.7196279913768584e-05, "Full-pretrain/Loss": 1.9801019430160522, "Full-pretrain/Loss (Raw)": 2.131385564804077, "Full-pretrain/Step": 4652, "Full-pretrain/Step Time": 17.644051613286138} +{"Full-pretrain/Learning Rate": 2.7187821825021998e-05, "Full-pretrain/Loss": 1.974365234375, "Full-pretrain/Loss (Raw)": 1.9792675971984863, "Full-pretrain/Step": 4653, "Full-pretrain/Step Time": 17.642668655142188} +{"Full-pretrain/Learning Rate": 2.717936348391093e-05, "Full-pretrain/Loss": 1.9897358417510986, "Full-pretrain/Loss (Raw)": 2.2060375213623047, "Full-pretrain/Step": 4654, "Full-pretrain/Step Time": 17.64558458700776} +{"Full-pretrain/Learning Rate": 2.717090489141106e-05, "Full-pretrain/Loss": 1.9877017736434937, "Full-pretrain/Loss (Raw)": 2.0258898735046387, "Full-pretrain/Step": 4655, "Full-pretrain/Step Time": 17.64560932852328} +{"Full-pretrain/Learning Rate": 2.716244604849807e-05, "Full-pretrain/Loss": 1.9926388263702393, "Full-pretrain/Loss (Raw)": 2.0110297203063965, "Full-pretrain/Step": 4656, "Full-pretrain/Step Time": 17.645084884017706} +{"Full-pretrain/Learning Rate": 2.7153986956147687e-05, "Full-pretrain/Loss": 1.9853897094726562, "Full-pretrain/Loss (Raw)": 1.7985363006591797, "Full-pretrain/Step": 4657, "Full-pretrain/Step Time": 17.64837745577097} +{"Full-pretrain/Learning Rate": 2.7145527615335663e-05, "Full-pretrain/Loss": 1.9829950332641602, "Full-pretrain/Loss (Raw)": 1.9005908966064453, "Full-pretrain/Step": 4658, "Full-pretrain/Step Time": 17.645905882120132} +{"Full-pretrain/Learning Rate": 2.7137068027037787e-05, "Full-pretrain/Loss": 1.9540863037109375, "Full-pretrain/Loss (Raw)": 1.6244841814041138, "Full-pretrain/Step": 4659, "Full-pretrain/Step Time": 17.646834637969732} +{"Full-pretrain/Learning Rate": 2.7128608192229867e-05, "Full-pretrain/Loss": 1.9467182159423828, "Full-pretrain/Loss (Raw)": 1.8682661056518555, "Full-pretrain/Step": 4660, "Full-pretrain/Step Time": 17.645798318088055} +{"Full-pretrain/Learning Rate": 2.7120148111887732e-05, "Full-pretrain/Loss": 1.9483327865600586, "Full-pretrain/Loss (Raw)": 1.7249963283538818, "Full-pretrain/Step": 4661, "Full-pretrain/Step Time": 17.644268224015832} +{"Full-pretrain/Learning Rate": 2.711168778698726e-05, "Full-pretrain/Loss": 1.9436324834823608, "Full-pretrain/Loss (Raw)": 1.857317328453064, "Full-pretrain/Step": 4662, "Full-pretrain/Step Time": 17.643824376165867} +{"Full-pretrain/Learning Rate": 2.7103227218504345e-05, "Full-pretrain/Loss": 1.9590673446655273, "Full-pretrain/Loss (Raw)": 2.219616174697876, "Full-pretrain/Step": 4663, "Full-pretrain/Step Time": 17.64285912923515} +{"Full-pretrain/Learning Rate": 2.7094766407414917e-05, "Full-pretrain/Loss": 1.9425113201141357, "Full-pretrain/Loss (Raw)": 1.6570677757263184, "Full-pretrain/Step": 4664, "Full-pretrain/Step Time": 17.65244448930025} +{"Full-pretrain/Learning Rate": 2.7086305354694907e-05, "Full-pretrain/Loss": 1.9413020610809326, "Full-pretrain/Loss (Raw)": 2.086916923522949, "Full-pretrain/Step": 4665, "Full-pretrain/Step Time": 17.643821068108082} +{"Full-pretrain/Learning Rate": 2.7077844061320317e-05, "Full-pretrain/Loss": 1.960137128829956, "Full-pretrain/Loss (Raw)": 2.4218263626098633, "Full-pretrain/Step": 4666, "Full-pretrain/Step Time": 17.64663876220584} +{"Full-pretrain/Learning Rate": 2.706938252826714e-05, "Full-pretrain/Loss": 1.9541295766830444, "Full-pretrain/Loss (Raw)": 1.8616502285003662, "Full-pretrain/Step": 4667, "Full-pretrain/Step Time": 17.64607542566955} +{"Full-pretrain/Learning Rate": 2.7060920756511422e-05, "Full-pretrain/Loss": 1.9690240621566772, "Full-pretrain/Loss (Raw)": 2.1342720985412598, "Full-pretrain/Step": 4668, "Full-pretrain/Step Time": 17.654295038431883} +{"Full-pretrain/Learning Rate": 2.705245874702921e-05, "Full-pretrain/Loss": 1.968416452407837, "Full-pretrain/Loss (Raw)": 1.8139351606369019, "Full-pretrain/Step": 4669, "Full-pretrain/Step Time": 17.649983774870634} +{"Full-pretrain/Learning Rate": 2.7043996500796605e-05, "Full-pretrain/Loss": 1.9634209871292114, "Full-pretrain/Loss (Raw)": 1.785273790359497, "Full-pretrain/Step": 4670, "Full-pretrain/Step Time": 17.647273229435086} +{"Full-pretrain/Learning Rate": 2.703553401878972e-05, "Full-pretrain/Loss": 1.9591881036758423, "Full-pretrain/Loss (Raw)": 1.863248586654663, "Full-pretrain/Step": 4671, "Full-pretrain/Step Time": 17.639502422884107} +{"Full-pretrain/Learning Rate": 2.7027071301984713e-05, "Full-pretrain/Loss": 1.9416600465774536, "Full-pretrain/Loss (Raw)": 1.7949144840240479, "Full-pretrain/Step": 4672, "Full-pretrain/Step Time": 17.6450831964612} +{"Full-pretrain/Learning Rate": 2.701860835135773e-05, "Full-pretrain/Loss": 1.9407591819763184, "Full-pretrain/Loss (Raw)": 1.8304407596588135, "Full-pretrain/Step": 4673, "Full-pretrain/Step Time": 17.640039013698697} +{"Full-pretrain/Learning Rate": 2.7010145167884994e-05, "Full-pretrain/Loss": 1.9330203533172607, "Full-pretrain/Loss (Raw)": 1.6420419216156006, "Full-pretrain/Step": 4674, "Full-pretrain/Step Time": 17.64361753128469} +{"Full-pretrain/Learning Rate": 2.7001681752542713e-05, "Full-pretrain/Loss": 1.9325966835021973, "Full-pretrain/Loss (Raw)": 1.9658074378967285, "Full-pretrain/Step": 4675, "Full-pretrain/Step Time": 17.639047546312213} +{"Full-pretrain/Learning Rate": 2.6993218106307145e-05, "Full-pretrain/Loss": 1.9469351768493652, "Full-pretrain/Loss (Raw)": 2.375807523727417, "Full-pretrain/Step": 4676, "Full-pretrain/Step Time": 17.6463016923517} +{"Full-pretrain/Learning Rate": 2.698475423015457e-05, "Full-pretrain/Loss": 1.9440572261810303, "Full-pretrain/Loss (Raw)": 1.9060328006744385, "Full-pretrain/Step": 4677, "Full-pretrain/Step Time": 17.646997541189194} +{"Full-pretrain/Learning Rate": 2.6976290125061288e-05, "Full-pretrain/Loss": 1.945683240890503, "Full-pretrain/Loss (Raw)": 2.0592353343963623, "Full-pretrain/Step": 4678, "Full-pretrain/Step Time": 17.643229819834232} +{"Full-pretrain/Learning Rate": 2.6967825792003644e-05, "Full-pretrain/Loss": 1.9465348720550537, "Full-pretrain/Loss (Raw)": 1.9121679067611694, "Full-pretrain/Step": 4679, "Full-pretrain/Step Time": 17.640256691724062} +{"Full-pretrain/Learning Rate": 2.6959361231957975e-05, "Full-pretrain/Loss": 1.9463441371917725, "Full-pretrain/Loss (Raw)": 1.8559056520462036, "Full-pretrain/Step": 4680, "Full-pretrain/Step Time": 17.6427009254694} +{"Full-pretrain/Learning Rate": 2.6950896445900687e-05, "Full-pretrain/Loss": 1.9333306550979614, "Full-pretrain/Loss (Raw)": 1.5117027759552002, "Full-pretrain/Step": 4681, "Full-pretrain/Step Time": 17.641746217384934} +{"Full-pretrain/Learning Rate": 2.694243143480818e-05, "Full-pretrain/Loss": 1.9390220642089844, "Full-pretrain/Loss (Raw)": 1.9952929019927979, "Full-pretrain/Step": 4682, "Full-pretrain/Step Time": 17.64056094735861} +{"Full-pretrain/Learning Rate": 2.693396619965688e-05, "Full-pretrain/Loss": 1.9288486242294312, "Full-pretrain/Loss (Raw)": 1.90220046043396, "Full-pretrain/Step": 4683, "Full-pretrain/Step Time": 17.64159221202135} +{"Full-pretrain/Learning Rate": 2.6925500741423265e-05, "Full-pretrain/Loss": 1.918993353843689, "Full-pretrain/Loss (Raw)": 1.8160123825073242, "Full-pretrain/Step": 4684, "Full-pretrain/Step Time": 17.649623634293675} +{"Full-pretrain/Learning Rate": 2.691703506108381e-05, "Full-pretrain/Loss": 1.917803406715393, "Full-pretrain/Loss (Raw)": 1.941190481185913, "Full-pretrain/Step": 4685, "Full-pretrain/Step Time": 17.64883140847087} +{"Full-pretrain/Learning Rate": 2.6908569159615038e-05, "Full-pretrain/Loss": 1.9092391729354858, "Full-pretrain/Loss (Raw)": 1.9319816827774048, "Full-pretrain/Step": 4686, "Full-pretrain/Step Time": 17.646355560049415} +{"Full-pretrain/Learning Rate": 2.6900103037993492e-05, "Full-pretrain/Loss": 1.9064395427703857, "Full-pretrain/Loss (Raw)": 1.9363012313842773, "Full-pretrain/Step": 4687, "Full-pretrain/Step Time": 17.644393717870116} +{"Full-pretrain/Learning Rate": 2.6891636697195716e-05, "Full-pretrain/Loss": 1.9065284729003906, "Full-pretrain/Loss (Raw)": 2.01387619972229, "Full-pretrain/Step": 4688, "Full-pretrain/Step Time": 17.638179156929255} +{"Full-pretrain/Learning Rate": 2.6883170138198323e-05, "Full-pretrain/Loss": 1.9155395030975342, "Full-pretrain/Loss (Raw)": 2.0868897438049316, "Full-pretrain/Step": 4689, "Full-pretrain/Step Time": 17.648323414847255} +{"Full-pretrain/Learning Rate": 2.687470336197791e-05, "Full-pretrain/Loss": 1.914847493171692, "Full-pretrain/Loss (Raw)": 1.8784446716308594, "Full-pretrain/Step": 4690, "Full-pretrain/Step Time": 17.64952990040183} +{"Full-pretrain/Learning Rate": 2.6866236369511122e-05, "Full-pretrain/Loss": 1.9287831783294678, "Full-pretrain/Loss (Raw)": 2.070425510406494, "Full-pretrain/Step": 4691, "Full-pretrain/Step Time": 17.6474425829947} +{"Full-pretrain/Learning Rate": 2.6857769161774627e-05, "Full-pretrain/Loss": 1.935521125793457, "Full-pretrain/Loss (Raw)": 2.0838842391967773, "Full-pretrain/Step": 4692, "Full-pretrain/Step Time": 17.64410217665136} +{"Full-pretrain/Learning Rate": 2.6849301739745108e-05, "Full-pretrain/Loss": 1.944199562072754, "Full-pretrain/Loss (Raw)": 2.0027048587799072, "Full-pretrain/Step": 4693, "Full-pretrain/Step Time": 17.644505754113197} +{"Full-pretrain/Learning Rate": 2.6840834104399293e-05, "Full-pretrain/Loss": 1.9504247903823853, "Full-pretrain/Loss (Raw)": 2.0565249919891357, "Full-pretrain/Step": 4694, "Full-pretrain/Step Time": 17.64360356889665} +{"Full-pretrain/Learning Rate": 2.68323662567139e-05, "Full-pretrain/Loss": 1.9316537380218506, "Full-pretrain/Loss (Raw)": 1.618943691253662, "Full-pretrain/Step": 4695, "Full-pretrain/Step Time": 17.640454687178135} +{"Full-pretrain/Learning Rate": 2.6823898197665703e-05, "Full-pretrain/Loss": 1.943321704864502, "Full-pretrain/Loss (Raw)": 2.0304431915283203, "Full-pretrain/Step": 4696, "Full-pretrain/Step Time": 17.642816001549363} +{"Full-pretrain/Learning Rate": 2.68154299282315e-05, "Full-pretrain/Loss": 1.9393478631973267, "Full-pretrain/Loss (Raw)": 1.9597513675689697, "Full-pretrain/Step": 4697, "Full-pretrain/Step Time": 17.64196864888072} +{"Full-pretrain/Learning Rate": 2.680696144938809e-05, "Full-pretrain/Loss": 1.9333083629608154, "Full-pretrain/Loss (Raw)": 2.2285637855529785, "Full-pretrain/Step": 4698, "Full-pretrain/Step Time": 17.643867203965783} +{"Full-pretrain/Learning Rate": 2.6798492762112303e-05, "Full-pretrain/Loss": 1.9356334209442139, "Full-pretrain/Loss (Raw)": 1.9360522031784058, "Full-pretrain/Step": 4699, "Full-pretrain/Step Time": 17.639199366793036} +{"Full-pretrain/Learning Rate": 2.679002386738102e-05, "Full-pretrain/Loss": 1.9376018047332764, "Full-pretrain/Loss (Raw)": 2.1972570419311523, "Full-pretrain/Step": 4700, "Full-pretrain/Step Time": 17.64340563490987} +{"Full-pretrain/Learning Rate": 2.67815547661711e-05, "Full-pretrain/Loss": 1.9471255540847778, "Full-pretrain/Loss (Raw)": 2.1186976432800293, "Full-pretrain/Step": 4701, "Full-pretrain/Step Time": 17.6466874293983} +{"Full-pretrain/Learning Rate": 2.677308545945948e-05, "Full-pretrain/Loss": 1.9570629596710205, "Full-pretrain/Loss (Raw)": 2.1032700538635254, "Full-pretrain/Step": 4702, "Full-pretrain/Step Time": 17.65321619808674} +{"Full-pretrain/Learning Rate": 2.676461594822306e-05, "Full-pretrain/Loss": 1.9640791416168213, "Full-pretrain/Loss (Raw)": 2.08776593208313, "Full-pretrain/Step": 4703, "Full-pretrain/Step Time": 17.648643342778087} +{"Full-pretrain/Learning Rate": 2.6756146233438816e-05, "Full-pretrain/Loss": 1.9707515239715576, "Full-pretrain/Loss (Raw)": 2.008431911468506, "Full-pretrain/Step": 4704, "Full-pretrain/Step Time": 17.64042286761105} +{"Full-pretrain/Learning Rate": 2.6747676316083726e-05, "Full-pretrain/Loss": 1.987000584602356, "Full-pretrain/Loss (Raw)": 2.3504114151000977, "Full-pretrain/Step": 4705, "Full-pretrain/Step Time": 17.641739709302783} +{"Full-pretrain/Learning Rate": 2.673920619713478e-05, "Full-pretrain/Loss": 1.9919681549072266, "Full-pretrain/Loss (Raw)": 1.8010034561157227, "Full-pretrain/Step": 4706, "Full-pretrain/Step Time": 17.64592290110886} +{"Full-pretrain/Learning Rate": 2.6730735877569014e-05, "Full-pretrain/Loss": 1.9962530136108398, "Full-pretrain/Loss (Raw)": 2.102926254272461, "Full-pretrain/Step": 4707, "Full-pretrain/Step Time": 17.646559350192547} +{"Full-pretrain/Learning Rate": 2.6722265358363473e-05, "Full-pretrain/Loss": 1.9835245609283447, "Full-pretrain/Loss (Raw)": 1.9684962034225464, "Full-pretrain/Step": 4708, "Full-pretrain/Step Time": 17.649114962667227} +{"Full-pretrain/Learning Rate": 2.6713794640495227e-05, "Full-pretrain/Loss": 1.9876035451889038, "Full-pretrain/Loss (Raw)": 2.0365583896636963, "Full-pretrain/Step": 4709, "Full-pretrain/Step Time": 17.64960952475667} +{"Full-pretrain/Learning Rate": 2.6705323724941374e-05, "Full-pretrain/Loss": 1.9813734292984009, "Full-pretrain/Loss (Raw)": 1.8598713874816895, "Full-pretrain/Step": 4710, "Full-pretrain/Step Time": 17.6587874032557} +{"Full-pretrain/Learning Rate": 2.6696852612679023e-05, "Full-pretrain/Loss": 1.9807746410369873, "Full-pretrain/Loss (Raw)": 1.8930070400238037, "Full-pretrain/Step": 4711, "Full-pretrain/Step Time": 17.662304926663637} +{"Full-pretrain/Learning Rate": 2.668838130468532e-05, "Full-pretrain/Loss": 1.98060941696167, "Full-pretrain/Loss (Raw)": 1.8506156206130981, "Full-pretrain/Step": 4712, "Full-pretrain/Step Time": 17.6583017334342} +{"Full-pretrain/Learning Rate": 2.667990980193743e-05, "Full-pretrain/Loss": 2.000615119934082, "Full-pretrain/Loss (Raw)": 2.1518871784210205, "Full-pretrain/Step": 4713, "Full-pretrain/Step Time": 17.66199859790504} +{"Full-pretrain/Learning Rate": 2.667143810541254e-05, "Full-pretrain/Loss": 1.9982753992080688, "Full-pretrain/Loss (Raw)": 1.9204190969467163, "Full-pretrain/Step": 4714, "Full-pretrain/Step Time": 17.667061677202582} +{"Full-pretrain/Learning Rate": 2.666296621608784e-05, "Full-pretrain/Loss": 1.9956026077270508, "Full-pretrain/Loss (Raw)": 1.816670536994934, "Full-pretrain/Step": 4715, "Full-pretrain/Step Time": 17.66919009387493} +{"Full-pretrain/Learning Rate": 2.6654494134940582e-05, "Full-pretrain/Loss": 2.0003700256347656, "Full-pretrain/Loss (Raw)": 1.9685657024383545, "Full-pretrain/Step": 4716, "Full-pretrain/Step Time": 17.66940287873149} +{"Full-pretrain/Learning Rate": 2.6646021862948e-05, "Full-pretrain/Loss": 2.0002212524414062, "Full-pretrain/Loss (Raw)": 1.9364374876022339, "Full-pretrain/Step": 4717, "Full-pretrain/Step Time": 17.66872614622116} +{"Full-pretrain/Learning Rate": 2.663754940108738e-05, "Full-pretrain/Loss": 2.003392219543457, "Full-pretrain/Loss (Raw)": 2.033449411392212, "Full-pretrain/Step": 4718, "Full-pretrain/Step Time": 17.669602328911424} +{"Full-pretrain/Learning Rate": 2.6629076750336008e-05, "Full-pretrain/Loss": 1.9848527908325195, "Full-pretrain/Loss (Raw)": 1.3430376052856445, "Full-pretrain/Step": 4719, "Full-pretrain/Step Time": 17.664516385644674} +{"Full-pretrain/Learning Rate": 2.66206039116712e-05, "Full-pretrain/Loss": 1.9846473932266235, "Full-pretrain/Loss (Raw)": 2.007305860519409, "Full-pretrain/Step": 4720, "Full-pretrain/Step Time": 17.666113309562206} +{"Full-pretrain/Learning Rate": 2.6612130886070315e-05, "Full-pretrain/Loss": 1.9878907203674316, "Full-pretrain/Loss (Raw)": 2.1906795501708984, "Full-pretrain/Step": 4721, "Full-pretrain/Step Time": 17.671444538980722} +{"Full-pretrain/Learning Rate": 2.6603657674510686e-05, "Full-pretrain/Loss": 1.990283489227295, "Full-pretrain/Loss (Raw)": 1.9550113677978516, "Full-pretrain/Step": 4722, "Full-pretrain/Step Time": 17.670733470469713} +{"Full-pretrain/Learning Rate": 2.6595184277969713e-05, "Full-pretrain/Loss": 1.9869043827056885, "Full-pretrain/Loss (Raw)": 1.9622975587844849, "Full-pretrain/Step": 4723, "Full-pretrain/Step Time": 17.676247339695692} +{"Full-pretrain/Learning Rate": 2.65867106974248e-05, "Full-pretrain/Loss": 1.97927725315094, "Full-pretrain/Loss (Raw)": 1.8398163318634033, "Full-pretrain/Step": 4724, "Full-pretrain/Step Time": 17.675404213368893} +{"Full-pretrain/Learning Rate": 2.657823693385335e-05, "Full-pretrain/Loss": 1.977868914604187, "Full-pretrain/Loss (Raw)": 1.9576351642608643, "Full-pretrain/Step": 4725, "Full-pretrain/Step Time": 17.67177689447999} +{"Full-pretrain/Learning Rate": 2.656976298823284e-05, "Full-pretrain/Loss": 1.9761478900909424, "Full-pretrain/Loss (Raw)": 2.0014538764953613, "Full-pretrain/Step": 4726, "Full-pretrain/Step Time": 17.676428889855742} +{"Full-pretrain/Learning Rate": 2.656128886154071e-05, "Full-pretrain/Loss": 1.9823108911514282, "Full-pretrain/Loss (Raw)": 1.8161606788635254, "Full-pretrain/Step": 4727, "Full-pretrain/Step Time": 17.679042011499405} +{"Full-pretrain/Learning Rate": 2.6552814554754463e-05, "Full-pretrain/Loss": 1.9650068283081055, "Full-pretrain/Loss (Raw)": 1.476710557937622, "Full-pretrain/Step": 4728, "Full-pretrain/Step Time": 17.679747773334384} +{"Full-pretrain/Learning Rate": 2.6544340068851604e-05, "Full-pretrain/Loss": 1.9626619815826416, "Full-pretrain/Loss (Raw)": 1.88471519947052, "Full-pretrain/Step": 4729, "Full-pretrain/Step Time": 17.676978709176183} +{"Full-pretrain/Learning Rate": 2.6535865404809658e-05, "Full-pretrain/Loss": 1.9466118812561035, "Full-pretrain/Loss (Raw)": 1.7149640321731567, "Full-pretrain/Step": 4730, "Full-pretrain/Step Time": 17.68002856709063} +{"Full-pretrain/Learning Rate": 2.652739056360618e-05, "Full-pretrain/Loss": 1.9519693851470947, "Full-pretrain/Loss (Raw)": 2.107489585876465, "Full-pretrain/Step": 4731, "Full-pretrain/Step Time": 17.677762620151043} +{"Full-pretrain/Learning Rate": 2.6518915546218736e-05, "Full-pretrain/Loss": 1.938166856765747, "Full-pretrain/Loss (Raw)": 1.7555756568908691, "Full-pretrain/Step": 4732, "Full-pretrain/Step Time": 17.67743046581745} +{"Full-pretrain/Learning Rate": 2.6510440353624914e-05, "Full-pretrain/Loss": 1.9404100179672241, "Full-pretrain/Loss (Raw)": 2.1904799938201904, "Full-pretrain/Step": 4733, "Full-pretrain/Step Time": 17.667869068682194} +{"Full-pretrain/Learning Rate": 2.650196498680234e-05, "Full-pretrain/Loss": 1.9368393421173096, "Full-pretrain/Loss (Raw)": 1.9890083074569702, "Full-pretrain/Step": 4734, "Full-pretrain/Step Time": 17.673798870295286} +{"Full-pretrain/Learning Rate": 2.649348944672862e-05, "Full-pretrain/Loss": 1.930274486541748, "Full-pretrain/Loss (Raw)": 1.8776918649673462, "Full-pretrain/Step": 4735, "Full-pretrain/Step Time": 17.66831947118044} +{"Full-pretrain/Learning Rate": 2.648501373438142e-05, "Full-pretrain/Loss": 1.9295130968093872, "Full-pretrain/Loss (Raw)": 1.9840667247772217, "Full-pretrain/Step": 4736, "Full-pretrain/Step Time": 17.672450713813305} +{"Full-pretrain/Learning Rate": 2.647653785073841e-05, "Full-pretrain/Loss": 1.919724702835083, "Full-pretrain/Loss (Raw)": 2.0371809005737305, "Full-pretrain/Step": 4737, "Full-pretrain/Step Time": 17.668685095384717} +{"Full-pretrain/Learning Rate": 2.6468061796777278e-05, "Full-pretrain/Loss": 1.9282279014587402, "Full-pretrain/Loss (Raw)": 2.0731067657470703, "Full-pretrain/Step": 4738, "Full-pretrain/Step Time": 17.663077902048826} +{"Full-pretrain/Learning Rate": 2.645958557347573e-05, "Full-pretrain/Loss": 1.9185246229171753, "Full-pretrain/Loss (Raw)": 1.792421579360962, "Full-pretrain/Step": 4739, "Full-pretrain/Step Time": 17.664050921797752} +{"Full-pretrain/Learning Rate": 2.6451109181811505e-05, "Full-pretrain/Loss": 1.9206774234771729, "Full-pretrain/Loss (Raw)": 2.0373854637145996, "Full-pretrain/Step": 4740, "Full-pretrain/Step Time": 17.666036497801542} +{"Full-pretrain/Learning Rate": 2.6442632622762344e-05, "Full-pretrain/Loss": 1.92429518699646, "Full-pretrain/Loss (Raw)": 2.15232515335083, "Full-pretrain/Step": 4741, "Full-pretrain/Step Time": 17.667527129873633} +{"Full-pretrain/Learning Rate": 2.6434155897306018e-05, "Full-pretrain/Loss": 1.9181180000305176, "Full-pretrain/Loss (Raw)": 1.6622047424316406, "Full-pretrain/Step": 4742, "Full-pretrain/Step Time": 17.67034720443189} +{"Full-pretrain/Learning Rate": 2.6425679006420306e-05, "Full-pretrain/Loss": 1.923370361328125, "Full-pretrain/Loss (Raw)": 2.0610809326171875, "Full-pretrain/Step": 4743, "Full-pretrain/Step Time": 17.667299918830395} +{"Full-pretrain/Learning Rate": 2.6417201951083025e-05, "Full-pretrain/Loss": 1.924451470375061, "Full-pretrain/Loss (Raw)": 1.8852112293243408, "Full-pretrain/Step": 4744, "Full-pretrain/Step Time": 17.668512478470802} +{"Full-pretrain/Learning Rate": 2.6408724732272e-05, "Full-pretrain/Loss": 1.9043903350830078, "Full-pretrain/Loss (Raw)": 1.50993013381958, "Full-pretrain/Step": 4745, "Full-pretrain/Step Time": 17.664415672421455} +{"Full-pretrain/Learning Rate": 2.640024735096507e-05, "Full-pretrain/Loss": 1.9050477743148804, "Full-pretrain/Loss (Raw)": 1.9414587020874023, "Full-pretrain/Step": 4746, "Full-pretrain/Step Time": 17.659399090334773} +{"Full-pretrain/Learning Rate": 2.63917698081401e-05, "Full-pretrain/Loss": 1.9043042659759521, "Full-pretrain/Loss (Raw)": 1.7928776741027832, "Full-pretrain/Step": 4747, "Full-pretrain/Step Time": 17.659138649702072} +{"Full-pretrain/Learning Rate": 2.6383292104774977e-05, "Full-pretrain/Loss": 1.9014862775802612, "Full-pretrain/Loss (Raw)": 1.8783900737762451, "Full-pretrain/Step": 4748, "Full-pretrain/Step Time": 17.659617057070136} +{"Full-pretrain/Learning Rate": 2.6374814241847583e-05, "Full-pretrain/Loss": 1.8995089530944824, "Full-pretrain/Loss (Raw)": 1.8731637001037598, "Full-pretrain/Step": 4749, "Full-pretrain/Step Time": 17.65058155171573} +{"Full-pretrain/Learning Rate": 2.6366336220335862e-05, "Full-pretrain/Loss": 1.9086406230926514, "Full-pretrain/Loss (Raw)": 2.3256635665893555, "Full-pretrain/Step": 4750, "Full-pretrain/Step Time": 17.659898590296507} +{"Full-pretrain/Learning Rate": 2.635785804121773e-05, "Full-pretrain/Loss": 1.9348554611206055, "Full-pretrain/Loss (Raw)": 2.181910753250122, "Full-pretrain/Step": 4751, "Full-pretrain/Step Time": 17.65807005390525} +{"Full-pretrain/Learning Rate": 2.6349379705471155e-05, "Full-pretrain/Loss": 1.9313932657241821, "Full-pretrain/Loss (Raw)": 1.8965144157409668, "Full-pretrain/Step": 4752, "Full-pretrain/Step Time": 17.655931951478124} +{"Full-pretrain/Learning Rate": 2.6340901214074103e-05, "Full-pretrain/Loss": 1.9293895959854126, "Full-pretrain/Loss (Raw)": 2.1265652179718018, "Full-pretrain/Step": 4753, "Full-pretrain/Step Time": 17.65533726476133} +{"Full-pretrain/Learning Rate": 2.6332422568004566e-05, "Full-pretrain/Loss": 1.9296953678131104, "Full-pretrain/Loss (Raw)": 1.9647953510284424, "Full-pretrain/Step": 4754, "Full-pretrain/Step Time": 17.660532113164663} +{"Full-pretrain/Learning Rate": 2.632394376824056e-05, "Full-pretrain/Loss": 1.9267287254333496, "Full-pretrain/Loss (Raw)": 1.8673632144927979, "Full-pretrain/Step": 4755, "Full-pretrain/Step Time": 17.667605467140675} +{"Full-pretrain/Learning Rate": 2.6315464815760105e-05, "Full-pretrain/Loss": 1.9357144832611084, "Full-pretrain/Loss (Raw)": 2.1273579597473145, "Full-pretrain/Step": 4756, "Full-pretrain/Step Time": 17.663616029545665} +{"Full-pretrain/Learning Rate": 2.6306985711541238e-05, "Full-pretrain/Loss": 1.9368821382522583, "Full-pretrain/Loss (Raw)": 1.9950042963027954, "Full-pretrain/Step": 4757, "Full-pretrain/Step Time": 17.659043420106173} +{"Full-pretrain/Learning Rate": 2.629850645656204e-05, "Full-pretrain/Loss": 1.9357929229736328, "Full-pretrain/Loss (Raw)": 1.9665992259979248, "Full-pretrain/Step": 4758, "Full-pretrain/Step Time": 17.66192110441625} +{"Full-pretrain/Learning Rate": 2.6290027051800565e-05, "Full-pretrain/Loss": 1.9484572410583496, "Full-pretrain/Loss (Raw)": 2.221416473388672, "Full-pretrain/Step": 4759, "Full-pretrain/Step Time": 17.666327005252242} +{"Full-pretrain/Learning Rate": 2.628154749823493e-05, "Full-pretrain/Loss": 1.9677512645721436, "Full-pretrain/Loss (Raw)": 2.0941178798675537, "Full-pretrain/Step": 4760, "Full-pretrain/Step Time": 17.664483746513724} +{"Full-pretrain/Learning Rate": 2.6273067796843244e-05, "Full-pretrain/Loss": 1.97550368309021, "Full-pretrain/Loss (Raw)": 2.1327970027923584, "Full-pretrain/Step": 4761, "Full-pretrain/Step Time": 17.666038131341338} +{"Full-pretrain/Learning Rate": 2.6264587948603626e-05, "Full-pretrain/Loss": 1.9839720726013184, "Full-pretrain/Loss (Raw)": 1.985953688621521, "Full-pretrain/Step": 4762, "Full-pretrain/Step Time": 17.658070592209697} +{"Full-pretrain/Learning Rate": 2.6256107954494242e-05, "Full-pretrain/Loss": 1.983306884765625, "Full-pretrain/Loss (Raw)": 2.08620023727417, "Full-pretrain/Step": 4763, "Full-pretrain/Step Time": 17.66154694929719} +{"Full-pretrain/Learning Rate": 2.624762781549324e-05, "Full-pretrain/Loss": 1.9787784814834595, "Full-pretrain/Loss (Raw)": 1.610667109489441, "Full-pretrain/Step": 4764, "Full-pretrain/Step Time": 17.663980808109045} +{"Full-pretrain/Learning Rate": 2.6239147532578812e-05, "Full-pretrain/Loss": 1.9678412675857544, "Full-pretrain/Loss (Raw)": 1.8404897451400757, "Full-pretrain/Step": 4765, "Full-pretrain/Step Time": 17.660560961812735} +{"Full-pretrain/Learning Rate": 2.6230667106729156e-05, "Full-pretrain/Loss": 1.9585545063018799, "Full-pretrain/Loss (Raw)": 1.691833257675171, "Full-pretrain/Step": 4766, "Full-pretrain/Step Time": 17.663413178175688} +{"Full-pretrain/Learning Rate": 2.6222186538922473e-05, "Full-pretrain/Loss": 1.9724868535995483, "Full-pretrain/Loss (Raw)": 2.3235249519348145, "Full-pretrain/Step": 4767, "Full-pretrain/Step Time": 17.6667191516608} +{"Full-pretrain/Learning Rate": 2.6213705830137008e-05, "Full-pretrain/Loss": 1.9754966497421265, "Full-pretrain/Loss (Raw)": 2.080380916595459, "Full-pretrain/Step": 4768, "Full-pretrain/Step Time": 17.669966831803322} +{"Full-pretrain/Learning Rate": 2.6205224981350997e-05, "Full-pretrain/Loss": 1.9764142036437988, "Full-pretrain/Loss (Raw)": 2.0665457248687744, "Full-pretrain/Step": 4769, "Full-pretrain/Step Time": 17.657404895871878} +{"Full-pretrain/Learning Rate": 2.6196743993542712e-05, "Full-pretrain/Loss": 1.9708558320999146, "Full-pretrain/Loss (Raw)": 1.8952372074127197, "Full-pretrain/Step": 4770, "Full-pretrain/Step Time": 17.658208353444934} +{"Full-pretrain/Learning Rate": 2.6188262867690428e-05, "Full-pretrain/Loss": 1.9762821197509766, "Full-pretrain/Loss (Raw)": 1.966057300567627, "Full-pretrain/Step": 4771, "Full-pretrain/Step Time": 17.659559339284897} +{"Full-pretrain/Learning Rate": 2.6179781604772435e-05, "Full-pretrain/Loss": 1.9699668884277344, "Full-pretrain/Loss (Raw)": 1.8353018760681152, "Full-pretrain/Step": 4772, "Full-pretrain/Step Time": 17.66003268584609} +{"Full-pretrain/Learning Rate": 2.6171300205767052e-05, "Full-pretrain/Loss": 1.9635478258132935, "Full-pretrain/Loss (Raw)": 1.9469150304794312, "Full-pretrain/Step": 4773, "Full-pretrain/Step Time": 17.65853996016085} +{"Full-pretrain/Learning Rate": 2.6162818671652606e-05, "Full-pretrain/Loss": 1.9698989391326904, "Full-pretrain/Loss (Raw)": 1.8654417991638184, "Full-pretrain/Step": 4774, "Full-pretrain/Step Time": 17.659563371911645} +{"Full-pretrain/Learning Rate": 2.615433700340743e-05, "Full-pretrain/Loss": 1.9633152484893799, "Full-pretrain/Loss (Raw)": 1.8504031896591187, "Full-pretrain/Step": 4775, "Full-pretrain/Step Time": 17.657372511923313} +{"Full-pretrain/Learning Rate": 2.614585520200989e-05, "Full-pretrain/Loss": 1.9647066593170166, "Full-pretrain/Loss (Raw)": 1.929734468460083, "Full-pretrain/Step": 4776, "Full-pretrain/Step Time": 17.659956162795424} +{"Full-pretrain/Learning Rate": 2.613737326843835e-05, "Full-pretrain/Loss": 1.9720491170883179, "Full-pretrain/Loss (Raw)": 1.7448902130126953, "Full-pretrain/Step": 4777, "Full-pretrain/Step Time": 17.655375698581338} +{"Full-pretrain/Learning Rate": 2.6128891203671202e-05, "Full-pretrain/Loss": 1.9649330377578735, "Full-pretrain/Loss (Raw)": 1.713744044303894, "Full-pretrain/Step": 4778, "Full-pretrain/Step Time": 17.66231545805931} +{"Full-pretrain/Learning Rate": 2.612040900868685e-05, "Full-pretrain/Loss": 1.963984727859497, "Full-pretrain/Loss (Raw)": 1.7625360488891602, "Full-pretrain/Step": 4779, "Full-pretrain/Step Time": 17.65222790837288} +{"Full-pretrain/Learning Rate": 2.6111926684463717e-05, "Full-pretrain/Loss": 1.9668456315994263, "Full-pretrain/Loss (Raw)": 1.969931960105896, "Full-pretrain/Step": 4780, "Full-pretrain/Step Time": 17.656021298840642} +{"Full-pretrain/Learning Rate": 2.6103444231980236e-05, "Full-pretrain/Loss": 1.9698466062545776, "Full-pretrain/Loss (Raw)": 1.969200849533081, "Full-pretrain/Step": 4781, "Full-pretrain/Step Time": 17.652661794796586} +{"Full-pretrain/Learning Rate": 2.609496165221485e-05, "Full-pretrain/Loss": 1.959388256072998, "Full-pretrain/Loss (Raw)": 1.9909921884536743, "Full-pretrain/Step": 4782, "Full-pretrain/Step Time": 17.648450886830688} +{"Full-pretrain/Learning Rate": 2.6086478946146015e-05, "Full-pretrain/Loss": 1.9557344913482666, "Full-pretrain/Loss (Raw)": 2.064992904663086, "Full-pretrain/Step": 4783, "Full-pretrain/Step Time": 17.649472353979945} +{"Full-pretrain/Learning Rate": 2.6077996114752218e-05, "Full-pretrain/Loss": 1.9572570323944092, "Full-pretrain/Loss (Raw)": 1.9452329874038696, "Full-pretrain/Step": 4784, "Full-pretrain/Step Time": 17.655174365267158} +{"Full-pretrain/Learning Rate": 2.6069513159011947e-05, "Full-pretrain/Loss": 1.9542914628982544, "Full-pretrain/Loss (Raw)": 2.0316710472106934, "Full-pretrain/Step": 4785, "Full-pretrain/Step Time": 17.64902800694108} +{"Full-pretrain/Learning Rate": 2.606103007990371e-05, "Full-pretrain/Loss": 1.9572211503982544, "Full-pretrain/Loss (Raw)": 2.0585389137268066, "Full-pretrain/Step": 4786, "Full-pretrain/Step Time": 17.650082543492317} +{"Full-pretrain/Learning Rate": 2.6052546878406025e-05, "Full-pretrain/Loss": 1.9647397994995117, "Full-pretrain/Loss (Raw)": 2.1079635620117188, "Full-pretrain/Step": 4787, "Full-pretrain/Step Time": 17.65040715970099} +{"Full-pretrain/Learning Rate": 2.6044063555497426e-05, "Full-pretrain/Loss": 1.94162118434906, "Full-pretrain/Loss (Raw)": 1.3875629901885986, "Full-pretrain/Step": 4788, "Full-pretrain/Step Time": 17.653861885890365} +{"Full-pretrain/Learning Rate": 2.603558011215647e-05, "Full-pretrain/Loss": 1.9410430192947388, "Full-pretrain/Loss (Raw)": 1.9765046834945679, "Full-pretrain/Step": 4789, "Full-pretrain/Step Time": 17.654493995010853} +{"Full-pretrain/Learning Rate": 2.6027096549361713e-05, "Full-pretrain/Loss": 1.9472126960754395, "Full-pretrain/Loss (Raw)": 2.164024829864502, "Full-pretrain/Step": 4790, "Full-pretrain/Step Time": 17.648274654522538} +{"Full-pretrain/Learning Rate": 2.601861286809172e-05, "Full-pretrain/Loss": 1.9378809928894043, "Full-pretrain/Loss (Raw)": 1.9228055477142334, "Full-pretrain/Step": 4791, "Full-pretrain/Step Time": 17.653862942010164} +{"Full-pretrain/Learning Rate": 2.6010129069325096e-05, "Full-pretrain/Loss": 1.939072608947754, "Full-pretrain/Loss (Raw)": 2.1322503089904785, "Full-pretrain/Step": 4792, "Full-pretrain/Step Time": 17.649636201560497} +{"Full-pretrain/Learning Rate": 2.6001645154040438e-05, "Full-pretrain/Loss": 1.9354276657104492, "Full-pretrain/Loss (Raw)": 2.016159772872925, "Full-pretrain/Step": 4793, "Full-pretrain/Step Time": 17.6535663921386} +{"Full-pretrain/Learning Rate": 2.5993161123216365e-05, "Full-pretrain/Loss": 1.9318232536315918, "Full-pretrain/Loss (Raw)": 1.8706074953079224, "Full-pretrain/Step": 4794, "Full-pretrain/Step Time": 17.6506609916687} +{"Full-pretrain/Learning Rate": 2.59846769778315e-05, "Full-pretrain/Loss": 1.9325244426727295, "Full-pretrain/Loss (Raw)": 2.108640670776367, "Full-pretrain/Step": 4795, "Full-pretrain/Step Time": 17.649118669331074} +{"Full-pretrain/Learning Rate": 2.5976192718864494e-05, "Full-pretrain/Loss": 1.9431389570236206, "Full-pretrain/Loss (Raw)": 1.9503310918807983, "Full-pretrain/Step": 4796, "Full-pretrain/Step Time": 17.649681702256203} +{"Full-pretrain/Learning Rate": 2.5967708347294005e-05, "Full-pretrain/Loss": 1.9514362812042236, "Full-pretrain/Loss (Raw)": 2.106004476547241, "Full-pretrain/Step": 4797, "Full-pretrain/Step Time": 17.654790122061968} +{"Full-pretrain/Learning Rate": 2.5959223864098696e-05, "Full-pretrain/Loss": 1.9632916450500488, "Full-pretrain/Loss (Raw)": 2.071207046508789, "Full-pretrain/Step": 4798, "Full-pretrain/Step Time": 17.653239339590073} +{"Full-pretrain/Learning Rate": 2.595073927025725e-05, "Full-pretrain/Loss": 1.9516273736953735, "Full-pretrain/Loss (Raw)": 1.9502661228179932, "Full-pretrain/Step": 4799, "Full-pretrain/Step Time": 17.65339256078005} +{"Full-pretrain/Learning Rate": 2.594225456674837e-05, "Full-pretrain/Loss": 1.9516408443450928, "Full-pretrain/Loss (Raw)": 2.080810546875, "Full-pretrain/Step": 4800, "Full-pretrain/Step Time": 17.65456801839173} +{"Full-pretrain/Learning Rate": 2.5933769754550747e-05, "Full-pretrain/Loss": 1.9362597465515137, "Full-pretrain/Loss (Raw)": 1.574354887008667, "Full-pretrain/Step": 4801, "Full-pretrain/Step Time": 17.656841535121202} +{"Full-pretrain/Learning Rate": 2.5925284834643122e-05, "Full-pretrain/Loss": 1.9251916408538818, "Full-pretrain/Loss (Raw)": 1.541053056716919, "Full-pretrain/Step": 4802, "Full-pretrain/Step Time": 17.653344254940748} +{"Full-pretrain/Learning Rate": 2.5916799808004206e-05, "Full-pretrain/Loss": 1.937256097793579, "Full-pretrain/Loss (Raw)": 2.3521223068237305, "Full-pretrain/Step": 4803, "Full-pretrain/Step Time": 17.648175101727247} +{"Full-pretrain/Learning Rate": 2.5908314675612756e-05, "Full-pretrain/Loss": 1.9396644830703735, "Full-pretrain/Loss (Raw)": 1.9123696088790894, "Full-pretrain/Step": 4804, "Full-pretrain/Step Time": 17.6524247713387} +{"Full-pretrain/Learning Rate": 2.589982943844753e-05, "Full-pretrain/Loss": 1.9418659210205078, "Full-pretrain/Loss (Raw)": 2.0173633098602295, "Full-pretrain/Step": 4805, "Full-pretrain/Step Time": 17.65011826530099} +{"Full-pretrain/Learning Rate": 2.589134409748729e-05, "Full-pretrain/Loss": 1.9430865049362183, "Full-pretrain/Loss (Raw)": 1.9044978618621826, "Full-pretrain/Step": 4806, "Full-pretrain/Step Time": 17.653757378458977} +{"Full-pretrain/Learning Rate": 2.5882858653710827e-05, "Full-pretrain/Loss": 1.9463253021240234, "Full-pretrain/Loss (Raw)": 1.9540419578552246, "Full-pretrain/Step": 4807, "Full-pretrain/Step Time": 17.65308885462582} +{"Full-pretrain/Learning Rate": 2.5874373108096932e-05, "Full-pretrain/Loss": 1.947113275527954, "Full-pretrain/Loss (Raw)": 1.9549498558044434, "Full-pretrain/Step": 4808, "Full-pretrain/Step Time": 17.659052839502692} +{"Full-pretrain/Learning Rate": 2.5865887461624398e-05, "Full-pretrain/Loss": 1.9472167491912842, "Full-pretrain/Loss (Raw)": 1.7482048273086548, "Full-pretrain/Step": 4809, "Full-pretrain/Step Time": 17.66384724341333} +{"Full-pretrain/Learning Rate": 2.5857401715272056e-05, "Full-pretrain/Loss": 1.9501709938049316, "Full-pretrain/Loss (Raw)": 1.8082804679870605, "Full-pretrain/Step": 4810, "Full-pretrain/Step Time": 17.657022941857576} +{"Full-pretrain/Learning Rate": 2.5848915870018718e-05, "Full-pretrain/Loss": 1.9612375497817993, "Full-pretrain/Loss (Raw)": 2.1166648864746094, "Full-pretrain/Step": 4811, "Full-pretrain/Step Time": 17.65425506606698} +{"Full-pretrain/Learning Rate": 2.584042992684324e-05, "Full-pretrain/Loss": 1.9493777751922607, "Full-pretrain/Loss (Raw)": 1.590416669845581, "Full-pretrain/Step": 4812, "Full-pretrain/Step Time": 17.653596941381693} +{"Full-pretrain/Learning Rate": 2.5831943886724467e-05, "Full-pretrain/Loss": 1.9437775611877441, "Full-pretrain/Loss (Raw)": 1.789996862411499, "Full-pretrain/Step": 4813, "Full-pretrain/Step Time": 17.655662067234516} +{"Full-pretrain/Learning Rate": 2.5823457750641255e-05, "Full-pretrain/Loss": 1.949187159538269, "Full-pretrain/Loss (Raw)": 2.1640989780426025, "Full-pretrain/Step": 4814, "Full-pretrain/Step Time": 17.65555107407272} +{"Full-pretrain/Learning Rate": 2.5814971519572483e-05, "Full-pretrain/Loss": 1.9367318153381348, "Full-pretrain/Loss (Raw)": 1.666418433189392, "Full-pretrain/Step": 4815, "Full-pretrain/Step Time": 17.65688595548272} +{"Full-pretrain/Learning Rate": 2.5806485194497037e-05, "Full-pretrain/Loss": 1.932661771774292, "Full-pretrain/Loss (Raw)": 1.8149930238723755, "Full-pretrain/Step": 4816, "Full-pretrain/Step Time": 17.668946597725153} +{"Full-pretrain/Learning Rate": 2.57979987763938e-05, "Full-pretrain/Loss": 1.9181795120239258, "Full-pretrain/Loss (Raw)": 1.5682402849197388, "Full-pretrain/Step": 4817, "Full-pretrain/Step Time": 17.66469930112362} +{"Full-pretrain/Learning Rate": 2.578951226624169e-05, "Full-pretrain/Loss": 1.9116448163986206, "Full-pretrain/Loss (Raw)": 1.8494294881820679, "Full-pretrain/Step": 4818, "Full-pretrain/Step Time": 17.66276049800217} +{"Full-pretrain/Learning Rate": 2.578102566501961e-05, "Full-pretrain/Loss": 1.9057393074035645, "Full-pretrain/Loss (Raw)": 1.918982744216919, "Full-pretrain/Step": 4819, "Full-pretrain/Step Time": 17.655881414189935} +{"Full-pretrain/Learning Rate": 2.5772538973706496e-05, "Full-pretrain/Loss": 1.9182974100112915, "Full-pretrain/Loss (Raw)": 1.7894240617752075, "Full-pretrain/Step": 4820, "Full-pretrain/Step Time": 17.6645055282861} +{"Full-pretrain/Learning Rate": 2.5764052193281285e-05, "Full-pretrain/Loss": 1.9185686111450195, "Full-pretrain/Loss (Raw)": 1.985185146331787, "Full-pretrain/Step": 4821, "Full-pretrain/Step Time": 17.663183296099305} +{"Full-pretrain/Learning Rate": 2.575556532472292e-05, "Full-pretrain/Loss": 1.9134219884872437, "Full-pretrain/Loss (Raw)": 1.999333381652832, "Full-pretrain/Step": 4822, "Full-pretrain/Step Time": 17.664062444120646} +{"Full-pretrain/Learning Rate": 2.574707836901037e-05, "Full-pretrain/Loss": 1.917121410369873, "Full-pretrain/Loss (Raw)": 2.0411839485168457, "Full-pretrain/Step": 4823, "Full-pretrain/Step Time": 17.662497809156775} +{"Full-pretrain/Learning Rate": 2.5738591327122586e-05, "Full-pretrain/Loss": 1.913822889328003, "Full-pretrain/Loss (Raw)": 2.0266990661621094, "Full-pretrain/Step": 4824, "Full-pretrain/Step Time": 17.6649222150445} +{"Full-pretrain/Learning Rate": 2.5730104200038547e-05, "Full-pretrain/Loss": 1.9160579442977905, "Full-pretrain/Loss (Raw)": 2.0876824855804443, "Full-pretrain/Step": 4825, "Full-pretrain/Step Time": 17.66681075282395} +{"Full-pretrain/Learning Rate": 2.572161698873725e-05, "Full-pretrain/Loss": 1.9166336059570312, "Full-pretrain/Loss (Raw)": 1.8890304565429688, "Full-pretrain/Step": 4826, "Full-pretrain/Step Time": 17.665188474580646} +{"Full-pretrain/Learning Rate": 2.5713129694197685e-05, "Full-pretrain/Loss": 1.9243242740631104, "Full-pretrain/Loss (Raw)": 2.3547403812408447, "Full-pretrain/Step": 4827, "Full-pretrain/Step Time": 17.664746690541506} +{"Full-pretrain/Learning Rate": 2.5704642317398857e-05, "Full-pretrain/Loss": 1.9221227169036865, "Full-pretrain/Loss (Raw)": 1.8798795938491821, "Full-pretrain/Step": 4828, "Full-pretrain/Step Time": 17.664111910387874} +{"Full-pretrain/Learning Rate": 2.5696154859319794e-05, "Full-pretrain/Loss": 1.9144799709320068, "Full-pretrain/Loss (Raw)": 1.8614357709884644, "Full-pretrain/Step": 4829, "Full-pretrain/Step Time": 17.65939045883715} +{"Full-pretrain/Learning Rate": 2.5687667320939508e-05, "Full-pretrain/Loss": 1.9205023050308228, "Full-pretrain/Loss (Raw)": 2.263925075531006, "Full-pretrain/Step": 4830, "Full-pretrain/Step Time": 17.652841305360198} +{"Full-pretrain/Learning Rate": 2.5679179703237038e-05, "Full-pretrain/Loss": 1.9220935106277466, "Full-pretrain/Loss (Raw)": 2.001182794570923, "Full-pretrain/Step": 4831, "Full-pretrain/Step Time": 17.653699645772576} +{"Full-pretrain/Learning Rate": 2.567069200719143e-05, "Full-pretrain/Loss": 1.9165120124816895, "Full-pretrain/Loss (Raw)": 1.9021987915039062, "Full-pretrain/Step": 4832, "Full-pretrain/Step Time": 17.66689077951014} +{"Full-pretrain/Learning Rate": 2.5662204233781734e-05, "Full-pretrain/Loss": 1.9218528270721436, "Full-pretrain/Loss (Raw)": 1.7452677488327026, "Full-pretrain/Step": 4833, "Full-pretrain/Step Time": 17.66420228406787} +{"Full-pretrain/Learning Rate": 2.5653716383987013e-05, "Full-pretrain/Loss": 1.9368476867675781, "Full-pretrain/Loss (Raw)": 2.0208852291107178, "Full-pretrain/Step": 4834, "Full-pretrain/Step Time": 17.661952083930373} +{"Full-pretrain/Learning Rate": 2.5645228458786336e-05, "Full-pretrain/Loss": 1.9238638877868652, "Full-pretrain/Loss (Raw)": 1.936638593673706, "Full-pretrain/Step": 4835, "Full-pretrain/Step Time": 17.66168907471001} +{"Full-pretrain/Learning Rate": 2.5636740459158777e-05, "Full-pretrain/Loss": 1.9240562915802002, "Full-pretrain/Loss (Raw)": 1.9185254573822021, "Full-pretrain/Step": 4836, "Full-pretrain/Step Time": 17.661417201161385} +{"Full-pretrain/Learning Rate": 2.562825238608344e-05, "Full-pretrain/Loss": 1.9264376163482666, "Full-pretrain/Loss (Raw)": 2.0935726165771484, "Full-pretrain/Step": 4837, "Full-pretrain/Step Time": 17.66013920865953} +{"Full-pretrain/Learning Rate": 2.56197642405394e-05, "Full-pretrain/Loss": 1.9280920028686523, "Full-pretrain/Loss (Raw)": 1.9574331045150757, "Full-pretrain/Step": 4838, "Full-pretrain/Step Time": 17.65489357151091} +{"Full-pretrain/Learning Rate": 2.5611276023505785e-05, "Full-pretrain/Loss": 1.9283156394958496, "Full-pretrain/Loss (Raw)": 1.9612021446228027, "Full-pretrain/Step": 4839, "Full-pretrain/Step Time": 17.650027142837644} +{"Full-pretrain/Learning Rate": 2.5602787735961692e-05, "Full-pretrain/Loss": 1.923598289489746, "Full-pretrain/Loss (Raw)": 1.8039931058883667, "Full-pretrain/Step": 4840, "Full-pretrain/Step Time": 17.652303721755743} +{"Full-pretrain/Learning Rate": 2.5594299378886237e-05, "Full-pretrain/Loss": 1.925863265991211, "Full-pretrain/Loss (Raw)": 1.820685625076294, "Full-pretrain/Step": 4841, "Full-pretrain/Step Time": 17.649690065532923} +{"Full-pretrain/Learning Rate": 2.5585810953258572e-05, "Full-pretrain/Loss": 1.9427337646484375, "Full-pretrain/Loss (Raw)": 2.348137855529785, "Full-pretrain/Step": 4842, "Full-pretrain/Step Time": 17.652658624574542} +{"Full-pretrain/Learning Rate": 2.5577322460057807e-05, "Full-pretrain/Loss": 1.9379159212112427, "Full-pretrain/Loss (Raw)": 1.9624910354614258, "Full-pretrain/Step": 4843, "Full-pretrain/Step Time": 17.655539663508534} +{"Full-pretrain/Learning Rate": 2.5568833900263105e-05, "Full-pretrain/Loss": 1.9447834491729736, "Full-pretrain/Loss (Raw)": 1.8101770877838135, "Full-pretrain/Step": 4844, "Full-pretrain/Step Time": 17.652883971109986} +{"Full-pretrain/Learning Rate": 2.556034527485361e-05, "Full-pretrain/Loss": 1.9549893140792847, "Full-pretrain/Loss (Raw)": 2.1165852546691895, "Full-pretrain/Step": 4845, "Full-pretrain/Step Time": 17.6555638872087} +{"Full-pretrain/Learning Rate": 2.5551856584808482e-05, "Full-pretrain/Loss": 1.9607884883880615, "Full-pretrain/Loss (Raw)": 2.3496742248535156, "Full-pretrain/Step": 4846, "Full-pretrain/Step Time": 17.653241949155927} +{"Full-pretrain/Learning Rate": 2.5543367831106895e-05, "Full-pretrain/Loss": 1.9677871465682983, "Full-pretrain/Loss (Raw)": 1.8903741836547852, "Full-pretrain/Step": 4847, "Full-pretrain/Step Time": 17.66360646672547} +{"Full-pretrain/Learning Rate": 2.5534879014728013e-05, "Full-pretrain/Loss": 1.9567716121673584, "Full-pretrain/Loss (Raw)": 1.46249520778656, "Full-pretrain/Step": 4848, "Full-pretrain/Step Time": 17.662564497441053} +{"Full-pretrain/Learning Rate": 2.5526390136651035e-05, "Full-pretrain/Loss": 1.9655160903930664, "Full-pretrain/Loss (Raw)": 1.8480653762817383, "Full-pretrain/Step": 4849, "Full-pretrain/Step Time": 17.65929007716477} +{"Full-pretrain/Learning Rate": 2.5517901197855137e-05, "Full-pretrain/Loss": 1.9644821882247925, "Full-pretrain/Loss (Raw)": 1.8163437843322754, "Full-pretrain/Step": 4850, "Full-pretrain/Step Time": 17.66515713557601} +{"Full-pretrain/Learning Rate": 2.5509412199319517e-05, "Full-pretrain/Loss": 1.978651523590088, "Full-pretrain/Loss (Raw)": 2.3724024295806885, "Full-pretrain/Step": 4851, "Full-pretrain/Step Time": 17.66068197786808} +{"Full-pretrain/Learning Rate": 2.5500923142023374e-05, "Full-pretrain/Loss": 1.9770069122314453, "Full-pretrain/Loss (Raw)": 1.7367939949035645, "Full-pretrain/Step": 4852, "Full-pretrain/Step Time": 17.663366690278053} +{"Full-pretrain/Learning Rate": 2.5492434026945927e-05, "Full-pretrain/Loss": 1.980423927307129, "Full-pretrain/Loss (Raw)": 2.0945301055908203, "Full-pretrain/Step": 4853, "Full-pretrain/Step Time": 17.658265037462115} +{"Full-pretrain/Learning Rate": 2.5483944855066383e-05, "Full-pretrain/Loss": 1.9812660217285156, "Full-pretrain/Loss (Raw)": 2.0262792110443115, "Full-pretrain/Step": 4854, "Full-pretrain/Step Time": 17.661112597212195} +{"Full-pretrain/Learning Rate": 2.5475455627363976e-05, "Full-pretrain/Loss": 1.984877586364746, "Full-pretrain/Loss (Raw)": 2.1567554473876953, "Full-pretrain/Step": 4855, "Full-pretrain/Step Time": 17.654021928086877} +{"Full-pretrain/Learning Rate": 2.5466966344817927e-05, "Full-pretrain/Loss": 1.9869930744171143, "Full-pretrain/Loss (Raw)": 2.094395637512207, "Full-pretrain/Step": 4856, "Full-pretrain/Step Time": 17.655874283984303} +{"Full-pretrain/Learning Rate": 2.5458477008407477e-05, "Full-pretrain/Loss": 1.985701560974121, "Full-pretrain/Loss (Raw)": 2.046353340148926, "Full-pretrain/Step": 4857, "Full-pretrain/Step Time": 17.654261764138937} +{"Full-pretrain/Learning Rate": 2.5449987619111865e-05, "Full-pretrain/Loss": 1.99015474319458, "Full-pretrain/Loss (Raw)": 2.0315310955047607, "Full-pretrain/Step": 4858, "Full-pretrain/Step Time": 17.64942184276879} +{"Full-pretrain/Learning Rate": 2.5441498177910338e-05, "Full-pretrain/Loss": 1.963007926940918, "Full-pretrain/Loss (Raw)": 1.4860398769378662, "Full-pretrain/Step": 4859, "Full-pretrain/Step Time": 17.65019541978836} +{"Full-pretrain/Learning Rate": 2.543300868578215e-05, "Full-pretrain/Loss": 1.9672043323516846, "Full-pretrain/Loss (Raw)": 2.0141677856445312, "Full-pretrain/Step": 4860, "Full-pretrain/Step Time": 17.651313468813896} +{"Full-pretrain/Learning Rate": 2.542451914370656e-05, "Full-pretrain/Loss": 1.9638532400131226, "Full-pretrain/Loss (Raw)": 1.7542006969451904, "Full-pretrain/Step": 4861, "Full-pretrain/Step Time": 17.651767002418637} +{"Full-pretrain/Learning Rate": 2.541602955266284e-05, "Full-pretrain/Loss": 1.95126211643219, "Full-pretrain/Loss (Raw)": 1.861009955406189, "Full-pretrain/Step": 4862, "Full-pretrain/Step Time": 17.64556764252484} +{"Full-pretrain/Learning Rate": 2.5407539913630256e-05, "Full-pretrain/Loss": 1.948317289352417, "Full-pretrain/Loss (Raw)": 1.9069478511810303, "Full-pretrain/Step": 4863, "Full-pretrain/Step Time": 17.64969134889543} +{"Full-pretrain/Learning Rate": 2.5399050227588085e-05, "Full-pretrain/Loss": 1.9451006650924683, "Full-pretrain/Loss (Raw)": 1.7992689609527588, "Full-pretrain/Step": 4864, "Full-pretrain/Step Time": 17.64826257713139} +{"Full-pretrain/Learning Rate": 2.5390560495515614e-05, "Full-pretrain/Loss": 1.953832983970642, "Full-pretrain/Loss (Raw)": 2.0246996879577637, "Full-pretrain/Step": 4865, "Full-pretrain/Step Time": 17.64807212166488} +{"Full-pretrain/Learning Rate": 2.5382070718392133e-05, "Full-pretrain/Loss": 1.960862398147583, "Full-pretrain/Loss (Raw)": 2.2458276748657227, "Full-pretrain/Step": 4866, "Full-pretrain/Step Time": 17.647525254637003} +{"Full-pretrain/Learning Rate": 2.5373580897196914e-05, "Full-pretrain/Loss": 1.9673335552215576, "Full-pretrain/Loss (Raw)": 2.1437125205993652, "Full-pretrain/Step": 4867, "Full-pretrain/Step Time": 17.642053231596947} +{"Full-pretrain/Learning Rate": 2.5365091032909277e-05, "Full-pretrain/Loss": 1.9637717008590698, "Full-pretrain/Loss (Raw)": 1.8045494556427002, "Full-pretrain/Step": 4868, "Full-pretrain/Step Time": 17.64360265992582} +{"Full-pretrain/Learning Rate": 2.5356601126508518e-05, "Full-pretrain/Loss": 1.9592397212982178, "Full-pretrain/Loss (Raw)": 1.9485468864440918, "Full-pretrain/Step": 4869, "Full-pretrain/Step Time": 17.64445598050952} +{"Full-pretrain/Learning Rate": 2.5348111178973937e-05, "Full-pretrain/Loss": 1.9535737037658691, "Full-pretrain/Loss (Raw)": 1.7761235237121582, "Full-pretrain/Step": 4870, "Full-pretrain/Step Time": 17.63716610148549} +{"Full-pretrain/Learning Rate": 2.533962119128487e-05, "Full-pretrain/Loss": 1.9633235931396484, "Full-pretrain/Loss (Raw)": 2.273196220397949, "Full-pretrain/Step": 4871, "Full-pretrain/Step Time": 17.635407196357846} +{"Full-pretrain/Learning Rate": 2.53311311644206e-05, "Full-pretrain/Loss": 1.9621214866638184, "Full-pretrain/Loss (Raw)": 1.76552414894104, "Full-pretrain/Step": 4872, "Full-pretrain/Step Time": 17.636624982580543} +{"Full-pretrain/Learning Rate": 2.5322641099360477e-05, "Full-pretrain/Loss": 1.968005657196045, "Full-pretrain/Loss (Raw)": 2.008981704711914, "Full-pretrain/Step": 4873, "Full-pretrain/Step Time": 17.63498486019671} +{"Full-pretrain/Learning Rate": 2.531415099708382e-05, "Full-pretrain/Loss": 1.9566547870635986, "Full-pretrain/Loss (Raw)": 1.9849114418029785, "Full-pretrain/Step": 4874, "Full-pretrain/Step Time": 17.640183145180345} +{"Full-pretrain/Learning Rate": 2.5305660858569947e-05, "Full-pretrain/Loss": 1.9456015825271606, "Full-pretrain/Loss (Raw)": 1.608786702156067, "Full-pretrain/Step": 4875, "Full-pretrain/Step Time": 17.631343256682158} +{"Full-pretrain/Learning Rate": 2.529717068479821e-05, "Full-pretrain/Loss": 1.9512577056884766, "Full-pretrain/Loss (Raw)": 1.9911723136901855, "Full-pretrain/Step": 4876, "Full-pretrain/Step Time": 17.63640180043876} +{"Full-pretrain/Learning Rate": 2.5288680476747926e-05, "Full-pretrain/Loss": 1.9517021179199219, "Full-pretrain/Loss (Raw)": 2.130807399749756, "Full-pretrain/Step": 4877, "Full-pretrain/Step Time": 17.641298782080412} +{"Full-pretrain/Learning Rate": 2.528019023539846e-05, "Full-pretrain/Loss": 1.9583864212036133, "Full-pretrain/Loss (Raw)": 2.5635735988616943, "Full-pretrain/Step": 4878, "Full-pretrain/Step Time": 17.6339094042778} +{"Full-pretrain/Learning Rate": 2.527169996172915e-05, "Full-pretrain/Loss": 1.9539486169815063, "Full-pretrain/Loss (Raw)": 1.7483620643615723, "Full-pretrain/Step": 4879, "Full-pretrain/Step Time": 17.62876470759511} +{"Full-pretrain/Learning Rate": 2.526320965671934e-05, "Full-pretrain/Loss": 1.9646790027618408, "Full-pretrain/Loss (Raw)": 1.8058634996414185, "Full-pretrain/Step": 4880, "Full-pretrain/Step Time": 17.63094319216907} +{"Full-pretrain/Learning Rate": 2.5254719321348392e-05, "Full-pretrain/Loss": 1.9633461236953735, "Full-pretrain/Loss (Raw)": 1.805417776107788, "Full-pretrain/Step": 4881, "Full-pretrain/Step Time": 17.631978018209338} +{"Full-pretrain/Learning Rate": 2.5246228956595662e-05, "Full-pretrain/Loss": 1.9656438827514648, "Full-pretrain/Loss (Raw)": 1.8898718357086182, "Full-pretrain/Step": 4882, "Full-pretrain/Step Time": 17.626424757763743} +{"Full-pretrain/Learning Rate": 2.52377385634405e-05, "Full-pretrain/Loss": 1.9470369815826416, "Full-pretrain/Loss (Raw)": 1.776977300643921, "Full-pretrain/Step": 4883, "Full-pretrain/Step Time": 17.623325569555163} +{"Full-pretrain/Learning Rate": 2.5229248142862288e-05, "Full-pretrain/Loss": 1.950763463973999, "Full-pretrain/Loss (Raw)": 1.8560431003570557, "Full-pretrain/Step": 4884, "Full-pretrain/Step Time": 17.627158228307962} +{"Full-pretrain/Learning Rate": 2.5220757695840375e-05, "Full-pretrain/Loss": 1.9404940605163574, "Full-pretrain/Loss (Raw)": 1.76591157913208, "Full-pretrain/Step": 4885, "Full-pretrain/Step Time": 17.627770207822323} +{"Full-pretrain/Learning Rate": 2.521226722335414e-05, "Full-pretrain/Loss": 1.938854455947876, "Full-pretrain/Loss (Raw)": 1.9738119840621948, "Full-pretrain/Step": 4886, "Full-pretrain/Step Time": 17.623810878023505} +{"Full-pretrain/Learning Rate": 2.5203776726382962e-05, "Full-pretrain/Loss": 1.9267009496688843, "Full-pretrain/Loss (Raw)": 1.7678427696228027, "Full-pretrain/Step": 4887, "Full-pretrain/Step Time": 17.618402710184455} +{"Full-pretrain/Learning Rate": 2.5195286205906206e-05, "Full-pretrain/Loss": 1.9224642515182495, "Full-pretrain/Loss (Raw)": 1.9588230848312378, "Full-pretrain/Step": 4888, "Full-pretrain/Step Time": 17.620860632508993} +{"Full-pretrain/Learning Rate": 2.5186795662903255e-05, "Full-pretrain/Loss": 1.9259257316589355, "Full-pretrain/Loss (Raw)": 2.157119035720825, "Full-pretrain/Step": 4889, "Full-pretrain/Step Time": 17.617981035262346} +{"Full-pretrain/Learning Rate": 2.5178305098353488e-05, "Full-pretrain/Loss": 1.9196901321411133, "Full-pretrain/Loss (Raw)": 1.8319952487945557, "Full-pretrain/Step": 4890, "Full-pretrain/Step Time": 17.618735084310174} +{"Full-pretrain/Learning Rate": 2.5169814513236296e-05, "Full-pretrain/Loss": 1.9314744472503662, "Full-pretrain/Loss (Raw)": 1.8631346225738525, "Full-pretrain/Step": 4891, "Full-pretrain/Step Time": 17.617653680965304} +{"Full-pretrain/Learning Rate": 2.5161323908531058e-05, "Full-pretrain/Loss": 1.9336230754852295, "Full-pretrain/Loss (Raw)": 2.08292293548584, "Full-pretrain/Step": 4892, "Full-pretrain/Step Time": 17.617269726470113} +{"Full-pretrain/Learning Rate": 2.515283328521716e-05, "Full-pretrain/Loss": 1.9339637756347656, "Full-pretrain/Loss (Raw)": 1.7651017904281616, "Full-pretrain/Step": 4893, "Full-pretrain/Step Time": 17.619463320821524} +{"Full-pretrain/Learning Rate": 2.5144342644274e-05, "Full-pretrain/Loss": 1.9373794794082642, "Full-pretrain/Loss (Raw)": 1.970315933227539, "Full-pretrain/Step": 4894, "Full-pretrain/Step Time": 17.617883315309882} +{"Full-pretrain/Learning Rate": 2.5135851986680962e-05, "Full-pretrain/Loss": 1.9309821128845215, "Full-pretrain/Loss (Raw)": 1.7022342681884766, "Full-pretrain/Step": 4895, "Full-pretrain/Step Time": 17.614164013415575} +{"Full-pretrain/Learning Rate": 2.5127361313417447e-05, "Full-pretrain/Loss": 1.938575029373169, "Full-pretrain/Loss (Raw)": 2.042238712310791, "Full-pretrain/Step": 4896, "Full-pretrain/Step Time": 17.61888754926622} +{"Full-pretrain/Learning Rate": 2.5118870625462853e-05, "Full-pretrain/Loss": 1.9382314682006836, "Full-pretrain/Loss (Raw)": 2.0137081146240234, "Full-pretrain/Step": 4897, "Full-pretrain/Step Time": 17.622498609125614} +{"Full-pretrain/Learning Rate": 2.5110379923796567e-05, "Full-pretrain/Loss": 1.9285154342651367, "Full-pretrain/Loss (Raw)": 1.9349138736724854, "Full-pretrain/Step": 4898, "Full-pretrain/Step Time": 17.619956323876977} +{"Full-pretrain/Learning Rate": 2.5101889209398004e-05, "Full-pretrain/Loss": 1.9386026859283447, "Full-pretrain/Loss (Raw)": 2.466503620147705, "Full-pretrain/Step": 4899, "Full-pretrain/Step Time": 17.613997602835298} +{"Full-pretrain/Learning Rate": 2.5093398483246554e-05, "Full-pretrain/Loss": 1.9470181465148926, "Full-pretrain/Loss (Raw)": 2.073845863342285, "Full-pretrain/Step": 4900, "Full-pretrain/Step Time": 17.62210384197533} +{"Full-pretrain/Learning Rate": 2.5084907746321618e-05, "Full-pretrain/Loss": 1.9563438892364502, "Full-pretrain/Loss (Raw)": 2.246969223022461, "Full-pretrain/Step": 4901, "Full-pretrain/Step Time": 17.618712920695543} +{"Full-pretrain/Learning Rate": 2.507641699960261e-05, "Full-pretrain/Loss": 1.96232008934021, "Full-pretrain/Loss (Raw)": 1.9673573970794678, "Full-pretrain/Step": 4902, "Full-pretrain/Step Time": 17.618278978392482} +{"Full-pretrain/Learning Rate": 2.5067926244068917e-05, "Full-pretrain/Loss": 1.955151915550232, "Full-pretrain/Loss (Raw)": 2.043818473815918, "Full-pretrain/Step": 4903, "Full-pretrain/Step Time": 17.62266750447452} +{"Full-pretrain/Learning Rate": 2.505943548069996e-05, "Full-pretrain/Loss": 1.959831953048706, "Full-pretrain/Loss (Raw)": 1.9152858257293701, "Full-pretrain/Step": 4904, "Full-pretrain/Step Time": 17.62275530397892} +{"Full-pretrain/Learning Rate": 2.505094471047515e-05, "Full-pretrain/Loss": 1.9534374475479126, "Full-pretrain/Loss (Raw)": 1.804356575012207, "Full-pretrain/Step": 4905, "Full-pretrain/Step Time": 17.6293613743037} +{"Full-pretrain/Learning Rate": 2.5042453934373873e-05, "Full-pretrain/Loss": 1.9503949880599976, "Full-pretrain/Loss (Raw)": 1.887552261352539, "Full-pretrain/Step": 4906, "Full-pretrain/Step Time": 17.62360069900751} +{"Full-pretrain/Learning Rate": 2.5033963153375556e-05, "Full-pretrain/Loss": 1.9615577459335327, "Full-pretrain/Loss (Raw)": 1.9659950733184814, "Full-pretrain/Step": 4907, "Full-pretrain/Step Time": 17.625519244000316} +{"Full-pretrain/Learning Rate": 2.5025472368459606e-05, "Full-pretrain/Loss": 1.959139347076416, "Full-pretrain/Loss (Raw)": 1.9137864112854004, "Full-pretrain/Step": 4908, "Full-pretrain/Step Time": 17.62587032467127} +{"Full-pretrain/Learning Rate": 2.501698158060542e-05, "Full-pretrain/Loss": 1.9621294736862183, "Full-pretrain/Loss (Raw)": 2.226487159729004, "Full-pretrain/Step": 4909, "Full-pretrain/Step Time": 17.628313655033708} +{"Full-pretrain/Learning Rate": 2.5008490790792415e-05, "Full-pretrain/Loss": 1.9428892135620117, "Full-pretrain/Loss (Raw)": 1.947890281677246, "Full-pretrain/Step": 4910, "Full-pretrain/Step Time": 17.634248791262507} +{"Full-pretrain/Learning Rate": 2.5e-05, "Full-pretrain/Loss": 1.950559377670288, "Full-pretrain/Loss (Raw)": 1.9938057661056519, "Full-pretrain/Step": 4911, "Full-pretrain/Step Time": 17.63563165254891} +{"Full-pretrain/Learning Rate": 2.4991509209207588e-05, "Full-pretrain/Loss": 1.957932710647583, "Full-pretrain/Loss (Raw)": 2.041809320449829, "Full-pretrain/Step": 4912, "Full-pretrain/Step Time": 17.62941336631775} +{"Full-pretrain/Learning Rate": 2.498301841939458e-05, "Full-pretrain/Loss": 1.9610135555267334, "Full-pretrain/Loss (Raw)": 1.904001235961914, "Full-pretrain/Step": 4913, "Full-pretrain/Step Time": 17.633475098758936} +{"Full-pretrain/Learning Rate": 2.4974527631540403e-05, "Full-pretrain/Loss": 1.9718565940856934, "Full-pretrain/Loss (Raw)": 2.236848831176758, "Full-pretrain/Step": 4914, "Full-pretrain/Step Time": 17.631316285580397} +{"Full-pretrain/Learning Rate": 2.4966036846624447e-05, "Full-pretrain/Loss": 1.9688291549682617, "Full-pretrain/Loss (Raw)": 1.6801013946533203, "Full-pretrain/Step": 4915, "Full-pretrain/Step Time": 17.628908583894372} +{"Full-pretrain/Learning Rate": 2.4957546065626133e-05, "Full-pretrain/Loss": 1.959670066833496, "Full-pretrain/Loss (Raw)": 1.5629539489746094, "Full-pretrain/Step": 4916, "Full-pretrain/Step Time": 17.625142477452755} +{"Full-pretrain/Learning Rate": 2.494905528952486e-05, "Full-pretrain/Loss": 1.9672136306762695, "Full-pretrain/Loss (Raw)": 2.007302761077881, "Full-pretrain/Step": 4917, "Full-pretrain/Step Time": 17.633780542761087} +{"Full-pretrain/Learning Rate": 2.4940564519300038e-05, "Full-pretrain/Loss": 1.9657297134399414, "Full-pretrain/Loss (Raw)": 1.9263266324996948, "Full-pretrain/Step": 4918, "Full-pretrain/Step Time": 17.634211825206876} +{"Full-pretrain/Learning Rate": 2.4932073755931092e-05, "Full-pretrain/Loss": 1.9757704734802246, "Full-pretrain/Loss (Raw)": 2.0891470909118652, "Full-pretrain/Step": 4919, "Full-pretrain/Step Time": 17.626884698867798} +{"Full-pretrain/Learning Rate": 2.49235830003974e-05, "Full-pretrain/Loss": 1.9775934219360352, "Full-pretrain/Loss (Raw)": 2.0171570777893066, "Full-pretrain/Step": 4920, "Full-pretrain/Step Time": 17.620429722592235} +{"Full-pretrain/Learning Rate": 2.4915092253678388e-05, "Full-pretrain/Loss": 1.9746479988098145, "Full-pretrain/Loss (Raw)": 2.062869071960449, "Full-pretrain/Step": 4921, "Full-pretrain/Step Time": 17.622574359178543} +{"Full-pretrain/Learning Rate": 2.490660151675345e-05, "Full-pretrain/Loss": 1.9807647466659546, "Full-pretrain/Loss (Raw)": 2.0277295112609863, "Full-pretrain/Step": 4922, "Full-pretrain/Step Time": 17.62216416373849} +{"Full-pretrain/Learning Rate": 2.4898110790602e-05, "Full-pretrain/Loss": 1.9778964519500732, "Full-pretrain/Loss (Raw)": 1.7713465690612793, "Full-pretrain/Step": 4923, "Full-pretrain/Step Time": 17.62599627673626} +{"Full-pretrain/Learning Rate": 2.4889620076203432e-05, "Full-pretrain/Loss": 1.981558918952942, "Full-pretrain/Loss (Raw)": 2.2001242637634277, "Full-pretrain/Step": 4924, "Full-pretrain/Step Time": 17.61382519453764} +{"Full-pretrain/Learning Rate": 2.488112937453716e-05, "Full-pretrain/Loss": 1.9930307865142822, "Full-pretrain/Loss (Raw)": 2.132205009460449, "Full-pretrain/Step": 4925, "Full-pretrain/Step Time": 17.61537924222648} +{"Full-pretrain/Learning Rate": 2.4872638686582563e-05, "Full-pretrain/Loss": 1.9910379648208618, "Full-pretrain/Loss (Raw)": 1.9065420627593994, "Full-pretrain/Step": 4926, "Full-pretrain/Step Time": 17.618383144959807} +{"Full-pretrain/Learning Rate": 2.4864148013319044e-05, "Full-pretrain/Loss": 2.007171392440796, "Full-pretrain/Loss (Raw)": 2.218507766723633, "Full-pretrain/Step": 4927, "Full-pretrain/Step Time": 17.620566360652447} +{"Full-pretrain/Learning Rate": 2.4855657355726007e-05, "Full-pretrain/Loss": 2.0057291984558105, "Full-pretrain/Loss (Raw)": 1.9960894584655762, "Full-pretrain/Step": 4928, "Full-pretrain/Step Time": 17.613371156156063} +{"Full-pretrain/Learning Rate": 2.4847166714782842e-05, "Full-pretrain/Loss": 1.9970686435699463, "Full-pretrain/Loss (Raw)": 1.7365710735321045, "Full-pretrain/Step": 4929, "Full-pretrain/Step Time": 17.613787600770593} +{"Full-pretrain/Learning Rate": 2.4838676091468954e-05, "Full-pretrain/Loss": 1.9904613494873047, "Full-pretrain/Loss (Raw)": 1.7234787940979004, "Full-pretrain/Step": 4930, "Full-pretrain/Step Time": 17.61624568141997} +{"Full-pretrain/Learning Rate": 2.483018548676371e-05, "Full-pretrain/Loss": 1.9778298139572144, "Full-pretrain/Loss (Raw)": 2.0622925758361816, "Full-pretrain/Step": 4931, "Full-pretrain/Step Time": 17.620936455205083} +{"Full-pretrain/Learning Rate": 2.4821694901646518e-05, "Full-pretrain/Loss": 1.9693565368652344, "Full-pretrain/Loss (Raw)": 1.8027000427246094, "Full-pretrain/Step": 4932, "Full-pretrain/Step Time": 17.614443980157375} +{"Full-pretrain/Learning Rate": 2.481320433709675e-05, "Full-pretrain/Loss": 1.9604800939559937, "Full-pretrain/Loss (Raw)": 1.9629234075546265, "Full-pretrain/Step": 4933, "Full-pretrain/Step Time": 17.61384072341025} +{"Full-pretrain/Learning Rate": 2.4804713794093797e-05, "Full-pretrain/Loss": 1.9592435359954834, "Full-pretrain/Loss (Raw)": 1.9277875423431396, "Full-pretrain/Step": 4934, "Full-pretrain/Step Time": 17.610105587169528} +{"Full-pretrain/Learning Rate": 2.479622327361705e-05, "Full-pretrain/Loss": 1.9573287963867188, "Full-pretrain/Loss (Raw)": 1.9825482368469238, "Full-pretrain/Step": 4935, "Full-pretrain/Step Time": 17.607428580522537} +{"Full-pretrain/Learning Rate": 2.4787732776645865e-05, "Full-pretrain/Loss": 1.9502464532852173, "Full-pretrain/Loss (Raw)": 1.6886515617370605, "Full-pretrain/Step": 4936, "Full-pretrain/Step Time": 17.597162008285522} +{"Full-pretrain/Learning Rate": 2.477924230415963e-05, "Full-pretrain/Loss": 1.9622162580490112, "Full-pretrain/Loss (Raw)": 2.1873888969421387, "Full-pretrain/Step": 4937, "Full-pretrain/Step Time": 17.595318626612425} +{"Full-pretrain/Learning Rate": 2.4770751857137718e-05, "Full-pretrain/Loss": 1.9679591655731201, "Full-pretrain/Loss (Raw)": 2.0713257789611816, "Full-pretrain/Step": 4938, "Full-pretrain/Step Time": 17.59701687283814} +{"Full-pretrain/Learning Rate": 2.47622614365595e-05, "Full-pretrain/Loss": 1.9668269157409668, "Full-pretrain/Loss (Raw)": 1.9297629594802856, "Full-pretrain/Step": 4939, "Full-pretrain/Step Time": 17.597965287044644} +{"Full-pretrain/Learning Rate": 2.475377104340435e-05, "Full-pretrain/Loss": 1.9668476581573486, "Full-pretrain/Loss (Raw)": 1.9144525527954102, "Full-pretrain/Step": 4940, "Full-pretrain/Step Time": 17.591805834323168} +{"Full-pretrain/Learning Rate": 2.4745280678651614e-05, "Full-pretrain/Loss": 1.961230754852295, "Full-pretrain/Loss (Raw)": 2.0467472076416016, "Full-pretrain/Step": 4941, "Full-pretrain/Step Time": 17.58762140199542} +{"Full-pretrain/Learning Rate": 2.4736790343280667e-05, "Full-pretrain/Loss": 1.9604816436767578, "Full-pretrain/Loss (Raw)": 1.9239168167114258, "Full-pretrain/Step": 4942, "Full-pretrain/Step Time": 17.58713073655963} +{"Full-pretrain/Learning Rate": 2.4728300038270854e-05, "Full-pretrain/Loss": 1.9553781747817993, "Full-pretrain/Loss (Raw)": 1.8304924964904785, "Full-pretrain/Step": 4943, "Full-pretrain/Step Time": 17.593440979719162} +{"Full-pretrain/Learning Rate": 2.471980976460154e-05, "Full-pretrain/Loss": 1.9510080814361572, "Full-pretrain/Loss (Raw)": 1.9019672870635986, "Full-pretrain/Step": 4944, "Full-pretrain/Step Time": 17.58739984035492} +{"Full-pretrain/Learning Rate": 2.471131952325207e-05, "Full-pretrain/Loss": 1.9501713514328003, "Full-pretrain/Loss (Raw)": 1.8772262334823608, "Full-pretrain/Step": 4945, "Full-pretrain/Step Time": 17.580159170553088} +{"Full-pretrain/Learning Rate": 2.4702829315201803e-05, "Full-pretrain/Loss": 1.9443230628967285, "Full-pretrain/Loss (Raw)": 2.0497047901153564, "Full-pretrain/Step": 4946, "Full-pretrain/Step Time": 17.584542129188776} +{"Full-pretrain/Learning Rate": 2.4694339141430055e-05, "Full-pretrain/Loss": 1.9545084238052368, "Full-pretrain/Loss (Raw)": 2.006030559539795, "Full-pretrain/Step": 4947, "Full-pretrain/Step Time": 17.59529345855117} +{"Full-pretrain/Learning Rate": 2.4685849002916183e-05, "Full-pretrain/Loss": 1.9673964977264404, "Full-pretrain/Loss (Raw)": 1.97537100315094, "Full-pretrain/Step": 4948, "Full-pretrain/Step Time": 17.590441988781095} +{"Full-pretrain/Learning Rate": 2.4677358900639525e-05, "Full-pretrain/Loss": 1.965417742729187, "Full-pretrain/Loss (Raw)": 1.9439830780029297, "Full-pretrain/Step": 4949, "Full-pretrain/Step Time": 17.58994422480464} +{"Full-pretrain/Learning Rate": 2.4668868835579398e-05, "Full-pretrain/Loss": 1.9722282886505127, "Full-pretrain/Loss (Raw)": 2.144263744354248, "Full-pretrain/Step": 4950, "Full-pretrain/Step Time": 17.590218596160412} +{"Full-pretrain/Learning Rate": 2.4660378808715147e-05, "Full-pretrain/Loss": 1.9694507122039795, "Full-pretrain/Loss (Raw)": 2.0002641677856445, "Full-pretrain/Step": 4951, "Full-pretrain/Step Time": 17.587969593703747} +{"Full-pretrain/Learning Rate": 2.4651888821026065e-05, "Full-pretrain/Loss": 1.9700610637664795, "Full-pretrain/Loss (Raw)": 2.0366873741149902, "Full-pretrain/Step": 4952, "Full-pretrain/Step Time": 17.586591007187963} +{"Full-pretrain/Learning Rate": 2.4643398873491488e-05, "Full-pretrain/Loss": 1.9712204933166504, "Full-pretrain/Loss (Raw)": 2.099972724914551, "Full-pretrain/Step": 4953, "Full-pretrain/Step Time": 17.579715522006154} +{"Full-pretrain/Learning Rate": 2.4634908967090725e-05, "Full-pretrain/Loss": 1.9729660749435425, "Full-pretrain/Loss (Raw)": 2.083587646484375, "Full-pretrain/Step": 4954, "Full-pretrain/Step Time": 17.57919192314148} +{"Full-pretrain/Learning Rate": 2.4626419102803085e-05, "Full-pretrain/Loss": 1.988548755645752, "Full-pretrain/Loss (Raw)": 2.269991874694824, "Full-pretrain/Step": 4955, "Full-pretrain/Step Time": 17.57797321304679} +{"Full-pretrain/Learning Rate": 2.4617929281607883e-05, "Full-pretrain/Loss": 1.9785776138305664, "Full-pretrain/Loss (Raw)": 1.8810478448867798, "Full-pretrain/Step": 4956, "Full-pretrain/Step Time": 17.583622170612216} +{"Full-pretrain/Learning Rate": 2.4609439504484392e-05, "Full-pretrain/Loss": 1.9696403741836548, "Full-pretrain/Loss (Raw)": 1.846216082572937, "Full-pretrain/Step": 4957, "Full-pretrain/Step Time": 17.584070479497313} +{"Full-pretrain/Learning Rate": 2.460094977241192e-05, "Full-pretrain/Loss": 1.9773120880126953, "Full-pretrain/Loss (Raw)": 2.152035713195801, "Full-pretrain/Step": 4958, "Full-pretrain/Step Time": 17.582846647128463} +{"Full-pretrain/Learning Rate": 2.4592460086369747e-05, "Full-pretrain/Loss": 1.9627385139465332, "Full-pretrain/Loss (Raw)": 1.752151608467102, "Full-pretrain/Step": 4959, "Full-pretrain/Step Time": 17.578657902777195} +{"Full-pretrain/Learning Rate": 2.4583970447337163e-05, "Full-pretrain/Loss": 1.970766305923462, "Full-pretrain/Loss (Raw)": 2.252981662750244, "Full-pretrain/Step": 4960, "Full-pretrain/Step Time": 17.57623620890081} +{"Full-pretrain/Learning Rate": 2.4575480856293447e-05, "Full-pretrain/Loss": 1.9839369058609009, "Full-pretrain/Loss (Raw)": 2.1580307483673096, "Full-pretrain/Step": 4961, "Full-pretrain/Step Time": 17.571894094347954} +{"Full-pretrain/Learning Rate": 2.456699131421786e-05, "Full-pretrain/Loss": 1.992607593536377, "Full-pretrain/Loss (Raw)": 2.000943183898926, "Full-pretrain/Step": 4962, "Full-pretrain/Step Time": 17.56990235671401} +{"Full-pretrain/Learning Rate": 2.4558501822089668e-05, "Full-pretrain/Loss": 1.9896843433380127, "Full-pretrain/Loss (Raw)": 1.968747615814209, "Full-pretrain/Step": 4963, "Full-pretrain/Step Time": 17.567405300214887} +{"Full-pretrain/Learning Rate": 2.4550012380888138e-05, "Full-pretrain/Loss": 1.9964368343353271, "Full-pretrain/Loss (Raw)": 2.018778085708618, "Full-pretrain/Step": 4964, "Full-pretrain/Step Time": 17.568119382485747} +{"Full-pretrain/Learning Rate": 2.454152299159253e-05, "Full-pretrain/Loss": 1.993213415145874, "Full-pretrain/Loss (Raw)": 1.8597716093063354, "Full-pretrain/Step": 4965, "Full-pretrain/Step Time": 17.571059739217162} +{"Full-pretrain/Learning Rate": 2.4533033655182072e-05, "Full-pretrain/Loss": 1.9979784488677979, "Full-pretrain/Loss (Raw)": 2.0802700519561768, "Full-pretrain/Step": 4966, "Full-pretrain/Step Time": 17.573223473504186} +{"Full-pretrain/Learning Rate": 2.4524544372636034e-05, "Full-pretrain/Loss": 1.9926977157592773, "Full-pretrain/Loss (Raw)": 1.8135673999786377, "Full-pretrain/Step": 4967, "Full-pretrain/Step Time": 17.57503035478294} +{"Full-pretrain/Learning Rate": 2.4516055144933623e-05, "Full-pretrain/Loss": 1.995436191558838, "Full-pretrain/Loss (Raw)": 1.7762773036956787, "Full-pretrain/Step": 4968, "Full-pretrain/Step Time": 17.57704672962427} +{"Full-pretrain/Learning Rate": 2.450756597305408e-05, "Full-pretrain/Loss": 1.9898210763931274, "Full-pretrain/Loss (Raw)": 2.0077083110809326, "Full-pretrain/Step": 4969, "Full-pretrain/Step Time": 17.572216080501676} +{"Full-pretrain/Learning Rate": 2.4499076857976628e-05, "Full-pretrain/Loss": 1.9856939315795898, "Full-pretrain/Loss (Raw)": 1.9392554759979248, "Full-pretrain/Step": 4970, "Full-pretrain/Step Time": 17.56992864049971} +{"Full-pretrain/Learning Rate": 2.4490587800680486e-05, "Full-pretrain/Loss": 1.985320806503296, "Full-pretrain/Loss (Raw)": 1.9178210496902466, "Full-pretrain/Step": 4971, "Full-pretrain/Step Time": 17.569980988278985} +{"Full-pretrain/Learning Rate": 2.4482098802144872e-05, "Full-pretrain/Loss": 1.989671230316162, "Full-pretrain/Loss (Raw)": 2.0536651611328125, "Full-pretrain/Step": 4972, "Full-pretrain/Step Time": 17.570287249982357} +{"Full-pretrain/Learning Rate": 2.447360986334897e-05, "Full-pretrain/Loss": 1.985548973083496, "Full-pretrain/Loss (Raw)": 1.9148374795913696, "Full-pretrain/Step": 4973, "Full-pretrain/Step Time": 17.56586902588606} +{"Full-pretrain/Learning Rate": 2.446512098527199e-05, "Full-pretrain/Loss": 1.9962232112884521, "Full-pretrain/Loss (Raw)": 2.2654943466186523, "Full-pretrain/Step": 4974, "Full-pretrain/Step Time": 17.568130988627672} +{"Full-pretrain/Learning Rate": 2.445663216889311e-05, "Full-pretrain/Loss": 1.996154546737671, "Full-pretrain/Loss (Raw)": 1.828291654586792, "Full-pretrain/Step": 4975, "Full-pretrain/Step Time": 17.56535559333861} +{"Full-pretrain/Learning Rate": 2.444814341519152e-05, "Full-pretrain/Loss": 2.0016939640045166, "Full-pretrain/Loss (Raw)": 2.0792298316955566, "Full-pretrain/Step": 4976, "Full-pretrain/Step Time": 17.559663474559784} +{"Full-pretrain/Learning Rate": 2.44396547251464e-05, "Full-pretrain/Loss": 2.0081048011779785, "Full-pretrain/Loss (Raw)": 2.082364559173584, "Full-pretrain/Step": 4977, "Full-pretrain/Step Time": 17.556496212258935} +{"Full-pretrain/Learning Rate": 2.4431166099736908e-05, "Full-pretrain/Loss": 2.0005273818969727, "Full-pretrain/Loss (Raw)": 1.8072357177734375, "Full-pretrain/Step": 4978, "Full-pretrain/Step Time": 17.557843945920467} +{"Full-pretrain/Learning Rate": 2.44226775399422e-05, "Full-pretrain/Loss": 1.995872139930725, "Full-pretrain/Loss (Raw)": 1.8570616245269775, "Full-pretrain/Step": 4979, "Full-pretrain/Step Time": 17.55911876820028} +{"Full-pretrain/Learning Rate": 2.4414189046741437e-05, "Full-pretrain/Loss": 2.001016616821289, "Full-pretrain/Loss (Raw)": 2.139991283416748, "Full-pretrain/Step": 4980, "Full-pretrain/Step Time": 17.562470015138388} +{"Full-pretrain/Learning Rate": 2.440570062111376e-05, "Full-pretrain/Loss": 1.9832627773284912, "Full-pretrain/Loss (Raw)": 1.3758620023727417, "Full-pretrain/Step": 4981, "Full-pretrain/Step Time": 17.563422759994864} +{"Full-pretrain/Learning Rate": 2.4397212264038313e-05, "Full-pretrain/Loss": 1.974705457687378, "Full-pretrain/Loss (Raw)": 1.8704302310943604, "Full-pretrain/Step": 4982, "Full-pretrain/Step Time": 17.561238318681717} +{"Full-pretrain/Learning Rate": 2.438872397649422e-05, "Full-pretrain/Loss": 1.9794487953186035, "Full-pretrain/Loss (Raw)": 2.152052879333496, "Full-pretrain/Step": 4983, "Full-pretrain/Step Time": 17.565963534638286} +{"Full-pretrain/Learning Rate": 2.4380235759460603e-05, "Full-pretrain/Loss": 1.977080225944519, "Full-pretrain/Loss (Raw)": 1.9608925580978394, "Full-pretrain/Step": 4984, "Full-pretrain/Step Time": 17.563859371468425} +{"Full-pretrain/Learning Rate": 2.4371747613916566e-05, "Full-pretrain/Loss": 1.9726394414901733, "Full-pretrain/Loss (Raw)": 1.9578694105148315, "Full-pretrain/Step": 4985, "Full-pretrain/Step Time": 17.564015513285995} +{"Full-pretrain/Learning Rate": 2.4363259540841222e-05, "Full-pretrain/Loss": 1.9697285890579224, "Full-pretrain/Loss (Raw)": 1.9904396533966064, "Full-pretrain/Step": 4986, "Full-pretrain/Step Time": 17.56399683840573} +{"Full-pretrain/Learning Rate": 2.4354771541213663e-05, "Full-pretrain/Loss": 1.9615352153778076, "Full-pretrain/Loss (Raw)": 2.0078067779541016, "Full-pretrain/Step": 4987, "Full-pretrain/Step Time": 17.56597196869552} +{"Full-pretrain/Learning Rate": 2.4346283616012996e-05, "Full-pretrain/Loss": 1.964815616607666, "Full-pretrain/Loss (Raw)": 1.9860175848007202, "Full-pretrain/Step": 4988, "Full-pretrain/Step Time": 17.56403890438378} +{"Full-pretrain/Learning Rate": 2.433779576621827e-05, "Full-pretrain/Loss": 1.972944974899292, "Full-pretrain/Loss (Raw)": 2.1063578128814697, "Full-pretrain/Step": 4989, "Full-pretrain/Step Time": 17.564472548663616} +{"Full-pretrain/Learning Rate": 2.432930799280857e-05, "Full-pretrain/Loss": 1.9598268270492554, "Full-pretrain/Loss (Raw)": 1.7322520017623901, "Full-pretrain/Step": 4990, "Full-pretrain/Step Time": 17.56696492433548} +{"Full-pretrain/Learning Rate": 2.4320820296762964e-05, "Full-pretrain/Loss": 1.9699287414550781, "Full-pretrain/Loss (Raw)": 2.0754170417785645, "Full-pretrain/Step": 4991, "Full-pretrain/Step Time": 17.569113474339247} +{"Full-pretrain/Learning Rate": 2.431233267906049e-05, "Full-pretrain/Loss": 1.9543085098266602, "Full-pretrain/Loss (Raw)": 1.7531319856643677, "Full-pretrain/Step": 4992, "Full-pretrain/Step Time": 17.56938958913088} +{"Full-pretrain/Learning Rate": 2.4303845140680215e-05, "Full-pretrain/Loss": 1.9388811588287354, "Full-pretrain/Loss (Raw)": 1.6643515825271606, "Full-pretrain/Step": 4993, "Full-pretrain/Step Time": 17.569581100717187} +{"Full-pretrain/Learning Rate": 2.429535768260115e-05, "Full-pretrain/Loss": 1.9444284439086914, "Full-pretrain/Loss (Raw)": 2.1784615516662598, "Full-pretrain/Step": 4994, "Full-pretrain/Step Time": 17.567450515925884} +{"Full-pretrain/Learning Rate": 2.428687030580232e-05, "Full-pretrain/Loss": 1.9344865083694458, "Full-pretrain/Loss (Raw)": 1.6506037712097168, "Full-pretrain/Step": 4995, "Full-pretrain/Step Time": 17.569650961086154} +{"Full-pretrain/Learning Rate": 2.4278383011262755e-05, "Full-pretrain/Loss": 1.9372358322143555, "Full-pretrain/Loss (Raw)": 2.106759548187256, "Full-pretrain/Step": 4996, "Full-pretrain/Step Time": 17.566743964329362} +{"Full-pretrain/Learning Rate": 2.4269895799961452e-05, "Full-pretrain/Loss": 1.9365870952606201, "Full-pretrain/Loss (Raw)": 1.8390085697174072, "Full-pretrain/Step": 4997, "Full-pretrain/Step Time": 17.56340934149921} +{"Full-pretrain/Learning Rate": 2.4261408672877427e-05, "Full-pretrain/Loss": 1.9335029125213623, "Full-pretrain/Loss (Raw)": 1.9815768003463745, "Full-pretrain/Step": 4998, "Full-pretrain/Step Time": 17.57017963193357} +{"Full-pretrain/Learning Rate": 2.425292163098964e-05, "Full-pretrain/Loss": 1.9311071634292603, "Full-pretrain/Loss (Raw)": 1.7369025945663452, "Full-pretrain/Step": 4999, "Full-pretrain/Step Time": 17.57108818553388} +{"Full-pretrain/Learning Rate": 2.4244434675277082e-05, "Full-pretrain/Loss": 1.9342783689498901, "Full-pretrain/Loss (Raw)": 1.8777587413787842, "Full-pretrain/Step": 5000, "Full-pretrain/Step Time": 17.56445954181254} +{"Full-pretrain/Learning Rate": 2.4235947806718717e-05, "Full-pretrain/Loss": 1.926575779914856, "Full-pretrain/Loss (Raw)": 1.7612234354019165, "Full-pretrain/Step": 5001, "Full-pretrain/Step Time": 18.760856196284294} +{"Full-pretrain/Learning Rate": 2.4227461026293503e-05, "Full-pretrain/Loss": 1.923930287361145, "Full-pretrain/Loss (Raw)": 1.8546006679534912, "Full-pretrain/Step": 5002, "Full-pretrain/Step Time": 18.760673521086574} +{"Full-pretrain/Learning Rate": 2.421897433498039e-05, "Full-pretrain/Loss": 1.9178354740142822, "Full-pretrain/Loss (Raw)": 1.7227847576141357, "Full-pretrain/Step": 5003, "Full-pretrain/Step Time": 18.765644611790776} +{"Full-pretrain/Learning Rate": 2.4210487733758326e-05, "Full-pretrain/Loss": 1.9145891666412354, "Full-pretrain/Loss (Raw)": 1.9497870206832886, "Full-pretrain/Step": 5004, "Full-pretrain/Step Time": 18.757916091009974} +{"Full-pretrain/Learning Rate": 2.4202001223606208e-05, "Full-pretrain/Loss": 1.9097099304199219, "Full-pretrain/Loss (Raw)": 1.7587025165557861, "Full-pretrain/Step": 5005, "Full-pretrain/Step Time": 18.759938975796103} +{"Full-pretrain/Learning Rate": 2.419351480550297e-05, "Full-pretrain/Loss": 1.892259120941162, "Full-pretrain/Loss (Raw)": 1.7070647478103638, "Full-pretrain/Step": 5006, "Full-pretrain/Step Time": 18.761383943259716} +{"Full-pretrain/Learning Rate": 2.4185028480427523e-05, "Full-pretrain/Loss": 1.8951094150543213, "Full-pretrain/Loss (Raw)": 1.9195048809051514, "Full-pretrain/Step": 5007, "Full-pretrain/Step Time": 18.764886481687427} +{"Full-pretrain/Learning Rate": 2.4176542249358747e-05, "Full-pretrain/Loss": 1.898006796836853, "Full-pretrain/Loss (Raw)": 2.1719436645507812, "Full-pretrain/Step": 5008, "Full-pretrain/Step Time": 18.76668732985854} +{"Full-pretrain/Learning Rate": 2.4168056113275545e-05, "Full-pretrain/Loss": 1.8955934047698975, "Full-pretrain/Loss (Raw)": 2.0051357746124268, "Full-pretrain/Step": 5009, "Full-pretrain/Step Time": 18.76387489400804} +{"Full-pretrain/Learning Rate": 2.4159570073156765e-05, "Full-pretrain/Loss": 1.8970515727996826, "Full-pretrain/Loss (Raw)": 1.8539000749588013, "Full-pretrain/Step": 5010, "Full-pretrain/Step Time": 18.772083023563027} +{"Full-pretrain/Learning Rate": 2.4151084129981285e-05, "Full-pretrain/Loss": 1.9006098508834839, "Full-pretrain/Loss (Raw)": 1.9709240198135376, "Full-pretrain/Step": 5011, "Full-pretrain/Step Time": 18.76740274950862} +{"Full-pretrain/Learning Rate": 2.414259828472795e-05, "Full-pretrain/Loss": 1.909019947052002, "Full-pretrain/Loss (Raw)": 2.4091129302978516, "Full-pretrain/Step": 5012, "Full-pretrain/Step Time": 18.765124917030334} +{"Full-pretrain/Learning Rate": 2.4134112538375604e-05, "Full-pretrain/Loss": 1.9286786317825317, "Full-pretrain/Loss (Raw)": 2.0049400329589844, "Full-pretrain/Step": 5013, "Full-pretrain/Step Time": 18.761863375082612} +{"Full-pretrain/Learning Rate": 2.412562689190308e-05, "Full-pretrain/Loss": 1.9303250312805176, "Full-pretrain/Loss (Raw)": 1.9231154918670654, "Full-pretrain/Step": 5014, "Full-pretrain/Step Time": 18.763385387137532} +{"Full-pretrain/Learning Rate": 2.4117141346289175e-05, "Full-pretrain/Loss": 1.9224985837936401, "Full-pretrain/Loss (Raw)": 1.9016058444976807, "Full-pretrain/Step": 5015, "Full-pretrain/Step Time": 18.763302570208907} +{"Full-pretrain/Learning Rate": 2.4108655902512713e-05, "Full-pretrain/Loss": 1.9311715364456177, "Full-pretrain/Loss (Raw)": 2.2384276390075684, "Full-pretrain/Step": 5016, "Full-pretrain/Step Time": 18.768180824816227} +{"Full-pretrain/Learning Rate": 2.4100170561552478e-05, "Full-pretrain/Loss": 1.9238492250442505, "Full-pretrain/Loss (Raw)": 1.7235536575317383, "Full-pretrain/Step": 5017, "Full-pretrain/Step Time": 18.764692032709718} +{"Full-pretrain/Learning Rate": 2.4091685324387246e-05, "Full-pretrain/Loss": 1.9264297485351562, "Full-pretrain/Loss (Raw)": 2.0730161666870117, "Full-pretrain/Step": 5018, "Full-pretrain/Step Time": 18.76601209677756} +{"Full-pretrain/Learning Rate": 2.408320019199581e-05, "Full-pretrain/Loss": 1.9130830764770508, "Full-pretrain/Loss (Raw)": 1.5807147026062012, "Full-pretrain/Step": 5019, "Full-pretrain/Step Time": 18.759309977293015} +{"Full-pretrain/Learning Rate": 2.4074715165356894e-05, "Full-pretrain/Loss": 1.9135679006576538, "Full-pretrain/Loss (Raw)": 2.001533269882202, "Full-pretrain/Step": 5020, "Full-pretrain/Step Time": 18.76654714345932} +{"Full-pretrain/Learning Rate": 2.406623024544926e-05, "Full-pretrain/Loss": 1.9051027297973633, "Full-pretrain/Loss (Raw)": 1.8354719877243042, "Full-pretrain/Step": 5021, "Full-pretrain/Step Time": 18.77278906479478} +{"Full-pretrain/Learning Rate": 2.4057745433251635e-05, "Full-pretrain/Loss": 1.913172721862793, "Full-pretrain/Loss (Raw)": 1.990495204925537, "Full-pretrain/Step": 5022, "Full-pretrain/Step Time": 18.768402621150017} +{"Full-pretrain/Learning Rate": 2.4049260729742748e-05, "Full-pretrain/Loss": 1.9111590385437012, "Full-pretrain/Loss (Raw)": 2.010977268218994, "Full-pretrain/Step": 5023, "Full-pretrain/Step Time": 18.76973883062601} +{"Full-pretrain/Learning Rate": 2.4040776135901306e-05, "Full-pretrain/Loss": 1.9151259660720825, "Full-pretrain/Loss (Raw)": 1.88007390499115, "Full-pretrain/Step": 5024, "Full-pretrain/Step Time": 18.766809232532978} +{"Full-pretrain/Learning Rate": 2.4032291652706e-05, "Full-pretrain/Loss": 1.93035089969635, "Full-pretrain/Loss (Raw)": 2.1515471935272217, "Full-pretrain/Step": 5025, "Full-pretrain/Step Time": 18.767003145068884} +{"Full-pretrain/Learning Rate": 2.402380728113551e-05, "Full-pretrain/Loss": 1.928365707397461, "Full-pretrain/Loss (Raw)": 2.1149375438690186, "Full-pretrain/Step": 5026, "Full-pretrain/Step Time": 18.76686565205455} +{"Full-pretrain/Learning Rate": 2.4015323022168505e-05, "Full-pretrain/Loss": 1.939521312713623, "Full-pretrain/Loss (Raw)": 2.007584571838379, "Full-pretrain/Step": 5027, "Full-pretrain/Step Time": 18.76770099811256} +{"Full-pretrain/Learning Rate": 2.400683887678364e-05, "Full-pretrain/Loss": 1.9276385307312012, "Full-pretrain/Loss (Raw)": 1.7265084981918335, "Full-pretrain/Step": 5028, "Full-pretrain/Step Time": 18.761077346280217} +{"Full-pretrain/Learning Rate": 2.3998354845959565e-05, "Full-pretrain/Loss": 1.9336531162261963, "Full-pretrain/Loss (Raw)": 2.0314745903015137, "Full-pretrain/Step": 5029, "Full-pretrain/Step Time": 18.76315095834434} +{"Full-pretrain/Learning Rate": 2.3989870930674913e-05, "Full-pretrain/Loss": 1.933305025100708, "Full-pretrain/Loss (Raw)": 1.9704375267028809, "Full-pretrain/Step": 5030, "Full-pretrain/Step Time": 18.763656049966812} +{"Full-pretrain/Learning Rate": 2.3981387131908287e-05, "Full-pretrain/Loss": 1.936227798461914, "Full-pretrain/Loss (Raw)": 1.8304333686828613, "Full-pretrain/Step": 5031, "Full-pretrain/Step Time": 18.759574545547366} +{"Full-pretrain/Learning Rate": 2.3972903450638296e-05, "Full-pretrain/Loss": 1.9426555633544922, "Full-pretrain/Loss (Raw)": 2.0834438800811768, "Full-pretrain/Step": 5032, "Full-pretrain/Step Time": 18.760061955079436} +{"Full-pretrain/Learning Rate": 2.3964419887843536e-05, "Full-pretrain/Loss": 1.954615831375122, "Full-pretrain/Loss (Raw)": 2.143948554992676, "Full-pretrain/Step": 5033, "Full-pretrain/Step Time": 18.75818188302219} +{"Full-pretrain/Learning Rate": 2.3955936444502573e-05, "Full-pretrain/Loss": 1.9681512117385864, "Full-pretrain/Loss (Raw)": 2.2877354621887207, "Full-pretrain/Step": 5034, "Full-pretrain/Step Time": 18.759125428274274} +{"Full-pretrain/Learning Rate": 2.3947453121593984e-05, "Full-pretrain/Loss": 1.9812867641448975, "Full-pretrain/Loss (Raw)": 2.1431241035461426, "Full-pretrain/Step": 5035, "Full-pretrain/Step Time": 18.76360377855599} +{"Full-pretrain/Learning Rate": 2.39389699200963e-05, "Full-pretrain/Loss": 1.9775515794754028, "Full-pretrain/Loss (Raw)": 1.8302578926086426, "Full-pretrain/Step": 5036, "Full-pretrain/Step Time": 18.763325130566955} +{"Full-pretrain/Learning Rate": 2.393048684098806e-05, "Full-pretrain/Loss": 1.986407995223999, "Full-pretrain/Loss (Raw)": 2.0421104431152344, "Full-pretrain/Step": 5037, "Full-pretrain/Step Time": 18.76197218708694} +{"Full-pretrain/Learning Rate": 2.3922003885247788e-05, "Full-pretrain/Loss": 1.9931833744049072, "Full-pretrain/Loss (Raw)": 1.9238768815994263, "Full-pretrain/Step": 5038, "Full-pretrain/Step Time": 18.75923064723611} +{"Full-pretrain/Learning Rate": 2.3913521053853987e-05, "Full-pretrain/Loss": 1.9957188367843628, "Full-pretrain/Loss (Raw)": 2.000640869140625, "Full-pretrain/Step": 5039, "Full-pretrain/Step Time": 18.761961076408625} +{"Full-pretrain/Learning Rate": 2.3905038347785165e-05, "Full-pretrain/Loss": 1.9847445487976074, "Full-pretrain/Loss (Raw)": 1.8207648992538452, "Full-pretrain/Step": 5040, "Full-pretrain/Step Time": 18.763373067602515} +{"Full-pretrain/Learning Rate": 2.389655576801977e-05, "Full-pretrain/Loss": 1.9812954664230347, "Full-pretrain/Loss (Raw)": 1.894768476486206, "Full-pretrain/Step": 5041, "Full-pretrain/Step Time": 18.763520186766982} +{"Full-pretrain/Learning Rate": 2.3888073315536285e-05, "Full-pretrain/Loss": 1.995693325996399, "Full-pretrain/Loss (Raw)": 2.314634084701538, "Full-pretrain/Step": 5042, "Full-pretrain/Step Time": 18.768894713371992} +{"Full-pretrain/Learning Rate": 2.387959099131315e-05, "Full-pretrain/Loss": 1.9941744804382324, "Full-pretrain/Loss (Raw)": 1.922318696975708, "Full-pretrain/Step": 5043, "Full-pretrain/Step Time": 18.76710106432438} +{"Full-pretrain/Learning Rate": 2.38711087963288e-05, "Full-pretrain/Loss": 1.986655831336975, "Full-pretrain/Loss (Raw)": 2.16851544380188, "Full-pretrain/Step": 5044, "Full-pretrain/Step Time": 18.77014877460897} +{"Full-pretrain/Learning Rate": 2.386262673156165e-05, "Full-pretrain/Loss": 1.9758034944534302, "Full-pretrain/Loss (Raw)": 1.6576648950576782, "Full-pretrain/Step": 5045, "Full-pretrain/Step Time": 18.766300596296787} +{"Full-pretrain/Learning Rate": 2.3854144797990122e-05, "Full-pretrain/Loss": 1.9768353700637817, "Full-pretrain/Loss (Raw)": 1.9561386108398438, "Full-pretrain/Step": 5046, "Full-pretrain/Step Time": 18.770951444283128} +{"Full-pretrain/Learning Rate": 2.3845662996592576e-05, "Full-pretrain/Loss": 1.9831173419952393, "Full-pretrain/Loss (Raw)": 2.1026248931884766, "Full-pretrain/Step": 5047, "Full-pretrain/Step Time": 18.773707050830126} +{"Full-pretrain/Learning Rate": 2.38371813283474e-05, "Full-pretrain/Loss": 1.9785341024398804, "Full-pretrain/Loss (Raw)": 2.091763973236084, "Full-pretrain/Step": 5048, "Full-pretrain/Step Time": 18.777134586125612} +{"Full-pretrain/Learning Rate": 2.382869979423295e-05, "Full-pretrain/Loss": 1.989818811416626, "Full-pretrain/Loss (Raw)": 2.0846614837646484, "Full-pretrain/Step": 5049, "Full-pretrain/Step Time": 18.776635656133294} +{"Full-pretrain/Learning Rate": 2.3820218395227567e-05, "Full-pretrain/Loss": 1.9945001602172852, "Full-pretrain/Loss (Raw)": 2.2228198051452637, "Full-pretrain/Step": 5050, "Full-pretrain/Step Time": 18.776762494817376} +{"Full-pretrain/Learning Rate": 2.3811737132309584e-05, "Full-pretrain/Loss": 2.0001707077026367, "Full-pretrain/Loss (Raw)": 1.7621755599975586, "Full-pretrain/Step": 5051, "Full-pretrain/Step Time": 18.772604947909713} +{"Full-pretrain/Learning Rate": 2.3803256006457297e-05, "Full-pretrain/Loss": 1.9992802143096924, "Full-pretrain/Loss (Raw)": 1.973032832145691, "Full-pretrain/Step": 5052, "Full-pretrain/Step Time": 18.78121662698686} +{"Full-pretrain/Learning Rate": 2.3794775018649005e-05, "Full-pretrain/Loss": 2.010221242904663, "Full-pretrain/Loss (Raw)": 2.185586929321289, "Full-pretrain/Step": 5053, "Full-pretrain/Step Time": 18.774658804759383} +{"Full-pretrain/Learning Rate": 2.3786294169862998e-05, "Full-pretrain/Loss": 1.9985153675079346, "Full-pretrain/Loss (Raw)": 1.6159076690673828, "Full-pretrain/Step": 5054, "Full-pretrain/Step Time": 18.77685498446226} +{"Full-pretrain/Learning Rate": 2.3777813461077526e-05, "Full-pretrain/Loss": 1.9968560934066772, "Full-pretrain/Loss (Raw)": 1.9578794240951538, "Full-pretrain/Step": 5055, "Full-pretrain/Step Time": 18.77653825841844} +{"Full-pretrain/Learning Rate": 2.3769332893270853e-05, "Full-pretrain/Loss": 1.9956579208374023, "Full-pretrain/Loss (Raw)": 1.841728687286377, "Full-pretrain/Step": 5056, "Full-pretrain/Step Time": 18.781568098813295} +{"Full-pretrain/Learning Rate": 2.376085246742119e-05, "Full-pretrain/Loss": 1.9889295101165771, "Full-pretrain/Loss (Raw)": 1.9362449645996094, "Full-pretrain/Step": 5057, "Full-pretrain/Step Time": 18.784012511372566} +{"Full-pretrain/Learning Rate": 2.3752372184506764e-05, "Full-pretrain/Loss": 1.9899308681488037, "Full-pretrain/Loss (Raw)": 2.1469743251800537, "Full-pretrain/Step": 5058, "Full-pretrain/Step Time": 18.777334781363606} +{"Full-pretrain/Learning Rate": 2.3743892045505764e-05, "Full-pretrain/Loss": 1.9966269731521606, "Full-pretrain/Loss (Raw)": 2.2218642234802246, "Full-pretrain/Step": 5059, "Full-pretrain/Step Time": 18.779897740110755} +{"Full-pretrain/Learning Rate": 2.3735412051396376e-05, "Full-pretrain/Loss": 2.0094170570373535, "Full-pretrain/Loss (Raw)": 2.1357924938201904, "Full-pretrain/Step": 5060, "Full-pretrain/Step Time": 18.778242953121662} +{"Full-pretrain/Learning Rate": 2.3726932203156772e-05, "Full-pretrain/Loss": 2.0100862979888916, "Full-pretrain/Loss (Raw)": 2.052889823913574, "Full-pretrain/Step": 5061, "Full-pretrain/Step Time": 18.781055530533195} +{"Full-pretrain/Learning Rate": 2.3718452501765078e-05, "Full-pretrain/Loss": 2.003896713256836, "Full-pretrain/Loss (Raw)": 1.7723658084869385, "Full-pretrain/Step": 5062, "Full-pretrain/Step Time": 18.78205731138587} +{"Full-pretrain/Learning Rate": 2.370997294819944e-05, "Full-pretrain/Loss": 2.003498077392578, "Full-pretrain/Loss (Raw)": 1.8176803588867188, "Full-pretrain/Step": 5063, "Full-pretrain/Step Time": 18.784658828750253} +{"Full-pretrain/Learning Rate": 2.370149354343797e-05, "Full-pretrain/Loss": 1.995785117149353, "Full-pretrain/Loss (Raw)": 1.8366297483444214, "Full-pretrain/Step": 5064, "Full-pretrain/Step Time": 18.782917197793722} +{"Full-pretrain/Learning Rate": 2.369301428845876e-05, "Full-pretrain/Loss": 1.9808001518249512, "Full-pretrain/Loss (Raw)": 1.6644306182861328, "Full-pretrain/Step": 5065, "Full-pretrain/Step Time": 18.792752915993333} +{"Full-pretrain/Learning Rate": 2.36845351842399e-05, "Full-pretrain/Loss": 1.9719114303588867, "Full-pretrain/Loss (Raw)": 2.003293514251709, "Full-pretrain/Step": 5066, "Full-pretrain/Step Time": 18.79636009223759} +{"Full-pretrain/Learning Rate": 2.3676056231759448e-05, "Full-pretrain/Loss": 1.9710575342178345, "Full-pretrain/Loss (Raw)": 2.1158053874969482, "Full-pretrain/Step": 5067, "Full-pretrain/Step Time": 18.798597602173686} +{"Full-pretrain/Learning Rate": 2.366757743199544e-05, "Full-pretrain/Loss": 1.9756574630737305, "Full-pretrain/Loss (Raw)": 1.977452278137207, "Full-pretrain/Step": 5068, "Full-pretrain/Step Time": 18.798953318968415} +{"Full-pretrain/Learning Rate": 2.36590987859259e-05, "Full-pretrain/Loss": 1.9730808734893799, "Full-pretrain/Loss (Raw)": 1.9596588611602783, "Full-pretrain/Step": 5069, "Full-pretrain/Step Time": 18.805661907419562} +{"Full-pretrain/Learning Rate": 2.3650620294528848e-05, "Full-pretrain/Loss": 1.9735307693481445, "Full-pretrain/Loss (Raw)": 1.9382725954055786, "Full-pretrain/Step": 5070, "Full-pretrain/Step Time": 18.804145203903317} +{"Full-pretrain/Learning Rate": 2.364214195878227e-05, "Full-pretrain/Loss": 1.9809362888336182, "Full-pretrain/Loss (Raw)": 2.237618923187256, "Full-pretrain/Step": 5071, "Full-pretrain/Step Time": 18.798932245001197} +{"Full-pretrain/Learning Rate": 2.3633663779664147e-05, "Full-pretrain/Loss": 1.987963080406189, "Full-pretrain/Loss (Raw)": 2.045623779296875, "Full-pretrain/Step": 5072, "Full-pretrain/Step Time": 18.794440621510148} +{"Full-pretrain/Learning Rate": 2.362518575815242e-05, "Full-pretrain/Loss": 1.9886939525604248, "Full-pretrain/Loss (Raw)": 1.9181512594223022, "Full-pretrain/Step": 5073, "Full-pretrain/Step Time": 18.800971381366253} +{"Full-pretrain/Learning Rate": 2.3616707895225032e-05, "Full-pretrain/Loss": 1.9909472465515137, "Full-pretrain/Loss (Raw)": 2.386744976043701, "Full-pretrain/Step": 5074, "Full-pretrain/Step Time": 18.801113734021783} +{"Full-pretrain/Learning Rate": 2.3608230191859906e-05, "Full-pretrain/Loss": 1.9844681024551392, "Full-pretrain/Loss (Raw)": 1.7149847745895386, "Full-pretrain/Step": 5075, "Full-pretrain/Step Time": 18.794470170512795} +{"Full-pretrain/Learning Rate": 2.3599752649034933e-05, "Full-pretrain/Loss": 1.9764924049377441, "Full-pretrain/Loss (Raw)": 1.9132936000823975, "Full-pretrain/Step": 5076, "Full-pretrain/Step Time": 18.7971323877573} +{"Full-pretrain/Learning Rate": 2.3591275267728013e-05, "Full-pretrain/Loss": 1.9904003143310547, "Full-pretrain/Loss (Raw)": 2.102721691131592, "Full-pretrain/Step": 5077, "Full-pretrain/Step Time": 18.797855522483587} +{"Full-pretrain/Learning Rate": 2.358279804891698e-05, "Full-pretrain/Loss": 2.0028040409088135, "Full-pretrain/Loss (Raw)": 2.353053569793701, "Full-pretrain/Step": 5078, "Full-pretrain/Step Time": 18.79715260863304} +{"Full-pretrain/Learning Rate": 2.35743209935797e-05, "Full-pretrain/Loss": 1.993345022201538, "Full-pretrain/Loss (Raw)": 1.7999403476715088, "Full-pretrain/Step": 5079, "Full-pretrain/Step Time": 18.804404441267252} +{"Full-pretrain/Learning Rate": 2.356584410269399e-05, "Full-pretrain/Loss": 1.987634539604187, "Full-pretrain/Loss (Raw)": 1.9090250730514526, "Full-pretrain/Step": 5080, "Full-pretrain/Step Time": 18.80470861494541} +{"Full-pretrain/Learning Rate": 2.355736737723766e-05, "Full-pretrain/Loss": 1.982506513595581, "Full-pretrain/Loss (Raw)": 1.920568585395813, "Full-pretrain/Step": 5081, "Full-pretrain/Step Time": 18.805421732366085} +{"Full-pretrain/Learning Rate": 2.3548890818188497e-05, "Full-pretrain/Loss": 1.9640251398086548, "Full-pretrain/Loss (Raw)": 1.6314128637313843, "Full-pretrain/Step": 5082, "Full-pretrain/Step Time": 18.815266896039248} +{"Full-pretrain/Learning Rate": 2.3540414426524275e-05, "Full-pretrain/Loss": 1.9682291746139526, "Full-pretrain/Loss (Raw)": 1.8967087268829346, "Full-pretrain/Step": 5083, "Full-pretrain/Step Time": 18.817135240882635} +{"Full-pretrain/Learning Rate": 2.353193820322273e-05, "Full-pretrain/Loss": 1.959846019744873, "Full-pretrain/Loss (Raw)": 1.704766869544983, "Full-pretrain/Step": 5084, "Full-pretrain/Step Time": 18.811107797548175} +{"Full-pretrain/Learning Rate": 2.3523462149261593e-05, "Full-pretrain/Loss": 1.9508075714111328, "Full-pretrain/Loss (Raw)": 1.8963565826416016, "Full-pretrain/Step": 5085, "Full-pretrain/Step Time": 18.814545733854175} +{"Full-pretrain/Learning Rate": 2.351498626561858e-05, "Full-pretrain/Loss": 1.9627149105072021, "Full-pretrain/Loss (Raw)": 1.996941328048706, "Full-pretrain/Step": 5086, "Full-pretrain/Step Time": 18.81534674204886} +{"Full-pretrain/Learning Rate": 2.350651055327138e-05, "Full-pretrain/Loss": 1.9616847038269043, "Full-pretrain/Loss (Raw)": 1.9249175786972046, "Full-pretrain/Step": 5087, "Full-pretrain/Step Time": 18.824405195191503} +{"Full-pretrain/Learning Rate": 2.349803501319767e-05, "Full-pretrain/Loss": 1.9696760177612305, "Full-pretrain/Loss (Raw)": 2.0974459648132324, "Full-pretrain/Step": 5088, "Full-pretrain/Step Time": 18.81542724557221} +{"Full-pretrain/Learning Rate": 2.3489559646375088e-05, "Full-pretrain/Loss": 1.9670637845993042, "Full-pretrain/Loss (Raw)": 1.8526560068130493, "Full-pretrain/Step": 5089, "Full-pretrain/Step Time": 18.81788963265717} +{"Full-pretrain/Learning Rate": 2.3481084453781267e-05, "Full-pretrain/Loss": 1.9688081741333008, "Full-pretrain/Loss (Raw)": 2.2027926445007324, "Full-pretrain/Step": 5090, "Full-pretrain/Step Time": 18.820112319663167} +{"Full-pretrain/Learning Rate": 2.3472609436393825e-05, "Full-pretrain/Loss": 1.962576150894165, "Full-pretrain/Loss (Raw)": 2.02244234085083, "Full-pretrain/Step": 5091, "Full-pretrain/Step Time": 18.824335189536214} +{"Full-pretrain/Learning Rate": 2.3464134595190344e-05, "Full-pretrain/Loss": 1.9648849964141846, "Full-pretrain/Loss (Raw)": 2.2096734046936035, "Full-pretrain/Step": 5092, "Full-pretrain/Step Time": 18.82213309034705} +{"Full-pretrain/Learning Rate": 2.345565993114841e-05, "Full-pretrain/Loss": 1.9702274799346924, "Full-pretrain/Loss (Raw)": 2.223848819732666, "Full-pretrain/Step": 5093, "Full-pretrain/Step Time": 18.818663956597447} +{"Full-pretrain/Learning Rate": 2.3447185445245546e-05, "Full-pretrain/Loss": 1.9762048721313477, "Full-pretrain/Loss (Raw)": 1.9636404514312744, "Full-pretrain/Step": 5094, "Full-pretrain/Step Time": 18.8166074026376} +{"Full-pretrain/Learning Rate": 2.3438711138459292e-05, "Full-pretrain/Loss": 1.979103446006775, "Full-pretrain/Loss (Raw)": 1.9104409217834473, "Full-pretrain/Step": 5095, "Full-pretrain/Step Time": 18.818216159939766} +{"Full-pretrain/Learning Rate": 2.3430237011767167e-05, "Full-pretrain/Loss": 1.9826164245605469, "Full-pretrain/Loss (Raw)": 1.9490411281585693, "Full-pretrain/Step": 5096, "Full-pretrain/Step Time": 18.81321136839688} +{"Full-pretrain/Learning Rate": 2.3421763066146645e-05, "Full-pretrain/Loss": 1.9912610054016113, "Full-pretrain/Loss (Raw)": 1.9410555362701416, "Full-pretrain/Step": 5097, "Full-pretrain/Step Time": 18.816221822053194} +{"Full-pretrain/Learning Rate": 2.3413289302575214e-05, "Full-pretrain/Loss": 1.9959361553192139, "Full-pretrain/Loss (Raw)": 2.1529035568237305, "Full-pretrain/Step": 5098, "Full-pretrain/Step Time": 18.814594635739923} +{"Full-pretrain/Learning Rate": 2.3404815722030292e-05, "Full-pretrain/Loss": 1.9990458488464355, "Full-pretrain/Loss (Raw)": 2.2153162956237793, "Full-pretrain/Step": 5099, "Full-pretrain/Step Time": 18.814531307667494} +{"Full-pretrain/Learning Rate": 2.339634232548932e-05, "Full-pretrain/Loss": 1.9992069005966187, "Full-pretrain/Loss (Raw)": 1.9826008081436157, "Full-pretrain/Step": 5100, "Full-pretrain/Step Time": 18.81004703603685} +{"Full-pretrain/Learning Rate": 2.3387869113929694e-05, "Full-pretrain/Loss": 1.9981014728546143, "Full-pretrain/Loss (Raw)": 1.9242885112762451, "Full-pretrain/Step": 5101, "Full-pretrain/Step Time": 18.814832909032702} +{"Full-pretrain/Learning Rate": 2.3379396088328797e-05, "Full-pretrain/Loss": 2.002988815307617, "Full-pretrain/Loss (Raw)": 2.0946621894836426, "Full-pretrain/Step": 5102, "Full-pretrain/Step Time": 18.811583179980516} +{"Full-pretrain/Learning Rate": 2.3370923249663994e-05, "Full-pretrain/Loss": 1.990307092666626, "Full-pretrain/Loss (Raw)": 1.8318047523498535, "Full-pretrain/Step": 5103, "Full-pretrain/Step Time": 18.808385560289025} +{"Full-pretrain/Learning Rate": 2.336245059891263e-05, "Full-pretrain/Loss": 1.996557354927063, "Full-pretrain/Loss (Raw)": 2.245633840560913, "Full-pretrain/Step": 5104, "Full-pretrain/Step Time": 18.81303127296269} +{"Full-pretrain/Learning Rate": 2.3353978137052008e-05, "Full-pretrain/Loss": 2.0058021545410156, "Full-pretrain/Loss (Raw)": 2.2139899730682373, "Full-pretrain/Step": 5105, "Full-pretrain/Step Time": 18.81256629154086} +{"Full-pretrain/Learning Rate": 2.3345505865059424e-05, "Full-pretrain/Loss": 1.9934930801391602, "Full-pretrain/Loss (Raw)": 1.9928492307662964, "Full-pretrain/Step": 5106, "Full-pretrain/Step Time": 18.80841708742082} +{"Full-pretrain/Learning Rate": 2.3337033783912164e-05, "Full-pretrain/Loss": 2.0027523040771484, "Full-pretrain/Loss (Raw)": 2.011282205581665, "Full-pretrain/Step": 5107, "Full-pretrain/Step Time": 18.811678571626544} +{"Full-pretrain/Learning Rate": 2.3328561894587466e-05, "Full-pretrain/Loss": 1.999754786491394, "Full-pretrain/Loss (Raw)": 1.8173717260360718, "Full-pretrain/Step": 5108, "Full-pretrain/Step Time": 18.80440789088607} +{"Full-pretrain/Learning Rate": 2.3320090198062575e-05, "Full-pretrain/Loss": 2.0003411769866943, "Full-pretrain/Loss (Raw)": 2.121485710144043, "Full-pretrain/Step": 5109, "Full-pretrain/Step Time": 18.803797334432602} +{"Full-pretrain/Learning Rate": 2.3311618695314684e-05, "Full-pretrain/Loss": 1.9933080673217773, "Full-pretrain/Loss (Raw)": 2.127991199493408, "Full-pretrain/Step": 5110, "Full-pretrain/Step Time": 18.80328791961074} +{"Full-pretrain/Learning Rate": 2.3303147387320983e-05, "Full-pretrain/Loss": 1.9926236867904663, "Full-pretrain/Loss (Raw)": 1.7780389785766602, "Full-pretrain/Step": 5111, "Full-pretrain/Step Time": 18.80885981209576} +{"Full-pretrain/Learning Rate": 2.3294676275058632e-05, "Full-pretrain/Loss": 1.9782514572143555, "Full-pretrain/Loss (Raw)": 1.4491171836853027, "Full-pretrain/Step": 5112, "Full-pretrain/Step Time": 18.8093996476382} +{"Full-pretrain/Learning Rate": 2.3286205359504775e-05, "Full-pretrain/Loss": 1.9844489097595215, "Full-pretrain/Loss (Raw)": 2.1188859939575195, "Full-pretrain/Step": 5113, "Full-pretrain/Step Time": 18.807967452332377} +{"Full-pretrain/Learning Rate": 2.3277734641636536e-05, "Full-pretrain/Loss": 1.992937684059143, "Full-pretrain/Loss (Raw)": 1.903053641319275, "Full-pretrain/Step": 5114, "Full-pretrain/Step Time": 18.81404895707965} +{"Full-pretrain/Learning Rate": 2.3269264122430992e-05, "Full-pretrain/Loss": 1.9910703897476196, "Full-pretrain/Loss (Raw)": 1.836958408355713, "Full-pretrain/Step": 5115, "Full-pretrain/Step Time": 18.812416093423963} +{"Full-pretrain/Learning Rate": 2.3260793802865224e-05, "Full-pretrain/Loss": 2.0069899559020996, "Full-pretrain/Loss (Raw)": 2.2141971588134766, "Full-pretrain/Step": 5116, "Full-pretrain/Step Time": 18.81672216951847} +{"Full-pretrain/Learning Rate": 2.3252323683916283e-05, "Full-pretrain/Loss": 2.0122342109680176, "Full-pretrain/Loss (Raw)": 2.064166784286499, "Full-pretrain/Step": 5117, "Full-pretrain/Step Time": 18.817181412130594} +{"Full-pretrain/Learning Rate": 2.3243853766561186e-05, "Full-pretrain/Loss": 2.0192480087280273, "Full-pretrain/Loss (Raw)": 2.2213869094848633, "Full-pretrain/Step": 5118, "Full-pretrain/Step Time": 18.817391792312264} +{"Full-pretrain/Learning Rate": 2.323538405177695e-05, "Full-pretrain/Loss": 2.0268139839172363, "Full-pretrain/Loss (Raw)": 2.1670265197753906, "Full-pretrain/Step": 5119, "Full-pretrain/Step Time": 18.8194693736732} +{"Full-pretrain/Learning Rate": 2.3226914540540534e-05, "Full-pretrain/Loss": 2.0154786109924316, "Full-pretrain/Loss (Raw)": 1.7347123622894287, "Full-pretrain/Step": 5120, "Full-pretrain/Step Time": 18.821314143016934} +{"Full-pretrain/Learning Rate": 2.3218445233828904e-05, "Full-pretrain/Loss": 2.0264339447021484, "Full-pretrain/Loss (Raw)": 2.2032277584075928, "Full-pretrain/Step": 5121, "Full-pretrain/Step Time": 18.820625755935907} +{"Full-pretrain/Learning Rate": 2.3209976132618987e-05, "Full-pretrain/Loss": 2.020946979522705, "Full-pretrain/Loss (Raw)": 2.027209758758545, "Full-pretrain/Step": 5122, "Full-pretrain/Step Time": 18.820375751703978} +{"Full-pretrain/Learning Rate": 2.3201507237887696e-05, "Full-pretrain/Loss": 2.018028736114502, "Full-pretrain/Loss (Raw)": 1.9290591478347778, "Full-pretrain/Step": 5123, "Full-pretrain/Step Time": 18.82414608821273} +{"Full-pretrain/Learning Rate": 2.3193038550611918e-05, "Full-pretrain/Loss": 2.013343572616577, "Full-pretrain/Loss (Raw)": 2.0597481727600098, "Full-pretrain/Step": 5124, "Full-pretrain/Step Time": 18.828493617475033} +{"Full-pretrain/Learning Rate": 2.3184570071768508e-05, "Full-pretrain/Loss": 2.0081591606140137, "Full-pretrain/Loss (Raw)": 2.0579378604888916, "Full-pretrain/Step": 5125, "Full-pretrain/Step Time": 18.826144767925143} +{"Full-pretrain/Learning Rate": 2.3176101802334303e-05, "Full-pretrain/Loss": 2.0027637481689453, "Full-pretrain/Loss (Raw)": 1.7909979820251465, "Full-pretrain/Step": 5126, "Full-pretrain/Step Time": 18.820220595225692} +{"Full-pretrain/Learning Rate": 2.3167633743286104e-05, "Full-pretrain/Loss": 2.0008935928344727, "Full-pretrain/Loss (Raw)": 1.8505901098251343, "Full-pretrain/Step": 5127, "Full-pretrain/Step Time": 18.82052986510098} +{"Full-pretrain/Learning Rate": 2.3159165895600716e-05, "Full-pretrain/Loss": 1.999650478363037, "Full-pretrain/Loss (Raw)": 1.9092628955841064, "Full-pretrain/Step": 5128, "Full-pretrain/Step Time": 18.829191137105227} +{"Full-pretrain/Learning Rate": 2.315069826025489e-05, "Full-pretrain/Loss": 1.9830653667449951, "Full-pretrain/Loss (Raw)": 1.4103286266326904, "Full-pretrain/Step": 5129, "Full-pretrain/Step Time": 17.634732127189636} +{"Full-pretrain/Learning Rate": 2.3142230838225382e-05, "Full-pretrain/Loss": 1.9772831201553345, "Full-pretrain/Loss (Raw)": 1.9678763151168823, "Full-pretrain/Step": 5130, "Full-pretrain/Step Time": 17.62819977104664} +{"Full-pretrain/Learning Rate": 2.3133763630488884e-05, "Full-pretrain/Loss": 1.9697761535644531, "Full-pretrain/Loss (Raw)": 1.9750940799713135, "Full-pretrain/Step": 5131, "Full-pretrain/Step Time": 17.631735179573298} +{"Full-pretrain/Learning Rate": 2.3125296638022095e-05, "Full-pretrain/Loss": 1.9686009883880615, "Full-pretrain/Loss (Raw)": 1.9449927806854248, "Full-pretrain/Step": 5132, "Full-pretrain/Step Time": 17.64354384317994} +{"Full-pretrain/Learning Rate": 2.3116829861801686e-05, "Full-pretrain/Loss": 1.9725685119628906, "Full-pretrain/Loss (Raw)": 2.0512514114379883, "Full-pretrain/Step": 5133, "Full-pretrain/Step Time": 17.639951553195715} +{"Full-pretrain/Learning Rate": 2.3108363302804283e-05, "Full-pretrain/Loss": 1.9642773866653442, "Full-pretrain/Loss (Raw)": 1.829348087310791, "Full-pretrain/Step": 5134, "Full-pretrain/Step Time": 17.635313099250197} +{"Full-pretrain/Learning Rate": 2.309989696200652e-05, "Full-pretrain/Loss": 1.9680612087249756, "Full-pretrain/Loss (Raw)": 1.9528870582580566, "Full-pretrain/Step": 5135, "Full-pretrain/Step Time": 17.637026412412524} +{"Full-pretrain/Learning Rate": 2.3091430840384964e-05, "Full-pretrain/Loss": 1.963503122329712, "Full-pretrain/Loss (Raw)": 2.099776268005371, "Full-pretrain/Step": 5136, "Full-pretrain/Step Time": 17.638509983196855} +{"Full-pretrain/Learning Rate": 2.3082964938916192e-05, "Full-pretrain/Loss": 1.9675703048706055, "Full-pretrain/Loss (Raw)": 2.344137668609619, "Full-pretrain/Step": 5137, "Full-pretrain/Step Time": 17.63671071641147} +{"Full-pretrain/Learning Rate": 2.307449925857674e-05, "Full-pretrain/Loss": 1.955597162246704, "Full-pretrain/Loss (Raw)": 1.6097102165222168, "Full-pretrain/Step": 5138, "Full-pretrain/Step Time": 17.62526743672788} +{"Full-pretrain/Learning Rate": 2.3066033800343122e-05, "Full-pretrain/Loss": 1.9509886503219604, "Full-pretrain/Loss (Raw)": 1.8638073205947876, "Full-pretrain/Step": 5139, "Full-pretrain/Step Time": 17.6306118555367} +{"Full-pretrain/Learning Rate": 2.3057568565191835e-05, "Full-pretrain/Loss": 1.9571483135223389, "Full-pretrain/Loss (Raw)": 2.014482021331787, "Full-pretrain/Step": 5140, "Full-pretrain/Step Time": 17.63524328917265} +{"Full-pretrain/Learning Rate": 2.304910355409932e-05, "Full-pretrain/Loss": 1.9534883499145508, "Full-pretrain/Loss (Raw)": 2.004364490509033, "Full-pretrain/Step": 5141, "Full-pretrain/Step Time": 17.63635889068246} +{"Full-pretrain/Learning Rate": 2.3040638768042027e-05, "Full-pretrain/Loss": 1.948679804801941, "Full-pretrain/Loss (Raw)": 1.9741220474243164, "Full-pretrain/Step": 5142, "Full-pretrain/Step Time": 17.629075234755874} +{"Full-pretrain/Learning Rate": 2.3032174207996362e-05, "Full-pretrain/Loss": 1.9468379020690918, "Full-pretrain/Loss (Raw)": 1.719093680381775, "Full-pretrain/Step": 5143, "Full-pretrain/Step Time": 17.636740691959858} +{"Full-pretrain/Learning Rate": 2.302370987493871e-05, "Full-pretrain/Loss": 1.9639697074890137, "Full-pretrain/Loss (Raw)": 1.9973398447036743, "Full-pretrain/Step": 5144, "Full-pretrain/Step Time": 17.63331313058734} +{"Full-pretrain/Learning Rate": 2.3015245769845433e-05, "Full-pretrain/Loss": 1.951085090637207, "Full-pretrain/Loss (Raw)": 1.706573724746704, "Full-pretrain/Step": 5145, "Full-pretrain/Step Time": 17.63627210445702} +{"Full-pretrain/Learning Rate": 2.3006781893692864e-05, "Full-pretrain/Loss": 1.9531786441802979, "Full-pretrain/Loss (Raw)": 1.970051646232605, "Full-pretrain/Step": 5146, "Full-pretrain/Step Time": 17.63395133242011} +{"Full-pretrain/Learning Rate": 2.2998318247457296e-05, "Full-pretrain/Loss": 1.9627611637115479, "Full-pretrain/Loss (Raw)": 2.1435959339141846, "Full-pretrain/Step": 5147, "Full-pretrain/Step Time": 17.645658776164055} +{"Full-pretrain/Learning Rate": 2.2989854832115012e-05, "Full-pretrain/Loss": 1.948344111442566, "Full-pretrain/Loss (Raw)": 1.7528529167175293, "Full-pretrain/Step": 5148, "Full-pretrain/Step Time": 17.63957409374416} +{"Full-pretrain/Learning Rate": 2.2981391648642275e-05, "Full-pretrain/Loss": 1.9445244073867798, "Full-pretrain/Loss (Raw)": 1.941934585571289, "Full-pretrain/Step": 5149, "Full-pretrain/Step Time": 17.63367048278451} +{"Full-pretrain/Learning Rate": 2.2972928698015296e-05, "Full-pretrain/Loss": 1.947479248046875, "Full-pretrain/Loss (Raw)": 2.3159451484680176, "Full-pretrain/Step": 5150, "Full-pretrain/Step Time": 17.629911666736007} +{"Full-pretrain/Learning Rate": 2.2964465981210282e-05, "Full-pretrain/Loss": 1.9471062421798706, "Full-pretrain/Loss (Raw)": 2.1550872325897217, "Full-pretrain/Step": 5151, "Full-pretrain/Step Time": 17.63473355025053} +{"Full-pretrain/Learning Rate": 2.2956003499203404e-05, "Full-pretrain/Loss": 1.9517900943756104, "Full-pretrain/Loss (Raw)": 1.8845953941345215, "Full-pretrain/Step": 5152, "Full-pretrain/Step Time": 17.637018255889416} +{"Full-pretrain/Learning Rate": 2.2947541252970797e-05, "Full-pretrain/Loss": 1.9533612728118896, "Full-pretrain/Loss (Raw)": 2.253507137298584, "Full-pretrain/Step": 5153, "Full-pretrain/Step Time": 17.63707945495844} +{"Full-pretrain/Learning Rate": 2.2939079243488587e-05, "Full-pretrain/Loss": 1.9435789585113525, "Full-pretrain/Loss (Raw)": 1.7141777276992798, "Full-pretrain/Step": 5154, "Full-pretrain/Step Time": 17.633705088868737} +{"Full-pretrain/Learning Rate": 2.293061747173286e-05, "Full-pretrain/Loss": 1.9455676078796387, "Full-pretrain/Loss (Raw)": 1.9926905632019043, "Full-pretrain/Step": 5155, "Full-pretrain/Step Time": 17.6343005746603} +{"Full-pretrain/Learning Rate": 2.2922155938679692e-05, "Full-pretrain/Loss": 1.9403983354568481, "Full-pretrain/Loss (Raw)": 1.8943334817886353, "Full-pretrain/Step": 5156, "Full-pretrain/Step Time": 17.638932732865214} +{"Full-pretrain/Learning Rate": 2.29136946453051e-05, "Full-pretrain/Loss": 1.9318454265594482, "Full-pretrain/Loss (Raw)": 1.7842435836791992, "Full-pretrain/Step": 5157, "Full-pretrain/Step Time": 17.63765435293317} +{"Full-pretrain/Learning Rate": 2.290523359258509e-05, "Full-pretrain/Loss": 1.9313327074050903, "Full-pretrain/Loss (Raw)": 1.774595022201538, "Full-pretrain/Step": 5158, "Full-pretrain/Step Time": 17.63033653795719} +{"Full-pretrain/Learning Rate": 2.289677278149566e-05, "Full-pretrain/Loss": 1.9291086196899414, "Full-pretrain/Loss (Raw)": 1.7794148921966553, "Full-pretrain/Step": 5159, "Full-pretrain/Step Time": 17.63042742945254} +{"Full-pretrain/Learning Rate": 2.2888312213012742e-05, "Full-pretrain/Loss": 1.9357805252075195, "Full-pretrain/Loss (Raw)": 2.122765302658081, "Full-pretrain/Step": 5160, "Full-pretrain/Step Time": 17.6371604334563} +{"Full-pretrain/Learning Rate": 2.287985188811228e-05, "Full-pretrain/Loss": 1.9524621963500977, "Full-pretrain/Loss (Raw)": 1.944143533706665, "Full-pretrain/Step": 5161, "Full-pretrain/Step Time": 17.634443148970604} +{"Full-pretrain/Learning Rate": 2.2871391807770146e-05, "Full-pretrain/Loss": 1.9515743255615234, "Full-pretrain/Loss (Raw)": 1.9394619464874268, "Full-pretrain/Step": 5162, "Full-pretrain/Step Time": 17.629061745479703} +{"Full-pretrain/Learning Rate": 2.286293197296222e-05, "Full-pretrain/Loss": 1.9454171657562256, "Full-pretrain/Loss (Raw)": 1.7780643701553345, "Full-pretrain/Step": 5163, "Full-pretrain/Step Time": 17.6257466301322} +{"Full-pretrain/Learning Rate": 2.285447238466434e-05, "Full-pretrain/Loss": 1.9494788646697998, "Full-pretrain/Loss (Raw)": 2.074967861175537, "Full-pretrain/Step": 5164, "Full-pretrain/Step Time": 17.626893358305097} +{"Full-pretrain/Learning Rate": 2.2846013043852315e-05, "Full-pretrain/Loss": 1.9555168151855469, "Full-pretrain/Loss (Raw)": 2.2444682121276855, "Full-pretrain/Step": 5165, "Full-pretrain/Step Time": 17.6271665468812} +{"Full-pretrain/Learning Rate": 2.2837553951501933e-05, "Full-pretrain/Loss": 1.9540889263153076, "Full-pretrain/Loss (Raw)": 1.7836511135101318, "Full-pretrain/Step": 5166, "Full-pretrain/Step Time": 17.622025752440095} +{"Full-pretrain/Learning Rate": 2.2829095108588947e-05, "Full-pretrain/Loss": 1.9504408836364746, "Full-pretrain/Loss (Raw)": 1.8361551761627197, "Full-pretrain/Step": 5167, "Full-pretrain/Step Time": 17.618854435160756} +{"Full-pretrain/Learning Rate": 2.2820636516089075e-05, "Full-pretrain/Loss": 1.938949465751648, "Full-pretrain/Loss (Raw)": 1.7320488691329956, "Full-pretrain/Step": 5168, "Full-pretrain/Step Time": 17.623244708403945} +{"Full-pretrain/Learning Rate": 2.2812178174978008e-05, "Full-pretrain/Loss": 1.926296591758728, "Full-pretrain/Loss (Raw)": 1.9392470121383667, "Full-pretrain/Step": 5169, "Full-pretrain/Step Time": 17.6209539975971} +{"Full-pretrain/Learning Rate": 2.280372008623142e-05, "Full-pretrain/Loss": 1.9300470352172852, "Full-pretrain/Loss (Raw)": 1.729720950126648, "Full-pretrain/Step": 5170, "Full-pretrain/Step Time": 17.615862051025033} +{"Full-pretrain/Learning Rate": 2.279526225082495e-05, "Full-pretrain/Loss": 1.9337890148162842, "Full-pretrain/Loss (Raw)": 1.9835525751113892, "Full-pretrain/Step": 5171, "Full-pretrain/Step Time": 17.622380036860704} +{"Full-pretrain/Learning Rate": 2.2786804669734217e-05, "Full-pretrain/Loss": 1.930826187133789, "Full-pretrain/Loss (Raw)": 1.9196739196777344, "Full-pretrain/Step": 5172, "Full-pretrain/Step Time": 17.624767817556858} +{"Full-pretrain/Learning Rate": 2.277834734393477e-05, "Full-pretrain/Loss": 1.928979754447937, "Full-pretrain/Loss (Raw)": 1.9452767372131348, "Full-pretrain/Step": 5173, "Full-pretrain/Step Time": 17.62236524373293} +{"Full-pretrain/Learning Rate": 2.2769890274402184e-05, "Full-pretrain/Loss": 1.9321216344833374, "Full-pretrain/Loss (Raw)": 2.074659824371338, "Full-pretrain/Step": 5174, "Full-pretrain/Step Time": 17.61386051028967} +{"Full-pretrain/Learning Rate": 2.2761433462111973e-05, "Full-pretrain/Loss": 1.940392017364502, "Full-pretrain/Loss (Raw)": 1.9837439060211182, "Full-pretrain/Step": 5175, "Full-pretrain/Step Time": 17.61746859923005} +{"Full-pretrain/Learning Rate": 2.275297690803962e-05, "Full-pretrain/Loss": 1.947621464729309, "Full-pretrain/Loss (Raw)": 2.2286858558654785, "Full-pretrain/Step": 5176, "Full-pretrain/Step Time": 17.62126992829144} +{"Full-pretrain/Learning Rate": 2.27445206131606e-05, "Full-pretrain/Loss": 1.9547410011291504, "Full-pretrain/Loss (Raw)": 1.9343986511230469, "Full-pretrain/Step": 5177, "Full-pretrain/Step Time": 17.62022127956152} +{"Full-pretrain/Learning Rate": 2.273606457845033e-05, "Full-pretrain/Loss": 1.9482524394989014, "Full-pretrain/Loss (Raw)": 1.7624201774597168, "Full-pretrain/Step": 5178, "Full-pretrain/Step Time": 17.619919573888183} +{"Full-pretrain/Learning Rate": 2.272760880488421e-05, "Full-pretrain/Loss": 1.9430327415466309, "Full-pretrain/Loss (Raw)": 1.9765594005584717, "Full-pretrain/Step": 5179, "Full-pretrain/Step Time": 17.619629370048642} +{"Full-pretrain/Learning Rate": 2.2719153293437613e-05, "Full-pretrain/Loss": 1.9391565322875977, "Full-pretrain/Loss (Raw)": 1.628816843032837, "Full-pretrain/Step": 5180, "Full-pretrain/Step Time": 17.62501854263246} +{"Full-pretrain/Learning Rate": 2.2710698045085887e-05, "Full-pretrain/Loss": 1.9417457580566406, "Full-pretrain/Loss (Raw)": 2.024789333343506, "Full-pretrain/Step": 5181, "Full-pretrain/Step Time": 17.628491738811135} +{"Full-pretrain/Learning Rate": 2.270224306080435e-05, "Full-pretrain/Loss": 1.930390477180481, "Full-pretrain/Loss (Raw)": 1.9525798559188843, "Full-pretrain/Step": 5182, "Full-pretrain/Step Time": 17.621045172214508} +{"Full-pretrain/Learning Rate": 2.2693788341568252e-05, "Full-pretrain/Loss": 1.915848970413208, "Full-pretrain/Loss (Raw)": 1.6897568702697754, "Full-pretrain/Step": 5183, "Full-pretrain/Step Time": 17.621168233454227} +{"Full-pretrain/Learning Rate": 2.2685333888352866e-05, "Full-pretrain/Loss": 1.925036072731018, "Full-pretrain/Loss (Raw)": 2.178584337234497, "Full-pretrain/Step": 5184, "Full-pretrain/Step Time": 17.621902026236057} +{"Full-pretrain/Learning Rate": 2.26768797021334e-05, "Full-pretrain/Loss": 1.914597749710083, "Full-pretrain/Loss (Raw)": 1.9194828271865845, "Full-pretrain/Step": 5185, "Full-pretrain/Step Time": 17.616561014205217} +{"Full-pretrain/Learning Rate": 2.2668425783885038e-05, "Full-pretrain/Loss": 1.9174436330795288, "Full-pretrain/Loss (Raw)": 1.8052442073822021, "Full-pretrain/Step": 5186, "Full-pretrain/Step Time": 17.620090130716562} +{"Full-pretrain/Learning Rate": 2.2659972134582947e-05, "Full-pretrain/Loss": 1.9108023643493652, "Full-pretrain/Loss (Raw)": 1.780170202255249, "Full-pretrain/Step": 5187, "Full-pretrain/Step Time": 17.619458766654134} +{"Full-pretrain/Learning Rate": 2.2651518755202257e-05, "Full-pretrain/Loss": 1.9178344011306763, "Full-pretrain/Loss (Raw)": 2.1193575859069824, "Full-pretrain/Step": 5188, "Full-pretrain/Step Time": 17.620971566066146} +{"Full-pretrain/Learning Rate": 2.2643065646718042e-05, "Full-pretrain/Loss": 1.9263489246368408, "Full-pretrain/Loss (Raw)": 2.0567052364349365, "Full-pretrain/Step": 5189, "Full-pretrain/Step Time": 17.623241674154997} +{"Full-pretrain/Learning Rate": 2.2634612810105378e-05, "Full-pretrain/Loss": 1.9294326305389404, "Full-pretrain/Loss (Raw)": 1.8732781410217285, "Full-pretrain/Step": 5190, "Full-pretrain/Step Time": 17.618346124887466} +{"Full-pretrain/Learning Rate": 2.26261602463393e-05, "Full-pretrain/Loss": 1.9373300075531006, "Full-pretrain/Loss (Raw)": 2.032132148742676, "Full-pretrain/Step": 5191, "Full-pretrain/Step Time": 17.618228055536747} +{"Full-pretrain/Learning Rate": 2.26177079563948e-05, "Full-pretrain/Loss": 1.9350305795669556, "Full-pretrain/Loss (Raw)": 2.049180507659912, "Full-pretrain/Step": 5192, "Full-pretrain/Step Time": 17.625593945384026} +{"Full-pretrain/Learning Rate": 2.260925594124685e-05, "Full-pretrain/Loss": 1.9381978511810303, "Full-pretrain/Loss (Raw)": 2.045496940612793, "Full-pretrain/Step": 5193, "Full-pretrain/Step Time": 17.61718357540667} +{"Full-pretrain/Learning Rate": 2.260080420187039e-05, "Full-pretrain/Loss": 1.9407039880752563, "Full-pretrain/Loss (Raw)": 2.0196595191955566, "Full-pretrain/Step": 5194, "Full-pretrain/Step Time": 17.610538290813565} +{"Full-pretrain/Learning Rate": 2.259235273924032e-05, "Full-pretrain/Loss": 1.9504765272140503, "Full-pretrain/Loss (Raw)": 2.0907859802246094, "Full-pretrain/Step": 5195, "Full-pretrain/Step Time": 17.60775882564485} +{"Full-pretrain/Learning Rate": 2.258390155433151e-05, "Full-pretrain/Loss": 1.9546377658843994, "Full-pretrain/Loss (Raw)": 2.208127975463867, "Full-pretrain/Step": 5196, "Full-pretrain/Step Time": 17.609784761443734} +{"Full-pretrain/Learning Rate": 2.257545064811881e-05, "Full-pretrain/Loss": 1.9454989433288574, "Full-pretrain/Loss (Raw)": 1.9520248174667358, "Full-pretrain/Step": 5197, "Full-pretrain/Step Time": 17.61228165216744} +{"Full-pretrain/Learning Rate": 2.2567000021577035e-05, "Full-pretrain/Loss": 1.9576066732406616, "Full-pretrain/Loss (Raw)": 2.171097993850708, "Full-pretrain/Step": 5198, "Full-pretrain/Step Time": 17.610529886558652} +{"Full-pretrain/Learning Rate": 2.255854967568094e-05, "Full-pretrain/Loss": 1.960160255432129, "Full-pretrain/Loss (Raw)": 1.9178729057312012, "Full-pretrain/Step": 5199, "Full-pretrain/Step Time": 17.61183168180287} +{"Full-pretrain/Learning Rate": 2.2550099611405285e-05, "Full-pretrain/Loss": 1.9709259271621704, "Full-pretrain/Loss (Raw)": 2.076545238494873, "Full-pretrain/Step": 5200, "Full-pretrain/Step Time": 17.616614079102874} +{"Full-pretrain/Learning Rate": 2.2541649829724783e-05, "Full-pretrain/Loss": 1.970869779586792, "Full-pretrain/Loss (Raw)": 1.937454104423523, "Full-pretrain/Step": 5201, "Full-pretrain/Step Time": 17.61683759652078} +{"Full-pretrain/Learning Rate": 2.2533200331614103e-05, "Full-pretrain/Loss": 1.986899495124817, "Full-pretrain/Loss (Raw)": 2.242668628692627, "Full-pretrain/Step": 5202, "Full-pretrain/Step Time": 17.610415171831846} +{"Full-pretrain/Learning Rate": 2.2524751118047903e-05, "Full-pretrain/Loss": 1.989760398864746, "Full-pretrain/Loss (Raw)": 2.0751051902770996, "Full-pretrain/Step": 5203, "Full-pretrain/Step Time": 17.611740700900555} +{"Full-pretrain/Learning Rate": 2.2516302190000795e-05, "Full-pretrain/Loss": 1.9908971786499023, "Full-pretrain/Loss (Raw)": 1.9560458660125732, "Full-pretrain/Step": 5204, "Full-pretrain/Step Time": 17.61523768492043} +{"Full-pretrain/Learning Rate": 2.250785354844735e-05, "Full-pretrain/Loss": 1.999467372894287, "Full-pretrain/Loss (Raw)": 2.2195255756378174, "Full-pretrain/Step": 5205, "Full-pretrain/Step Time": 17.61578161083162} +{"Full-pretrain/Learning Rate": 2.2499405194362122e-05, "Full-pretrain/Loss": 1.9913684129714966, "Full-pretrain/Loss (Raw)": 1.8154921531677246, "Full-pretrain/Step": 5206, "Full-pretrain/Step Time": 17.614738347008824} +{"Full-pretrain/Learning Rate": 2.2490957128719624e-05, "Full-pretrain/Loss": 1.9878082275390625, "Full-pretrain/Loss (Raw)": 1.8698171377182007, "Full-pretrain/Step": 5207, "Full-pretrain/Step Time": 17.61244853772223} +{"Full-pretrain/Learning Rate": 2.2482509352494348e-05, "Full-pretrain/Loss": 1.9810700416564941, "Full-pretrain/Loss (Raw)": 2.013066291809082, "Full-pretrain/Step": 5208, "Full-pretrain/Step Time": 17.611973052844405} +{"Full-pretrain/Learning Rate": 2.2474061866660732e-05, "Full-pretrain/Loss": 1.9908760786056519, "Full-pretrain/Loss (Raw)": 2.2481889724731445, "Full-pretrain/Step": 5209, "Full-pretrain/Step Time": 17.616271913051605} +{"Full-pretrain/Learning Rate": 2.2465614672193193e-05, "Full-pretrain/Loss": 2.0042724609375, "Full-pretrain/Loss (Raw)": 2.191100835800171, "Full-pretrain/Step": 5210, "Full-pretrain/Step Time": 17.609284847974777} +{"Full-pretrain/Learning Rate": 2.2457167770066105e-05, "Full-pretrain/Loss": 2.0002121925354004, "Full-pretrain/Loss (Raw)": 1.8466365337371826, "Full-pretrain/Step": 5211, "Full-pretrain/Step Time": 17.605798995122313} +{"Full-pretrain/Learning Rate": 2.2448721161253818e-05, "Full-pretrain/Loss": 2.0127193927764893, "Full-pretrain/Loss (Raw)": 2.0290489196777344, "Full-pretrain/Step": 5212, "Full-pretrain/Step Time": 17.609780563041568} +{"Full-pretrain/Learning Rate": 2.2440274846730653e-05, "Full-pretrain/Loss": 2.0080971717834473, "Full-pretrain/Loss (Raw)": 1.8768748044967651, "Full-pretrain/Step": 5213, "Full-pretrain/Step Time": 17.610715627670288} +{"Full-pretrain/Learning Rate": 2.2431828827470895e-05, "Full-pretrain/Loss": 2.0138444900512695, "Full-pretrain/Loss (Raw)": 2.136491537094116, "Full-pretrain/Step": 5214, "Full-pretrain/Step Time": 17.604950696229935} +{"Full-pretrain/Learning Rate": 2.2423383104448767e-05, "Full-pretrain/Loss": 2.019211530685425, "Full-pretrain/Loss (Raw)": 1.8615058660507202, "Full-pretrain/Step": 5215, "Full-pretrain/Step Time": 17.601220285519958} +{"Full-pretrain/Learning Rate": 2.2414937678638493e-05, "Full-pretrain/Loss": 2.0302231311798096, "Full-pretrain/Loss (Raw)": 2.5309579372406006, "Full-pretrain/Step": 5216, "Full-pretrain/Step Time": 17.605221141129732} +{"Full-pretrain/Learning Rate": 2.2406492551014252e-05, "Full-pretrain/Loss": 2.029353618621826, "Full-pretrain/Loss (Raw)": 1.8916536569595337, "Full-pretrain/Step": 5217, "Full-pretrain/Step Time": 17.60642676986754} +{"Full-pretrain/Learning Rate": 2.239804772255018e-05, "Full-pretrain/Loss": 2.0403614044189453, "Full-pretrain/Loss (Raw)": 2.157500743865967, "Full-pretrain/Step": 5218, "Full-pretrain/Step Time": 17.60646130889654} +{"Full-pretrain/Learning Rate": 2.23896031942204e-05, "Full-pretrain/Loss": 2.051424026489258, "Full-pretrain/Loss (Raw)": 2.1341662406921387, "Full-pretrain/Step": 5219, "Full-pretrain/Step Time": 17.60510638728738} +{"Full-pretrain/Learning Rate": 2.2381158966998966e-05, "Full-pretrain/Loss": 2.0481836795806885, "Full-pretrain/Loss (Raw)": 2.0156679153442383, "Full-pretrain/Step": 5220, "Full-pretrain/Step Time": 17.605260625481606} +{"Full-pretrain/Learning Rate": 2.2372715041859922e-05, "Full-pretrain/Loss": 2.0485782623291016, "Full-pretrain/Loss (Raw)": 2.0693304538726807, "Full-pretrain/Step": 5221, "Full-pretrain/Step Time": 17.607370479032397} +{"Full-pretrain/Learning Rate": 2.2364271419777273e-05, "Full-pretrain/Loss": 2.0476717948913574, "Full-pretrain/Loss (Raw)": 1.8442741632461548, "Full-pretrain/Step": 5222, "Full-pretrain/Step Time": 17.607015930116177} +{"Full-pretrain/Learning Rate": 2.2355828101724995e-05, "Full-pretrain/Loss": 2.047518253326416, "Full-pretrain/Loss (Raw)": 2.0272204875946045, "Full-pretrain/Step": 5223, "Full-pretrain/Step Time": 17.6069274302572} +{"Full-pretrain/Learning Rate": 2.2347385088677015e-05, "Full-pretrain/Loss": 2.0412023067474365, "Full-pretrain/Loss (Raw)": 1.8470678329467773, "Full-pretrain/Step": 5224, "Full-pretrain/Step Time": 17.60990696400404} +{"Full-pretrain/Learning Rate": 2.233894238160724e-05, "Full-pretrain/Loss": 2.0356063842773438, "Full-pretrain/Loss (Raw)": 1.8664335012435913, "Full-pretrain/Step": 5225, "Full-pretrain/Step Time": 17.60658733546734} +{"Full-pretrain/Learning Rate": 2.2330499981489524e-05, "Full-pretrain/Loss": 2.035614252090454, "Full-pretrain/Loss (Raw)": 2.019904136657715, "Full-pretrain/Step": 5226, "Full-pretrain/Step Time": 17.605311719700694} +{"Full-pretrain/Learning Rate": 2.2322057889297686e-05, "Full-pretrain/Loss": 2.032649040222168, "Full-pretrain/Loss (Raw)": 1.995898962020874, "Full-pretrain/Step": 5227, "Full-pretrain/Step Time": 17.61122508905828} +{"Full-pretrain/Learning Rate": 2.2313616106005533e-05, "Full-pretrain/Loss": 2.0278477668762207, "Full-pretrain/Loss (Raw)": 2.0544934272766113, "Full-pretrain/Step": 5228, "Full-pretrain/Step Time": 17.614718290045857} +{"Full-pretrain/Learning Rate": 2.230517463258682e-05, "Full-pretrain/Loss": 2.0291104316711426, "Full-pretrain/Loss (Raw)": 1.9924254417419434, "Full-pretrain/Step": 5229, "Full-pretrain/Step Time": 17.61097899824381} +{"Full-pretrain/Learning Rate": 2.2296733470015275e-05, "Full-pretrain/Loss": 2.0187735557556152, "Full-pretrain/Loss (Raw)": 1.8403141498565674, "Full-pretrain/Step": 5230, "Full-pretrain/Step Time": 17.61212495714426} +{"Full-pretrain/Learning Rate": 2.2288292619264564e-05, "Full-pretrain/Loss": 2.0181479454040527, "Full-pretrain/Loss (Raw)": 1.8978551626205444, "Full-pretrain/Step": 5231, "Full-pretrain/Step Time": 17.61366413347423} +{"Full-pretrain/Learning Rate": 2.2279852081308345e-05, "Full-pretrain/Loss": 2.0155763626098633, "Full-pretrain/Loss (Raw)": 1.9942573308944702, "Full-pretrain/Step": 5232, "Full-pretrain/Step Time": 17.614943275228143} +{"Full-pretrain/Learning Rate": 2.227141185712024e-05, "Full-pretrain/Loss": 2.020902633666992, "Full-pretrain/Loss (Raw)": 2.1078944206237793, "Full-pretrain/Step": 5233, "Full-pretrain/Step Time": 17.613123208284378} +{"Full-pretrain/Learning Rate": 2.226297194767381e-05, "Full-pretrain/Loss": 2.0243396759033203, "Full-pretrain/Loss (Raw)": 2.352659225463867, "Full-pretrain/Step": 5234, "Full-pretrain/Step Time": 17.61486041173339} +{"Full-pretrain/Learning Rate": 2.2254532353942613e-05, "Full-pretrain/Loss": 2.013265371322632, "Full-pretrain/Loss (Raw)": 1.7207218408584595, "Full-pretrain/Step": 5235, "Full-pretrain/Step Time": 17.609865985810757} +{"Full-pretrain/Learning Rate": 2.2246093076900144e-05, "Full-pretrain/Loss": 2.004331111907959, "Full-pretrain/Loss (Raw)": 1.670154094696045, "Full-pretrain/Step": 5236, "Full-pretrain/Step Time": 17.613894255831838} +{"Full-pretrain/Learning Rate": 2.223765411751986e-05, "Full-pretrain/Loss": 1.9915661811828613, "Full-pretrain/Loss (Raw)": 1.8110408782958984, "Full-pretrain/Step": 5237, "Full-pretrain/Step Time": 17.615327637642622} +{"Full-pretrain/Learning Rate": 2.222921547677521e-05, "Full-pretrain/Loss": 2.0048298835754395, "Full-pretrain/Loss (Raw)": 2.239929437637329, "Full-pretrain/Step": 5238, "Full-pretrain/Step Time": 17.622684659436345} +{"Full-pretrain/Learning Rate": 2.2220777155639576e-05, "Full-pretrain/Loss": 1.9983737468719482, "Full-pretrain/Loss (Raw)": 1.6632288694381714, "Full-pretrain/Step": 5239, "Full-pretrain/Step Time": 17.614480443298817} +{"Full-pretrain/Learning Rate": 2.2212339155086333e-05, "Full-pretrain/Loss": 2.0138583183288574, "Full-pretrain/Loss (Raw)": 2.5085644721984863, "Full-pretrain/Step": 5240, "Full-pretrain/Step Time": 17.615223441272974} +{"Full-pretrain/Learning Rate": 2.220390147608878e-05, "Full-pretrain/Loss": 2.004530191421509, "Full-pretrain/Loss (Raw)": 1.949691653251648, "Full-pretrain/Step": 5241, "Full-pretrain/Step Time": 17.61974810808897} +{"Full-pretrain/Learning Rate": 2.2195464119620208e-05, "Full-pretrain/Loss": 1.9901340007781982, "Full-pretrain/Loss (Raw)": 1.7304222583770752, "Full-pretrain/Step": 5242, "Full-pretrain/Step Time": 17.619736209511757} +{"Full-pretrain/Learning Rate": 2.2187027086653866e-05, "Full-pretrain/Loss": 2.0002002716064453, "Full-pretrain/Loss (Raw)": 2.1687583923339844, "Full-pretrain/Step": 5243, "Full-pretrain/Step Time": 17.622505633160472} +{"Full-pretrain/Learning Rate": 2.217859037816296e-05, "Full-pretrain/Loss": 2.0020229816436768, "Full-pretrain/Loss (Raw)": 2.087374210357666, "Full-pretrain/Step": 5244, "Full-pretrain/Step Time": 17.626616429537535} +{"Full-pretrain/Learning Rate": 2.217015399512066e-05, "Full-pretrain/Loss": 2.0042052268981934, "Full-pretrain/Loss (Raw)": 1.9467122554779053, "Full-pretrain/Step": 5245, "Full-pretrain/Step Time": 17.62854290381074} +{"Full-pretrain/Learning Rate": 2.2161717938500113e-05, "Full-pretrain/Loss": 1.998995065689087, "Full-pretrain/Loss (Raw)": 1.9697625637054443, "Full-pretrain/Step": 5246, "Full-pretrain/Step Time": 17.631987685337663} +{"Full-pretrain/Learning Rate": 2.2153282209274395e-05, "Full-pretrain/Loss": 2.0013880729675293, "Full-pretrain/Loss (Raw)": 1.938084602355957, "Full-pretrain/Step": 5247, "Full-pretrain/Step Time": 17.62766532972455} +{"Full-pretrain/Learning Rate": 2.2144846808416574e-05, "Full-pretrain/Loss": 1.9841113090515137, "Full-pretrain/Loss (Raw)": 1.9780985116958618, "Full-pretrain/Step": 5248, "Full-pretrain/Step Time": 17.628961715847254} +{"Full-pretrain/Learning Rate": 2.2136411736899667e-05, "Full-pretrain/Loss": 1.9772169589996338, "Full-pretrain/Loss (Raw)": 1.671032428741455, "Full-pretrain/Step": 5249, "Full-pretrain/Step Time": 17.628635499626398} +{"Full-pretrain/Learning Rate": 2.2127976995696665e-05, "Full-pretrain/Loss": 1.9734035730361938, "Full-pretrain/Loss (Raw)": 2.035475730895996, "Full-pretrain/Step": 5250, "Full-pretrain/Step Time": 17.636288974434137} +{"Full-pretrain/Learning Rate": 2.211954258578051e-05, "Full-pretrain/Loss": 1.9599075317382812, "Full-pretrain/Loss (Raw)": 1.7022931575775146, "Full-pretrain/Step": 5251, "Full-pretrain/Step Time": 17.63104140199721} +{"Full-pretrain/Learning Rate": 2.2111108508124105e-05, "Full-pretrain/Loss": 1.955462098121643, "Full-pretrain/Loss (Raw)": 1.8734135627746582, "Full-pretrain/Step": 5252, "Full-pretrain/Step Time": 17.628425862640142} +{"Full-pretrain/Learning Rate": 2.2102674763700314e-05, "Full-pretrain/Loss": 1.9582281112670898, "Full-pretrain/Loss (Raw)": 2.157844305038452, "Full-pretrain/Step": 5253, "Full-pretrain/Step Time": 17.632351910695434} +{"Full-pretrain/Learning Rate": 2.209424135348197e-05, "Full-pretrain/Loss": 1.9687583446502686, "Full-pretrain/Loss (Raw)": 2.1812429428100586, "Full-pretrain/Step": 5254, "Full-pretrain/Step Time": 17.632080629467964} +{"Full-pretrain/Learning Rate": 2.2085808278441868e-05, "Full-pretrain/Loss": 1.9691739082336426, "Full-pretrain/Loss (Raw)": 2.0405139923095703, "Full-pretrain/Step": 5255, "Full-pretrain/Step Time": 17.630878545343876} +{"Full-pretrain/Learning Rate": 2.2077375539552765e-05, "Full-pretrain/Loss": 1.971418857574463, "Full-pretrain/Loss (Raw)": 1.9189081192016602, "Full-pretrain/Step": 5256, "Full-pretrain/Step Time": 17.627888940274715} +{"Full-pretrain/Learning Rate": 2.2068943137787353e-05, "Full-pretrain/Loss": 1.9715988636016846, "Full-pretrain/Loss (Raw)": 1.8721925020217896, "Full-pretrain/Step": 5257, "Full-pretrain/Step Time": 17.62801224924624} +{"Full-pretrain/Learning Rate": 2.2060511074118324e-05, "Full-pretrain/Loss": 1.9624691009521484, "Full-pretrain/Loss (Raw)": 1.7277562618255615, "Full-pretrain/Step": 5258, "Full-pretrain/Step Time": 17.63307628966868} +{"Full-pretrain/Learning Rate": 2.205207934951831e-05, "Full-pretrain/Loss": 1.9606757164001465, "Full-pretrain/Loss (Raw)": 1.9385058879852295, "Full-pretrain/Step": 5259, "Full-pretrain/Step Time": 17.633501002565026} +{"Full-pretrain/Learning Rate": 2.204364796495991e-05, "Full-pretrain/Loss": 1.954317569732666, "Full-pretrain/Loss (Raw)": 1.8510377407073975, "Full-pretrain/Step": 5260, "Full-pretrain/Step Time": 17.62139323912561} +{"Full-pretrain/Learning Rate": 2.203521692141568e-05, "Full-pretrain/Loss": 1.95195734500885, "Full-pretrain/Loss (Raw)": 1.916895866394043, "Full-pretrain/Step": 5261, "Full-pretrain/Step Time": 17.624381059780717} +{"Full-pretrain/Learning Rate": 2.2026786219858127e-05, "Full-pretrain/Loss": 1.9531095027923584, "Full-pretrain/Loss (Raw)": 1.8771816492080688, "Full-pretrain/Step": 5262, "Full-pretrain/Step Time": 17.62412610836327} +{"Full-pretrain/Learning Rate": 2.2018355861259742e-05, "Full-pretrain/Loss": 1.9638394117355347, "Full-pretrain/Loss (Raw)": 2.241212844848633, "Full-pretrain/Step": 5263, "Full-pretrain/Step Time": 17.626520808786154} +{"Full-pretrain/Learning Rate": 2.200992584659296e-05, "Full-pretrain/Loss": 1.9608869552612305, "Full-pretrain/Loss (Raw)": 1.8997787237167358, "Full-pretrain/Step": 5264, "Full-pretrain/Step Time": 17.62285688519478} +{"Full-pretrain/Learning Rate": 2.200149617683018e-05, "Full-pretrain/Loss": 1.9460458755493164, "Full-pretrain/Loss (Raw)": 1.6329805850982666, "Full-pretrain/Step": 5265, "Full-pretrain/Step Time": 17.628442393615842} +{"Full-pretrain/Learning Rate": 2.199306685294377e-05, "Full-pretrain/Loss": 1.9387967586517334, "Full-pretrain/Loss (Raw)": 2.1206865310668945, "Full-pretrain/Step": 5266, "Full-pretrain/Step Time": 17.631414975970984} +{"Full-pretrain/Learning Rate": 2.1984637875906038e-05, "Full-pretrain/Loss": 1.94533371925354, "Full-pretrain/Loss (Raw)": 1.929903268814087, "Full-pretrain/Step": 5267, "Full-pretrain/Step Time": 17.63660710863769} +{"Full-pretrain/Learning Rate": 2.197620924668927e-05, "Full-pretrain/Loss": 1.9614700078964233, "Full-pretrain/Loss (Raw)": 2.1865170001983643, "Full-pretrain/Step": 5268, "Full-pretrain/Step Time": 17.62811808474362} +{"Full-pretrain/Learning Rate": 2.1967780966265695e-05, "Full-pretrain/Loss": 1.9685544967651367, "Full-pretrain/Loss (Raw)": 2.0377449989318848, "Full-pretrain/Step": 5269, "Full-pretrain/Step Time": 17.63678153976798} +{"Full-pretrain/Learning Rate": 2.195935303560752e-05, "Full-pretrain/Loss": 1.961626410484314, "Full-pretrain/Loss (Raw)": 2.018230438232422, "Full-pretrain/Step": 5270, "Full-pretrain/Step Time": 17.63540668040514} +{"Full-pretrain/Learning Rate": 2.195092545568691e-05, "Full-pretrain/Loss": 1.9596576690673828, "Full-pretrain/Loss (Raw)": 1.6002317667007446, "Full-pretrain/Step": 5271, "Full-pretrain/Step Time": 17.638658782467246} +{"Full-pretrain/Learning Rate": 2.194249822747598e-05, "Full-pretrain/Loss": 1.9339520931243896, "Full-pretrain/Loss (Raw)": 1.685983657836914, "Full-pretrain/Step": 5272, "Full-pretrain/Step Time": 17.63630997017026} +{"Full-pretrain/Learning Rate": 2.19340713519468e-05, "Full-pretrain/Loss": 1.932629108428955, "Full-pretrain/Loss (Raw)": 1.9073585271835327, "Full-pretrain/Step": 5273, "Full-pretrain/Step Time": 17.640130119398236} +{"Full-pretrain/Learning Rate": 2.1925644830071407e-05, "Full-pretrain/Loss": 1.936842679977417, "Full-pretrain/Loss (Raw)": 1.8652551174163818, "Full-pretrain/Step": 5274, "Full-pretrain/Step Time": 17.632625410333276} +{"Full-pretrain/Learning Rate": 2.1917218662821808e-05, "Full-pretrain/Loss": 1.933439016342163, "Full-pretrain/Loss (Raw)": 2.0598385334014893, "Full-pretrain/Step": 5275, "Full-pretrain/Step Time": 17.631177946925163} +{"Full-pretrain/Learning Rate": 2.1908792851169952e-05, "Full-pretrain/Loss": 1.9286041259765625, "Full-pretrain/Loss (Raw)": 1.9326565265655518, "Full-pretrain/Step": 5276, "Full-pretrain/Step Time": 17.628740217536688} +{"Full-pretrain/Learning Rate": 2.1900367396087755e-05, "Full-pretrain/Loss": 1.9251413345336914, "Full-pretrain/Loss (Raw)": 1.8359038829803467, "Full-pretrain/Step": 5277, "Full-pretrain/Step Time": 17.63491341471672} +{"Full-pretrain/Learning Rate": 2.1891942298547094e-05, "Full-pretrain/Loss": 1.9193612337112427, "Full-pretrain/Loss (Raw)": 1.7848000526428223, "Full-pretrain/Step": 5278, "Full-pretrain/Step Time": 17.63778106495738} +{"Full-pretrain/Learning Rate": 2.1883517559519788e-05, "Full-pretrain/Loss": 1.9257488250732422, "Full-pretrain/Loss (Raw)": 2.1424853801727295, "Full-pretrain/Step": 5279, "Full-pretrain/Step Time": 17.630876211449504} +{"Full-pretrain/Learning Rate": 2.187509317997764e-05, "Full-pretrain/Loss": 1.922959804534912, "Full-pretrain/Loss (Raw)": 1.888849139213562, "Full-pretrain/Step": 5280, "Full-pretrain/Step Time": 17.632993176579475} +{"Full-pretrain/Learning Rate": 2.186666916089239e-05, "Full-pretrain/Loss": 1.9217299222946167, "Full-pretrain/Loss (Raw)": 1.6316771507263184, "Full-pretrain/Step": 5281, "Full-pretrain/Step Time": 17.63365230895579} +{"Full-pretrain/Learning Rate": 2.1858245503235765e-05, "Full-pretrain/Loss": 1.9234414100646973, "Full-pretrain/Loss (Raw)": 2.0902462005615234, "Full-pretrain/Step": 5282, "Full-pretrain/Step Time": 17.636242328211665} +{"Full-pretrain/Learning Rate": 2.1849822207979408e-05, "Full-pretrain/Loss": 1.9317896366119385, "Full-pretrain/Loss (Raw)": 1.969431757926941, "Full-pretrain/Step": 5283, "Full-pretrain/Step Time": 17.63873390108347} +{"Full-pretrain/Learning Rate": 2.184139927609495e-05, "Full-pretrain/Loss": 1.9406050443649292, "Full-pretrain/Loss (Raw)": 2.155508041381836, "Full-pretrain/Step": 5284, "Full-pretrain/Step Time": 17.634477684274316} +{"Full-pretrain/Learning Rate": 2.183297670855398e-05, "Full-pretrain/Loss": 1.923160433769226, "Full-pretrain/Loss (Raw)": 1.5996181964874268, "Full-pretrain/Step": 5285, "Full-pretrain/Step Time": 17.6348759829998} +{"Full-pretrain/Learning Rate": 2.182455450632803e-05, "Full-pretrain/Loss": 1.9147822856903076, "Full-pretrain/Loss (Raw)": 1.9131391048431396, "Full-pretrain/Step": 5286, "Full-pretrain/Step Time": 17.643408872187138} +{"Full-pretrain/Learning Rate": 2.1816132670388604e-05, "Full-pretrain/Loss": 1.9160486459732056, "Full-pretrain/Loss (Raw)": 2.081040143966675, "Full-pretrain/Step": 5287, "Full-pretrain/Step Time": 17.641923509538174} +{"Full-pretrain/Learning Rate": 2.1807711201707166e-05, "Full-pretrain/Loss": 1.9193919897079468, "Full-pretrain/Loss (Raw)": 2.025893449783325, "Full-pretrain/Step": 5288, "Full-pretrain/Step Time": 17.640250438824296} +{"Full-pretrain/Learning Rate": 2.1799290101255104e-05, "Full-pretrain/Loss": 1.9169098138809204, "Full-pretrain/Loss (Raw)": 1.7927641868591309, "Full-pretrain/Step": 5289, "Full-pretrain/Step Time": 17.63798035122454} +{"Full-pretrain/Learning Rate": 2.1790869370003805e-05, "Full-pretrain/Loss": 1.926934003829956, "Full-pretrain/Loss (Raw)": 2.0485310554504395, "Full-pretrain/Step": 5290, "Full-pretrain/Step Time": 17.64221621491015} +{"Full-pretrain/Learning Rate": 2.17824490089246e-05, "Full-pretrain/Loss": 1.9299428462982178, "Full-pretrain/Loss (Raw)": 2.0347869396209717, "Full-pretrain/Step": 5291, "Full-pretrain/Step Time": 17.640489229932427} +{"Full-pretrain/Learning Rate": 2.1774029018988772e-05, "Full-pretrain/Loss": 1.9359242916107178, "Full-pretrain/Loss (Raw)": 2.0424442291259766, "Full-pretrain/Step": 5292, "Full-pretrain/Step Time": 17.63934457860887} +{"Full-pretrain/Learning Rate": 2.1765609401167565e-05, "Full-pretrain/Loss": 1.9396761655807495, "Full-pretrain/Loss (Raw)": 2.0369558334350586, "Full-pretrain/Step": 5293, "Full-pretrain/Step Time": 17.641812331974506} +{"Full-pretrain/Learning Rate": 2.1757190156432177e-05, "Full-pretrain/Loss": 1.9376492500305176, "Full-pretrain/Loss (Raw)": 1.8123180866241455, "Full-pretrain/Step": 5294, "Full-pretrain/Step Time": 17.642796440050006} +{"Full-pretrain/Learning Rate": 2.174877128575376e-05, "Full-pretrain/Loss": 1.928317904472351, "Full-pretrain/Loss (Raw)": 1.9426132440567017, "Full-pretrain/Step": 5295, "Full-pretrain/Step Time": 17.636647451668978} +{"Full-pretrain/Learning Rate": 2.1740352790103434e-05, "Full-pretrain/Loss": 1.935463309288025, "Full-pretrain/Loss (Raw)": 2.1284303665161133, "Full-pretrain/Step": 5296, "Full-pretrain/Step Time": 17.63720914721489} +{"Full-pretrain/Learning Rate": 2.1731934670452264e-05, "Full-pretrain/Loss": 1.9528796672821045, "Full-pretrain/Loss (Raw)": 2.190302848815918, "Full-pretrain/Step": 5297, "Full-pretrain/Step Time": 17.638239791616797} +{"Full-pretrain/Learning Rate": 2.1723516927771294e-05, "Full-pretrain/Loss": 1.949741005897522, "Full-pretrain/Loss (Raw)": 2.020251750946045, "Full-pretrain/Step": 5298, "Full-pretrain/Step Time": 17.640545969828963} +{"Full-pretrain/Learning Rate": 2.1715099563031486e-05, "Full-pretrain/Loss": 1.9497311115264893, "Full-pretrain/Loss (Raw)": 1.9295870065689087, "Full-pretrain/Step": 5299, "Full-pretrain/Step Time": 17.634493872523308} +{"Full-pretrain/Learning Rate": 2.1706682577203786e-05, "Full-pretrain/Loss": 1.941983699798584, "Full-pretrain/Loss (Raw)": 1.9385998249053955, "Full-pretrain/Step": 5300, "Full-pretrain/Step Time": 17.631376897916198} +{"Full-pretrain/Learning Rate": 2.16982659712591e-05, "Full-pretrain/Loss": 1.938917636871338, "Full-pretrain/Loss (Raw)": 1.939630389213562, "Full-pretrain/Step": 5301, "Full-pretrain/Step Time": 17.63424547202885} +{"Full-pretrain/Learning Rate": 2.1689849746168268e-05, "Full-pretrain/Loss": 1.9259692430496216, "Full-pretrain/Loss (Raw)": 1.6038830280303955, "Full-pretrain/Step": 5302, "Full-pretrain/Step Time": 17.64116827584803} +{"Full-pretrain/Learning Rate": 2.1681433902902118e-05, "Full-pretrain/Loss": 1.9368088245391846, "Full-pretrain/Loss (Raw)": 1.947100281715393, "Full-pretrain/Step": 5303, "Full-pretrain/Step Time": 17.63569306395948} +{"Full-pretrain/Learning Rate": 2.1673018442431387e-05, "Full-pretrain/Loss": 1.9533915519714355, "Full-pretrain/Loss (Raw)": 2.2166261672973633, "Full-pretrain/Step": 5304, "Full-pretrain/Step Time": 17.63435368053615} +{"Full-pretrain/Learning Rate": 2.166460336572681e-05, "Full-pretrain/Loss": 1.9557827711105347, "Full-pretrain/Loss (Raw)": 1.9838829040527344, "Full-pretrain/Step": 5305, "Full-pretrain/Step Time": 17.634940752759576} +{"Full-pretrain/Learning Rate": 2.1656188673759065e-05, "Full-pretrain/Loss": 1.9632773399353027, "Full-pretrain/Loss (Raw)": 2.1050732135772705, "Full-pretrain/Step": 5306, "Full-pretrain/Step Time": 17.634187264367938} +{"Full-pretrain/Learning Rate": 2.1647774367498778e-05, "Full-pretrain/Loss": 1.9628838300704956, "Full-pretrain/Loss (Raw)": 2.0472536087036133, "Full-pretrain/Step": 5307, "Full-pretrain/Step Time": 17.635463017970324} +{"Full-pretrain/Learning Rate": 2.1639360447916547e-05, "Full-pretrain/Loss": 1.9683785438537598, "Full-pretrain/Loss (Raw)": 2.10848331451416, "Full-pretrain/Step": 5308, "Full-pretrain/Step Time": 17.627352645620704} +{"Full-pretrain/Learning Rate": 2.163094691598291e-05, "Full-pretrain/Loss": 1.970871925354004, "Full-pretrain/Loss (Raw)": 1.9156923294067383, "Full-pretrain/Step": 5309, "Full-pretrain/Step Time": 17.638619743287563} +{"Full-pretrain/Learning Rate": 2.1622533772668356e-05, "Full-pretrain/Loss": 1.9670672416687012, "Full-pretrain/Loss (Raw)": 1.6630488634109497, "Full-pretrain/Step": 5310, "Full-pretrain/Step Time": 17.642279459163547} +{"Full-pretrain/Learning Rate": 2.1614121018943344e-05, "Full-pretrain/Loss": 1.9623699188232422, "Full-pretrain/Loss (Raw)": 1.9921760559082031, "Full-pretrain/Step": 5311, "Full-pretrain/Step Time": 17.63976980186999} +{"Full-pretrain/Learning Rate": 2.1605708655778282e-05, "Full-pretrain/Loss": 1.955906629562378, "Full-pretrain/Loss (Raw)": 1.682018756866455, "Full-pretrain/Step": 5312, "Full-pretrain/Step Time": 17.640512235462666} +{"Full-pretrain/Learning Rate": 2.159729668414353e-05, "Full-pretrain/Loss": 1.9649909734725952, "Full-pretrain/Loss (Raw)": 1.922378420829773, "Full-pretrain/Step": 5313, "Full-pretrain/Step Time": 17.650065302848816} +{"Full-pretrain/Learning Rate": 2.1588885105009427e-05, "Full-pretrain/Loss": 1.9553418159484863, "Full-pretrain/Loss (Raw)": 1.7814735174179077, "Full-pretrain/Step": 5314, "Full-pretrain/Step Time": 17.64836109429598} +{"Full-pretrain/Learning Rate": 2.158047391934621e-05, "Full-pretrain/Loss": 1.9595866203308105, "Full-pretrain/Loss (Raw)": 2.105266809463501, "Full-pretrain/Step": 5315, "Full-pretrain/Step Time": 17.648296916857362} +{"Full-pretrain/Learning Rate": 2.157206312812413e-05, "Full-pretrain/Loss": 1.9629311561584473, "Full-pretrain/Loss (Raw)": 2.2625293731689453, "Full-pretrain/Step": 5316, "Full-pretrain/Step Time": 17.64543000049889} +{"Full-pretrain/Learning Rate": 2.1563652732313367e-05, "Full-pretrain/Loss": 1.9713609218597412, "Full-pretrain/Loss (Raw)": 1.8693772554397583, "Full-pretrain/Step": 5317, "Full-pretrain/Step Time": 17.647259959951043} +{"Full-pretrain/Learning Rate": 2.155524273288405e-05, "Full-pretrain/Loss": 1.9776222705841064, "Full-pretrain/Loss (Raw)": 2.113499641418457, "Full-pretrain/Step": 5318, "Full-pretrain/Step Time": 17.65105039253831} +{"Full-pretrain/Learning Rate": 2.1546833130806277e-05, "Full-pretrain/Loss": 1.9705926179885864, "Full-pretrain/Loss (Raw)": 1.8560950756072998, "Full-pretrain/Step": 5319, "Full-pretrain/Step Time": 17.652462847530842} +{"Full-pretrain/Learning Rate": 2.153842392705009e-05, "Full-pretrain/Loss": 1.9699242115020752, "Full-pretrain/Loss (Raw)": 2.004502296447754, "Full-pretrain/Step": 5320, "Full-pretrain/Step Time": 17.64728324301541} +{"Full-pretrain/Learning Rate": 2.1530015122585478e-05, "Full-pretrain/Loss": 1.965388298034668, "Full-pretrain/Loss (Raw)": 1.6476143598556519, "Full-pretrain/Step": 5321, "Full-pretrain/Step Time": 17.644569406285882} +{"Full-pretrain/Learning Rate": 2.1521606718382406e-05, "Full-pretrain/Loss": 1.9595069885253906, "Full-pretrain/Loss (Raw)": 1.8603296279907227, "Full-pretrain/Step": 5322, "Full-pretrain/Step Time": 17.654311634600163} +{"Full-pretrain/Learning Rate": 2.1513198715410777e-05, "Full-pretrain/Loss": 1.9640321731567383, "Full-pretrain/Loss (Raw)": 2.1795921325683594, "Full-pretrain/Step": 5323, "Full-pretrain/Step Time": 17.653821444138885} +{"Full-pretrain/Learning Rate": 2.150479111464045e-05, "Full-pretrain/Loss": 1.9613993167877197, "Full-pretrain/Loss (Raw)": 1.9581894874572754, "Full-pretrain/Step": 5324, "Full-pretrain/Step Time": 17.660547068342566} +{"Full-pretrain/Learning Rate": 2.1496383917041247e-05, "Full-pretrain/Loss": 1.9680218696594238, "Full-pretrain/Loss (Raw)": 2.2488784790039062, "Full-pretrain/Step": 5325, "Full-pretrain/Step Time": 17.653655925765634} +{"Full-pretrain/Learning Rate": 2.148797712358292e-05, "Full-pretrain/Loss": 1.9781758785247803, "Full-pretrain/Loss (Raw)": 2.1372478008270264, "Full-pretrain/Step": 5326, "Full-pretrain/Step Time": 17.65742185898125} +{"Full-pretrain/Learning Rate": 2.1479570735235198e-05, "Full-pretrain/Loss": 1.984607458114624, "Full-pretrain/Loss (Raw)": 2.1484241485595703, "Full-pretrain/Step": 5327, "Full-pretrain/Step Time": 17.65402292087674} +{"Full-pretrain/Learning Rate": 2.1471164752967757e-05, "Full-pretrain/Loss": 1.968241572380066, "Full-pretrain/Loss (Raw)": 1.6047195196151733, "Full-pretrain/Step": 5328, "Full-pretrain/Step Time": 17.653034191578627} +{"Full-pretrain/Learning Rate": 2.1462759177750218e-05, "Full-pretrain/Loss": 1.9536333084106445, "Full-pretrain/Loss (Raw)": 1.7228392362594604, "Full-pretrain/Step": 5329, "Full-pretrain/Step Time": 17.646828996017575} +{"Full-pretrain/Learning Rate": 2.1454354010552174e-05, "Full-pretrain/Loss": 1.9459764957427979, "Full-pretrain/Loss (Raw)": 1.7752330303192139, "Full-pretrain/Step": 5330, "Full-pretrain/Step Time": 17.651358243077993} +{"Full-pretrain/Learning Rate": 2.144594925234314e-05, "Full-pretrain/Loss": 1.94705331325531, "Full-pretrain/Loss (Raw)": 1.9640446901321411, "Full-pretrain/Step": 5331, "Full-pretrain/Step Time": 17.654568165540695} +{"Full-pretrain/Learning Rate": 2.143754490409261e-05, "Full-pretrain/Loss": 1.9506396055221558, "Full-pretrain/Loss (Raw)": 2.05336332321167, "Full-pretrain/Step": 5332, "Full-pretrain/Step Time": 17.643650440499187} +{"Full-pretrain/Learning Rate": 2.1429140966770027e-05, "Full-pretrain/Loss": 1.9451225996017456, "Full-pretrain/Loss (Raw)": 1.763083815574646, "Full-pretrain/Step": 5333, "Full-pretrain/Step Time": 17.64434360899031} +{"Full-pretrain/Learning Rate": 2.142073744134478e-05, "Full-pretrain/Loss": 1.9621851444244385, "Full-pretrain/Loss (Raw)": 2.1498866081237793, "Full-pretrain/Step": 5334, "Full-pretrain/Step Time": 17.639604181051254} +{"Full-pretrain/Learning Rate": 2.141233432878621e-05, "Full-pretrain/Loss": 1.9629738330841064, "Full-pretrain/Loss (Raw)": 1.9723360538482666, "Full-pretrain/Step": 5335, "Full-pretrain/Step Time": 17.64178275130689} +{"Full-pretrain/Learning Rate": 2.1403931630063616e-05, "Full-pretrain/Loss": 1.9622645378112793, "Full-pretrain/Loss (Raw)": 2.1939315795898438, "Full-pretrain/Step": 5336, "Full-pretrain/Step Time": 17.63988285139203} +{"Full-pretrain/Learning Rate": 2.1395529346146243e-05, "Full-pretrain/Loss": 1.9525678157806396, "Full-pretrain/Loss (Raw)": 1.673583745956421, "Full-pretrain/Step": 5337, "Full-pretrain/Step Time": 17.63491071946919} +{"Full-pretrain/Learning Rate": 2.138712747800329e-05, "Full-pretrain/Loss": 1.9500013589859009, "Full-pretrain/Loss (Raw)": 2.0229506492614746, "Full-pretrain/Step": 5338, "Full-pretrain/Step Time": 17.633049046620727} +{"Full-pretrain/Learning Rate": 2.1378726026603913e-05, "Full-pretrain/Loss": 1.9495662450790405, "Full-pretrain/Loss (Raw)": 2.0333316326141357, "Full-pretrain/Step": 5339, "Full-pretrain/Step Time": 17.638811949640512} +{"Full-pretrain/Learning Rate": 2.1370324992917225e-05, "Full-pretrain/Loss": 1.9440661668777466, "Full-pretrain/Loss (Raw)": 1.932477593421936, "Full-pretrain/Step": 5340, "Full-pretrain/Step Time": 17.631369791924953} +{"Full-pretrain/Learning Rate": 2.1361924377912266e-05, "Full-pretrain/Loss": 1.944133996963501, "Full-pretrain/Loss (Raw)": 1.9178636074066162, "Full-pretrain/Step": 5341, "Full-pretrain/Step Time": 17.625898966565728} +{"Full-pretrain/Learning Rate": 2.135352418255805e-05, "Full-pretrain/Loss": 1.9641871452331543, "Full-pretrain/Loss (Raw)": 2.304749011993408, "Full-pretrain/Step": 5342, "Full-pretrain/Step Time": 17.631146831437945} +{"Full-pretrain/Learning Rate": 2.1345124407823544e-05, "Full-pretrain/Loss": 1.9668703079223633, "Full-pretrain/Loss (Raw)": 2.0780386924743652, "Full-pretrain/Step": 5343, "Full-pretrain/Step Time": 17.63125440105796} +{"Full-pretrain/Learning Rate": 2.1336725054677647e-05, "Full-pretrain/Loss": 1.9840933084487915, "Full-pretrain/Loss (Raw)": 2.233156204223633, "Full-pretrain/Step": 5344, "Full-pretrain/Step Time": 17.631032172590494} +{"Full-pretrain/Learning Rate": 2.1328326124089227e-05, "Full-pretrain/Loss": 1.9882440567016602, "Full-pretrain/Loss (Raw)": 2.0552022457122803, "Full-pretrain/Step": 5345, "Full-pretrain/Step Time": 17.62714508548379} +{"Full-pretrain/Learning Rate": 2.131992761702711e-05, "Full-pretrain/Loss": 1.9984546899795532, "Full-pretrain/Loss (Raw)": 2.108210802078247, "Full-pretrain/Step": 5346, "Full-pretrain/Step Time": 17.623568821698427} +{"Full-pretrain/Learning Rate": 2.131152953446004e-05, "Full-pretrain/Loss": 2.0014748573303223, "Full-pretrain/Loss (Raw)": 2.2019119262695312, "Full-pretrain/Step": 5347, "Full-pretrain/Step Time": 17.624306118115783} +{"Full-pretrain/Learning Rate": 2.1303131877356738e-05, "Full-pretrain/Loss": 1.9863433837890625, "Full-pretrain/Loss (Raw)": 1.7783279418945312, "Full-pretrain/Step": 5348, "Full-pretrain/Step Time": 17.628877514973283} +{"Full-pretrain/Learning Rate": 2.1294734646685878e-05, "Full-pretrain/Loss": 1.9917871952056885, "Full-pretrain/Loss (Raw)": 2.0435733795166016, "Full-pretrain/Step": 5349, "Full-pretrain/Step Time": 17.62763105891645} +{"Full-pretrain/Learning Rate": 2.128633784341608e-05, "Full-pretrain/Loss": 1.990620732307434, "Full-pretrain/Loss (Raw)": 2.0761733055114746, "Full-pretrain/Step": 5350, "Full-pretrain/Step Time": 17.622165575623512} +{"Full-pretrain/Learning Rate": 2.1277941468515906e-05, "Full-pretrain/Loss": 1.9995319843292236, "Full-pretrain/Loss (Raw)": 2.14125394821167, "Full-pretrain/Step": 5351, "Full-pretrain/Step Time": 17.6248286254704} +{"Full-pretrain/Learning Rate": 2.1269545522953873e-05, "Full-pretrain/Loss": 2.0047590732574463, "Full-pretrain/Loss (Raw)": 2.171771764755249, "Full-pretrain/Step": 5352, "Full-pretrain/Step Time": 17.628321208059788} +{"Full-pretrain/Learning Rate": 2.126115000769845e-05, "Full-pretrain/Loss": 2.0155417919158936, "Full-pretrain/Loss (Raw)": 1.992659091949463, "Full-pretrain/Step": 5353, "Full-pretrain/Step Time": 17.62711636722088} +{"Full-pretrain/Learning Rate": 2.125275492371806e-05, "Full-pretrain/Loss": 2.0199570655822754, "Full-pretrain/Loss (Raw)": 2.0016183853149414, "Full-pretrain/Step": 5354, "Full-pretrain/Step Time": 17.627275662496686} +{"Full-pretrain/Learning Rate": 2.1244360271981073e-05, "Full-pretrain/Loss": 2.007042646408081, "Full-pretrain/Loss (Raw)": 1.7663328647613525, "Full-pretrain/Step": 5355, "Full-pretrain/Step Time": 17.620692018419504} +{"Full-pretrain/Learning Rate": 2.123596605345582e-05, "Full-pretrain/Loss": 2.007565498352051, "Full-pretrain/Loss (Raw)": 1.9749178886413574, "Full-pretrain/Step": 5356, "Full-pretrain/Step Time": 17.621501855552197} +{"Full-pretrain/Learning Rate": 2.1227572269110546e-05, "Full-pretrain/Loss": 2.002974271774292, "Full-pretrain/Loss (Raw)": 2.101957321166992, "Full-pretrain/Step": 5357, "Full-pretrain/Step Time": 17.624407414346933} +{"Full-pretrain/Learning Rate": 2.1219178919913486e-05, "Full-pretrain/Loss": 1.9977197647094727, "Full-pretrain/Loss (Raw)": 1.9691095352172852, "Full-pretrain/Step": 5358, "Full-pretrain/Step Time": 17.626011222600937} +{"Full-pretrain/Learning Rate": 2.1210786006832817e-05, "Full-pretrain/Loss": 1.9842039346694946, "Full-pretrain/Loss (Raw)": 1.7159157991409302, "Full-pretrain/Step": 5359, "Full-pretrain/Step Time": 17.624837210401893} +{"Full-pretrain/Learning Rate": 2.1202393530836642e-05, "Full-pretrain/Loss": 1.9938218593597412, "Full-pretrain/Loss (Raw)": 1.9124948978424072, "Full-pretrain/Step": 5360, "Full-pretrain/Step Time": 17.626355573534966} +{"Full-pretrain/Learning Rate": 2.119400149289305e-05, "Full-pretrain/Loss": 2.005049467086792, "Full-pretrain/Loss (Raw)": 2.082120656967163, "Full-pretrain/Step": 5361, "Full-pretrain/Step Time": 17.63077144138515} +{"Full-pretrain/Learning Rate": 2.118560989397004e-05, "Full-pretrain/Loss": 2.0106606483459473, "Full-pretrain/Loss (Raw)": 1.9547874927520752, "Full-pretrain/Step": 5362, "Full-pretrain/Step Time": 17.625132078304887} +{"Full-pretrain/Learning Rate": 2.1177218735035588e-05, "Full-pretrain/Loss": 2.0096943378448486, "Full-pretrain/Loss (Raw)": 1.9331283569335938, "Full-pretrain/Step": 5363, "Full-pretrain/Step Time": 17.626789949834347} +{"Full-pretrain/Learning Rate": 2.1168828017057607e-05, "Full-pretrain/Loss": 2.0083470344543457, "Full-pretrain/Loss (Raw)": 2.010244846343994, "Full-pretrain/Step": 5364, "Full-pretrain/Step Time": 17.62239419668913} +{"Full-pretrain/Learning Rate": 2.116043774100397e-05, "Full-pretrain/Loss": 2.0223934650421143, "Full-pretrain/Loss (Raw)": 2.212571620941162, "Full-pretrain/Step": 5365, "Full-pretrain/Step Time": 17.629126135259867} +{"Full-pretrain/Learning Rate": 2.1152047907842498e-05, "Full-pretrain/Loss": 2.012505531311035, "Full-pretrain/Loss (Raw)": 1.8334686756134033, "Full-pretrain/Step": 5366, "Full-pretrain/Step Time": 17.623241549357772} +{"Full-pretrain/Learning Rate": 2.1143658518540947e-05, "Full-pretrain/Loss": 2.009584426879883, "Full-pretrain/Loss (Raw)": 1.8788697719573975, "Full-pretrain/Step": 5367, "Full-pretrain/Step Time": 17.621099850162864} +{"Full-pretrain/Learning Rate": 2.1135269574067025e-05, "Full-pretrain/Loss": 2.0078296661376953, "Full-pretrain/Loss (Raw)": 2.1377742290496826, "Full-pretrain/Step": 5368, "Full-pretrain/Step Time": 17.624242270365357} +{"Full-pretrain/Learning Rate": 2.1126881075388403e-05, "Full-pretrain/Loss": 2.0154190063476562, "Full-pretrain/Loss (Raw)": 1.9164421558380127, "Full-pretrain/Step": 5369, "Full-pretrain/Step Time": 17.62680330313742} +{"Full-pretrain/Learning Rate": 2.111849302347268e-05, "Full-pretrain/Loss": 2.0175771713256836, "Full-pretrain/Loss (Raw)": 2.0920069217681885, "Full-pretrain/Step": 5370, "Full-pretrain/Step Time": 17.623085601255298} +{"Full-pretrain/Learning Rate": 2.1110105419287428e-05, "Full-pretrain/Loss": 2.0051777362823486, "Full-pretrain/Loss (Raw)": 1.6365559101104736, "Full-pretrain/Step": 5371, "Full-pretrain/Step Time": 17.61837438493967} +{"Full-pretrain/Learning Rate": 2.110171826380016e-05, "Full-pretrain/Loss": 2.011725902557373, "Full-pretrain/Loss (Raw)": 2.1420207023620605, "Full-pretrain/Step": 5372, "Full-pretrain/Step Time": 17.60878144018352} +{"Full-pretrain/Learning Rate": 2.1093331557978307e-05, "Full-pretrain/Loss": 2.0195603370666504, "Full-pretrain/Loss (Raw)": 2.168562650680542, "Full-pretrain/Step": 5373, "Full-pretrain/Step Time": 17.61264664120972} +{"Full-pretrain/Learning Rate": 2.1084945302789286e-05, "Full-pretrain/Loss": 2.006885528564453, "Full-pretrain/Loss (Raw)": 1.8991533517837524, "Full-pretrain/Step": 5374, "Full-pretrain/Step Time": 17.60509359277785} +{"Full-pretrain/Learning Rate": 2.107655949920045e-05, "Full-pretrain/Loss": 2.005575656890869, "Full-pretrain/Loss (Raw)": 2.036120891571045, "Full-pretrain/Step": 5375, "Full-pretrain/Step Time": 17.60275956429541} +{"Full-pretrain/Learning Rate": 2.10681741481791e-05, "Full-pretrain/Loss": 2.0014939308166504, "Full-pretrain/Loss (Raw)": 2.1025476455688477, "Full-pretrain/Step": 5376, "Full-pretrain/Step Time": 17.602117709815502} +{"Full-pretrain/Learning Rate": 2.105978925069248e-05, "Full-pretrain/Loss": 1.9916468858718872, "Full-pretrain/Loss (Raw)": 1.740096092224121, "Full-pretrain/Step": 5377, "Full-pretrain/Step Time": 17.607800668105483} +{"Full-pretrain/Learning Rate": 2.1051404807707787e-05, "Full-pretrain/Loss": 1.9853404760360718, "Full-pretrain/Loss (Raw)": 1.9064061641693115, "Full-pretrain/Step": 5378, "Full-pretrain/Step Time": 17.59858664497733} +{"Full-pretrain/Learning Rate": 2.1043020820192157e-05, "Full-pretrain/Loss": 1.980299472808838, "Full-pretrain/Loss (Raw)": 2.0405993461608887, "Full-pretrain/Step": 5379, "Full-pretrain/Step Time": 17.600718772038817} +{"Full-pretrain/Learning Rate": 2.1034637289112685e-05, "Full-pretrain/Loss": 1.9781360626220703, "Full-pretrain/Loss (Raw)": 1.7090981006622314, "Full-pretrain/Step": 5380, "Full-pretrain/Step Time": 17.598766524344683} +{"Full-pretrain/Learning Rate": 2.1026254215436406e-05, "Full-pretrain/Loss": 1.9707412719726562, "Full-pretrain/Loss (Raw)": 1.80693781375885, "Full-pretrain/Step": 5381, "Full-pretrain/Step Time": 17.598048854619265} +{"Full-pretrain/Learning Rate": 2.101787160013032e-05, "Full-pretrain/Loss": 1.9676697254180908, "Full-pretrain/Loss (Raw)": 1.9778831005096436, "Full-pretrain/Step": 5382, "Full-pretrain/Step Time": 17.600795412436128} +{"Full-pretrain/Learning Rate": 2.1009489444161332e-05, "Full-pretrain/Loss": 1.9614660739898682, "Full-pretrain/Loss (Raw)": 1.9427385330200195, "Full-pretrain/Step": 5383, "Full-pretrain/Step Time": 17.603000413626432} +{"Full-pretrain/Learning Rate": 2.1001107748496334e-05, "Full-pretrain/Loss": 1.9610434770584106, "Full-pretrain/Loss (Raw)": 2.1582489013671875, "Full-pretrain/Step": 5384, "Full-pretrain/Step Time": 17.60268192924559} +{"Full-pretrain/Learning Rate": 2.099272651410216e-05, "Full-pretrain/Loss": 1.9531011581420898, "Full-pretrain/Loss (Raw)": 1.73850417137146, "Full-pretrain/Step": 5385, "Full-pretrain/Step Time": 17.60360200703144} +{"Full-pretrain/Learning Rate": 2.098434574194557e-05, "Full-pretrain/Loss": 1.9519585371017456, "Full-pretrain/Loss (Raw)": 1.9650567770004272, "Full-pretrain/Step": 5386, "Full-pretrain/Step Time": 17.608084339648485} +{"Full-pretrain/Learning Rate": 2.0975965432993283e-05, "Full-pretrain/Loss": 1.96059250831604, "Full-pretrain/Loss (Raw)": 2.0426182746887207, "Full-pretrain/Step": 5387, "Full-pretrain/Step Time": 17.602125108242035} +{"Full-pretrain/Learning Rate": 2.0967585588211982e-05, "Full-pretrain/Loss": 1.9625645875930786, "Full-pretrain/Loss (Raw)": 2.0380263328552246, "Full-pretrain/Step": 5388, "Full-pretrain/Step Time": 17.606463188305497} +{"Full-pretrain/Learning Rate": 2.0959206208568254e-05, "Full-pretrain/Loss": 1.952654242515564, "Full-pretrain/Loss (Raw)": 1.7848252058029175, "Full-pretrain/Step": 5389, "Full-pretrain/Step Time": 17.608019625768065} +{"Full-pretrain/Learning Rate": 2.0950827295028674e-05, "Full-pretrain/Loss": 1.9459669589996338, "Full-pretrain/Loss (Raw)": 1.7551162242889404, "Full-pretrain/Step": 5390, "Full-pretrain/Step Time": 17.610710280016065} +{"Full-pretrain/Learning Rate": 2.094244884855974e-05, "Full-pretrain/Loss": 1.9546401500701904, "Full-pretrain/Loss (Raw)": 1.9934611320495605, "Full-pretrain/Step": 5391, "Full-pretrain/Step Time": 17.604879656806588} +{"Full-pretrain/Learning Rate": 2.0934070870127912e-05, "Full-pretrain/Loss": 1.9627866744995117, "Full-pretrain/Loss (Raw)": 2.1731815338134766, "Full-pretrain/Step": 5392, "Full-pretrain/Step Time": 17.603914270177484} +{"Full-pretrain/Learning Rate": 2.0925693360699578e-05, "Full-pretrain/Loss": 1.9580893516540527, "Full-pretrain/Loss (Raw)": 1.9318052530288696, "Full-pretrain/Step": 5393, "Full-pretrain/Step Time": 17.602019058540463} +{"Full-pretrain/Learning Rate": 2.0917316321241085e-05, "Full-pretrain/Loss": 1.9653137922286987, "Full-pretrain/Loss (Raw)": 2.185971260070801, "Full-pretrain/Step": 5394, "Full-pretrain/Step Time": 17.605621991679072} +{"Full-pretrain/Learning Rate": 2.0908939752718714e-05, "Full-pretrain/Loss": 1.9629782438278198, "Full-pretrain/Loss (Raw)": 1.8583900928497314, "Full-pretrain/Step": 5395, "Full-pretrain/Step Time": 17.59923606365919} +{"Full-pretrain/Learning Rate": 2.0900563656098704e-05, "Full-pretrain/Loss": 1.9561558961868286, "Full-pretrain/Loss (Raw)": 1.7919304370880127, "Full-pretrain/Step": 5396, "Full-pretrain/Step Time": 17.603746997192502} +{"Full-pretrain/Learning Rate": 2.0892188032347236e-05, "Full-pretrain/Loss": 1.9476892948150635, "Full-pretrain/Loss (Raw)": 1.9416414499282837, "Full-pretrain/Step": 5397, "Full-pretrain/Step Time": 17.597264951094985} +{"Full-pretrain/Learning Rate": 2.0883812882430445e-05, "Full-pretrain/Loss": 1.9396722316741943, "Full-pretrain/Loss (Raw)": 1.5769195556640625, "Full-pretrain/Step": 5398, "Full-pretrain/Step Time": 17.60331873036921} +{"Full-pretrain/Learning Rate": 2.087543820731438e-05, "Full-pretrain/Loss": 1.9400441646575928, "Full-pretrain/Loss (Raw)": 1.8907705545425415, "Full-pretrain/Step": 5399, "Full-pretrain/Step Time": 17.593327490612864} +{"Full-pretrain/Learning Rate": 2.086706400796507e-05, "Full-pretrain/Loss": 1.9296777248382568, "Full-pretrain/Loss (Raw)": 1.806047797203064, "Full-pretrain/Step": 5400, "Full-pretrain/Step Time": 17.595043256878853} +{"Full-pretrain/Learning Rate": 2.085869028534848e-05, "Full-pretrain/Loss": 1.927595615386963, "Full-pretrain/Loss (Raw)": 1.8498148918151855, "Full-pretrain/Step": 5401, "Full-pretrain/Step Time": 17.59204588085413} +{"Full-pretrain/Learning Rate": 2.0850317040430505e-05, "Full-pretrain/Loss": 1.9201996326446533, "Full-pretrain/Loss (Raw)": 1.8553335666656494, "Full-pretrain/Step": 5402, "Full-pretrain/Step Time": 17.59627154096961} +{"Full-pretrain/Learning Rate": 2.084194427417701e-05, "Full-pretrain/Loss": 1.928602695465088, "Full-pretrain/Loss (Raw)": 1.90545654296875, "Full-pretrain/Step": 5403, "Full-pretrain/Step Time": 17.59087468869984} +{"Full-pretrain/Learning Rate": 2.0833571987553772e-05, "Full-pretrain/Loss": 1.9299356937408447, "Full-pretrain/Loss (Raw)": 2.1846745014190674, "Full-pretrain/Step": 5404, "Full-pretrain/Step Time": 17.59462851844728} +{"Full-pretrain/Learning Rate": 2.0825200181526542e-05, "Full-pretrain/Loss": 1.919710636138916, "Full-pretrain/Loss (Raw)": 1.8413658142089844, "Full-pretrain/Step": 5405, "Full-pretrain/Step Time": 17.59336660988629} +{"Full-pretrain/Learning Rate": 2.0816828857061e-05, "Full-pretrain/Loss": 1.9241704940795898, "Full-pretrain/Loss (Raw)": 2.041865825653076, "Full-pretrain/Step": 5406, "Full-pretrain/Step Time": 17.594914915040135} +{"Full-pretrain/Learning Rate": 2.0808458015122785e-05, "Full-pretrain/Loss": 1.9251946210861206, "Full-pretrain/Loss (Raw)": 2.0688953399658203, "Full-pretrain/Step": 5407, "Full-pretrain/Step Time": 17.599396558478475} +{"Full-pretrain/Learning Rate": 2.0800087656677467e-05, "Full-pretrain/Loss": 1.9231245517730713, "Full-pretrain/Loss (Raw)": 2.0363032817840576, "Full-pretrain/Step": 5408, "Full-pretrain/Step Time": 17.59398764744401} +{"Full-pretrain/Learning Rate": 2.0791717782690562e-05, "Full-pretrain/Loss": 1.9330003261566162, "Full-pretrain/Loss (Raw)": 2.0561234951019287, "Full-pretrain/Step": 5409, "Full-pretrain/Step Time": 17.59510837122798} +{"Full-pretrain/Learning Rate": 2.0783348394127526e-05, "Full-pretrain/Loss": 1.9410593509674072, "Full-pretrain/Loss (Raw)": 2.164292812347412, "Full-pretrain/Step": 5410, "Full-pretrain/Step Time": 17.596962604671717} +{"Full-pretrain/Learning Rate": 2.0774979491953777e-05, "Full-pretrain/Loss": 1.9384734630584717, "Full-pretrain/Loss (Raw)": 1.9578505754470825, "Full-pretrain/Step": 5411, "Full-pretrain/Step Time": 17.59071945771575} +{"Full-pretrain/Learning Rate": 2.0766611077134654e-05, "Full-pretrain/Loss": 1.9458110332489014, "Full-pretrain/Loss (Raw)": 1.9439011812210083, "Full-pretrain/Step": 5412, "Full-pretrain/Step Time": 17.590816298499703} +{"Full-pretrain/Learning Rate": 2.0758243150635453e-05, "Full-pretrain/Loss": 1.9418798685073853, "Full-pretrain/Loss (Raw)": 1.6811407804489136, "Full-pretrain/Step": 5413, "Full-pretrain/Step Time": 17.594502843916416} +{"Full-pretrain/Learning Rate": 2.074987571342143e-05, "Full-pretrain/Loss": 1.9446252584457397, "Full-pretrain/Loss (Raw)": 2.065735340118408, "Full-pretrain/Step": 5414, "Full-pretrain/Step Time": 17.59375474974513} +{"Full-pretrain/Learning Rate": 2.0741508766457735e-05, "Full-pretrain/Loss": 1.9444814920425415, "Full-pretrain/Loss (Raw)": 1.9381380081176758, "Full-pretrain/Step": 5415, "Full-pretrain/Step Time": 17.59830529242754} +{"Full-pretrain/Learning Rate": 2.0733142310709508e-05, "Full-pretrain/Loss": 1.935114860534668, "Full-pretrain/Loss (Raw)": 1.8585195541381836, "Full-pretrain/Step": 5416, "Full-pretrain/Step Time": 17.60009459964931} +{"Full-pretrain/Learning Rate": 2.0724776347141816e-05, "Full-pretrain/Loss": 1.9485162496566772, "Full-pretrain/Loss (Raw)": 2.167346477508545, "Full-pretrain/Step": 5417, "Full-pretrain/Step Time": 17.60186012275517} +{"Full-pretrain/Learning Rate": 2.0716410876719674e-05, "Full-pretrain/Loss": 1.949341893196106, "Full-pretrain/Loss (Raw)": 1.9914811849594116, "Full-pretrain/Step": 5418, "Full-pretrain/Step Time": 17.603741608560085} +{"Full-pretrain/Learning Rate": 2.0708045900408036e-05, "Full-pretrain/Loss": 1.9499740600585938, "Full-pretrain/Loss (Raw)": 2.062847375869751, "Full-pretrain/Step": 5419, "Full-pretrain/Step Time": 17.60382848419249} +{"Full-pretrain/Learning Rate": 2.069968141917179e-05, "Full-pretrain/Loss": 1.9494702816009521, "Full-pretrain/Loss (Raw)": 2.021904468536377, "Full-pretrain/Step": 5420, "Full-pretrain/Step Time": 17.60357323102653} +{"Full-pretrain/Learning Rate": 2.0691317433975778e-05, "Full-pretrain/Loss": 1.9611862897872925, "Full-pretrain/Loss (Raw)": 2.1597354412078857, "Full-pretrain/Step": 5421, "Full-pretrain/Step Time": 17.60548632964492} +{"Full-pretrain/Learning Rate": 2.0682953945784785e-05, "Full-pretrain/Loss": 1.9684370756149292, "Full-pretrain/Loss (Raw)": 1.98714280128479, "Full-pretrain/Step": 5422, "Full-pretrain/Step Time": 17.608484141528606} +{"Full-pretrain/Learning Rate": 2.067459095556354e-05, "Full-pretrain/Loss": 1.9620014429092407, "Full-pretrain/Loss (Raw)": 1.7875220775604248, "Full-pretrain/Step": 5423, "Full-pretrain/Step Time": 17.611548887565732} +{"Full-pretrain/Learning Rate": 2.0666228464276707e-05, "Full-pretrain/Loss": 1.9589260816574097, "Full-pretrain/Loss (Raw)": 2.0747673511505127, "Full-pretrain/Step": 5424, "Full-pretrain/Step Time": 17.60643050260842} +{"Full-pretrain/Learning Rate": 2.0657866472888907e-05, "Full-pretrain/Loss": 1.9686648845672607, "Full-pretrain/Loss (Raw)": 2.2434518337249756, "Full-pretrain/Step": 5425, "Full-pretrain/Step Time": 17.610000260174274} +{"Full-pretrain/Learning Rate": 2.0649504982364672e-05, "Full-pretrain/Loss": 1.9599097967147827, "Full-pretrain/Loss (Raw)": 1.9058022499084473, "Full-pretrain/Step": 5426, "Full-pretrain/Step Time": 17.608471723273396} +{"Full-pretrain/Learning Rate": 2.0641143993668515e-05, "Full-pretrain/Loss": 1.9619656801223755, "Full-pretrain/Loss (Raw)": 1.9241819381713867, "Full-pretrain/Step": 5427, "Full-pretrain/Step Time": 17.609059439972043} +{"Full-pretrain/Learning Rate": 2.0632783507764864e-05, "Full-pretrain/Loss": 1.9712871313095093, "Full-pretrain/Loss (Raw)": 2.09021258354187, "Full-pretrain/Step": 5428, "Full-pretrain/Step Time": 17.608491271734238} +{"Full-pretrain/Learning Rate": 2.0624423525618098e-05, "Full-pretrain/Loss": 1.9718060493469238, "Full-pretrain/Loss (Raw)": 1.9582479000091553, "Full-pretrain/Step": 5429, "Full-pretrain/Step Time": 17.607104314491153} +{"Full-pretrain/Learning Rate": 2.061606404819255e-05, "Full-pretrain/Loss": 1.9859052896499634, "Full-pretrain/Loss (Raw)": 2.0280938148498535, "Full-pretrain/Step": 5430, "Full-pretrain/Step Time": 17.61103514023125} +{"Full-pretrain/Learning Rate": 2.0607705076452465e-05, "Full-pretrain/Loss": 1.9861719608306885, "Full-pretrain/Loss (Raw)": 1.8993055820465088, "Full-pretrain/Step": 5431, "Full-pretrain/Step Time": 17.61084346845746} +{"Full-pretrain/Learning Rate": 2.0599346611362056e-05, "Full-pretrain/Loss": 1.9943552017211914, "Full-pretrain/Loss (Raw)": 2.0679125785827637, "Full-pretrain/Step": 5432, "Full-pretrain/Step Time": 17.6111049503088} +{"Full-pretrain/Learning Rate": 2.0590988653885468e-05, "Full-pretrain/Loss": 1.9983030557632446, "Full-pretrain/Loss (Raw)": 1.9761419296264648, "Full-pretrain/Step": 5433, "Full-pretrain/Step Time": 17.612295489758253} +{"Full-pretrain/Learning Rate": 2.0582631204986794e-05, "Full-pretrain/Loss": 2.003420829772949, "Full-pretrain/Loss (Raw)": 2.019108772277832, "Full-pretrain/Step": 5434, "Full-pretrain/Step Time": 17.61623920686543} +{"Full-pretrain/Learning Rate": 2.057427426563006e-05, "Full-pretrain/Loss": 1.9965310096740723, "Full-pretrain/Loss (Raw)": 1.6849782466888428, "Full-pretrain/Step": 5435, "Full-pretrain/Step Time": 17.613547885790467} +{"Full-pretrain/Learning Rate": 2.056591783677923e-05, "Full-pretrain/Loss": 1.9981045722961426, "Full-pretrain/Loss (Raw)": 2.2350282669067383, "Full-pretrain/Step": 5436, "Full-pretrain/Step Time": 17.61585388891399} +{"Full-pretrain/Learning Rate": 2.055756191939822e-05, "Full-pretrain/Loss": 2.0127310752868652, "Full-pretrain/Loss (Raw)": 2.309417247772217, "Full-pretrain/Step": 5437, "Full-pretrain/Step Time": 17.60510611347854} +{"Full-pretrain/Learning Rate": 2.0549206514450874e-05, "Full-pretrain/Loss": 2.0146985054016113, "Full-pretrain/Loss (Raw)": 2.1048243045806885, "Full-pretrain/Step": 5438, "Full-pretrain/Step Time": 17.611440481618047} +{"Full-pretrain/Learning Rate": 2.0540851622900997e-05, "Full-pretrain/Loss": 2.0092320442199707, "Full-pretrain/Loss (Raw)": 1.8939627408981323, "Full-pretrain/Step": 5439, "Full-pretrain/Step Time": 17.610341884195805} +{"Full-pretrain/Learning Rate": 2.0532497245712327e-05, "Full-pretrain/Loss": 2.0025601387023926, "Full-pretrain/Loss (Raw)": 1.8228070735931396, "Full-pretrain/Step": 5440, "Full-pretrain/Step Time": 17.60509840399027} +{"Full-pretrain/Learning Rate": 2.0524143383848525e-05, "Full-pretrain/Loss": 1.9963035583496094, "Full-pretrain/Loss (Raw)": 1.8559131622314453, "Full-pretrain/Step": 5441, "Full-pretrain/Step Time": 17.600211957469583} +{"Full-pretrain/Learning Rate": 2.0515790038273204e-05, "Full-pretrain/Loss": 1.9893569946289062, "Full-pretrain/Loss (Raw)": 1.942001223564148, "Full-pretrain/Step": 5442, "Full-pretrain/Step Time": 17.602950444445014} +{"Full-pretrain/Learning Rate": 2.0507437209949937e-05, "Full-pretrain/Loss": 1.9904135465621948, "Full-pretrain/Loss (Raw)": 1.9916599988937378, "Full-pretrain/Step": 5443, "Full-pretrain/Step Time": 17.60421209782362} +{"Full-pretrain/Learning Rate": 2.04990848998422e-05, "Full-pretrain/Loss": 1.9962327480316162, "Full-pretrain/Loss (Raw)": 2.130113124847412, "Full-pretrain/Step": 5444, "Full-pretrain/Step Time": 17.603190038353205} +{"Full-pretrain/Learning Rate": 2.0490733108913438e-05, "Full-pretrain/Loss": 2.002784490585327, "Full-pretrain/Loss (Raw)": 1.8908002376556396, "Full-pretrain/Step": 5445, "Full-pretrain/Step Time": 17.598773561418056} +{"Full-pretrain/Learning Rate": 2.0482381838127036e-05, "Full-pretrain/Loss": 1.988415002822876, "Full-pretrain/Loss (Raw)": 1.605912208557129, "Full-pretrain/Step": 5446, "Full-pretrain/Step Time": 17.603612320497632} +{"Full-pretrain/Learning Rate": 2.0474031088446295e-05, "Full-pretrain/Loss": 1.9884837865829468, "Full-pretrain/Loss (Raw)": 1.9403367042541504, "Full-pretrain/Step": 5447, "Full-pretrain/Step Time": 17.602318005636334} +{"Full-pretrain/Learning Rate": 2.0465680860834477e-05, "Full-pretrain/Loss": 1.9820046424865723, "Full-pretrain/Loss (Raw)": 1.6511900424957275, "Full-pretrain/Step": 5448, "Full-pretrain/Step Time": 17.607885925099254} +{"Full-pretrain/Learning Rate": 2.0457331156254776e-05, "Full-pretrain/Loss": 1.9831913709640503, "Full-pretrain/Loss (Raw)": 2.2053186893463135, "Full-pretrain/Step": 5449, "Full-pretrain/Step Time": 17.60539272800088} +{"Full-pretrain/Learning Rate": 2.0448981975670338e-05, "Full-pretrain/Loss": 1.972639799118042, "Full-pretrain/Loss (Raw)": 1.6538324356079102, "Full-pretrain/Step": 5450, "Full-pretrain/Step Time": 17.60038930736482} +{"Full-pretrain/Learning Rate": 2.0440633320044225e-05, "Full-pretrain/Loss": 1.9652467966079712, "Full-pretrain/Loss (Raw)": 1.8262684345245361, "Full-pretrain/Step": 5451, "Full-pretrain/Step Time": 17.60451508872211} +{"Full-pretrain/Learning Rate": 2.0432285190339453e-05, "Full-pretrain/Loss": 1.9675352573394775, "Full-pretrain/Loss (Raw)": 2.0951387882232666, "Full-pretrain/Step": 5452, "Full-pretrain/Step Time": 17.595789374783635} +{"Full-pretrain/Learning Rate": 2.0423937587518987e-05, "Full-pretrain/Loss": 1.9744067192077637, "Full-pretrain/Loss (Raw)": 2.3796191215515137, "Full-pretrain/Step": 5453, "Full-pretrain/Step Time": 17.59466320462525} +{"Full-pretrain/Learning Rate": 2.0415590512545705e-05, "Full-pretrain/Loss": 1.9612467288970947, "Full-pretrain/Loss (Raw)": 1.5660227537155151, "Full-pretrain/Step": 5454, "Full-pretrain/Step Time": 17.590615617111325} +{"Full-pretrain/Learning Rate": 2.0407243966382445e-05, "Full-pretrain/Loss": 1.9666180610656738, "Full-pretrain/Loss (Raw)": 1.9594054222106934, "Full-pretrain/Step": 5455, "Full-pretrain/Step Time": 17.60008159838617} +{"Full-pretrain/Learning Rate": 2.039889794999199e-05, "Full-pretrain/Loss": 1.9628281593322754, "Full-pretrain/Loss (Raw)": 1.9534902572631836, "Full-pretrain/Step": 5456, "Full-pretrain/Step Time": 17.59674584120512} +{"Full-pretrain/Learning Rate": 2.039055246433703e-05, "Full-pretrain/Loss": 1.9523534774780273, "Full-pretrain/Loss (Raw)": 1.9082615375518799, "Full-pretrain/Step": 5457, "Full-pretrain/Step Time": 17.599849428981543} +{"Full-pretrain/Learning Rate": 2.0382207510380226e-05, "Full-pretrain/Loss": 1.95479416847229, "Full-pretrain/Loss (Raw)": 1.983906626701355, "Full-pretrain/Step": 5458, "Full-pretrain/Step Time": 17.5989031791687} +{"Full-pretrain/Learning Rate": 2.037386308908416e-05, "Full-pretrain/Loss": 1.9617745876312256, "Full-pretrain/Loss (Raw)": 2.1475539207458496, "Full-pretrain/Step": 5459, "Full-pretrain/Step Time": 17.600597335025668} +{"Full-pretrain/Learning Rate": 2.0365519201411366e-05, "Full-pretrain/Loss": 1.9633033275604248, "Full-pretrain/Loss (Raw)": 2.139131546020508, "Full-pretrain/Step": 5460, "Full-pretrain/Step Time": 17.60281472094357} +{"Full-pretrain/Learning Rate": 2.0357175848324307e-05, "Full-pretrain/Loss": 1.9561482667922974, "Full-pretrain/Loss (Raw)": 1.7292866706848145, "Full-pretrain/Step": 5461, "Full-pretrain/Step Time": 17.599229769781232} +{"Full-pretrain/Learning Rate": 2.0348833030785376e-05, "Full-pretrain/Loss": 1.9596705436706543, "Full-pretrain/Loss (Raw)": 2.1408071517944336, "Full-pretrain/Step": 5462, "Full-pretrain/Step Time": 17.59978179074824} +{"Full-pretrain/Learning Rate": 2.0340490749756918e-05, "Full-pretrain/Loss": 1.9479033946990967, "Full-pretrain/Loss (Raw)": 1.5227587223052979, "Full-pretrain/Step": 5463, "Full-pretrain/Step Time": 17.603890772908926} +{"Full-pretrain/Learning Rate": 2.033214900620122e-05, "Full-pretrain/Loss": 1.9519944190979004, "Full-pretrain/Loss (Raw)": 2.1988210678100586, "Full-pretrain/Step": 5464, "Full-pretrain/Step Time": 17.601938677951694} +{"Full-pretrain/Learning Rate": 2.0323807801080484e-05, "Full-pretrain/Loss": 1.957503080368042, "Full-pretrain/Loss (Raw)": 2.1524200439453125, "Full-pretrain/Step": 5465, "Full-pretrain/Step Time": 17.603842144832015} +{"Full-pretrain/Learning Rate": 2.031546713535688e-05, "Full-pretrain/Loss": 1.9512622356414795, "Full-pretrain/Loss (Raw)": 1.8194022178649902, "Full-pretrain/Step": 5466, "Full-pretrain/Step Time": 17.600589755922556} +{"Full-pretrain/Learning Rate": 2.0307127009992503e-05, "Full-pretrain/Loss": 1.9443209171295166, "Full-pretrain/Loss (Raw)": 1.4628565311431885, "Full-pretrain/Step": 5467, "Full-pretrain/Step Time": 17.599531657993793} +{"Full-pretrain/Learning Rate": 2.0298787425949373e-05, "Full-pretrain/Loss": 1.9398775100708008, "Full-pretrain/Loss (Raw)": 2.0928356647491455, "Full-pretrain/Step": 5468, "Full-pretrain/Step Time": 17.603385139256716} +{"Full-pretrain/Learning Rate": 2.0290448384189462e-05, "Full-pretrain/Loss": 1.9333747625350952, "Full-pretrain/Loss (Raw)": 2.1013336181640625, "Full-pretrain/Step": 5469, "Full-pretrain/Step Time": 17.602449104189873} +{"Full-pretrain/Learning Rate": 2.028210988567467e-05, "Full-pretrain/Loss": 1.9325501918792725, "Full-pretrain/Loss (Raw)": 2.078436851501465, "Full-pretrain/Step": 5470, "Full-pretrain/Step Time": 17.60060480237007} +{"Full-pretrain/Learning Rate": 2.027377193136684e-05, "Full-pretrain/Loss": 1.9383957386016846, "Full-pretrain/Loss (Raw)": 2.0810232162475586, "Full-pretrain/Step": 5471, "Full-pretrain/Step Time": 17.60428156517446} +{"Full-pretrain/Learning Rate": 2.0265434522227776e-05, "Full-pretrain/Loss": 1.9388723373413086, "Full-pretrain/Loss (Raw)": 1.8380542993545532, "Full-pretrain/Step": 5472, "Full-pretrain/Step Time": 17.606696920469403} +{"Full-pretrain/Learning Rate": 2.025709765921916e-05, "Full-pretrain/Loss": 1.946225881576538, "Full-pretrain/Loss (Raw)": 2.0912294387817383, "Full-pretrain/Step": 5473, "Full-pretrain/Step Time": 17.60527502000332} +{"Full-pretrain/Learning Rate": 2.0248761343302662e-05, "Full-pretrain/Loss": 1.950589656829834, "Full-pretrain/Loss (Raw)": 2.0816421508789062, "Full-pretrain/Step": 5474, "Full-pretrain/Step Time": 17.60446852259338} +{"Full-pretrain/Learning Rate": 2.0240425575439875e-05, "Full-pretrain/Loss": 1.9535315036773682, "Full-pretrain/Loss (Raw)": 2.085799217224121, "Full-pretrain/Step": 5475, "Full-pretrain/Step Time": 17.60501040890813} +{"Full-pretrain/Learning Rate": 2.023209035659233e-05, "Full-pretrain/Loss": 1.9499216079711914, "Full-pretrain/Loss (Raw)": 2.0145950317382812, "Full-pretrain/Step": 5476, "Full-pretrain/Step Time": 17.608289789408445} +{"Full-pretrain/Learning Rate": 2.0223755687721488e-05, "Full-pretrain/Loss": 1.9551682472229004, "Full-pretrain/Loss (Raw)": 2.058690071105957, "Full-pretrain/Step": 5477, "Full-pretrain/Step Time": 17.60470002144575} +{"Full-pretrain/Learning Rate": 2.0215421569788747e-05, "Full-pretrain/Loss": 1.9751280546188354, "Full-pretrain/Loss (Raw)": 2.24463152885437, "Full-pretrain/Step": 5478, "Full-pretrain/Step Time": 17.613148890435696} +{"Full-pretrain/Learning Rate": 2.020708800375544e-05, "Full-pretrain/Loss": 1.9724172353744507, "Full-pretrain/Loss (Raw)": 1.8535912036895752, "Full-pretrain/Step": 5479, "Full-pretrain/Step Time": 17.611069904640317} +{"Full-pretrain/Learning Rate": 2.019875499058285e-05, "Full-pretrain/Loss": 1.982682704925537, "Full-pretrain/Loss (Raw)": 1.979683756828308, "Full-pretrain/Step": 5480, "Full-pretrain/Step Time": 17.615347715094686} +{"Full-pretrain/Learning Rate": 2.0190422531232186e-05, "Full-pretrain/Loss": 1.9791475534439087, "Full-pretrain/Loss (Raw)": 2.092193126678467, "Full-pretrain/Step": 5481, "Full-pretrain/Step Time": 17.614406120032072} +{"Full-pretrain/Learning Rate": 2.01820906266646e-05, "Full-pretrain/Loss": 1.9963099956512451, "Full-pretrain/Loss (Raw)": 2.203032970428467, "Full-pretrain/Step": 5482, "Full-pretrain/Step Time": 17.615153899416327} +{"Full-pretrain/Learning Rate": 2.017375927784116e-05, "Full-pretrain/Loss": 1.9982445240020752, "Full-pretrain/Loss (Raw)": 1.8881744146347046, "Full-pretrain/Step": 5483, "Full-pretrain/Step Time": 17.61452433653176} +{"Full-pretrain/Learning Rate": 2.016542848572289e-05, "Full-pretrain/Loss": 1.9913222789764404, "Full-pretrain/Loss (Raw)": 1.8736199140548706, "Full-pretrain/Step": 5484, "Full-pretrain/Step Time": 17.61692307330668} +{"Full-pretrain/Learning Rate": 2.015709825127075e-05, "Full-pretrain/Loss": 1.9820196628570557, "Full-pretrain/Loss (Raw)": 2.0819430351257324, "Full-pretrain/Step": 5485, "Full-pretrain/Step Time": 17.616184167563915} +{"Full-pretrain/Learning Rate": 2.0148768575445617e-05, "Full-pretrain/Loss": 1.9854047298431396, "Full-pretrain/Loss (Raw)": 1.6743437051773071, "Full-pretrain/Step": 5486, "Full-pretrain/Step Time": 17.609940011054277} +{"Full-pretrain/Learning Rate": 2.0140439459208326e-05, "Full-pretrain/Loss": 1.990325927734375, "Full-pretrain/Loss (Raw)": 2.116884231567383, "Full-pretrain/Step": 5487, "Full-pretrain/Step Time": 17.612253116443753} +{"Full-pretrain/Learning Rate": 2.0132110903519647e-05, "Full-pretrain/Loss": 1.9890631437301636, "Full-pretrain/Loss (Raw)": 1.9130760431289673, "Full-pretrain/Step": 5488, "Full-pretrain/Step Time": 17.6089581027627} +{"Full-pretrain/Learning Rate": 2.0123782909340257e-05, "Full-pretrain/Loss": 1.9874539375305176, "Full-pretrain/Loss (Raw)": 1.8567664623260498, "Full-pretrain/Step": 5489, "Full-pretrain/Step Time": 17.61014806292951} +{"Full-pretrain/Learning Rate": 2.011545547763079e-05, "Full-pretrain/Loss": 1.9803965091705322, "Full-pretrain/Loss (Raw)": 1.7580736875534058, "Full-pretrain/Step": 5490, "Full-pretrain/Step Time": 17.608429197221994} +{"Full-pretrain/Learning Rate": 2.0107128609351815e-05, "Full-pretrain/Loss": 1.9764375686645508, "Full-pretrain/Loss (Raw)": 2.020862579345703, "Full-pretrain/Step": 5491, "Full-pretrain/Step Time": 17.60940377227962} +{"Full-pretrain/Learning Rate": 2.0098802305463845e-05, "Full-pretrain/Loss": 1.9720938205718994, "Full-pretrain/Loss (Raw)": 2.000131368637085, "Full-pretrain/Step": 5492, "Full-pretrain/Step Time": 17.614607874304056} +{"Full-pretrain/Learning Rate": 2.0090476566927308e-05, "Full-pretrain/Loss": 1.9735844135284424, "Full-pretrain/Loss (Raw)": 1.7769839763641357, "Full-pretrain/Step": 5493, "Full-pretrain/Step Time": 17.61370873451233} +{"Full-pretrain/Learning Rate": 2.0082151394702566e-05, "Full-pretrain/Loss": 1.9767236709594727, "Full-pretrain/Loss (Raw)": 2.2412657737731934, "Full-pretrain/Step": 5494, "Full-pretrain/Step Time": 17.608920462429523} +{"Full-pretrain/Learning Rate": 2.0073826789749937e-05, "Full-pretrain/Loss": 1.9906524419784546, "Full-pretrain/Loss (Raw)": 1.9684803485870361, "Full-pretrain/Step": 5495, "Full-pretrain/Step Time": 17.613116331398487} +{"Full-pretrain/Learning Rate": 2.0065502753029653e-05, "Full-pretrain/Loss": 1.9862680435180664, "Full-pretrain/Loss (Raw)": 2.0585203170776367, "Full-pretrain/Step": 5496, "Full-pretrain/Step Time": 17.61137466877699} +{"Full-pretrain/Learning Rate": 2.005717928550189e-05, "Full-pretrain/Loss": 1.9799118041992188, "Full-pretrain/Loss (Raw)": 1.9490200281143188, "Full-pretrain/Step": 5497, "Full-pretrain/Step Time": 17.60562489554286} +{"Full-pretrain/Learning Rate": 2.0048856388126773e-05, "Full-pretrain/Loss": 1.9811817407608032, "Full-pretrain/Loss (Raw)": 1.8600411415100098, "Full-pretrain/Step": 5498, "Full-pretrain/Step Time": 17.60463404841721} +{"Full-pretrain/Learning Rate": 2.004053406186432e-05, "Full-pretrain/Loss": 2.005286693572998, "Full-pretrain/Loss (Raw)": 2.234218120574951, "Full-pretrain/Step": 5499, "Full-pretrain/Step Time": 17.604092322289944} +{"Full-pretrain/Learning Rate": 2.0032212307674517e-05, "Full-pretrain/Loss": 2.000913619995117, "Full-pretrain/Loss (Raw)": 1.9528944492340088, "Full-pretrain/Step": 5500, "Full-pretrain/Step Time": 17.61068594828248} +{"Full-pretrain/Learning Rate": 2.002389112651728e-05, "Full-pretrain/Loss": 1.9996953010559082, "Full-pretrain/Loss (Raw)": 2.0623483657836914, "Full-pretrain/Step": 5501, "Full-pretrain/Step Time": 17.605579551309347} +{"Full-pretrain/Learning Rate": 2.001557051935246e-05, "Full-pretrain/Loss": 2.000152587890625, "Full-pretrain/Loss (Raw)": 2.093061685562134, "Full-pretrain/Step": 5502, "Full-pretrain/Step Time": 17.609759947285056} +{"Full-pretrain/Learning Rate": 2.000725048713983e-05, "Full-pretrain/Loss": 1.9914700984954834, "Full-pretrain/Loss (Raw)": 1.8031902313232422, "Full-pretrain/Step": 5503, "Full-pretrain/Step Time": 17.61208006180823} +{"Full-pretrain/Learning Rate": 1.9998931030839098e-05, "Full-pretrain/Loss": 1.9953348636627197, "Full-pretrain/Loss (Raw)": 1.9617249965667725, "Full-pretrain/Step": 5504, "Full-pretrain/Step Time": 17.61528936214745} +{"Full-pretrain/Learning Rate": 1.9990612151409908e-05, "Full-pretrain/Loss": 1.9915142059326172, "Full-pretrain/Loss (Raw)": 1.968967080116272, "Full-pretrain/Step": 5505, "Full-pretrain/Step Time": 17.61092934012413} +{"Full-pretrain/Learning Rate": 1.998229384981185e-05, "Full-pretrain/Loss": 1.9915058612823486, "Full-pretrain/Loss (Raw)": 2.081373929977417, "Full-pretrain/Step": 5506, "Full-pretrain/Step Time": 17.615920811891556} +{"Full-pretrain/Learning Rate": 1.9973976127004435e-05, "Full-pretrain/Loss": 1.9820492267608643, "Full-pretrain/Loss (Raw)": 1.783190369606018, "Full-pretrain/Step": 5507, "Full-pretrain/Step Time": 17.621802804991603} +{"Full-pretrain/Learning Rate": 1.99656589839471e-05, "Full-pretrain/Loss": 1.9803340435028076, "Full-pretrain/Loss (Raw)": 1.9597103595733643, "Full-pretrain/Step": 5508, "Full-pretrain/Step Time": 17.624990954995155} +{"Full-pretrain/Learning Rate": 1.995734242159925e-05, "Full-pretrain/Loss": 1.9771840572357178, "Full-pretrain/Loss (Raw)": 1.9578865766525269, "Full-pretrain/Step": 5509, "Full-pretrain/Step Time": 17.627843657508492} +{"Full-pretrain/Learning Rate": 1.9949026440920164e-05, "Full-pretrain/Loss": 1.9618628025054932, "Full-pretrain/Loss (Raw)": 1.754354476928711, "Full-pretrain/Step": 5510, "Full-pretrain/Step Time": 17.62657696940005} +{"Full-pretrain/Learning Rate": 1.994071104286911e-05, "Full-pretrain/Loss": 1.9674301147460938, "Full-pretrain/Loss (Raw)": 2.031745672225952, "Full-pretrain/Step": 5511, "Full-pretrain/Step Time": 17.62485259771347} +{"Full-pretrain/Learning Rate": 1.9932396228405255e-05, "Full-pretrain/Loss": 1.9680640697479248, "Full-pretrain/Loss (Raw)": 1.9999700784683228, "Full-pretrain/Step": 5512, "Full-pretrain/Step Time": 17.626955216750503} +{"Full-pretrain/Learning Rate": 1.9924081998487716e-05, "Full-pretrain/Loss": 1.9689762592315674, "Full-pretrain/Loss (Raw)": 2.1213812828063965, "Full-pretrain/Step": 5513, "Full-pretrain/Step Time": 17.625924522057176} +{"Full-pretrain/Learning Rate": 1.991576835407554e-05, "Full-pretrain/Loss": 1.9615570306777954, "Full-pretrain/Loss (Raw)": 1.9656189680099487, "Full-pretrain/Step": 5514, "Full-pretrain/Step Time": 17.62258799187839} +{"Full-pretrain/Learning Rate": 1.9907455296127688e-05, "Full-pretrain/Loss": 1.9671781063079834, "Full-pretrain/Loss (Raw)": 2.068051338195801, "Full-pretrain/Step": 5515, "Full-pretrain/Step Time": 17.62734479829669} +{"Full-pretrain/Learning Rate": 1.989914282560308e-05, "Full-pretrain/Loss": 1.975736379623413, "Full-pretrain/Loss (Raw)": 2.1474804878234863, "Full-pretrain/Step": 5516, "Full-pretrain/Step Time": 17.62362402677536} +{"Full-pretrain/Learning Rate": 1.989083094346055e-05, "Full-pretrain/Loss": 1.9704347848892212, "Full-pretrain/Loss (Raw)": 1.912294864654541, "Full-pretrain/Step": 5517, "Full-pretrain/Step Time": 17.625637969002128} +{"Full-pretrain/Learning Rate": 1.988251965065889e-05, "Full-pretrain/Loss": 1.9885656833648682, "Full-pretrain/Loss (Raw)": 2.2545316219329834, "Full-pretrain/Step": 5518, "Full-pretrain/Step Time": 17.619991842657328} +{"Full-pretrain/Learning Rate": 1.9874208948156784e-05, "Full-pretrain/Loss": 1.9817413091659546, "Full-pretrain/Loss (Raw)": 1.8985041379928589, "Full-pretrain/Step": 5519, "Full-pretrain/Step Time": 17.621875816956162} +{"Full-pretrain/Learning Rate": 1.9865898836912876e-05, "Full-pretrain/Loss": 1.9775439500808716, "Full-pretrain/Loss (Raw)": 1.778760313987732, "Full-pretrain/Step": 5520, "Full-pretrain/Step Time": 17.62032642774284} +{"Full-pretrain/Learning Rate": 1.9857589317885723e-05, "Full-pretrain/Loss": 1.9834785461425781, "Full-pretrain/Loss (Raw)": 2.0466740131378174, "Full-pretrain/Step": 5521, "Full-pretrain/Step Time": 17.6244032997638} +{"Full-pretrain/Learning Rate": 1.984928039203384e-05, "Full-pretrain/Loss": 1.9896016120910645, "Full-pretrain/Loss (Raw)": 1.9540109634399414, "Full-pretrain/Step": 5522, "Full-pretrain/Step Time": 17.62170623242855} +{"Full-pretrain/Learning Rate": 1.9840972060315653e-05, "Full-pretrain/Loss": 1.9922088384628296, "Full-pretrain/Loss (Raw)": 2.104296922683716, "Full-pretrain/Step": 5523, "Full-pretrain/Step Time": 17.62185588106513} +{"Full-pretrain/Learning Rate": 1.9832664323689533e-05, "Full-pretrain/Loss": 1.981391191482544, "Full-pretrain/Loss (Raw)": 1.6539636850357056, "Full-pretrain/Step": 5524, "Full-pretrain/Step Time": 17.62026545032859} +{"Full-pretrain/Learning Rate": 1.982435718311376e-05, "Full-pretrain/Loss": 1.9883463382720947, "Full-pretrain/Loss (Raw)": 1.9995479583740234, "Full-pretrain/Step": 5525, "Full-pretrain/Step Time": 17.62130169942975} +{"Full-pretrain/Learning Rate": 1.9816050639546567e-05, "Full-pretrain/Loss": 1.978062391281128, "Full-pretrain/Loss (Raw)": 1.9121828079223633, "Full-pretrain/Step": 5526, "Full-pretrain/Step Time": 17.62615634687245} +{"Full-pretrain/Learning Rate": 1.9807744693946115e-05, "Full-pretrain/Loss": 1.9765617847442627, "Full-pretrain/Loss (Raw)": 1.9204609394073486, "Full-pretrain/Step": 5527, "Full-pretrain/Step Time": 17.62505918368697} +{"Full-pretrain/Learning Rate": 1.9799439347270483e-05, "Full-pretrain/Loss": 1.9745838642120361, "Full-pretrain/Loss (Raw)": 1.995226263999939, "Full-pretrain/Step": 5528, "Full-pretrain/Step Time": 17.627063754945993} +{"Full-pretrain/Learning Rate": 1.9791134600477696e-05, "Full-pretrain/Loss": 1.9693784713745117, "Full-pretrain/Loss (Raw)": 1.7824456691741943, "Full-pretrain/Step": 5529, "Full-pretrain/Step Time": 17.627749351784587} +{"Full-pretrain/Learning Rate": 1.978283045452571e-05, "Full-pretrain/Loss": 1.9628068208694458, "Full-pretrain/Loss (Raw)": 1.6497515439987183, "Full-pretrain/Step": 5530, "Full-pretrain/Step Time": 17.628365200012922} +{"Full-pretrain/Learning Rate": 1.977452691037239e-05, "Full-pretrain/Loss": 1.952857255935669, "Full-pretrain/Loss (Raw)": 1.9158291816711426, "Full-pretrain/Step": 5531, "Full-pretrain/Step Time": 17.635872036218643} +{"Full-pretrain/Learning Rate": 1.9766223968975554e-05, "Full-pretrain/Loss": 1.9580163955688477, "Full-pretrain/Loss (Raw)": 2.117987871170044, "Full-pretrain/Step": 5532, "Full-pretrain/Step Time": 17.634109990671277} +{"Full-pretrain/Learning Rate": 1.975792163129294e-05, "Full-pretrain/Loss": 1.9579405784606934, "Full-pretrain/Loss (Raw)": 2.0599234104156494, "Full-pretrain/Step": 5533, "Full-pretrain/Step Time": 17.633037390187383} +{"Full-pretrain/Learning Rate": 1.9749619898282235e-05, "Full-pretrain/Loss": 1.9552955627441406, "Full-pretrain/Loss (Raw)": 2.008419990539551, "Full-pretrain/Step": 5534, "Full-pretrain/Step Time": 17.629418900236487} +{"Full-pretrain/Learning Rate": 1.9741318770901026e-05, "Full-pretrain/Loss": 1.964830994606018, "Full-pretrain/Loss (Raw)": 2.108322858810425, "Full-pretrain/Step": 5535, "Full-pretrain/Step Time": 17.630486968904734} +{"Full-pretrain/Learning Rate": 1.973301825010685e-05, "Full-pretrain/Loss": 1.9711719751358032, "Full-pretrain/Loss (Raw)": 2.1646370887756348, "Full-pretrain/Step": 5536, "Full-pretrain/Step Time": 17.626996213570237} +{"Full-pretrain/Learning Rate": 1.9724718336857163e-05, "Full-pretrain/Loss": 1.9643396139144897, "Full-pretrain/Loss (Raw)": 1.750331997871399, "Full-pretrain/Step": 5537, "Full-pretrain/Step Time": 17.629107603803277} +{"Full-pretrain/Learning Rate": 1.971641903210936e-05, "Full-pretrain/Loss": 1.9639145135879517, "Full-pretrain/Loss (Raw)": 2.067770004272461, "Full-pretrain/Step": 5538, "Full-pretrain/Step Time": 17.619566848501563} +{"Full-pretrain/Learning Rate": 1.9708120336820764e-05, "Full-pretrain/Loss": 1.9659000635147095, "Full-pretrain/Loss (Raw)": 1.846726417541504, "Full-pretrain/Step": 5539, "Full-pretrain/Step Time": 17.628635052591562} +{"Full-pretrain/Learning Rate": 1.969982225194864e-05, "Full-pretrain/Loss": 1.9660370349884033, "Full-pretrain/Loss (Raw)": 1.9640933275222778, "Full-pretrain/Step": 5540, "Full-pretrain/Step Time": 17.630657648667693} +{"Full-pretrain/Learning Rate": 1.9691524778450145e-05, "Full-pretrain/Loss": 1.9779164791107178, "Full-pretrain/Loss (Raw)": 2.338028907775879, "Full-pretrain/Step": 5541, "Full-pretrain/Step Time": 17.628068717196584} +{"Full-pretrain/Learning Rate": 1.9683227917282403e-05, "Full-pretrain/Loss": 1.9885798692703247, "Full-pretrain/Loss (Raw)": 2.095588207244873, "Full-pretrain/Step": 5542, "Full-pretrain/Step Time": 17.625092836096883} +{"Full-pretrain/Learning Rate": 1.9674931669402452e-05, "Full-pretrain/Loss": 1.9866042137145996, "Full-pretrain/Loss (Raw)": 1.968521237373352, "Full-pretrain/Step": 5543, "Full-pretrain/Step Time": 17.622950794175267} +{"Full-pretrain/Learning Rate": 1.9666636035767265e-05, "Full-pretrain/Loss": 1.9854962825775146, "Full-pretrain/Loss (Raw)": 1.964522123336792, "Full-pretrain/Step": 5544, "Full-pretrain/Step Time": 17.626372762024403} +{"Full-pretrain/Learning Rate": 1.9658341017333736e-05, "Full-pretrain/Loss": 1.9803059101104736, "Full-pretrain/Loss (Raw)": 1.9552819728851318, "Full-pretrain/Step": 5545, "Full-pretrain/Step Time": 17.628108151257038} +{"Full-pretrain/Learning Rate": 1.96500466150587e-05, "Full-pretrain/Loss": 1.9785858392715454, "Full-pretrain/Loss (Raw)": 1.9105819463729858, "Full-pretrain/Step": 5546, "Full-pretrain/Step Time": 17.624943360686302} +{"Full-pretrain/Learning Rate": 1.9641752829898898e-05, "Full-pretrain/Loss": 1.9758596420288086, "Full-pretrain/Loss (Raw)": 1.9808123111724854, "Full-pretrain/Step": 5547, "Full-pretrain/Step Time": 17.628998309373856} +{"Full-pretrain/Learning Rate": 1.9633459662811025e-05, "Full-pretrain/Loss": 1.969016671180725, "Full-pretrain/Loss (Raw)": 1.928505301475525, "Full-pretrain/Step": 5548, "Full-pretrain/Step Time": 17.632120231166482} +{"Full-pretrain/Learning Rate": 1.962516711475169e-05, "Full-pretrain/Loss": 1.9680083990097046, "Full-pretrain/Loss (Raw)": 1.8800281286239624, "Full-pretrain/Step": 5549, "Full-pretrain/Step Time": 17.631013555452228} +{"Full-pretrain/Learning Rate": 1.9616875186677442e-05, "Full-pretrain/Loss": 1.9542282819747925, "Full-pretrain/Loss (Raw)": 1.8135693073272705, "Full-pretrain/Step": 5550, "Full-pretrain/Step Time": 17.628777714446187} +{"Full-pretrain/Learning Rate": 1.9608583879544763e-05, "Full-pretrain/Loss": 1.956218957901001, "Full-pretrain/Loss (Raw)": 1.962200403213501, "Full-pretrain/Step": 5551, "Full-pretrain/Step Time": 17.632818814367056} +{"Full-pretrain/Learning Rate": 1.9600293194310022e-05, "Full-pretrain/Loss": 1.94870126247406, "Full-pretrain/Loss (Raw)": 1.5381968021392822, "Full-pretrain/Step": 5552, "Full-pretrain/Step Time": 17.632159857079387} +{"Full-pretrain/Learning Rate": 1.9592003131929572e-05, "Full-pretrain/Loss": 1.9453800916671753, "Full-pretrain/Loss (Raw)": 1.9403955936431885, "Full-pretrain/Step": 5553, "Full-pretrain/Step Time": 17.63104865886271} +{"Full-pretrain/Learning Rate": 1.9583713693359655e-05, "Full-pretrain/Loss": 1.9430015087127686, "Full-pretrain/Loss (Raw)": 1.8778982162475586, "Full-pretrain/Step": 5554, "Full-pretrain/Step Time": 17.629149086773396} +{"Full-pretrain/Learning Rate": 1.9575424879556462e-05, "Full-pretrain/Loss": 1.9308857917785645, "Full-pretrain/Loss (Raw)": 1.7165896892547607, "Full-pretrain/Step": 5555, "Full-pretrain/Step Time": 17.630247239023447} +{"Full-pretrain/Learning Rate": 1.956713669147611e-05, "Full-pretrain/Loss": 1.938460111618042, "Full-pretrain/Loss (Raw)": 1.8963429927825928, "Full-pretrain/Step": 5556, "Full-pretrain/Step Time": 17.63620938360691} +{"Full-pretrain/Learning Rate": 1.9558849130074622e-05, "Full-pretrain/Loss": 1.9357595443725586, "Full-pretrain/Loss (Raw)": 1.9131313562393188, "Full-pretrain/Step": 5557, "Full-pretrain/Step Time": 17.636331943795085} +{"Full-pretrain/Learning Rate": 1.9550562196307975e-05, "Full-pretrain/Loss": 1.9280343055725098, "Full-pretrain/Loss (Raw)": 1.6649774312973022, "Full-pretrain/Step": 5558, "Full-pretrain/Step Time": 17.6267797537148} +{"Full-pretrain/Learning Rate": 1.9542275891132063e-05, "Full-pretrain/Loss": 1.9245610237121582, "Full-pretrain/Loss (Raw)": 1.8093156814575195, "Full-pretrain/Step": 5559, "Full-pretrain/Step Time": 17.63324547931552} +{"Full-pretrain/Learning Rate": 1.9533990215502714e-05, "Full-pretrain/Loss": 1.925653100013733, "Full-pretrain/Loss (Raw)": 2.030170440673828, "Full-pretrain/Step": 5560, "Full-pretrain/Step Time": 17.63136361539364} +{"Full-pretrain/Learning Rate": 1.9525705170375675e-05, "Full-pretrain/Loss": 1.930802583694458, "Full-pretrain/Loss (Raw)": 1.9472267627716064, "Full-pretrain/Step": 5561, "Full-pretrain/Step Time": 17.631258016452193} +{"Full-pretrain/Learning Rate": 1.951742075670662e-05, "Full-pretrain/Loss": 1.9285874366760254, "Full-pretrain/Loss (Raw)": 1.5788722038269043, "Full-pretrain/Step": 5562, "Full-pretrain/Step Time": 17.62810304760933} +{"Full-pretrain/Learning Rate": 1.950913697545115e-05, "Full-pretrain/Loss": 1.9255846738815308, "Full-pretrain/Loss (Raw)": 1.8197362422943115, "Full-pretrain/Step": 5563, "Full-pretrain/Step Time": 17.635701466351748} +{"Full-pretrain/Learning Rate": 1.9500853827564793e-05, "Full-pretrain/Loss": 1.915783405303955, "Full-pretrain/Loss (Raw)": 1.804349660873413, "Full-pretrain/Step": 5564, "Full-pretrain/Step Time": 17.632311774417758} +{"Full-pretrain/Learning Rate": 1.9492571314003022e-05, "Full-pretrain/Loss": 1.9244498014450073, "Full-pretrain/Loss (Raw)": 2.337246894836426, "Full-pretrain/Step": 5565, "Full-pretrain/Step Time": 17.634930834174156} +{"Full-pretrain/Learning Rate": 1.948428943572121e-05, "Full-pretrain/Loss": 1.924408197402954, "Full-pretrain/Loss (Raw)": 2.007089138031006, "Full-pretrain/Step": 5566, "Full-pretrain/Step Time": 17.62442857772112} +{"Full-pretrain/Learning Rate": 1.947600819367469e-05, "Full-pretrain/Loss": 1.9179089069366455, "Full-pretrain/Loss (Raw)": 1.9003435373306274, "Full-pretrain/Step": 5567, "Full-pretrain/Step Time": 17.629331782460213} +{"Full-pretrain/Learning Rate": 1.9467727588818667e-05, "Full-pretrain/Loss": 1.9140050411224365, "Full-pretrain/Loss (Raw)": 2.0397167205810547, "Full-pretrain/Step": 5568, "Full-pretrain/Step Time": 17.631752284243703} +{"Full-pretrain/Learning Rate": 1.945944762210833e-05, "Full-pretrain/Loss": 1.9201412200927734, "Full-pretrain/Loss (Raw)": 1.946689248085022, "Full-pretrain/Step": 5569, "Full-pretrain/Step Time": 17.631633009761572} +{"Full-pretrain/Learning Rate": 1.9451168294498756e-05, "Full-pretrain/Loss": 1.9212007522583008, "Full-pretrain/Loss (Raw)": 2.1016738414764404, "Full-pretrain/Step": 5570, "Full-pretrain/Step Time": 17.632722986862063} +{"Full-pretrain/Learning Rate": 1.9442889606944968e-05, "Full-pretrain/Loss": 1.9258142709732056, "Full-pretrain/Loss (Raw)": 1.994361400604248, "Full-pretrain/Step": 5571, "Full-pretrain/Step Time": 17.628094408661127} +{"Full-pretrain/Learning Rate": 1.9434611560401926e-05, "Full-pretrain/Loss": 1.9333655834197998, "Full-pretrain/Loss (Raw)": 2.2057347297668457, "Full-pretrain/Step": 5572, "Full-pretrain/Step Time": 17.631578873842955} +{"Full-pretrain/Learning Rate": 1.942633415582447e-05, "Full-pretrain/Loss": 1.9142471551895142, "Full-pretrain/Loss (Raw)": 1.7262381315231323, "Full-pretrain/Step": 5573, "Full-pretrain/Step Time": 17.63058423064649} +{"Full-pretrain/Learning Rate": 1.9418057394167418e-05, "Full-pretrain/Loss": 1.8976337909698486, "Full-pretrain/Loss (Raw)": 1.5639598369598389, "Full-pretrain/Step": 5574, "Full-pretrain/Step Time": 17.62791958451271} +{"Full-pretrain/Learning Rate": 1.9409781276385475e-05, "Full-pretrain/Loss": 1.8964693546295166, "Full-pretrain/Loss (Raw)": 1.931260347366333, "Full-pretrain/Step": 5575, "Full-pretrain/Step Time": 17.626486932858825} +{"Full-pretrain/Learning Rate": 1.9401505803433306e-05, "Full-pretrain/Loss": 1.9003807306289673, "Full-pretrain/Loss (Raw)": 2.089686155319214, "Full-pretrain/Step": 5576, "Full-pretrain/Step Time": 17.62617197446525} +{"Full-pretrain/Learning Rate": 1.9393230976265473e-05, "Full-pretrain/Loss": 1.905901551246643, "Full-pretrain/Loss (Raw)": 2.1319475173950195, "Full-pretrain/Step": 5577, "Full-pretrain/Step Time": 17.62878218665719} +{"Full-pretrain/Learning Rate": 1.938495679583648e-05, "Full-pretrain/Loss": 1.9038581848144531, "Full-pretrain/Loss (Raw)": 1.8451942205429077, "Full-pretrain/Step": 5578, "Full-pretrain/Step Time": 17.63476406596601} +{"Full-pretrain/Learning Rate": 1.9376683263100743e-05, "Full-pretrain/Loss": 1.9057190418243408, "Full-pretrain/Loss (Raw)": 2.0403618812561035, "Full-pretrain/Step": 5579, "Full-pretrain/Step Time": 17.62996430322528} +{"Full-pretrain/Learning Rate": 1.936841037901261e-05, "Full-pretrain/Loss": 1.8943171501159668, "Full-pretrain/Loss (Raw)": 1.5636448860168457, "Full-pretrain/Step": 5580, "Full-pretrain/Step Time": 17.62727352976799} +{"Full-pretrain/Learning Rate": 1.9360138144526364e-05, "Full-pretrain/Loss": 1.9020812511444092, "Full-pretrain/Loss (Raw)": 2.1284782886505127, "Full-pretrain/Step": 5581, "Full-pretrain/Step Time": 17.630915336310863} +{"Full-pretrain/Learning Rate": 1.935186656059621e-05, "Full-pretrain/Loss": 1.909722924232483, "Full-pretrain/Loss (Raw)": 2.0581018924713135, "Full-pretrain/Step": 5582, "Full-pretrain/Step Time": 17.62980856001377} +{"Full-pretrain/Learning Rate": 1.9343595628176254e-05, "Full-pretrain/Loss": 1.908935546875, "Full-pretrain/Loss (Raw)": 1.9370037317276, "Full-pretrain/Step": 5583, "Full-pretrain/Step Time": 17.620843993499875} +{"Full-pretrain/Learning Rate": 1.9335325348220557e-05, "Full-pretrain/Loss": 1.9184387922286987, "Full-pretrain/Loss (Raw)": 1.842301607131958, "Full-pretrain/Step": 5584, "Full-pretrain/Step Time": 17.6201333925128} +{"Full-pretrain/Learning Rate": 1.9327055721683086e-05, "Full-pretrain/Loss": 1.9107941389083862, "Full-pretrain/Loss (Raw)": 1.6957685947418213, "Full-pretrain/Step": 5585, "Full-pretrain/Step Time": 17.61667232774198} +{"Full-pretrain/Learning Rate": 1.9318786749517755e-05, "Full-pretrain/Loss": 1.9159126281738281, "Full-pretrain/Loss (Raw)": 2.0416855812072754, "Full-pretrain/Step": 5586, "Full-pretrain/Step Time": 17.61178867891431} +{"Full-pretrain/Learning Rate": 1.9310518432678365e-05, "Full-pretrain/Loss": 1.9176030158996582, "Full-pretrain/Loss (Raw)": 1.7706818580627441, "Full-pretrain/Step": 5587, "Full-pretrain/Step Time": 17.60811216197908} +{"Full-pretrain/Learning Rate": 1.9302250772118687e-05, "Full-pretrain/Loss": 1.922359585762024, "Full-pretrain/Loss (Raw)": 2.048555850982666, "Full-pretrain/Step": 5588, "Full-pretrain/Step Time": 17.61432246491313} +{"Full-pretrain/Learning Rate": 1.9293983768792367e-05, "Full-pretrain/Loss": 1.9235023260116577, "Full-pretrain/Loss (Raw)": 1.9496979713439941, "Full-pretrain/Step": 5589, "Full-pretrain/Step Time": 17.611575385555625} +{"Full-pretrain/Learning Rate": 1.9285717423653016e-05, "Full-pretrain/Loss": 1.9279811382293701, "Full-pretrain/Loss (Raw)": 1.8083000183105469, "Full-pretrain/Step": 5590, "Full-pretrain/Step Time": 17.61752924695611} +{"Full-pretrain/Learning Rate": 1.9277451737654152e-05, "Full-pretrain/Loss": 1.9327402114868164, "Full-pretrain/Loss (Raw)": 1.9616045951843262, "Full-pretrain/Step": 5591, "Full-pretrain/Step Time": 17.610493848100305} +{"Full-pretrain/Learning Rate": 1.9269186711749223e-05, "Full-pretrain/Loss": 1.9284712076187134, "Full-pretrain/Loss (Raw)": 1.8935648202896118, "Full-pretrain/Step": 5592, "Full-pretrain/Step Time": 17.61437489464879} +{"Full-pretrain/Learning Rate": 1.9260922346891597e-05, "Full-pretrain/Loss": 1.9350411891937256, "Full-pretrain/Loss (Raw)": 2.1574625968933105, "Full-pretrain/Step": 5593, "Full-pretrain/Step Time": 17.610978877171874} +{"Full-pretrain/Learning Rate": 1.9252658644034554e-05, "Full-pretrain/Loss": 1.9488954544067383, "Full-pretrain/Loss (Raw)": 2.0222091674804688, "Full-pretrain/Step": 5594, "Full-pretrain/Step Time": 17.616219440475106} +{"Full-pretrain/Learning Rate": 1.9244395604131323e-05, "Full-pretrain/Loss": 1.9593324661254883, "Full-pretrain/Loss (Raw)": 2.1537222862243652, "Full-pretrain/Step": 5595, "Full-pretrain/Step Time": 17.618399718776345} +{"Full-pretrain/Learning Rate": 1.9236133228135027e-05, "Full-pretrain/Loss": 1.964728593826294, "Full-pretrain/Loss (Raw)": 1.9770245552062988, "Full-pretrain/Step": 5596, "Full-pretrain/Step Time": 17.61595217883587} +{"Full-pretrain/Learning Rate": 1.922787151699874e-05, "Full-pretrain/Loss": 1.9423296451568604, "Full-pretrain/Loss (Raw)": 1.6204813718795776, "Full-pretrain/Step": 5597, "Full-pretrain/Step Time": 17.621156899258494} +{"Full-pretrain/Learning Rate": 1.921961047167546e-05, "Full-pretrain/Loss": 1.9498803615570068, "Full-pretrain/Loss (Raw)": 2.248713493347168, "Full-pretrain/Step": 5598, "Full-pretrain/Step Time": 17.61746071279049} +{"Full-pretrain/Learning Rate": 1.9211350093118063e-05, "Full-pretrain/Loss": 1.949007272720337, "Full-pretrain/Loss (Raw)": 1.8724015951156616, "Full-pretrain/Step": 5599, "Full-pretrain/Step Time": 17.621422849595547} +{"Full-pretrain/Learning Rate": 1.92030903822794e-05, "Full-pretrain/Loss": 1.946470022201538, "Full-pretrain/Loss (Raw)": 1.9585248231887817, "Full-pretrain/Step": 5600, "Full-pretrain/Step Time": 17.619583940133452} +{"Full-pretrain/Learning Rate": 1.9194831340112225e-05, "Full-pretrain/Loss": 1.9432475566864014, "Full-pretrain/Loss (Raw)": 1.8435734510421753, "Full-pretrain/Step": 5601, "Full-pretrain/Step Time": 17.623340198770165} +{"Full-pretrain/Learning Rate": 1.9186572967569222e-05, "Full-pretrain/Loss": 1.9311617612838745, "Full-pretrain/Loss (Raw)": 1.7149277925491333, "Full-pretrain/Step": 5602, "Full-pretrain/Step Time": 17.6234712600708} +{"Full-pretrain/Learning Rate": 1.9178315265602983e-05, "Full-pretrain/Loss": 1.9249688386917114, "Full-pretrain/Loss (Raw)": 1.796188473701477, "Full-pretrain/Step": 5603, "Full-pretrain/Step Time": 17.624967623502016} +{"Full-pretrain/Learning Rate": 1.9170058235166033e-05, "Full-pretrain/Loss": 1.915661096572876, "Full-pretrain/Loss (Raw)": 1.9078888893127441, "Full-pretrain/Step": 5604, "Full-pretrain/Step Time": 17.617024509236217} +{"Full-pretrain/Learning Rate": 1.916180187721081e-05, "Full-pretrain/Loss": 1.9247748851776123, "Full-pretrain/Loss (Raw)": 2.01788067817688, "Full-pretrain/Step": 5605, "Full-pretrain/Step Time": 17.62056644819677} +{"Full-pretrain/Learning Rate": 1.9153546192689694e-05, "Full-pretrain/Loss": 1.931185007095337, "Full-pretrain/Loss (Raw)": 1.769078254699707, "Full-pretrain/Step": 5606, "Full-pretrain/Step Time": 17.614499863237143} +{"Full-pretrain/Learning Rate": 1.914529118255496e-05, "Full-pretrain/Loss": 1.9357459545135498, "Full-pretrain/Loss (Raw)": 2.0772147178649902, "Full-pretrain/Step": 5607, "Full-pretrain/Step Time": 17.613938484340906} +{"Full-pretrain/Learning Rate": 1.913703684775884e-05, "Full-pretrain/Loss": 1.9214513301849365, "Full-pretrain/Loss (Raw)": 1.6322604417800903, "Full-pretrain/Step": 5608, "Full-pretrain/Step Time": 17.609737953171134} +{"Full-pretrain/Learning Rate": 1.912878318925346e-05, "Full-pretrain/Loss": 1.9081788063049316, "Full-pretrain/Loss (Raw)": 1.7072241306304932, "Full-pretrain/Step": 5609, "Full-pretrain/Step Time": 17.6145312897861} +{"Full-pretrain/Learning Rate": 1.9120530207990875e-05, "Full-pretrain/Loss": 1.8941750526428223, "Full-pretrain/Loss (Raw)": 1.397073745727539, "Full-pretrain/Step": 5610, "Full-pretrain/Step Time": 17.615207344293594} +{"Full-pretrain/Learning Rate": 1.9112277904923065e-05, "Full-pretrain/Loss": 1.900191307067871, "Full-pretrain/Loss (Raw)": 2.232882022857666, "Full-pretrain/Step": 5611, "Full-pretrain/Step Time": 17.610660437494516} +{"Full-pretrain/Learning Rate": 1.9104026281001926e-05, "Full-pretrain/Loss": 1.9079216718673706, "Full-pretrain/Loss (Raw)": 1.8110164403915405, "Full-pretrain/Step": 5612, "Full-pretrain/Step Time": 17.615790750831366} +{"Full-pretrain/Learning Rate": 1.9095775337179282e-05, "Full-pretrain/Loss": 1.9048811197280884, "Full-pretrain/Loss (Raw)": 2.031179428100586, "Full-pretrain/Step": 5613, "Full-pretrain/Step Time": 17.60863467119634} +{"Full-pretrain/Learning Rate": 1.908752507440689e-05, "Full-pretrain/Loss": 1.908104658126831, "Full-pretrain/Loss (Raw)": 2.1612558364868164, "Full-pretrain/Step": 5614, "Full-pretrain/Step Time": 17.607371758669615} +{"Full-pretrain/Learning Rate": 1.9079275493636392e-05, "Full-pretrain/Loss": 1.9089869260787964, "Full-pretrain/Loss (Raw)": 1.9652352333068848, "Full-pretrain/Step": 5615, "Full-pretrain/Step Time": 17.6084348205477} +{"Full-pretrain/Learning Rate": 1.9071026595819386e-05, "Full-pretrain/Loss": 1.9087401628494263, "Full-pretrain/Loss (Raw)": 1.8344054222106934, "Full-pretrain/Step": 5616, "Full-pretrain/Step Time": 17.610706567764282} +{"Full-pretrain/Learning Rate": 1.9062778381907376e-05, "Full-pretrain/Loss": 1.9137179851531982, "Full-pretrain/Loss (Raw)": 1.855059027671814, "Full-pretrain/Step": 5617, "Full-pretrain/Step Time": 17.613689851015806} +{"Full-pretrain/Learning Rate": 1.90545308528518e-05, "Full-pretrain/Loss": 1.9087915420532227, "Full-pretrain/Loss (Raw)": 1.884039282798767, "Full-pretrain/Step": 5618, "Full-pretrain/Step Time": 17.61421055532992} +{"Full-pretrain/Learning Rate": 1.9046284009604e-05, "Full-pretrain/Loss": 1.917123556137085, "Full-pretrain/Loss (Raw)": 2.0373082160949707, "Full-pretrain/Step": 5619, "Full-pretrain/Step Time": 17.619402527809143} +{"Full-pretrain/Learning Rate": 1.9038037853115248e-05, "Full-pretrain/Loss": 1.9089155197143555, "Full-pretrain/Loss (Raw)": 1.7858985662460327, "Full-pretrain/Step": 5620, "Full-pretrain/Step Time": 17.62040259130299} +{"Full-pretrain/Learning Rate": 1.9029792384336728e-05, "Full-pretrain/Loss": 1.913489580154419, "Full-pretrain/Loss (Raw)": 2.0960710048675537, "Full-pretrain/Step": 5621, "Full-pretrain/Step Time": 17.619063034653664} +{"Full-pretrain/Learning Rate": 1.9021547604219558e-05, "Full-pretrain/Loss": 1.915994644165039, "Full-pretrain/Loss (Raw)": 1.8884572982788086, "Full-pretrain/Step": 5622, "Full-pretrain/Step Time": 17.626649759709835} +{"Full-pretrain/Learning Rate": 1.9013303513714774e-05, "Full-pretrain/Loss": 1.9358627796173096, "Full-pretrain/Loss (Raw)": 2.597384452819824, "Full-pretrain/Step": 5623, "Full-pretrain/Step Time": 17.62815684080124} +{"Full-pretrain/Learning Rate": 1.9005060113773333e-05, "Full-pretrain/Loss": 1.9392915964126587, "Full-pretrain/Loss (Raw)": 2.003291130065918, "Full-pretrain/Step": 5624, "Full-pretrain/Step Time": 17.627458760514855} +{"Full-pretrain/Learning Rate": 1.8996817405346093e-05, "Full-pretrain/Loss": 1.9297940731048584, "Full-pretrain/Loss (Raw)": 1.8535408973693848, "Full-pretrain/Step": 5625, "Full-pretrain/Step Time": 17.629578286781907} +{"Full-pretrain/Learning Rate": 1.8988575389383853e-05, "Full-pretrain/Loss": 1.9299051761627197, "Full-pretrain/Loss (Raw)": 2.0257625579833984, "Full-pretrain/Step": 5626, "Full-pretrain/Step Time": 17.635678339749575} +{"Full-pretrain/Learning Rate": 1.8980334066837332e-05, "Full-pretrain/Loss": 1.9126648902893066, "Full-pretrain/Loss (Raw)": 1.6020293235778809, "Full-pretrain/Step": 5627, "Full-pretrain/Step Time": 17.642666583880782} +{"Full-pretrain/Learning Rate": 1.8972093438657166e-05, "Full-pretrain/Loss": 1.913224697113037, "Full-pretrain/Loss (Raw)": 1.9949415922164917, "Full-pretrain/Step": 5628, "Full-pretrain/Step Time": 17.642191257327795} +{"Full-pretrain/Learning Rate": 1.8963853505793898e-05, "Full-pretrain/Loss": 1.934755563735962, "Full-pretrain/Loss (Raw)": 2.3094675540924072, "Full-pretrain/Step": 5629, "Full-pretrain/Step Time": 17.6440713647753} +{"Full-pretrain/Learning Rate": 1.8955614269198015e-05, "Full-pretrain/Loss": 1.9319913387298584, "Full-pretrain/Loss (Raw)": 2.1602609157562256, "Full-pretrain/Step": 5630, "Full-pretrain/Step Time": 17.644071316346526} +{"Full-pretrain/Learning Rate": 1.8947375729819894e-05, "Full-pretrain/Loss": 1.939851999282837, "Full-pretrain/Loss (Raw)": 2.12394380569458, "Full-pretrain/Step": 5631, "Full-pretrain/Step Time": 17.64538150653243} +{"Full-pretrain/Learning Rate": 1.8939137888609855e-05, "Full-pretrain/Loss": 1.9500279426574707, "Full-pretrain/Loss (Raw)": 2.284153938293457, "Full-pretrain/Step": 5632, "Full-pretrain/Step Time": 17.645160097628832} +{"Full-pretrain/Learning Rate": 1.8930900746518128e-05, "Full-pretrain/Loss": 1.9575514793395996, "Full-pretrain/Loss (Raw)": 2.0843238830566406, "Full-pretrain/Step": 5633, "Full-pretrain/Step Time": 17.64665726572275} +{"Full-pretrain/Learning Rate": 1.892266430449487e-05, "Full-pretrain/Loss": 1.9695658683776855, "Full-pretrain/Loss (Raw)": 2.099391460418701, "Full-pretrain/Step": 5634, "Full-pretrain/Step Time": 17.64413008838892} +{"Full-pretrain/Learning Rate": 1.891442856349016e-05, "Full-pretrain/Loss": 1.971311092376709, "Full-pretrain/Loss (Raw)": 1.852036714553833, "Full-pretrain/Step": 5635, "Full-pretrain/Step Time": 17.637480922043324} +{"Full-pretrain/Learning Rate": 1.8906193524453964e-05, "Full-pretrain/Loss": 1.9757254123687744, "Full-pretrain/Loss (Raw)": 2.0491483211517334, "Full-pretrain/Step": 5636, "Full-pretrain/Step Time": 17.632827086374164} +{"Full-pretrain/Learning Rate": 1.8897959188336206e-05, "Full-pretrain/Loss": 1.9688730239868164, "Full-pretrain/Loss (Raw)": 1.7986021041870117, "Full-pretrain/Step": 5637, "Full-pretrain/Step Time": 17.629450162872672} +{"Full-pretrain/Learning Rate": 1.8889725556086713e-05, "Full-pretrain/Loss": 1.9746003150939941, "Full-pretrain/Loss (Raw)": 1.9523491859436035, "Full-pretrain/Step": 5638, "Full-pretrain/Step Time": 17.63005255907774} +{"Full-pretrain/Learning Rate": 1.8881492628655223e-05, "Full-pretrain/Loss": 1.976184606552124, "Full-pretrain/Loss (Raw)": 2.1279168128967285, "Full-pretrain/Step": 5639, "Full-pretrain/Step Time": 17.630477964878082} +{"Full-pretrain/Learning Rate": 1.887326040699142e-05, "Full-pretrain/Loss": 1.9822661876678467, "Full-pretrain/Loss (Raw)": 1.8268709182739258, "Full-pretrain/Step": 5640, "Full-pretrain/Step Time": 17.623844504356384} +{"Full-pretrain/Learning Rate": 1.886502889204487e-05, "Full-pretrain/Loss": 1.9892276525497437, "Full-pretrain/Loss (Raw)": 1.9299907684326172, "Full-pretrain/Step": 5641, "Full-pretrain/Step Time": 17.627883916720748} +{"Full-pretrain/Learning Rate": 1.8856798084765077e-05, "Full-pretrain/Loss": 2.010624885559082, "Full-pretrain/Loss (Raw)": 2.081786632537842, "Full-pretrain/Step": 5642, "Full-pretrain/Step Time": 17.627426395192742} +{"Full-pretrain/Learning Rate": 1.8848567986101467e-05, "Full-pretrain/Loss": 2.004465103149414, "Full-pretrain/Loss (Raw)": 2.0357680320739746, "Full-pretrain/Step": 5643, "Full-pretrain/Step Time": 17.62413244508207} +{"Full-pretrain/Learning Rate": 1.8840338597003384e-05, "Full-pretrain/Loss": 1.9899497032165527, "Full-pretrain/Loss (Raw)": 1.346522569656372, "Full-pretrain/Step": 5644, "Full-pretrain/Step Time": 17.622238416224718} +{"Full-pretrain/Learning Rate": 1.8832109918420074e-05, "Full-pretrain/Loss": 1.9924445152282715, "Full-pretrain/Loss (Raw)": 2.1110143661499023, "Full-pretrain/Step": 5645, "Full-pretrain/Step Time": 17.618828613311052} +{"Full-pretrain/Learning Rate": 1.8823881951300727e-05, "Full-pretrain/Loss": 1.9908850193023682, "Full-pretrain/Loss (Raw)": 2.111348867416382, "Full-pretrain/Step": 5646, "Full-pretrain/Step Time": 17.625355821102858} +{"Full-pretrain/Learning Rate": 1.8815654696594418e-05, "Full-pretrain/Loss": 1.9839401245117188, "Full-pretrain/Loss (Raw)": 1.7430009841918945, "Full-pretrain/Step": 5647, "Full-pretrain/Step Time": 17.628236697986722} +{"Full-pretrain/Learning Rate": 1.8807428155250164e-05, "Full-pretrain/Loss": 1.990680456161499, "Full-pretrain/Loss (Raw)": 2.0500950813293457, "Full-pretrain/Step": 5648, "Full-pretrain/Step Time": 17.629779746755958} +{"Full-pretrain/Learning Rate": 1.87992023282169e-05, "Full-pretrain/Loss": 1.9988219738006592, "Full-pretrain/Loss (Raw)": 2.115589141845703, "Full-pretrain/Step": 5649, "Full-pretrain/Step Time": 17.625159794464707} +{"Full-pretrain/Learning Rate": 1.879097721644346e-05, "Full-pretrain/Loss": 1.9959425926208496, "Full-pretrain/Loss (Raw)": 1.7918943166732788, "Full-pretrain/Step": 5650, "Full-pretrain/Step Time": 17.625807063654065} +{"Full-pretrain/Learning Rate": 1.8782752820878634e-05, "Full-pretrain/Loss": 1.999048113822937, "Full-pretrain/Loss (Raw)": 2.136688709259033, "Full-pretrain/Step": 5651, "Full-pretrain/Step Time": 17.62604083865881} +{"Full-pretrain/Learning Rate": 1.8774529142471074e-05, "Full-pretrain/Loss": 1.993614673614502, "Full-pretrain/Loss (Raw)": 1.6120309829711914, "Full-pretrain/Step": 5652, "Full-pretrain/Step Time": 17.628955248743296} +{"Full-pretrain/Learning Rate": 1.8766306182169394e-05, "Full-pretrain/Loss": 1.9872236251831055, "Full-pretrain/Loss (Raw)": 1.8915538787841797, "Full-pretrain/Step": 5653, "Full-pretrain/Step Time": 17.627022629603744} +{"Full-pretrain/Learning Rate": 1.87580839409221e-05, "Full-pretrain/Loss": 1.9951937198638916, "Full-pretrain/Loss (Raw)": 2.143500804901123, "Full-pretrain/Step": 5654, "Full-pretrain/Step Time": 17.623764449730515} +{"Full-pretrain/Learning Rate": 1.8749862419677626e-05, "Full-pretrain/Loss": 1.9679197072982788, "Full-pretrain/Loss (Raw)": 1.7246140241622925, "Full-pretrain/Step": 5655, "Full-pretrain/Step Time": 17.624057358130813} +{"Full-pretrain/Learning Rate": 1.874164161938434e-05, "Full-pretrain/Loss": 1.9673914909362793, "Full-pretrain/Loss (Raw)": 1.9863932132720947, "Full-pretrain/Step": 5656, "Full-pretrain/Step Time": 17.624554056674242} +{"Full-pretrain/Learning Rate": 1.8733421540990484e-05, "Full-pretrain/Loss": 1.9692256450653076, "Full-pretrain/Loss (Raw)": 1.9122265577316284, "Full-pretrain/Step": 5657, "Full-pretrain/Step Time": 17.620935076847672} +{"Full-pretrain/Learning Rate": 1.8725202185444247e-05, "Full-pretrain/Loss": 1.9697353839874268, "Full-pretrain/Loss (Raw)": 2.0420753955841064, "Full-pretrain/Step": 5658, "Full-pretrain/Step Time": 17.626021306961775} +{"Full-pretrain/Learning Rate": 1.8716983553693736e-05, "Full-pretrain/Loss": 1.975618600845337, "Full-pretrain/Loss (Raw)": 1.7902902364730835, "Full-pretrain/Step": 5659, "Full-pretrain/Step Time": 17.61571121774614} +{"Full-pretrain/Learning Rate": 1.8708765646686972e-05, "Full-pretrain/Loss": 1.9762167930603027, "Full-pretrain/Loss (Raw)": 2.014087677001953, "Full-pretrain/Step": 5660, "Full-pretrain/Step Time": 17.62196463532746} +{"Full-pretrain/Learning Rate": 1.8700548465371874e-05, "Full-pretrain/Loss": 1.96499764919281, "Full-pretrain/Loss (Raw)": 1.9504526853561401, "Full-pretrain/Step": 5661, "Full-pretrain/Step Time": 17.610531952232122} +{"Full-pretrain/Learning Rate": 1.86923320106963e-05, "Full-pretrain/Loss": 1.954904556274414, "Full-pretrain/Loss (Raw)": 1.837282657623291, "Full-pretrain/Step": 5662, "Full-pretrain/Step Time": 17.612049164250493} +{"Full-pretrain/Learning Rate": 1.8684116283608006e-05, "Full-pretrain/Loss": 1.951714277267456, "Full-pretrain/Loss (Raw)": 2.021853446960449, "Full-pretrain/Step": 5663, "Full-pretrain/Step Time": 17.612155988812447} +{"Full-pretrain/Learning Rate": 1.867590128505468e-05, "Full-pretrain/Loss": 1.9482365846633911, "Full-pretrain/Loss (Raw)": 2.172870635986328, "Full-pretrain/Step": 5664, "Full-pretrain/Step Time": 17.619130106642842} +{"Full-pretrain/Learning Rate": 1.8667687015983913e-05, "Full-pretrain/Loss": 1.9465734958648682, "Full-pretrain/Loss (Raw)": 2.0311014652252197, "Full-pretrain/Step": 5665, "Full-pretrain/Step Time": 17.614683819934726} +{"Full-pretrain/Learning Rate": 1.865947347734323e-05, "Full-pretrain/Loss": 1.9372196197509766, "Full-pretrain/Loss (Raw)": 1.800067663192749, "Full-pretrain/Step": 5666, "Full-pretrain/Step Time": 17.62386321462691} +{"Full-pretrain/Learning Rate": 1.8651260670080063e-05, "Full-pretrain/Loss": 1.9365861415863037, "Full-pretrain/Loss (Raw)": 1.8317652940750122, "Full-pretrain/Step": 5667, "Full-pretrain/Step Time": 17.619732486084104} +{"Full-pretrain/Learning Rate": 1.8643048595141733e-05, "Full-pretrain/Loss": 1.9376161098480225, "Full-pretrain/Loss (Raw)": 2.0821099281311035, "Full-pretrain/Step": 5668, "Full-pretrain/Step Time": 17.619006553664804} +{"Full-pretrain/Learning Rate": 1.863483725347552e-05, "Full-pretrain/Loss": 1.9410374164581299, "Full-pretrain/Loss (Raw)": 1.908080816268921, "Full-pretrain/Step": 5669, "Full-pretrain/Step Time": 17.619031868875027} +{"Full-pretrain/Learning Rate": 1.862662664602859e-05, "Full-pretrain/Loss": 1.9391754865646362, "Full-pretrain/Loss (Raw)": 1.892770767211914, "Full-pretrain/Step": 5670, "Full-pretrain/Step Time": 17.617109552025795} +{"Full-pretrain/Learning Rate": 1.861841677374803e-05, "Full-pretrain/Loss": 1.939103126525879, "Full-pretrain/Loss (Raw)": 2.1255977153778076, "Full-pretrain/Step": 5671, "Full-pretrain/Step Time": 17.617053454741836} +{"Full-pretrain/Learning Rate": 1.8610207637580872e-05, "Full-pretrain/Loss": 1.9494202136993408, "Full-pretrain/Loss (Raw)": 2.157024621963501, "Full-pretrain/Step": 5672, "Full-pretrain/Step Time": 17.614692302420735} +{"Full-pretrain/Learning Rate": 1.8601999238474e-05, "Full-pretrain/Loss": 1.9475947618484497, "Full-pretrain/Loss (Raw)": 1.8715710639953613, "Full-pretrain/Step": 5673, "Full-pretrain/Step Time": 17.611886458471417} +{"Full-pretrain/Learning Rate": 1.859379157737427e-05, "Full-pretrain/Loss": 1.9457125663757324, "Full-pretrain/Loss (Raw)": 2.021559953689575, "Full-pretrain/Step": 5674, "Full-pretrain/Step Time": 17.61659155599773} +{"Full-pretrain/Learning Rate": 1.858558465522843e-05, "Full-pretrain/Loss": 1.9503705501556396, "Full-pretrain/Loss (Raw)": 2.1848201751708984, "Full-pretrain/Step": 5675, "Full-pretrain/Step Time": 17.608988534659147} +{"Full-pretrain/Learning Rate": 1.857737847298315e-05, "Full-pretrain/Loss": 1.9755955934524536, "Full-pretrain/Loss (Raw)": 2.1537246704101562, "Full-pretrain/Step": 5676, "Full-pretrain/Step Time": 17.60578084923327} +{"Full-pretrain/Learning Rate": 1.856917303158501e-05, "Full-pretrain/Loss": 1.9709163904190063, "Full-pretrain/Loss (Raw)": 1.9612805843353271, "Full-pretrain/Step": 5677, "Full-pretrain/Step Time": 17.60795529000461} +{"Full-pretrain/Learning Rate": 1.8560968331980493e-05, "Full-pretrain/Loss": 1.9637584686279297, "Full-pretrain/Loss (Raw)": 1.8822968006134033, "Full-pretrain/Step": 5678, "Full-pretrain/Step Time": 17.60847420617938} +{"Full-pretrain/Learning Rate": 1.8552764375116023e-05, "Full-pretrain/Loss": 1.9615356922149658, "Full-pretrain/Loss (Raw)": 1.6718710660934448, "Full-pretrain/Step": 5679, "Full-pretrain/Step Time": 17.605982184410095} +{"Full-pretrain/Learning Rate": 1.8544561161937906e-05, "Full-pretrain/Loss": 1.9568455219268799, "Full-pretrain/Loss (Raw)": 1.9000091552734375, "Full-pretrain/Step": 5680, "Full-pretrain/Step Time": 17.607931232079864} +{"Full-pretrain/Learning Rate": 1.8536358693392398e-05, "Full-pretrain/Loss": 1.9489197731018066, "Full-pretrain/Loss (Raw)": 1.8619675636291504, "Full-pretrain/Step": 5681, "Full-pretrain/Step Time": 17.599713686853647} +{"Full-pretrain/Learning Rate": 1.8528156970425647e-05, "Full-pretrain/Loss": 1.94211745262146, "Full-pretrain/Loss (Raw)": 1.5742191076278687, "Full-pretrain/Step": 5682, "Full-pretrain/Step Time": 17.604355558753014} +{"Full-pretrain/Learning Rate": 1.851995599398371e-05, "Full-pretrain/Loss": 1.9359180927276611, "Full-pretrain/Loss (Raw)": 1.9383105039596558, "Full-pretrain/Step": 5683, "Full-pretrain/Step Time": 17.596518211066723} +{"Full-pretrain/Learning Rate": 1.8511755765012566e-05, "Full-pretrain/Loss": 1.9458632469177246, "Full-pretrain/Loss (Raw)": 1.930277705192566, "Full-pretrain/Step": 5684, "Full-pretrain/Step Time": 17.595579320564866} +{"Full-pretrain/Learning Rate": 1.850355628445812e-05, "Full-pretrain/Loss": 1.95089852809906, "Full-pretrain/Loss (Raw)": 2.0526788234710693, "Full-pretrain/Step": 5685, "Full-pretrain/Step Time": 17.592760799452662} +{"Full-pretrain/Learning Rate": 1.8495357553266178e-05, "Full-pretrain/Loss": 1.9397817850112915, "Full-pretrain/Loss (Raw)": 1.787765383720398, "Full-pretrain/Step": 5686, "Full-pretrain/Step Time": 17.59881736896932} +{"Full-pretrain/Learning Rate": 1.848715957238245e-05, "Full-pretrain/Loss": 1.940391182899475, "Full-pretrain/Loss (Raw)": 1.7441132068634033, "Full-pretrain/Step": 5687, "Full-pretrain/Step Time": 17.594203965738416} +{"Full-pretrain/Learning Rate": 1.8478962342752583e-05, "Full-pretrain/Loss": 1.9387564659118652, "Full-pretrain/Loss (Raw)": 1.9340837001800537, "Full-pretrain/Step": 5688, "Full-pretrain/Step Time": 17.598385201767087} +{"Full-pretrain/Learning Rate": 1.8470765865322113e-05, "Full-pretrain/Loss": 1.9270806312561035, "Full-pretrain/Loss (Raw)": 1.538597583770752, "Full-pretrain/Step": 5689, "Full-pretrain/Step Time": 17.59281884878874} +{"Full-pretrain/Learning Rate": 1.8462570141036505e-05, "Full-pretrain/Loss": 1.922348141670227, "Full-pretrain/Loss (Raw)": 1.890636682510376, "Full-pretrain/Step": 5690, "Full-pretrain/Step Time": 17.59407901018858} +{"Full-pretrain/Learning Rate": 1.845437517084113e-05, "Full-pretrain/Loss": 1.932521104812622, "Full-pretrain/Loss (Raw)": 2.11582350730896, "Full-pretrain/Step": 5691, "Full-pretrain/Step Time": 17.58811630681157} +{"Full-pretrain/Learning Rate": 1.8446180955681282e-05, "Full-pretrain/Loss": 1.9352554082870483, "Full-pretrain/Loss (Raw)": 2.1015877723693848, "Full-pretrain/Step": 5692, "Full-pretrain/Step Time": 17.59313871897757} +{"Full-pretrain/Learning Rate": 1.843798749650217e-05, "Full-pretrain/Loss": 1.934367299079895, "Full-pretrain/Loss (Raw)": 1.922032356262207, "Full-pretrain/Step": 5693, "Full-pretrain/Step Time": 17.59083380922675} +{"Full-pretrain/Learning Rate": 1.8429794794248877e-05, "Full-pretrain/Loss": 1.9326109886169434, "Full-pretrain/Loss (Raw)": 1.7810834646224976, "Full-pretrain/Step": 5694, "Full-pretrain/Step Time": 17.59151427820325} +{"Full-pretrain/Learning Rate": 1.842160284986646e-05, "Full-pretrain/Loss": 1.9338197708129883, "Full-pretrain/Loss (Raw)": 2.060535430908203, "Full-pretrain/Step": 5695, "Full-pretrain/Step Time": 17.587498504668474} +{"Full-pretrain/Learning Rate": 1.8413411664299828e-05, "Full-pretrain/Loss": 1.9305574893951416, "Full-pretrain/Loss (Raw)": 2.0684778690338135, "Full-pretrain/Step": 5696, "Full-pretrain/Step Time": 17.593162367120385} +{"Full-pretrain/Learning Rate": 1.840522123849385e-05, "Full-pretrain/Loss": 1.939355731010437, "Full-pretrain/Loss (Raw)": 2.312643527984619, "Full-pretrain/Step": 5697, "Full-pretrain/Step Time": 17.593997908756137} +{"Full-pretrain/Learning Rate": 1.8397031573393297e-05, "Full-pretrain/Loss": 1.952871322631836, "Full-pretrain/Loss (Raw)": 2.2325692176818848, "Full-pretrain/Step": 5698, "Full-pretrain/Step Time": 17.589209662750363} +{"Full-pretrain/Learning Rate": 1.838884266994282e-05, "Full-pretrain/Loss": 1.9482991695404053, "Full-pretrain/Loss (Raw)": 1.6854513883590698, "Full-pretrain/Step": 5699, "Full-pretrain/Step Time": 17.588949078693986} +{"Full-pretrain/Learning Rate": 1.8380654529087017e-05, "Full-pretrain/Loss": 1.9470460414886475, "Full-pretrain/Loss (Raw)": 2.0420117378234863, "Full-pretrain/Step": 5700, "Full-pretrain/Step Time": 17.59163996949792} +{"Full-pretrain/Learning Rate": 1.8372467151770388e-05, "Full-pretrain/Loss": 1.9445290565490723, "Full-pretrain/Loss (Raw)": 1.8275398015975952, "Full-pretrain/Step": 5701, "Full-pretrain/Step Time": 17.596641585230827} +{"Full-pretrain/Learning Rate": 1.8364280538937352e-05, "Full-pretrain/Loss": 1.9486280679702759, "Full-pretrain/Loss (Raw)": 2.0239365100860596, "Full-pretrain/Step": 5702, "Full-pretrain/Step Time": 17.592229805886745} +{"Full-pretrain/Learning Rate": 1.835609469153222e-05, "Full-pretrain/Loss": 1.9484682083129883, "Full-pretrain/Loss (Raw)": 2.1204822063446045, "Full-pretrain/Step": 5703, "Full-pretrain/Step Time": 17.59276690147817} +{"Full-pretrain/Learning Rate": 1.834790961049923e-05, "Full-pretrain/Loss": 1.9345004558563232, "Full-pretrain/Loss (Raw)": 1.7100567817687988, "Full-pretrain/Step": 5704, "Full-pretrain/Step Time": 17.589115465059876} +{"Full-pretrain/Learning Rate": 1.8339725296782525e-05, "Full-pretrain/Loss": 1.93928062915802, "Full-pretrain/Loss (Raw)": 2.024536371231079, "Full-pretrain/Step": 5705, "Full-pretrain/Step Time": 17.585855534300208} +{"Full-pretrain/Learning Rate": 1.8331541751326167e-05, "Full-pretrain/Loss": 1.9432058334350586, "Full-pretrain/Loss (Raw)": 2.1471662521362305, "Full-pretrain/Step": 5706, "Full-pretrain/Step Time": 17.578593177720904} +{"Full-pretrain/Learning Rate": 1.8323358975074124e-05, "Full-pretrain/Loss": 1.9181344509124756, "Full-pretrain/Loss (Raw)": 1.3825342655181885, "Full-pretrain/Step": 5707, "Full-pretrain/Step Time": 17.582201959565282} +{"Full-pretrain/Learning Rate": 1.8315176968970277e-05, "Full-pretrain/Loss": 1.9068516492843628, "Full-pretrain/Loss (Raw)": 1.7926769256591797, "Full-pretrain/Step": 5708, "Full-pretrain/Step Time": 17.588273836299777} +{"Full-pretrain/Learning Rate": 1.8306995733958425e-05, "Full-pretrain/Loss": 1.9107102155685425, "Full-pretrain/Loss (Raw)": 2.084754467010498, "Full-pretrain/Step": 5709, "Full-pretrain/Step Time": 17.586729833856225} +{"Full-pretrain/Learning Rate": 1.8298815270982258e-05, "Full-pretrain/Loss": 1.911386251449585, "Full-pretrain/Loss (Raw)": 1.9039280414581299, "Full-pretrain/Step": 5710, "Full-pretrain/Step Time": 17.588951211422682} +{"Full-pretrain/Learning Rate": 1.8290635580985394e-05, "Full-pretrain/Loss": 1.9195029735565186, "Full-pretrain/Loss (Raw)": 1.9316074848175049, "Full-pretrain/Step": 5711, "Full-pretrain/Step Time": 17.589732326567173} +{"Full-pretrain/Learning Rate": 1.828245666491136e-05, "Full-pretrain/Loss": 1.9162712097167969, "Full-pretrain/Loss (Raw)": 1.7965928316116333, "Full-pretrain/Step": 5712, "Full-pretrain/Step Time": 17.591531662270427} +{"Full-pretrain/Learning Rate": 1.8274278523703583e-05, "Full-pretrain/Loss": 1.9193124771118164, "Full-pretrain/Loss (Raw)": 1.9592899084091187, "Full-pretrain/Step": 5713, "Full-pretrain/Step Time": 17.59644248150289} +{"Full-pretrain/Learning Rate": 1.8266101158305427e-05, "Full-pretrain/Loss": 1.928929090499878, "Full-pretrain/Loss (Raw)": 1.8819458484649658, "Full-pretrain/Step": 5714, "Full-pretrain/Step Time": 17.598874274641275} +{"Full-pretrain/Learning Rate": 1.8257924569660126e-05, "Full-pretrain/Loss": 1.931302547454834, "Full-pretrain/Loss (Raw)": 2.0142629146575928, "Full-pretrain/Step": 5715, "Full-pretrain/Step Time": 17.596830734983087} +{"Full-pretrain/Learning Rate": 1.8249748758710854e-05, "Full-pretrain/Loss": 1.9310452938079834, "Full-pretrain/Loss (Raw)": 1.922046422958374, "Full-pretrain/Step": 5716, "Full-pretrain/Step Time": 17.594968205317855} +{"Full-pretrain/Learning Rate": 1.8241573726400695e-05, "Full-pretrain/Loss": 1.926761507987976, "Full-pretrain/Loss (Raw)": 1.915595531463623, "Full-pretrain/Step": 5717, "Full-pretrain/Step Time": 17.599690092727542} +{"Full-pretrain/Learning Rate": 1.823339947367263e-05, "Full-pretrain/Loss": 1.9351184368133545, "Full-pretrain/Loss (Raw)": 2.0551881790161133, "Full-pretrain/Step": 5718, "Full-pretrain/Step Time": 17.59597871825099} +{"Full-pretrain/Learning Rate": 1.8225226001469566e-05, "Full-pretrain/Loss": 1.9368962049484253, "Full-pretrain/Loss (Raw)": 1.801001787185669, "Full-pretrain/Step": 5719, "Full-pretrain/Step Time": 17.5999092515558} +{"Full-pretrain/Learning Rate": 1.8217053310734294e-05, "Full-pretrain/Loss": 1.9462006092071533, "Full-pretrain/Loss (Raw)": 2.2318263053894043, "Full-pretrain/Step": 5720, "Full-pretrain/Step Time": 17.59815128520131} +{"Full-pretrain/Learning Rate": 1.8208881402409543e-05, "Full-pretrain/Loss": 1.954514741897583, "Full-pretrain/Loss (Raw)": 1.804649829864502, "Full-pretrain/Step": 5721, "Full-pretrain/Step Time": 17.600153390318155} +{"Full-pretrain/Learning Rate": 1.8200710277437928e-05, "Full-pretrain/Loss": 1.9402422904968262, "Full-pretrain/Loss (Raw)": 1.4339170455932617, "Full-pretrain/Step": 5722, "Full-pretrain/Step Time": 17.592970937490463} +{"Full-pretrain/Learning Rate": 1.8192539936761996e-05, "Full-pretrain/Loss": 1.9309266805648804, "Full-pretrain/Loss (Raw)": 1.8177241086959839, "Full-pretrain/Step": 5723, "Full-pretrain/Step Time": 17.592211309820414} +{"Full-pretrain/Learning Rate": 1.81843703813242e-05, "Full-pretrain/Loss": 1.9236729145050049, "Full-pretrain/Loss (Raw)": 1.8694663047790527, "Full-pretrain/Step": 5724, "Full-pretrain/Step Time": 17.598913801833987} +{"Full-pretrain/Learning Rate": 1.817620161206687e-05, "Full-pretrain/Loss": 1.926790714263916, "Full-pretrain/Loss (Raw)": 2.0218043327331543, "Full-pretrain/Step": 5725, "Full-pretrain/Step Time": 17.596558405086398} +{"Full-pretrain/Learning Rate": 1.8168033629932297e-05, "Full-pretrain/Loss": 1.928802490234375, "Full-pretrain/Loss (Raw)": 1.845460057258606, "Full-pretrain/Step": 5726, "Full-pretrain/Step Time": 17.60220581293106} +{"Full-pretrain/Learning Rate": 1.8159866435862635e-05, "Full-pretrain/Loss": 1.9221842288970947, "Full-pretrain/Loss (Raw)": 1.8487486839294434, "Full-pretrain/Step": 5727, "Full-pretrain/Step Time": 17.592452788725495} +{"Full-pretrain/Learning Rate": 1.8151700030799982e-05, "Full-pretrain/Loss": 1.9167910814285278, "Full-pretrain/Loss (Raw)": 1.895897626876831, "Full-pretrain/Step": 5728, "Full-pretrain/Step Time": 17.595085065811872} +{"Full-pretrain/Learning Rate": 1.814353441568632e-05, "Full-pretrain/Loss": 1.8963277339935303, "Full-pretrain/Loss (Raw)": 1.6578178405761719, "Full-pretrain/Step": 5729, "Full-pretrain/Step Time": 17.59283276833594} +{"Full-pretrain/Learning Rate": 1.8135369591463565e-05, "Full-pretrain/Loss": 1.8880388736724854, "Full-pretrain/Loss (Raw)": 1.9673247337341309, "Full-pretrain/Step": 5730, "Full-pretrain/Step Time": 17.60036345012486} +{"Full-pretrain/Learning Rate": 1.8127205559073507e-05, "Full-pretrain/Loss": 1.8939486742019653, "Full-pretrain/Loss (Raw)": 1.874565601348877, "Full-pretrain/Step": 5731, "Full-pretrain/Step Time": 17.596309900283813} +{"Full-pretrain/Learning Rate": 1.8119042319457868e-05, "Full-pretrain/Loss": 1.8930041790008545, "Full-pretrain/Loss (Raw)": 2.0117902755737305, "Full-pretrain/Step": 5732, "Full-pretrain/Step Time": 17.596709839999676} +{"Full-pretrain/Learning Rate": 1.8110879873558278e-05, "Full-pretrain/Loss": 1.9048666954040527, "Full-pretrain/Loss (Raw)": 2.2071361541748047, "Full-pretrain/Step": 5733, "Full-pretrain/Step Time": 17.59942282177508} +{"Full-pretrain/Learning Rate": 1.8102718222316277e-05, "Full-pretrain/Loss": 1.9080820083618164, "Full-pretrain/Loss (Raw)": 2.126826524734497, "Full-pretrain/Step": 5734, "Full-pretrain/Step Time": 17.59793417342007} +{"Full-pretrain/Learning Rate": 1.8094557366673316e-05, "Full-pretrain/Loss": 1.9001576900482178, "Full-pretrain/Loss (Raw)": 1.8669054508209229, "Full-pretrain/Step": 5735, "Full-pretrain/Step Time": 17.605198927223682} +{"Full-pretrain/Learning Rate": 1.8086397307570723e-05, "Full-pretrain/Loss": 1.9066858291625977, "Full-pretrain/Loss (Raw)": 1.9189621210098267, "Full-pretrain/Step": 5736, "Full-pretrain/Step Time": 17.60184825770557} +{"Full-pretrain/Learning Rate": 1.807823804594978e-05, "Full-pretrain/Loss": 1.9058737754821777, "Full-pretrain/Loss (Raw)": 1.9985485076904297, "Full-pretrain/Step": 5737, "Full-pretrain/Step Time": 17.596085151657462} +{"Full-pretrain/Learning Rate": 1.8070079582751638e-05, "Full-pretrain/Loss": 1.8950921297073364, "Full-pretrain/Loss (Raw)": 1.8021504878997803, "Full-pretrain/Step": 5738, "Full-pretrain/Step Time": 17.598151160404086} +{"Full-pretrain/Learning Rate": 1.806192191891738e-05, "Full-pretrain/Loss": 1.9104197025299072, "Full-pretrain/Loss (Raw)": 1.8730169534683228, "Full-pretrain/Step": 5739, "Full-pretrain/Step Time": 17.59964657947421} +{"Full-pretrain/Learning Rate": 1.8053765055388004e-05, "Full-pretrain/Loss": 1.9195549488067627, "Full-pretrain/Loss (Raw)": 2.0850043296813965, "Full-pretrain/Step": 5740, "Full-pretrain/Step Time": 17.59490007907152} +{"Full-pretrain/Learning Rate": 1.8045608993104373e-05, "Full-pretrain/Loss": 1.9253515005111694, "Full-pretrain/Loss (Raw)": 2.2702462673187256, "Full-pretrain/Step": 5741, "Full-pretrain/Step Time": 17.602452060207725} +{"Full-pretrain/Learning Rate": 1.8037453733007303e-05, "Full-pretrain/Loss": 1.924399971961975, "Full-pretrain/Loss (Raw)": 1.8734781742095947, "Full-pretrain/Step": 5742, "Full-pretrain/Step Time": 17.604476373642683} +{"Full-pretrain/Learning Rate": 1.8029299276037498e-05, "Full-pretrain/Loss": 1.9292339086532593, "Full-pretrain/Loss (Raw)": 2.086293935775757, "Full-pretrain/Step": 5743, "Full-pretrain/Step Time": 17.60092382505536} +{"Full-pretrain/Learning Rate": 1.8021145623135575e-05, "Full-pretrain/Loss": 1.9296414852142334, "Full-pretrain/Loss (Raw)": 1.8096368312835693, "Full-pretrain/Step": 5744, "Full-pretrain/Step Time": 17.602968452498317} +{"Full-pretrain/Learning Rate": 1.8012992775242056e-05, "Full-pretrain/Loss": 1.9210706949234009, "Full-pretrain/Loss (Raw)": 1.685021162033081, "Full-pretrain/Step": 5745, "Full-pretrain/Step Time": 17.600009500980377} +{"Full-pretrain/Learning Rate": 1.8004840733297365e-05, "Full-pretrain/Loss": 1.9271934032440186, "Full-pretrain/Loss (Raw)": 2.077873706817627, "Full-pretrain/Step": 5746, "Full-pretrain/Step Time": 17.59929893910885} +{"Full-pretrain/Learning Rate": 1.7996689498241832e-05, "Full-pretrain/Loss": 1.9306056499481201, "Full-pretrain/Loss (Raw)": 2.1234564781188965, "Full-pretrain/Step": 5747, "Full-pretrain/Step Time": 17.596956811845303} +{"Full-pretrain/Learning Rate": 1.79885390710157e-05, "Full-pretrain/Loss": 1.928839921951294, "Full-pretrain/Loss (Raw)": 1.8655407428741455, "Full-pretrain/Step": 5748, "Full-pretrain/Step Time": 17.597880009561777} +{"Full-pretrain/Learning Rate": 1.7980389452559124e-05, "Full-pretrain/Loss": 1.9291645288467407, "Full-pretrain/Loss (Raw)": 1.9259867668151855, "Full-pretrain/Step": 5749, "Full-pretrain/Step Time": 17.59382499754429} +{"Full-pretrain/Learning Rate": 1.7972240643812162e-05, "Full-pretrain/Loss": 1.9318351745605469, "Full-pretrain/Loss (Raw)": 2.140650510787964, "Full-pretrain/Step": 5750, "Full-pretrain/Step Time": 17.590288143604994} +{"Full-pretrain/Learning Rate": 1.7964092645714776e-05, "Full-pretrain/Loss": 1.9346504211425781, "Full-pretrain/Loss (Raw)": 1.8910852670669556, "Full-pretrain/Step": 5751, "Full-pretrain/Step Time": 17.59626546315849} +{"Full-pretrain/Learning Rate": 1.7955945459206822e-05, "Full-pretrain/Loss": 1.934204339981079, "Full-pretrain/Loss (Raw)": 2.2175521850585938, "Full-pretrain/Step": 5752, "Full-pretrain/Step Time": 17.596630159765482} +{"Full-pretrain/Learning Rate": 1.794779908522809e-05, "Full-pretrain/Loss": 1.9445008039474487, "Full-pretrain/Loss (Raw)": 2.1341400146484375, "Full-pretrain/Step": 5753, "Full-pretrain/Step Time": 17.58906109444797} +{"Full-pretrain/Learning Rate": 1.793965352471825e-05, "Full-pretrain/Loss": 1.965191125869751, "Full-pretrain/Loss (Raw)": 2.0960071086883545, "Full-pretrain/Step": 5754, "Full-pretrain/Step Time": 17.583794178441167} +{"Full-pretrain/Learning Rate": 1.7931508778616895e-05, "Full-pretrain/Loss": 1.967247486114502, "Full-pretrain/Loss (Raw)": 1.8835256099700928, "Full-pretrain/Step": 5755, "Full-pretrain/Step Time": 17.580619433894753} +{"Full-pretrain/Learning Rate": 1.7923364847863527e-05, "Full-pretrain/Loss": 1.9730262756347656, "Full-pretrain/Loss (Raw)": 2.0543854236602783, "Full-pretrain/Step": 5756, "Full-pretrain/Step Time": 17.579948373138905} +{"Full-pretrain/Learning Rate": 1.791522173339753e-05, "Full-pretrain/Loss": 1.9842371940612793, "Full-pretrain/Loss (Raw)": 2.380554676055908, "Full-pretrain/Step": 5757, "Full-pretrain/Step Time": 17.576140876859426} +{"Full-pretrain/Learning Rate": 1.7907079436158213e-05, "Full-pretrain/Loss": 1.9920389652252197, "Full-pretrain/Loss (Raw)": 2.0951151847839355, "Full-pretrain/Step": 5758, "Full-pretrain/Step Time": 17.573028491809964} +{"Full-pretrain/Learning Rate": 1.789893795708479e-05, "Full-pretrain/Loss": 1.998142957687378, "Full-pretrain/Loss (Raw)": 2.0440759658813477, "Full-pretrain/Step": 5759, "Full-pretrain/Step Time": 17.572701821103692} +{"Full-pretrain/Learning Rate": 1.789079729711638e-05, "Full-pretrain/Loss": 2.0002760887145996, "Full-pretrain/Loss (Raw)": 1.964160442352295, "Full-pretrain/Step": 5760, "Full-pretrain/Step Time": 17.569166749715805} +{"Full-pretrain/Learning Rate": 1.7882657457192013e-05, "Full-pretrain/Loss": 2.0131571292877197, "Full-pretrain/Loss (Raw)": 2.0700082778930664, "Full-pretrain/Step": 5761, "Full-pretrain/Step Time": 17.572531336918473} +{"Full-pretrain/Learning Rate": 1.7874518438250597e-05, "Full-pretrain/Loss": 2.0212583541870117, "Full-pretrain/Loss (Raw)": 2.226569652557373, "Full-pretrain/Step": 5762, "Full-pretrain/Step Time": 17.57205589301884} +{"Full-pretrain/Learning Rate": 1.7866380241230983e-05, "Full-pretrain/Loss": 2.02308988571167, "Full-pretrain/Loss (Raw)": 1.9331738948822021, "Full-pretrain/Step": 5763, "Full-pretrain/Step Time": 17.57501356676221} +{"Full-pretrain/Learning Rate": 1.7858242867071896e-05, "Full-pretrain/Loss": 2.027937412261963, "Full-pretrain/Loss (Raw)": 2.166907548904419, "Full-pretrain/Step": 5764, "Full-pretrain/Step Time": 17.577692037448287} +{"Full-pretrain/Learning Rate": 1.785010631671198e-05, "Full-pretrain/Loss": 2.018465042114258, "Full-pretrain/Loss (Raw)": 1.9040162563323975, "Full-pretrain/Step": 5765, "Full-pretrain/Step Time": 17.57866076566279} +{"Full-pretrain/Learning Rate": 1.784197059108979e-05, "Full-pretrain/Loss": 2.013930320739746, "Full-pretrain/Loss (Raw)": 1.9817183017730713, "Full-pretrain/Step": 5766, "Full-pretrain/Step Time": 17.581395510584116} +{"Full-pretrain/Learning Rate": 1.7833835691143785e-05, "Full-pretrain/Loss": 2.027169704437256, "Full-pretrain/Loss (Raw)": 2.290565013885498, "Full-pretrain/Step": 5767, "Full-pretrain/Step Time": 17.582831824198365} +{"Full-pretrain/Learning Rate": 1.7825701617812307e-05, "Full-pretrain/Loss": 2.030061721801758, "Full-pretrain/Loss (Raw)": 2.011504650115967, "Full-pretrain/Step": 5768, "Full-pretrain/Step Time": 17.581470927223563} +{"Full-pretrain/Learning Rate": 1.7817568372033628e-05, "Full-pretrain/Loss": 2.0271196365356445, "Full-pretrain/Loss (Raw)": 1.9044110774993896, "Full-pretrain/Step": 5769, "Full-pretrain/Step Time": 17.581760980188847} +{"Full-pretrain/Learning Rate": 1.780943595474591e-05, "Full-pretrain/Loss": 2.028132677078247, "Full-pretrain/Loss (Raw)": 1.8345606327056885, "Full-pretrain/Step": 5770, "Full-pretrain/Step Time": 17.580045050010085} +{"Full-pretrain/Learning Rate": 1.7801304366887235e-05, "Full-pretrain/Loss": 2.0341691970825195, "Full-pretrain/Loss (Raw)": 2.0661866664886475, "Full-pretrain/Step": 5771, "Full-pretrain/Step Time": 17.58041569404304} +{"Full-pretrain/Learning Rate": 1.779317360939557e-05, "Full-pretrain/Loss": 2.0284104347229004, "Full-pretrain/Loss (Raw)": 1.9007205963134766, "Full-pretrain/Step": 5772, "Full-pretrain/Step Time": 17.582754708826542} +{"Full-pretrain/Learning Rate": 1.7785043683208794e-05, "Full-pretrain/Loss": 2.015049695968628, "Full-pretrain/Loss (Raw)": 1.8427075147628784, "Full-pretrain/Step": 5773, "Full-pretrain/Step Time": 17.58398906700313} +{"Full-pretrain/Learning Rate": 1.777691458926469e-05, "Full-pretrain/Loss": 2.0195627212524414, "Full-pretrain/Loss (Raw)": 2.017895221710205, "Full-pretrain/Step": 5774, "Full-pretrain/Step Time": 17.582777997478843} +{"Full-pretrain/Learning Rate": 1.7768786328500953e-05, "Full-pretrain/Loss": 2.0110113620758057, "Full-pretrain/Loss (Raw)": 1.8126471042633057, "Full-pretrain/Step": 5775, "Full-pretrain/Step Time": 17.579465007409453} +{"Full-pretrain/Learning Rate": 1.776065890185517e-05, "Full-pretrain/Loss": 2.0176987648010254, "Full-pretrain/Loss (Raw)": 2.023644208908081, "Full-pretrain/Step": 5776, "Full-pretrain/Step Time": 17.583726972341537} +{"Full-pretrain/Learning Rate": 1.7752532310264846e-05, "Full-pretrain/Loss": 2.025745153427124, "Full-pretrain/Loss (Raw)": 1.9424946308135986, "Full-pretrain/Step": 5777, "Full-pretrain/Step Time": 17.587830811738968} +{"Full-pretrain/Learning Rate": 1.7744406554667364e-05, "Full-pretrain/Loss": 2.0169098377227783, "Full-pretrain/Loss (Raw)": 1.7951490879058838, "Full-pretrain/Step": 5778, "Full-pretrain/Step Time": 17.590097565203905} +{"Full-pretrain/Learning Rate": 1.7736281636000045e-05, "Full-pretrain/Loss": 2.0029408931732178, "Full-pretrain/Loss (Raw)": 1.6764448881149292, "Full-pretrain/Step": 5779, "Full-pretrain/Step Time": 17.587494248524308} +{"Full-pretrain/Learning Rate": 1.7728157555200075e-05, "Full-pretrain/Loss": 2.004950523376465, "Full-pretrain/Loss (Raw)": 1.9298489093780518, "Full-pretrain/Step": 5780, "Full-pretrain/Step Time": 17.58555986918509} +{"Full-pretrain/Learning Rate": 1.772003431320458e-05, "Full-pretrain/Loss": 2.0058846473693848, "Full-pretrain/Loss (Raw)": 1.9558820724487305, "Full-pretrain/Step": 5781, "Full-pretrain/Step Time": 17.591751085594296} +{"Full-pretrain/Learning Rate": 1.771191191095058e-05, "Full-pretrain/Loss": 2.005791425704956, "Full-pretrain/Loss (Raw)": 2.137667655944824, "Full-pretrain/Step": 5782, "Full-pretrain/Step Time": 17.589490031823516} +{"Full-pretrain/Learning Rate": 1.770379034937497e-05, "Full-pretrain/Loss": 2.0051441192626953, "Full-pretrain/Loss (Raw)": 1.8703703880310059, "Full-pretrain/Step": 5783, "Full-pretrain/Step Time": 17.59364788234234} +{"Full-pretrain/Learning Rate": 1.7695669629414573e-05, "Full-pretrain/Loss": 1.9879339933395386, "Full-pretrain/Loss (Raw)": 1.6668254137039185, "Full-pretrain/Step": 5784, "Full-pretrain/Step Time": 17.593869399279356} +{"Full-pretrain/Learning Rate": 1.768754975200612e-05, "Full-pretrain/Loss": 1.9849872589111328, "Full-pretrain/Loss (Raw)": 2.0398478507995605, "Full-pretrain/Step": 5785, "Full-pretrain/Step Time": 17.595151843503118} +{"Full-pretrain/Learning Rate": 1.7679430718086243e-05, "Full-pretrain/Loss": 1.9813976287841797, "Full-pretrain/Loss (Raw)": 1.981141448020935, "Full-pretrain/Step": 5786, "Full-pretrain/Step Time": 17.590961998328567} +{"Full-pretrain/Learning Rate": 1.7671312528591454e-05, "Full-pretrain/Loss": 1.9799548387527466, "Full-pretrain/Loss (Raw)": 1.8373537063598633, "Full-pretrain/Step": 5787, "Full-pretrain/Step Time": 17.59578773006797} +{"Full-pretrain/Learning Rate": 1.7663195184458196e-05, "Full-pretrain/Loss": 1.978071928024292, "Full-pretrain/Loss (Raw)": 1.9941344261169434, "Full-pretrain/Step": 5788, "Full-pretrain/Step Time": 17.588349713012576} +{"Full-pretrain/Learning Rate": 1.7655078686622782e-05, "Full-pretrain/Loss": 1.9650391340255737, "Full-pretrain/Loss (Raw)": 1.9635035991668701, "Full-pretrain/Step": 5789, "Full-pretrain/Step Time": 17.600258249789476} +{"Full-pretrain/Learning Rate": 1.764696303602147e-05, "Full-pretrain/Loss": 1.9540587663650513, "Full-pretrain/Loss (Raw)": 1.743746042251587, "Full-pretrain/Step": 5790, "Full-pretrain/Step Time": 17.600829491391778} +{"Full-pretrain/Learning Rate": 1.763884823359038e-05, "Full-pretrain/Loss": 1.9549872875213623, "Full-pretrain/Loss (Raw)": 2.0737881660461426, "Full-pretrain/Step": 5791, "Full-pretrain/Step Time": 17.5990341398865} +{"Full-pretrain/Learning Rate": 1.763073428026556e-05, "Full-pretrain/Loss": 1.944100260734558, "Full-pretrain/Loss (Raw)": 1.6157749891281128, "Full-pretrain/Step": 5792, "Full-pretrain/Step Time": 17.593968173488975} +{"Full-pretrain/Learning Rate": 1.7622621176982964e-05, "Full-pretrain/Loss": 1.9318082332611084, "Full-pretrain/Loss (Raw)": 1.6766602993011475, "Full-pretrain/Step": 5793, "Full-pretrain/Step Time": 17.59497985802591} +{"Full-pretrain/Learning Rate": 1.7614508924678412e-05, "Full-pretrain/Loss": 1.9288992881774902, "Full-pretrain/Loss (Raw)": 2.1334879398345947, "Full-pretrain/Step": 5794, "Full-pretrain/Step Time": 17.595296569168568} +{"Full-pretrain/Learning Rate": 1.7606397524287665e-05, "Full-pretrain/Loss": 1.9259580373764038, "Full-pretrain/Loss (Raw)": 1.8390514850616455, "Full-pretrain/Step": 5795, "Full-pretrain/Step Time": 17.58995235338807} +{"Full-pretrain/Learning Rate": 1.759828697674636e-05, "Full-pretrain/Loss": 1.9272428750991821, "Full-pretrain/Loss (Raw)": 2.2080233097076416, "Full-pretrain/Step": 5796, "Full-pretrain/Step Time": 17.59243830293417} +{"Full-pretrain/Learning Rate": 1.759017728299005e-05, "Full-pretrain/Loss": 1.9297654628753662, "Full-pretrain/Loss (Raw)": 1.984736442565918, "Full-pretrain/Step": 5797, "Full-pretrain/Step Time": 17.590726478025317} +{"Full-pretrain/Learning Rate": 1.7582068443954198e-05, "Full-pretrain/Loss": 1.9318281412124634, "Full-pretrain/Loss (Raw)": 2.0477259159088135, "Full-pretrain/Step": 5798, "Full-pretrain/Step Time": 17.596825437620282} +{"Full-pretrain/Learning Rate": 1.7573960460574133e-05, "Full-pretrain/Loss": 1.921083927154541, "Full-pretrain/Loss (Raw)": 1.946751594543457, "Full-pretrain/Step": 5799, "Full-pretrain/Step Time": 17.601772122085094} +{"Full-pretrain/Learning Rate": 1.756585333378512e-05, "Full-pretrain/Loss": 1.9182302951812744, "Full-pretrain/Loss (Raw)": 1.9201884269714355, "Full-pretrain/Step": 5800, "Full-pretrain/Step Time": 17.595468923449516} +{"Full-pretrain/Learning Rate": 1.7557747064522313e-05, "Full-pretrain/Loss": 1.9198158979415894, "Full-pretrain/Loss (Raw)": 1.9551503658294678, "Full-pretrain/Step": 5801, "Full-pretrain/Step Time": 17.597924139350653} +{"Full-pretrain/Learning Rate": 1.7549641653720765e-05, "Full-pretrain/Loss": 1.9263808727264404, "Full-pretrain/Loss (Raw)": 2.04463529586792, "Full-pretrain/Step": 5802, "Full-pretrain/Step Time": 17.594070402905345} +{"Full-pretrain/Learning Rate": 1.7541537102315443e-05, "Full-pretrain/Loss": 1.9184937477111816, "Full-pretrain/Loss (Raw)": 1.8138023614883423, "Full-pretrain/Step": 5803, "Full-pretrain/Step Time": 17.599243318662047} +{"Full-pretrain/Learning Rate": 1.7533433411241188e-05, "Full-pretrain/Loss": 1.9169073104858398, "Full-pretrain/Loss (Raw)": 1.8499500751495361, "Full-pretrain/Step": 5804, "Full-pretrain/Step Time": 17.59970206581056} +{"Full-pretrain/Learning Rate": 1.7525330581432768e-05, "Full-pretrain/Loss": 1.9203376770019531, "Full-pretrain/Loss (Raw)": 1.952484369277954, "Full-pretrain/Step": 5805, "Full-pretrain/Step Time": 17.595348650589585} +{"Full-pretrain/Learning Rate": 1.7517228613824833e-05, "Full-pretrain/Loss": 1.9167994260787964, "Full-pretrain/Loss (Raw)": 1.9046690464019775, "Full-pretrain/Step": 5806, "Full-pretrain/Step Time": 17.592093121260405} +{"Full-pretrain/Learning Rate": 1.7509127509351952e-05, "Full-pretrain/Loss": 1.9242067337036133, "Full-pretrain/Loss (Raw)": 2.0496835708618164, "Full-pretrain/Step": 5807, "Full-pretrain/Step Time": 17.591276690363884} +{"Full-pretrain/Learning Rate": 1.7501027268948578e-05, "Full-pretrain/Loss": 1.924001932144165, "Full-pretrain/Loss (Raw)": 2.0170891284942627, "Full-pretrain/Step": 5808, "Full-pretrain/Step Time": 17.59239987656474} +{"Full-pretrain/Learning Rate": 1.7492927893549083e-05, "Full-pretrain/Loss": 1.922572135925293, "Full-pretrain/Loss (Raw)": 1.8967379331588745, "Full-pretrain/Step": 5809, "Full-pretrain/Step Time": 17.598789932206273} +{"Full-pretrain/Learning Rate": 1.74848293840877e-05, "Full-pretrain/Loss": 1.935409426689148, "Full-pretrain/Loss (Raw)": 2.2059450149536133, "Full-pretrain/Step": 5810, "Full-pretrain/Step Time": 17.59994911029935} +{"Full-pretrain/Learning Rate": 1.747673174149862e-05, "Full-pretrain/Loss": 1.947886347770691, "Full-pretrain/Loss (Raw)": 2.075706958770752, "Full-pretrain/Step": 5811, "Full-pretrain/Step Time": 17.610927380621433} +{"Full-pretrain/Learning Rate": 1.7468634966715884e-05, "Full-pretrain/Loss": 1.9510014057159424, "Full-pretrain/Loss (Raw)": 2.0295281410217285, "Full-pretrain/Step": 5812, "Full-pretrain/Step Time": 17.60895561426878} +{"Full-pretrain/Learning Rate": 1.7460539060673458e-05, "Full-pretrain/Loss": 1.9466787576675415, "Full-pretrain/Loss (Raw)": 1.8175582885742188, "Full-pretrain/Step": 5813, "Full-pretrain/Step Time": 17.610695112496614} +{"Full-pretrain/Learning Rate": 1.7452444024305214e-05, "Full-pretrain/Loss": 1.9363517761230469, "Full-pretrain/Loss (Raw)": 1.8072043657302856, "Full-pretrain/Step": 5814, "Full-pretrain/Step Time": 17.613089935854077} +{"Full-pretrain/Learning Rate": 1.7444349858544886e-05, "Full-pretrain/Loss": 1.936002492904663, "Full-pretrain/Loss (Raw)": 1.859192132949829, "Full-pretrain/Step": 5815, "Full-pretrain/Step Time": 17.608346158638597} +{"Full-pretrain/Learning Rate": 1.7436256564326147e-05, "Full-pretrain/Loss": 1.9542356729507446, "Full-pretrain/Loss (Raw)": 2.2502872943878174, "Full-pretrain/Step": 5816, "Full-pretrain/Step Time": 17.60984706506133} +{"Full-pretrain/Learning Rate": 1.7428164142582555e-05, "Full-pretrain/Loss": 1.9557201862335205, "Full-pretrain/Loss (Raw)": 2.087352752685547, "Full-pretrain/Step": 5817, "Full-pretrain/Step Time": 17.61170244216919} +{"Full-pretrain/Learning Rate": 1.7420072594247568e-05, "Full-pretrain/Loss": 1.962010145187378, "Full-pretrain/Loss (Raw)": 2.1824183464050293, "Full-pretrain/Step": 5818, "Full-pretrain/Step Time": 17.611073572188616} +{"Full-pretrain/Learning Rate": 1.7411981920254555e-05, "Full-pretrain/Loss": 1.9615418910980225, "Full-pretrain/Loss (Raw)": 1.8223726749420166, "Full-pretrain/Step": 5819, "Full-pretrain/Step Time": 17.611545668914914} +{"Full-pretrain/Learning Rate": 1.740389212153675e-05, "Full-pretrain/Loss": 1.961333990097046, "Full-pretrain/Loss (Raw)": 1.9874821901321411, "Full-pretrain/Step": 5820, "Full-pretrain/Step Time": 17.609017331153154} +{"Full-pretrain/Learning Rate": 1.7395803199027323e-05, "Full-pretrain/Loss": 1.9614591598510742, "Full-pretrain/Loss (Raw)": 1.967508316040039, "Full-pretrain/Step": 5821, "Full-pretrain/Step Time": 17.613692248240113} +{"Full-pretrain/Learning Rate": 1.7387715153659323e-05, "Full-pretrain/Loss": 1.9668798446655273, "Full-pretrain/Loss (Raw)": 1.917206048965454, "Full-pretrain/Step": 5822, "Full-pretrain/Step Time": 17.61123776808381} +{"Full-pretrain/Learning Rate": 1.7379627986365702e-05, "Full-pretrain/Loss": 1.959634780883789, "Full-pretrain/Loss (Raw)": 1.841946005821228, "Full-pretrain/Step": 5823, "Full-pretrain/Step Time": 17.616248248144984} +{"Full-pretrain/Learning Rate": 1.7371541698079324e-05, "Full-pretrain/Loss": 1.966214895248413, "Full-pretrain/Loss (Raw)": 1.8263393640518188, "Full-pretrain/Step": 5824, "Full-pretrain/Step Time": 17.608908591791987} +{"Full-pretrain/Learning Rate": 1.7363456289732922e-05, "Full-pretrain/Loss": 1.9728119373321533, "Full-pretrain/Loss (Raw)": 1.887763500213623, "Full-pretrain/Step": 5825, "Full-pretrain/Step Time": 17.609473949298263} +{"Full-pretrain/Learning Rate": 1.7355371762259153e-05, "Full-pretrain/Loss": 1.9724011421203613, "Full-pretrain/Loss (Raw)": 2.1203455924987793, "Full-pretrain/Step": 5826, "Full-pretrain/Step Time": 17.610970677807927} +{"Full-pretrain/Learning Rate": 1.7347288116590565e-05, "Full-pretrain/Loss": 1.9770894050598145, "Full-pretrain/Loss (Raw)": 1.9890775680541992, "Full-pretrain/Step": 5827, "Full-pretrain/Step Time": 17.61946465075016} +{"Full-pretrain/Learning Rate": 1.733920535365961e-05, "Full-pretrain/Loss": 1.9723083972930908, "Full-pretrain/Loss (Raw)": 2.055025339126587, "Full-pretrain/Step": 5828, "Full-pretrain/Step Time": 17.616362188011408} +{"Full-pretrain/Learning Rate": 1.733112347439862e-05, "Full-pretrain/Loss": 1.9610004425048828, "Full-pretrain/Loss (Raw)": 1.6228859424591064, "Full-pretrain/Step": 5829, "Full-pretrain/Step Time": 17.61919090896845} +{"Full-pretrain/Learning Rate": 1.732304247973985e-05, "Full-pretrain/Loss": 1.9605729579925537, "Full-pretrain/Loss (Raw)": 2.0340428352355957, "Full-pretrain/Step": 5830, "Full-pretrain/Step Time": 17.621694799512625} +{"Full-pretrain/Learning Rate": 1.7314962370615423e-05, "Full-pretrain/Loss": 1.96449875831604, "Full-pretrain/Loss (Raw)": 2.0723795890808105, "Full-pretrain/Step": 5831, "Full-pretrain/Step Time": 17.6245392318815} +{"Full-pretrain/Learning Rate": 1.7306883147957383e-05, "Full-pretrain/Loss": 1.9774346351623535, "Full-pretrain/Loss (Raw)": 2.334137439727783, "Full-pretrain/Step": 5832, "Full-pretrain/Step Time": 17.627861427143216} +{"Full-pretrain/Learning Rate": 1.7298804812697673e-05, "Full-pretrain/Loss": 1.9799084663391113, "Full-pretrain/Loss (Raw)": 2.0343148708343506, "Full-pretrain/Step": 5833, "Full-pretrain/Step Time": 17.635173611342907} +{"Full-pretrain/Learning Rate": 1.7290727365768116e-05, "Full-pretrain/Loss": 1.9796617031097412, "Full-pretrain/Loss (Raw)": 2.036731719970703, "Full-pretrain/Step": 5834, "Full-pretrain/Step Time": 17.635660637170076} +{"Full-pretrain/Learning Rate": 1.7282650808100463e-05, "Full-pretrain/Loss": 1.9833984375, "Full-pretrain/Loss (Raw)": 1.9333852529525757, "Full-pretrain/Step": 5835, "Full-pretrain/Step Time": 17.636532293632627} +{"Full-pretrain/Learning Rate": 1.7274575140626318e-05, "Full-pretrain/Loss": 1.9942476749420166, "Full-pretrain/Loss (Raw)": 2.1971240043640137, "Full-pretrain/Step": 5836, "Full-pretrain/Step Time": 17.635063396766782} +{"Full-pretrain/Learning Rate": 1.7266500364277217e-05, "Full-pretrain/Loss": 1.9934806823730469, "Full-pretrain/Loss (Raw)": 1.927943229675293, "Full-pretrain/Step": 5837, "Full-pretrain/Step Time": 17.643395084887743} +{"Full-pretrain/Learning Rate": 1.725842647998458e-05, "Full-pretrain/Loss": 1.9930676221847534, "Full-pretrain/Loss (Raw)": 1.8914453983306885, "Full-pretrain/Step": 5838, "Full-pretrain/Step Time": 17.64256689697504} +{"Full-pretrain/Learning Rate": 1.7250353488679723e-05, "Full-pretrain/Loss": 1.9946062564849854, "Full-pretrain/Loss (Raw)": 2.098924398422241, "Full-pretrain/Step": 5839, "Full-pretrain/Step Time": 17.645731884986162} +{"Full-pretrain/Learning Rate": 1.724228139129388e-05, "Full-pretrain/Loss": 1.995542287826538, "Full-pretrain/Loss (Raw)": 2.0470376014709473, "Full-pretrain/Step": 5840, "Full-pretrain/Step Time": 17.6447414457798} +{"Full-pretrain/Learning Rate": 1.7234210188758144e-05, "Full-pretrain/Loss": 2.0017144680023193, "Full-pretrain/Loss (Raw)": 2.0942506790161133, "Full-pretrain/Step": 5841, "Full-pretrain/Step Time": 17.646764140576124} +{"Full-pretrain/Learning Rate": 1.7226139882003534e-05, "Full-pretrain/Loss": 1.995430827140808, "Full-pretrain/Loss (Raw)": 2.004869222640991, "Full-pretrain/Step": 5842, "Full-pretrain/Step Time": 17.651077706366777} +{"Full-pretrain/Learning Rate": 1.721807047196095e-05, "Full-pretrain/Loss": 1.9956352710723877, "Full-pretrain/Loss (Raw)": 2.0822510719299316, "Full-pretrain/Step": 5843, "Full-pretrain/Step Time": 17.65371144376695} +{"Full-pretrain/Learning Rate": 1.721000195956121e-05, "Full-pretrain/Loss": 1.9933867454528809, "Full-pretrain/Loss (Raw)": 1.9575746059417725, "Full-pretrain/Step": 5844, "Full-pretrain/Step Time": 17.64813464321196} +{"Full-pretrain/Learning Rate": 1.7201934345735012e-05, "Full-pretrain/Loss": 1.9969561100006104, "Full-pretrain/Loss (Raw)": 1.9317760467529297, "Full-pretrain/Step": 5845, "Full-pretrain/Step Time": 17.647819897159934} +{"Full-pretrain/Learning Rate": 1.719386763141294e-05, "Full-pretrain/Loss": 2.0124640464782715, "Full-pretrain/Loss (Raw)": 2.303457260131836, "Full-pretrain/Step": 5846, "Full-pretrain/Step Time": 17.650144539773464} +{"Full-pretrain/Learning Rate": 1.7185801817525498e-05, "Full-pretrain/Loss": 2.012969970703125, "Full-pretrain/Loss (Raw)": 1.8753812313079834, "Full-pretrain/Step": 5847, "Full-pretrain/Step Time": 17.649321040138602} +{"Full-pretrain/Learning Rate": 1.717773690500306e-05, "Full-pretrain/Loss": 2.003174304962158, "Full-pretrain/Loss (Raw)": 1.9368263483047485, "Full-pretrain/Step": 5848, "Full-pretrain/Step Time": 17.646125685423613} +{"Full-pretrain/Learning Rate": 1.7169672894775928e-05, "Full-pretrain/Loss": 2.0025691986083984, "Full-pretrain/Loss (Raw)": 2.067991256713867, "Full-pretrain/Step": 5849, "Full-pretrain/Step Time": 17.652598345652223} +{"Full-pretrain/Learning Rate": 1.716160978777427e-05, "Full-pretrain/Loss": 2.0001614093780518, "Full-pretrain/Loss (Raw)": 2.10536527633667, "Full-pretrain/Step": 5850, "Full-pretrain/Step Time": 17.660819796845317} +{"Full-pretrain/Learning Rate": 1.7153547584928183e-05, "Full-pretrain/Loss": 1.9922970533370972, "Full-pretrain/Loss (Raw)": 1.5707173347473145, "Full-pretrain/Step": 5851, "Full-pretrain/Step Time": 17.655547620728612} +{"Full-pretrain/Learning Rate": 1.714548628716761e-05, "Full-pretrain/Loss": 1.9925646781921387, "Full-pretrain/Loss (Raw)": 1.9960463047027588, "Full-pretrain/Step": 5852, "Full-pretrain/Step Time": 17.653771579265594} +{"Full-pretrain/Learning Rate": 1.7137425895422437e-05, "Full-pretrain/Loss": 1.9888622760772705, "Full-pretrain/Loss (Raw)": 1.8490331172943115, "Full-pretrain/Step": 5853, "Full-pretrain/Step Time": 17.653490841388702} +{"Full-pretrain/Learning Rate": 1.7129366410622433e-05, "Full-pretrain/Loss": 1.9898364543914795, "Full-pretrain/Loss (Raw)": 1.9483764171600342, "Full-pretrain/Step": 5854, "Full-pretrain/Step Time": 17.658990554511547} +{"Full-pretrain/Learning Rate": 1.7121307833697238e-05, "Full-pretrain/Loss": 1.9904029369354248, "Full-pretrain/Loss (Raw)": 1.8600733280181885, "Full-pretrain/Step": 5855, "Full-pretrain/Step Time": 17.657771073281765} +{"Full-pretrain/Learning Rate": 1.7113250165576423e-05, "Full-pretrain/Loss": 1.9955235719680786, "Full-pretrain/Loss (Raw)": 1.9902020692825317, "Full-pretrain/Step": 5856, "Full-pretrain/Step Time": 17.656598402187228} +{"Full-pretrain/Learning Rate": 1.7105193407189423e-05, "Full-pretrain/Loss": 1.9988149404525757, "Full-pretrain/Loss (Raw)": 1.993088960647583, "Full-pretrain/Step": 5857, "Full-pretrain/Step Time": 17.663690384477377} +{"Full-pretrain/Learning Rate": 1.7097137559465587e-05, "Full-pretrain/Loss": 1.9984458684921265, "Full-pretrain/Loss (Raw)": 2.1085336208343506, "Full-pretrain/Step": 5858, "Full-pretrain/Step Time": 17.659148145467043} +{"Full-pretrain/Learning Rate": 1.7089082623334158e-05, "Full-pretrain/Loss": 2.00225567817688, "Full-pretrain/Loss (Raw)": 2.110994338989258, "Full-pretrain/Step": 5859, "Full-pretrain/Step Time": 17.661870039999485} +{"Full-pretrain/Learning Rate": 1.7081028599724268e-05, "Full-pretrain/Loss": 2.004213571548462, "Full-pretrain/Loss (Raw)": 2.1176743507385254, "Full-pretrain/Step": 5860, "Full-pretrain/Step Time": 17.664204105734825} +{"Full-pretrain/Learning Rate": 1.7072975489564958e-05, "Full-pretrain/Loss": 2.0199551582336426, "Full-pretrain/Loss (Raw)": 2.126621961593628, "Full-pretrain/Step": 5861, "Full-pretrain/Step Time": 17.66491997241974} +{"Full-pretrain/Learning Rate": 1.7064923293785127e-05, "Full-pretrain/Loss": 2.0137853622436523, "Full-pretrain/Loss (Raw)": 1.8366026878356934, "Full-pretrain/Step": 5862, "Full-pretrain/Step Time": 17.668928699567914} +{"Full-pretrain/Learning Rate": 1.705687201331361e-05, "Full-pretrain/Loss": 2.0086870193481445, "Full-pretrain/Loss (Raw)": 1.9092401266098022, "Full-pretrain/Step": 5863, "Full-pretrain/Step Time": 17.66303456388414} +{"Full-pretrain/Learning Rate": 1.704882164907911e-05, "Full-pretrain/Loss": 2.0014307498931885, "Full-pretrain/Loss (Raw)": 2.101933479309082, "Full-pretrain/Step": 5864, "Full-pretrain/Step Time": 17.66208648495376} +{"Full-pretrain/Learning Rate": 1.704077220201024e-05, "Full-pretrain/Loss": 2.005984306335449, "Full-pretrain/Loss (Raw)": 2.18002986907959, "Full-pretrain/Step": 5865, "Full-pretrain/Step Time": 17.668358525261283} +{"Full-pretrain/Learning Rate": 1.703272367303551e-05, "Full-pretrain/Loss": 2.002744436264038, "Full-pretrain/Loss (Raw)": 1.93305504322052, "Full-pretrain/Step": 5866, "Full-pretrain/Step Time": 17.665770219638944} +{"Full-pretrain/Learning Rate": 1.702467606308329e-05, "Full-pretrain/Loss": 2.0017051696777344, "Full-pretrain/Loss (Raw)": 1.900127649307251, "Full-pretrain/Step": 5867, "Full-pretrain/Step Time": 17.668599719181657} +{"Full-pretrain/Learning Rate": 1.7016629373081887e-05, "Full-pretrain/Loss": 2.0000805854797363, "Full-pretrain/Loss (Raw)": 2.145141124725342, "Full-pretrain/Step": 5868, "Full-pretrain/Step Time": 17.662074152380228} +{"Full-pretrain/Learning Rate": 1.7008583603959484e-05, "Full-pretrain/Loss": 2.002769947052002, "Full-pretrain/Loss (Raw)": 2.01399827003479, "Full-pretrain/Step": 5869, "Full-pretrain/Step Time": 17.660409396514297} +{"Full-pretrain/Learning Rate": 1.7000538756644152e-05, "Full-pretrain/Loss": 2.0071187019348145, "Full-pretrain/Loss (Raw)": 2.0306081771850586, "Full-pretrain/Step": 5870, "Full-pretrain/Step Time": 17.659046314656734} +{"Full-pretrain/Learning Rate": 1.699249483206386e-05, "Full-pretrain/Loss": 1.990715503692627, "Full-pretrain/Loss (Raw)": 1.574021577835083, "Full-pretrain/Step": 5871, "Full-pretrain/Step Time": 17.661963870748878} +{"Full-pretrain/Learning Rate": 1.6984451831146488e-05, "Full-pretrain/Loss": 1.9916155338287354, "Full-pretrain/Loss (Raw)": 2.075835704803467, "Full-pretrain/Step": 5872, "Full-pretrain/Step Time": 17.656744863837957} +{"Full-pretrain/Learning Rate": 1.6976409754819767e-05, "Full-pretrain/Loss": 1.99013352394104, "Full-pretrain/Loss (Raw)": 2.0468251705169678, "Full-pretrain/Step": 5873, "Full-pretrain/Step Time": 17.65724322013557} +{"Full-pretrain/Learning Rate": 1.6968368604011366e-05, "Full-pretrain/Loss": 1.9810504913330078, "Full-pretrain/Loss (Raw)": 1.7142130136489868, "Full-pretrain/Step": 5874, "Full-pretrain/Step Time": 17.6559869479388} +{"Full-pretrain/Learning Rate": 1.6960328379648818e-05, "Full-pretrain/Loss": 1.9770686626434326, "Full-pretrain/Loss (Raw)": 1.9548343420028687, "Full-pretrain/Step": 5875, "Full-pretrain/Step Time": 17.65906429849565} +{"Full-pretrain/Learning Rate": 1.6952289082659567e-05, "Full-pretrain/Loss": 1.9789323806762695, "Full-pretrain/Loss (Raw)": 2.0172126293182373, "Full-pretrain/Step": 5876, "Full-pretrain/Step Time": 17.651477934792638} +{"Full-pretrain/Learning Rate": 1.6944250713970956e-05, "Full-pretrain/Loss": 1.9782967567443848, "Full-pretrain/Loss (Raw)": 1.9114344120025635, "Full-pretrain/Step": 5877, "Full-pretrain/Step Time": 17.651876708492637} +{"Full-pretrain/Learning Rate": 1.6936213274510183e-05, "Full-pretrain/Loss": 1.9595301151275635, "Full-pretrain/Loss (Raw)": 1.7029240131378174, "Full-pretrain/Step": 5878, "Full-pretrain/Step Time": 17.64986669830978} +{"Full-pretrain/Learning Rate": 1.692817676520438e-05, "Full-pretrain/Loss": 1.9547033309936523, "Full-pretrain/Loss (Raw)": 1.720923900604248, "Full-pretrain/Step": 5879, "Full-pretrain/Step Time": 17.6444672960788} +{"Full-pretrain/Learning Rate": 1.6920141186980544e-05, "Full-pretrain/Loss": 1.9575376510620117, "Full-pretrain/Loss (Raw)": 2.027526378631592, "Full-pretrain/Step": 5880, "Full-pretrain/Step Time": 17.641330920159817} +{"Full-pretrain/Learning Rate": 1.6912106540765583e-05, "Full-pretrain/Loss": 1.9544856548309326, "Full-pretrain/Loss (Raw)": 1.9703257083892822, "Full-pretrain/Step": 5881, "Full-pretrain/Step Time": 17.651357589289546} +{"Full-pretrain/Learning Rate": 1.69040728274863e-05, "Full-pretrain/Loss": 1.945908784866333, "Full-pretrain/Loss (Raw)": 1.8309061527252197, "Full-pretrain/Step": 5882, "Full-pretrain/Step Time": 17.648729898035526} +{"Full-pretrain/Learning Rate": 1.6896040048069362e-05, "Full-pretrain/Loss": 1.956350564956665, "Full-pretrain/Loss (Raw)": 1.9048545360565186, "Full-pretrain/Step": 5883, "Full-pretrain/Step Time": 17.646214490756392} +{"Full-pretrain/Learning Rate": 1.6888008203441353e-05, "Full-pretrain/Loss": 1.950350284576416, "Full-pretrain/Loss (Raw)": 1.804036259651184, "Full-pretrain/Step": 5884, "Full-pretrain/Step Time": 17.641089161857963} +{"Full-pretrain/Learning Rate": 1.687997729452875e-05, "Full-pretrain/Loss": 1.9495737552642822, "Full-pretrain/Loss (Raw)": 1.824185848236084, "Full-pretrain/Step": 5885, "Full-pretrain/Step Time": 17.6485744882375} +{"Full-pretrain/Learning Rate": 1.6871947322257915e-05, "Full-pretrain/Loss": 1.9553675651550293, "Full-pretrain/Loss (Raw)": 2.133777618408203, "Full-pretrain/Step": 5886, "Full-pretrain/Step Time": 17.64894870109856} +{"Full-pretrain/Learning Rate": 1.6863918287555104e-05, "Full-pretrain/Loss": 1.9559749364852905, "Full-pretrain/Loss (Raw)": 1.8795098066329956, "Full-pretrain/Step": 5887, "Full-pretrain/Step Time": 17.65157648548484} +{"Full-pretrain/Learning Rate": 1.6855890191346455e-05, "Full-pretrain/Loss": 1.9518071413040161, "Full-pretrain/Loss (Raw)": 1.8568302392959595, "Full-pretrain/Step": 5888, "Full-pretrain/Step Time": 17.65066085755825} +{"Full-pretrain/Learning Rate": 1.6847863034558013e-05, "Full-pretrain/Loss": 1.9366834163665771, "Full-pretrain/Loss (Raw)": 1.5091291666030884, "Full-pretrain/Step": 5889, "Full-pretrain/Step Time": 17.649343315511942} +{"Full-pretrain/Learning Rate": 1.68398368181157e-05, "Full-pretrain/Loss": 1.9368517398834229, "Full-pretrain/Loss (Raw)": 2.1139211654663086, "Full-pretrain/Step": 5890, "Full-pretrain/Step Time": 17.648875208571553} +{"Full-pretrain/Learning Rate": 1.683181154294534e-05, "Full-pretrain/Loss": 1.9360108375549316, "Full-pretrain/Loss (Raw)": 2.0840859413146973, "Full-pretrain/Step": 5891, "Full-pretrain/Step Time": 17.65015792660415} +{"Full-pretrain/Learning Rate": 1.682378720997265e-05, "Full-pretrain/Loss": 1.9337096214294434, "Full-pretrain/Loss (Raw)": 2.044036388397217, "Full-pretrain/Step": 5892, "Full-pretrain/Step Time": 17.64897983521223} +{"Full-pretrain/Learning Rate": 1.6815763820123247e-05, "Full-pretrain/Loss": 1.9238859415054321, "Full-pretrain/Loss (Raw)": 1.8122632503509521, "Full-pretrain/Step": 5893, "Full-pretrain/Step Time": 17.650452142581344} +{"Full-pretrain/Learning Rate": 1.6807741374322596e-05, "Full-pretrain/Loss": 1.9099860191345215, "Full-pretrain/Loss (Raw)": 1.3918075561523438, "Full-pretrain/Step": 5894, "Full-pretrain/Step Time": 17.647047774866223} +{"Full-pretrain/Learning Rate": 1.67997198734961e-05, "Full-pretrain/Loss": 1.913407564163208, "Full-pretrain/Loss (Raw)": 2.018725633621216, "Full-pretrain/Step": 5895, "Full-pretrain/Step Time": 17.64512038603425} +{"Full-pretrain/Learning Rate": 1.679169931856904e-05, "Full-pretrain/Loss": 1.907654047012329, "Full-pretrain/Loss (Raw)": 1.9178258180618286, "Full-pretrain/Step": 5896, "Full-pretrain/Step Time": 17.64650009199977} +{"Full-pretrain/Learning Rate": 1.678367971046657e-05, "Full-pretrain/Loss": 1.899330973625183, "Full-pretrain/Loss (Raw)": 1.9136896133422852, "Full-pretrain/Step": 5897, "Full-pretrain/Step Time": 17.645775010809302} +{"Full-pretrain/Learning Rate": 1.6775661050113772e-05, "Full-pretrain/Loss": 1.9039326906204224, "Full-pretrain/Loss (Raw)": 2.080307960510254, "Full-pretrain/Step": 5898, "Full-pretrain/Step Time": 17.644785976037383} +{"Full-pretrain/Learning Rate": 1.6767643338435574e-05, "Full-pretrain/Loss": 1.9080705642700195, "Full-pretrain/Loss (Raw)": 2.0325393676757812, "Full-pretrain/Step": 5899, "Full-pretrain/Step Time": 17.642832834273577} +{"Full-pretrain/Learning Rate": 1.675962657635682e-05, "Full-pretrain/Loss": 1.902541160583496, "Full-pretrain/Loss (Raw)": 1.9682000875473022, "Full-pretrain/Step": 5900, "Full-pretrain/Step Time": 17.641769375652075} +{"Full-pretrain/Learning Rate": 1.6751610764802245e-05, "Full-pretrain/Loss": 1.8967134952545166, "Full-pretrain/Loss (Raw)": 1.8275153636932373, "Full-pretrain/Step": 5901, "Full-pretrain/Step Time": 17.64560706168413} +{"Full-pretrain/Learning Rate": 1.674359590469647e-05, "Full-pretrain/Loss": 1.904797911643982, "Full-pretrain/Loss (Raw)": 2.2893056869506836, "Full-pretrain/Step": 5902, "Full-pretrain/Step Time": 17.64193787612021} +{"Full-pretrain/Learning Rate": 1.6735581996964014e-05, "Full-pretrain/Loss": 1.9126014709472656, "Full-pretrain/Loss (Raw)": 1.8237395286560059, "Full-pretrain/Step": 5903, "Full-pretrain/Step Time": 17.6397313028574} +{"Full-pretrain/Learning Rate": 1.672756904252926e-05, "Full-pretrain/Loss": 1.8945561647415161, "Full-pretrain/Loss (Raw)": 1.4983842372894287, "Full-pretrain/Step": 5904, "Full-pretrain/Step Time": 17.640397692099214} +{"Full-pretrain/Learning Rate": 1.671955704231652e-05, "Full-pretrain/Loss": 1.880846381187439, "Full-pretrain/Loss (Raw)": 1.6081125736236572, "Full-pretrain/Step": 5905, "Full-pretrain/Step Time": 17.636206163093448} +{"Full-pretrain/Learning Rate": 1.6711545997249955e-05, "Full-pretrain/Loss": 1.8913941383361816, "Full-pretrain/Loss (Raw)": 2.0517396926879883, "Full-pretrain/Step": 5906, "Full-pretrain/Step Time": 17.635328866541386} +{"Full-pretrain/Learning Rate": 1.670353590825365e-05, "Full-pretrain/Loss": 1.8874768018722534, "Full-pretrain/Loss (Raw)": 1.8294830322265625, "Full-pretrain/Step": 5907, "Full-pretrain/Step Time": 17.633143777027726} +{"Full-pretrain/Learning Rate": 1.669552677625156e-05, "Full-pretrain/Loss": 1.8873276710510254, "Full-pretrain/Loss (Raw)": 2.0124425888061523, "Full-pretrain/Step": 5908, "Full-pretrain/Step Time": 17.634565383195877} +{"Full-pretrain/Learning Rate": 1.6687518602167552e-05, "Full-pretrain/Loss": 1.891310691833496, "Full-pretrain/Loss (Raw)": 2.0388906002044678, "Full-pretrain/Step": 5909, "Full-pretrain/Step Time": 17.628348007798195} +{"Full-pretrain/Learning Rate": 1.6679511386925337e-05, "Full-pretrain/Loss": 1.9049031734466553, "Full-pretrain/Loss (Raw)": 2.137881278991699, "Full-pretrain/Step": 5910, "Full-pretrain/Step Time": 17.630521221086383} +{"Full-pretrain/Learning Rate": 1.667150513144856e-05, "Full-pretrain/Loss": 1.911644697189331, "Full-pretrain/Loss (Raw)": 1.9366533756256104, "Full-pretrain/Step": 5911, "Full-pretrain/Step Time": 17.627116499468684} +{"Full-pretrain/Learning Rate": 1.6663499836660745e-05, "Full-pretrain/Loss": 1.9107561111450195, "Full-pretrain/Loss (Raw)": 1.9990891218185425, "Full-pretrain/Step": 5912, "Full-pretrain/Step Time": 17.627230506390333} +{"Full-pretrain/Learning Rate": 1.665549550348529e-05, "Full-pretrain/Loss": 1.9075676202774048, "Full-pretrain/Loss (Raw)": 1.8682935237884521, "Full-pretrain/Step": 5913, "Full-pretrain/Step Time": 17.631072115153074} +{"Full-pretrain/Learning Rate": 1.6647492132845508e-05, "Full-pretrain/Loss": 1.9058374166488647, "Full-pretrain/Loss (Raw)": 1.7755401134490967, "Full-pretrain/Step": 5914, "Full-pretrain/Step Time": 17.632395027205348} +{"Full-pretrain/Learning Rate": 1.6639489725664563e-05, "Full-pretrain/Loss": 1.9072136878967285, "Full-pretrain/Loss (Raw)": 1.9488964080810547, "Full-pretrain/Step": 5915, "Full-pretrain/Step Time": 17.628823088482022} +{"Full-pretrain/Learning Rate": 1.6631488282865537e-05, "Full-pretrain/Loss": 1.9075452089309692, "Full-pretrain/Loss (Raw)": 1.8146429061889648, "Full-pretrain/Step": 5916, "Full-pretrain/Step Time": 17.631989046931267} +{"Full-pretrain/Learning Rate": 1.6623487805371397e-05, "Full-pretrain/Loss": 1.912011742591858, "Full-pretrain/Loss (Raw)": 1.9671156406402588, "Full-pretrain/Step": 5917, "Full-pretrain/Step Time": 17.626398457214236} +{"Full-pretrain/Learning Rate": 1.6615488294105e-05, "Full-pretrain/Loss": 1.9087326526641846, "Full-pretrain/Loss (Raw)": 2.0288493633270264, "Full-pretrain/Step": 5918, "Full-pretrain/Step Time": 17.63368159160018} +{"Full-pretrain/Learning Rate": 1.6607489749989087e-05, "Full-pretrain/Loss": 1.9087179899215698, "Full-pretrain/Loss (Raw)": 1.8790396451950073, "Full-pretrain/Step": 5919, "Full-pretrain/Step Time": 17.635011034086347} +{"Full-pretrain/Learning Rate": 1.659949217394627e-05, "Full-pretrain/Loss": 1.9048877954483032, "Full-pretrain/Loss (Raw)": 1.7342638969421387, "Full-pretrain/Step": 5920, "Full-pretrain/Step Time": 17.635413274168968} +{"Full-pretrain/Learning Rate": 1.6591495566899085e-05, "Full-pretrain/Loss": 1.9241676330566406, "Full-pretrain/Loss (Raw)": 2.1260862350463867, "Full-pretrain/Step": 5921, "Full-pretrain/Step Time": 17.63595601543784} +{"Full-pretrain/Learning Rate": 1.658349992976993e-05, "Full-pretrain/Loss": 1.9172192811965942, "Full-pretrain/Loss (Raw)": 1.8915719985961914, "Full-pretrain/Step": 5922, "Full-pretrain/Step Time": 17.63509676605463} +{"Full-pretrain/Learning Rate": 1.6575505263481095e-05, "Full-pretrain/Loss": 1.914212942123413, "Full-pretrain/Loss (Raw)": 1.9878840446472168, "Full-pretrain/Step": 5923, "Full-pretrain/Step Time": 17.63784690760076} +{"Full-pretrain/Learning Rate": 1.656751156895478e-05, "Full-pretrain/Loss": 1.9196009635925293, "Full-pretrain/Loss (Raw)": 2.216449499130249, "Full-pretrain/Step": 5924, "Full-pretrain/Step Time": 17.636819936335087} +{"Full-pretrain/Learning Rate": 1.6559518847113035e-05, "Full-pretrain/Loss": 1.921973705291748, "Full-pretrain/Loss (Raw)": 1.8881940841674805, "Full-pretrain/Step": 5925, "Full-pretrain/Step Time": 17.642345855012536} +{"Full-pretrain/Learning Rate": 1.655152709887782e-05, "Full-pretrain/Loss": 1.9441797733306885, "Full-pretrain/Loss (Raw)": 2.1024022102355957, "Full-pretrain/Step": 5926, "Full-pretrain/Step Time": 17.637985596433282} +{"Full-pretrain/Learning Rate": 1.654353632517099e-05, "Full-pretrain/Loss": 1.9400668144226074, "Full-pretrain/Loss (Raw)": 1.8871091604232788, "Full-pretrain/Step": 5927, "Full-pretrain/Step Time": 17.634864507243037} +{"Full-pretrain/Learning Rate": 1.6535546526914274e-05, "Full-pretrain/Loss": 1.939234972000122, "Full-pretrain/Loss (Raw)": 1.8912062644958496, "Full-pretrain/Step": 5928, "Full-pretrain/Step Time": 17.634635470807552} +{"Full-pretrain/Learning Rate": 1.6527557705029286e-05, "Full-pretrain/Loss": 1.937018632888794, "Full-pretrain/Loss (Raw)": 1.8427667617797852, "Full-pretrain/Step": 5929, "Full-pretrain/Step Time": 17.641830805689096} +{"Full-pretrain/Learning Rate": 1.6519569860437547e-05, "Full-pretrain/Loss": 1.9327871799468994, "Full-pretrain/Loss (Raw)": 1.94490385055542, "Full-pretrain/Step": 5930, "Full-pretrain/Step Time": 17.64016266539693} +{"Full-pretrain/Learning Rate": 1.6511582994060442e-05, "Full-pretrain/Loss": 1.926487684249878, "Full-pretrain/Loss (Raw)": 1.830953598022461, "Full-pretrain/Step": 5931, "Full-pretrain/Step Time": 17.63738264888525} +{"Full-pretrain/Learning Rate": 1.6503597106819255e-05, "Full-pretrain/Loss": 1.924248218536377, "Full-pretrain/Loss (Raw)": 1.8965378999710083, "Full-pretrain/Step": 5932, "Full-pretrain/Step Time": 17.64061680622399} +{"Full-pretrain/Learning Rate": 1.6495612199635154e-05, "Full-pretrain/Loss": 1.932976484298706, "Full-pretrain/Loss (Raw)": 2.106818675994873, "Full-pretrain/Step": 5933, "Full-pretrain/Step Time": 17.64447444304824} +{"Full-pretrain/Learning Rate": 1.6487628273429196e-05, "Full-pretrain/Loss": 1.905836820602417, "Full-pretrain/Loss (Raw)": 1.420839548110962, "Full-pretrain/Step": 5934, "Full-pretrain/Step Time": 17.64794072136283} +{"Full-pretrain/Learning Rate": 1.6479645329122333e-05, "Full-pretrain/Loss": 1.9150142669677734, "Full-pretrain/Loss (Raw)": 2.117417335510254, "Full-pretrain/Step": 5935, "Full-pretrain/Step Time": 17.64743691124022} +{"Full-pretrain/Learning Rate": 1.647166336763538e-05, "Full-pretrain/Loss": 1.9199285507202148, "Full-pretrain/Loss (Raw)": 1.655637264251709, "Full-pretrain/Step": 5936, "Full-pretrain/Step Time": 17.644813092425466} +{"Full-pretrain/Learning Rate": 1.646368238988906e-05, "Full-pretrain/Loss": 1.919535756111145, "Full-pretrain/Loss (Raw)": 1.595546007156372, "Full-pretrain/Step": 5937, "Full-pretrain/Step Time": 17.647995805367827} +{"Full-pretrain/Learning Rate": 1.6455702396803983e-05, "Full-pretrain/Loss": 1.9151458740234375, "Full-pretrain/Loss (Raw)": 1.9112639427185059, "Full-pretrain/Step": 5938, "Full-pretrain/Step Time": 17.64686575345695} +{"Full-pretrain/Learning Rate": 1.6447723389300623e-05, "Full-pretrain/Loss": 1.9135091304779053, "Full-pretrain/Loss (Raw)": 1.7771047353744507, "Full-pretrain/Step": 5939, "Full-pretrain/Step Time": 17.647588415071368} +{"Full-pretrain/Learning Rate": 1.643974536829938e-05, "Full-pretrain/Loss": 1.9050989151000977, "Full-pretrain/Loss (Raw)": 1.7433174848556519, "Full-pretrain/Step": 5940, "Full-pretrain/Step Time": 17.644785948097706} +{"Full-pretrain/Learning Rate": 1.6431768334720485e-05, "Full-pretrain/Loss": 1.9041134119033813, "Full-pretrain/Loss (Raw)": 2.007355213165283, "Full-pretrain/Step": 5941, "Full-pretrain/Step Time": 17.644354328513145} +{"Full-pretrain/Learning Rate": 1.6423792289484103e-05, "Full-pretrain/Loss": 1.8945692777633667, "Full-pretrain/Loss (Raw)": 1.8324681520462036, "Full-pretrain/Step": 5942, "Full-pretrain/Step Time": 17.63895446807146} +{"Full-pretrain/Learning Rate": 1.6415817233510266e-05, "Full-pretrain/Loss": 1.9021213054656982, "Full-pretrain/Loss (Raw)": 2.178316116333008, "Full-pretrain/Step": 5943, "Full-pretrain/Step Time": 17.64626377634704} +{"Full-pretrain/Learning Rate": 1.6407843167718897e-05, "Full-pretrain/Loss": 1.8875610828399658, "Full-pretrain/Loss (Raw)": 1.53316068649292, "Full-pretrain/Step": 5944, "Full-pretrain/Step Time": 17.643762217834592} +{"Full-pretrain/Learning Rate": 1.6399870093029808e-05, "Full-pretrain/Loss": 1.893102765083313, "Full-pretrain/Loss (Raw)": 2.0456290245056152, "Full-pretrain/Step": 5945, "Full-pretrain/Step Time": 17.64538018591702} +{"Full-pretrain/Learning Rate": 1.639189801036267e-05, "Full-pretrain/Loss": 1.8993875980377197, "Full-pretrain/Loss (Raw)": 1.9766547679901123, "Full-pretrain/Step": 5946, "Full-pretrain/Step Time": 17.644488541409373} +{"Full-pretrain/Learning Rate": 1.6383926920637077e-05, "Full-pretrain/Loss": 1.90318763256073, "Full-pretrain/Loss (Raw)": 2.0704991817474365, "Full-pretrain/Step": 5947, "Full-pretrain/Step Time": 17.64729024283588} +{"Full-pretrain/Learning Rate": 1.637595682477248e-05, "Full-pretrain/Loss": 1.9051216840744019, "Full-pretrain/Loss (Raw)": 1.8765318393707275, "Full-pretrain/Step": 5948, "Full-pretrain/Step Time": 17.644322402775288} +{"Full-pretrain/Learning Rate": 1.6367987723688237e-05, "Full-pretrain/Loss": 1.9029335975646973, "Full-pretrain/Loss (Raw)": 1.8970956802368164, "Full-pretrain/Step": 5949, "Full-pretrain/Step Time": 17.639552710577846} +{"Full-pretrain/Learning Rate": 1.6360019618303573e-05, "Full-pretrain/Loss": 1.9005460739135742, "Full-pretrain/Loss (Raw)": 1.9524496793746948, "Full-pretrain/Step": 5950, "Full-pretrain/Step Time": 17.65058303438127} +{"Full-pretrain/Learning Rate": 1.635205250953762e-05, "Full-pretrain/Loss": 1.9024338722229004, "Full-pretrain/Loss (Raw)": 1.9394487142562866, "Full-pretrain/Step": 5951, "Full-pretrain/Step Time": 17.644801076501608} +{"Full-pretrain/Learning Rate": 1.634408639830936e-05, "Full-pretrain/Loss": 1.9032444953918457, "Full-pretrain/Loss (Raw)": 1.760202169418335, "Full-pretrain/Step": 5952, "Full-pretrain/Step Time": 17.646165892481804} +{"Full-pretrain/Learning Rate": 1.6336121285537695e-05, "Full-pretrain/Loss": 1.887091040611267, "Full-pretrain/Loss (Raw)": 1.6091787815093994, "Full-pretrain/Step": 5953, "Full-pretrain/Step Time": 17.64601980149746} +{"Full-pretrain/Learning Rate": 1.63281571721414e-05, "Full-pretrain/Loss": 1.8838179111480713, "Full-pretrain/Loss (Raw)": 1.7868272066116333, "Full-pretrain/Step": 5954, "Full-pretrain/Step Time": 17.6453627217561} +{"Full-pretrain/Learning Rate": 1.6320194059039118e-05, "Full-pretrain/Loss": 1.8865394592285156, "Full-pretrain/Loss (Raw)": 2.07497501373291, "Full-pretrain/Step": 5955, "Full-pretrain/Step Time": 17.64113182760775} +{"Full-pretrain/Learning Rate": 1.6312231947149413e-05, "Full-pretrain/Loss": 1.88033127784729, "Full-pretrain/Loss (Raw)": 2.0177929401397705, "Full-pretrain/Step": 5956, "Full-pretrain/Step Time": 17.64163388684392} +{"Full-pretrain/Learning Rate": 1.6304270837390694e-05, "Full-pretrain/Loss": 1.8785732984542847, "Full-pretrain/Loss (Raw)": 1.8319368362426758, "Full-pretrain/Step": 5957, "Full-pretrain/Step Time": 17.641870385035872} +{"Full-pretrain/Learning Rate": 1.6296310730681275e-05, "Full-pretrain/Loss": 1.878415822982788, "Full-pretrain/Loss (Raw)": 2.0973613262176514, "Full-pretrain/Step": 5958, "Full-pretrain/Step Time": 17.641591550782323} +{"Full-pretrain/Learning Rate": 1.628835162793935e-05, "Full-pretrain/Loss": 1.8759427070617676, "Full-pretrain/Loss (Raw)": 1.8079686164855957, "Full-pretrain/Step": 5959, "Full-pretrain/Step Time": 17.642599031329155} +{"Full-pretrain/Learning Rate": 1.6280393530083012e-05, "Full-pretrain/Loss": 1.8825151920318604, "Full-pretrain/Loss (Raw)": 2.1015310287475586, "Full-pretrain/Step": 5960, "Full-pretrain/Step Time": 17.633753802627325} +{"Full-pretrain/Learning Rate": 1.627243643803022e-05, "Full-pretrain/Loss": 1.8784925937652588, "Full-pretrain/Loss (Raw)": 1.7140401601791382, "Full-pretrain/Step": 5961, "Full-pretrain/Step Time": 17.63790361210704} +{"Full-pretrain/Learning Rate": 1.6264480352698812e-05, "Full-pretrain/Loss": 1.8781492710113525, "Full-pretrain/Loss (Raw)": 1.9339168071746826, "Full-pretrain/Step": 5962, "Full-pretrain/Step Time": 17.63244886510074} +{"Full-pretrain/Learning Rate": 1.6256525275006527e-05, "Full-pretrain/Loss": 1.8814265727996826, "Full-pretrain/Loss (Raw)": 1.935828685760498, "Full-pretrain/Step": 5963, "Full-pretrain/Step Time": 17.626883195713162} +{"Full-pretrain/Learning Rate": 1.624857120587097e-05, "Full-pretrain/Loss": 1.8948876857757568, "Full-pretrain/Loss (Raw)": 2.327296257019043, "Full-pretrain/Step": 5964, "Full-pretrain/Step Time": 17.621616354212165} +{"Full-pretrain/Learning Rate": 1.6240618146209658e-05, "Full-pretrain/Loss": 1.8812837600708008, "Full-pretrain/Loss (Raw)": 1.6714916229248047, "Full-pretrain/Step": 5965, "Full-pretrain/Step Time": 17.61943125538528} +{"Full-pretrain/Learning Rate": 1.6232666096939968e-05, "Full-pretrain/Loss": 1.9011127948760986, "Full-pretrain/Loss (Raw)": 2.0553665161132812, "Full-pretrain/Step": 5966, "Full-pretrain/Step Time": 17.619657088071108} +{"Full-pretrain/Learning Rate": 1.6224715058979157e-05, "Full-pretrain/Loss": 1.8969887495040894, "Full-pretrain/Loss (Raw)": 1.9854496717453003, "Full-pretrain/Step": 5967, "Full-pretrain/Step Time": 17.615485794842243} +{"Full-pretrain/Learning Rate": 1.6216765033244377e-05, "Full-pretrain/Loss": 1.9149508476257324, "Full-pretrain/Loss (Raw)": 2.2304205894470215, "Full-pretrain/Step": 5968, "Full-pretrain/Step Time": 17.614120811223984} +{"Full-pretrain/Learning Rate": 1.6208816020652666e-05, "Full-pretrain/Loss": 1.9344158172607422, "Full-pretrain/Loss (Raw)": 2.21842622756958, "Full-pretrain/Step": 5969, "Full-pretrain/Step Time": 17.620120955631137} +{"Full-pretrain/Learning Rate": 1.620086802212094e-05, "Full-pretrain/Loss": 1.9381346702575684, "Full-pretrain/Loss (Raw)": 2.030271053314209, "Full-pretrain/Step": 5970, "Full-pretrain/Step Time": 17.616883708164096} +{"Full-pretrain/Learning Rate": 1.6192921038565992e-05, "Full-pretrain/Loss": 1.9335397481918335, "Full-pretrain/Loss (Raw)": 1.6300655603408813, "Full-pretrain/Step": 5971, "Full-pretrain/Step Time": 17.616799341514707} +{"Full-pretrain/Learning Rate": 1.618497507090451e-05, "Full-pretrain/Loss": 1.9434230327606201, "Full-pretrain/Loss (Raw)": 2.059579849243164, "Full-pretrain/Step": 5972, "Full-pretrain/Step Time": 17.61701259203255} +{"Full-pretrain/Learning Rate": 1.617703012005306e-05, "Full-pretrain/Loss": 1.9360284805297852, "Full-pretrain/Loss (Raw)": 1.7707266807556152, "Full-pretrain/Step": 5973, "Full-pretrain/Step Time": 17.615783790126443} +{"Full-pretrain/Learning Rate": 1.6169086186928075e-05, "Full-pretrain/Loss": 1.938076138496399, "Full-pretrain/Loss (Raw)": 1.8979979753494263, "Full-pretrain/Step": 5974, "Full-pretrain/Step Time": 17.611501602455974} +{"Full-pretrain/Learning Rate": 1.61611432724459e-05, "Full-pretrain/Loss": 1.9305827617645264, "Full-pretrain/Loss (Raw)": 1.9385249614715576, "Full-pretrain/Step": 5975, "Full-pretrain/Step Time": 17.611154137179255} +{"Full-pretrain/Learning Rate": 1.615320137752274e-05, "Full-pretrain/Loss": 1.9404618740081787, "Full-pretrain/Loss (Raw)": 1.849295973777771, "Full-pretrain/Step": 5976, "Full-pretrain/Step Time": 17.61313190497458} +{"Full-pretrain/Learning Rate": 1.61452605030747e-05, "Full-pretrain/Loss": 1.9421114921569824, "Full-pretrain/Loss (Raw)": 2.0984108448028564, "Full-pretrain/Step": 5977, "Full-pretrain/Step Time": 17.611868115141988} +{"Full-pretrain/Learning Rate": 1.6137320650017743e-05, "Full-pretrain/Loss": 1.9460704326629639, "Full-pretrain/Loss (Raw)": 2.1033437252044678, "Full-pretrain/Step": 5978, "Full-pretrain/Step Time": 17.607746113091707} +{"Full-pretrain/Learning Rate": 1.612938181926773e-05, "Full-pretrain/Loss": 1.9428454637527466, "Full-pretrain/Loss (Raw)": 1.967299222946167, "Full-pretrain/Step": 5979, "Full-pretrain/Step Time": 17.613600095734} +{"Full-pretrain/Learning Rate": 1.6121444011740417e-05, "Full-pretrain/Loss": 1.9469406604766846, "Full-pretrain/Loss (Raw)": 2.0075762271881104, "Full-pretrain/Step": 5980, "Full-pretrain/Step Time": 17.60988443531096} +{"Full-pretrain/Learning Rate": 1.611350722835141e-05, "Full-pretrain/Loss": 1.9497950077056885, "Full-pretrain/Loss (Raw)": 1.9884341955184937, "Full-pretrain/Step": 5981, "Full-pretrain/Step Time": 17.612982742488384} +{"Full-pretrain/Learning Rate": 1.610557147001623e-05, "Full-pretrain/Loss": 1.9543967247009277, "Full-pretrain/Loss (Raw)": 2.0997085571289062, "Full-pretrain/Step": 5982, "Full-pretrain/Step Time": 17.60715789720416} +{"Full-pretrain/Learning Rate": 1.6097636737650245e-05, "Full-pretrain/Loss": 1.9565374851226807, "Full-pretrain/Loss (Raw)": 2.0079550743103027, "Full-pretrain/Step": 5983, "Full-pretrain/Step Time": 17.614494996145368} +{"Full-pretrain/Learning Rate": 1.6089703032168733e-05, "Full-pretrain/Loss": 1.960663080215454, "Full-pretrain/Loss (Raw)": 1.8922202587127686, "Full-pretrain/Step": 5984, "Full-pretrain/Step Time": 17.60990334674716} +{"Full-pretrain/Learning Rate": 1.6081770354486846e-05, "Full-pretrain/Loss": 1.9798818826675415, "Full-pretrain/Loss (Raw)": 2.224180221557617, "Full-pretrain/Step": 5985, "Full-pretrain/Step Time": 17.60598578862846} +{"Full-pretrain/Learning Rate": 1.6073838705519616e-05, "Full-pretrain/Loss": 1.987603783607483, "Full-pretrain/Loss (Raw)": 2.0339279174804688, "Full-pretrain/Step": 5986, "Full-pretrain/Step Time": 17.604843992739916} +{"Full-pretrain/Learning Rate": 1.606590808618196e-05, "Full-pretrain/Loss": 1.9800801277160645, "Full-pretrain/Loss (Raw)": 1.8342204093933105, "Full-pretrain/Step": 5987, "Full-pretrain/Step Time": 17.604042761027813} +{"Full-pretrain/Learning Rate": 1.6057978497388664e-05, "Full-pretrain/Loss": 1.9804604053497314, "Full-pretrain/Loss (Raw)": 2.029958963394165, "Full-pretrain/Step": 5988, "Full-pretrain/Step Time": 17.603228338062763} +{"Full-pretrain/Learning Rate": 1.6050049940054408e-05, "Full-pretrain/Loss": 1.9862112998962402, "Full-pretrain/Loss (Raw)": 2.0159642696380615, "Full-pretrain/Step": 5989, "Full-pretrain/Step Time": 17.5958990752697} +{"Full-pretrain/Learning Rate": 1.604212241509374e-05, "Full-pretrain/Loss": 1.9730255603790283, "Full-pretrain/Loss (Raw)": 1.6754180192947388, "Full-pretrain/Step": 5990, "Full-pretrain/Step Time": 17.600961374118924} +{"Full-pretrain/Learning Rate": 1.6034195923421105e-05, "Full-pretrain/Loss": 1.9868905544281006, "Full-pretrain/Loss (Raw)": 2.2516469955444336, "Full-pretrain/Step": 5991, "Full-pretrain/Step Time": 17.59521307423711} +{"Full-pretrain/Learning Rate": 1.602627046595082e-05, "Full-pretrain/Loss": 1.9795783758163452, "Full-pretrain/Loss (Raw)": 1.867539405822754, "Full-pretrain/Step": 5992, "Full-pretrain/Step Time": 17.599723802879453} +{"Full-pretrain/Learning Rate": 1.6018346043597092e-05, "Full-pretrain/Loss": 1.9902839660644531, "Full-pretrain/Loss (Raw)": 2.05662202835083, "Full-pretrain/Step": 5993, "Full-pretrain/Step Time": 17.595458449795842} +{"Full-pretrain/Learning Rate": 1.601042265727398e-05, "Full-pretrain/Loss": 1.994621753692627, "Full-pretrain/Loss (Raw)": 2.0727298259735107, "Full-pretrain/Step": 5994, "Full-pretrain/Step Time": 17.594622815027833} +{"Full-pretrain/Learning Rate": 1.6002500307895458e-05, "Full-pretrain/Loss": 1.9920222759246826, "Full-pretrain/Loss (Raw)": 1.8526417016983032, "Full-pretrain/Step": 5995, "Full-pretrain/Step Time": 17.596330558881164} +{"Full-pretrain/Learning Rate": 1.5994578996375363e-05, "Full-pretrain/Loss": 1.9907488822937012, "Full-pretrain/Loss (Raw)": 2.286547899246216, "Full-pretrain/Step": 5996, "Full-pretrain/Step Time": 17.597689041867852} +{"Full-pretrain/Learning Rate": 1.598665872362742e-05, "Full-pretrain/Loss": 2.017303466796875, "Full-pretrain/Loss (Raw)": 2.521237850189209, "Full-pretrain/Step": 5997, "Full-pretrain/Step Time": 17.59745510853827} +{"Full-pretrain/Learning Rate": 1.5978739490565227e-05, "Full-pretrain/Loss": 2.0183310508728027, "Full-pretrain/Loss (Raw)": 2.0882506370544434, "Full-pretrain/Step": 5998, "Full-pretrain/Step Time": 17.601720951497555} +{"Full-pretrain/Learning Rate": 1.5970821298102255e-05, "Full-pretrain/Loss": 2.025452136993408, "Full-pretrain/Loss (Raw)": 2.2133235931396484, "Full-pretrain/Step": 5999, "Full-pretrain/Step Time": 17.600171329453588} +{"Full-pretrain/Learning Rate": 1.5962904147151876e-05, "Full-pretrain/Loss": 2.0161566734313965, "Full-pretrain/Loss (Raw)": 1.9329643249511719, "Full-pretrain/Step": 6000, "Full-pretrain/Step Time": 17.599768726155162} +{"Full-pretrain/Learning Rate": 1.5954988038627328e-05, "Full-pretrain/Loss": 2.012970447540283, "Full-pretrain/Loss (Raw)": 2.116469144821167, "Full-pretrain/Step": 6001, "Full-pretrain/Step Time": 17.600528778508306} +{"Full-pretrain/Learning Rate": 1.594707297344173e-05, "Full-pretrain/Loss": 2.0146422386169434, "Full-pretrain/Loss (Raw)": 2.0837690830230713, "Full-pretrain/Step": 6002, "Full-pretrain/Step Time": 17.60432724095881} +{"Full-pretrain/Learning Rate": 1.5939158952508092e-05, "Full-pretrain/Loss": 2.026576280593872, "Full-pretrain/Loss (Raw)": 2.011958599090576, "Full-pretrain/Step": 6003, "Full-pretrain/Step Time": 17.595746966078877} +{"Full-pretrain/Learning Rate": 1.593124597673928e-05, "Full-pretrain/Loss": 2.0278749465942383, "Full-pretrain/Loss (Raw)": 2.1011316776275635, "Full-pretrain/Step": 6004, "Full-pretrain/Step Time": 17.597444580867887} +{"Full-pretrain/Learning Rate": 1.5923334047048056e-05, "Full-pretrain/Loss": 2.022165536880493, "Full-pretrain/Loss (Raw)": 1.5880333185195923, "Full-pretrain/Step": 6005, "Full-pretrain/Step Time": 17.603127297013998} +{"Full-pretrain/Learning Rate": 1.5915423164347055e-05, "Full-pretrain/Loss": 2.022979736328125, "Full-pretrain/Loss (Raw)": 1.924047589302063, "Full-pretrain/Step": 6006, "Full-pretrain/Step Time": 17.602898366749287} +{"Full-pretrain/Learning Rate": 1.5907513329548802e-05, "Full-pretrain/Loss": 2.027920961380005, "Full-pretrain/Loss (Raw)": 2.0966432094573975, "Full-pretrain/Step": 6007, "Full-pretrain/Step Time": 17.599658647552133} +{"Full-pretrain/Learning Rate": 1.589960454356569e-05, "Full-pretrain/Loss": 2.0222506523132324, "Full-pretrain/Loss (Raw)": 1.6678457260131836, "Full-pretrain/Step": 6008, "Full-pretrain/Step Time": 17.597497064620256} +{"Full-pretrain/Learning Rate": 1.5891696807310007e-05, "Full-pretrain/Loss": 2.0145018100738525, "Full-pretrain/Loss (Raw)": 1.850450038909912, "Full-pretrain/Step": 6009, "Full-pretrain/Step Time": 17.59436697140336} +{"Full-pretrain/Learning Rate": 1.5883790121693885e-05, "Full-pretrain/Loss": 2.0171632766723633, "Full-pretrain/Loss (Raw)": 2.1885061264038086, "Full-pretrain/Step": 6010, "Full-pretrain/Step Time": 17.593127639964223} +{"Full-pretrain/Learning Rate": 1.587588448762937e-05, "Full-pretrain/Loss": 2.009410858154297, "Full-pretrain/Loss (Raw)": 1.7192245721817017, "Full-pretrain/Step": 6011, "Full-pretrain/Step Time": 17.5962503105402} +{"Full-pretrain/Learning Rate": 1.586797990602838e-05, "Full-pretrain/Loss": 2.013762950897217, "Full-pretrain/Loss (Raw)": 2.1468496322631836, "Full-pretrain/Step": 6012, "Full-pretrain/Step Time": 17.60148500278592} +{"Full-pretrain/Learning Rate": 1.586007637780269e-05, "Full-pretrain/Loss": 2.007734537124634, "Full-pretrain/Loss (Raw)": 1.7955186367034912, "Full-pretrain/Step": 6013, "Full-pretrain/Step Time": 17.59922249428928} +{"Full-pretrain/Learning Rate": 1.5852173903863986e-05, "Full-pretrain/Loss": 1.9991834163665771, "Full-pretrain/Loss (Raw)": 1.8260715007781982, "Full-pretrain/Step": 6014, "Full-pretrain/Step Time": 17.596972158178687} +{"Full-pretrain/Learning Rate": 1.5844272485123806e-05, "Full-pretrain/Loss": 1.9990688562393188, "Full-pretrain/Loss (Raw)": 2.004291296005249, "Full-pretrain/Step": 6015, "Full-pretrain/Step Time": 17.596173100173473} +{"Full-pretrain/Learning Rate": 1.583637212249357e-05, "Full-pretrain/Loss": 1.9994562864303589, "Full-pretrain/Loss (Raw)": 1.9046210050582886, "Full-pretrain/Step": 6016, "Full-pretrain/Step Time": 17.601096661761403} +{"Full-pretrain/Learning Rate": 1.5828472816884594e-05, "Full-pretrain/Loss": 1.9908130168914795, "Full-pretrain/Loss (Raw)": 1.947594404220581, "Full-pretrain/Step": 6017, "Full-pretrain/Step Time": 17.596289582550526} +{"Full-pretrain/Learning Rate": 1.5820574569208053e-05, "Full-pretrain/Loss": 1.9768157005310059, "Full-pretrain/Loss (Raw)": 1.5860142707824707, "Full-pretrain/Step": 6018, "Full-pretrain/Step Time": 17.59298308752477} +{"Full-pretrain/Learning Rate": 1.5812677380375018e-05, "Full-pretrain/Loss": 1.9848085641860962, "Full-pretrain/Loss (Raw)": 2.08998966217041, "Full-pretrain/Step": 6019, "Full-pretrain/Step Time": 17.59241190738976} +{"Full-pretrain/Learning Rate": 1.5804781251296406e-05, "Full-pretrain/Loss": 1.9811948537826538, "Full-pretrain/Loss (Raw)": 1.914319634437561, "Full-pretrain/Step": 6020, "Full-pretrain/Step Time": 17.600659439340234} +{"Full-pretrain/Learning Rate": 1.5796886182883053e-05, "Full-pretrain/Loss": 1.9803121089935303, "Full-pretrain/Loss (Raw)": 1.987717866897583, "Full-pretrain/Step": 6021, "Full-pretrain/Step Time": 17.597293250262737} +{"Full-pretrain/Learning Rate": 1.5788992176045643e-05, "Full-pretrain/Loss": 1.9863704442977905, "Full-pretrain/Loss (Raw)": 1.869283676147461, "Full-pretrain/Step": 6022, "Full-pretrain/Step Time": 17.598456494510174} +{"Full-pretrain/Learning Rate": 1.5781099231694747e-05, "Full-pretrain/Loss": 1.9782096147537231, "Full-pretrain/Loss (Raw)": 1.9905014038085938, "Full-pretrain/Step": 6023, "Full-pretrain/Step Time": 17.599025316536427} +{"Full-pretrain/Learning Rate": 1.5773207350740825e-05, "Full-pretrain/Loss": 1.9804506301879883, "Full-pretrain/Loss (Raw)": 1.9392516613006592, "Full-pretrain/Step": 6024, "Full-pretrain/Step Time": 17.608761303126812} +{"Full-pretrain/Learning Rate": 1.5765316534094182e-05, "Full-pretrain/Loss": 1.9851024150848389, "Full-pretrain/Loss (Raw)": 2.205475330352783, "Full-pretrain/Step": 6025, "Full-pretrain/Step Time": 17.60527284629643} +{"Full-pretrain/Learning Rate": 1.575742678266503e-05, "Full-pretrain/Loss": 1.9840424060821533, "Full-pretrain/Loss (Raw)": 2.0388097763061523, "Full-pretrain/Step": 6026, "Full-pretrain/Step Time": 17.60339775495231} +{"Full-pretrain/Learning Rate": 1.5749538097363452e-05, "Full-pretrain/Loss": 1.9932971000671387, "Full-pretrain/Loss (Raw)": 2.1487956047058105, "Full-pretrain/Step": 6027, "Full-pretrain/Step Time": 17.607395388185978} +{"Full-pretrain/Learning Rate": 1.57416504790994e-05, "Full-pretrain/Loss": 1.9850776195526123, "Full-pretrain/Loss (Raw)": 2.023521900177002, "Full-pretrain/Step": 6028, "Full-pretrain/Step Time": 17.61591020412743} +{"Full-pretrain/Learning Rate": 1.5733763928782723e-05, "Full-pretrain/Loss": 1.96482515335083, "Full-pretrain/Loss (Raw)": 1.8731602430343628, "Full-pretrain/Step": 6029, "Full-pretrain/Step Time": 17.61041136085987} +{"Full-pretrain/Learning Rate": 1.572587844732312e-05, "Full-pretrain/Loss": 1.9664978981018066, "Full-pretrain/Loss (Raw)": 2.1417741775512695, "Full-pretrain/Step": 6030, "Full-pretrain/Step Time": 17.609756913036108} +{"Full-pretrain/Learning Rate": 1.5717994035630174e-05, "Full-pretrain/Loss": 1.9589362144470215, "Full-pretrain/Loss (Raw)": 1.9713517427444458, "Full-pretrain/Step": 6031, "Full-pretrain/Step Time": 17.61535313539207} +{"Full-pretrain/Learning Rate": 1.571011069461335e-05, "Full-pretrain/Loss": 1.9599781036376953, "Full-pretrain/Loss (Raw)": 1.966306447982788, "Full-pretrain/Step": 6032, "Full-pretrain/Step Time": 17.611376851797104} +{"Full-pretrain/Learning Rate": 1.5702228425181995e-05, "Full-pretrain/Loss": 1.950613021850586, "Full-pretrain/Loss (Raw)": 1.8167877197265625, "Full-pretrain/Step": 6033, "Full-pretrain/Step Time": 17.61591866798699} +{"Full-pretrain/Learning Rate": 1.569434722824532e-05, "Full-pretrain/Loss": 1.944515347480774, "Full-pretrain/Loss (Raw)": 1.8886412382125854, "Full-pretrain/Step": 6034, "Full-pretrain/Step Time": 17.609014339745045} +{"Full-pretrain/Learning Rate": 1.568646710471244e-05, "Full-pretrain/Loss": 1.9380621910095215, "Full-pretrain/Loss (Raw)": 1.805457353591919, "Full-pretrain/Step": 6035, "Full-pretrain/Step Time": 17.611636927351356} +{"Full-pretrain/Learning Rate": 1.567858805549229e-05, "Full-pretrain/Loss": 1.925150990486145, "Full-pretrain/Loss (Raw)": 1.6879761219024658, "Full-pretrain/Step": 6036, "Full-pretrain/Step Time": 17.610297629609704} +{"Full-pretrain/Learning Rate": 1.567071008149373e-05, "Full-pretrain/Loss": 1.936614751815796, "Full-pretrain/Loss (Raw)": 1.9548743963241577, "Full-pretrain/Step": 6037, "Full-pretrain/Step Time": 17.614644203335047} +{"Full-pretrain/Learning Rate": 1.5662833183625493e-05, "Full-pretrain/Loss": 1.9412977695465088, "Full-pretrain/Loss (Raw)": 2.073902130126953, "Full-pretrain/Step": 6038, "Full-pretrain/Step Time": 17.614060239866376} +{"Full-pretrain/Learning Rate": 1.5654957362796162e-05, "Full-pretrain/Loss": 1.9362177848815918, "Full-pretrain/Loss (Raw)": 1.9340847730636597, "Full-pretrain/Step": 6039, "Full-pretrain/Step Time": 17.61395078152418} +{"Full-pretrain/Learning Rate": 1.564708261991422e-05, "Full-pretrain/Loss": 1.9496164321899414, "Full-pretrain/Loss (Raw)": 2.096604585647583, "Full-pretrain/Step": 6040, "Full-pretrain/Step Time": 17.61495358683169} +{"Full-pretrain/Learning Rate": 1.5639208955888007e-05, "Full-pretrain/Loss": 1.9501914978027344, "Full-pretrain/Loss (Raw)": 1.8688480854034424, "Full-pretrain/Step": 6041, "Full-pretrain/Step Time": 17.613434690982103} +{"Full-pretrain/Learning Rate": 1.563133637162575e-05, "Full-pretrain/Loss": 1.9536097049713135, "Full-pretrain/Loss (Raw)": 2.29789137840271, "Full-pretrain/Step": 6042, "Full-pretrain/Step Time": 17.61027837730944} +{"Full-pretrain/Learning Rate": 1.5623464868035548e-05, "Full-pretrain/Loss": 1.9576468467712402, "Full-pretrain/Loss (Raw)": 1.8484117984771729, "Full-pretrain/Step": 6043, "Full-pretrain/Step Time": 17.61406403966248} +{"Full-pretrain/Learning Rate": 1.561559444602538e-05, "Full-pretrain/Loss": 1.9399210214614868, "Full-pretrain/Loss (Raw)": 1.5796217918395996, "Full-pretrain/Step": 6044, "Full-pretrain/Step Time": 17.61468769982457} +{"Full-pretrain/Learning Rate": 1.5607725106503105e-05, "Full-pretrain/Loss": 1.9392790794372559, "Full-pretrain/Loss (Raw)": 1.774979829788208, "Full-pretrain/Step": 6045, "Full-pretrain/Step Time": 17.61235835030675} +{"Full-pretrain/Learning Rate": 1.5599856850376426e-05, "Full-pretrain/Loss": 1.9414489269256592, "Full-pretrain/Loss (Raw)": 1.895500898361206, "Full-pretrain/Step": 6046, "Full-pretrain/Step Time": 17.606074264273047} +{"Full-pretrain/Learning Rate": 1.5591989678552963e-05, "Full-pretrain/Loss": 1.9417792558670044, "Full-pretrain/Loss (Raw)": 2.0148661136627197, "Full-pretrain/Step": 6047, "Full-pretrain/Step Time": 17.600588152185082} +{"Full-pretrain/Learning Rate": 1.5584123591940178e-05, "Full-pretrain/Loss": 1.947526454925537, "Full-pretrain/Loss (Raw)": 2.0885283946990967, "Full-pretrain/Step": 6048, "Full-pretrain/Step Time": 17.602960685268044} +{"Full-pretrain/Learning Rate": 1.557625859144543e-05, "Full-pretrain/Loss": 1.9472428560256958, "Full-pretrain/Loss (Raw)": 1.9385223388671875, "Full-pretrain/Step": 6049, "Full-pretrain/Step Time": 17.59961318783462} +{"Full-pretrain/Learning Rate": 1.556839467797594e-05, "Full-pretrain/Loss": 1.959341287612915, "Full-pretrain/Loss (Raw)": 1.9731621742248535, "Full-pretrain/Step": 6050, "Full-pretrain/Step Time": 17.599499644711614} +{"Full-pretrain/Learning Rate": 1.556053185243882e-05, "Full-pretrain/Loss": 1.9623042345046997, "Full-pretrain/Loss (Raw)": 2.1848092079162598, "Full-pretrain/Step": 6051, "Full-pretrain/Step Time": 17.596147630363703} +{"Full-pretrain/Learning Rate": 1.5552670115741024e-05, "Full-pretrain/Loss": 1.9571175575256348, "Full-pretrain/Loss (Raw)": 1.7483432292938232, "Full-pretrain/Step": 6052, "Full-pretrain/Step Time": 17.592737013474107} +{"Full-pretrain/Learning Rate": 1.5544809468789407e-05, "Full-pretrain/Loss": 1.9611456394195557, "Full-pretrain/Loss (Raw)": 2.11661434173584, "Full-pretrain/Step": 6053, "Full-pretrain/Step Time": 17.597537713125348} +{"Full-pretrain/Learning Rate": 1.5536949912490702e-05, "Full-pretrain/Loss": 1.9642891883850098, "Full-pretrain/Loss (Raw)": 1.9698787927627563, "Full-pretrain/Step": 6054, "Full-pretrain/Step Time": 17.59257628954947} +{"Full-pretrain/Learning Rate": 1.5529091447751495e-05, "Full-pretrain/Loss": 1.971287727355957, "Full-pretrain/Loss (Raw)": 2.2144548892974854, "Full-pretrain/Step": 6055, "Full-pretrain/Step Time": 17.5905515383929} +{"Full-pretrain/Learning Rate": 1.5521234075478265e-05, "Full-pretrain/Loss": 1.9672915935516357, "Full-pretrain/Loss (Raw)": 1.811370849609375, "Full-pretrain/Step": 6056, "Full-pretrain/Step Time": 17.590610271319747} +{"Full-pretrain/Learning Rate": 1.5513377796577356e-05, "Full-pretrain/Loss": 1.9672160148620605, "Full-pretrain/Loss (Raw)": 2.203056573867798, "Full-pretrain/Step": 6057, "Full-pretrain/Step Time": 17.579416263848543} +{"Full-pretrain/Learning Rate": 1.5505522611954975e-05, "Full-pretrain/Loss": 1.9614746570587158, "Full-pretrain/Loss (Raw)": 1.8550848960876465, "Full-pretrain/Step": 6058, "Full-pretrain/Step Time": 17.585769951343536} +{"Full-pretrain/Learning Rate": 1.549766852251723e-05, "Full-pretrain/Loss": 1.9599032402038574, "Full-pretrain/Loss (Raw)": 2.0985140800476074, "Full-pretrain/Step": 6059, "Full-pretrain/Step Time": 17.586071452125907} +{"Full-pretrain/Learning Rate": 1.5489815529170078e-05, "Full-pretrain/Loss": 1.9593936204910278, "Full-pretrain/Loss (Raw)": 2.007213592529297, "Full-pretrain/Step": 6060, "Full-pretrain/Step Time": 17.583717530593276} +{"Full-pretrain/Learning Rate": 1.548196363281937e-05, "Full-pretrain/Loss": 1.9662082195281982, "Full-pretrain/Loss (Raw)": 2.091226100921631, "Full-pretrain/Step": 6061, "Full-pretrain/Step Time": 17.57879122532904} +{"Full-pretrain/Learning Rate": 1.5474112834370802e-05, "Full-pretrain/Loss": 1.955560326576233, "Full-pretrain/Loss (Raw)": 1.8010433912277222, "Full-pretrain/Step": 6062, "Full-pretrain/Step Time": 17.58138858154416} +{"Full-pretrain/Learning Rate": 1.5466263134729975e-05, "Full-pretrain/Loss": 1.9544498920440674, "Full-pretrain/Loss (Raw)": 1.9358158111572266, "Full-pretrain/Step": 6063, "Full-pretrain/Step Time": 17.581897366791964} +{"Full-pretrain/Learning Rate": 1.5458414534802348e-05, "Full-pretrain/Loss": 1.948265552520752, "Full-pretrain/Loss (Raw)": 1.7684102058410645, "Full-pretrain/Step": 6064, "Full-pretrain/Step Time": 17.584593672305346} +{"Full-pretrain/Learning Rate": 1.5450567035493246e-05, "Full-pretrain/Loss": 1.9630106687545776, "Full-pretrain/Loss (Raw)": 2.288630485534668, "Full-pretrain/Step": 6065, "Full-pretrain/Step Time": 17.579335030168295} +{"Full-pretrain/Learning Rate": 1.5442720637707892e-05, "Full-pretrain/Loss": 1.970432162284851, "Full-pretrain/Loss (Raw)": 2.126131772994995, "Full-pretrain/Step": 6066, "Full-pretrain/Step Time": 17.583015156909823} +{"Full-pretrain/Learning Rate": 1.5434875342351342e-05, "Full-pretrain/Loss": 1.9736902713775635, "Full-pretrain/Loss (Raw)": 1.9097132682800293, "Full-pretrain/Step": 6067, "Full-pretrain/Step Time": 17.577130349352956} +{"Full-pretrain/Learning Rate": 1.5427031150328563e-05, "Full-pretrain/Loss": 1.9795182943344116, "Full-pretrain/Loss (Raw)": 1.8744757175445557, "Full-pretrain/Step": 6068, "Full-pretrain/Step Time": 17.579111631959677} +{"Full-pretrain/Learning Rate": 1.5419188062544374e-05, "Full-pretrain/Loss": 1.9795626401901245, "Full-pretrain/Loss (Raw)": 1.9562934637069702, "Full-pretrain/Step": 6069, "Full-pretrain/Step Time": 17.580067615956068} +{"Full-pretrain/Learning Rate": 1.5411346079903476e-05, "Full-pretrain/Loss": 1.9687434434890747, "Full-pretrain/Loss (Raw)": 1.7276883125305176, "Full-pretrain/Step": 6070, "Full-pretrain/Step Time": 17.578429432585835} +{"Full-pretrain/Learning Rate": 1.540350520331044e-05, "Full-pretrain/Loss": 1.9719845056533813, "Full-pretrain/Loss (Raw)": 2.037799119949341, "Full-pretrain/Step": 6071, "Full-pretrain/Step Time": 17.578690119087696} +{"Full-pretrain/Learning Rate": 1.539566543366971e-05, "Full-pretrain/Loss": 1.9773188829421997, "Full-pretrain/Loss (Raw)": 2.2673027515411377, "Full-pretrain/Step": 6072, "Full-pretrain/Step Time": 17.57851585932076} +{"Full-pretrain/Learning Rate": 1.5387826771885597e-05, "Full-pretrain/Loss": 1.9753532409667969, "Full-pretrain/Loss (Raw)": 1.8059450387954712, "Full-pretrain/Step": 6073, "Full-pretrain/Step Time": 17.578930346295238} +{"Full-pretrain/Learning Rate": 1.537998921886228e-05, "Full-pretrain/Loss": 1.964766025543213, "Full-pretrain/Loss (Raw)": 1.9591013193130493, "Full-pretrain/Step": 6074, "Full-pretrain/Step Time": 17.577311389148235} +{"Full-pretrain/Learning Rate": 1.5372152775503827e-05, "Full-pretrain/Loss": 1.967619776725769, "Full-pretrain/Loss (Raw)": 1.939734935760498, "Full-pretrain/Step": 6075, "Full-pretrain/Step Time": 17.576939893886447} +{"Full-pretrain/Learning Rate": 1.536431744271417e-05, "Full-pretrain/Loss": 1.9797587394714355, "Full-pretrain/Loss (Raw)": 1.9680676460266113, "Full-pretrain/Step": 6076, "Full-pretrain/Step Time": 17.579939901828766} +{"Full-pretrain/Learning Rate": 1.535648322139712e-05, "Full-pretrain/Loss": 1.9775117635726929, "Full-pretrain/Loss (Raw)": 1.70307457447052, "Full-pretrain/Step": 6077, "Full-pretrain/Step Time": 17.58773149177432} +{"Full-pretrain/Learning Rate": 1.534865011245633e-05, "Full-pretrain/Loss": 1.9821701049804688, "Full-pretrain/Loss (Raw)": 2.0445685386657715, "Full-pretrain/Step": 6078, "Full-pretrain/Step Time": 17.578709561377764} +{"Full-pretrain/Learning Rate": 1.5340818116795357e-05, "Full-pretrain/Loss": 1.9862608909606934, "Full-pretrain/Loss (Raw)": 2.145775079727173, "Full-pretrain/Step": 6079, "Full-pretrain/Step Time": 17.58773453347385} +{"Full-pretrain/Learning Rate": 1.5332987235317626e-05, "Full-pretrain/Loss": 1.9860079288482666, "Full-pretrain/Loss (Raw)": 2.080432415008545, "Full-pretrain/Step": 6080, "Full-pretrain/Step Time": 17.587852651253343} +{"Full-pretrain/Learning Rate": 1.5325157468926414e-05, "Full-pretrain/Loss": 1.9839162826538086, "Full-pretrain/Loss (Raw)": 1.8715875148773193, "Full-pretrain/Step": 6081, "Full-pretrain/Step Time": 17.589584302157164} +{"Full-pretrain/Learning Rate": 1.53173288185249e-05, "Full-pretrain/Loss": 1.9860929250717163, "Full-pretrain/Loss (Raw)": 2.0428175926208496, "Full-pretrain/Step": 6082, "Full-pretrain/Step Time": 17.587985888123512} +{"Full-pretrain/Learning Rate": 1.5309501285016093e-05, "Full-pretrain/Loss": 1.979330062866211, "Full-pretrain/Loss (Raw)": 1.9683973789215088, "Full-pretrain/Step": 6083, "Full-pretrain/Step Time": 17.586731990799308} +{"Full-pretrain/Learning Rate": 1.5301674869302906e-05, "Full-pretrain/Loss": 1.9897079467773438, "Full-pretrain/Loss (Raw)": 2.0804381370544434, "Full-pretrain/Step": 6084, "Full-pretrain/Step Time": 17.589780516922474} +{"Full-pretrain/Learning Rate": 1.5293849572288117e-05, "Full-pretrain/Loss": 1.9901156425476074, "Full-pretrain/Loss (Raw)": 2.129655361175537, "Full-pretrain/Step": 6085, "Full-pretrain/Step Time": 17.58648681268096} +{"Full-pretrain/Learning Rate": 1.5286025394874364e-05, "Full-pretrain/Loss": 1.9839823246002197, "Full-pretrain/Loss (Raw)": 1.773613452911377, "Full-pretrain/Step": 6086, "Full-pretrain/Step Time": 17.58615145459771} +{"Full-pretrain/Learning Rate": 1.5278202337964182e-05, "Full-pretrain/Loss": 1.9674900770187378, "Full-pretrain/Loss (Raw)": 1.6867034435272217, "Full-pretrain/Step": 6087, "Full-pretrain/Step Time": 17.579355398193} +{"Full-pretrain/Learning Rate": 1.5270380402459933e-05, "Full-pretrain/Loss": 1.9679161310195923, "Full-pretrain/Loss (Raw)": 1.8250060081481934, "Full-pretrain/Step": 6088, "Full-pretrain/Step Time": 17.59203291684389} +{"Full-pretrain/Learning Rate": 1.526255958926389e-05, "Full-pretrain/Loss": 1.9619090557098389, "Full-pretrain/Loss (Raw)": 2.010831356048584, "Full-pretrain/Step": 6089, "Full-pretrain/Step Time": 17.587907545268536} +{"Full-pretrain/Learning Rate": 1.5254739899278173e-05, "Full-pretrain/Loss": 1.9752624034881592, "Full-pretrain/Loss (Raw)": 2.282396078109741, "Full-pretrain/Step": 6090, "Full-pretrain/Step Time": 17.591422831639647} +{"Full-pretrain/Learning Rate": 1.5246921333404784e-05, "Full-pretrain/Loss": 1.9703463315963745, "Full-pretrain/Loss (Raw)": 1.9411962032318115, "Full-pretrain/Step": 6091, "Full-pretrain/Step Time": 17.591249445453286} +{"Full-pretrain/Learning Rate": 1.5239103892545589e-05, "Full-pretrain/Loss": 1.9649147987365723, "Full-pretrain/Loss (Raw)": 1.83340585231781, "Full-pretrain/Step": 6092, "Full-pretrain/Step Time": 17.603143451735377} +{"Full-pretrain/Learning Rate": 1.5231287577602343e-05, "Full-pretrain/Loss": 1.957398772239685, "Full-pretrain/Loss (Raw)": 1.8507094383239746, "Full-pretrain/Step": 6093, "Full-pretrain/Step Time": 17.596678590402007} +{"Full-pretrain/Learning Rate": 1.5223472389476628e-05, "Full-pretrain/Loss": 1.9660680294036865, "Full-pretrain/Loss (Raw)": 2.078462839126587, "Full-pretrain/Step": 6094, "Full-pretrain/Step Time": 17.597042478621006} +{"Full-pretrain/Learning Rate": 1.521565832906994e-05, "Full-pretrain/Loss": 1.9690139293670654, "Full-pretrain/Loss (Raw)": 2.030082941055298, "Full-pretrain/Step": 6095, "Full-pretrain/Step Time": 17.600788405165076} +{"Full-pretrain/Learning Rate": 1.520784539728363e-05, "Full-pretrain/Loss": 1.9707814455032349, "Full-pretrain/Loss (Raw)": 1.8249691724777222, "Full-pretrain/Step": 6096, "Full-pretrain/Step Time": 17.60650041140616} +{"Full-pretrain/Learning Rate": 1.520003359501891e-05, "Full-pretrain/Loss": 1.9575812816619873, "Full-pretrain/Loss (Raw)": 1.8662230968475342, "Full-pretrain/Step": 6097, "Full-pretrain/Step Time": 17.59433059953153} +{"Full-pretrain/Learning Rate": 1.519222292317687e-05, "Full-pretrain/Loss": 1.9549967050552368, "Full-pretrain/Loss (Raw)": 2.043426513671875, "Full-pretrain/Step": 6098, "Full-pretrain/Step Time": 17.591172881424427} +{"Full-pretrain/Learning Rate": 1.5184413382658471e-05, "Full-pretrain/Loss": 1.9519293308258057, "Full-pretrain/Loss (Raw)": 1.8115588426589966, "Full-pretrain/Step": 6099, "Full-pretrain/Step Time": 17.591945515945554} +{"Full-pretrain/Learning Rate": 1.5176604974364533e-05, "Full-pretrain/Loss": 1.953172206878662, "Full-pretrain/Loss (Raw)": 1.9142439365386963, "Full-pretrain/Step": 6100, "Full-pretrain/Step Time": 17.60128833167255} +{"Full-pretrain/Learning Rate": 1.5168797699195763e-05, "Full-pretrain/Loss": 1.9548494815826416, "Full-pretrain/Loss (Raw)": 2.009967803955078, "Full-pretrain/Step": 6101, "Full-pretrain/Step Time": 17.599381180480123} +{"Full-pretrain/Learning Rate": 1.5160991558052722e-05, "Full-pretrain/Loss": 1.9613522291183472, "Full-pretrain/Loss (Raw)": 1.935776710510254, "Full-pretrain/Step": 6102, "Full-pretrain/Step Time": 17.601398991420865} +{"Full-pretrain/Learning Rate": 1.5153186551835857e-05, "Full-pretrain/Loss": 1.9588453769683838, "Full-pretrain/Loss (Raw)": 1.95758056640625, "Full-pretrain/Step": 6103, "Full-pretrain/Step Time": 17.602288767695427} +{"Full-pretrain/Learning Rate": 1.5145382681445453e-05, "Full-pretrain/Loss": 1.9495536088943481, "Full-pretrain/Loss (Raw)": 1.9699660539627075, "Full-pretrain/Step": 6104, "Full-pretrain/Step Time": 17.607575045898557} +{"Full-pretrain/Learning Rate": 1.513757994778169e-05, "Full-pretrain/Loss": 1.9568054676055908, "Full-pretrain/Loss (Raw)": 2.0380067825317383, "Full-pretrain/Step": 6105, "Full-pretrain/Step Time": 17.602275043725967} +{"Full-pretrain/Learning Rate": 1.5129778351744623e-05, "Full-pretrain/Loss": 1.9579983949661255, "Full-pretrain/Loss (Raw)": 1.9972724914550781, "Full-pretrain/Step": 6106, "Full-pretrain/Step Time": 17.600941095501184} +{"Full-pretrain/Learning Rate": 1.5121977894234147e-05, "Full-pretrain/Loss": 1.9633607864379883, "Full-pretrain/Loss (Raw)": 2.111330270767212, "Full-pretrain/Step": 6107, "Full-pretrain/Step Time": 17.599977618083358} +{"Full-pretrain/Learning Rate": 1.511417857615005e-05, "Full-pretrain/Loss": 1.9597371816635132, "Full-pretrain/Loss (Raw)": 1.8521132469177246, "Full-pretrain/Step": 6108, "Full-pretrain/Step Time": 17.60407004132867} +{"Full-pretrain/Learning Rate": 1.5106380398391993e-05, "Full-pretrain/Loss": 1.9666883945465088, "Full-pretrain/Loss (Raw)": 1.9255108833312988, "Full-pretrain/Step": 6109, "Full-pretrain/Step Time": 17.601778829470277} +{"Full-pretrain/Learning Rate": 1.509858336185947e-05, "Full-pretrain/Loss": 1.9640252590179443, "Full-pretrain/Loss (Raw)": 1.9593515396118164, "Full-pretrain/Step": 6110, "Full-pretrain/Step Time": 17.60435282625258} +{"Full-pretrain/Learning Rate": 1.5090787467451872e-05, "Full-pretrain/Loss": 1.9425675868988037, "Full-pretrain/Loss (Raw)": 1.4591286182403564, "Full-pretrain/Step": 6111, "Full-pretrain/Step Time": 17.600952979177237} +{"Full-pretrain/Learning Rate": 1.5082992716068461e-05, "Full-pretrain/Loss": 1.935516119003296, "Full-pretrain/Loss (Raw)": 1.8547860383987427, "Full-pretrain/Step": 6112, "Full-pretrain/Step Time": 17.60540099069476} +{"Full-pretrain/Learning Rate": 1.5075199108608357e-05, "Full-pretrain/Loss": 1.9312524795532227, "Full-pretrain/Loss (Raw)": 1.7351499795913696, "Full-pretrain/Step": 6113, "Full-pretrain/Step Time": 17.609385635703802} +{"Full-pretrain/Learning Rate": 1.506740664597055e-05, "Full-pretrain/Loss": 1.9274277687072754, "Full-pretrain/Loss (Raw)": 1.920426368713379, "Full-pretrain/Step": 6114, "Full-pretrain/Step Time": 17.605675134807825} +{"Full-pretrain/Learning Rate": 1.50596153290539e-05, "Full-pretrain/Loss": 1.924965262413025, "Full-pretrain/Loss (Raw)": 1.8895965814590454, "Full-pretrain/Step": 6115, "Full-pretrain/Step Time": 17.606236113235354} +{"Full-pretrain/Learning Rate": 1.5051825158757116e-05, "Full-pretrain/Loss": 1.9086476564407349, "Full-pretrain/Loss (Raw)": 1.5582761764526367, "Full-pretrain/Step": 6116, "Full-pretrain/Step Time": 17.606368109583855} +{"Full-pretrain/Learning Rate": 1.5044036135978809e-05, "Full-pretrain/Loss": 1.8984414339065552, "Full-pretrain/Loss (Raw)": 1.8030591011047363, "Full-pretrain/Step": 6117, "Full-pretrain/Step Time": 17.61445460654795} +{"Full-pretrain/Learning Rate": 1.5036248261617433e-05, "Full-pretrain/Loss": 1.9034180641174316, "Full-pretrain/Loss (Raw)": 1.9328622817993164, "Full-pretrain/Step": 6118, "Full-pretrain/Step Time": 17.609777426347136} +{"Full-pretrain/Learning Rate": 1.5028461536571328e-05, "Full-pretrain/Loss": 1.9098788499832153, "Full-pretrain/Loss (Raw)": 1.8934473991394043, "Full-pretrain/Step": 6119, "Full-pretrain/Step Time": 17.611025359481573} +{"Full-pretrain/Learning Rate": 1.5020675961738672e-05, "Full-pretrain/Loss": 1.9110674858093262, "Full-pretrain/Loss (Raw)": 1.8630414009094238, "Full-pretrain/Step": 6120, "Full-pretrain/Step Time": 17.607664201408625} +{"Full-pretrain/Learning Rate": 1.5012891538017537e-05, "Full-pretrain/Loss": 1.9088709354400635, "Full-pretrain/Loss (Raw)": 1.9405466318130493, "Full-pretrain/Step": 6121, "Full-pretrain/Step Time": 17.6142931971699} +{"Full-pretrain/Learning Rate": 1.5005108266305856e-05, "Full-pretrain/Loss": 1.8963332176208496, "Full-pretrain/Loss (Raw)": 1.8811852931976318, "Full-pretrain/Step": 6122, "Full-pretrain/Step Time": 17.616948168724775} +{"Full-pretrain/Learning Rate": 1.4997326147501422e-05, "Full-pretrain/Loss": 1.8973190784454346, "Full-pretrain/Loss (Raw)": 1.9727466106414795, "Full-pretrain/Step": 6123, "Full-pretrain/Step Time": 17.60907393321395} +{"Full-pretrain/Learning Rate": 1.498954518250191e-05, "Full-pretrain/Loss": 1.8992444276809692, "Full-pretrain/Loss (Raw)": 1.8950152397155762, "Full-pretrain/Step": 6124, "Full-pretrain/Step Time": 17.61669241823256} +{"Full-pretrain/Learning Rate": 1.4981765372204834e-05, "Full-pretrain/Loss": 1.9056974649429321, "Full-pretrain/Loss (Raw)": 2.057209014892578, "Full-pretrain/Step": 6125, "Full-pretrain/Step Time": 17.614245783537626} +{"Full-pretrain/Learning Rate": 1.4973986717507599e-05, "Full-pretrain/Loss": 1.884995460510254, "Full-pretrain/Loss (Raw)": 1.4159979820251465, "Full-pretrain/Step": 6126, "Full-pretrain/Step Time": 17.61370793171227} +{"Full-pretrain/Learning Rate": 1.4966209219307476e-05, "Full-pretrain/Loss": 1.8858270645141602, "Full-pretrain/Loss (Raw)": 2.0566930770874023, "Full-pretrain/Step": 6127, "Full-pretrain/Step Time": 17.609901463612914} +{"Full-pretrain/Learning Rate": 1.4958432878501593e-05, "Full-pretrain/Loss": 1.8977932929992676, "Full-pretrain/Loss (Raw)": 2.2078909873962402, "Full-pretrain/Step": 6128, "Full-pretrain/Step Time": 17.60716982372105} +{"Full-pretrain/Learning Rate": 1.4950657695986952e-05, "Full-pretrain/Loss": 1.900512456893921, "Full-pretrain/Loss (Raw)": 1.9532338380813599, "Full-pretrain/Step": 6129, "Full-pretrain/Step Time": 17.605234222486615} +{"Full-pretrain/Learning Rate": 1.4942883672660418e-05, "Full-pretrain/Loss": 1.8924689292907715, "Full-pretrain/Loss (Raw)": 1.7860348224639893, "Full-pretrain/Step": 6130, "Full-pretrain/Step Time": 17.609389629215002} +{"Full-pretrain/Learning Rate": 1.4935110809418712e-05, "Full-pretrain/Loss": 1.905741572380066, "Full-pretrain/Loss (Raw)": 2.2362828254699707, "Full-pretrain/Step": 6131, "Full-pretrain/Step Time": 17.607938554137945} +{"Full-pretrain/Learning Rate": 1.4927339107158437e-05, "Full-pretrain/Loss": 1.9076496362686157, "Full-pretrain/Loss (Raw)": 1.975302815437317, "Full-pretrain/Step": 6132, "Full-pretrain/Step Time": 17.603222623467445} +{"Full-pretrain/Learning Rate": 1.4919568566776055e-05, "Full-pretrain/Loss": 1.9004828929901123, "Full-pretrain/Loss (Raw)": 1.780630111694336, "Full-pretrain/Step": 6133, "Full-pretrain/Step Time": 17.600418826565146} +{"Full-pretrain/Learning Rate": 1.4911799189167896e-05, "Full-pretrain/Loss": 1.897581696510315, "Full-pretrain/Loss (Raw)": 1.8429396152496338, "Full-pretrain/Step": 6134, "Full-pretrain/Step Time": 17.606622006744146} +{"Full-pretrain/Learning Rate": 1.4904030975230166e-05, "Full-pretrain/Loss": 1.894242763519287, "Full-pretrain/Loss (Raw)": 1.8507347106933594, "Full-pretrain/Step": 6135, "Full-pretrain/Step Time": 17.603031165897846} +{"Full-pretrain/Learning Rate": 1.4896263925858903e-05, "Full-pretrain/Loss": 1.8888320922851562, "Full-pretrain/Loss (Raw)": 1.7968236207962036, "Full-pretrain/Step": 6136, "Full-pretrain/Step Time": 17.601723857223988} +{"Full-pretrain/Learning Rate": 1.4888498041950045e-05, "Full-pretrain/Loss": 1.8849014043807983, "Full-pretrain/Loss (Raw)": 1.9122250080108643, "Full-pretrain/Step": 6137, "Full-pretrain/Step Time": 17.60288575105369} +{"Full-pretrain/Learning Rate": 1.4880733324399394e-05, "Full-pretrain/Loss": 1.8839083909988403, "Full-pretrain/Loss (Raw)": 1.965496301651001, "Full-pretrain/Step": 6138, "Full-pretrain/Step Time": 17.610735038295388} +{"Full-pretrain/Learning Rate": 1.4872969774102589e-05, "Full-pretrain/Loss": 1.8845006227493286, "Full-pretrain/Loss (Raw)": 2.130281448364258, "Full-pretrain/Step": 6139, "Full-pretrain/Step Time": 17.608015585690737} +{"Full-pretrain/Learning Rate": 1.4865207391955171e-05, "Full-pretrain/Loss": 1.885218620300293, "Full-pretrain/Loss (Raw)": 1.8750863075256348, "Full-pretrain/Step": 6140, "Full-pretrain/Step Time": 17.601654086261988} +{"Full-pretrain/Learning Rate": 1.485744617885251e-05, "Full-pretrain/Loss": 1.8888559341430664, "Full-pretrain/Loss (Raw)": 2.0419063568115234, "Full-pretrain/Step": 6141, "Full-pretrain/Step Time": 17.604508005082607} +{"Full-pretrain/Learning Rate": 1.484968613568987e-05, "Full-pretrain/Loss": 1.889149785041809, "Full-pretrain/Loss (Raw)": 1.9687576293945312, "Full-pretrain/Step": 6142, "Full-pretrain/Step Time": 17.609092380851507} +{"Full-pretrain/Learning Rate": 1.4841927263362365e-05, "Full-pretrain/Loss": 1.9019267559051514, "Full-pretrain/Loss (Raw)": 1.8679907321929932, "Full-pretrain/Step": 6143, "Full-pretrain/Step Time": 17.60945476964116} +{"Full-pretrain/Learning Rate": 1.483416956276498e-05, "Full-pretrain/Loss": 1.9033390283584595, "Full-pretrain/Loss (Raw)": 1.8999779224395752, "Full-pretrain/Step": 6144, "Full-pretrain/Step Time": 17.602127887308598} +{"Full-pretrain/Learning Rate": 1.4826413034792574e-05, "Full-pretrain/Loss": 1.9107468128204346, "Full-pretrain/Loss (Raw)": 1.9722007513046265, "Full-pretrain/Step": 6145, "Full-pretrain/Step Time": 17.602723322808743} +{"Full-pretrain/Learning Rate": 1.481865768033984e-05, "Full-pretrain/Loss": 1.9074217081069946, "Full-pretrain/Loss (Raw)": 1.8140225410461426, "Full-pretrain/Step": 6146, "Full-pretrain/Step Time": 17.604321582242846} +{"Full-pretrain/Learning Rate": 1.4810903500301365e-05, "Full-pretrain/Loss": 1.9052743911743164, "Full-pretrain/Loss (Raw)": 1.8208802938461304, "Full-pretrain/Step": 6147, "Full-pretrain/Step Time": 17.608838837593794} +{"Full-pretrain/Learning Rate": 1.4803150495571594e-05, "Full-pretrain/Loss": 1.9194958209991455, "Full-pretrain/Loss (Raw)": 2.0133657455444336, "Full-pretrain/Step": 6148, "Full-pretrain/Step Time": 17.603693103417754} +{"Full-pretrain/Learning Rate": 1.4795398667044824e-05, "Full-pretrain/Loss": 1.9286519289016724, "Full-pretrain/Loss (Raw)": 2.0960540771484375, "Full-pretrain/Step": 6149, "Full-pretrain/Step Time": 17.603127412497997} +{"Full-pretrain/Learning Rate": 1.4787648015615235e-05, "Full-pretrain/Loss": 1.9295599460601807, "Full-pretrain/Loss (Raw)": 1.9619178771972656, "Full-pretrain/Step": 6150, "Full-pretrain/Step Time": 17.603621812537313} +{"Full-pretrain/Learning Rate": 1.4779898542176865e-05, "Full-pretrain/Loss": 1.931439995765686, "Full-pretrain/Loss (Raw)": 1.9536080360412598, "Full-pretrain/Step": 6151, "Full-pretrain/Step Time": 17.602323899045587} +{"Full-pretrain/Learning Rate": 1.4772150247623598e-05, "Full-pretrain/Loss": 1.9394457340240479, "Full-pretrain/Loss (Raw)": 2.1192245483398438, "Full-pretrain/Step": 6152, "Full-pretrain/Step Time": 17.593069046735764} +{"Full-pretrain/Learning Rate": 1.4764403132849205e-05, "Full-pretrain/Loss": 1.9375555515289307, "Full-pretrain/Loss (Raw)": 1.8800625801086426, "Full-pretrain/Step": 6153, "Full-pretrain/Step Time": 17.59014981985092} +{"Full-pretrain/Learning Rate": 1.4756657198747314e-05, "Full-pretrain/Loss": 1.9471944570541382, "Full-pretrain/Loss (Raw)": 2.189629077911377, "Full-pretrain/Step": 6154, "Full-pretrain/Step Time": 17.59589272737503} +{"Full-pretrain/Learning Rate": 1.4748912446211422e-05, "Full-pretrain/Loss": 1.9438741207122803, "Full-pretrain/Loss (Raw)": 1.8664937019348145, "Full-pretrain/Step": 6155, "Full-pretrain/Step Time": 17.601382076740265} +{"Full-pretrain/Learning Rate": 1.4741168876134876e-05, "Full-pretrain/Loss": 1.9444612264633179, "Full-pretrain/Loss (Raw)": 1.9138025045394897, "Full-pretrain/Step": 6156, "Full-pretrain/Step Time": 17.591244829818606} +{"Full-pretrain/Learning Rate": 1.4733426489410895e-05, "Full-pretrain/Loss": 1.9373948574066162, "Full-pretrain/Loss (Raw)": 1.8310872316360474, "Full-pretrain/Step": 6157, "Full-pretrain/Step Time": 17.590218391269445} +{"Full-pretrain/Learning Rate": 1.4725685286932556e-05, "Full-pretrain/Loss": 1.9564979076385498, "Full-pretrain/Loss (Raw)": 2.0272934436798096, "Full-pretrain/Step": 6158, "Full-pretrain/Step Time": 17.59515792503953} +{"Full-pretrain/Learning Rate": 1.4717945269592803e-05, "Full-pretrain/Loss": 1.9430025815963745, "Full-pretrain/Loss (Raw)": 1.624843955039978, "Full-pretrain/Step": 6159, "Full-pretrain/Step Time": 17.59502629749477} +{"Full-pretrain/Learning Rate": 1.4710206438284457e-05, "Full-pretrain/Loss": 1.9306409358978271, "Full-pretrain/Loss (Raw)": 1.8123207092285156, "Full-pretrain/Step": 6160, "Full-pretrain/Step Time": 17.59189422428608} +{"Full-pretrain/Learning Rate": 1.4702468793900188e-05, "Full-pretrain/Loss": 1.9325759410858154, "Full-pretrain/Loss (Raw)": 2.0151548385620117, "Full-pretrain/Step": 6161, "Full-pretrain/Step Time": 17.58675454929471} +{"Full-pretrain/Learning Rate": 1.4694732337332517e-05, "Full-pretrain/Loss": 1.9304323196411133, "Full-pretrain/Loss (Raw)": 1.7174378633499146, "Full-pretrain/Step": 6162, "Full-pretrain/Step Time": 17.58810351975262} +{"Full-pretrain/Learning Rate": 1.468699706947385e-05, "Full-pretrain/Loss": 1.9205856323242188, "Full-pretrain/Loss (Raw)": 1.9211888313293457, "Full-pretrain/Step": 6163, "Full-pretrain/Step Time": 17.595137543976307} +{"Full-pretrain/Learning Rate": 1.467926299121645e-05, "Full-pretrain/Loss": 1.927297592163086, "Full-pretrain/Loss (Raw)": 2.1900875568389893, "Full-pretrain/Step": 6164, "Full-pretrain/Step Time": 17.593577736988664} +{"Full-pretrain/Learning Rate": 1.467153010345243e-05, "Full-pretrain/Loss": 1.9309526681900024, "Full-pretrain/Loss (Raw)": 1.8975895643234253, "Full-pretrain/Step": 6165, "Full-pretrain/Step Time": 17.590072374790907} +{"Full-pretrain/Learning Rate": 1.4663798407073799e-05, "Full-pretrain/Loss": 1.9340951442718506, "Full-pretrain/Loss (Raw)": 1.9434984922409058, "Full-pretrain/Step": 6166, "Full-pretrain/Step Time": 17.59340165928006} +{"Full-pretrain/Learning Rate": 1.4656067902972375e-05, "Full-pretrain/Loss": 1.9338675737380981, "Full-pretrain/Loss (Raw)": 1.8434512615203857, "Full-pretrain/Step": 6167, "Full-pretrain/Step Time": 17.597586788237095} +{"Full-pretrain/Learning Rate": 1.4648338592039884e-05, "Full-pretrain/Loss": 1.944749355316162, "Full-pretrain/Loss (Raw)": 2.145042896270752, "Full-pretrain/Step": 6168, "Full-pretrain/Step Time": 17.590807231143117} +{"Full-pretrain/Learning Rate": 1.4640610475167898e-05, "Full-pretrain/Loss": 1.9492547512054443, "Full-pretrain/Loss (Raw)": 2.056392192840576, "Full-pretrain/Step": 6169, "Full-pretrain/Step Time": 17.587645495310426} +{"Full-pretrain/Learning Rate": 1.4632883553247854e-05, "Full-pretrain/Loss": 1.960679531097412, "Full-pretrain/Loss (Raw)": 2.331094264984131, "Full-pretrain/Step": 6170, "Full-pretrain/Step Time": 17.590513423085213} +{"Full-pretrain/Learning Rate": 1.4625157827171054e-05, "Full-pretrain/Loss": 1.9539653062820435, "Full-pretrain/Loss (Raw)": 1.9154231548309326, "Full-pretrain/Step": 6171, "Full-pretrain/Step Time": 17.59395873360336} +{"Full-pretrain/Learning Rate": 1.461743329782865e-05, "Full-pretrain/Loss": 1.9662312269210815, "Full-pretrain/Loss (Raw)": 2.2675981521606445, "Full-pretrain/Step": 6172, "Full-pretrain/Step Time": 17.590978667140007} +{"Full-pretrain/Learning Rate": 1.4609709966111668e-05, "Full-pretrain/Loss": 1.9653968811035156, "Full-pretrain/Loss (Raw)": 2.0152080059051514, "Full-pretrain/Step": 6173, "Full-pretrain/Step Time": 17.59312940388918} +{"Full-pretrain/Learning Rate": 1.4601987832910988e-05, "Full-pretrain/Loss": 1.9662197828292847, "Full-pretrain/Loss (Raw)": 1.995090126991272, "Full-pretrain/Step": 6174, "Full-pretrain/Step Time": 17.59115049429238} +{"Full-pretrain/Learning Rate": 1.4594266899117348e-05, "Full-pretrain/Loss": 1.9682343006134033, "Full-pretrain/Loss (Raw)": 1.9324560165405273, "Full-pretrain/Step": 6175, "Full-pretrain/Step Time": 17.600226897746325} +{"Full-pretrain/Learning Rate": 1.4586547165621384e-05, "Full-pretrain/Loss": 1.9730920791625977, "Full-pretrain/Loss (Raw)": 2.055429458618164, "Full-pretrain/Step": 6176, "Full-pretrain/Step Time": 17.600716926157475} +{"Full-pretrain/Learning Rate": 1.457882863331353e-05, "Full-pretrain/Loss": 1.968923807144165, "Full-pretrain/Loss (Raw)": 1.8388135433197021, "Full-pretrain/Step": 6177, "Full-pretrain/Step Time": 17.5993695538491} +{"Full-pretrain/Learning Rate": 1.4571111303084145e-05, "Full-pretrain/Loss": 1.9758033752441406, "Full-pretrain/Loss (Raw)": 2.0341711044311523, "Full-pretrain/Step": 6178, "Full-pretrain/Step Time": 17.597479673102498} +{"Full-pretrain/Learning Rate": 1.4563395175823394e-05, "Full-pretrain/Loss": 1.9702516794204712, "Full-pretrain/Loss (Raw)": 1.643223524093628, "Full-pretrain/Step": 6179, "Full-pretrain/Step Time": 17.604797918349504} +{"Full-pretrain/Learning Rate": 1.4555680252421341e-05, "Full-pretrain/Loss": 1.9783971309661865, "Full-pretrain/Loss (Raw)": 2.2740237712860107, "Full-pretrain/Step": 6180, "Full-pretrain/Step Time": 17.604840844869614} +{"Full-pretrain/Learning Rate": 1.4547966533767904e-05, "Full-pretrain/Loss": 1.9737910032272339, "Full-pretrain/Loss (Raw)": 1.9486548900604248, "Full-pretrain/Step": 6181, "Full-pretrain/Step Time": 17.60232687741518} +{"Full-pretrain/Learning Rate": 1.4540254020752859e-05, "Full-pretrain/Loss": 1.9754018783569336, "Full-pretrain/Loss (Raw)": 2.0134687423706055, "Full-pretrain/Step": 6182, "Full-pretrain/Step Time": 17.6045285705477} +{"Full-pretrain/Learning Rate": 1.4532542714265829e-05, "Full-pretrain/Loss": 1.9640823602676392, "Full-pretrain/Loss (Raw)": 1.5913804769515991, "Full-pretrain/Step": 6183, "Full-pretrain/Step Time": 17.60789103806019} +{"Full-pretrain/Learning Rate": 1.452483261519632e-05, "Full-pretrain/Loss": 1.969797134399414, "Full-pretrain/Loss (Raw)": 2.302095413208008, "Full-pretrain/Step": 6184, "Full-pretrain/Step Time": 17.610321750864387} +{"Full-pretrain/Learning Rate": 1.4517123724433686e-05, "Full-pretrain/Loss": 1.9713895320892334, "Full-pretrain/Loss (Raw)": 1.9310216903686523, "Full-pretrain/Step": 6185, "Full-pretrain/Step Time": 17.61302845366299} +{"Full-pretrain/Learning Rate": 1.4509416042867149e-05, "Full-pretrain/Loss": 1.9675734043121338, "Full-pretrain/Loss (Raw)": 2.0675134658813477, "Full-pretrain/Step": 6186, "Full-pretrain/Step Time": 17.60620131716132} +{"Full-pretrain/Learning Rate": 1.450170957138579e-05, "Full-pretrain/Loss": 1.9650049209594727, "Full-pretrain/Loss (Raw)": 1.7843036651611328, "Full-pretrain/Step": 6187, "Full-pretrain/Step Time": 17.606322336941957} +{"Full-pretrain/Learning Rate": 1.449400431087854e-05, "Full-pretrain/Loss": 1.9710190296173096, "Full-pretrain/Loss (Raw)": 2.106245517730713, "Full-pretrain/Step": 6188, "Full-pretrain/Step Time": 17.607687011361122} +{"Full-pretrain/Learning Rate": 1.4486300262234193e-05, "Full-pretrain/Loss": 1.9628410339355469, "Full-pretrain/Loss (Raw)": 1.5693957805633545, "Full-pretrain/Step": 6189, "Full-pretrain/Step Time": 17.61244235932827} +{"Full-pretrain/Learning Rate": 1.4478597426341422e-05, "Full-pretrain/Loss": 1.9606783390045166, "Full-pretrain/Loss (Raw)": 1.958089828491211, "Full-pretrain/Step": 6190, "Full-pretrain/Step Time": 17.608172656968236} +{"Full-pretrain/Learning Rate": 1.4470895804088736e-05, "Full-pretrain/Loss": 1.9744793176651, "Full-pretrain/Loss (Raw)": 2.066473960876465, "Full-pretrain/Step": 6191, "Full-pretrain/Step Time": 17.609833544120193} +{"Full-pretrain/Learning Rate": 1.4463195396364531e-05, "Full-pretrain/Loss": 1.978770136833191, "Full-pretrain/Loss (Raw)": 1.9496235847473145, "Full-pretrain/Step": 6192, "Full-pretrain/Step Time": 17.61427284218371} +{"Full-pretrain/Learning Rate": 1.4455496204057023e-05, "Full-pretrain/Loss": 1.9751183986663818, "Full-pretrain/Loss (Raw)": 1.898300051689148, "Full-pretrain/Step": 6193, "Full-pretrain/Step Time": 17.608257511630654} +{"Full-pretrain/Learning Rate": 1.4447798228054333e-05, "Full-pretrain/Loss": 1.9780470132827759, "Full-pretrain/Loss (Raw)": 1.8111554384231567, "Full-pretrain/Step": 6194, "Full-pretrain/Step Time": 17.604637095704675} +{"Full-pretrain/Learning Rate": 1.44401014692444e-05, "Full-pretrain/Loss": 1.9795045852661133, "Full-pretrain/Loss (Raw)": 1.967832088470459, "Full-pretrain/Step": 6195, "Full-pretrain/Step Time": 17.604415085166693} +{"Full-pretrain/Learning Rate": 1.443240592851505e-05, "Full-pretrain/Loss": 1.974069595336914, "Full-pretrain/Loss (Raw)": 2.016169548034668, "Full-pretrain/Step": 6196, "Full-pretrain/Step Time": 17.60642471909523} +{"Full-pretrain/Learning Rate": 1.4424711606753964e-05, "Full-pretrain/Loss": 1.9772520065307617, "Full-pretrain/Loss (Raw)": 1.999422311782837, "Full-pretrain/Step": 6197, "Full-pretrain/Step Time": 17.60750220529735} +{"Full-pretrain/Learning Rate": 1.4417018504848684e-05, "Full-pretrain/Loss": 1.9716160297393799, "Full-pretrain/Loss (Raw)": 1.7631464004516602, "Full-pretrain/Step": 6198, "Full-pretrain/Step Time": 17.60874442011118} +{"Full-pretrain/Learning Rate": 1.4409326623686592e-05, "Full-pretrain/Loss": 1.9607043266296387, "Full-pretrain/Loss (Raw)": 1.4942805767059326, "Full-pretrain/Step": 6199, "Full-pretrain/Step Time": 17.60981041006744} +{"Full-pretrain/Learning Rate": 1.4401635964154956e-05, "Full-pretrain/Loss": 1.9546539783477783, "Full-pretrain/Loss (Raw)": 1.9514317512512207, "Full-pretrain/Step": 6200, "Full-pretrain/Step Time": 17.60590910539031} +{"Full-pretrain/Learning Rate": 1.4393946527140884e-05, "Full-pretrain/Loss": 1.953344464302063, "Full-pretrain/Loss (Raw)": 2.014486789703369, "Full-pretrain/Step": 6201, "Full-pretrain/Step Time": 17.60751073807478} +{"Full-pretrain/Learning Rate": 1.4386258313531353e-05, "Full-pretrain/Loss": 1.9432239532470703, "Full-pretrain/Loss (Raw)": 2.0072364807128906, "Full-pretrain/Step": 6202, "Full-pretrain/Step Time": 17.60620452836156} +{"Full-pretrain/Learning Rate": 1.4378571324213203e-05, "Full-pretrain/Loss": 1.946714162826538, "Full-pretrain/Loss (Raw)": 2.0271103382110596, "Full-pretrain/Step": 6203, "Full-pretrain/Step Time": 17.606028974056244} +{"Full-pretrain/Learning Rate": 1.437088556007311e-05, "Full-pretrain/Loss": 1.9358137845993042, "Full-pretrain/Loss (Raw)": 1.9187856912612915, "Full-pretrain/Step": 6204, "Full-pretrain/Step Time": 17.60873490013182} +{"Full-pretrain/Learning Rate": 1.4363201021997635e-05, "Full-pretrain/Loss": 1.9379615783691406, "Full-pretrain/Loss (Raw)": 2.0839383602142334, "Full-pretrain/Step": 6205, "Full-pretrain/Step Time": 17.59883134998381} +{"Full-pretrain/Learning Rate": 1.4355517710873184e-05, "Full-pretrain/Loss": 1.9314887523651123, "Full-pretrain/Loss (Raw)": 1.7879595756530762, "Full-pretrain/Step": 6206, "Full-pretrain/Step Time": 17.599528469145298} +{"Full-pretrain/Learning Rate": 1.434783562758602e-05, "Full-pretrain/Loss": 1.934046745300293, "Full-pretrain/Loss (Raw)": 2.0143134593963623, "Full-pretrain/Step": 6207, "Full-pretrain/Step Time": 17.593938041478395} +{"Full-pretrain/Learning Rate": 1.4340154773022286e-05, "Full-pretrain/Loss": 1.9331287145614624, "Full-pretrain/Loss (Raw)": 2.026050090789795, "Full-pretrain/Step": 6208, "Full-pretrain/Step Time": 17.597970673814416} +{"Full-pretrain/Learning Rate": 1.4332475148067943e-05, "Full-pretrain/Loss": 1.939436912536621, "Full-pretrain/Loss (Raw)": 2.040677070617676, "Full-pretrain/Step": 6209, "Full-pretrain/Step Time": 17.593063954263926} +{"Full-pretrain/Learning Rate": 1.4324796753608841e-05, "Full-pretrain/Loss": 1.9403839111328125, "Full-pretrain/Loss (Raw)": 2.0644750595092773, "Full-pretrain/Step": 6210, "Full-pretrain/Step Time": 17.59047989733517} +{"Full-pretrain/Learning Rate": 1.4317119590530692e-05, "Full-pretrain/Loss": 1.9394625425338745, "Full-pretrain/Loss (Raw)": 1.6137425899505615, "Full-pretrain/Step": 6211, "Full-pretrain/Step Time": 17.59433178603649} +{"Full-pretrain/Learning Rate": 1.4309443659719036e-05, "Full-pretrain/Loss": 1.9258153438568115, "Full-pretrain/Loss (Raw)": 1.837311863899231, "Full-pretrain/Step": 6212, "Full-pretrain/Step Time": 17.589786337688565} +{"Full-pretrain/Learning Rate": 1.4301768962059295e-05, "Full-pretrain/Loss": 1.9268665313720703, "Full-pretrain/Loss (Raw)": 1.9822912216186523, "Full-pretrain/Step": 6213, "Full-pretrain/Step Time": 17.585615400224924} +{"Full-pretrain/Learning Rate": 1.4294095498436755e-05, "Full-pretrain/Loss": 1.9220085144042969, "Full-pretrain/Loss (Raw)": 1.8580114841461182, "Full-pretrain/Step": 6214, "Full-pretrain/Step Time": 17.594055362045765} +{"Full-pretrain/Learning Rate": 1.4286423269736526e-05, "Full-pretrain/Loss": 1.9330205917358398, "Full-pretrain/Loss (Raw)": 1.9437662363052368, "Full-pretrain/Step": 6215, "Full-pretrain/Step Time": 17.592183589935303} +{"Full-pretrain/Learning Rate": 1.427875227684361e-05, "Full-pretrain/Loss": 1.933730125427246, "Full-pretrain/Loss (Raw)": 2.3248026371002197, "Full-pretrain/Step": 6216, "Full-pretrain/Step Time": 17.591258879750967} +{"Full-pretrain/Learning Rate": 1.4271082520642854e-05, "Full-pretrain/Loss": 1.9260141849517822, "Full-pretrain/Loss (Raw)": 1.684112787246704, "Full-pretrain/Step": 6217, "Full-pretrain/Step Time": 17.59072300978005} +{"Full-pretrain/Learning Rate": 1.4263414002018955e-05, "Full-pretrain/Loss": 1.9184424877166748, "Full-pretrain/Loss (Raw)": 1.8252201080322266, "Full-pretrain/Step": 6218, "Full-pretrain/Step Time": 17.591811411082745} +{"Full-pretrain/Learning Rate": 1.4255746721856486e-05, "Full-pretrain/Loss": 1.927734375, "Full-pretrain/Loss (Raw)": 2.081641674041748, "Full-pretrain/Step": 6219, "Full-pretrain/Step Time": 17.59165060892701} +{"Full-pretrain/Learning Rate": 1.424808068103985e-05, "Full-pretrain/Loss": 1.9156630039215088, "Full-pretrain/Loss (Raw)": 1.7199630737304688, "Full-pretrain/Step": 6220, "Full-pretrain/Step Time": 17.58316238038242} +{"Full-pretrain/Learning Rate": 1.4240415880453326e-05, "Full-pretrain/Loss": 1.9289824962615967, "Full-pretrain/Loss (Raw)": 1.9956198930740356, "Full-pretrain/Step": 6221, "Full-pretrain/Step Time": 17.582293428480625} +{"Full-pretrain/Learning Rate": 1.4232752320981052e-05, "Full-pretrain/Loss": 1.9347742795944214, "Full-pretrain/Loss (Raw)": 2.143423557281494, "Full-pretrain/Step": 6222, "Full-pretrain/Step Time": 17.584770752117038} +{"Full-pretrain/Learning Rate": 1.4225090003507013e-05, "Full-pretrain/Loss": 1.9231605529785156, "Full-pretrain/Loss (Raw)": 1.6948357820510864, "Full-pretrain/Step": 6223, "Full-pretrain/Step Time": 17.58166717737913} +{"Full-pretrain/Learning Rate": 1.4217428928915064e-05, "Full-pretrain/Loss": 1.9194376468658447, "Full-pretrain/Loss (Raw)": 1.8304896354675293, "Full-pretrain/Step": 6224, "Full-pretrain/Step Time": 17.58263242803514} +{"Full-pretrain/Learning Rate": 1.4209769098088888e-05, "Full-pretrain/Loss": 1.919638991355896, "Full-pretrain/Loss (Raw)": 1.9047441482543945, "Full-pretrain/Step": 6225, "Full-pretrain/Step Time": 17.585690427571535} +{"Full-pretrain/Learning Rate": 1.420211051191206e-05, "Full-pretrain/Loss": 1.9267991781234741, "Full-pretrain/Loss (Raw)": 2.040278673171997, "Full-pretrain/Step": 6226, "Full-pretrain/Step Time": 17.589029651135206} +{"Full-pretrain/Learning Rate": 1.4194453171267996e-05, "Full-pretrain/Loss": 1.927833914756775, "Full-pretrain/Loss (Raw)": 2.0009477138519287, "Full-pretrain/Step": 6227, "Full-pretrain/Step Time": 17.583410749211907} +{"Full-pretrain/Learning Rate": 1.4186797077039948e-05, "Full-pretrain/Loss": 1.9150292873382568, "Full-pretrain/Loss (Raw)": 1.606418490409851, "Full-pretrain/Step": 6228, "Full-pretrain/Step Time": 17.57910164631903} +{"Full-pretrain/Learning Rate": 1.4179142230111065e-05, "Full-pretrain/Loss": 1.9168404340744019, "Full-pretrain/Loss (Raw)": 2.0573806762695312, "Full-pretrain/Step": 6229, "Full-pretrain/Step Time": 17.583579804748297} +{"Full-pretrain/Learning Rate": 1.4171488631364327e-05, "Full-pretrain/Loss": 1.922485589981079, "Full-pretrain/Loss (Raw)": 1.9437909126281738, "Full-pretrain/Step": 6230, "Full-pretrain/Step Time": 17.583707440644503} +{"Full-pretrain/Learning Rate": 1.4163836281682563e-05, "Full-pretrain/Loss": 1.9353461265563965, "Full-pretrain/Loss (Raw)": 1.9058163166046143, "Full-pretrain/Step": 6231, "Full-pretrain/Step Time": 17.580136585980654} +{"Full-pretrain/Learning Rate": 1.4156185181948473e-05, "Full-pretrain/Loss": 1.9331722259521484, "Full-pretrain/Loss (Raw)": 1.8818652629852295, "Full-pretrain/Step": 6232, "Full-pretrain/Step Time": 17.577965781092644} +{"Full-pretrain/Learning Rate": 1.4148535333044613e-05, "Full-pretrain/Loss": 1.9351623058319092, "Full-pretrain/Loss (Raw)": 2.0781731605529785, "Full-pretrain/Step": 6233, "Full-pretrain/Step Time": 17.58301050402224} +{"Full-pretrain/Learning Rate": 1.4140886735853387e-05, "Full-pretrain/Loss": 1.9269298315048218, "Full-pretrain/Loss (Raw)": 1.7437989711761475, "Full-pretrain/Step": 6234, "Full-pretrain/Step Time": 17.584924563765526} +{"Full-pretrain/Learning Rate": 1.4133239391257075e-05, "Full-pretrain/Loss": 1.919703722000122, "Full-pretrain/Loss (Raw)": 1.7958738803863525, "Full-pretrain/Step": 6235, "Full-pretrain/Step Time": 17.579124813899398} +{"Full-pretrain/Learning Rate": 1.4125593300137766e-05, "Full-pretrain/Loss": 1.9197607040405273, "Full-pretrain/Loss (Raw)": 1.9206058979034424, "Full-pretrain/Step": 6236, "Full-pretrain/Step Time": 17.57533073052764} +{"Full-pretrain/Learning Rate": 1.411794846337745e-05, "Full-pretrain/Loss": 1.9112727642059326, "Full-pretrain/Loss (Raw)": 1.812326192855835, "Full-pretrain/Step": 6237, "Full-pretrain/Step Time": 17.579066783189774} +{"Full-pretrain/Learning Rate": 1.4110304881857955e-05, "Full-pretrain/Loss": 1.909475564956665, "Full-pretrain/Loss (Raw)": 1.7304513454437256, "Full-pretrain/Step": 6238, "Full-pretrain/Step Time": 17.577624971047044} +{"Full-pretrain/Learning Rate": 1.410266255646096e-05, "Full-pretrain/Loss": 1.8975167274475098, "Full-pretrain/Loss (Raw)": 1.631626844406128, "Full-pretrain/Step": 6239, "Full-pretrain/Step Time": 17.57672936283052} +{"Full-pretrain/Learning Rate": 1.4095021488068028e-05, "Full-pretrain/Loss": 1.8871245384216309, "Full-pretrain/Loss (Raw)": 1.6935032606124878, "Full-pretrain/Step": 6240, "Full-pretrain/Step Time": 17.5734344702214} +{"Full-pretrain/Learning Rate": 1.4087381677560518e-05, "Full-pretrain/Loss": 1.8871665000915527, "Full-pretrain/Loss (Raw)": 2.0420191287994385, "Full-pretrain/Step": 6241, "Full-pretrain/Step Time": 17.56823368743062} +{"Full-pretrain/Learning Rate": 1.40797431258197e-05, "Full-pretrain/Loss": 1.8699215650558472, "Full-pretrain/Loss (Raw)": 1.512637972831726, "Full-pretrain/Step": 6242, "Full-pretrain/Step Time": 17.577471435070038} +{"Full-pretrain/Learning Rate": 1.4072105833726684e-05, "Full-pretrain/Loss": 1.8828059434890747, "Full-pretrain/Loss (Raw)": 2.026041269302368, "Full-pretrain/Step": 6243, "Full-pretrain/Step Time": 17.57702055759728} +{"Full-pretrain/Learning Rate": 1.4064469802162411e-05, "Full-pretrain/Loss": 1.884981632232666, "Full-pretrain/Loss (Raw)": 1.9069358110427856, "Full-pretrain/Step": 6244, "Full-pretrain/Step Time": 17.576103935018182} +{"Full-pretrain/Learning Rate": 1.405683503200771e-05, "Full-pretrain/Loss": 1.8818098306655884, "Full-pretrain/Loss (Raw)": 1.8807919025421143, "Full-pretrain/Step": 6245, "Full-pretrain/Step Time": 17.576312171295285} +{"Full-pretrain/Learning Rate": 1.4049201524143236e-05, "Full-pretrain/Loss": 1.893119215965271, "Full-pretrain/Loss (Raw)": 2.2199130058288574, "Full-pretrain/Step": 6246, "Full-pretrain/Step Time": 17.579960430040956} +{"Full-pretrain/Learning Rate": 1.4041569279449513e-05, "Full-pretrain/Loss": 1.897782564163208, "Full-pretrain/Loss (Raw)": 2.092991828918457, "Full-pretrain/Step": 6247, "Full-pretrain/Step Time": 17.57873586565256} +{"Full-pretrain/Learning Rate": 1.4033938298806925e-05, "Full-pretrain/Loss": 1.8882042169570923, "Full-pretrain/Loss (Raw)": 2.0182974338531494, "Full-pretrain/Step": 6248, "Full-pretrain/Step Time": 17.578876476734877} +{"Full-pretrain/Learning Rate": 1.4026308583095704e-05, "Full-pretrain/Loss": 1.894127607345581, "Full-pretrain/Loss (Raw)": 1.8736571073532104, "Full-pretrain/Step": 6249, "Full-pretrain/Step Time": 17.57385792210698} +{"Full-pretrain/Learning Rate": 1.4018680133195928e-05, "Full-pretrain/Loss": 1.8876752853393555, "Full-pretrain/Loss (Raw)": 1.618748426437378, "Full-pretrain/Step": 6250, "Full-pretrain/Step Time": 17.571789307519794} +{"Full-pretrain/Learning Rate": 1.401105294998755e-05, "Full-pretrain/Loss": 1.8862779140472412, "Full-pretrain/Loss (Raw)": 2.0369269847869873, "Full-pretrain/Step": 6251, "Full-pretrain/Step Time": 17.582325626164675} +{"Full-pretrain/Learning Rate": 1.4003427034350341e-05, "Full-pretrain/Loss": 1.8858559131622314, "Full-pretrain/Loss (Raw)": 1.7064580917358398, "Full-pretrain/Step": 6252, "Full-pretrain/Step Time": 17.58002525754273} +{"Full-pretrain/Learning Rate": 1.3995802387163964e-05, "Full-pretrain/Loss": 1.8828709125518799, "Full-pretrain/Loss (Raw)": 1.9001009464263916, "Full-pretrain/Step": 6253, "Full-pretrain/Step Time": 17.57924328185618} +{"Full-pretrain/Learning Rate": 1.3988179009307911e-05, "Full-pretrain/Loss": 1.8799917697906494, "Full-pretrain/Loss (Raw)": 2.0512893199920654, "Full-pretrain/Step": 6254, "Full-pretrain/Step Time": 17.57870865985751} +{"Full-pretrain/Learning Rate": 1.398055690166154e-05, "Full-pretrain/Loss": 1.8909218311309814, "Full-pretrain/Loss (Raw)": 2.044600009918213, "Full-pretrain/Step": 6255, "Full-pretrain/Step Time": 17.581100095063448} +{"Full-pretrain/Learning Rate": 1.3972936065104063e-05, "Full-pretrain/Loss": 1.8923771381378174, "Full-pretrain/Loss (Raw)": 1.8770561218261719, "Full-pretrain/Step": 6256, "Full-pretrain/Step Time": 17.58496386744082} +{"Full-pretrain/Learning Rate": 1.3965316500514534e-05, "Full-pretrain/Loss": 1.890746831893921, "Full-pretrain/Loss (Raw)": 1.8525772094726562, "Full-pretrain/Step": 6257, "Full-pretrain/Step Time": 17.582220181822777} +{"Full-pretrain/Learning Rate": 1.3957698208771863e-05, "Full-pretrain/Loss": 1.879135012626648, "Full-pretrain/Loss (Raw)": 1.6686995029449463, "Full-pretrain/Step": 6258, "Full-pretrain/Step Time": 17.577505564317107} +{"Full-pretrain/Learning Rate": 1.3950081190754827e-05, "Full-pretrain/Loss": 1.8710559606552124, "Full-pretrain/Loss (Raw)": 1.7424190044403076, "Full-pretrain/Step": 6259, "Full-pretrain/Step Time": 17.583966355770826} +{"Full-pretrain/Learning Rate": 1.3942465447342052e-05, "Full-pretrain/Loss": 1.8883819580078125, "Full-pretrain/Loss (Raw)": 2.160850763320923, "Full-pretrain/Step": 6260, "Full-pretrain/Step Time": 17.591273495927453} +{"Full-pretrain/Learning Rate": 1.393485097941199e-05, "Full-pretrain/Loss": 1.8886033296585083, "Full-pretrain/Loss (Raw)": 2.0644636154174805, "Full-pretrain/Step": 6261, "Full-pretrain/Step Time": 17.58709384687245} +{"Full-pretrain/Learning Rate": 1.3927237787842987e-05, "Full-pretrain/Loss": 1.9058830738067627, "Full-pretrain/Loss (Raw)": 2.4967432022094727, "Full-pretrain/Step": 6262, "Full-pretrain/Step Time": 17.577867353335023} +{"Full-pretrain/Learning Rate": 1.3919625873513206e-05, "Full-pretrain/Loss": 1.8969584703445435, "Full-pretrain/Loss (Raw)": 1.6202268600463867, "Full-pretrain/Step": 6263, "Full-pretrain/Step Time": 17.588050723075867} +{"Full-pretrain/Learning Rate": 1.3912015237300687e-05, "Full-pretrain/Loss": 1.905439853668213, "Full-pretrain/Loss (Raw)": 2.1532673835754395, "Full-pretrain/Step": 6264, "Full-pretrain/Step Time": 17.591777643188834} +{"Full-pretrain/Learning Rate": 1.3904405880083316e-05, "Full-pretrain/Loss": 1.9050326347351074, "Full-pretrain/Loss (Raw)": 2.0651423931121826, "Full-pretrain/Step": 6265, "Full-pretrain/Step Time": 17.591280456632376} +{"Full-pretrain/Learning Rate": 1.3896797802738832e-05, "Full-pretrain/Loss": 1.910787582397461, "Full-pretrain/Loss (Raw)": 1.9279593229293823, "Full-pretrain/Step": 6266, "Full-pretrain/Step Time": 17.588828461244702} +{"Full-pretrain/Learning Rate": 1.3889191006144814e-05, "Full-pretrain/Loss": 1.9165136814117432, "Full-pretrain/Loss (Raw)": 1.9791076183319092, "Full-pretrain/Step": 6267, "Full-pretrain/Step Time": 17.590449180454016} +{"Full-pretrain/Learning Rate": 1.3881585491178706e-05, "Full-pretrain/Loss": 1.9189130067825317, "Full-pretrain/Loss (Raw)": 1.9973829984664917, "Full-pretrain/Step": 6268, "Full-pretrain/Step Time": 17.59407184459269} +{"Full-pretrain/Learning Rate": 1.3873981258717805e-05, "Full-pretrain/Loss": 1.9165306091308594, "Full-pretrain/Loss (Raw)": 1.7360907793045044, "Full-pretrain/Step": 6269, "Full-pretrain/Step Time": 17.58897952362895} +{"Full-pretrain/Learning Rate": 1.3866378309639258e-05, "Full-pretrain/Loss": 1.9220502376556396, "Full-pretrain/Loss (Raw)": 1.9070788621902466, "Full-pretrain/Step": 6270, "Full-pretrain/Step Time": 17.591239465400577} +{"Full-pretrain/Learning Rate": 1.385877664482006e-05, "Full-pretrain/Loss": 1.9304851293563843, "Full-pretrain/Loss (Raw)": 1.9015451669692993, "Full-pretrain/Step": 6271, "Full-pretrain/Step Time": 17.58740304596722} +{"Full-pretrain/Learning Rate": 1.3851176265137067e-05, "Full-pretrain/Loss": 1.9322422742843628, "Full-pretrain/Loss (Raw)": 1.7497326135635376, "Full-pretrain/Step": 6272, "Full-pretrain/Step Time": 17.591544959694147} +{"Full-pretrain/Learning Rate": 1.3843577171466968e-05, "Full-pretrain/Loss": 1.9229817390441895, "Full-pretrain/Loss (Raw)": 1.7456817626953125, "Full-pretrain/Step": 6273, "Full-pretrain/Step Time": 17.589993527159095} +{"Full-pretrain/Learning Rate": 1.3835979364686319e-05, "Full-pretrain/Loss": 1.9253989458084106, "Full-pretrain/Loss (Raw)": 1.589986801147461, "Full-pretrain/Step": 6274, "Full-pretrain/Step Time": 17.595586471259594} +{"Full-pretrain/Learning Rate": 1.3828382845671529e-05, "Full-pretrain/Loss": 1.9193861484527588, "Full-pretrain/Loss (Raw)": 1.8336331844329834, "Full-pretrain/Step": 6275, "Full-pretrain/Step Time": 17.59305713698268} +{"Full-pretrain/Learning Rate": 1.382078761529886e-05, "Full-pretrain/Loss": 1.9213619232177734, "Full-pretrain/Loss (Raw)": 1.9701611995697021, "Full-pretrain/Step": 6276, "Full-pretrain/Step Time": 17.592467745766044} +{"Full-pretrain/Learning Rate": 1.3813193674444402e-05, "Full-pretrain/Loss": 1.9250493049621582, "Full-pretrain/Loss (Raw)": 1.9987890720367432, "Full-pretrain/Step": 6277, "Full-pretrain/Step Time": 17.591741597279906} +{"Full-pretrain/Learning Rate": 1.3805601023984132e-05, "Full-pretrain/Loss": 1.913274884223938, "Full-pretrain/Loss (Raw)": 1.8431313037872314, "Full-pretrain/Step": 6278, "Full-pretrain/Step Time": 17.591593377292156} +{"Full-pretrain/Learning Rate": 1.379800966479384e-05, "Full-pretrain/Loss": 1.9135444164276123, "Full-pretrain/Loss (Raw)": 2.1016180515289307, "Full-pretrain/Step": 6279, "Full-pretrain/Step Time": 17.599035946652293} +{"Full-pretrain/Learning Rate": 1.3790419597749199e-05, "Full-pretrain/Loss": 1.9132089614868164, "Full-pretrain/Loss (Raw)": 2.0075595378875732, "Full-pretrain/Step": 6280, "Full-pretrain/Step Time": 17.597991786897182} +{"Full-pretrain/Learning Rate": 1.3782830823725713e-05, "Full-pretrain/Loss": 1.920506238937378, "Full-pretrain/Loss (Raw)": 2.107170581817627, "Full-pretrain/Step": 6281, "Full-pretrain/Step Time": 17.598220393061638} +{"Full-pretrain/Learning Rate": 1.3775243343598762e-05, "Full-pretrain/Loss": 1.9278825521469116, "Full-pretrain/Loss (Raw)": 1.8547911643981934, "Full-pretrain/Step": 6282, "Full-pretrain/Step Time": 17.592859281226993} +{"Full-pretrain/Learning Rate": 1.3767657158243535e-05, "Full-pretrain/Loss": 1.9357075691223145, "Full-pretrain/Loss (Raw)": 2.2873291969299316, "Full-pretrain/Step": 6283, "Full-pretrain/Step Time": 17.592211235314608} +{"Full-pretrain/Learning Rate": 1.3760072268535112e-05, "Full-pretrain/Loss": 1.9462838172912598, "Full-pretrain/Loss (Raw)": 2.04489803314209, "Full-pretrain/Step": 6284, "Full-pretrain/Step Time": 17.594710050150752} +{"Full-pretrain/Learning Rate": 1.3752488675348401e-05, "Full-pretrain/Loss": 1.9450197219848633, "Full-pretrain/Loss (Raw)": 1.859649419784546, "Full-pretrain/Step": 6285, "Full-pretrain/Step Time": 17.59094461426139} +{"Full-pretrain/Learning Rate": 1.3744906379558165e-05, "Full-pretrain/Loss": 1.9465876817703247, "Full-pretrain/Loss (Raw)": 2.1014623641967773, "Full-pretrain/Step": 6286, "Full-pretrain/Step Time": 17.588174169883132} +{"Full-pretrain/Learning Rate": 1.3737325382039037e-05, "Full-pretrain/Loss": 1.9442880153656006, "Full-pretrain/Loss (Raw)": 1.971011996269226, "Full-pretrain/Step": 6287, "Full-pretrain/Step Time": 17.587796485051513} +{"Full-pretrain/Learning Rate": 1.3729745683665457e-05, "Full-pretrain/Loss": 1.9520410299301147, "Full-pretrain/Loss (Raw)": 2.125152826309204, "Full-pretrain/Step": 6288, "Full-pretrain/Step Time": 17.591475987806916} +{"Full-pretrain/Learning Rate": 1.3722167285311749e-05, "Full-pretrain/Loss": 1.9552106857299805, "Full-pretrain/Loss (Raw)": 1.9540033340454102, "Full-pretrain/Step": 6289, "Full-pretrain/Step Time": 17.592695156112313} +{"Full-pretrain/Learning Rate": 1.3714590187852086e-05, "Full-pretrain/Loss": 1.9477297067642212, "Full-pretrain/Loss (Raw)": 1.4293091297149658, "Full-pretrain/Step": 6290, "Full-pretrain/Step Time": 17.5924336258322} +{"Full-pretrain/Learning Rate": 1.3707014392160477e-05, "Full-pretrain/Loss": 1.9572724103927612, "Full-pretrain/Loss (Raw)": 2.047783851623535, "Full-pretrain/Step": 6291, "Full-pretrain/Step Time": 17.59048659540713} +{"Full-pretrain/Learning Rate": 1.36994398991108e-05, "Full-pretrain/Loss": 1.950207233428955, "Full-pretrain/Loss (Raw)": 1.9347667694091797, "Full-pretrain/Step": 6292, "Full-pretrain/Step Time": 17.592244630679488} +{"Full-pretrain/Learning Rate": 1.3691866709576744e-05, "Full-pretrain/Loss": 1.9499528408050537, "Full-pretrain/Loss (Raw)": 2.056321620941162, "Full-pretrain/Step": 6293, "Full-pretrain/Step Time": 17.592924742028117} +{"Full-pretrain/Learning Rate": 1.3684294824431895e-05, "Full-pretrain/Loss": 1.931107997894287, "Full-pretrain/Loss (Raw)": 1.893707036972046, "Full-pretrain/Step": 6294, "Full-pretrain/Step Time": 17.587641160935163} +{"Full-pretrain/Learning Rate": 1.3676724244549672e-05, "Full-pretrain/Loss": 1.9415616989135742, "Full-pretrain/Loss (Raw)": 1.954745888710022, "Full-pretrain/Step": 6295, "Full-pretrain/Step Time": 17.585092309862375} +{"Full-pretrain/Learning Rate": 1.3669154970803313e-05, "Full-pretrain/Loss": 1.9279389381408691, "Full-pretrain/Loss (Raw)": 1.7173421382904053, "Full-pretrain/Step": 6296, "Full-pretrain/Step Time": 17.59439936093986} +{"Full-pretrain/Learning Rate": 1.366158700406595e-05, "Full-pretrain/Loss": 1.9263942241668701, "Full-pretrain/Loss (Raw)": 2.015709638595581, "Full-pretrain/Step": 6297, "Full-pretrain/Step Time": 17.59334286674857} +{"Full-pretrain/Learning Rate": 1.365402034521055e-05, "Full-pretrain/Loss": 1.920870065689087, "Full-pretrain/Loss (Raw)": 1.7511918544769287, "Full-pretrain/Step": 6298, "Full-pretrain/Step Time": 17.593778109177947} +{"Full-pretrain/Learning Rate": 1.3646454995109905e-05, "Full-pretrain/Loss": 1.9229129552841187, "Full-pretrain/Loss (Raw)": 2.044475555419922, "Full-pretrain/Step": 6299, "Full-pretrain/Step Time": 17.590239822864532} +{"Full-pretrain/Learning Rate": 1.3638890954636691e-05, "Full-pretrain/Loss": 1.9151796102523804, "Full-pretrain/Loss (Raw)": 1.7499167919158936, "Full-pretrain/Step": 6300, "Full-pretrain/Step Time": 17.59280570037663} +{"Full-pretrain/Learning Rate": 1.3631328224663408e-05, "Full-pretrain/Loss": 1.9248096942901611, "Full-pretrain/Loss (Raw)": 2.044255256652832, "Full-pretrain/Step": 6301, "Full-pretrain/Step Time": 17.593590127304196} +{"Full-pretrain/Learning Rate": 1.3623766806062421e-05, "Full-pretrain/Loss": 1.9294402599334717, "Full-pretrain/Loss (Raw)": 2.055257797241211, "Full-pretrain/Step": 6302, "Full-pretrain/Step Time": 17.591287422925234} +{"Full-pretrain/Learning Rate": 1.3616206699705944e-05, "Full-pretrain/Loss": 1.9331235885620117, "Full-pretrain/Loss (Raw)": 2.019411087036133, "Full-pretrain/Step": 6303, "Full-pretrain/Step Time": 17.58742938376963} +{"Full-pretrain/Learning Rate": 1.3608647906466016e-05, "Full-pretrain/Loss": 1.9287261962890625, "Full-pretrain/Loss (Raw)": 1.6090142726898193, "Full-pretrain/Step": 6304, "Full-pretrain/Step Time": 17.590665632858872} +{"Full-pretrain/Learning Rate": 1.3601090427214547e-05, "Full-pretrain/Loss": 1.9551780223846436, "Full-pretrain/Loss (Raw)": 2.5921406745910645, "Full-pretrain/Step": 6305, "Full-pretrain/Step Time": 17.5930004902184} +{"Full-pretrain/Learning Rate": 1.3593534262823288e-05, "Full-pretrain/Loss": 1.9598164558410645, "Full-pretrain/Loss (Raw)": 1.7384169101715088, "Full-pretrain/Step": 6306, "Full-pretrain/Step Time": 17.58987151272595} +{"Full-pretrain/Learning Rate": 1.3585979414163847e-05, "Full-pretrain/Loss": 1.9571013450622559, "Full-pretrain/Loss (Raw)": 1.7467520236968994, "Full-pretrain/Step": 6307, "Full-pretrain/Step Time": 17.587376594543457} +{"Full-pretrain/Learning Rate": 1.357842588210768e-05, "Full-pretrain/Loss": 1.9536641836166382, "Full-pretrain/Loss (Raw)": 1.8601700067520142, "Full-pretrain/Step": 6308, "Full-pretrain/Step Time": 17.590755129233003} +{"Full-pretrain/Learning Rate": 1.3570873667526063e-05, "Full-pretrain/Loss": 1.9560679197311401, "Full-pretrain/Loss (Raw)": 2.0757102966308594, "Full-pretrain/Step": 6309, "Full-pretrain/Step Time": 17.585412859916687} +{"Full-pretrain/Learning Rate": 1.3563322771290151e-05, "Full-pretrain/Loss": 1.9604308605194092, "Full-pretrain/Loss (Raw)": 1.982743263244629, "Full-pretrain/Step": 6310, "Full-pretrain/Step Time": 17.58434348553419} +{"Full-pretrain/Learning Rate": 1.3555773194270948e-05, "Full-pretrain/Loss": 1.9640624523162842, "Full-pretrain/Loss (Raw)": 2.217832088470459, "Full-pretrain/Step": 6311, "Full-pretrain/Step Time": 17.583426462486386} +{"Full-pretrain/Learning Rate": 1.3548224937339276e-05, "Full-pretrain/Loss": 1.9591472148895264, "Full-pretrain/Loss (Raw)": 1.8502699136734009, "Full-pretrain/Step": 6312, "Full-pretrain/Step Time": 17.583779046311975} +{"Full-pretrain/Learning Rate": 1.3540678001365836e-05, "Full-pretrain/Loss": 1.9538662433624268, "Full-pretrain/Loss (Raw)": 1.9381779432296753, "Full-pretrain/Step": 6313, "Full-pretrain/Step Time": 17.587735038250685} +{"Full-pretrain/Learning Rate": 1.3533132387221168e-05, "Full-pretrain/Loss": 1.9500765800476074, "Full-pretrain/Loss (Raw)": 1.7335186004638672, "Full-pretrain/Step": 6314, "Full-pretrain/Step Time": 17.59136275202036} +{"Full-pretrain/Learning Rate": 1.352558809577564e-05, "Full-pretrain/Loss": 1.9315779209136963, "Full-pretrain/Loss (Raw)": 1.6953730583190918, "Full-pretrain/Step": 6315, "Full-pretrain/Step Time": 17.591180343180895} +{"Full-pretrain/Learning Rate": 1.3518045127899493e-05, "Full-pretrain/Loss": 1.9287140369415283, "Full-pretrain/Loss (Raw)": 1.9532504081726074, "Full-pretrain/Step": 6316, "Full-pretrain/Step Time": 17.59301789291203} +{"Full-pretrain/Learning Rate": 1.3510503484462805e-05, "Full-pretrain/Loss": 1.9383063316345215, "Full-pretrain/Loss (Raw)": 2.1666064262390137, "Full-pretrain/Step": 6317, "Full-pretrain/Step Time": 17.58942806906998} +{"Full-pretrain/Learning Rate": 1.3502963166335504e-05, "Full-pretrain/Loss": 1.9324846267700195, "Full-pretrain/Loss (Raw)": 1.9151673316955566, "Full-pretrain/Step": 6318, "Full-pretrain/Step Time": 17.58938759751618} +{"Full-pretrain/Learning Rate": 1.3495424174387367e-05, "Full-pretrain/Loss": 1.9394726753234863, "Full-pretrain/Loss (Raw)": 2.1946301460266113, "Full-pretrain/Step": 6319, "Full-pretrain/Step Time": 17.589988954365253} +{"Full-pretrain/Learning Rate": 1.3487886509488002e-05, "Full-pretrain/Loss": 1.9362469911575317, "Full-pretrain/Loss (Raw)": 2.0219273567199707, "Full-pretrain/Step": 6320, "Full-pretrain/Step Time": 17.581742277368903} +{"Full-pretrain/Learning Rate": 1.3480350172506883e-05, "Full-pretrain/Loss": 1.9316411018371582, "Full-pretrain/Loss (Raw)": 1.8066210746765137, "Full-pretrain/Step": 6321, "Full-pretrain/Step Time": 17.590627750381827} +{"Full-pretrain/Learning Rate": 1.3472815164313325e-05, "Full-pretrain/Loss": 1.9412506818771362, "Full-pretrain/Loss (Raw)": 1.7368109226226807, "Full-pretrain/Step": 6322, "Full-pretrain/Step Time": 17.58781568519771} +{"Full-pretrain/Learning Rate": 1.3465281485776481e-05, "Full-pretrain/Loss": 1.9333889484405518, "Full-pretrain/Loss (Raw)": 1.7962093353271484, "Full-pretrain/Step": 6323, "Full-pretrain/Step Time": 17.5861679520458} +{"Full-pretrain/Learning Rate": 1.345774913776538e-05, "Full-pretrain/Loss": 1.9344959259033203, "Full-pretrain/Loss (Raw)": 1.970192551612854, "Full-pretrain/Step": 6324, "Full-pretrain/Step Time": 17.58319160155952} +{"Full-pretrain/Learning Rate": 1.3450218121148844e-05, "Full-pretrain/Loss": 1.9367519617080688, "Full-pretrain/Loss (Raw)": 2.1285152435302734, "Full-pretrain/Step": 6325, "Full-pretrain/Step Time": 17.582020696252584} +{"Full-pretrain/Learning Rate": 1.3442688436795592e-05, "Full-pretrain/Loss": 1.939737319946289, "Full-pretrain/Loss (Raw)": 1.9892361164093018, "Full-pretrain/Step": 6326, "Full-pretrain/Step Time": 17.58293610624969} +{"Full-pretrain/Learning Rate": 1.3435160085574177e-05, "Full-pretrain/Loss": 1.945431113243103, "Full-pretrain/Loss (Raw)": 2.136948823928833, "Full-pretrain/Step": 6327, "Full-pretrain/Step Time": 17.579440336674452} +{"Full-pretrain/Learning Rate": 1.3427633068352974e-05, "Full-pretrain/Loss": 1.9654884338378906, "Full-pretrain/Loss (Raw)": 2.3591790199279785, "Full-pretrain/Step": 6328, "Full-pretrain/Step Time": 17.584301372990012} +{"Full-pretrain/Learning Rate": 1.3420107386000227e-05, "Full-pretrain/Loss": 1.955273151397705, "Full-pretrain/Loss (Raw)": 1.6888208389282227, "Full-pretrain/Step": 6329, "Full-pretrain/Step Time": 17.581693090498447} +{"Full-pretrain/Learning Rate": 1.3412583039384036e-05, "Full-pretrain/Loss": 1.9687080383300781, "Full-pretrain/Loss (Raw)": 2.1811065673828125, "Full-pretrain/Step": 6330, "Full-pretrain/Step Time": 17.584549413993955} +{"Full-pretrain/Learning Rate": 1.3405060029372308e-05, "Full-pretrain/Loss": 1.964369773864746, "Full-pretrain/Loss (Raw)": 1.905651330947876, "Full-pretrain/Step": 6331, "Full-pretrain/Step Time": 17.58371514454484} +{"Full-pretrain/Learning Rate": 1.3397538356832828e-05, "Full-pretrain/Loss": 1.963578224182129, "Full-pretrain/Loss (Raw)": 1.7245886325836182, "Full-pretrain/Step": 6332, "Full-pretrain/Step Time": 17.581665948033333} +{"Full-pretrain/Learning Rate": 1.3390018022633225e-05, "Full-pretrain/Loss": 1.9751439094543457, "Full-pretrain/Loss (Raw)": 2.414357900619507, "Full-pretrain/Step": 6333, "Full-pretrain/Step Time": 17.580666601657867} +{"Full-pretrain/Learning Rate": 1.338249902764096e-05, "Full-pretrain/Loss": 1.9632763862609863, "Full-pretrain/Loss (Raw)": 1.6754966974258423, "Full-pretrain/Step": 6334, "Full-pretrain/Step Time": 17.5872253049165} +{"Full-pretrain/Learning Rate": 1.3374981372723362e-05, "Full-pretrain/Loss": 1.9627612829208374, "Full-pretrain/Loss (Raw)": 2.0029263496398926, "Full-pretrain/Step": 6335, "Full-pretrain/Step Time": 17.585108222439885} +{"Full-pretrain/Learning Rate": 1.3367465058747567e-05, "Full-pretrain/Loss": 1.9728693962097168, "Full-pretrain/Loss (Raw)": 1.9324753284454346, "Full-pretrain/Step": 6336, "Full-pretrain/Step Time": 17.586162542924285} +{"Full-pretrain/Learning Rate": 1.3359950086580588e-05, "Full-pretrain/Loss": 1.9499468803405762, "Full-pretrain/Loss (Raw)": 1.8586199283599854, "Full-pretrain/Step": 6337, "Full-pretrain/Step Time": 17.587989976629615} +{"Full-pretrain/Learning Rate": 1.335243645708928e-05, "Full-pretrain/Loss": 1.958693504333496, "Full-pretrain/Loss (Raw)": 2.0183115005493164, "Full-pretrain/Step": 6338, "Full-pretrain/Step Time": 17.59312628209591} +{"Full-pretrain/Learning Rate": 1.3344924171140328e-05, "Full-pretrain/Loss": 1.9629783630371094, "Full-pretrain/Loss (Raw)": 1.8838632106781006, "Full-pretrain/Step": 6339, "Full-pretrain/Step Time": 17.590113112702966} +{"Full-pretrain/Learning Rate": 1.333741322960029e-05, "Full-pretrain/Loss": 1.9611393213272095, "Full-pretrain/Loss (Raw)": 1.8013253211975098, "Full-pretrain/Step": 6340, "Full-pretrain/Step Time": 17.58971980586648} +{"Full-pretrain/Learning Rate": 1.3329903633335528e-05, "Full-pretrain/Loss": 1.9424753189086914, "Full-pretrain/Loss (Raw)": 1.4784595966339111, "Full-pretrain/Step": 6341, "Full-pretrain/Step Time": 17.588172985240817} +{"Full-pretrain/Learning Rate": 1.3322395383212277e-05, "Full-pretrain/Loss": 1.9391961097717285, "Full-pretrain/Loss (Raw)": 1.8778101205825806, "Full-pretrain/Step": 6342, "Full-pretrain/Step Time": 17.58196148276329} +{"Full-pretrain/Learning Rate": 1.3314888480096618e-05, "Full-pretrain/Loss": 1.941596269607544, "Full-pretrain/Loss (Raw)": 2.294635772705078, "Full-pretrain/Step": 6343, "Full-pretrain/Step Time": 17.590565929189324} +{"Full-pretrain/Learning Rate": 1.3307382924854479e-05, "Full-pretrain/Loss": 1.9533772468566895, "Full-pretrain/Loss (Raw)": 2.227259635925293, "Full-pretrain/Step": 6344, "Full-pretrain/Step Time": 17.586425667628646} +{"Full-pretrain/Learning Rate": 1.3299878718351594e-05, "Full-pretrain/Loss": 1.953801155090332, "Full-pretrain/Loss (Raw)": 1.9517416954040527, "Full-pretrain/Step": 6345, "Full-pretrain/Step Time": 17.58336210809648} +{"Full-pretrain/Learning Rate": 1.3292375861453598e-05, "Full-pretrain/Loss": 1.9563196897506714, "Full-pretrain/Loss (Raw)": 1.8141134977340698, "Full-pretrain/Step": 6346, "Full-pretrain/Step Time": 17.583157869055867} +{"Full-pretrain/Learning Rate": 1.3284874355025928e-05, "Full-pretrain/Loss": 1.966465950012207, "Full-pretrain/Loss (Raw)": 2.020052433013916, "Full-pretrain/Step": 6347, "Full-pretrain/Step Time": 17.583204358816147} +{"Full-pretrain/Learning Rate": 1.3277374199933879e-05, "Full-pretrain/Loss": 1.9627752304077148, "Full-pretrain/Loss (Raw)": 1.8351441621780396, "Full-pretrain/Step": 6348, "Full-pretrain/Step Time": 17.582369051873684} +{"Full-pretrain/Learning Rate": 1.3269875397042598e-05, "Full-pretrain/Loss": 1.9541735649108887, "Full-pretrain/Loss (Raw)": 1.8913558721542358, "Full-pretrain/Step": 6349, "Full-pretrain/Step Time": 17.588443027809262} +{"Full-pretrain/Learning Rate": 1.3262377947217069e-05, "Full-pretrain/Loss": 1.9617063999176025, "Full-pretrain/Loss (Raw)": 2.1562204360961914, "Full-pretrain/Step": 6350, "Full-pretrain/Step Time": 17.59056126885116} +{"Full-pretrain/Learning Rate": 1.3254881851322126e-05, "Full-pretrain/Loss": 1.9454870223999023, "Full-pretrain/Loss (Raw)": 1.6756037473678589, "Full-pretrain/Step": 6351, "Full-pretrain/Step Time": 17.591873675584793} +{"Full-pretrain/Learning Rate": 1.3247387110222426e-05, "Full-pretrain/Loss": 1.9402828216552734, "Full-pretrain/Loss (Raw)": 1.8553962707519531, "Full-pretrain/Step": 6352, "Full-pretrain/Step Time": 17.587019061669707} +{"Full-pretrain/Learning Rate": 1.3239893724782492e-05, "Full-pretrain/Loss": 1.948506236076355, "Full-pretrain/Loss (Raw)": 2.069769859313965, "Full-pretrain/Step": 6353, "Full-pretrain/Step Time": 17.587784541770816} +{"Full-pretrain/Learning Rate": 1.3232401695866687e-05, "Full-pretrain/Loss": 1.9603238105773926, "Full-pretrain/Loss (Raw)": 2.114978790283203, "Full-pretrain/Step": 6354, "Full-pretrain/Step Time": 17.591199461370707} +{"Full-pretrain/Learning Rate": 1.3224911024339207e-05, "Full-pretrain/Loss": 1.9635902643203735, "Full-pretrain/Loss (Raw)": 1.9007303714752197, "Full-pretrain/Step": 6355, "Full-pretrain/Step Time": 17.593951296061277} +{"Full-pretrain/Learning Rate": 1.3217421711064112e-05, "Full-pretrain/Loss": 1.9674540758132935, "Full-pretrain/Loss (Raw)": 2.093834638595581, "Full-pretrain/Step": 6356, "Full-pretrain/Step Time": 17.58978148549795} +{"Full-pretrain/Learning Rate": 1.3209933756905274e-05, "Full-pretrain/Loss": 1.9578806161880493, "Full-pretrain/Loss (Raw)": 1.8221652507781982, "Full-pretrain/Step": 6357, "Full-pretrain/Step Time": 17.591903468593955} +{"Full-pretrain/Learning Rate": 1.3202447162726433e-05, "Full-pretrain/Loss": 1.963366985321045, "Full-pretrain/Loss (Raw)": 2.1648035049438477, "Full-pretrain/Step": 6358, "Full-pretrain/Step Time": 17.588757494464517} +{"Full-pretrain/Learning Rate": 1.3194961929391167e-05, "Full-pretrain/Loss": 1.954329490661621, "Full-pretrain/Loss (Raw)": 1.8477463722229004, "Full-pretrain/Step": 6359, "Full-pretrain/Step Time": 17.590043153613806} +{"Full-pretrain/Learning Rate": 1.3187478057762904e-05, "Full-pretrain/Loss": 1.9401981830596924, "Full-pretrain/Loss (Raw)": 1.9069757461547852, "Full-pretrain/Step": 6360, "Full-pretrain/Step Time": 17.588293250650167} +{"Full-pretrain/Learning Rate": 1.3179995548704883e-05, "Full-pretrain/Loss": 1.938339114189148, "Full-pretrain/Loss (Raw)": 1.6293318271636963, "Full-pretrain/Step": 6361, "Full-pretrain/Step Time": 17.58752141147852} +{"Full-pretrain/Learning Rate": 1.3172514403080233e-05, "Full-pretrain/Loss": 1.9240213632583618, "Full-pretrain/Loss (Raw)": 1.7229382991790771, "Full-pretrain/Step": 6362, "Full-pretrain/Step Time": 17.591475619003177} +{"Full-pretrain/Learning Rate": 1.3165034621751882e-05, "Full-pretrain/Loss": 1.9256970882415771, "Full-pretrain/Loss (Raw)": 1.959273338317871, "Full-pretrain/Step": 6363, "Full-pretrain/Step Time": 17.596205722540617} +{"Full-pretrain/Learning Rate": 1.3157556205582627e-05, "Full-pretrain/Loss": 1.9242424964904785, "Full-pretrain/Loss (Raw)": 1.6780439615249634, "Full-pretrain/Step": 6364, "Full-pretrain/Step Time": 17.602332646027207} +{"Full-pretrain/Learning Rate": 1.3150079155435102e-05, "Full-pretrain/Loss": 1.9043078422546387, "Full-pretrain/Loss (Raw)": 1.7764508724212646, "Full-pretrain/Step": 6365, "Full-pretrain/Step Time": 17.595097232609987} +{"Full-pretrain/Learning Rate": 1.3142603472171788e-05, "Full-pretrain/Loss": 1.903857707977295, "Full-pretrain/Loss (Raw)": 1.6610875129699707, "Full-pretrain/Step": 6366, "Full-pretrain/Step Time": 17.60035232640803} +{"Full-pretrain/Learning Rate": 1.3135129156654991e-05, "Full-pretrain/Loss": 1.898996114730835, "Full-pretrain/Loss (Raw)": 1.8473594188690186, "Full-pretrain/Step": 6367, "Full-pretrain/Step Time": 17.60125326924026} +{"Full-pretrain/Learning Rate": 1.3127656209746875e-05, "Full-pretrain/Loss": 1.8904602527618408, "Full-pretrain/Loss (Raw)": 1.6593279838562012, "Full-pretrain/Step": 6368, "Full-pretrain/Step Time": 17.605474803596735} +{"Full-pretrain/Learning Rate": 1.3120184632309446e-05, "Full-pretrain/Loss": 1.906346321105957, "Full-pretrain/Loss (Raw)": 2.3669698238372803, "Full-pretrain/Step": 6369, "Full-pretrain/Step Time": 17.60573111847043} +{"Full-pretrain/Learning Rate": 1.3112714425204541e-05, "Full-pretrain/Loss": 1.9078330993652344, "Full-pretrain/Loss (Raw)": 2.0658888816833496, "Full-pretrain/Step": 6370, "Full-pretrain/Step Time": 17.602623900398612} +{"Full-pretrain/Learning Rate": 1.3105245589293851e-05, "Full-pretrain/Loss": 1.9094126224517822, "Full-pretrain/Loss (Raw)": 1.9344121217727661, "Full-pretrain/Step": 6371, "Full-pretrain/Step Time": 17.60047055967152} +{"Full-pretrain/Learning Rate": 1.3097778125438912e-05, "Full-pretrain/Loss": 1.9111149311065674, "Full-pretrain/Loss (Raw)": 1.8557953834533691, "Full-pretrain/Step": 6372, "Full-pretrain/Step Time": 17.598056266084313} +{"Full-pretrain/Learning Rate": 1.3090312034501073e-05, "Full-pretrain/Loss": 1.9279706478118896, "Full-pretrain/Loss (Raw)": 2.0178451538085938, "Full-pretrain/Step": 6373, "Full-pretrain/Step Time": 17.59572389163077} +{"Full-pretrain/Learning Rate": 1.3082847317341557e-05, "Full-pretrain/Loss": 1.9256296157836914, "Full-pretrain/Loss (Raw)": 1.8028943538665771, "Full-pretrain/Step": 6374, "Full-pretrain/Step Time": 17.588267654180527} +{"Full-pretrain/Learning Rate": 1.3075383974821415e-05, "Full-pretrain/Loss": 1.910705327987671, "Full-pretrain/Loss (Raw)": 1.817061185836792, "Full-pretrain/Step": 6375, "Full-pretrain/Step Time": 17.59520960226655} +{"Full-pretrain/Learning Rate": 1.3067922007801547e-05, "Full-pretrain/Loss": 1.896259069442749, "Full-pretrain/Loss (Raw)": 1.7649788856506348, "Full-pretrain/Step": 6376, "Full-pretrain/Step Time": 17.59584615379572} +{"Full-pretrain/Learning Rate": 1.3060461417142677e-05, "Full-pretrain/Loss": 1.8857064247131348, "Full-pretrain/Loss (Raw)": 1.614058256149292, "Full-pretrain/Step": 6377, "Full-pretrain/Step Time": 17.594561655074358} +{"Full-pretrain/Learning Rate": 1.3053002203705395e-05, "Full-pretrain/Loss": 1.8856393098831177, "Full-pretrain/Loss (Raw)": 1.8119618892669678, "Full-pretrain/Step": 6378, "Full-pretrain/Step Time": 17.596268130466342} +{"Full-pretrain/Learning Rate": 1.3045544368350098e-05, "Full-pretrain/Loss": 1.8771557807922363, "Full-pretrain/Loss (Raw)": 1.7485814094543457, "Full-pretrain/Step": 6379, "Full-pretrain/Step Time": 17.59405948780477} +{"Full-pretrain/Learning Rate": 1.3038087911937058e-05, "Full-pretrain/Loss": 1.8847970962524414, "Full-pretrain/Loss (Raw)": 2.079667568206787, "Full-pretrain/Step": 6380, "Full-pretrain/Step Time": 17.58657362125814} +{"Full-pretrain/Learning Rate": 1.3030632835326379e-05, "Full-pretrain/Loss": 1.8927817344665527, "Full-pretrain/Loss (Raw)": 2.1468656063079834, "Full-pretrain/Step": 6381, "Full-pretrain/Step Time": 17.58834526874125} +{"Full-pretrain/Learning Rate": 1.3023179139378e-05, "Full-pretrain/Loss": 1.8865759372711182, "Full-pretrain/Loss (Raw)": 1.9576294422149658, "Full-pretrain/Step": 6382, "Full-pretrain/Step Time": 17.59048667922616} +{"Full-pretrain/Learning Rate": 1.301572682495169e-05, "Full-pretrain/Loss": 1.8908698558807373, "Full-pretrain/Loss (Raw)": 1.8130102157592773, "Full-pretrain/Step": 6383, "Full-pretrain/Step Time": 17.597545193508267} +{"Full-pretrain/Learning Rate": 1.300827589290708e-05, "Full-pretrain/Loss": 1.9051477909088135, "Full-pretrain/Loss (Raw)": 2.312293529510498, "Full-pretrain/Step": 6384, "Full-pretrain/Step Time": 17.59686267375946} +{"Full-pretrain/Learning Rate": 1.3000826344103629e-05, "Full-pretrain/Loss": 1.9020531177520752, "Full-pretrain/Loss (Raw)": 1.970734715461731, "Full-pretrain/Step": 6385, "Full-pretrain/Step Time": 17.59880506619811} +{"Full-pretrain/Learning Rate": 1.2993378179400645e-05, "Full-pretrain/Loss": 1.8995085954666138, "Full-pretrain/Loss (Raw)": 2.033557415008545, "Full-pretrain/Step": 6386, "Full-pretrain/Step Time": 17.600514765828848} +{"Full-pretrain/Learning Rate": 1.2985931399657279e-05, "Full-pretrain/Loss": 1.9051284790039062, "Full-pretrain/Loss (Raw)": 2.080568790435791, "Full-pretrain/Step": 6387, "Full-pretrain/Step Time": 17.60415335185826} +{"Full-pretrain/Learning Rate": 1.2978486005732493e-05, "Full-pretrain/Loss": 1.8974976539611816, "Full-pretrain/Loss (Raw)": 1.849644660949707, "Full-pretrain/Step": 6388, "Full-pretrain/Step Time": 17.602520242333412} +{"Full-pretrain/Learning Rate": 1.297104199848512e-05, "Full-pretrain/Loss": 1.8977843523025513, "Full-pretrain/Loss (Raw)": 1.8313395977020264, "Full-pretrain/Step": 6389, "Full-pretrain/Step Time": 17.59911434724927} +{"Full-pretrain/Learning Rate": 1.2963599378773828e-05, "Full-pretrain/Loss": 1.8890725374221802, "Full-pretrain/Loss (Raw)": 1.8860262632369995, "Full-pretrain/Step": 6390, "Full-pretrain/Step Time": 17.608117079362273} +{"Full-pretrain/Learning Rate": 1.2956158147457115e-05, "Full-pretrain/Loss": 1.890185832977295, "Full-pretrain/Loss (Raw)": 1.883376121520996, "Full-pretrain/Step": 6391, "Full-pretrain/Step Time": 17.60166391544044} +{"Full-pretrain/Learning Rate": 1.2948718305393329e-05, "Full-pretrain/Loss": 1.894029140472412, "Full-pretrain/Loss (Raw)": 2.029956340789795, "Full-pretrain/Step": 6392, "Full-pretrain/Step Time": 17.605565775185823} +{"Full-pretrain/Learning Rate": 1.294127985344066e-05, "Full-pretrain/Loss": 1.8988018035888672, "Full-pretrain/Loss (Raw)": 1.782063603401184, "Full-pretrain/Step": 6393, "Full-pretrain/Step Time": 17.60638071037829} +{"Full-pretrain/Learning Rate": 1.2933842792457113e-05, "Full-pretrain/Loss": 1.9021830558776855, "Full-pretrain/Loss (Raw)": 1.8311309814453125, "Full-pretrain/Step": 6394, "Full-pretrain/Step Time": 17.606228912249207} +{"Full-pretrain/Learning Rate": 1.2926407123300571e-05, "Full-pretrain/Loss": 1.9039366245269775, "Full-pretrain/Loss (Raw)": 2.0153932571411133, "Full-pretrain/Step": 6395, "Full-pretrain/Step Time": 17.604380641132593} +{"Full-pretrain/Learning Rate": 1.2918972846828712e-05, "Full-pretrain/Loss": 1.911475419998169, "Full-pretrain/Loss (Raw)": 1.9192804098129272, "Full-pretrain/Step": 6396, "Full-pretrain/Step Time": 17.608167693018913} +{"Full-pretrain/Learning Rate": 1.291153996389909e-05, "Full-pretrain/Loss": 1.919325351715088, "Full-pretrain/Loss (Raw)": 2.027653217315674, "Full-pretrain/Step": 6397, "Full-pretrain/Step Time": 17.607848197221756} +{"Full-pretrain/Learning Rate": 1.2904108475369096e-05, "Full-pretrain/Loss": 1.9205257892608643, "Full-pretrain/Loss (Raw)": 1.6994973421096802, "Full-pretrain/Step": 6398, "Full-pretrain/Step Time": 17.602872187271714} +{"Full-pretrain/Learning Rate": 1.2896678382095928e-05, "Full-pretrain/Loss": 1.919236183166504, "Full-pretrain/Loss (Raw)": 1.8060957193374634, "Full-pretrain/Step": 6399, "Full-pretrain/Step Time": 17.602155938744545} +{"Full-pretrain/Learning Rate": 1.2889249684936655e-05, "Full-pretrain/Loss": 1.9248074293136597, "Full-pretrain/Loss (Raw)": 1.8376069068908691, "Full-pretrain/Step": 6400, "Full-pretrain/Step Time": 17.602770749479532} +{"Full-pretrain/Learning Rate": 1.2881822384748177e-05, "Full-pretrain/Loss": 1.9068522453308105, "Full-pretrain/Loss (Raw)": 1.7924036979675293, "Full-pretrain/Step": 6401, "Full-pretrain/Step Time": 17.60673481039703} +{"Full-pretrain/Learning Rate": 1.2874396482387224e-05, "Full-pretrain/Loss": 1.905784010887146, "Full-pretrain/Loss (Raw)": 2.031703233718872, "Full-pretrain/Step": 6402, "Full-pretrain/Step Time": 17.60131928138435} +{"Full-pretrain/Learning Rate": 1.286697197871039e-05, "Full-pretrain/Loss": 1.9182615280151367, "Full-pretrain/Loss (Raw)": 2.33369517326355, "Full-pretrain/Step": 6403, "Full-pretrain/Step Time": 17.598023949190974} +{"Full-pretrain/Learning Rate": 1.2859548874574062e-05, "Full-pretrain/Loss": 1.9177136421203613, "Full-pretrain/Loss (Raw)": 1.838263750076294, "Full-pretrain/Step": 6404, "Full-pretrain/Step Time": 17.597406797111034} +{"Full-pretrain/Learning Rate": 1.2852127170834505e-05, "Full-pretrain/Loss": 1.9130527973175049, "Full-pretrain/Loss (Raw)": 1.8686974048614502, "Full-pretrain/Step": 6405, "Full-pretrain/Step Time": 17.598525177687407} +{"Full-pretrain/Learning Rate": 1.284470686834781e-05, "Full-pretrain/Loss": 1.9249597787857056, "Full-pretrain/Loss (Raw)": 2.1839170455932617, "Full-pretrain/Step": 6406, "Full-pretrain/Step Time": 17.594401877373457} +{"Full-pretrain/Learning Rate": 1.2837287967969905e-05, "Full-pretrain/Loss": 1.9304866790771484, "Full-pretrain/Loss (Raw)": 1.993922472000122, "Full-pretrain/Step": 6407, "Full-pretrain/Step Time": 17.58977403678} +{"Full-pretrain/Learning Rate": 1.282987047055657e-05, "Full-pretrain/Loss": 1.9316792488098145, "Full-pretrain/Loss (Raw)": 1.8031429052352905, "Full-pretrain/Step": 6408, "Full-pretrain/Step Time": 17.591555362567306} +{"Full-pretrain/Learning Rate": 1.282245437696339e-05, "Full-pretrain/Loss": 1.9333360195159912, "Full-pretrain/Loss (Raw)": 1.6670730113983154, "Full-pretrain/Step": 6409, "Full-pretrain/Step Time": 17.593260992318392} +{"Full-pretrain/Learning Rate": 1.2815039688045815e-05, "Full-pretrain/Loss": 1.9430655241012573, "Full-pretrain/Loss (Raw)": 2.123304605484009, "Full-pretrain/Step": 6410, "Full-pretrain/Step Time": 17.593808252364397} +{"Full-pretrain/Learning Rate": 1.2807626404659142e-05, "Full-pretrain/Loss": 1.9561455249786377, "Full-pretrain/Loss (Raw)": 2.1671438217163086, "Full-pretrain/Step": 6411, "Full-pretrain/Step Time": 17.58955815434456} +{"Full-pretrain/Learning Rate": 1.280021452765847e-05, "Full-pretrain/Loss": 1.9498727321624756, "Full-pretrain/Loss (Raw)": 1.8789339065551758, "Full-pretrain/Step": 6412, "Full-pretrain/Step Time": 17.59711165726185} +{"Full-pretrain/Learning Rate": 1.2792804057898764e-05, "Full-pretrain/Loss": 1.936133861541748, "Full-pretrain/Loss (Raw)": 1.7072205543518066, "Full-pretrain/Step": 6413, "Full-pretrain/Step Time": 17.59969305060804} +{"Full-pretrain/Learning Rate": 1.2785394996234828e-05, "Full-pretrain/Loss": 1.926276683807373, "Full-pretrain/Loss (Raw)": 1.6422014236450195, "Full-pretrain/Step": 6414, "Full-pretrain/Step Time": 17.599375665187836} +{"Full-pretrain/Learning Rate": 1.2777987343521277e-05, "Full-pretrain/Loss": 1.9287068843841553, "Full-pretrain/Loss (Raw)": 1.890777826309204, "Full-pretrain/Step": 6415, "Full-pretrain/Step Time": 17.594473341479897} +{"Full-pretrain/Learning Rate": 1.2770581100612594e-05, "Full-pretrain/Loss": 1.9165313243865967, "Full-pretrain/Loss (Raw)": 1.9226741790771484, "Full-pretrain/Step": 6416, "Full-pretrain/Step Time": 17.599505750462413} +{"Full-pretrain/Learning Rate": 1.2763176268363081e-05, "Full-pretrain/Loss": 1.9014928340911865, "Full-pretrain/Loss (Raw)": 1.4895055294036865, "Full-pretrain/Step": 6417, "Full-pretrain/Step Time": 17.603555651381612} +{"Full-pretrain/Learning Rate": 1.2755772847626884e-05, "Full-pretrain/Loss": 1.9044108390808105, "Full-pretrain/Loss (Raw)": 2.1269326210021973, "Full-pretrain/Step": 6418, "Full-pretrain/Step Time": 17.60162241756916} +{"Full-pretrain/Learning Rate": 1.2748370839258e-05, "Full-pretrain/Loss": 1.9064807891845703, "Full-pretrain/Loss (Raw)": 2.1468069553375244, "Full-pretrain/Step": 6419, "Full-pretrain/Step Time": 17.602150032296777} +{"Full-pretrain/Learning Rate": 1.274097024411022e-05, "Full-pretrain/Loss": 1.9059653282165527, "Full-pretrain/Loss (Raw)": 1.83315110206604, "Full-pretrain/Step": 6420, "Full-pretrain/Step Time": 17.602602493017912} +{"Full-pretrain/Learning Rate": 1.2733571063037214e-05, "Full-pretrain/Loss": 1.9034020900726318, "Full-pretrain/Loss (Raw)": 1.7493138313293457, "Full-pretrain/Step": 6421, "Full-pretrain/Step Time": 17.604656672105193} +{"Full-pretrain/Learning Rate": 1.272617329689248e-05, "Full-pretrain/Loss": 1.9012477397918701, "Full-pretrain/Loss (Raw)": 1.8170931339263916, "Full-pretrain/Step": 6422, "Full-pretrain/Step Time": 17.60200816951692} +{"Full-pretrain/Learning Rate": 1.2718776946529337e-05, "Full-pretrain/Loss": 1.896904706954956, "Full-pretrain/Loss (Raw)": 1.7443938255310059, "Full-pretrain/Step": 6423, "Full-pretrain/Step Time": 17.60190975293517} +{"Full-pretrain/Learning Rate": 1.271138201280097e-05, "Full-pretrain/Loss": 1.8864024877548218, "Full-pretrain/Loss (Raw)": 1.6938867568969727, "Full-pretrain/Step": 6424, "Full-pretrain/Step Time": 17.604658503085375} +{"Full-pretrain/Learning Rate": 1.2703988496560363e-05, "Full-pretrain/Loss": 1.8973532915115356, "Full-pretrain/Loss (Raw)": 2.1324892044067383, "Full-pretrain/Step": 6425, "Full-pretrain/Step Time": 17.606606198474765} +{"Full-pretrain/Learning Rate": 1.2696596398660357e-05, "Full-pretrain/Loss": 1.8971140384674072, "Full-pretrain/Loss (Raw)": 1.8234745264053345, "Full-pretrain/Step": 6426, "Full-pretrain/Step Time": 17.60750373452902} +{"Full-pretrain/Learning Rate": 1.2689205719953633e-05, "Full-pretrain/Loss": 1.888286828994751, "Full-pretrain/Loss (Raw)": 1.732924461364746, "Full-pretrain/Step": 6427, "Full-pretrain/Step Time": 17.604444317519665} +{"Full-pretrain/Learning Rate": 1.2681816461292715e-05, "Full-pretrain/Loss": 1.890852689743042, "Full-pretrain/Loss (Raw)": 2.0013861656188965, "Full-pretrain/Step": 6428, "Full-pretrain/Step Time": 17.605899535119534} +{"Full-pretrain/Learning Rate": 1.2674428623529926e-05, "Full-pretrain/Loss": 1.8893351554870605, "Full-pretrain/Loss (Raw)": 1.9790887832641602, "Full-pretrain/Step": 6429, "Full-pretrain/Step Time": 17.601138366386294} +{"Full-pretrain/Learning Rate": 1.2667042207517477e-05, "Full-pretrain/Loss": 1.8876163959503174, "Full-pretrain/Loss (Raw)": 1.6445014476776123, "Full-pretrain/Step": 6430, "Full-pretrain/Step Time": 17.610743675380945} +{"Full-pretrain/Learning Rate": 1.2659657214107365e-05, "Full-pretrain/Loss": 1.8856923580169678, "Full-pretrain/Loss (Raw)": 1.744524598121643, "Full-pretrain/Step": 6431, "Full-pretrain/Step Time": 17.60743284225464} +{"Full-pretrain/Learning Rate": 1.2652273644151458e-05, "Full-pretrain/Loss": 1.891163945198059, "Full-pretrain/Loss (Raw)": 2.012698173522949, "Full-pretrain/Step": 6432, "Full-pretrain/Step Time": 17.608524003997445} +{"Full-pretrain/Learning Rate": 1.2644891498501443e-05, "Full-pretrain/Loss": 1.8961905241012573, "Full-pretrain/Loss (Raw)": 1.9532548189163208, "Full-pretrain/Step": 6433, "Full-pretrain/Step Time": 17.61095902323723} +{"Full-pretrain/Learning Rate": 1.2637510778008854e-05, "Full-pretrain/Loss": 1.8891592025756836, "Full-pretrain/Loss (Raw)": 1.8067022562026978, "Full-pretrain/Step": 6434, "Full-pretrain/Step Time": 17.61535270139575} +{"Full-pretrain/Learning Rate": 1.263013148352506e-05, "Full-pretrain/Loss": 1.8853700160980225, "Full-pretrain/Loss (Raw)": 2.212437629699707, "Full-pretrain/Step": 6435, "Full-pretrain/Step Time": 17.615245824679732} +{"Full-pretrain/Learning Rate": 1.2622753615901244e-05, "Full-pretrain/Loss": 1.8829967975616455, "Full-pretrain/Loss (Raw)": 1.7623217105865479, "Full-pretrain/Step": 6436, "Full-pretrain/Step Time": 17.611288115382195} +{"Full-pretrain/Learning Rate": 1.2615377175988449e-05, "Full-pretrain/Loss": 1.8667638301849365, "Full-pretrain/Loss (Raw)": 1.3492436408996582, "Full-pretrain/Step": 6437, "Full-pretrain/Step Time": 17.608859483152628} +{"Full-pretrain/Learning Rate": 1.2608002164637544e-05, "Full-pretrain/Loss": 1.8650367259979248, "Full-pretrain/Loss (Raw)": 2.128647804260254, "Full-pretrain/Step": 6438, "Full-pretrain/Step Time": 17.610564932227135} +{"Full-pretrain/Learning Rate": 1.2600628582699236e-05, "Full-pretrain/Loss": 1.864116907119751, "Full-pretrain/Loss (Raw)": 1.9644867181777954, "Full-pretrain/Step": 6439, "Full-pretrain/Step Time": 17.607858888804913} +{"Full-pretrain/Learning Rate": 1.259325643102407e-05, "Full-pretrain/Loss": 1.8528366088867188, "Full-pretrain/Loss (Raw)": 1.4421746730804443, "Full-pretrain/Step": 6440, "Full-pretrain/Step Time": 17.61248424462974} +{"Full-pretrain/Learning Rate": 1.2585885710462408e-05, "Full-pretrain/Loss": 1.8658134937286377, "Full-pretrain/Loss (Raw)": 2.082334280014038, "Full-pretrain/Step": 6441, "Full-pretrain/Step Time": 17.607699880376458} +{"Full-pretrain/Learning Rate": 1.2578516421864467e-05, "Full-pretrain/Loss": 1.862432837486267, "Full-pretrain/Loss (Raw)": 2.0151236057281494, "Full-pretrain/Step": 6442, "Full-pretrain/Step Time": 17.60837920755148} +{"Full-pretrain/Learning Rate": 1.2571148566080288e-05, "Full-pretrain/Loss": 1.8426573276519775, "Full-pretrain/Loss (Raw)": 1.5343269109725952, "Full-pretrain/Step": 6443, "Full-pretrain/Step Time": 17.608269089832902} +{"Full-pretrain/Learning Rate": 1.2563782143959769e-05, "Full-pretrain/Loss": 1.8402786254882812, "Full-pretrain/Loss (Raw)": 1.8028180599212646, "Full-pretrain/Step": 6444, "Full-pretrain/Step Time": 17.608407055959105} +{"Full-pretrain/Learning Rate": 1.2556417156352596e-05, "Full-pretrain/Loss": 1.848542332649231, "Full-pretrain/Loss (Raw)": 1.9716565608978271, "Full-pretrain/Step": 6445, "Full-pretrain/Step Time": 17.60683935135603} +{"Full-pretrain/Learning Rate": 1.2549053604108341e-05, "Full-pretrain/Loss": 1.856773853302002, "Full-pretrain/Loss (Raw)": 1.9056143760681152, "Full-pretrain/Step": 6446, "Full-pretrain/Step Time": 17.608310213312507} +{"Full-pretrain/Learning Rate": 1.2541691488076369e-05, "Full-pretrain/Loss": 1.8561805486679077, "Full-pretrain/Loss (Raw)": 1.8717880249023438, "Full-pretrain/Step": 6447, "Full-pretrain/Step Time": 17.606981126591563} +{"Full-pretrain/Learning Rate": 1.2534330809105902e-05, "Full-pretrain/Loss": 1.857155203819275, "Full-pretrain/Loss (Raw)": 1.9538633823394775, "Full-pretrain/Step": 6448, "Full-pretrain/Step Time": 17.61107810586691} +{"Full-pretrain/Learning Rate": 1.2526971568045998e-05, "Full-pretrain/Loss": 1.877109408378601, "Full-pretrain/Loss (Raw)": 2.128040313720703, "Full-pretrain/Step": 6449, "Full-pretrain/Step Time": 17.608777597546577} +{"Full-pretrain/Learning Rate": 1.2519613765745542e-05, "Full-pretrain/Loss": 1.8712035417556763, "Full-pretrain/Loss (Raw)": 1.937946081161499, "Full-pretrain/Step": 6450, "Full-pretrain/Step Time": 17.60653885640204} +{"Full-pretrain/Learning Rate": 1.2512257403053257e-05, "Full-pretrain/Loss": 1.882522463798523, "Full-pretrain/Loss (Raw)": 2.50900936126709, "Full-pretrain/Step": 6451, "Full-pretrain/Step Time": 17.610791889950633} +{"Full-pretrain/Learning Rate": 1.2504902480817687e-05, "Full-pretrain/Loss": 1.887953519821167, "Full-pretrain/Loss (Raw)": 2.006943702697754, "Full-pretrain/Step": 6452, "Full-pretrain/Step Time": 17.609363244846463} +{"Full-pretrain/Learning Rate": 1.2497548999887224e-05, "Full-pretrain/Loss": 1.8954784870147705, "Full-pretrain/Loss (Raw)": 1.9901143312454224, "Full-pretrain/Step": 6453, "Full-pretrain/Step Time": 17.608288563787937} +{"Full-pretrain/Learning Rate": 1.2490196961110088e-05, "Full-pretrain/Loss": 1.9058706760406494, "Full-pretrain/Loss (Raw)": 2.1496429443359375, "Full-pretrain/Step": 6454, "Full-pretrain/Step Time": 17.607928158715367} +{"Full-pretrain/Learning Rate": 1.2482846365334339e-05, "Full-pretrain/Loss": 1.9196033477783203, "Full-pretrain/Loss (Raw)": 2.183839797973633, "Full-pretrain/Step": 6455, "Full-pretrain/Step Time": 17.60583471134305} +{"Full-pretrain/Learning Rate": 1.2475497213407869e-05, "Full-pretrain/Loss": 1.9245548248291016, "Full-pretrain/Loss (Raw)": 1.8523319959640503, "Full-pretrain/Step": 6456, "Full-pretrain/Step Time": 17.608674133196473} +{"Full-pretrain/Learning Rate": 1.2468149506178386e-05, "Full-pretrain/Loss": 1.915915846824646, "Full-pretrain/Loss (Raw)": 1.8560454845428467, "Full-pretrain/Step": 6457, "Full-pretrain/Step Time": 17.60831884853542} +{"Full-pretrain/Learning Rate": 1.2460803244493454e-05, "Full-pretrain/Loss": 1.9078569412231445, "Full-pretrain/Loss (Raw)": 1.565588355064392, "Full-pretrain/Step": 6458, "Full-pretrain/Step Time": 17.607864156365395} +{"Full-pretrain/Learning Rate": 1.2453458429200463e-05, "Full-pretrain/Loss": 1.9101324081420898, "Full-pretrain/Loss (Raw)": 1.805741310119629, "Full-pretrain/Step": 6459, "Full-pretrain/Step Time": 17.606678150594234} +{"Full-pretrain/Learning Rate": 1.244611506114664e-05, "Full-pretrain/Loss": 1.9095532894134521, "Full-pretrain/Loss (Raw)": 1.9828510284423828, "Full-pretrain/Step": 6460, "Full-pretrain/Step Time": 17.608193203806877} +{"Full-pretrain/Learning Rate": 1.2438773141179025e-05, "Full-pretrain/Loss": 1.906996726989746, "Full-pretrain/Loss (Raw)": 1.8972790241241455, "Full-pretrain/Step": 6461, "Full-pretrain/Step Time": 17.60965039767325} +{"Full-pretrain/Learning Rate": 1.2431432670144521e-05, "Full-pretrain/Loss": 1.9137852191925049, "Full-pretrain/Loss (Raw)": 1.8617353439331055, "Full-pretrain/Step": 6462, "Full-pretrain/Step Time": 17.606474684551358} +{"Full-pretrain/Learning Rate": 1.2424093648889834e-05, "Full-pretrain/Loss": 1.9183905124664307, "Full-pretrain/Loss (Raw)": 1.8918941020965576, "Full-pretrain/Step": 6463, "Full-pretrain/Step Time": 17.60599093325436} +{"Full-pretrain/Learning Rate": 1.2416756078261527e-05, "Full-pretrain/Loss": 1.9167653322219849, "Full-pretrain/Loss (Raw)": 1.960691213607788, "Full-pretrain/Step": 6464, "Full-pretrain/Step Time": 17.607247591018677} +{"Full-pretrain/Learning Rate": 1.2409419959105981e-05, "Full-pretrain/Loss": 1.9107775688171387, "Full-pretrain/Loss (Raw)": 1.7616441249847412, "Full-pretrain/Step": 6465, "Full-pretrain/Step Time": 17.60931423306465} +{"Full-pretrain/Learning Rate": 1.2402085292269428e-05, "Full-pretrain/Loss": 1.9201468229293823, "Full-pretrain/Loss (Raw)": 2.1065218448638916, "Full-pretrain/Step": 6466, "Full-pretrain/Step Time": 17.610858300700784} +{"Full-pretrain/Learning Rate": 1.2394752078597902e-05, "Full-pretrain/Loss": 1.901409387588501, "Full-pretrain/Loss (Raw)": 1.6128382682800293, "Full-pretrain/Step": 6467, "Full-pretrain/Step Time": 17.613072277978063} +{"Full-pretrain/Learning Rate": 1.238742031893729e-05, "Full-pretrain/Loss": 1.9020028114318848, "Full-pretrain/Loss (Raw)": 1.781313180923462, "Full-pretrain/Step": 6468, "Full-pretrain/Step Time": 17.62126655690372} +{"Full-pretrain/Learning Rate": 1.2380090014133317e-05, "Full-pretrain/Loss": 1.9195857048034668, "Full-pretrain/Loss (Raw)": 1.9118963479995728, "Full-pretrain/Step": 6469, "Full-pretrain/Step Time": 17.625010550022125} +{"Full-pretrain/Learning Rate": 1.2372761165031521e-05, "Full-pretrain/Loss": 1.9189436435699463, "Full-pretrain/Loss (Raw)": 2.108103036880493, "Full-pretrain/Step": 6470, "Full-pretrain/Step Time": 17.628820441663265} +{"Full-pretrain/Learning Rate": 1.2365433772477289e-05, "Full-pretrain/Loss": 1.914249300956726, "Full-pretrain/Loss (Raw)": 1.8142642974853516, "Full-pretrain/Step": 6471, "Full-pretrain/Step Time": 17.62721762433648} +{"Full-pretrain/Learning Rate": 1.2358107837315841e-05, "Full-pretrain/Loss": 1.9353784322738647, "Full-pretrain/Loss (Raw)": 2.118309259414673, "Full-pretrain/Step": 6472, "Full-pretrain/Step Time": 17.626965099945664} +{"Full-pretrain/Learning Rate": 1.2350783360392201e-05, "Full-pretrain/Loss": 1.9253416061401367, "Full-pretrain/Loss (Raw)": 1.7611525058746338, "Full-pretrain/Step": 6473, "Full-pretrain/Step Time": 17.63008163869381} +{"Full-pretrain/Learning Rate": 1.2343460342551258e-05, "Full-pretrain/Loss": 1.92356276512146, "Full-pretrain/Loss (Raw)": 1.9582003355026245, "Full-pretrain/Step": 6474, "Full-pretrain/Step Time": 17.63452959060669} +{"Full-pretrain/Learning Rate": 1.2336138784637713e-05, "Full-pretrain/Loss": 1.9356143474578857, "Full-pretrain/Loss (Raw)": 1.9199802875518799, "Full-pretrain/Step": 6475, "Full-pretrain/Step Time": 17.639958929270506} +{"Full-pretrain/Learning Rate": 1.232881868749611e-05, "Full-pretrain/Loss": 1.930586576461792, "Full-pretrain/Loss (Raw)": 1.641932487487793, "Full-pretrain/Step": 6476, "Full-pretrain/Step Time": 17.6463972479105} +{"Full-pretrain/Learning Rate": 1.232150005197083e-05, "Full-pretrain/Loss": 1.9246010780334473, "Full-pretrain/Loss (Raw)": 1.7801194190979004, "Full-pretrain/Step": 6477, "Full-pretrain/Step Time": 17.645795464515686} +{"Full-pretrain/Learning Rate": 1.2314182878906052e-05, "Full-pretrain/Loss": 1.9194804430007935, "Full-pretrain/Loss (Raw)": 1.7417521476745605, "Full-pretrain/Step": 6478, "Full-pretrain/Step Time": 17.64808313548565} +{"Full-pretrain/Learning Rate": 1.230686716914583e-05, "Full-pretrain/Loss": 1.9241526126861572, "Full-pretrain/Loss (Raw)": 2.0212974548339844, "Full-pretrain/Step": 6479, "Full-pretrain/Step Time": 17.646631710231304} +{"Full-pretrain/Learning Rate": 1.229955292353401e-05, "Full-pretrain/Loss": 1.909364938735962, "Full-pretrain/Loss (Raw)": 1.4806548357009888, "Full-pretrain/Step": 6480, "Full-pretrain/Step Time": 17.654578123241663} +{"Full-pretrain/Learning Rate": 1.22922401429143e-05, "Full-pretrain/Loss": 1.8947041034698486, "Full-pretrain/Loss (Raw)": 1.6588976383209229, "Full-pretrain/Step": 6481, "Full-pretrain/Step Time": 17.655521282926202} +{"Full-pretrain/Learning Rate": 1.228492882813023e-05, "Full-pretrain/Loss": 1.8984580039978027, "Full-pretrain/Loss (Raw)": 2.0580687522888184, "Full-pretrain/Step": 6482, "Full-pretrain/Step Time": 17.653980318456888} +{"Full-pretrain/Learning Rate": 1.2277618980025141e-05, "Full-pretrain/Loss": 1.8751965761184692, "Full-pretrain/Loss (Raw)": 1.7646459341049194, "Full-pretrain/Step": 6483, "Full-pretrain/Step Time": 17.65711443684995} +{"Full-pretrain/Learning Rate": 1.2270310599442234e-05, "Full-pretrain/Loss": 1.8713444471359253, "Full-pretrain/Loss (Raw)": 1.8836727142333984, "Full-pretrain/Step": 6484, "Full-pretrain/Step Time": 17.65966630168259} +{"Full-pretrain/Learning Rate": 1.2263003687224524e-05, "Full-pretrain/Loss": 1.8710182905197144, "Full-pretrain/Loss (Raw)": 1.9796805381774902, "Full-pretrain/Step": 6485, "Full-pretrain/Step Time": 17.658550949767232} +{"Full-pretrain/Learning Rate": 1.2255698244214864e-05, "Full-pretrain/Loss": 1.8656151294708252, "Full-pretrain/Loss (Raw)": 1.976740837097168, "Full-pretrain/Step": 6486, "Full-pretrain/Step Time": 17.668732691556215} +{"Full-pretrain/Learning Rate": 1.2248394271255942e-05, "Full-pretrain/Loss": 1.8573400974273682, "Full-pretrain/Loss (Raw)": 1.9190397262573242, "Full-pretrain/Step": 6487, "Full-pretrain/Step Time": 17.671971617266536} +{"Full-pretrain/Learning Rate": 1.224109176919025e-05, "Full-pretrain/Loss": 1.8619041442871094, "Full-pretrain/Loss (Raw)": 1.998382329940796, "Full-pretrain/Step": 6488, "Full-pretrain/Step Time": 17.672388369217515} +{"Full-pretrain/Learning Rate": 1.223379073886014e-05, "Full-pretrain/Loss": 1.858263373374939, "Full-pretrain/Loss (Raw)": 1.7395386695861816, "Full-pretrain/Step": 6489, "Full-pretrain/Step Time": 17.672822093591094} +{"Full-pretrain/Learning Rate": 1.222649118110778e-05, "Full-pretrain/Loss": 1.8679885864257812, "Full-pretrain/Loss (Raw)": 1.8768000602722168, "Full-pretrain/Step": 6490, "Full-pretrain/Step Time": 17.67746158875525} +{"Full-pretrain/Learning Rate": 1.2219193096775172e-05, "Full-pretrain/Loss": 1.87274169921875, "Full-pretrain/Loss (Raw)": 1.9578410387039185, "Full-pretrain/Step": 6491, "Full-pretrain/Step Time": 17.677230266854167} +{"Full-pretrain/Learning Rate": 1.2211896486704152e-05, "Full-pretrain/Loss": 1.8641177415847778, "Full-pretrain/Loss (Raw)": 1.7068815231323242, "Full-pretrain/Step": 6492, "Full-pretrain/Step Time": 17.671655220910907} +{"Full-pretrain/Learning Rate": 1.2204601351736385e-05, "Full-pretrain/Loss": 1.864000678062439, "Full-pretrain/Loss (Raw)": 1.893530011177063, "Full-pretrain/Step": 6493, "Full-pretrain/Step Time": 17.674776097759604} +{"Full-pretrain/Learning Rate": 1.2197307692713348e-05, "Full-pretrain/Loss": 1.8648433685302734, "Full-pretrain/Loss (Raw)": 1.8887073993682861, "Full-pretrain/Step": 6494, "Full-pretrain/Step Time": 17.676279336214066} +{"Full-pretrain/Learning Rate": 1.2190015510476379e-05, "Full-pretrain/Loss": 1.8702290058135986, "Full-pretrain/Loss (Raw)": 2.0642311573028564, "Full-pretrain/Step": 6495, "Full-pretrain/Step Time": 17.675121868029237} +{"Full-pretrain/Learning Rate": 1.2182724805866607e-05, "Full-pretrain/Loss": 1.8611044883728027, "Full-pretrain/Loss (Raw)": 1.6687071323394775, "Full-pretrain/Step": 6496, "Full-pretrain/Step Time": 17.66971717402339} +{"Full-pretrain/Learning Rate": 1.2175435579725029e-05, "Full-pretrain/Loss": 1.8725948333740234, "Full-pretrain/Loss (Raw)": 2.1293346881866455, "Full-pretrain/Step": 6497, "Full-pretrain/Step Time": 17.665104400366545} +{"Full-pretrain/Learning Rate": 1.2168147832892457e-05, "Full-pretrain/Loss": 1.855026364326477, "Full-pretrain/Loss (Raw)": 1.5443328619003296, "Full-pretrain/Step": 6498, "Full-pretrain/Step Time": 17.66664319485426} +{"Full-pretrain/Learning Rate": 1.2160861566209512e-05, "Full-pretrain/Loss": 1.872545599937439, "Full-pretrain/Loss (Raw)": 2.1734511852264404, "Full-pretrain/Step": 6499, "Full-pretrain/Step Time": 17.66777502000332} +{"Full-pretrain/Learning Rate": 1.2153576780516674e-05, "Full-pretrain/Loss": 1.8786509037017822, "Full-pretrain/Loss (Raw)": 1.9766819477081299, "Full-pretrain/Step": 6500, "Full-pretrain/Step Time": 17.667804704979062} +{"Full-pretrain/Learning Rate": 1.2146293476654242e-05, "Full-pretrain/Loss": 1.8795686960220337, "Full-pretrain/Loss (Raw)": 1.9412692785263062, "Full-pretrain/Step": 6501, "Full-pretrain/Step Time": 17.666501639410853} +{"Full-pretrain/Learning Rate": 1.2139011655462337e-05, "Full-pretrain/Loss": 1.871757984161377, "Full-pretrain/Loss (Raw)": 1.8581570386886597, "Full-pretrain/Step": 6502, "Full-pretrain/Step Time": 17.673894366249442} +{"Full-pretrain/Learning Rate": 1.2131731317780932e-05, "Full-pretrain/Loss": 1.8772884607315063, "Full-pretrain/Loss (Raw)": 1.9912407398223877, "Full-pretrain/Step": 6503, "Full-pretrain/Step Time": 17.66734296642244} +{"Full-pretrain/Learning Rate": 1.2124452464449784e-05, "Full-pretrain/Loss": 1.8712151050567627, "Full-pretrain/Loss (Raw)": 1.9239612817764282, "Full-pretrain/Step": 6504, "Full-pretrain/Step Time": 17.670390648767352} +{"Full-pretrain/Learning Rate": 1.211717509630852e-05, "Full-pretrain/Loss": 1.8702634572982788, "Full-pretrain/Loss (Raw)": 1.7306997776031494, "Full-pretrain/Step": 6505, "Full-pretrain/Step Time": 17.671211265027523} +{"Full-pretrain/Learning Rate": 1.2109899214196582e-05, "Full-pretrain/Loss": 1.873790979385376, "Full-pretrain/Loss (Raw)": 2.0710811614990234, "Full-pretrain/Step": 6506, "Full-pretrain/Step Time": 17.674210721626878} +{"Full-pretrain/Learning Rate": 1.210262481895324e-05, "Full-pretrain/Loss": 1.8769186735153198, "Full-pretrain/Loss (Raw)": 2.0200653076171875, "Full-pretrain/Step": 6507, "Full-pretrain/Step Time": 17.67266902886331} +{"Full-pretrain/Learning Rate": 1.2095351911417599e-05, "Full-pretrain/Loss": 1.8877995014190674, "Full-pretrain/Loss (Raw)": 1.9901210069656372, "Full-pretrain/Step": 6508, "Full-pretrain/Step Time": 17.682950360700488} +{"Full-pretrain/Learning Rate": 1.2088080492428574e-05, "Full-pretrain/Loss": 1.8912420272827148, "Full-pretrain/Loss (Raw)": 1.890277624130249, "Full-pretrain/Step": 6509, "Full-pretrain/Step Time": 17.679175628349185} +{"Full-pretrain/Learning Rate": 1.2080810562824927e-05, "Full-pretrain/Loss": 1.8936612606048584, "Full-pretrain/Loss (Raw)": 1.8191709518432617, "Full-pretrain/Step": 6510, "Full-pretrain/Step Time": 17.6811511144042} +{"Full-pretrain/Learning Rate": 1.2073542123445239e-05, "Full-pretrain/Loss": 1.8892606496810913, "Full-pretrain/Loss (Raw)": 1.8804751634597778, "Full-pretrain/Step": 6511, "Full-pretrain/Step Time": 17.676581474021077} +{"Full-pretrain/Learning Rate": 1.2066275175127936e-05, "Full-pretrain/Loss": 1.9036836624145508, "Full-pretrain/Loss (Raw)": 1.942195177078247, "Full-pretrain/Step": 6512, "Full-pretrain/Step Time": 17.679901065304875} +{"Full-pretrain/Learning Rate": 1.2059009718711234e-05, "Full-pretrain/Loss": 1.9178524017333984, "Full-pretrain/Loss (Raw)": 2.1122961044311523, "Full-pretrain/Step": 6513, "Full-pretrain/Step Time": 17.678253458812833} +{"Full-pretrain/Learning Rate": 1.2051745755033226e-05, "Full-pretrain/Loss": 1.9126124382019043, "Full-pretrain/Loss (Raw)": 1.8903878927230835, "Full-pretrain/Step": 6514, "Full-pretrain/Step Time": 17.680509142577648} +{"Full-pretrain/Learning Rate": 1.2044483284931785e-05, "Full-pretrain/Loss": 1.9185409545898438, "Full-pretrain/Loss (Raw)": 1.95435631275177, "Full-pretrain/Step": 6515, "Full-pretrain/Step Time": 17.676757223904133} +{"Full-pretrain/Learning Rate": 1.2037222309244642e-05, "Full-pretrain/Loss": 1.9189958572387695, "Full-pretrain/Loss (Raw)": 1.898228406906128, "Full-pretrain/Step": 6516, "Full-pretrain/Step Time": 17.67247986793518} +{"Full-pretrain/Learning Rate": 1.2029962828809351e-05, "Full-pretrain/Loss": 1.9266750812530518, "Full-pretrain/Loss (Raw)": 2.225419521331787, "Full-pretrain/Step": 6517, "Full-pretrain/Step Time": 17.68022369965911} +{"Full-pretrain/Learning Rate": 1.202270484446329e-05, "Full-pretrain/Loss": 1.9223995208740234, "Full-pretrain/Loss (Raw)": 1.83992338180542, "Full-pretrain/Step": 6518, "Full-pretrain/Step Time": 17.672254044562578} +{"Full-pretrain/Learning Rate": 1.2015448357043674e-05, "Full-pretrain/Loss": 1.9241501092910767, "Full-pretrain/Loss (Raw)": 1.9750571250915527, "Full-pretrain/Step": 6519, "Full-pretrain/Step Time": 17.676006888970733} +{"Full-pretrain/Learning Rate": 1.2008193367387519e-05, "Full-pretrain/Loss": 1.9230161905288696, "Full-pretrain/Loss (Raw)": 1.9620954990386963, "Full-pretrain/Step": 6520, "Full-pretrain/Step Time": 17.667680982500315} +{"Full-pretrain/Learning Rate": 1.200093987633169e-05, "Full-pretrain/Loss": 1.9282526969909668, "Full-pretrain/Loss (Raw)": 1.907109022140503, "Full-pretrain/Step": 6521, "Full-pretrain/Step Time": 17.667912375181913} +{"Full-pretrain/Learning Rate": 1.1993687884712882e-05, "Full-pretrain/Loss": 1.9269018173217773, "Full-pretrain/Loss (Raw)": 1.8335707187652588, "Full-pretrain/Step": 6522, "Full-pretrain/Step Time": 17.666037069633603} +{"Full-pretrain/Learning Rate": 1.1986437393367604e-05, "Full-pretrain/Loss": 1.9220037460327148, "Full-pretrain/Loss (Raw)": 1.8011012077331543, "Full-pretrain/Step": 6523, "Full-pretrain/Step Time": 17.664566976949573} +{"Full-pretrain/Learning Rate": 1.1979188403132208e-05, "Full-pretrain/Loss": 1.9224648475646973, "Full-pretrain/Loss (Raw)": 1.7216393947601318, "Full-pretrain/Step": 6524, "Full-pretrain/Step Time": 17.66400064714253} +{"Full-pretrain/Learning Rate": 1.1971940914842845e-05, "Full-pretrain/Loss": 1.9282147884368896, "Full-pretrain/Loss (Raw)": 2.0775272846221924, "Full-pretrain/Step": 6525, "Full-pretrain/Step Time": 17.664979871362448} +{"Full-pretrain/Learning Rate": 1.1964694929335518e-05, "Full-pretrain/Loss": 1.918595790863037, "Full-pretrain/Loss (Raw)": 1.580899715423584, "Full-pretrain/Step": 6526, "Full-pretrain/Step Time": 17.67143259756267} +{"Full-pretrain/Learning Rate": 1.195745044744605e-05, "Full-pretrain/Loss": 1.915421485900879, "Full-pretrain/Loss (Raw)": 1.9626511335372925, "Full-pretrain/Step": 6527, "Full-pretrain/Step Time": 17.668467666953802} +{"Full-pretrain/Learning Rate": 1.1950207470010102e-05, "Full-pretrain/Loss": 1.925036907196045, "Full-pretrain/Loss (Raw)": 1.9764052629470825, "Full-pretrain/Step": 6528, "Full-pretrain/Step Time": 17.672204952687025} +{"Full-pretrain/Learning Rate": 1.1942965997863123e-05, "Full-pretrain/Loss": 1.918755292892456, "Full-pretrain/Loss (Raw)": 1.9283220767974854, "Full-pretrain/Step": 6529, "Full-pretrain/Step Time": 17.6724397521466} +{"Full-pretrain/Learning Rate": 1.193572603184044e-05, "Full-pretrain/Loss": 1.9392063617706299, "Full-pretrain/Loss (Raw)": 2.1987671852111816, "Full-pretrain/Step": 6530, "Full-pretrain/Step Time": 17.672761868685484} +{"Full-pretrain/Learning Rate": 1.1928487572777159e-05, "Full-pretrain/Loss": 1.9339478015899658, "Full-pretrain/Loss (Raw)": 2.0051751136779785, "Full-pretrain/Step": 6531, "Full-pretrain/Step Time": 17.6688150446862} +{"Full-pretrain/Learning Rate": 1.192125062150824e-05, "Full-pretrain/Loss": 1.9283086061477661, "Full-pretrain/Loss (Raw)": 1.796230673789978, "Full-pretrain/Step": 6532, "Full-pretrain/Step Time": 17.668256036937237} +{"Full-pretrain/Learning Rate": 1.1914015178868468e-05, "Full-pretrain/Loss": 1.931036114692688, "Full-pretrain/Loss (Raw)": 2.0285494327545166, "Full-pretrain/Step": 6533, "Full-pretrain/Step Time": 17.67255813255906} +{"Full-pretrain/Learning Rate": 1.1906781245692444e-05, "Full-pretrain/Loss": 1.925628662109375, "Full-pretrain/Loss (Raw)": 1.6851186752319336, "Full-pretrain/Step": 6534, "Full-pretrain/Step Time": 17.676456231623888} +{"Full-pretrain/Learning Rate": 1.1899548822814613e-05, "Full-pretrain/Loss": 1.9244307279586792, "Full-pretrain/Loss (Raw)": 1.9529078006744385, "Full-pretrain/Step": 6535, "Full-pretrain/Step Time": 17.673037072643638} +{"Full-pretrain/Learning Rate": 1.1892317911069212e-05, "Full-pretrain/Loss": 1.9268746376037598, "Full-pretrain/Loss (Raw)": 2.002166271209717, "Full-pretrain/Step": 6536, "Full-pretrain/Step Time": 17.671249601989985} +{"Full-pretrain/Learning Rate": 1.1885088511290332e-05, "Full-pretrain/Loss": 1.9356555938720703, "Full-pretrain/Loss (Raw)": 2.011688709259033, "Full-pretrain/Step": 6537, "Full-pretrain/Step Time": 17.681613381952047} +{"Full-pretrain/Learning Rate": 1.1877860624311887e-05, "Full-pretrain/Loss": 1.932558536529541, "Full-pretrain/Loss (Raw)": 1.9719765186309814, "Full-pretrain/Step": 6538, "Full-pretrain/Step Time": 17.682947082445025} +{"Full-pretrain/Learning Rate": 1.1870634250967605e-05, "Full-pretrain/Loss": 1.9328069686889648, "Full-pretrain/Loss (Raw)": 2.0280141830444336, "Full-pretrain/Step": 6539, "Full-pretrain/Step Time": 17.679407604038715} +{"Full-pretrain/Learning Rate": 1.1863409392091057e-05, "Full-pretrain/Loss": 1.9400866031646729, "Full-pretrain/Loss (Raw)": 2.2230687141418457, "Full-pretrain/Step": 6540, "Full-pretrain/Step Time": 17.667538836598396} +{"Full-pretrain/Learning Rate": 1.1856186048515611e-05, "Full-pretrain/Loss": 1.9338916540145874, "Full-pretrain/Loss (Raw)": 1.6920393705368042, "Full-pretrain/Step": 6541, "Full-pretrain/Step Time": 17.676138853654265} +{"Full-pretrain/Learning Rate": 1.1848964221074486e-05, "Full-pretrain/Loss": 1.934333086013794, "Full-pretrain/Loss (Raw)": 1.8332984447479248, "Full-pretrain/Step": 6542, "Full-pretrain/Step Time": 17.678935255855322} +{"Full-pretrain/Learning Rate": 1.1841743910600713e-05, "Full-pretrain/Loss": 1.9279407262802124, "Full-pretrain/Loss (Raw)": 1.675917387008667, "Full-pretrain/Step": 6543, "Full-pretrain/Step Time": 17.68172292597592} +{"Full-pretrain/Learning Rate": 1.183452511792717e-05, "Full-pretrain/Loss": 1.9282493591308594, "Full-pretrain/Loss (Raw)": 1.9520704746246338, "Full-pretrain/Step": 6544, "Full-pretrain/Step Time": 17.672123989090323} +{"Full-pretrain/Learning Rate": 1.1827307843886515e-05, "Full-pretrain/Loss": 1.9253931045532227, "Full-pretrain/Loss (Raw)": 2.0209007263183594, "Full-pretrain/Step": 6545, "Full-pretrain/Step Time": 17.674847370013595} +{"Full-pretrain/Learning Rate": 1.182009208931128e-05, "Full-pretrain/Loss": 1.9193378686904907, "Full-pretrain/Loss (Raw)": 1.6966204643249512, "Full-pretrain/Step": 6546, "Full-pretrain/Step Time": 17.681169535964727} +{"Full-pretrain/Learning Rate": 1.1812877855033782e-05, "Full-pretrain/Loss": 1.9246071577072144, "Full-pretrain/Loss (Raw)": 2.1229705810546875, "Full-pretrain/Step": 6547, "Full-pretrain/Step Time": 17.675464449450374} +{"Full-pretrain/Learning Rate": 1.1805665141886191e-05, "Full-pretrain/Loss": 1.9267688989639282, "Full-pretrain/Loss (Raw)": 1.967406988143921, "Full-pretrain/Step": 6548, "Full-pretrain/Step Time": 17.675079038366675} +{"Full-pretrain/Learning Rate": 1.1798453950700488e-05, "Full-pretrain/Loss": 1.9116876125335693, "Full-pretrain/Loss (Raw)": 1.7428178787231445, "Full-pretrain/Step": 6549, "Full-pretrain/Step Time": 17.676235744729638} +{"Full-pretrain/Learning Rate": 1.1791244282308484e-05, "Full-pretrain/Loss": 1.9149138927459717, "Full-pretrain/Loss (Raw)": 1.9431641101837158, "Full-pretrain/Step": 6550, "Full-pretrain/Step Time": 17.681038077920675} +{"Full-pretrain/Learning Rate": 1.1784036137541818e-05, "Full-pretrain/Loss": 1.9109249114990234, "Full-pretrain/Loss (Raw)": 1.8474090099334717, "Full-pretrain/Step": 6551, "Full-pretrain/Step Time": 17.676373288035393} +{"Full-pretrain/Learning Rate": 1.177682951723193e-05, "Full-pretrain/Loss": 1.9020206928253174, "Full-pretrain/Loss (Raw)": 1.6771597862243652, "Full-pretrain/Step": 6552, "Full-pretrain/Step Time": 17.673121387138963} +{"Full-pretrain/Learning Rate": 1.176962442221011e-05, "Full-pretrain/Loss": 1.9061932563781738, "Full-pretrain/Loss (Raw)": 2.0406322479248047, "Full-pretrain/Step": 6553, "Full-pretrain/Step Time": 17.673607360571623} +{"Full-pretrain/Learning Rate": 1.1762420853307463e-05, "Full-pretrain/Loss": 1.9150190353393555, "Full-pretrain/Loss (Raw)": 2.115995407104492, "Full-pretrain/Step": 6554, "Full-pretrain/Step Time": 17.675768984481692} +{"Full-pretrain/Learning Rate": 1.1755218811354918e-05, "Full-pretrain/Loss": 1.9186136722564697, "Full-pretrain/Loss (Raw)": 1.9161313772201538, "Full-pretrain/Step": 6555, "Full-pretrain/Step Time": 17.67821018770337} +{"Full-pretrain/Learning Rate": 1.1748018297183238e-05, "Full-pretrain/Loss": 1.9237871170043945, "Full-pretrain/Loss (Raw)": 1.8871854543685913, "Full-pretrain/Step": 6556, "Full-pretrain/Step Time": 17.67766036465764} +{"Full-pretrain/Learning Rate": 1.1740819311622982e-05, "Full-pretrain/Loss": 1.917046070098877, "Full-pretrain/Loss (Raw)": 1.8618158102035522, "Full-pretrain/Step": 6557, "Full-pretrain/Step Time": 17.682480540126562} +{"Full-pretrain/Learning Rate": 1.1733621855504559e-05, "Full-pretrain/Loss": 1.9284570217132568, "Full-pretrain/Loss (Raw)": 1.946048617362976, "Full-pretrain/Step": 6558, "Full-pretrain/Step Time": 17.67684897966683} +{"Full-pretrain/Learning Rate": 1.1726425929658194e-05, "Full-pretrain/Loss": 1.9295322895050049, "Full-pretrain/Loss (Raw)": 1.9970600605010986, "Full-pretrain/Step": 6559, "Full-pretrain/Step Time": 17.68070350214839} +{"Full-pretrain/Learning Rate": 1.1719231534913933e-05, "Full-pretrain/Loss": 1.9217426776885986, "Full-pretrain/Loss (Raw)": 1.7271379232406616, "Full-pretrain/Step": 6560, "Full-pretrain/Step Time": 17.67400841228664} +{"Full-pretrain/Learning Rate": 1.1712038672101654e-05, "Full-pretrain/Loss": 1.9300663471221924, "Full-pretrain/Loss (Raw)": 2.194681167602539, "Full-pretrain/Step": 6561, "Full-pretrain/Step Time": 17.671077389270067} +{"Full-pretrain/Learning Rate": 1.1704847342051037e-05, "Full-pretrain/Loss": 1.9023128747940063, "Full-pretrain/Loss (Raw)": 1.3106530904769897, "Full-pretrain/Step": 6562, "Full-pretrain/Step Time": 17.674086652696133} +{"Full-pretrain/Learning Rate": 1.1697657545591615e-05, "Full-pretrain/Loss": 1.901224136352539, "Full-pretrain/Loss (Raw)": 1.9703388214111328, "Full-pretrain/Step": 6563, "Full-pretrain/Step Time": 17.675792403519154} +{"Full-pretrain/Learning Rate": 1.1690469283552713e-05, "Full-pretrain/Loss": 1.9022128582000732, "Full-pretrain/Loss (Raw)": 1.8278707265853882, "Full-pretrain/Step": 6564, "Full-pretrain/Step Time": 17.67616157606244} +{"Full-pretrain/Learning Rate": 1.16832825567635e-05, "Full-pretrain/Loss": 1.8991292715072632, "Full-pretrain/Loss (Raw)": 1.9298713207244873, "Full-pretrain/Step": 6565, "Full-pretrain/Step Time": 17.67830359376967} +{"Full-pretrain/Learning Rate": 1.1676097366052974e-05, "Full-pretrain/Loss": 1.9019434452056885, "Full-pretrain/Loss (Raw)": 1.7751747369766235, "Full-pretrain/Step": 6566, "Full-pretrain/Step Time": 17.681769905611873} +{"Full-pretrain/Learning Rate": 1.1668913712249924e-05, "Full-pretrain/Loss": 1.9021039009094238, "Full-pretrain/Loss (Raw)": 1.958040475845337, "Full-pretrain/Step": 6567, "Full-pretrain/Step Time": 17.686487019062042} +{"Full-pretrain/Learning Rate": 1.1661731596182995e-05, "Full-pretrain/Loss": 1.8948395252227783, "Full-pretrain/Loss (Raw)": 1.7697086334228516, "Full-pretrain/Step": 6568, "Full-pretrain/Step Time": 17.680238300934434} +{"Full-pretrain/Learning Rate": 1.1654551018680637e-05, "Full-pretrain/Loss": 1.8958170413970947, "Full-pretrain/Loss (Raw)": 2.042965888977051, "Full-pretrain/Step": 6569, "Full-pretrain/Step Time": 17.681869151070714} +{"Full-pretrain/Learning Rate": 1.164737198057113e-05, "Full-pretrain/Loss": 1.881898045539856, "Full-pretrain/Loss (Raw)": 1.5265700817108154, "Full-pretrain/Step": 6570, "Full-pretrain/Step Time": 17.67942943237722} +{"Full-pretrain/Learning Rate": 1.1640194482682573e-05, "Full-pretrain/Loss": 1.881323218345642, "Full-pretrain/Loss (Raw)": 2.009617328643799, "Full-pretrain/Step": 6571, "Full-pretrain/Step Time": 17.685488982126117} +{"Full-pretrain/Learning Rate": 1.1633018525842895e-05, "Full-pretrain/Loss": 1.8698539733886719, "Full-pretrain/Loss (Raw)": 1.8560556173324585, "Full-pretrain/Step": 6572, "Full-pretrain/Step Time": 17.683586962521076} +{"Full-pretrain/Learning Rate": 1.1625844110879825e-05, "Full-pretrain/Loss": 1.8794649839401245, "Full-pretrain/Loss (Raw)": 1.999589204788208, "Full-pretrain/Step": 6573, "Full-pretrain/Step Time": 17.68539549037814} +{"Full-pretrain/Learning Rate": 1.1618671238620938e-05, "Full-pretrain/Loss": 1.8822280168533325, "Full-pretrain/Loss (Raw)": 1.9217160940170288, "Full-pretrain/Step": 6574, "Full-pretrain/Step Time": 17.687953600659966} +{"Full-pretrain/Learning Rate": 1.1611499909893616e-05, "Full-pretrain/Loss": 1.8924366235733032, "Full-pretrain/Loss (Raw)": 2.002591848373413, "Full-pretrain/Step": 6575, "Full-pretrain/Step Time": 17.692656736820936} +{"Full-pretrain/Learning Rate": 1.1604330125525079e-05, "Full-pretrain/Loss": 1.8878053426742554, "Full-pretrain/Loss (Raw)": 1.8038699626922607, "Full-pretrain/Step": 6576, "Full-pretrain/Step Time": 17.686617620289326} +{"Full-pretrain/Learning Rate": 1.1597161886342362e-05, "Full-pretrain/Loss": 1.8815932273864746, "Full-pretrain/Loss (Raw)": 1.8221114873886108, "Full-pretrain/Step": 6577, "Full-pretrain/Step Time": 17.687869530171156} +{"Full-pretrain/Learning Rate": 1.1589995193172303e-05, "Full-pretrain/Loss": 1.8906779289245605, "Full-pretrain/Loss (Raw)": 1.9873311519622803, "Full-pretrain/Step": 6578, "Full-pretrain/Step Time": 17.696840081363916} +{"Full-pretrain/Learning Rate": 1.1582830046841595e-05, "Full-pretrain/Loss": 1.8862497806549072, "Full-pretrain/Loss (Raw)": 1.9812703132629395, "Full-pretrain/Step": 6579, "Full-pretrain/Step Time": 17.698759565129876} +{"Full-pretrain/Learning Rate": 1.1575666448176717e-05, "Full-pretrain/Loss": 1.8871721029281616, "Full-pretrain/Loss (Raw)": 1.996920108795166, "Full-pretrain/Step": 6580, "Full-pretrain/Step Time": 17.698904329910874} +{"Full-pretrain/Learning Rate": 1.1568504398003996e-05, "Full-pretrain/Loss": 1.8884365558624268, "Full-pretrain/Loss (Raw)": 1.7832820415496826, "Full-pretrain/Step": 6581, "Full-pretrain/Step Time": 17.699670048430562} +{"Full-pretrain/Learning Rate": 1.1561343897149583e-05, "Full-pretrain/Loss": 1.8904927968978882, "Full-pretrain/Loss (Raw)": 2.0089657306671143, "Full-pretrain/Step": 6582, "Full-pretrain/Step Time": 17.700759075582027} +{"Full-pretrain/Learning Rate": 1.1554184946439417e-05, "Full-pretrain/Loss": 1.8913847208023071, "Full-pretrain/Loss (Raw)": 1.8759477138519287, "Full-pretrain/Step": 6583, "Full-pretrain/Step Time": 17.70608587935567} +{"Full-pretrain/Learning Rate": 1.1547027546699293e-05, "Full-pretrain/Loss": 1.909315824508667, "Full-pretrain/Loss (Raw)": 2.2509565353393555, "Full-pretrain/Step": 6584, "Full-pretrain/Step Time": 17.698815397918224} +{"Full-pretrain/Learning Rate": 1.1539871698754814e-05, "Full-pretrain/Loss": 1.899423599243164, "Full-pretrain/Loss (Raw)": 1.724084496498108, "Full-pretrain/Step": 6585, "Full-pretrain/Step Time": 17.69998207874596} +{"Full-pretrain/Learning Rate": 1.1532717403431403e-05, "Full-pretrain/Loss": 1.890921950340271, "Full-pretrain/Loss (Raw)": 1.843941330909729, "Full-pretrain/Step": 6586, "Full-pretrain/Step Time": 17.704182893037796} +{"Full-pretrain/Learning Rate": 1.152556466155432e-05, "Full-pretrain/Loss": 1.889188289642334, "Full-pretrain/Loss (Raw)": 1.8606537580490112, "Full-pretrain/Step": 6587, "Full-pretrain/Step Time": 17.707373743876815} +{"Full-pretrain/Learning Rate": 1.1518413473948606e-05, "Full-pretrain/Loss": 1.8932037353515625, "Full-pretrain/Loss (Raw)": 2.0156803131103516, "Full-pretrain/Step": 6588, "Full-pretrain/Step Time": 17.70846643857658} +{"Full-pretrain/Learning Rate": 1.151126384143916e-05, "Full-pretrain/Loss": 1.8838011026382446, "Full-pretrain/Loss (Raw)": 1.5609294176101685, "Full-pretrain/Step": 6589, "Full-pretrain/Step Time": 17.70749964378774} +{"Full-pretrain/Learning Rate": 1.150411576485069e-05, "Full-pretrain/Loss": 1.8811819553375244, "Full-pretrain/Loss (Raw)": 1.862236738204956, "Full-pretrain/Step": 6590, "Full-pretrain/Step Time": 17.709225663915277} +{"Full-pretrain/Learning Rate": 1.1496969245007721e-05, "Full-pretrain/Loss": 1.8722004890441895, "Full-pretrain/Loss (Raw)": 1.7096543312072754, "Full-pretrain/Step": 6591, "Full-pretrain/Step Time": 17.713524293154478} +{"Full-pretrain/Learning Rate": 1.1489824282734609e-05, "Full-pretrain/Loss": 1.8755533695220947, "Full-pretrain/Loss (Raw)": 1.834428071975708, "Full-pretrain/Step": 6592, "Full-pretrain/Step Time": 17.70749617367983} +{"Full-pretrain/Learning Rate": 1.1482680878855526e-05, "Full-pretrain/Loss": 1.8759346008300781, "Full-pretrain/Loss (Raw)": 2.206879138946533, "Full-pretrain/Step": 6593, "Full-pretrain/Step Time": 17.703636936843395} +{"Full-pretrain/Learning Rate": 1.1475539034194443e-05, "Full-pretrain/Loss": 1.8993635177612305, "Full-pretrain/Loss (Raw)": 2.060382127761841, "Full-pretrain/Step": 6594, "Full-pretrain/Step Time": 17.70391657948494} +{"Full-pretrain/Learning Rate": 1.1468398749575188e-05, "Full-pretrain/Loss": 1.901656150817871, "Full-pretrain/Loss (Raw)": 2.0437028408050537, "Full-pretrain/Step": 6595, "Full-pretrain/Step Time": 17.70201463252306} +{"Full-pretrain/Learning Rate": 1.1461260025821375e-05, "Full-pretrain/Loss": 1.9038573503494263, "Full-pretrain/Loss (Raw)": 1.8983062505722046, "Full-pretrain/Step": 6596, "Full-pretrain/Step Time": 17.69323816522956} +{"Full-pretrain/Learning Rate": 1.1454122863756459e-05, "Full-pretrain/Loss": 1.8963007926940918, "Full-pretrain/Loss (Raw)": 1.688061237335205, "Full-pretrain/Step": 6597, "Full-pretrain/Step Time": 17.69476019591093} +{"Full-pretrain/Learning Rate": 1.144698726420372e-05, "Full-pretrain/Loss": 1.8981261253356934, "Full-pretrain/Loss (Raw)": 1.8335895538330078, "Full-pretrain/Step": 6598, "Full-pretrain/Step Time": 17.692839732393622} +{"Full-pretrain/Learning Rate": 1.1439853227986228e-05, "Full-pretrain/Loss": 1.8984363079071045, "Full-pretrain/Loss (Raw)": 1.967961311340332, "Full-pretrain/Step": 6599, "Full-pretrain/Step Time": 17.69366613216698} +{"Full-pretrain/Learning Rate": 1.1432720755926898e-05, "Full-pretrain/Loss": 1.9137917757034302, "Full-pretrain/Loss (Raw)": 2.2610867023468018, "Full-pretrain/Step": 6600, "Full-pretrain/Step Time": 17.692902008071542} +{"Full-pretrain/Learning Rate": 1.1425589848848464e-05, "Full-pretrain/Loss": 1.905733585357666, "Full-pretrain/Loss (Raw)": 1.7851037979125977, "Full-pretrain/Step": 6601, "Full-pretrain/Step Time": 17.687632394954562} +{"Full-pretrain/Learning Rate": 1.141846050757347e-05, "Full-pretrain/Loss": 1.9103010892868042, "Full-pretrain/Loss (Raw)": 1.672728180885315, "Full-pretrain/Step": 6602, "Full-pretrain/Step Time": 17.685258027166128} +{"Full-pretrain/Learning Rate": 1.1411332732924293e-05, "Full-pretrain/Loss": 1.9081337451934814, "Full-pretrain/Loss (Raw)": 1.9402611255645752, "Full-pretrain/Step": 6603, "Full-pretrain/Step Time": 17.68610762618482} +{"Full-pretrain/Learning Rate": 1.1404206525723103e-05, "Full-pretrain/Loss": 1.9132063388824463, "Full-pretrain/Loss (Raw)": 2.0183820724487305, "Full-pretrain/Step": 6604, "Full-pretrain/Step Time": 17.68434078618884} +{"Full-pretrain/Learning Rate": 1.1397081886791907e-05, "Full-pretrain/Loss": 1.9139854907989502, "Full-pretrain/Loss (Raw)": 2.0245187282562256, "Full-pretrain/Step": 6605, "Full-pretrain/Step Time": 17.6758328191936} +{"Full-pretrain/Learning Rate": 1.1389958816952537e-05, "Full-pretrain/Loss": 1.911836862564087, "Full-pretrain/Loss (Raw)": 1.8529629707336426, "Full-pretrain/Step": 6606, "Full-pretrain/Step Time": 17.671082619577646} +{"Full-pretrain/Learning Rate": 1.1382837317026638e-05, "Full-pretrain/Loss": 1.9064793586730957, "Full-pretrain/Loss (Raw)": 1.8311536312103271, "Full-pretrain/Step": 6607, "Full-pretrain/Step Time": 17.67021089605987} +{"Full-pretrain/Learning Rate": 1.1375717387835675e-05, "Full-pretrain/Loss": 1.910775899887085, "Full-pretrain/Loss (Raw)": 1.9413563013076782, "Full-pretrain/Step": 6608, "Full-pretrain/Step Time": 17.66750174202025} +{"Full-pretrain/Learning Rate": 1.1368599030200913e-05, "Full-pretrain/Loss": 1.9156391620635986, "Full-pretrain/Loss (Raw)": 1.977735996246338, "Full-pretrain/Step": 6609, "Full-pretrain/Step Time": 17.659655386582017} +{"Full-pretrain/Learning Rate": 1.1361482244943463e-05, "Full-pretrain/Loss": 1.9177489280700684, "Full-pretrain/Loss (Raw)": 2.054842948913574, "Full-pretrain/Step": 6610, "Full-pretrain/Step Time": 17.6592708658427} +{"Full-pretrain/Learning Rate": 1.1354367032884244e-05, "Full-pretrain/Loss": 1.9136117696762085, "Full-pretrain/Loss (Raw)": 1.8488819599151611, "Full-pretrain/Step": 6611, "Full-pretrain/Step Time": 17.657367108389735} +{"Full-pretrain/Learning Rate": 1.1347253394844004e-05, "Full-pretrain/Loss": 1.9042294025421143, "Full-pretrain/Loss (Raw)": 1.69668710231781, "Full-pretrain/Step": 6612, "Full-pretrain/Step Time": 17.656989857554436} +{"Full-pretrain/Learning Rate": 1.1340141331643276e-05, "Full-pretrain/Loss": 1.9076108932495117, "Full-pretrain/Loss (Raw)": 1.8914847373962402, "Full-pretrain/Step": 6613, "Full-pretrain/Step Time": 17.649847779423} +{"Full-pretrain/Learning Rate": 1.1333030844102452e-05, "Full-pretrain/Loss": 1.906598448753357, "Full-pretrain/Loss (Raw)": 1.9765703678131104, "Full-pretrain/Step": 6614, "Full-pretrain/Step Time": 17.643463933840394} +{"Full-pretrain/Learning Rate": 1.1325921933041711e-05, "Full-pretrain/Loss": 1.9127877950668335, "Full-pretrain/Loss (Raw)": 2.0740036964416504, "Full-pretrain/Step": 6615, "Full-pretrain/Step Time": 17.642964718863368} +{"Full-pretrain/Learning Rate": 1.131881459928107e-05, "Full-pretrain/Loss": 1.89750337600708, "Full-pretrain/Loss (Raw)": 1.761855959892273, "Full-pretrain/Step": 6616, "Full-pretrain/Step Time": 17.641727382317185} +{"Full-pretrain/Learning Rate": 1.1311708843640354e-05, "Full-pretrain/Loss": 1.8963863849639893, "Full-pretrain/Loss (Raw)": 1.6883430480957031, "Full-pretrain/Step": 6617, "Full-pretrain/Step Time": 17.63623932003975} +{"Full-pretrain/Learning Rate": 1.1304604666939214e-05, "Full-pretrain/Loss": 1.8970388174057007, "Full-pretrain/Loss (Raw)": 1.8648184537887573, "Full-pretrain/Step": 6618, "Full-pretrain/Step Time": 17.628551306203008} +{"Full-pretrain/Learning Rate": 1.1297502069997121e-05, "Full-pretrain/Loss": 1.896862268447876, "Full-pretrain/Loss (Raw)": 1.8550045490264893, "Full-pretrain/Step": 6619, "Full-pretrain/Step Time": 17.626442469656467} +{"Full-pretrain/Learning Rate": 1.1290401053633339e-05, "Full-pretrain/Loss": 1.8985131978988647, "Full-pretrain/Loss (Raw)": 2.068507671356201, "Full-pretrain/Step": 6620, "Full-pretrain/Step Time": 17.6290099658072} +{"Full-pretrain/Learning Rate": 1.128330161866698e-05, "Full-pretrain/Loss": 1.910986304283142, "Full-pretrain/Loss (Raw)": 1.960068702697754, "Full-pretrain/Step": 6621, "Full-pretrain/Step Time": 17.62941889092326} +{"Full-pretrain/Learning Rate": 1.127620376591696e-05, "Full-pretrain/Loss": 1.914668321609497, "Full-pretrain/Loss (Raw)": 1.9800620079040527, "Full-pretrain/Step": 6622, "Full-pretrain/Step Time": 17.618629910051823} +{"Full-pretrain/Learning Rate": 1.1269107496202008e-05, "Full-pretrain/Loss": 1.9270566701889038, "Full-pretrain/Loss (Raw)": 2.106081962585449, "Full-pretrain/Step": 6623, "Full-pretrain/Step Time": 17.62206874229014} +{"Full-pretrain/Learning Rate": 1.1262012810340694e-05, "Full-pretrain/Loss": 1.9324619770050049, "Full-pretrain/Loss (Raw)": 2.0073986053466797, "Full-pretrain/Step": 6624, "Full-pretrain/Step Time": 17.630417343229055} +{"Full-pretrain/Learning Rate": 1.1254919709151365e-05, "Full-pretrain/Loss": 1.919069528579712, "Full-pretrain/Loss (Raw)": 1.778318166732788, "Full-pretrain/Step": 6625, "Full-pretrain/Step Time": 17.6347948461771} +{"Full-pretrain/Learning Rate": 1.1247828193452214e-05, "Full-pretrain/Loss": 1.9092341661453247, "Full-pretrain/Loss (Raw)": 1.745652675628662, "Full-pretrain/Step": 6626, "Full-pretrain/Step Time": 17.62570903636515} +{"Full-pretrain/Learning Rate": 1.1240738264061252e-05, "Full-pretrain/Loss": 1.9059052467346191, "Full-pretrain/Loss (Raw)": 1.937174677848816, "Full-pretrain/Step": 6627, "Full-pretrain/Step Time": 17.629512386396527} +{"Full-pretrain/Learning Rate": 1.1233649921796305e-05, "Full-pretrain/Loss": 1.9130990505218506, "Full-pretrain/Loss (Raw)": 2.128513813018799, "Full-pretrain/Step": 6628, "Full-pretrain/Step Time": 17.6338379830122} +{"Full-pretrain/Learning Rate": 1.122656316747499e-05, "Full-pretrain/Loss": 1.9160034656524658, "Full-pretrain/Loss (Raw)": 1.7809998989105225, "Full-pretrain/Step": 6629, "Full-pretrain/Step Time": 17.63510669209063} +{"Full-pretrain/Learning Rate": 1.1219478001914782e-05, "Full-pretrain/Loss": 1.9208779335021973, "Full-pretrain/Loss (Raw)": 1.9895713329315186, "Full-pretrain/Step": 6630, "Full-pretrain/Step Time": 17.633551163598895} +{"Full-pretrain/Learning Rate": 1.1212394425932936e-05, "Full-pretrain/Loss": 1.9209668636322021, "Full-pretrain/Loss (Raw)": 1.9708075523376465, "Full-pretrain/Step": 6631, "Full-pretrain/Step Time": 17.63796354830265} +{"Full-pretrain/Learning Rate": 1.120531244034655e-05, "Full-pretrain/Loss": 1.9047013521194458, "Full-pretrain/Loss (Raw)": 1.7405915260314941, "Full-pretrain/Step": 6632, "Full-pretrain/Step Time": 17.6339911185205} +{"Full-pretrain/Learning Rate": 1.1198232045972523e-05, "Full-pretrain/Loss": 1.913486361503601, "Full-pretrain/Loss (Raw)": 2.066222667694092, "Full-pretrain/Step": 6633, "Full-pretrain/Step Time": 17.637804701924324} +{"Full-pretrain/Learning Rate": 1.1191153243627577e-05, "Full-pretrain/Loss": 1.9184982776641846, "Full-pretrain/Loss (Raw)": 1.833113193511963, "Full-pretrain/Step": 6634, "Full-pretrain/Step Time": 17.629710042849183} +{"Full-pretrain/Learning Rate": 1.1184076034128266e-05, "Full-pretrain/Loss": 1.908387303352356, "Full-pretrain/Loss (Raw)": 1.6167067289352417, "Full-pretrain/Step": 6635, "Full-pretrain/Step Time": 17.62884672731161} +{"Full-pretrain/Learning Rate": 1.1177000418290917e-05, "Full-pretrain/Loss": 1.9023466110229492, "Full-pretrain/Loss (Raw)": 1.8250808715820312, "Full-pretrain/Step": 6636, "Full-pretrain/Step Time": 17.62971326522529} +{"Full-pretrain/Learning Rate": 1.1169926396931712e-05, "Full-pretrain/Loss": 1.9041416645050049, "Full-pretrain/Loss (Raw)": 2.081958770751953, "Full-pretrain/Step": 6637, "Full-pretrain/Step Time": 17.632869709283113} +{"Full-pretrain/Learning Rate": 1.1162853970866638e-05, "Full-pretrain/Loss": 1.8970081806182861, "Full-pretrain/Loss (Raw)": 1.624692678451538, "Full-pretrain/Step": 6638, "Full-pretrain/Step Time": 17.630815057083964} +{"Full-pretrain/Learning Rate": 1.1155783140911496e-05, "Full-pretrain/Loss": 1.8805395364761353, "Full-pretrain/Loss (Raw)": 1.3041566610336304, "Full-pretrain/Step": 6639, "Full-pretrain/Step Time": 17.63563984632492} +{"Full-pretrain/Learning Rate": 1.1148713907881913e-05, "Full-pretrain/Loss": 1.9036223888397217, "Full-pretrain/Loss (Raw)": 2.680009365081787, "Full-pretrain/Step": 6640, "Full-pretrain/Step Time": 17.635869869962335} +{"Full-pretrain/Learning Rate": 1.1141646272593303e-05, "Full-pretrain/Loss": 1.9078423976898193, "Full-pretrain/Loss (Raw)": 2.112771511077881, "Full-pretrain/Step": 6641, "Full-pretrain/Step Time": 17.634681751951575} +{"Full-pretrain/Learning Rate": 1.1134580235860926e-05, "Full-pretrain/Loss": 1.9012579917907715, "Full-pretrain/Loss (Raw)": 1.8441433906555176, "Full-pretrain/Step": 6642, "Full-pretrain/Step Time": 17.629232745617628} +{"Full-pretrain/Learning Rate": 1.1127515798499844e-05, "Full-pretrain/Loss": 1.9063524007797241, "Full-pretrain/Loss (Raw)": 2.0119051933288574, "Full-pretrain/Step": 6643, "Full-pretrain/Step Time": 17.628998404368758} +{"Full-pretrain/Learning Rate": 1.112045296132494e-05, "Full-pretrain/Loss": 1.9174902439117432, "Full-pretrain/Loss (Raw)": 2.0530965328216553, "Full-pretrain/Step": 6644, "Full-pretrain/Step Time": 17.637582026422024} +{"Full-pretrain/Learning Rate": 1.111339172515092e-05, "Full-pretrain/Loss": 1.9239572286605835, "Full-pretrain/Loss (Raw)": 2.098428726196289, "Full-pretrain/Step": 6645, "Full-pretrain/Step Time": 17.63307356648147} +{"Full-pretrain/Learning Rate": 1.1106332090792274e-05, "Full-pretrain/Loss": 1.9283188581466675, "Full-pretrain/Loss (Raw)": 2.116140604019165, "Full-pretrain/Step": 6646, "Full-pretrain/Step Time": 17.640274370089173} +{"Full-pretrain/Learning Rate": 1.109927405906335e-05, "Full-pretrain/Loss": 1.9309327602386475, "Full-pretrain/Loss (Raw)": 2.157651901245117, "Full-pretrain/Step": 6647, "Full-pretrain/Step Time": 17.638170290738344} +{"Full-pretrain/Learning Rate": 1.1092217630778268e-05, "Full-pretrain/Loss": 1.9377048015594482, "Full-pretrain/Loss (Raw)": 1.978559136390686, "Full-pretrain/Step": 6648, "Full-pretrain/Step Time": 17.644323881715536} +{"Full-pretrain/Learning Rate": 1.1085162806750992e-05, "Full-pretrain/Loss": 1.9440200328826904, "Full-pretrain/Loss (Raw)": 1.8904340267181396, "Full-pretrain/Step": 6649, "Full-pretrain/Step Time": 17.638291405513883} +{"Full-pretrain/Learning Rate": 1.107810958779531e-05, "Full-pretrain/Loss": 1.94053316116333, "Full-pretrain/Loss (Raw)": 1.7532320022583008, "Full-pretrain/Step": 6650, "Full-pretrain/Step Time": 17.637803798541427} +{"Full-pretrain/Learning Rate": 1.1071057974724782e-05, "Full-pretrain/Loss": 1.947100043296814, "Full-pretrain/Loss (Raw)": 2.065150499343872, "Full-pretrain/Step": 6651, "Full-pretrain/Step Time": 17.64302776195109} +{"Full-pretrain/Learning Rate": 1.1064007968352821e-05, "Full-pretrain/Loss": 1.9470467567443848, "Full-pretrain/Loss (Raw)": 2.066800117492676, "Full-pretrain/Step": 6652, "Full-pretrain/Step Time": 17.64283045195043} +{"Full-pretrain/Learning Rate": 1.1056959569492648e-05, "Full-pretrain/Loss": 1.9412310123443604, "Full-pretrain/Loss (Raw)": 1.7739661931991577, "Full-pretrain/Step": 6653, "Full-pretrain/Step Time": 17.644066432490945} +{"Full-pretrain/Learning Rate": 1.1049912778957284e-05, "Full-pretrain/Loss": 1.9461078643798828, "Full-pretrain/Loss (Raw)": 2.136121988296509, "Full-pretrain/Step": 6654, "Full-pretrain/Step Time": 17.637338092550635} +{"Full-pretrain/Learning Rate": 1.1042867597559581e-05, "Full-pretrain/Loss": 1.9378703832626343, "Full-pretrain/Loss (Raw)": 1.8424803018569946, "Full-pretrain/Step": 6655, "Full-pretrain/Step Time": 17.642171563580632} +{"Full-pretrain/Learning Rate": 1.1035824026112204e-05, "Full-pretrain/Loss": 1.939906120300293, "Full-pretrain/Loss (Raw)": 2.072539806365967, "Full-pretrain/Step": 6656, "Full-pretrain/Step Time": 17.637268332764506} +{"Full-pretrain/Learning Rate": 1.102878206542761e-05, "Full-pretrain/Loss": 1.9444934129714966, "Full-pretrain/Loss (Raw)": 1.9251132011413574, "Full-pretrain/Step": 6657, "Full-pretrain/Step Time": 17.634288653731346} +{"Full-pretrain/Learning Rate": 1.1021741716318093e-05, "Full-pretrain/Loss": 1.9494868516921997, "Full-pretrain/Loss (Raw)": 1.9054453372955322, "Full-pretrain/Step": 6658, "Full-pretrain/Step Time": 17.637121396139264} +{"Full-pretrain/Learning Rate": 1.1014702979595759e-05, "Full-pretrain/Loss": 1.953865647315979, "Full-pretrain/Loss (Raw)": 2.07729434967041, "Full-pretrain/Step": 6659, "Full-pretrain/Step Time": 17.644465371966362} +{"Full-pretrain/Learning Rate": 1.100766585607252e-05, "Full-pretrain/Loss": 1.94235098361969, "Full-pretrain/Loss (Raw)": 1.760042428970337, "Full-pretrain/Step": 6660, "Full-pretrain/Step Time": 17.643192822113633} +{"Full-pretrain/Learning Rate": 1.1000630346560117e-05, "Full-pretrain/Loss": 1.940185546875, "Full-pretrain/Loss (Raw)": 1.7117078304290771, "Full-pretrain/Step": 6661, "Full-pretrain/Step Time": 17.64421621337533} +{"Full-pretrain/Learning Rate": 1.0993596451870075e-05, "Full-pretrain/Loss": 1.9335018396377563, "Full-pretrain/Loss (Raw)": 1.7756956815719604, "Full-pretrain/Step": 6662, "Full-pretrain/Step Time": 17.640862429514527} +{"Full-pretrain/Learning Rate": 1.0986564172813768e-05, "Full-pretrain/Loss": 1.9300645589828491, "Full-pretrain/Loss (Raw)": 1.860814094543457, "Full-pretrain/Step": 6663, "Full-pretrain/Step Time": 17.649472562596202} +{"Full-pretrain/Learning Rate": 1.097953351020235e-05, "Full-pretrain/Loss": 1.9353573322296143, "Full-pretrain/Loss (Raw)": 1.9099602699279785, "Full-pretrain/Step": 6664, "Full-pretrain/Step Time": 17.653751231729984} +{"Full-pretrain/Learning Rate": 1.0972504464846817e-05, "Full-pretrain/Loss": 1.931361436843872, "Full-pretrain/Loss (Raw)": 1.938353419303894, "Full-pretrain/Step": 6665, "Full-pretrain/Step Time": 17.646288584917784} +{"Full-pretrain/Learning Rate": 1.0965477037557972e-05, "Full-pretrain/Loss": 1.9388134479522705, "Full-pretrain/Loss (Raw)": 2.0715794563293457, "Full-pretrain/Step": 6666, "Full-pretrain/Step Time": 17.64642317406833} +{"Full-pretrain/Learning Rate": 1.0958451229146408e-05, "Full-pretrain/Loss": 1.9514856338500977, "Full-pretrain/Loss (Raw)": 2.0222158432006836, "Full-pretrain/Step": 6667, "Full-pretrain/Step Time": 17.646010234951973} +{"Full-pretrain/Learning Rate": 1.0951427040422562e-05, "Full-pretrain/Loss": 1.9575426578521729, "Full-pretrain/Loss (Raw)": 2.0189037322998047, "Full-pretrain/Step": 6668, "Full-pretrain/Step Time": 17.658042773604393} +{"Full-pretrain/Learning Rate": 1.0944404472196667e-05, "Full-pretrain/Loss": 1.9496841430664062, "Full-pretrain/Loss (Raw)": 1.8304885625839233, "Full-pretrain/Step": 6669, "Full-pretrain/Step Time": 17.64991295710206} +{"Full-pretrain/Learning Rate": 1.093738352527878e-05, "Full-pretrain/Loss": 1.9612981081008911, "Full-pretrain/Loss (Raw)": 1.9963369369506836, "Full-pretrain/Step": 6670, "Full-pretrain/Step Time": 17.651571137830615} +{"Full-pretrain/Learning Rate": 1.093036420047876e-05, "Full-pretrain/Loss": 1.9769787788391113, "Full-pretrain/Loss (Raw)": 1.8059377670288086, "Full-pretrain/Step": 6671, "Full-pretrain/Step Time": 17.651918133720756} +{"Full-pretrain/Learning Rate": 1.0923346498606297e-05, "Full-pretrain/Loss": 1.9549281597137451, "Full-pretrain/Loss (Raw)": 1.974390983581543, "Full-pretrain/Step": 6672, "Full-pretrain/Step Time": 17.654495503753424} +{"Full-pretrain/Learning Rate": 1.0916330420470854e-05, "Full-pretrain/Loss": 1.9514813423156738, "Full-pretrain/Loss (Raw)": 2.0024733543395996, "Full-pretrain/Step": 6673, "Full-pretrain/Step Time": 17.65040712058544} +{"Full-pretrain/Learning Rate": 1.090931596688175e-05, "Full-pretrain/Loss": 1.9578888416290283, "Full-pretrain/Loss (Raw)": 2.0491786003112793, "Full-pretrain/Step": 6674, "Full-pretrain/Step Time": 17.650902876630425} +{"Full-pretrain/Learning Rate": 1.0902303138648098e-05, "Full-pretrain/Loss": 1.9667692184448242, "Full-pretrain/Loss (Raw)": 2.2960829734802246, "Full-pretrain/Step": 6675, "Full-pretrain/Step Time": 17.65088116377592} +{"Full-pretrain/Learning Rate": 1.0895291936578825e-05, "Full-pretrain/Loss": 1.9647842645645142, "Full-pretrain/Loss (Raw)": 1.9895764589309692, "Full-pretrain/Step": 6676, "Full-pretrain/Step Time": 17.651382245123386} +{"Full-pretrain/Learning Rate": 1.088828236148268e-05, "Full-pretrain/Loss": 1.9574497938156128, "Full-pretrain/Loss (Raw)": 1.8637281656265259, "Full-pretrain/Step": 6677, "Full-pretrain/Step Time": 17.650638492777944} +{"Full-pretrain/Learning Rate": 1.0881274414168194e-05, "Full-pretrain/Loss": 1.9541256427764893, "Full-pretrain/Loss (Raw)": 2.0097615718841553, "Full-pretrain/Step": 6678, "Full-pretrain/Step Time": 17.646890088915825} +{"Full-pretrain/Learning Rate": 1.0874268095443755e-05, "Full-pretrain/Loss": 1.9478296041488647, "Full-pretrain/Loss (Raw)": 1.9561853408813477, "Full-pretrain/Step": 6679, "Full-pretrain/Step Time": 17.650059400126338} +{"Full-pretrain/Learning Rate": 1.0867263406117515e-05, "Full-pretrain/Loss": 1.9478579759597778, "Full-pretrain/Loss (Raw)": 1.9794652462005615, "Full-pretrain/Step": 6680, "Full-pretrain/Step Time": 17.64927252009511} +{"Full-pretrain/Learning Rate": 1.0860260346997474e-05, "Full-pretrain/Loss": 1.9497413635253906, "Full-pretrain/Loss (Raw)": 1.9507063627243042, "Full-pretrain/Step": 6681, "Full-pretrain/Step Time": 17.64930315129459} +{"Full-pretrain/Learning Rate": 1.0853258918891446e-05, "Full-pretrain/Loss": 1.9575812816619873, "Full-pretrain/Loss (Raw)": 2.0041022300720215, "Full-pretrain/Step": 6682, "Full-pretrain/Step Time": 17.643548952415586} +{"Full-pretrain/Learning Rate": 1.0846259122607017e-05, "Full-pretrain/Loss": 1.951779842376709, "Full-pretrain/Loss (Raw)": 1.879507064819336, "Full-pretrain/Step": 6683, "Full-pretrain/Step Time": 17.646869963034987} +{"Full-pretrain/Learning Rate": 1.0839260958951628e-05, "Full-pretrain/Loss": 1.9500335454940796, "Full-pretrain/Loss (Raw)": 2.0109171867370605, "Full-pretrain/Step": 6684, "Full-pretrain/Step Time": 17.64521233178675} +{"Full-pretrain/Learning Rate": 1.0832264428732509e-05, "Full-pretrain/Loss": 1.9583494663238525, "Full-pretrain/Loss (Raw)": 2.0400781631469727, "Full-pretrain/Step": 6685, "Full-pretrain/Step Time": 17.649276176467538} +{"Full-pretrain/Learning Rate": 1.0825269532756707e-05, "Full-pretrain/Loss": 1.9496533870697021, "Full-pretrain/Loss (Raw)": 1.8578428030014038, "Full-pretrain/Step": 6686, "Full-pretrain/Step Time": 17.64921790920198} +{"Full-pretrain/Learning Rate": 1.0818276271831093e-05, "Full-pretrain/Loss": 1.9470796585083008, "Full-pretrain/Loss (Raw)": 1.7601265907287598, "Full-pretrain/Step": 6687, "Full-pretrain/Step Time": 17.643495885655284} +{"Full-pretrain/Learning Rate": 1.0811284646762321e-05, "Full-pretrain/Loss": 1.9448609352111816, "Full-pretrain/Loss (Raw)": 2.001537322998047, "Full-pretrain/Step": 6688, "Full-pretrain/Step Time": 17.64797024615109} +{"Full-pretrain/Learning Rate": 1.0804294658356876e-05, "Full-pretrain/Loss": 1.9531221389770508, "Full-pretrain/Loss (Raw)": 2.1894707679748535, "Full-pretrain/Step": 6689, "Full-pretrain/Step Time": 17.649870755150914} +{"Full-pretrain/Learning Rate": 1.0797306307421054e-05, "Full-pretrain/Loss": 1.9651520252227783, "Full-pretrain/Loss (Raw)": 2.290405750274658, "Full-pretrain/Step": 6690, "Full-pretrain/Step Time": 17.645392576232553} +{"Full-pretrain/Learning Rate": 1.0790319594760958e-05, "Full-pretrain/Loss": 1.965287208557129, "Full-pretrain/Loss (Raw)": 2.0816216468811035, "Full-pretrain/Step": 6691, "Full-pretrain/Step Time": 17.63875862583518} +{"Full-pretrain/Learning Rate": 1.0783334521182507e-05, "Full-pretrain/Loss": 1.9767097234725952, "Full-pretrain/Loss (Raw)": 2.125560760498047, "Full-pretrain/Step": 6692, "Full-pretrain/Step Time": 17.644286647439003} +{"Full-pretrain/Learning Rate": 1.0776351087491426e-05, "Full-pretrain/Loss": 1.9921873807907104, "Full-pretrain/Loss (Raw)": 2.2069902420043945, "Full-pretrain/Step": 6693, "Full-pretrain/Step Time": 17.64266628958285} +{"Full-pretrain/Learning Rate": 1.0769369294493245e-05, "Full-pretrain/Loss": 2.0071496963500977, "Full-pretrain/Loss (Raw)": 2.254493236541748, "Full-pretrain/Step": 6694, "Full-pretrain/Step Time": 17.643463525921106} +{"Full-pretrain/Learning Rate": 1.0762389142993312e-05, "Full-pretrain/Loss": 2.0039048194885254, "Full-pretrain/Loss (Raw)": 1.7569783926010132, "Full-pretrain/Step": 6695, "Full-pretrain/Step Time": 17.636746793985367} +{"Full-pretrain/Learning Rate": 1.0755410633796798e-05, "Full-pretrain/Loss": 2.011371374130249, "Full-pretrain/Loss (Raw)": 2.1488914489746094, "Full-pretrain/Step": 6696, "Full-pretrain/Step Time": 17.63874826580286} +{"Full-pretrain/Learning Rate": 1.074843376770865e-05, "Full-pretrain/Loss": 2.0115761756896973, "Full-pretrain/Loss (Raw)": 1.9449050426483154, "Full-pretrain/Step": 6697, "Full-pretrain/Step Time": 17.63666445761919} +{"Full-pretrain/Learning Rate": 1.0741458545533669e-05, "Full-pretrain/Loss": 2.014350175857544, "Full-pretrain/Loss (Raw)": 2.1603472232818604, "Full-pretrain/Step": 6698, "Full-pretrain/Step Time": 17.64206837490201} +{"Full-pretrain/Learning Rate": 1.0734484968076425e-05, "Full-pretrain/Loss": 2.014616012573242, "Full-pretrain/Loss (Raw)": 2.0307254791259766, "Full-pretrain/Step": 6699, "Full-pretrain/Step Time": 17.63248249515891} +{"Full-pretrain/Learning Rate": 1.0727513036141326e-05, "Full-pretrain/Loss": 2.0096933841705322, "Full-pretrain/Loss (Raw)": 1.861377239227295, "Full-pretrain/Step": 6700, "Full-pretrain/Step Time": 17.63320860825479} +{"Full-pretrain/Learning Rate": 1.0720542750532584e-05, "Full-pretrain/Loss": 2.0121052265167236, "Full-pretrain/Loss (Raw)": 1.9076660871505737, "Full-pretrain/Step": 6701, "Full-pretrain/Step Time": 17.636894647032022} +{"Full-pretrain/Learning Rate": 1.0713574112054216e-05, "Full-pretrain/Loss": 2.0165367126464844, "Full-pretrain/Loss (Raw)": 2.1381425857543945, "Full-pretrain/Step": 6702, "Full-pretrain/Step Time": 17.63499574176967} +{"Full-pretrain/Learning Rate": 1.0706607121510065e-05, "Full-pretrain/Loss": 2.0145792961120605, "Full-pretrain/Loss (Raw)": 1.7433068752288818, "Full-pretrain/Step": 6703, "Full-pretrain/Step Time": 17.63420826755464} +{"Full-pretrain/Learning Rate": 1.0699641779703747e-05, "Full-pretrain/Loss": 2.0150630474090576, "Full-pretrain/Loss (Raw)": 1.989863634109497, "Full-pretrain/Step": 6704, "Full-pretrain/Step Time": 17.640154227614403} +{"Full-pretrain/Learning Rate": 1.0692678087438728e-05, "Full-pretrain/Loss": 2.011798858642578, "Full-pretrain/Loss (Raw)": 1.8980189561843872, "Full-pretrain/Step": 6705, "Full-pretrain/Step Time": 17.643119007349014} +{"Full-pretrain/Learning Rate": 1.0685716045518262e-05, "Full-pretrain/Loss": 2.006815195083618, "Full-pretrain/Loss (Raw)": 1.8897079229354858, "Full-pretrain/Step": 6706, "Full-pretrain/Step Time": 17.638775112107396} +{"Full-pretrain/Learning Rate": 1.0678755654745418e-05, "Full-pretrain/Loss": 1.9995380640029907, "Full-pretrain/Loss (Raw)": 2.0632152557373047, "Full-pretrain/Step": 6707, "Full-pretrain/Step Time": 17.638846799731255} +{"Full-pretrain/Learning Rate": 1.0671796915923088e-05, "Full-pretrain/Loss": 1.9926457405090332, "Full-pretrain/Loss (Raw)": 1.7690167427062988, "Full-pretrain/Step": 6708, "Full-pretrain/Step Time": 17.637731147930026} +{"Full-pretrain/Learning Rate": 1.066483982985394e-05, "Full-pretrain/Loss": 1.9937410354614258, "Full-pretrain/Loss (Raw)": 1.8987810611724854, "Full-pretrain/Step": 6709, "Full-pretrain/Step Time": 17.640945594757795} +{"Full-pretrain/Learning Rate": 1.0657884397340475e-05, "Full-pretrain/Loss": 1.992776870727539, "Full-pretrain/Loss (Raw)": 1.9789092540740967, "Full-pretrain/Step": 6710, "Full-pretrain/Step Time": 17.641107089817524} +{"Full-pretrain/Learning Rate": 1.065093061918501e-05, "Full-pretrain/Loss": 1.9919716119766235, "Full-pretrain/Loss (Raw)": 1.9304183721542358, "Full-pretrain/Step": 6711, "Full-pretrain/Step Time": 17.638926900923252} +{"Full-pretrain/Learning Rate": 1.0643978496189663e-05, "Full-pretrain/Loss": 1.9893724918365479, "Full-pretrain/Loss (Raw)": 1.8962922096252441, "Full-pretrain/Step": 6712, "Full-pretrain/Step Time": 17.642781438305974} +{"Full-pretrain/Learning Rate": 1.063702802915634e-05, "Full-pretrain/Loss": 1.9865756034851074, "Full-pretrain/Loss (Raw)": 1.861204743385315, "Full-pretrain/Step": 6713, "Full-pretrain/Step Time": 17.643758784979582} +{"Full-pretrain/Learning Rate": 1.06300792188868e-05, "Full-pretrain/Loss": 1.9838979244232178, "Full-pretrain/Loss (Raw)": 1.918416976928711, "Full-pretrain/Step": 6714, "Full-pretrain/Step Time": 17.640783505514264} +{"Full-pretrain/Learning Rate": 1.062313206618256e-05, "Full-pretrain/Loss": 1.98610520362854, "Full-pretrain/Loss (Raw)": 1.950138807296753, "Full-pretrain/Step": 6715, "Full-pretrain/Step Time": 17.638058116659522} +{"Full-pretrain/Learning Rate": 1.0616186571844982e-05, "Full-pretrain/Loss": 1.9852638244628906, "Full-pretrain/Loss (Raw)": 1.9839966297149658, "Full-pretrain/Step": 6716, "Full-pretrain/Step Time": 17.63171917386353} +{"Full-pretrain/Learning Rate": 1.0609242736675232e-05, "Full-pretrain/Loss": 1.9812753200531006, "Full-pretrain/Loss (Raw)": 1.9124412536621094, "Full-pretrain/Step": 6717, "Full-pretrain/Step Time": 17.63637159205973} +{"Full-pretrain/Learning Rate": 1.0602300561474271e-05, "Full-pretrain/Loss": 1.9854938983917236, "Full-pretrain/Loss (Raw)": 1.9928356409072876, "Full-pretrain/Step": 6718, "Full-pretrain/Step Time": 17.632072053849697} +{"Full-pretrain/Learning Rate": 1.0595360047042893e-05, "Full-pretrain/Loss": 1.9874531030654907, "Full-pretrain/Loss (Raw)": 1.8228232860565186, "Full-pretrain/Step": 6719, "Full-pretrain/Step Time": 17.629304578527808} +{"Full-pretrain/Learning Rate": 1.058842119418166e-05, "Full-pretrain/Loss": 1.985414981842041, "Full-pretrain/Loss (Raw)": 1.9363189935684204, "Full-pretrain/Step": 6720, "Full-pretrain/Step Time": 17.62667914479971} +{"Full-pretrain/Learning Rate": 1.0581484003690981e-05, "Full-pretrain/Loss": 1.9793496131896973, "Full-pretrain/Loss (Raw)": 1.995378017425537, "Full-pretrain/Step": 6721, "Full-pretrain/Step Time": 17.63170707412064} +{"Full-pretrain/Learning Rate": 1.0574548476371051e-05, "Full-pretrain/Loss": 1.9639532566070557, "Full-pretrain/Loss (Raw)": 1.7977207899093628, "Full-pretrain/Step": 6722, "Full-pretrain/Step Time": 17.627710442990065} +{"Full-pretrain/Learning Rate": 1.0567614613021886e-05, "Full-pretrain/Loss": 1.9639471769332886, "Full-pretrain/Loss (Raw)": 2.0814290046691895, "Full-pretrain/Step": 6723, "Full-pretrain/Step Time": 17.624110026285052} +{"Full-pretrain/Learning Rate": 1.0560682414443315e-05, "Full-pretrain/Loss": 1.9548685550689697, "Full-pretrain/Loss (Raw)": 1.835041880607605, "Full-pretrain/Step": 6724, "Full-pretrain/Step Time": 17.628003666177392} +{"Full-pretrain/Learning Rate": 1.0553751881434943e-05, "Full-pretrain/Loss": 1.9492356777191162, "Full-pretrain/Loss (Raw)": 2.0267388820648193, "Full-pretrain/Step": 6725, "Full-pretrain/Step Time": 17.630929566919804} +{"Full-pretrain/Learning Rate": 1.0546823014796214e-05, "Full-pretrain/Loss": 1.9379024505615234, "Full-pretrain/Loss (Raw)": 1.891831398010254, "Full-pretrain/Step": 6726, "Full-pretrain/Step Time": 17.62607056647539} +{"Full-pretrain/Learning Rate": 1.053989581532637e-05, "Full-pretrain/Loss": 1.9614042043685913, "Full-pretrain/Loss (Raw)": 2.50903582572937, "Full-pretrain/Step": 6727, "Full-pretrain/Step Time": 17.62585588544607} +{"Full-pretrain/Learning Rate": 1.0532970283824473e-05, "Full-pretrain/Loss": 1.9583780765533447, "Full-pretrain/Loss (Raw)": 2.0520544052124023, "Full-pretrain/Step": 6728, "Full-pretrain/Step Time": 17.622154572978616} +{"Full-pretrain/Learning Rate": 1.0526046421089358e-05, "Full-pretrain/Loss": 1.9536221027374268, "Full-pretrain/Loss (Raw)": 1.792714238166809, "Full-pretrain/Step": 6729, "Full-pretrain/Step Time": 17.62998945079744} +{"Full-pretrain/Learning Rate": 1.0519124227919705e-05, "Full-pretrain/Loss": 1.9420099258422852, "Full-pretrain/Loss (Raw)": 1.7887574434280396, "Full-pretrain/Step": 6730, "Full-pretrain/Step Time": 17.627370830625296} +{"Full-pretrain/Learning Rate": 1.051220370511399e-05, "Full-pretrain/Loss": 1.9347593784332275, "Full-pretrain/Loss (Raw)": 1.7987101078033447, "Full-pretrain/Step": 6731, "Full-pretrain/Step Time": 17.623685309663415} +{"Full-pretrain/Learning Rate": 1.050528485347048e-05, "Full-pretrain/Loss": 1.9325873851776123, "Full-pretrain/Loss (Raw)": 1.791870355606079, "Full-pretrain/Step": 6732, "Full-pretrain/Step Time": 17.62212553061545} +{"Full-pretrain/Learning Rate": 1.0498367673787265e-05, "Full-pretrain/Loss": 1.9316966533660889, "Full-pretrain/Loss (Raw)": 1.8791606426239014, "Full-pretrain/Step": 6733, "Full-pretrain/Step Time": 17.62300825677812} +{"Full-pretrain/Learning Rate": 1.0491452166862245e-05, "Full-pretrain/Loss": 1.92952299118042, "Full-pretrain/Loss (Raw)": 2.068584442138672, "Full-pretrain/Step": 6734, "Full-pretrain/Step Time": 17.62702388688922} +{"Full-pretrain/Learning Rate": 1.0484538333493128e-05, "Full-pretrain/Loss": 1.931300163269043, "Full-pretrain/Loss (Raw)": 1.800180435180664, "Full-pretrain/Step": 6735, "Full-pretrain/Step Time": 17.629851883277297} +{"Full-pretrain/Learning Rate": 1.0477626174477404e-05, "Full-pretrain/Loss": 1.926304817199707, "Full-pretrain/Loss (Raw)": 1.830012321472168, "Full-pretrain/Step": 6736, "Full-pretrain/Step Time": 17.624649591743946} +{"Full-pretrain/Learning Rate": 1.0470715690612395e-05, "Full-pretrain/Loss": 1.917983889579773, "Full-pretrain/Loss (Raw)": 1.6317462921142578, "Full-pretrain/Step": 6737, "Full-pretrain/Step Time": 17.631402825936675} +{"Full-pretrain/Learning Rate": 1.046380688269523e-05, "Full-pretrain/Loss": 1.9225881099700928, "Full-pretrain/Loss (Raw)": 2.037044048309326, "Full-pretrain/Step": 6738, "Full-pretrain/Step Time": 17.634881164878607} +{"Full-pretrain/Learning Rate": 1.0456899751522827e-05, "Full-pretrain/Loss": 1.9238836765289307, "Full-pretrain/Loss (Raw)": 2.104672431945801, "Full-pretrain/Step": 6739, "Full-pretrain/Step Time": 17.634819062426686} +{"Full-pretrain/Learning Rate": 1.0449994297891938e-05, "Full-pretrain/Loss": 1.9330424070358276, "Full-pretrain/Loss (Raw)": 2.0620980262756348, "Full-pretrain/Step": 6740, "Full-pretrain/Step Time": 17.631140353158116} +{"Full-pretrain/Learning Rate": 1.0443090522599085e-05, "Full-pretrain/Loss": 1.9251341819763184, "Full-pretrain/Loss (Raw)": 1.6457152366638184, "Full-pretrain/Step": 6741, "Full-pretrain/Step Time": 17.63590394705534} +{"Full-pretrain/Learning Rate": 1.0436188426440623e-05, "Full-pretrain/Loss": 1.9239566326141357, "Full-pretrain/Loss (Raw)": 1.9412269592285156, "Full-pretrain/Step": 6742, "Full-pretrain/Step Time": 17.638651365414262} +{"Full-pretrain/Learning Rate": 1.0429288010212713e-05, "Full-pretrain/Loss": 1.9298639297485352, "Full-pretrain/Loss (Raw)": 2.1194558143615723, "Full-pretrain/Step": 6743, "Full-pretrain/Step Time": 17.632896108552814} +{"Full-pretrain/Learning Rate": 1.0422389274711306e-05, "Full-pretrain/Loss": 1.9328337907791138, "Full-pretrain/Loss (Raw)": 1.9913256168365479, "Full-pretrain/Step": 6744, "Full-pretrain/Step Time": 17.635676937177777} +{"Full-pretrain/Learning Rate": 1.0415492220732182e-05, "Full-pretrain/Loss": 1.9326127767562866, "Full-pretrain/Loss (Raw)": 1.8541340827941895, "Full-pretrain/Step": 6745, "Full-pretrain/Step Time": 17.634940022602677} +{"Full-pretrain/Learning Rate": 1.0408596849070898e-05, "Full-pretrain/Loss": 1.932925820350647, "Full-pretrain/Loss (Raw)": 1.928432822227478, "Full-pretrain/Step": 6746, "Full-pretrain/Step Time": 17.6343782749027} +{"Full-pretrain/Learning Rate": 1.0401703160522846e-05, "Full-pretrain/Loss": 1.9306505918502808, "Full-pretrain/Loss (Raw)": 1.8773322105407715, "Full-pretrain/Step": 6747, "Full-pretrain/Step Time": 17.63542938232422} +{"Full-pretrain/Learning Rate": 1.0394811155883196e-05, "Full-pretrain/Loss": 1.9217921495437622, "Full-pretrain/Loss (Raw)": 1.7005248069763184, "Full-pretrain/Step": 6748, "Full-pretrain/Step Time": 17.636050203815103} +{"Full-pretrain/Learning Rate": 1.0387920835946949e-05, "Full-pretrain/Loss": 1.9267072677612305, "Full-pretrain/Loss (Raw)": 2.069729804992676, "Full-pretrain/Step": 6749, "Full-pretrain/Step Time": 17.63598647341132} +{"Full-pretrain/Learning Rate": 1.0381032201508906e-05, "Full-pretrain/Loss": 1.9234867095947266, "Full-pretrain/Loss (Raw)": 1.8897716999053955, "Full-pretrain/Step": 6750, "Full-pretrain/Step Time": 17.639794623479247} +{"Full-pretrain/Learning Rate": 1.037414525336365e-05, "Full-pretrain/Loss": 1.9227638244628906, "Full-pretrain/Loss (Raw)": 1.7996940612792969, "Full-pretrain/Step": 6751, "Full-pretrain/Step Time": 17.639890775084496} +{"Full-pretrain/Learning Rate": 1.0367259992305602e-05, "Full-pretrain/Loss": 1.923645257949829, "Full-pretrain/Loss (Raw)": 1.9645254611968994, "Full-pretrain/Step": 6752, "Full-pretrain/Step Time": 17.630766578018665} +{"Full-pretrain/Learning Rate": 1.0360376419128973e-05, "Full-pretrain/Loss": 1.9280829429626465, "Full-pretrain/Loss (Raw)": 2.1373825073242188, "Full-pretrain/Step": 6753, "Full-pretrain/Step Time": 17.628982855007052} +{"Full-pretrain/Learning Rate": 1.0353494534627776e-05, "Full-pretrain/Loss": 1.9333386421203613, "Full-pretrain/Loss (Raw)": 1.9658993482589722, "Full-pretrain/Step": 6754, "Full-pretrain/Step Time": 17.636889711022377} +{"Full-pretrain/Learning Rate": 1.034661433959584e-05, "Full-pretrain/Loss": 1.9184751510620117, "Full-pretrain/Loss (Raw)": 1.6058039665222168, "Full-pretrain/Step": 6755, "Full-pretrain/Step Time": 17.630456190556288} +{"Full-pretrain/Learning Rate": 1.0339735834826797e-05, "Full-pretrain/Loss": 1.9218839406967163, "Full-pretrain/Loss (Raw)": 1.9441192150115967, "Full-pretrain/Step": 6756, "Full-pretrain/Step Time": 17.631070472300053} +{"Full-pretrain/Learning Rate": 1.0332859021114063e-05, "Full-pretrain/Loss": 1.913177251815796, "Full-pretrain/Loss (Raw)": 1.7481228113174438, "Full-pretrain/Step": 6757, "Full-pretrain/Step Time": 17.63380479067564} +{"Full-pretrain/Learning Rate": 1.0325983899250891e-05, "Full-pretrain/Loss": 1.911907434463501, "Full-pretrain/Loss (Raw)": 1.8511990308761597, "Full-pretrain/Step": 6758, "Full-pretrain/Step Time": 17.626925809308887} +{"Full-pretrain/Learning Rate": 1.0319110470030315e-05, "Full-pretrain/Loss": 1.89471435546875, "Full-pretrain/Loss (Raw)": 1.9588608741760254, "Full-pretrain/Step": 6759, "Full-pretrain/Step Time": 17.628417076542974} +{"Full-pretrain/Learning Rate": 1.0312238734245191e-05, "Full-pretrain/Loss": 1.8938279151916504, "Full-pretrain/Loss (Raw)": 2.0236849784851074, "Full-pretrain/Step": 6760, "Full-pretrain/Step Time": 17.631000142544508} +{"Full-pretrain/Learning Rate": 1.0305368692688174e-05, "Full-pretrain/Loss": 1.8975979089736938, "Full-pretrain/Loss (Raw)": 1.9133546352386475, "Full-pretrain/Step": 6761, "Full-pretrain/Step Time": 17.62769907899201} +{"Full-pretrain/Learning Rate": 1.0298500346151708e-05, "Full-pretrain/Loss": 1.8969630002975464, "Full-pretrain/Loss (Raw)": 1.7684416770935059, "Full-pretrain/Step": 6762, "Full-pretrain/Step Time": 17.63071747869253} +{"Full-pretrain/Learning Rate": 1.0291633695428065e-05, "Full-pretrain/Loss": 1.898097038269043, "Full-pretrain/Loss (Raw)": 1.83500075340271, "Full-pretrain/Step": 6763, "Full-pretrain/Step Time": 17.626798616722226} +{"Full-pretrain/Learning Rate": 1.0284768741309301e-05, "Full-pretrain/Loss": 1.9049124717712402, "Full-pretrain/Loss (Raw)": 2.009960174560547, "Full-pretrain/Step": 6764, "Full-pretrain/Step Time": 17.62263200432062} +{"Full-pretrain/Learning Rate": 1.0277905484587289e-05, "Full-pretrain/Loss": 1.9021438360214233, "Full-pretrain/Loss (Raw)": 1.7905669212341309, "Full-pretrain/Step": 6765, "Full-pretrain/Step Time": 17.62459760904312} +{"Full-pretrain/Learning Rate": 1.0271043926053716e-05, "Full-pretrain/Loss": 1.8879727125167847, "Full-pretrain/Loss (Raw)": 1.615107536315918, "Full-pretrain/Step": 6766, "Full-pretrain/Step Time": 17.627073952928185} +{"Full-pretrain/Learning Rate": 1.026418406650004e-05, "Full-pretrain/Loss": 1.8906376361846924, "Full-pretrain/Loss (Raw)": 1.885457992553711, "Full-pretrain/Step": 6767, "Full-pretrain/Step Time": 17.614987844601274} +{"Full-pretrain/Learning Rate": 1.0257325906717554e-05, "Full-pretrain/Loss": 1.895460844039917, "Full-pretrain/Loss (Raw)": 1.984355092048645, "Full-pretrain/Step": 6768, "Full-pretrain/Step Time": 17.616546899080276} +{"Full-pretrain/Learning Rate": 1.0250469447497347e-05, "Full-pretrain/Loss": 1.8843193054199219, "Full-pretrain/Loss (Raw)": 1.2752156257629395, "Full-pretrain/Step": 6769, "Full-pretrain/Step Time": 17.6250110398978} +{"Full-pretrain/Learning Rate": 1.0243614689630302e-05, "Full-pretrain/Loss": 1.8839662075042725, "Full-pretrain/Loss (Raw)": 2.0257482528686523, "Full-pretrain/Step": 6770, "Full-pretrain/Step Time": 17.62996026687324} +{"Full-pretrain/Learning Rate": 1.0236761633907125e-05, "Full-pretrain/Loss": 1.8710001707077026, "Full-pretrain/Loss (Raw)": 1.6897560358047485, "Full-pretrain/Step": 6771, "Full-pretrain/Step Time": 17.624361600726843} +{"Full-pretrain/Learning Rate": 1.02299102811183e-05, "Full-pretrain/Loss": 1.8743659257888794, "Full-pretrain/Loss (Raw)": 2.169802665710449, "Full-pretrain/Step": 6772, "Full-pretrain/Step Time": 17.621552258729935} +{"Full-pretrain/Learning Rate": 1.022306063205413e-05, "Full-pretrain/Loss": 1.8799405097961426, "Full-pretrain/Loss (Raw)": 1.824103832244873, "Full-pretrain/Step": 6773, "Full-pretrain/Step Time": 17.62925574928522} +{"Full-pretrain/Learning Rate": 1.0216212687504725e-05, "Full-pretrain/Loss": 1.8820793628692627, "Full-pretrain/Loss (Raw)": 2.009667158126831, "Full-pretrain/Step": 6774, "Full-pretrain/Step Time": 17.626399133354425} +{"Full-pretrain/Learning Rate": 1.0209366448259991e-05, "Full-pretrain/Loss": 1.8848743438720703, "Full-pretrain/Loss (Raw)": 2.2088990211486816, "Full-pretrain/Step": 6775, "Full-pretrain/Step Time": 17.623830549418926} +{"Full-pretrain/Learning Rate": 1.020252191510964e-05, "Full-pretrain/Loss": 1.8751822710037231, "Full-pretrain/Loss (Raw)": 1.6811764240264893, "Full-pretrain/Step": 6776, "Full-pretrain/Step Time": 17.62379822693765} +{"Full-pretrain/Learning Rate": 1.019567908884319e-05, "Full-pretrain/Loss": 1.8766475915908813, "Full-pretrain/Loss (Raw)": 1.9010241031646729, "Full-pretrain/Step": 6777, "Full-pretrain/Step Time": 17.629241343587637} +{"Full-pretrain/Learning Rate": 1.018883797024995e-05, "Full-pretrain/Loss": 1.876845121383667, "Full-pretrain/Loss (Raw)": 1.9347522258758545, "Full-pretrain/Step": 6778, "Full-pretrain/Step Time": 17.62673888914287} +{"Full-pretrain/Learning Rate": 1.0181998560119047e-05, "Full-pretrain/Loss": 1.8800381422042847, "Full-pretrain/Loss (Raw)": 1.9795109033584595, "Full-pretrain/Step": 6779, "Full-pretrain/Step Time": 17.62738150730729} +{"Full-pretrain/Learning Rate": 1.0175160859239408e-05, "Full-pretrain/Loss": 1.8833078145980835, "Full-pretrain/Loss (Raw)": 1.8051549196243286, "Full-pretrain/Step": 6780, "Full-pretrain/Step Time": 17.62557504698634} +{"Full-pretrain/Learning Rate": 1.0168324868399748e-05, "Full-pretrain/Loss": 1.8746349811553955, "Full-pretrain/Loss (Raw)": 1.792199969291687, "Full-pretrain/Step": 6781, "Full-pretrain/Step Time": 17.6270410399884} +{"Full-pretrain/Learning Rate": 1.0161490588388608e-05, "Full-pretrain/Loss": 1.8736109733581543, "Full-pretrain/Loss (Raw)": 1.8570048809051514, "Full-pretrain/Step": 6782, "Full-pretrain/Step Time": 17.63010999560356} +{"Full-pretrain/Learning Rate": 1.0154658019994307e-05, "Full-pretrain/Loss": 1.883274793624878, "Full-pretrain/Loss (Raw)": 2.108935832977295, "Full-pretrain/Step": 6783, "Full-pretrain/Step Time": 17.632541738450527} +{"Full-pretrain/Learning Rate": 1.0147827164004986e-05, "Full-pretrain/Loss": 1.8866196870803833, "Full-pretrain/Loss (Raw)": 2.071561813354492, "Full-pretrain/Step": 6784, "Full-pretrain/Step Time": 17.631726246327162} +{"Full-pretrain/Learning Rate": 1.0140998021208581e-05, "Full-pretrain/Loss": 1.875978708267212, "Full-pretrain/Loss (Raw)": 1.7968716621398926, "Full-pretrain/Step": 6785, "Full-pretrain/Step Time": 17.63401317410171} +{"Full-pretrain/Learning Rate": 1.0134170592392836e-05, "Full-pretrain/Loss": 1.8780757188796997, "Full-pretrain/Loss (Raw)": 2.033003807067871, "Full-pretrain/Step": 6786, "Full-pretrain/Step Time": 17.635839177295566} +{"Full-pretrain/Learning Rate": 1.0127344878345293e-05, "Full-pretrain/Loss": 1.8883800506591797, "Full-pretrain/Loss (Raw)": 1.9355428218841553, "Full-pretrain/Step": 6787, "Full-pretrain/Step Time": 17.63027374073863} +{"Full-pretrain/Learning Rate": 1.0120520879853287e-05, "Full-pretrain/Loss": 1.884483814239502, "Full-pretrain/Loss (Raw)": 1.8194375038146973, "Full-pretrain/Step": 6788, "Full-pretrain/Step Time": 17.632022004574537} +{"Full-pretrain/Learning Rate": 1.0113698597703967e-05, "Full-pretrain/Loss": 1.8902605772018433, "Full-pretrain/Loss (Raw)": 1.9329826831817627, "Full-pretrain/Step": 6789, "Full-pretrain/Step Time": 17.626719055697322} +{"Full-pretrain/Learning Rate": 1.010687803268428e-05, "Full-pretrain/Loss": 1.8972804546356201, "Full-pretrain/Loss (Raw)": 2.0758347511291504, "Full-pretrain/Step": 6790, "Full-pretrain/Step Time": 17.62811298109591} +{"Full-pretrain/Learning Rate": 1.0100059185580981e-05, "Full-pretrain/Loss": 1.8940616846084595, "Full-pretrain/Loss (Raw)": 1.8558589220046997, "Full-pretrain/Step": 6791, "Full-pretrain/Step Time": 17.624652057886124} +{"Full-pretrain/Learning Rate": 1.009324205718062e-05, "Full-pretrain/Loss": 1.891128420829773, "Full-pretrain/Loss (Raw)": 1.9298179149627686, "Full-pretrain/Step": 6792, "Full-pretrain/Step Time": 17.62226888537407} +{"Full-pretrain/Learning Rate": 1.0086426648269553e-05, "Full-pretrain/Loss": 1.8933348655700684, "Full-pretrain/Loss (Raw)": 1.9839649200439453, "Full-pretrain/Step": 6793, "Full-pretrain/Step Time": 17.61949379555881} +{"Full-pretrain/Learning Rate": 1.0079612959633928e-05, "Full-pretrain/Loss": 1.8966699838638306, "Full-pretrain/Loss (Raw)": 1.8751649856567383, "Full-pretrain/Step": 6794, "Full-pretrain/Step Time": 17.62000610306859} +{"Full-pretrain/Learning Rate": 1.00728009920597e-05, "Full-pretrain/Loss": 1.894709825515747, "Full-pretrain/Loss (Raw)": 1.7722750902175903, "Full-pretrain/Step": 6795, "Full-pretrain/Step Time": 17.622178772464395} +{"Full-pretrain/Learning Rate": 1.0065990746332643e-05, "Full-pretrain/Loss": 1.8907074928283691, "Full-pretrain/Loss (Raw)": 1.8818835020065308, "Full-pretrain/Step": 6796, "Full-pretrain/Step Time": 17.614944389089942} +{"Full-pretrain/Learning Rate": 1.0059182223238296e-05, "Full-pretrain/Loss": 1.877364993095398, "Full-pretrain/Loss (Raw)": 1.3636083602905273, "Full-pretrain/Step": 6797, "Full-pretrain/Step Time": 17.61984301917255} +{"Full-pretrain/Learning Rate": 1.0052375423562038e-05, "Full-pretrain/Loss": 1.8897788524627686, "Full-pretrain/Loss (Raw)": 2.01234769821167, "Full-pretrain/Step": 6798, "Full-pretrain/Step Time": 17.62375790067017} +{"Full-pretrain/Learning Rate": 1.0045570348089012e-05, "Full-pretrain/Loss": 1.8879112005233765, "Full-pretrain/Loss (Raw)": 1.8256947994232178, "Full-pretrain/Step": 6799, "Full-pretrain/Step Time": 17.62150871567428} +{"Full-pretrain/Learning Rate": 1.003876699760419e-05, "Full-pretrain/Loss": 1.8830716609954834, "Full-pretrain/Loss (Raw)": 1.8294909000396729, "Full-pretrain/Step": 6800, "Full-pretrain/Step Time": 17.621672762557864} +{"Full-pretrain/Learning Rate": 1.003196537289234e-05, "Full-pretrain/Loss": 1.9020767211914062, "Full-pretrain/Loss (Raw)": 1.883377194404602, "Full-pretrain/Step": 6801, "Full-pretrain/Step Time": 17.620749106630683} +{"Full-pretrain/Learning Rate": 1.0025165474738024e-05, "Full-pretrain/Loss": 1.9032422304153442, "Full-pretrain/Loss (Raw)": 2.063041925430298, "Full-pretrain/Step": 6802, "Full-pretrain/Step Time": 17.61691136099398} +{"Full-pretrain/Learning Rate": 1.0018367303925617e-05, "Full-pretrain/Loss": 1.9071998596191406, "Full-pretrain/Loss (Raw)": 1.8163983821868896, "Full-pretrain/Step": 6803, "Full-pretrain/Step Time": 17.620339896529913} +{"Full-pretrain/Learning Rate": 1.0011570861239264e-05, "Full-pretrain/Loss": 1.8986886739730835, "Full-pretrain/Loss (Raw)": 1.8974456787109375, "Full-pretrain/Step": 6804, "Full-pretrain/Step Time": 17.61716590076685} +{"Full-pretrain/Learning Rate": 1.0004776147462946e-05, "Full-pretrain/Loss": 1.894063949584961, "Full-pretrain/Loss (Raw)": 1.6761127710342407, "Full-pretrain/Step": 6805, "Full-pretrain/Step Time": 17.619141658768058} +{"Full-pretrain/Learning Rate": 9.997983163380435e-06, "Full-pretrain/Loss": 1.8925065994262695, "Full-pretrain/Loss (Raw)": 1.9598301649093628, "Full-pretrain/Step": 6806, "Full-pretrain/Step Time": 17.61653035506606} +{"Full-pretrain/Learning Rate": 9.991191909775289e-06, "Full-pretrain/Loss": 1.8776849508285522, "Full-pretrain/Loss (Raw)": 1.7346103191375732, "Full-pretrain/Step": 6807, "Full-pretrain/Step Time": 17.622244795784354} +{"Full-pretrain/Learning Rate": 9.98440238743089e-06, "Full-pretrain/Loss": 1.8870720863342285, "Full-pretrain/Loss (Raw)": 1.9815611839294434, "Full-pretrain/Step": 6808, "Full-pretrain/Step Time": 17.61983920633793} +{"Full-pretrain/Learning Rate": 9.977614597130392e-06, "Full-pretrain/Loss": 1.8879711627960205, "Full-pretrain/Loss (Raw)": 1.9297970533370972, "Full-pretrain/Step": 6809, "Full-pretrain/Step Time": 17.619007151573896} +{"Full-pretrain/Learning Rate": 9.97082853965677e-06, "Full-pretrain/Loss": 1.8861535787582397, "Full-pretrain/Loss (Raw)": 1.8765898942947388, "Full-pretrain/Step": 6810, "Full-pretrain/Step Time": 17.625075936317444} +{"Full-pretrain/Learning Rate": 9.964044215792796e-06, "Full-pretrain/Loss": 1.871081829071045, "Full-pretrain/Loss (Raw)": 1.4972193241119385, "Full-pretrain/Step": 6811, "Full-pretrain/Step Time": 17.62191043794155} +{"Full-pretrain/Learning Rate": 9.957261626321046e-06, "Full-pretrain/Loss": 1.8716588020324707, "Full-pretrain/Loss (Raw)": 1.8236169815063477, "Full-pretrain/Step": 6812, "Full-pretrain/Step Time": 17.62102072313428} +{"Full-pretrain/Learning Rate": 9.950480772023871e-06, "Full-pretrain/Loss": 1.8752036094665527, "Full-pretrain/Loss (Raw)": 1.905632734298706, "Full-pretrain/Step": 6813, "Full-pretrain/Step Time": 17.61767523922026} +{"Full-pretrain/Learning Rate": 9.943701653683449e-06, "Full-pretrain/Loss": 1.880408763885498, "Full-pretrain/Loss (Raw)": 2.0235681533813477, "Full-pretrain/Step": 6814, "Full-pretrain/Step Time": 17.618386916816235} +{"Full-pretrain/Learning Rate": 9.936924272081764e-06, "Full-pretrain/Loss": 1.8750052452087402, "Full-pretrain/Loss (Raw)": 1.9360270500183105, "Full-pretrain/Step": 6815, "Full-pretrain/Step Time": 17.623720163479447} +{"Full-pretrain/Learning Rate": 9.930148628000557e-06, "Full-pretrain/Loss": 1.8738715648651123, "Full-pretrain/Loss (Raw)": 2.0352797508239746, "Full-pretrain/Step": 6816, "Full-pretrain/Step Time": 17.619251573458314} +{"Full-pretrain/Learning Rate": 9.92337472222141e-06, "Full-pretrain/Loss": 1.88519287109375, "Full-pretrain/Loss (Raw)": 2.1591567993164062, "Full-pretrain/Step": 6817, "Full-pretrain/Step Time": 17.617312123999} +{"Full-pretrain/Learning Rate": 9.916602555525692e-06, "Full-pretrain/Loss": 1.888756513595581, "Full-pretrain/Loss (Raw)": 2.147036552429199, "Full-pretrain/Step": 6818, "Full-pretrain/Step Time": 17.622606866061687} +{"Full-pretrain/Learning Rate": 9.909832128694576e-06, "Full-pretrain/Loss": 1.8841166496276855, "Full-pretrain/Loss (Raw)": 1.7870687246322632, "Full-pretrain/Step": 6819, "Full-pretrain/Step Time": 17.625590531155467} +{"Full-pretrain/Learning Rate": 9.903063442509015e-06, "Full-pretrain/Loss": 1.8630757331848145, "Full-pretrain/Loss (Raw)": 1.1461267471313477, "Full-pretrain/Step": 6820, "Full-pretrain/Step Time": 17.621207842603326} +{"Full-pretrain/Learning Rate": 9.89629649774978e-06, "Full-pretrain/Loss": 1.8604533672332764, "Full-pretrain/Loss (Raw)": 1.8490718603134155, "Full-pretrain/Step": 6821, "Full-pretrain/Step Time": 17.617342226207256} +{"Full-pretrain/Learning Rate": 9.889531295197432e-06, "Full-pretrain/Loss": 1.8565784692764282, "Full-pretrain/Loss (Raw)": 1.9518340826034546, "Full-pretrain/Step": 6822, "Full-pretrain/Step Time": 17.61488982848823} +{"Full-pretrain/Learning Rate": 9.882767835632342e-06, "Full-pretrain/Loss": 1.8611116409301758, "Full-pretrain/Loss (Raw)": 2.0009241104125977, "Full-pretrain/Step": 6823, "Full-pretrain/Step Time": 17.622569059953094} +{"Full-pretrain/Learning Rate": 9.87600611983468e-06, "Full-pretrain/Loss": 1.85990309715271, "Full-pretrain/Loss (Raw)": 1.8911391496658325, "Full-pretrain/Step": 6824, "Full-pretrain/Step Time": 17.62320980615914} +{"Full-pretrain/Learning Rate": 9.869246148584385e-06, "Full-pretrain/Loss": 1.8549588918685913, "Full-pretrain/Loss (Raw)": 1.8257534503936768, "Full-pretrain/Step": 6825, "Full-pretrain/Step Time": 17.623993972316384} +{"Full-pretrain/Learning Rate": 9.862487922661231e-06, "Full-pretrain/Loss": 1.8556524515151978, "Full-pretrain/Loss (Raw)": 1.8973573446273804, "Full-pretrain/Step": 6826, "Full-pretrain/Step Time": 17.61897162348032} +{"Full-pretrain/Learning Rate": 9.855731442844775e-06, "Full-pretrain/Loss": 1.8634707927703857, "Full-pretrain/Loss (Raw)": 2.022463083267212, "Full-pretrain/Step": 6827, "Full-pretrain/Step Time": 17.623511353507638} +{"Full-pretrain/Learning Rate": 9.848976709914376e-06, "Full-pretrain/Loss": 1.8661680221557617, "Full-pretrain/Loss (Raw)": 1.9681930541992188, "Full-pretrain/Step": 6828, "Full-pretrain/Step Time": 17.626559749245644} +{"Full-pretrain/Learning Rate": 9.842223724649199e-06, "Full-pretrain/Loss": 1.897721290588379, "Full-pretrain/Loss (Raw)": 2.3733139038085938, "Full-pretrain/Step": 6829, "Full-pretrain/Step Time": 17.621313041076064} +{"Full-pretrain/Learning Rate": 9.835472487828176e-06, "Full-pretrain/Loss": 1.8952409029006958, "Full-pretrain/Loss (Raw)": 1.9329746961593628, "Full-pretrain/Step": 6830, "Full-pretrain/Step Time": 17.617595318704844} +{"Full-pretrain/Learning Rate": 9.828723000230084e-06, "Full-pretrain/Loss": 1.9026933908462524, "Full-pretrain/Loss (Raw)": 2.0641753673553467, "Full-pretrain/Step": 6831, "Full-pretrain/Step Time": 17.613835720345378} +{"Full-pretrain/Learning Rate": 9.821975262633453e-06, "Full-pretrain/Loss": 1.9068329334259033, "Full-pretrain/Loss (Raw)": 1.9619550704956055, "Full-pretrain/Step": 6832, "Full-pretrain/Step Time": 17.61396101489663} +{"Full-pretrain/Learning Rate": 9.815229275816643e-06, "Full-pretrain/Loss": 1.908453345298767, "Full-pretrain/Loss (Raw)": 1.9352331161499023, "Full-pretrain/Step": 6833, "Full-pretrain/Step Time": 17.611867912113667} +{"Full-pretrain/Learning Rate": 9.808485040557796e-06, "Full-pretrain/Loss": 1.9049209356307983, "Full-pretrain/Loss (Raw)": 1.9500024318695068, "Full-pretrain/Step": 6834, "Full-pretrain/Step Time": 17.608832720667124} +{"Full-pretrain/Learning Rate": 9.801742557634872e-06, "Full-pretrain/Loss": 1.9145805835723877, "Full-pretrain/Loss (Raw)": 2.1255087852478027, "Full-pretrain/Step": 6835, "Full-pretrain/Step Time": 17.61010307446122} +{"Full-pretrain/Learning Rate": 9.795001827825596e-06, "Full-pretrain/Loss": 1.9126613140106201, "Full-pretrain/Loss (Raw)": 1.8360278606414795, "Full-pretrain/Step": 6836, "Full-pretrain/Step Time": 17.614289270713925} +{"Full-pretrain/Learning Rate": 9.788262851907512e-06, "Full-pretrain/Loss": 1.9175254106521606, "Full-pretrain/Loss (Raw)": 1.8317643404006958, "Full-pretrain/Step": 6837, "Full-pretrain/Step Time": 17.61463887616992} +{"Full-pretrain/Learning Rate": 9.781525630657964e-06, "Full-pretrain/Loss": 1.9245269298553467, "Full-pretrain/Loss (Raw)": 2.1838767528533936, "Full-pretrain/Step": 6838, "Full-pretrain/Step Time": 17.61429025605321} +{"Full-pretrain/Learning Rate": 9.774790164854087e-06, "Full-pretrain/Loss": 1.9355502128601074, "Full-pretrain/Loss (Raw)": 2.087360382080078, "Full-pretrain/Step": 6839, "Full-pretrain/Step Time": 17.611062724143267} +{"Full-pretrain/Learning Rate": 9.76805645527282e-06, "Full-pretrain/Loss": 1.9410542249679565, "Full-pretrain/Loss (Raw)": 2.157691240310669, "Full-pretrain/Step": 6840, "Full-pretrain/Step Time": 17.612901769578457} +{"Full-pretrain/Learning Rate": 9.76132450269088e-06, "Full-pretrain/Loss": 1.933566689491272, "Full-pretrain/Loss (Raw)": 1.6901907920837402, "Full-pretrain/Step": 6841, "Full-pretrain/Step Time": 17.61309283412993} +{"Full-pretrain/Learning Rate": 9.754594307884808e-06, "Full-pretrain/Loss": 1.9305644035339355, "Full-pretrain/Loss (Raw)": 1.7805192470550537, "Full-pretrain/Step": 6842, "Full-pretrain/Step Time": 17.614582424983382} +{"Full-pretrain/Learning Rate": 9.747865871630917e-06, "Full-pretrain/Loss": 1.949892282485962, "Full-pretrain/Loss (Raw)": 2.115710735321045, "Full-pretrain/Step": 6843, "Full-pretrain/Step Time": 17.61334329098463} +{"Full-pretrain/Learning Rate": 9.741139194705345e-06, "Full-pretrain/Loss": 1.9552631378173828, "Full-pretrain/Loss (Raw)": 1.995487928390503, "Full-pretrain/Step": 6844, "Full-pretrain/Step Time": 17.619034957140684} +{"Full-pretrain/Learning Rate": 9.73441427788401e-06, "Full-pretrain/Loss": 1.9558188915252686, "Full-pretrain/Loss (Raw)": 1.923412561416626, "Full-pretrain/Step": 6845, "Full-pretrain/Step Time": 17.620460595935583} +{"Full-pretrain/Learning Rate": 9.727691121942614e-06, "Full-pretrain/Loss": 1.952559471130371, "Full-pretrain/Loss (Raw)": 1.9192698001861572, "Full-pretrain/Step": 6846, "Full-pretrain/Step Time": 17.6190620418638} +{"Full-pretrain/Learning Rate": 9.72096972765669e-06, "Full-pretrain/Loss": 1.9549779891967773, "Full-pretrain/Loss (Raw)": 2.013416290283203, "Full-pretrain/Step": 6847, "Full-pretrain/Step Time": 17.617561534047127} +{"Full-pretrain/Learning Rate": 9.71425009580153e-06, "Full-pretrain/Loss": 1.95065438747406, "Full-pretrain/Loss (Raw)": 1.896923542022705, "Full-pretrain/Step": 6848, "Full-pretrain/Step Time": 17.623759681358933} +{"Full-pretrain/Learning Rate": 9.70753222715225e-06, "Full-pretrain/Loss": 1.9412813186645508, "Full-pretrain/Loss (Raw)": 1.8592195510864258, "Full-pretrain/Step": 6849, "Full-pretrain/Step Time": 17.623479144647717} +{"Full-pretrain/Learning Rate": 9.70081612248376e-06, "Full-pretrain/Loss": 1.9359796047210693, "Full-pretrain/Loss (Raw)": 1.9773807525634766, "Full-pretrain/Step": 6850, "Full-pretrain/Step Time": 17.622464941814542} +{"Full-pretrain/Learning Rate": 9.694101782570747e-06, "Full-pretrain/Loss": 1.9342707395553589, "Full-pretrain/Loss (Raw)": 1.7323873043060303, "Full-pretrain/Step": 6851, "Full-pretrain/Step Time": 17.627773052081466} +{"Full-pretrain/Learning Rate": 9.687389208187713e-06, "Full-pretrain/Loss": 1.9607828855514526, "Full-pretrain/Loss (Raw)": 1.9945111274719238, "Full-pretrain/Step": 6852, "Full-pretrain/Step Time": 17.62724213115871} +{"Full-pretrain/Learning Rate": 9.680678400108955e-06, "Full-pretrain/Loss": 1.9705030918121338, "Full-pretrain/Loss (Raw)": 2.160123825073242, "Full-pretrain/Step": 6853, "Full-pretrain/Step Time": 17.62548199109733} +{"Full-pretrain/Learning Rate": 9.673969359108559e-06, "Full-pretrain/Loss": 1.974384069442749, "Full-pretrain/Loss (Raw)": 2.0760185718536377, "Full-pretrain/Step": 6854, "Full-pretrain/Step Time": 17.62825416214764} +{"Full-pretrain/Learning Rate": 9.66726208596041e-06, "Full-pretrain/Loss": 1.9788663387298584, "Full-pretrain/Loss (Raw)": 2.144362449645996, "Full-pretrain/Step": 6855, "Full-pretrain/Step Time": 17.625809017568827} +{"Full-pretrain/Learning Rate": 9.660556581438201e-06, "Full-pretrain/Loss": 1.9772605895996094, "Full-pretrain/Loss (Raw)": 1.839754343032837, "Full-pretrain/Step": 6856, "Full-pretrain/Step Time": 17.62943277321756} +{"Full-pretrain/Learning Rate": 9.653852846315391e-06, "Full-pretrain/Loss": 1.985395908355713, "Full-pretrain/Loss (Raw)": 2.0860819816589355, "Full-pretrain/Step": 6857, "Full-pretrain/Step Time": 17.627955911681056} +{"Full-pretrain/Learning Rate": 9.647150881365264e-06, "Full-pretrain/Loss": 1.9894397258758545, "Full-pretrain/Loss (Raw)": 2.0267553329467773, "Full-pretrain/Step": 6858, "Full-pretrain/Step Time": 17.63003921881318} +{"Full-pretrain/Learning Rate": 9.640450687360882e-06, "Full-pretrain/Loss": 1.9848982095718384, "Full-pretrain/Loss (Raw)": 1.8771412372589111, "Full-pretrain/Step": 6859, "Full-pretrain/Step Time": 17.630675703287125} +{"Full-pretrain/Learning Rate": 9.633752265075122e-06, "Full-pretrain/Loss": 1.9888263940811157, "Full-pretrain/Loss (Raw)": 2.0938949584960938, "Full-pretrain/Step": 6860, "Full-pretrain/Step Time": 17.628456130623817} +{"Full-pretrain/Learning Rate": 9.627055615280642e-06, "Full-pretrain/Loss": 1.9739363193511963, "Full-pretrain/Loss (Raw)": 1.8968288898468018, "Full-pretrain/Step": 6861, "Full-pretrain/Step Time": 17.640252102166414} +{"Full-pretrain/Learning Rate": 9.620360738749888e-06, "Full-pretrain/Loss": 1.9718070030212402, "Full-pretrain/Loss (Raw)": 1.8648357391357422, "Full-pretrain/Step": 6862, "Full-pretrain/Step Time": 17.635024970397353} +{"Full-pretrain/Learning Rate": 9.613667636255116e-06, "Full-pretrain/Loss": 1.9680975675582886, "Full-pretrain/Loss (Raw)": 1.9454755783081055, "Full-pretrain/Step": 6863, "Full-pretrain/Step Time": 17.630476839840412} +{"Full-pretrain/Learning Rate": 9.606976308568386e-06, "Full-pretrain/Loss": 1.9625458717346191, "Full-pretrain/Loss (Raw)": 1.7842991352081299, "Full-pretrain/Step": 6864, "Full-pretrain/Step Time": 17.637961013242602} +{"Full-pretrain/Learning Rate": 9.600286756461519e-06, "Full-pretrain/Loss": 1.9572010040283203, "Full-pretrain/Loss (Raw)": 1.7641996145248413, "Full-pretrain/Step": 6865, "Full-pretrain/Step Time": 17.641604540869594} +{"Full-pretrain/Learning Rate": 9.593598980706173e-06, "Full-pretrain/Loss": 1.9746811389923096, "Full-pretrain/Loss (Raw)": 2.5093648433685303, "Full-pretrain/Step": 6866, "Full-pretrain/Step Time": 17.63453915156424} +{"Full-pretrain/Learning Rate": 9.586912982073763e-06, "Full-pretrain/Loss": 1.9740427732467651, "Full-pretrain/Loss (Raw)": 2.1050829887390137, "Full-pretrain/Step": 6867, "Full-pretrain/Step Time": 17.6330354642123} +{"Full-pretrain/Learning Rate": 9.580228761335519e-06, "Full-pretrain/Loss": 1.9769359827041626, "Full-pretrain/Loss (Raw)": 1.9286112785339355, "Full-pretrain/Step": 6868, "Full-pretrain/Step Time": 17.63671657256782} +{"Full-pretrain/Learning Rate": 9.573546319262473e-06, "Full-pretrain/Loss": 1.982541799545288, "Full-pretrain/Loss (Raw)": 2.0111536979675293, "Full-pretrain/Step": 6869, "Full-pretrain/Step Time": 17.642596062272787} +{"Full-pretrain/Learning Rate": 9.566865656625434e-06, "Full-pretrain/Loss": 1.969738483428955, "Full-pretrain/Loss (Raw)": 1.7741655111312866, "Full-pretrain/Step": 6870, "Full-pretrain/Step Time": 17.640803892165422} +{"Full-pretrain/Learning Rate": 9.56018677419503e-06, "Full-pretrain/Loss": 1.9649906158447266, "Full-pretrain/Loss (Raw)": 1.9354287385940552, "Full-pretrain/Step": 6871, "Full-pretrain/Step Time": 17.640802703797817} +{"Full-pretrain/Learning Rate": 9.553509672741645e-06, "Full-pretrain/Loss": 1.9587137699127197, "Full-pretrain/Loss (Raw)": 1.9568333625793457, "Full-pretrain/Step": 6872, "Full-pretrain/Step Time": 17.64085854962468} +{"Full-pretrain/Learning Rate": 9.546834353035492e-06, "Full-pretrain/Loss": 1.9702755212783813, "Full-pretrain/Loss (Raw)": 2.0601675510406494, "Full-pretrain/Step": 6873, "Full-pretrain/Step Time": 17.648748895153403} +{"Full-pretrain/Learning Rate": 9.540160815846566e-06, "Full-pretrain/Loss": 1.9912052154541016, "Full-pretrain/Loss (Raw)": 2.4502716064453125, "Full-pretrain/Step": 6874, "Full-pretrain/Step Time": 17.650103580206633} +{"Full-pretrain/Learning Rate": 9.533489061944655e-06, "Full-pretrain/Loss": 1.9748231172561646, "Full-pretrain/Loss (Raw)": 1.5914790630340576, "Full-pretrain/Step": 6875, "Full-pretrain/Step Time": 17.647117452695966} +{"Full-pretrain/Learning Rate": 9.526819092099348e-06, "Full-pretrain/Loss": 1.9628360271453857, "Full-pretrain/Loss (Raw)": 1.6119036674499512, "Full-pretrain/Step": 6876, "Full-pretrain/Step Time": 17.642167672514915} +{"Full-pretrain/Learning Rate": 9.520150907080028e-06, "Full-pretrain/Loss": 1.9629931449890137, "Full-pretrain/Loss (Raw)": 1.9284403324127197, "Full-pretrain/Step": 6877, "Full-pretrain/Step Time": 17.647238293662667} +{"Full-pretrain/Learning Rate": 9.513484507655854e-06, "Full-pretrain/Loss": 1.959802269935608, "Full-pretrain/Loss (Raw)": 1.8171637058258057, "Full-pretrain/Step": 6878, "Full-pretrain/Step Time": 17.648661080747843} +{"Full-pretrain/Learning Rate": 9.506819894595798e-06, "Full-pretrain/Loss": 1.9575064182281494, "Full-pretrain/Loss (Raw)": 1.9399445056915283, "Full-pretrain/Step": 6879, "Full-pretrain/Step Time": 17.64467770792544} +{"Full-pretrain/Learning Rate": 9.500157068668632e-06, "Full-pretrain/Loss": 1.9506175518035889, "Full-pretrain/Loss (Raw)": 1.6764825582504272, "Full-pretrain/Step": 6880, "Full-pretrain/Step Time": 17.64819810912013} +{"Full-pretrain/Learning Rate": 9.493496030642893e-06, "Full-pretrain/Loss": 1.9574806690216064, "Full-pretrain/Loss (Raw)": 2.078835964202881, "Full-pretrain/Step": 6881, "Full-pretrain/Step Time": 17.651586467400193} +{"Full-pretrain/Learning Rate": 9.486836781286945e-06, "Full-pretrain/Loss": 1.957019329071045, "Full-pretrain/Loss (Raw)": 1.9626200199127197, "Full-pretrain/Step": 6882, "Full-pretrain/Step Time": 17.650775304064155} +{"Full-pretrain/Learning Rate": 9.480179321368912e-06, "Full-pretrain/Loss": 1.9697562456130981, "Full-pretrain/Loss (Raw)": 2.1399686336517334, "Full-pretrain/Step": 6883, "Full-pretrain/Step Time": 17.652246432378888} +{"Full-pretrain/Learning Rate": 9.473523651656744e-06, "Full-pretrain/Loss": 1.9710463285446167, "Full-pretrain/Loss (Raw)": 2.035792350769043, "Full-pretrain/Step": 6884, "Full-pretrain/Step Time": 17.654413992539048} +{"Full-pretrain/Learning Rate": 9.466869772918163e-06, "Full-pretrain/Loss": 1.9632521867752075, "Full-pretrain/Loss (Raw)": 1.9107122421264648, "Full-pretrain/Step": 6885, "Full-pretrain/Step Time": 17.64933478459716} +{"Full-pretrain/Learning Rate": 9.460217685920697e-06, "Full-pretrain/Loss": 1.959031581878662, "Full-pretrain/Loss (Raw)": 1.9409575462341309, "Full-pretrain/Step": 6886, "Full-pretrain/Step Time": 17.6539472527802} +{"Full-pretrain/Learning Rate": 9.45356739143167e-06, "Full-pretrain/Loss": 1.949516773223877, "Full-pretrain/Loss (Raw)": 1.839890480041504, "Full-pretrain/Step": 6887, "Full-pretrain/Step Time": 17.65206445939839} +{"Full-pretrain/Learning Rate": 9.44691889021817e-06, "Full-pretrain/Loss": 1.9492883682250977, "Full-pretrain/Loss (Raw)": 1.8324451446533203, "Full-pretrain/Step": 6888, "Full-pretrain/Step Time": 17.64993368089199} +{"Full-pretrain/Learning Rate": 9.440272183047112e-06, "Full-pretrain/Loss": 1.9454152584075928, "Full-pretrain/Loss (Raw)": 1.962144136428833, "Full-pretrain/Step": 6889, "Full-pretrain/Step Time": 17.650160355493426} +{"Full-pretrain/Learning Rate": 9.433627270685185e-06, "Full-pretrain/Loss": 1.9479182958602905, "Full-pretrain/Loss (Raw)": 2.1068520545959473, "Full-pretrain/Step": 6890, "Full-pretrain/Step Time": 17.652039086446166} +{"Full-pretrain/Learning Rate": 9.426984153898888e-06, "Full-pretrain/Loss": 1.9481079578399658, "Full-pretrain/Loss (Raw)": 1.883206844329834, "Full-pretrain/Step": 6891, "Full-pretrain/Step Time": 17.654723906889558} +{"Full-pretrain/Learning Rate": 9.420342833454493e-06, "Full-pretrain/Loss": 1.942508578300476, "Full-pretrain/Loss (Raw)": 1.9147148132324219, "Full-pretrain/Step": 6892, "Full-pretrain/Step Time": 17.6565371863544} +{"Full-pretrain/Learning Rate": 9.413703310118085e-06, "Full-pretrain/Loss": 1.9520184993743896, "Full-pretrain/Loss (Raw)": 2.2011466026306152, "Full-pretrain/Step": 6893, "Full-pretrain/Step Time": 17.657903365790844} +{"Full-pretrain/Learning Rate": 9.407065584655516e-06, "Full-pretrain/Loss": 1.9495933055877686, "Full-pretrain/Loss (Raw)": 1.7872347831726074, "Full-pretrain/Step": 6894, "Full-pretrain/Step Time": 17.653557006269693} +{"Full-pretrain/Learning Rate": 9.400429657832451e-06, "Full-pretrain/Loss": 1.9410251379013062, "Full-pretrain/Loss (Raw)": 1.6712913513183594, "Full-pretrain/Step": 6895, "Full-pretrain/Step Time": 17.65720553509891} +{"Full-pretrain/Learning Rate": 9.393795530414354e-06, "Full-pretrain/Loss": 1.947818398475647, "Full-pretrain/Loss (Raw)": 2.001682996749878, "Full-pretrain/Step": 6896, "Full-pretrain/Step Time": 17.654082277789712} +{"Full-pretrain/Learning Rate": 9.387163203166447e-06, "Full-pretrain/Loss": 1.9535719156265259, "Full-pretrain/Loss (Raw)": 1.9483131170272827, "Full-pretrain/Step": 6897, "Full-pretrain/Step Time": 17.653829315677285} +{"Full-pretrain/Learning Rate": 9.380532676853776e-06, "Full-pretrain/Loss": 1.9427237510681152, "Full-pretrain/Loss (Raw)": 2.1622209548950195, "Full-pretrain/Step": 6898, "Full-pretrain/Step Time": 17.64943645335734} +{"Full-pretrain/Learning Rate": 9.373903952241183e-06, "Full-pretrain/Loss": 1.9337186813354492, "Full-pretrain/Loss (Raw)": 1.8169223070144653, "Full-pretrain/Step": 6899, "Full-pretrain/Step Time": 17.652354272082448} +{"Full-pretrain/Learning Rate": 9.36727703009327e-06, "Full-pretrain/Loss": 1.9292484521865845, "Full-pretrain/Loss (Raw)": 1.7855653762817383, "Full-pretrain/Step": 6900, "Full-pretrain/Step Time": 17.651587737724185} +{"Full-pretrain/Learning Rate": 9.360651911174455e-06, "Full-pretrain/Loss": 1.9261752367019653, "Full-pretrain/Loss (Raw)": 1.9128105640411377, "Full-pretrain/Step": 6901, "Full-pretrain/Step Time": 17.647878786548972} +{"Full-pretrain/Learning Rate": 9.354028596248949e-06, "Full-pretrain/Loss": 1.932884931564331, "Full-pretrain/Loss (Raw)": 1.9888707399368286, "Full-pretrain/Step": 6902, "Full-pretrain/Step Time": 17.645065179094672} +{"Full-pretrain/Learning Rate": 9.347407086080754e-06, "Full-pretrain/Loss": 1.9299819469451904, "Full-pretrain/Loss (Raw)": 1.8425379991531372, "Full-pretrain/Step": 6903, "Full-pretrain/Step Time": 17.650217924267054} +{"Full-pretrain/Learning Rate": 9.340787381433639e-06, "Full-pretrain/Loss": 1.9338624477386475, "Full-pretrain/Loss (Raw)": 2.081007957458496, "Full-pretrain/Step": 6904, "Full-pretrain/Step Time": 17.652157217264175} +{"Full-pretrain/Learning Rate": 9.3341694830712e-06, "Full-pretrain/Loss": 1.9342222213745117, "Full-pretrain/Loss (Raw)": 2.0716781616210938, "Full-pretrain/Step": 6905, "Full-pretrain/Step Time": 17.652370056137443} +{"Full-pretrain/Learning Rate": 9.327553391756806e-06, "Full-pretrain/Loss": 1.9098284244537354, "Full-pretrain/Loss (Raw)": 1.6696712970733643, "Full-pretrain/Step": 6906, "Full-pretrain/Step Time": 17.65263970941305} +{"Full-pretrain/Learning Rate": 9.320939108253619e-06, "Full-pretrain/Loss": 1.9260592460632324, "Full-pretrain/Loss (Raw)": 2.1108648777008057, "Full-pretrain/Step": 6907, "Full-pretrain/Step Time": 17.651715461164713} +{"Full-pretrain/Learning Rate": 9.314326633324603e-06, "Full-pretrain/Loss": 1.9279600381851196, "Full-pretrain/Loss (Raw)": 1.672729730606079, "Full-pretrain/Step": 6908, "Full-pretrain/Step Time": 17.6505383644253} +{"Full-pretrain/Learning Rate": 9.307715967732491e-06, "Full-pretrain/Loss": 1.928297758102417, "Full-pretrain/Loss (Raw)": 1.9392460584640503, "Full-pretrain/Step": 6909, "Full-pretrain/Step Time": 17.64919077605009} +{"Full-pretrain/Learning Rate": 9.301107112239827e-06, "Full-pretrain/Loss": 1.9293171167373657, "Full-pretrain/Loss (Raw)": 1.8497841358184814, "Full-pretrain/Step": 6910, "Full-pretrain/Step Time": 17.649584406986833} +{"Full-pretrain/Learning Rate": 9.29450006760894e-06, "Full-pretrain/Loss": 1.9297078847885132, "Full-pretrain/Loss (Raw)": 1.9524511098861694, "Full-pretrain/Step": 6911, "Full-pretrain/Step Time": 17.64663835056126} +{"Full-pretrain/Learning Rate": 9.287894834601951e-06, "Full-pretrain/Loss": 1.9388879537582397, "Full-pretrain/Loss (Raw)": 1.9702425003051758, "Full-pretrain/Step": 6912, "Full-pretrain/Step Time": 17.649921344593167} +{"Full-pretrain/Learning Rate": 9.28129141398078e-06, "Full-pretrain/Loss": 1.936863660812378, "Full-pretrain/Loss (Raw)": 2.0140581130981445, "Full-pretrain/Step": 6913, "Full-pretrain/Step Time": 17.64726777933538} +{"Full-pretrain/Learning Rate": 9.274689806507114e-06, "Full-pretrain/Loss": 1.9384586811065674, "Full-pretrain/Loss (Raw)": 2.013662815093994, "Full-pretrain/Step": 6914, "Full-pretrain/Step Time": 17.64912942610681} +{"Full-pretrain/Learning Rate": 9.26809001294246e-06, "Full-pretrain/Loss": 1.937707781791687, "Full-pretrain/Loss (Raw)": 2.1159396171569824, "Full-pretrain/Step": 6915, "Full-pretrain/Step Time": 17.65171796642244} +{"Full-pretrain/Learning Rate": 9.261492034048083e-06, "Full-pretrain/Loss": 1.936322569847107, "Full-pretrain/Loss (Raw)": 1.991464614868164, "Full-pretrain/Step": 6916, "Full-pretrain/Step Time": 17.654744004830718} +{"Full-pretrain/Learning Rate": 9.254895870585072e-06, "Full-pretrain/Loss": 1.9252263307571411, "Full-pretrain/Loss (Raw)": 1.555632472038269, "Full-pretrain/Step": 6917, "Full-pretrain/Step Time": 17.652304334565997} +{"Full-pretrain/Learning Rate": 9.24830152331429e-06, "Full-pretrain/Loss": 1.9230152368545532, "Full-pretrain/Loss (Raw)": 1.8702008724212646, "Full-pretrain/Step": 6918, "Full-pretrain/Step Time": 17.656338637694716} +{"Full-pretrain/Learning Rate": 9.241708992996397e-06, "Full-pretrain/Loss": 1.928228735923767, "Full-pretrain/Loss (Raw)": 2.0067241191864014, "Full-pretrain/Step": 6919, "Full-pretrain/Step Time": 17.65058482438326} +{"Full-pretrain/Learning Rate": 9.235118280391827e-06, "Full-pretrain/Loss": 1.938326358795166, "Full-pretrain/Loss (Raw)": 2.1555674076080322, "Full-pretrain/Step": 6920, "Full-pretrain/Step Time": 17.65742746181786} +{"Full-pretrain/Learning Rate": 9.228529386260823e-06, "Full-pretrain/Loss": 1.9319634437561035, "Full-pretrain/Loss (Raw)": 1.7585307359695435, "Full-pretrain/Step": 6921, "Full-pretrain/Step Time": 17.66021484695375} +{"Full-pretrain/Learning Rate": 9.221942311363413e-06, "Full-pretrain/Loss": 1.928504467010498, "Full-pretrain/Loss (Raw)": 1.996166706085205, "Full-pretrain/Step": 6922, "Full-pretrain/Step Time": 17.661867756396532} +{"Full-pretrain/Learning Rate": 9.215357056459412e-06, "Full-pretrain/Loss": 1.9160572290420532, "Full-pretrain/Loss (Raw)": 1.4848952293395996, "Full-pretrain/Step": 6923, "Full-pretrain/Step Time": 17.656052762642503} +{"Full-pretrain/Learning Rate": 9.208773622308434e-06, "Full-pretrain/Loss": 1.9138818979263306, "Full-pretrain/Loss (Raw)": 1.8451054096221924, "Full-pretrain/Step": 6924, "Full-pretrain/Step Time": 17.66014581359923} +{"Full-pretrain/Learning Rate": 9.202192009669863e-06, "Full-pretrain/Loss": 1.9102797508239746, "Full-pretrain/Loss (Raw)": 2.0858778953552246, "Full-pretrain/Step": 6925, "Full-pretrain/Step Time": 17.66108931787312} +{"Full-pretrain/Learning Rate": 9.19561221930289e-06, "Full-pretrain/Loss": 1.9074735641479492, "Full-pretrain/Loss (Raw)": 1.6974352598190308, "Full-pretrain/Step": 6926, "Full-pretrain/Step Time": 17.651275493204594} +{"Full-pretrain/Learning Rate": 9.189034251966494e-06, "Full-pretrain/Loss": 1.9185073375701904, "Full-pretrain/Loss (Raw)": 2.0243749618530273, "Full-pretrain/Step": 6927, "Full-pretrain/Step Time": 17.65229345858097} +{"Full-pretrain/Learning Rate": 9.182458108419442e-06, "Full-pretrain/Loss": 1.9201340675354004, "Full-pretrain/Loss (Raw)": 2.0537354946136475, "Full-pretrain/Step": 6928, "Full-pretrain/Step Time": 17.65668250620365} +{"Full-pretrain/Learning Rate": 9.175883789420295e-06, "Full-pretrain/Loss": 1.9200351238250732, "Full-pretrain/Loss (Raw)": 1.9451476335525513, "Full-pretrain/Step": 6929, "Full-pretrain/Step Time": 17.658930826932192} +{"Full-pretrain/Learning Rate": 9.169311295727387e-06, "Full-pretrain/Loss": 1.9101734161376953, "Full-pretrain/Loss (Raw)": 1.8466508388519287, "Full-pretrain/Step": 6930, "Full-pretrain/Step Time": 17.66017478518188} +{"Full-pretrain/Learning Rate": 9.162740628098861e-06, "Full-pretrain/Loss": 1.914729118347168, "Full-pretrain/Loss (Raw)": 1.9627013206481934, "Full-pretrain/Step": 6931, "Full-pretrain/Step Time": 17.65534483268857} +{"Full-pretrain/Learning Rate": 9.156171787292633e-06, "Full-pretrain/Loss": 1.9241032600402832, "Full-pretrain/Loss (Raw)": 2.085538864135742, "Full-pretrain/Step": 6932, "Full-pretrain/Step Time": 17.66046915948391} +{"Full-pretrain/Learning Rate": 9.149604774066423e-06, "Full-pretrain/Loss": 1.9292354583740234, "Full-pretrain/Loss (Raw)": 2.0770363807678223, "Full-pretrain/Step": 6933, "Full-pretrain/Step Time": 17.654003025963902} +{"Full-pretrain/Learning Rate": 9.14303958917773e-06, "Full-pretrain/Loss": 1.9219751358032227, "Full-pretrain/Loss (Raw)": 1.7565466165542603, "Full-pretrain/Step": 6934, "Full-pretrain/Step Time": 17.663546888157725} +{"Full-pretrain/Learning Rate": 9.136476233383853e-06, "Full-pretrain/Loss": 1.9334113597869873, "Full-pretrain/Loss (Raw)": 2.2084908485412598, "Full-pretrain/Step": 6935, "Full-pretrain/Step Time": 17.65360927954316} +{"Full-pretrain/Learning Rate": 9.129914707441864e-06, "Full-pretrain/Loss": 1.9286712408065796, "Full-pretrain/Loss (Raw)": 1.9293279647827148, "Full-pretrain/Step": 6936, "Full-pretrain/Step Time": 17.657391162589192} +{"Full-pretrain/Learning Rate": 9.123355012108634e-06, "Full-pretrain/Loss": 1.925839900970459, "Full-pretrain/Loss (Raw)": 1.9810733795166016, "Full-pretrain/Step": 6937, "Full-pretrain/Step Time": 17.659676253795624} +{"Full-pretrain/Learning Rate": 9.116797148140823e-06, "Full-pretrain/Loss": 1.9309706687927246, "Full-pretrain/Loss (Raw)": 1.833857774734497, "Full-pretrain/Step": 6938, "Full-pretrain/Step Time": 17.65579577162862} +{"Full-pretrain/Learning Rate": 9.110241116294883e-06, "Full-pretrain/Loss": 1.9297864437103271, "Full-pretrain/Loss (Raw)": 2.072967767715454, "Full-pretrain/Step": 6939, "Full-pretrain/Step Time": 17.653627226129174} +{"Full-pretrain/Learning Rate": 9.103686917327053e-06, "Full-pretrain/Loss": 1.938295841217041, "Full-pretrain/Loss (Raw)": 1.9450289011001587, "Full-pretrain/Step": 6940, "Full-pretrain/Step Time": 17.65448136627674} +{"Full-pretrain/Learning Rate": 9.097134551993341e-06, "Full-pretrain/Loss": 1.9358670711517334, "Full-pretrain/Loss (Raw)": 1.8615285158157349, "Full-pretrain/Step": 6941, "Full-pretrain/Step Time": 17.66115729510784} +{"Full-pretrain/Learning Rate": 9.09058402104957e-06, "Full-pretrain/Loss": 1.9333908557891846, "Full-pretrain/Loss (Raw)": 1.7705416679382324, "Full-pretrain/Step": 6942, "Full-pretrain/Step Time": 17.66093049198389} +{"Full-pretrain/Learning Rate": 9.084035325251342e-06, "Full-pretrain/Loss": 1.9267377853393555, "Full-pretrain/Loss (Raw)": 1.7395576238632202, "Full-pretrain/Step": 6943, "Full-pretrain/Step Time": 17.659343469887972} +{"Full-pretrain/Learning Rate": 9.077488465354044e-06, "Full-pretrain/Loss": 1.9228417873382568, "Full-pretrain/Loss (Raw)": 1.8455679416656494, "Full-pretrain/Step": 6944, "Full-pretrain/Step Time": 17.658407159149647} +{"Full-pretrain/Learning Rate": 9.070943442112868e-06, "Full-pretrain/Loss": 1.917198896408081, "Full-pretrain/Loss (Raw)": 1.833486557006836, "Full-pretrain/Step": 6945, "Full-pretrain/Step Time": 17.663749877363443} +{"Full-pretrain/Learning Rate": 9.064400256282757e-06, "Full-pretrain/Loss": 1.9147365093231201, "Full-pretrain/Loss (Raw)": 1.9348663091659546, "Full-pretrain/Step": 6946, "Full-pretrain/Step Time": 17.660094168037176} +{"Full-pretrain/Learning Rate": 9.057858908618477e-06, "Full-pretrain/Loss": 1.9061199426651, "Full-pretrain/Loss (Raw)": 1.8402128219604492, "Full-pretrain/Step": 6947, "Full-pretrain/Step Time": 17.658265819773078} +{"Full-pretrain/Learning Rate": 9.051319399874577e-06, "Full-pretrain/Loss": 1.9103481769561768, "Full-pretrain/Loss (Raw)": 2.1267662048339844, "Full-pretrain/Step": 6948, "Full-pretrain/Step Time": 17.658333813771605} +{"Full-pretrain/Learning Rate": 9.044781730805373e-06, "Full-pretrain/Loss": 1.9245173931121826, "Full-pretrain/Loss (Raw)": 2.009049892425537, "Full-pretrain/Step": 6949, "Full-pretrain/Step Time": 17.67325484007597} +{"Full-pretrain/Learning Rate": 9.038245902164996e-06, "Full-pretrain/Loss": 1.919506311416626, "Full-pretrain/Loss (Raw)": 1.7098442316055298, "Full-pretrain/Step": 6950, "Full-pretrain/Step Time": 17.67068243958056} +{"Full-pretrain/Learning Rate": 9.03171191470734e-06, "Full-pretrain/Loss": 1.9174931049346924, "Full-pretrain/Loss (Raw)": 1.9423036575317383, "Full-pretrain/Step": 6951, "Full-pretrain/Step Time": 17.665312802419066} +{"Full-pretrain/Learning Rate": 9.025179769186098e-06, "Full-pretrain/Loss": 1.9167956113815308, "Full-pretrain/Loss (Raw)": 2.1332449913024902, "Full-pretrain/Step": 6952, "Full-pretrain/Step Time": 17.664321126416326} +{"Full-pretrain/Learning Rate": 9.01864946635476e-06, "Full-pretrain/Loss": 1.9098011255264282, "Full-pretrain/Loss (Raw)": 1.534708023071289, "Full-pretrain/Step": 6953, "Full-pretrain/Step Time": 17.670583425089717} +{"Full-pretrain/Learning Rate": 9.012121006966584e-06, "Full-pretrain/Loss": 1.9057304859161377, "Full-pretrain/Loss (Raw)": 1.865905523300171, "Full-pretrain/Step": 6954, "Full-pretrain/Step Time": 17.67372629418969} +{"Full-pretrain/Learning Rate": 9.005594391774635e-06, "Full-pretrain/Loss": 1.9217181205749512, "Full-pretrain/Loss (Raw)": 1.996503233909607, "Full-pretrain/Step": 6955, "Full-pretrain/Step Time": 17.67333540506661} +{"Full-pretrain/Learning Rate": 8.99906962153176e-06, "Full-pretrain/Loss": 1.9262216091156006, "Full-pretrain/Loss (Raw)": 1.989214301109314, "Full-pretrain/Step": 6956, "Full-pretrain/Step Time": 17.66695418395102} +{"Full-pretrain/Learning Rate": 8.992546696990576e-06, "Full-pretrain/Loss": 1.9205546379089355, "Full-pretrain/Loss (Raw)": 1.9045331478118896, "Full-pretrain/Step": 6957, "Full-pretrain/Step Time": 17.67052123323083} +{"Full-pretrain/Learning Rate": 8.986025618903498e-06, "Full-pretrain/Loss": 1.9262454509735107, "Full-pretrain/Loss (Raw)": 1.8795435428619385, "Full-pretrain/Step": 6958, "Full-pretrain/Step Time": 17.675584129989147} +{"Full-pretrain/Learning Rate": 8.979506388022743e-06, "Full-pretrain/Loss": 1.9205591678619385, "Full-pretrain/Loss (Raw)": 1.8424100875854492, "Full-pretrain/Step": 6959, "Full-pretrain/Step Time": 17.674437027424574} +{"Full-pretrain/Learning Rate": 8.972989005100294e-06, "Full-pretrain/Loss": 1.9215316772460938, "Full-pretrain/Loss (Raw)": 2.0848541259765625, "Full-pretrain/Step": 6960, "Full-pretrain/Step Time": 17.672415047883987} +{"Full-pretrain/Learning Rate": 8.96647347088794e-06, "Full-pretrain/Loss": 1.918363332748413, "Full-pretrain/Loss (Raw)": 1.84376060962677, "Full-pretrain/Step": 6961, "Full-pretrain/Step Time": 17.672196002677083} +{"Full-pretrain/Learning Rate": 8.959959786137228e-06, "Full-pretrain/Loss": 1.9225425720214844, "Full-pretrain/Loss (Raw)": 1.9803900718688965, "Full-pretrain/Step": 6962, "Full-pretrain/Step Time": 17.673986023291945} +{"Full-pretrain/Learning Rate": 8.953447951599517e-06, "Full-pretrain/Loss": 1.9287562370300293, "Full-pretrain/Loss (Raw)": 2.1615402698516846, "Full-pretrain/Step": 6963, "Full-pretrain/Step Time": 17.669094681739807} +{"Full-pretrain/Learning Rate": 8.946937968025956e-06, "Full-pretrain/Loss": 1.9242770671844482, "Full-pretrain/Loss (Raw)": 1.942202091217041, "Full-pretrain/Step": 6964, "Full-pretrain/Step Time": 17.666436687111855} +{"Full-pretrain/Learning Rate": 8.94042983616745e-06, "Full-pretrain/Loss": 1.9243297576904297, "Full-pretrain/Loss (Raw)": 2.0787227153778076, "Full-pretrain/Step": 6965, "Full-pretrain/Step Time": 17.66470635868609} +{"Full-pretrain/Learning Rate": 8.933923556774726e-06, "Full-pretrain/Loss": 1.9305497407913208, "Full-pretrain/Loss (Raw)": 1.955585241317749, "Full-pretrain/Step": 6966, "Full-pretrain/Step Time": 17.6619458720088} +{"Full-pretrain/Learning Rate": 8.927419130598263e-06, "Full-pretrain/Loss": 1.9252912998199463, "Full-pretrain/Loss (Raw)": 2.040221929550171, "Full-pretrain/Step": 6967, "Full-pretrain/Step Time": 17.67116012237966} +{"Full-pretrain/Learning Rate": 8.92091655838836e-06, "Full-pretrain/Loss": 1.9222846031188965, "Full-pretrain/Loss (Raw)": 1.833113193511963, "Full-pretrain/Step": 6968, "Full-pretrain/Step Time": 17.666056737303734} +{"Full-pretrain/Learning Rate": 8.914415840895077e-06, "Full-pretrain/Loss": 1.9242122173309326, "Full-pretrain/Loss (Raw)": 2.042759895324707, "Full-pretrain/Step": 6969, "Full-pretrain/Step Time": 17.662958201020956} +{"Full-pretrain/Learning Rate": 8.907916978868278e-06, "Full-pretrain/Loss": 1.930356502532959, "Full-pretrain/Loss (Raw)": 2.030470609664917, "Full-pretrain/Step": 6970, "Full-pretrain/Step Time": 17.662869540974498} +{"Full-pretrain/Learning Rate": 8.901419973057604e-06, "Full-pretrain/Loss": 1.9147759675979614, "Full-pretrain/Loss (Raw)": 1.574394702911377, "Full-pretrain/Step": 6971, "Full-pretrain/Step Time": 17.66842226497829} +{"Full-pretrain/Learning Rate": 8.894924824212474e-06, "Full-pretrain/Loss": 1.9091845750808716, "Full-pretrain/Loss (Raw)": 1.766102910041809, "Full-pretrain/Step": 6972, "Full-pretrain/Step Time": 17.66417477093637} +{"Full-pretrain/Learning Rate": 8.888431533082104e-06, "Full-pretrain/Loss": 1.9089343547821045, "Full-pretrain/Loss (Raw)": 1.8535211086273193, "Full-pretrain/Step": 6973, "Full-pretrain/Step Time": 17.66192315146327} +{"Full-pretrain/Learning Rate": 8.881940100415495e-06, "Full-pretrain/Loss": 1.9105868339538574, "Full-pretrain/Loss (Raw)": 1.823424220085144, "Full-pretrain/Step": 6974, "Full-pretrain/Step Time": 17.664533115923405} +{"Full-pretrain/Learning Rate": 8.875450526961433e-06, "Full-pretrain/Loss": 1.9050610065460205, "Full-pretrain/Loss (Raw)": 1.5627309083938599, "Full-pretrain/Step": 6975, "Full-pretrain/Step Time": 17.668074721470475} +{"Full-pretrain/Learning Rate": 8.868962813468484e-06, "Full-pretrain/Loss": 1.9061222076416016, "Full-pretrain/Loss (Raw)": 1.879523754119873, "Full-pretrain/Step": 6976, "Full-pretrain/Step Time": 17.667263444513083} +{"Full-pretrain/Learning Rate": 8.862476960685016e-06, "Full-pretrain/Loss": 1.9042904376983643, "Full-pretrain/Loss (Raw)": 1.7748687267303467, "Full-pretrain/Step": 6977, "Full-pretrain/Step Time": 17.668357649818063} +{"Full-pretrain/Learning Rate": 8.855992969359148e-06, "Full-pretrain/Loss": 1.9036962985992432, "Full-pretrain/Loss (Raw)": 1.9158544540405273, "Full-pretrain/Step": 6978, "Full-pretrain/Step Time": 17.6737070530653} +{"Full-pretrain/Learning Rate": 8.84951084023882e-06, "Full-pretrain/Loss": 1.9069440364837646, "Full-pretrain/Loss (Raw)": 1.944137692451477, "Full-pretrain/Step": 6979, "Full-pretrain/Step Time": 17.67683576978743} +{"Full-pretrain/Learning Rate": 8.843030574071747e-06, "Full-pretrain/Loss": 1.8915010690689087, "Full-pretrain/Loss (Raw)": 1.6325937509536743, "Full-pretrain/Step": 6980, "Full-pretrain/Step Time": 17.677780613303185} +{"Full-pretrain/Learning Rate": 8.836552171605414e-06, "Full-pretrain/Loss": 1.8869589567184448, "Full-pretrain/Loss (Raw)": 1.8637042045593262, "Full-pretrain/Step": 6981, "Full-pretrain/Step Time": 17.673171097412705} +{"Full-pretrain/Learning Rate": 8.830075633587115e-06, "Full-pretrain/Loss": 1.892040491104126, "Full-pretrain/Loss (Raw)": 1.8724523782730103, "Full-pretrain/Step": 6982, "Full-pretrain/Step Time": 17.673260824754834} +{"Full-pretrain/Learning Rate": 8.8236009607639e-06, "Full-pretrain/Loss": 1.8986902236938477, "Full-pretrain/Loss (Raw)": 2.1550920009613037, "Full-pretrain/Step": 6983, "Full-pretrain/Step Time": 17.678365755826235} +{"Full-pretrain/Learning Rate": 8.817128153882628e-06, "Full-pretrain/Loss": 1.894271731376648, "Full-pretrain/Loss (Raw)": 1.9918560981750488, "Full-pretrain/Step": 6984, "Full-pretrain/Step Time": 17.677507044747472} +{"Full-pretrain/Learning Rate": 8.810657213689939e-06, "Full-pretrain/Loss": 1.9081625938415527, "Full-pretrain/Loss (Raw)": 1.9792146682739258, "Full-pretrain/Step": 6985, "Full-pretrain/Step Time": 17.67449739575386} +{"Full-pretrain/Learning Rate": 8.80418814093225e-06, "Full-pretrain/Loss": 1.9052364826202393, "Full-pretrain/Loss (Raw)": 1.7722718715667725, "Full-pretrain/Step": 6986, "Full-pretrain/Step Time": 17.673117507249117} +{"Full-pretrain/Learning Rate": 8.797720936355777e-06, "Full-pretrain/Loss": 1.8974249362945557, "Full-pretrain/Loss (Raw)": 1.7465288639068604, "Full-pretrain/Step": 6987, "Full-pretrain/Step Time": 17.672503860667348} +{"Full-pretrain/Learning Rate": 8.791255600706488e-06, "Full-pretrain/Loss": 1.903934121131897, "Full-pretrain/Loss (Raw)": 2.1975135803222656, "Full-pretrain/Step": 6988, "Full-pretrain/Step Time": 17.677914356812835} +{"Full-pretrain/Learning Rate": 8.784792134730174e-06, "Full-pretrain/Loss": 1.9059464931488037, "Full-pretrain/Loss (Raw)": 1.9689247608184814, "Full-pretrain/Step": 6989, "Full-pretrain/Step Time": 17.6714410725981} +{"Full-pretrain/Learning Rate": 8.778330539172386e-06, "Full-pretrain/Loss": 1.911658525466919, "Full-pretrain/Loss (Raw)": 2.062330722808838, "Full-pretrain/Step": 6990, "Full-pretrain/Step Time": 17.670280408114195} +{"Full-pretrain/Learning Rate": 8.77187081477847e-06, "Full-pretrain/Loss": 1.9153172969818115, "Full-pretrain/Loss (Raw)": 1.959487795829773, "Full-pretrain/Step": 6991, "Full-pretrain/Step Time": 17.67991716042161} +{"Full-pretrain/Learning Rate": 8.765412962293562e-06, "Full-pretrain/Loss": 1.9129149913787842, "Full-pretrain/Loss (Raw)": 2.0079870223999023, "Full-pretrain/Step": 6992, "Full-pretrain/Step Time": 17.677488572895527} +{"Full-pretrain/Learning Rate": 8.758956982462555e-06, "Full-pretrain/Loss": 1.9022746086120605, "Full-pretrain/Loss (Raw)": 1.5032621622085571, "Full-pretrain/Step": 6993, "Full-pretrain/Step Time": 17.671051966026425} +{"Full-pretrain/Learning Rate": 8.752502876030153e-06, "Full-pretrain/Loss": 1.9024485349655151, "Full-pretrain/Loss (Raw)": 1.9859594106674194, "Full-pretrain/Step": 6994, "Full-pretrain/Step Time": 17.670820513740182} +{"Full-pretrain/Learning Rate": 8.746050643740833e-06, "Full-pretrain/Loss": 1.895970106124878, "Full-pretrain/Loss (Raw)": 1.9542280435562134, "Full-pretrain/Step": 6995, "Full-pretrain/Step Time": 17.676740124821663} +{"Full-pretrain/Learning Rate": 8.73960028633886e-06, "Full-pretrain/Loss": 1.9005961418151855, "Full-pretrain/Loss (Raw)": 2.0902342796325684, "Full-pretrain/Step": 6996, "Full-pretrain/Step Time": 17.676081612706184} +{"Full-pretrain/Learning Rate": 8.733151804568288e-06, "Full-pretrain/Loss": 1.899272084236145, "Full-pretrain/Loss (Raw)": 2.03635311126709, "Full-pretrain/Step": 6997, "Full-pretrain/Step Time": 17.667829820886254} +{"Full-pretrain/Learning Rate": 8.726705199172929e-06, "Full-pretrain/Loss": 1.8992667198181152, "Full-pretrain/Loss (Raw)": 1.955415964126587, "Full-pretrain/Step": 6998, "Full-pretrain/Step Time": 17.670422261580825} +{"Full-pretrain/Learning Rate": 8.720260470896416e-06, "Full-pretrain/Loss": 1.9006001949310303, "Full-pretrain/Loss (Raw)": 2.0828957557678223, "Full-pretrain/Step": 6999, "Full-pretrain/Step Time": 17.671427676454186} +{"Full-pretrain/Learning Rate": 8.713817620482128e-06, "Full-pretrain/Loss": 1.9085354804992676, "Full-pretrain/Loss (Raw)": 2.0870392322540283, "Full-pretrain/Step": 7000, "Full-pretrain/Step Time": 17.674213353544474} +{"Full-pretrain/Learning Rate": 8.707376648673254e-06, "Full-pretrain/Loss": 1.916641354560852, "Full-pretrain/Loss (Raw)": 2.3021481037139893, "Full-pretrain/Step": 7001, "Full-pretrain/Step Time": 17.667947065085173} +{"Full-pretrain/Learning Rate": 8.70093755621276e-06, "Full-pretrain/Loss": 1.910696029663086, "Full-pretrain/Loss (Raw)": 1.8402231931686401, "Full-pretrain/Step": 7002, "Full-pretrain/Step Time": 17.66832041926682} +{"Full-pretrain/Learning Rate": 8.694500343843395e-06, "Full-pretrain/Loss": 1.9166407585144043, "Full-pretrain/Loss (Raw)": 1.764627456665039, "Full-pretrain/Step": 7003, "Full-pretrain/Step Time": 17.66952300257981} +{"Full-pretrain/Learning Rate": 8.68806501230768e-06, "Full-pretrain/Loss": 1.9242160320281982, "Full-pretrain/Loss (Raw)": 2.0085060596466064, "Full-pretrain/Step": 7004, "Full-pretrain/Step Time": 17.67546160891652} +{"Full-pretrain/Learning Rate": 8.681631562347933e-06, "Full-pretrain/Loss": 1.9317419528961182, "Full-pretrain/Loss (Raw)": 2.0943541526794434, "Full-pretrain/Step": 7005, "Full-pretrain/Step Time": 17.668770885095} +{"Full-pretrain/Learning Rate": 8.675199994706252e-06, "Full-pretrain/Loss": 1.9300322532653809, "Full-pretrain/Loss (Raw)": 1.768711805343628, "Full-pretrain/Step": 7006, "Full-pretrain/Step Time": 17.66432416252792} +{"Full-pretrain/Learning Rate": 8.668770310124514e-06, "Full-pretrain/Loss": 1.9376575946807861, "Full-pretrain/Loss (Raw)": 1.80674147605896, "Full-pretrain/Step": 7007, "Full-pretrain/Step Time": 17.66471568495035} +{"Full-pretrain/Learning Rate": 8.662342509344387e-06, "Full-pretrain/Loss": 1.9421875476837158, "Full-pretrain/Loss (Raw)": 2.0244827270507812, "Full-pretrain/Step": 7008, "Full-pretrain/Step Time": 17.672748057171702} +{"Full-pretrain/Learning Rate": 8.655916593107305e-06, "Full-pretrain/Loss": 1.943580985069275, "Full-pretrain/Loss (Raw)": 1.819460153579712, "Full-pretrain/Step": 7009, "Full-pretrain/Step Time": 17.66823828779161} +{"Full-pretrain/Learning Rate": 8.649492562154499e-06, "Full-pretrain/Loss": 1.9446001052856445, "Full-pretrain/Loss (Raw)": 1.9484643936157227, "Full-pretrain/Step": 7010, "Full-pretrain/Step Time": 17.661215601488948} +{"Full-pretrain/Learning Rate": 8.643070417226978e-06, "Full-pretrain/Loss": 1.9407126903533936, "Full-pretrain/Loss (Raw)": 1.8197414875030518, "Full-pretrain/Step": 7011, "Full-pretrain/Step Time": 17.663281401619315} +{"Full-pretrain/Learning Rate": 8.63665015906554e-06, "Full-pretrain/Loss": 1.9506771564483643, "Full-pretrain/Loss (Raw)": 1.95145845413208, "Full-pretrain/Step": 7012, "Full-pretrain/Step Time": 17.66390165500343} +{"Full-pretrain/Learning Rate": 8.630231788410762e-06, "Full-pretrain/Loss": 1.9530596733093262, "Full-pretrain/Loss (Raw)": 1.9399449825286865, "Full-pretrain/Step": 7013, "Full-pretrain/Step Time": 17.663864417001605} +{"Full-pretrain/Learning Rate": 8.623815306002986e-06, "Full-pretrain/Loss": 1.9635751247406006, "Full-pretrain/Loss (Raw)": 2.2089457511901855, "Full-pretrain/Step": 7014, "Full-pretrain/Step Time": 17.665069507434964} +{"Full-pretrain/Learning Rate": 8.617400712582369e-06, "Full-pretrain/Loss": 1.955368161201477, "Full-pretrain/Loss (Raw)": 1.8924707174301147, "Full-pretrain/Step": 7015, "Full-pretrain/Step Time": 17.667253352701664} +{"Full-pretrain/Learning Rate": 8.610988008888813e-06, "Full-pretrain/Loss": 1.9518632888793945, "Full-pretrain/Loss (Raw)": 1.879699945449829, "Full-pretrain/Step": 7016, "Full-pretrain/Step Time": 17.669221121817827} +{"Full-pretrain/Learning Rate": 8.60457719566203e-06, "Full-pretrain/Loss": 1.9488143920898438, "Full-pretrain/Loss (Raw)": 1.8816475868225098, "Full-pretrain/Step": 7017, "Full-pretrain/Step Time": 17.67090106010437} +{"Full-pretrain/Learning Rate": 8.598168273641508e-06, "Full-pretrain/Loss": 1.9522879123687744, "Full-pretrain/Loss (Raw)": 1.8834264278411865, "Full-pretrain/Step": 7018, "Full-pretrain/Step Time": 17.66790134459734} +{"Full-pretrain/Learning Rate": 8.591761243566517e-06, "Full-pretrain/Loss": 1.9649360179901123, "Full-pretrain/Loss (Raw)": 2.151268482208252, "Full-pretrain/Step": 7019, "Full-pretrain/Step Time": 17.67016812413931} +{"Full-pretrain/Learning Rate": 8.585356106176094e-06, "Full-pretrain/Loss": 1.9509268999099731, "Full-pretrain/Loss (Raw)": 1.7492197751998901, "Full-pretrain/Step": 7020, "Full-pretrain/Step Time": 17.669307254254818} +{"Full-pretrain/Learning Rate": 8.578952862209075e-06, "Full-pretrain/Loss": 1.951474666595459, "Full-pretrain/Loss (Raw)": 1.9864546060562134, "Full-pretrain/Step": 7021, "Full-pretrain/Step Time": 17.66670781187713} +{"Full-pretrain/Learning Rate": 8.572551512404073e-06, "Full-pretrain/Loss": 1.953507900238037, "Full-pretrain/Loss (Raw)": 2.127391815185547, "Full-pretrain/Step": 7022, "Full-pretrain/Step Time": 17.664724227041006} +{"Full-pretrain/Learning Rate": 8.56615205749948e-06, "Full-pretrain/Loss": 1.9472875595092773, "Full-pretrain/Loss (Raw)": 1.7604377269744873, "Full-pretrain/Step": 7023, "Full-pretrain/Step Time": 17.66791235283017} +{"Full-pretrain/Learning Rate": 8.559754498233483e-06, "Full-pretrain/Loss": 1.946230173110962, "Full-pretrain/Loss (Raw)": 1.974149227142334, "Full-pretrain/Step": 7024, "Full-pretrain/Step Time": 17.66776285506785} +{"Full-pretrain/Learning Rate": 8.553358835344016e-06, "Full-pretrain/Loss": 1.9631991386413574, "Full-pretrain/Loss (Raw)": 2.0462732315063477, "Full-pretrain/Step": 7025, "Full-pretrain/Step Time": 17.659945340827107} +{"Full-pretrain/Learning Rate": 8.546965069568827e-06, "Full-pretrain/Loss": 1.9615541696548462, "Full-pretrain/Loss (Raw)": 1.933316707611084, "Full-pretrain/Step": 7026, "Full-pretrain/Step Time": 17.665492499247193} +{"Full-pretrain/Learning Rate": 8.540573201645438e-06, "Full-pretrain/Loss": 1.9635318517684937, "Full-pretrain/Loss (Raw)": 2.017514944076538, "Full-pretrain/Step": 7027, "Full-pretrain/Step Time": 17.668976459652185} +{"Full-pretrain/Learning Rate": 8.534183232311143e-06, "Full-pretrain/Loss": 1.9457693099975586, "Full-pretrain/Loss (Raw)": 1.5218315124511719, "Full-pretrain/Step": 7028, "Full-pretrain/Step Time": 17.669415218755603} +{"Full-pretrain/Learning Rate": 8.527795162303037e-06, "Full-pretrain/Loss": 1.9431657791137695, "Full-pretrain/Loss (Raw)": 1.9530411958694458, "Full-pretrain/Step": 7029, "Full-pretrain/Step Time": 17.6656608954072} +{"Full-pretrain/Learning Rate": 8.52140899235796e-06, "Full-pretrain/Loss": 1.9501076936721802, "Full-pretrain/Loss (Raw)": 2.1775567531585693, "Full-pretrain/Step": 7030, "Full-pretrain/Step Time": 17.66407415829599} +{"Full-pretrain/Learning Rate": 8.515024723212566e-06, "Full-pretrain/Loss": 1.9475386142730713, "Full-pretrain/Loss (Raw)": 2.000684976577759, "Full-pretrain/Step": 7031, "Full-pretrain/Step Time": 17.662190487608314} +{"Full-pretrain/Learning Rate": 8.508642355603286e-06, "Full-pretrain/Loss": 1.9396626949310303, "Full-pretrain/Loss (Raw)": 1.8350077867507935, "Full-pretrain/Step": 7032, "Full-pretrain/Step Time": 17.66324830427766} +{"Full-pretrain/Learning Rate": 8.502261890266303e-06, "Full-pretrain/Loss": 1.9285918474197388, "Full-pretrain/Loss (Raw)": 1.9478838443756104, "Full-pretrain/Step": 7033, "Full-pretrain/Step Time": 17.658229261636734} +{"Full-pretrain/Learning Rate": 8.495883327937614e-06, "Full-pretrain/Loss": 1.9177745580673218, "Full-pretrain/Loss (Raw)": 1.4940688610076904, "Full-pretrain/Step": 7034, "Full-pretrain/Step Time": 17.660834370180964} +{"Full-pretrain/Learning Rate": 8.489506669352994e-06, "Full-pretrain/Loss": 1.9057013988494873, "Full-pretrain/Loss (Raw)": 1.378288984298706, "Full-pretrain/Step": 7035, "Full-pretrain/Step Time": 17.662454592064023} +{"Full-pretrain/Learning Rate": 8.483131915247968e-06, "Full-pretrain/Loss": 1.9013853073120117, "Full-pretrain/Loss (Raw)": 1.8703930377960205, "Full-pretrain/Step": 7036, "Full-pretrain/Step Time": 17.66535330377519} +{"Full-pretrain/Learning Rate": 8.476759066357873e-06, "Full-pretrain/Loss": 1.9073121547698975, "Full-pretrain/Loss (Raw)": 2.284010648727417, "Full-pretrain/Step": 7037, "Full-pretrain/Step Time": 17.664534034207463} +{"Full-pretrain/Learning Rate": 8.470388123417811e-06, "Full-pretrain/Loss": 1.9137707948684692, "Full-pretrain/Loss (Raw)": 1.975386142730713, "Full-pretrain/Step": 7038, "Full-pretrain/Step Time": 17.6566792614758} +{"Full-pretrain/Learning Rate": 8.46401908716267e-06, "Full-pretrain/Loss": 1.9118642807006836, "Full-pretrain/Loss (Raw)": 1.745735764503479, "Full-pretrain/Step": 7039, "Full-pretrain/Step Time": 17.657951790839434} +{"Full-pretrain/Learning Rate": 8.457651958327123e-06, "Full-pretrain/Loss": 1.903857946395874, "Full-pretrain/Loss (Raw)": 1.7682805061340332, "Full-pretrain/Step": 7040, "Full-pretrain/Step Time": 17.654594926163554} +{"Full-pretrain/Learning Rate": 8.451286737645603e-06, "Full-pretrain/Loss": 1.9085121154785156, "Full-pretrain/Loss (Raw)": 1.9683918952941895, "Full-pretrain/Step": 7041, "Full-pretrain/Step Time": 17.654623894020915} +{"Full-pretrain/Learning Rate": 8.444923425852342e-06, "Full-pretrain/Loss": 1.9118678569793701, "Full-pretrain/Loss (Raw)": 2.0558478832244873, "Full-pretrain/Step": 7042, "Full-pretrain/Step Time": 17.64796494320035} +{"Full-pretrain/Learning Rate": 8.438562023681346e-06, "Full-pretrain/Loss": 1.9174964427947998, "Full-pretrain/Loss (Raw)": 1.9998528957366943, "Full-pretrain/Step": 7043, "Full-pretrain/Step Time": 17.65108652226627} +{"Full-pretrain/Learning Rate": 8.432202531866402e-06, "Full-pretrain/Loss": 1.9228187799453735, "Full-pretrain/Loss (Raw)": 2.1217751502990723, "Full-pretrain/Step": 7044, "Full-pretrain/Step Time": 17.646406687796116} +{"Full-pretrain/Learning Rate": 8.42584495114108e-06, "Full-pretrain/Loss": 1.9266324043273926, "Full-pretrain/Loss (Raw)": 2.061979055404663, "Full-pretrain/Step": 7045, "Full-pretrain/Step Time": 17.652314761653543} +{"Full-pretrain/Learning Rate": 8.419489282238708e-06, "Full-pretrain/Loss": 1.92034912109375, "Full-pretrain/Loss (Raw)": 2.007882833480835, "Full-pretrain/Step": 7046, "Full-pretrain/Step Time": 17.647913344204426} +{"Full-pretrain/Learning Rate": 8.413135525892425e-06, "Full-pretrain/Loss": 1.9220629930496216, "Full-pretrain/Loss (Raw)": 1.9473130702972412, "Full-pretrain/Step": 7047, "Full-pretrain/Step Time": 17.650627955794334} +{"Full-pretrain/Learning Rate": 8.406783682835135e-06, "Full-pretrain/Loss": 1.924095869064331, "Full-pretrain/Loss (Raw)": 1.9447537660598755, "Full-pretrain/Step": 7048, "Full-pretrain/Step Time": 17.64558088593185} +{"Full-pretrain/Learning Rate": 8.400433753799508e-06, "Full-pretrain/Loss": 1.9142513275146484, "Full-pretrain/Loss (Raw)": 1.566622257232666, "Full-pretrain/Step": 7049, "Full-pretrain/Step Time": 17.640007354319096} +{"Full-pretrain/Learning Rate": 8.394085739518024e-06, "Full-pretrain/Loss": 1.913346529006958, "Full-pretrain/Loss (Raw)": 1.8544695377349854, "Full-pretrain/Step": 7050, "Full-pretrain/Step Time": 17.640418184921145} +{"Full-pretrain/Learning Rate": 8.387739640722902e-06, "Full-pretrain/Loss": 1.8958256244659424, "Full-pretrain/Loss (Raw)": 1.5906040668487549, "Full-pretrain/Step": 7051, "Full-pretrain/Step Time": 17.649240965023637} +{"Full-pretrain/Learning Rate": 8.38139545814618e-06, "Full-pretrain/Loss": 1.9064533710479736, "Full-pretrain/Loss (Raw)": 2.0893025398254395, "Full-pretrain/Step": 7052, "Full-pretrain/Step Time": 17.64590920507908} +{"Full-pretrain/Learning Rate": 8.375053192519647e-06, "Full-pretrain/Loss": 1.9112930297851562, "Full-pretrain/Loss (Raw)": 2.141326427459717, "Full-pretrain/Step": 7053, "Full-pretrain/Step Time": 17.6413526982069} +{"Full-pretrain/Learning Rate": 8.36871284457489e-06, "Full-pretrain/Loss": 1.9033634662628174, "Full-pretrain/Loss (Raw)": 1.873647928237915, "Full-pretrain/Step": 7054, "Full-pretrain/Step Time": 17.644110839813948} +{"Full-pretrain/Learning Rate": 8.36237441504326e-06, "Full-pretrain/Loss": 1.9129648208618164, "Full-pretrain/Loss (Raw)": 2.067683458328247, "Full-pretrain/Step": 7055, "Full-pretrain/Step Time": 17.6481459364295} +{"Full-pretrain/Learning Rate": 8.3560379046559e-06, "Full-pretrain/Loss": 1.9062083959579468, "Full-pretrain/Loss (Raw)": 1.7579400539398193, "Full-pretrain/Step": 7056, "Full-pretrain/Step Time": 17.643982330337167} +{"Full-pretrain/Learning Rate": 8.34970331414371e-06, "Full-pretrain/Loss": 1.9088680744171143, "Full-pretrain/Loss (Raw)": 2.1313858032226562, "Full-pretrain/Step": 7057, "Full-pretrain/Step Time": 17.640128880739212} +{"Full-pretrain/Learning Rate": 8.343370644237396e-06, "Full-pretrain/Loss": 1.9039015769958496, "Full-pretrain/Loss (Raw)": 1.7743855714797974, "Full-pretrain/Step": 7058, "Full-pretrain/Step Time": 17.639684995636344} +{"Full-pretrain/Learning Rate": 8.337039895667423e-06, "Full-pretrain/Loss": 1.9054030179977417, "Full-pretrain/Loss (Raw)": 2.065563201904297, "Full-pretrain/Step": 7059, "Full-pretrain/Step Time": 17.64110104367137} +{"Full-pretrain/Learning Rate": 8.33071106916404e-06, "Full-pretrain/Loss": 1.924771785736084, "Full-pretrain/Loss (Raw)": 2.141632080078125, "Full-pretrain/Step": 7060, "Full-pretrain/Step Time": 17.638314267620444} +{"Full-pretrain/Learning Rate": 8.324384165457289e-06, "Full-pretrain/Loss": 1.9260464906692505, "Full-pretrain/Loss (Raw)": 1.9938325881958008, "Full-pretrain/Step": 7061, "Full-pretrain/Step Time": 17.640360563993454} +{"Full-pretrain/Learning Rate": 8.318059185276955e-06, "Full-pretrain/Loss": 1.9237711429595947, "Full-pretrain/Loss (Raw)": 2.1047441959381104, "Full-pretrain/Step": 7062, "Full-pretrain/Step Time": 17.63931255787611} +{"Full-pretrain/Learning Rate": 8.31173612935263e-06, "Full-pretrain/Loss": 1.9129137992858887, "Full-pretrain/Loss (Raw)": 1.6532533168792725, "Full-pretrain/Step": 7063, "Full-pretrain/Step Time": 17.64481206610799} +{"Full-pretrain/Learning Rate": 8.305414998413685e-06, "Full-pretrain/Loss": 1.9118211269378662, "Full-pretrain/Loss (Raw)": 1.8000357151031494, "Full-pretrain/Step": 7064, "Full-pretrain/Step Time": 17.635171744972467} +{"Full-pretrain/Learning Rate": 8.29909579318925e-06, "Full-pretrain/Loss": 1.9041199684143066, "Full-pretrain/Loss (Raw)": 1.7014477252960205, "Full-pretrain/Step": 7065, "Full-pretrain/Step Time": 17.639591014012694} +{"Full-pretrain/Learning Rate": 8.29277851440825e-06, "Full-pretrain/Loss": 1.9164433479309082, "Full-pretrain/Loss (Raw)": 1.88841712474823, "Full-pretrain/Step": 7066, "Full-pretrain/Step Time": 17.64106130413711} +{"Full-pretrain/Learning Rate": 8.286463162799368e-06, "Full-pretrain/Loss": 1.9369107484817505, "Full-pretrain/Loss (Raw)": 2.0332493782043457, "Full-pretrain/Step": 7067, "Full-pretrain/Step Time": 17.643429284915328} +{"Full-pretrain/Learning Rate": 8.28014973909109e-06, "Full-pretrain/Loss": 1.9348278045654297, "Full-pretrain/Loss (Raw)": 1.8037388324737549, "Full-pretrain/Step": 7068, "Full-pretrain/Step Time": 17.640377312898636} +{"Full-pretrain/Learning Rate": 8.273838244011662e-06, "Full-pretrain/Loss": 1.923614263534546, "Full-pretrain/Loss (Raw)": 1.925173282623291, "Full-pretrain/Step": 7069, "Full-pretrain/Step Time": 17.630987579002976} +{"Full-pretrain/Learning Rate": 8.267528678289114e-06, "Full-pretrain/Loss": 1.9269599914550781, "Full-pretrain/Loss (Raw)": 2.082453489303589, "Full-pretrain/Step": 7070, "Full-pretrain/Step Time": 17.63596047088504} +{"Full-pretrain/Learning Rate": 8.261221042651262e-06, "Full-pretrain/Loss": 1.9372023344039917, "Full-pretrain/Loss (Raw)": 2.073486804962158, "Full-pretrain/Step": 7071, "Full-pretrain/Step Time": 17.633287210017443} +{"Full-pretrain/Learning Rate": 8.254915337825673e-06, "Full-pretrain/Loss": 1.9400964975357056, "Full-pretrain/Loss (Raw)": 1.860894799232483, "Full-pretrain/Step": 7072, "Full-pretrain/Step Time": 17.63684793934226} +{"Full-pretrain/Learning Rate": 8.248611564539713e-06, "Full-pretrain/Loss": 1.944838047027588, "Full-pretrain/Loss (Raw)": 2.120120048522949, "Full-pretrain/Step": 7073, "Full-pretrain/Step Time": 17.628939393907785} +{"Full-pretrain/Learning Rate": 8.242309723520523e-06, "Full-pretrain/Loss": 1.949070692062378, "Full-pretrain/Loss (Raw)": 2.191290855407715, "Full-pretrain/Step": 7074, "Full-pretrain/Step Time": 17.632277745753527} +{"Full-pretrain/Learning Rate": 8.236009815495019e-06, "Full-pretrain/Loss": 1.942527413368225, "Full-pretrain/Loss (Raw)": 1.7904713153839111, "Full-pretrain/Step": 7075, "Full-pretrain/Step Time": 17.63679595477879} +{"Full-pretrain/Learning Rate": 8.229711841189889e-06, "Full-pretrain/Loss": 1.939059853553772, "Full-pretrain/Loss (Raw)": 2.010812997817993, "Full-pretrain/Step": 7076, "Full-pretrain/Step Time": 17.63792890496552} +{"Full-pretrain/Learning Rate": 8.223415801331612e-06, "Full-pretrain/Loss": 1.930894136428833, "Full-pretrain/Loss (Raw)": 1.800674319267273, "Full-pretrain/Step": 7077, "Full-pretrain/Step Time": 17.62681965343654} +{"Full-pretrain/Learning Rate": 8.21712169664642e-06, "Full-pretrain/Loss": 1.9242846965789795, "Full-pretrain/Loss (Raw)": 1.7963857650756836, "Full-pretrain/Step": 7078, "Full-pretrain/Step Time": 17.634538505226374} +{"Full-pretrain/Learning Rate": 8.210829527860345e-06, "Full-pretrain/Loss": 1.9178814888000488, "Full-pretrain/Loss (Raw)": 1.7424113750457764, "Full-pretrain/Step": 7079, "Full-pretrain/Step Time": 17.635956624522805} +{"Full-pretrain/Learning Rate": 8.204539295699182e-06, "Full-pretrain/Loss": 1.9133728742599487, "Full-pretrain/Loss (Raw)": 1.8004767894744873, "Full-pretrain/Step": 7080, "Full-pretrain/Step Time": 17.629027033224702} +{"Full-pretrain/Learning Rate": 8.198251000888516e-06, "Full-pretrain/Loss": 1.9328837394714355, "Full-pretrain/Loss (Raw)": 2.1909685134887695, "Full-pretrain/Step": 7081, "Full-pretrain/Step Time": 17.627329047769308} +{"Full-pretrain/Learning Rate": 8.191964644153685e-06, "Full-pretrain/Loss": 1.9333794116973877, "Full-pretrain/Loss (Raw)": 1.8703343868255615, "Full-pretrain/Step": 7082, "Full-pretrain/Step Time": 17.628479534760118} +{"Full-pretrain/Learning Rate": 8.185680226219832e-06, "Full-pretrain/Loss": 1.9446632862091064, "Full-pretrain/Loss (Raw)": 1.9516831636428833, "Full-pretrain/Step": 7083, "Full-pretrain/Step Time": 17.63023037649691} +{"Full-pretrain/Learning Rate": 8.179397747811852e-06, "Full-pretrain/Loss": 1.9408924579620361, "Full-pretrain/Loss (Raw)": 1.9686365127563477, "Full-pretrain/Step": 7084, "Full-pretrain/Step Time": 17.62973220832646} +{"Full-pretrain/Learning Rate": 8.173117209654427e-06, "Full-pretrain/Loss": 1.9291187524795532, "Full-pretrain/Loss (Raw)": 1.7645692825317383, "Full-pretrain/Step": 7085, "Full-pretrain/Step Time": 17.631377052515745} +{"Full-pretrain/Learning Rate": 8.16683861247202e-06, "Full-pretrain/Loss": 1.93052077293396, "Full-pretrain/Loss (Raw)": 1.9185106754302979, "Full-pretrain/Step": 7086, "Full-pretrain/Step Time": 17.629804454743862} +{"Full-pretrain/Learning Rate": 8.160561956988869e-06, "Full-pretrain/Loss": 1.9195833206176758, "Full-pretrain/Loss (Raw)": 1.7176859378814697, "Full-pretrain/Step": 7087, "Full-pretrain/Step Time": 17.631995603442192} +{"Full-pretrain/Learning Rate": 8.154287243928974e-06, "Full-pretrain/Loss": 1.928743839263916, "Full-pretrain/Loss (Raw)": 2.0510759353637695, "Full-pretrain/Step": 7088, "Full-pretrain/Step Time": 17.628448305651546} +{"Full-pretrain/Learning Rate": 8.148014474016121e-06, "Full-pretrain/Loss": 1.9131922721862793, "Full-pretrain/Loss (Raw)": 1.6337387561798096, "Full-pretrain/Step": 7089, "Full-pretrain/Step Time": 17.628630105406046} +{"Full-pretrain/Learning Rate": 8.141743647973882e-06, "Full-pretrain/Loss": 1.9220633506774902, "Full-pretrain/Loss (Raw)": 2.058258056640625, "Full-pretrain/Step": 7090, "Full-pretrain/Step Time": 17.630682626739144} +{"Full-pretrain/Learning Rate": 8.135474766525585e-06, "Full-pretrain/Loss": 1.9205313920974731, "Full-pretrain/Loss (Raw)": 2.016541004180908, "Full-pretrain/Step": 7091, "Full-pretrain/Step Time": 17.62909362092614} +{"Full-pretrain/Learning Rate": 8.129207830394356e-06, "Full-pretrain/Loss": 1.9111852645874023, "Full-pretrain/Loss (Raw)": 1.8425577878952026, "Full-pretrain/Step": 7092, "Full-pretrain/Step Time": 17.631011944264174} +{"Full-pretrain/Learning Rate": 8.122942840303067e-06, "Full-pretrain/Loss": 1.9125010967254639, "Full-pretrain/Loss (Raw)": 2.0359387397766113, "Full-pretrain/Step": 7093, "Full-pretrain/Step Time": 17.630719473585486} +{"Full-pretrain/Learning Rate": 8.116679796974388e-06, "Full-pretrain/Loss": 1.902881383895874, "Full-pretrain/Loss (Raw)": 1.7969136238098145, "Full-pretrain/Step": 7094, "Full-pretrain/Step Time": 17.63777199946344} +{"Full-pretrain/Learning Rate": 8.110418701130765e-06, "Full-pretrain/Loss": 1.9065148830413818, "Full-pretrain/Loss (Raw)": 1.7695260047912598, "Full-pretrain/Step": 7095, "Full-pretrain/Step Time": 17.626043397933245} +{"Full-pretrain/Learning Rate": 8.104159553494408e-06, "Full-pretrain/Loss": 1.9103400707244873, "Full-pretrain/Loss (Raw)": 1.922440528869629, "Full-pretrain/Step": 7096, "Full-pretrain/Step Time": 17.628400575369596} +{"Full-pretrain/Learning Rate": 8.097902354787319e-06, "Full-pretrain/Loss": 1.9041576385498047, "Full-pretrain/Loss (Raw)": 1.5036098957061768, "Full-pretrain/Step": 7097, "Full-pretrain/Step Time": 17.635033855214715} +{"Full-pretrain/Learning Rate": 8.091647105731239e-06, "Full-pretrain/Loss": 1.9126843214035034, "Full-pretrain/Loss (Raw)": 2.1612706184387207, "Full-pretrain/Step": 7098, "Full-pretrain/Step Time": 17.63457020558417} +{"Full-pretrain/Learning Rate": 8.085393807047737e-06, "Full-pretrain/Loss": 1.9136922359466553, "Full-pretrain/Loss (Raw)": 2.0655055046081543, "Full-pretrain/Step": 7099, "Full-pretrain/Step Time": 17.631805565208197} +{"Full-pretrain/Learning Rate": 8.079142459458106e-06, "Full-pretrain/Loss": 1.9093667268753052, "Full-pretrain/Loss (Raw)": 1.6653183698654175, "Full-pretrain/Step": 7100, "Full-pretrain/Step Time": 17.633405663073063} +{"Full-pretrain/Learning Rate": 8.072893063683445e-06, "Full-pretrain/Loss": 1.8986563682556152, "Full-pretrain/Loss (Raw)": 1.5824451446533203, "Full-pretrain/Step": 7101, "Full-pretrain/Step Time": 17.628741204738617} +{"Full-pretrain/Learning Rate": 8.066645620444622e-06, "Full-pretrain/Loss": 1.8823375701904297, "Full-pretrain/Loss (Raw)": 1.5602526664733887, "Full-pretrain/Step": 7102, "Full-pretrain/Step Time": 17.63524585776031} +{"Full-pretrain/Learning Rate": 8.060400130462285e-06, "Full-pretrain/Loss": 1.8772356510162354, "Full-pretrain/Loss (Raw)": 1.910221815109253, "Full-pretrain/Step": 7103, "Full-pretrain/Step Time": 17.63332420401275} +{"Full-pretrain/Learning Rate": 8.054156594456828e-06, "Full-pretrain/Loss": 1.8730099201202393, "Full-pretrain/Loss (Raw)": 1.7256728410720825, "Full-pretrain/Step": 7104, "Full-pretrain/Step Time": 17.628848753869534} +{"Full-pretrain/Learning Rate": 8.047915013148454e-06, "Full-pretrain/Loss": 1.848397970199585, "Full-pretrain/Loss (Raw)": 1.3325339555740356, "Full-pretrain/Step": 7105, "Full-pretrain/Step Time": 17.62436014972627} +{"Full-pretrain/Learning Rate": 8.041675387257127e-06, "Full-pretrain/Loss": 1.8345211744308472, "Full-pretrain/Loss (Raw)": 1.7472376823425293, "Full-pretrain/Step": 7106, "Full-pretrain/Step Time": 17.62933355756104} +{"Full-pretrain/Learning Rate": 8.035437717502584e-06, "Full-pretrain/Loss": 1.8434503078460693, "Full-pretrain/Loss (Raw)": 2.0761992931365967, "Full-pretrain/Step": 7107, "Full-pretrain/Step Time": 17.62457925081253} +{"Full-pretrain/Learning Rate": 8.029202004604347e-06, "Full-pretrain/Loss": 1.8407604694366455, "Full-pretrain/Loss (Raw)": 1.9247426986694336, "Full-pretrain/Step": 7108, "Full-pretrain/Step Time": 17.62149545364082} +{"Full-pretrain/Learning Rate": 8.022968249281686e-06, "Full-pretrain/Loss": 1.8465540409088135, "Full-pretrain/Loss (Raw)": 1.9860674142837524, "Full-pretrain/Step": 7109, "Full-pretrain/Step Time": 17.616070717573166} +{"Full-pretrain/Learning Rate": 8.01673645225367e-06, "Full-pretrain/Loss": 1.860482096672058, "Full-pretrain/Loss (Raw)": 2.2420830726623535, "Full-pretrain/Step": 7110, "Full-pretrain/Step Time": 17.622056601569057} +{"Full-pretrain/Learning Rate": 8.010506614239139e-06, "Full-pretrain/Loss": 1.8585829734802246, "Full-pretrain/Loss (Raw)": 1.6816375255584717, "Full-pretrain/Step": 7111, "Full-pretrain/Step Time": 17.61923696100712} +{"Full-pretrain/Learning Rate": 8.004278735956696e-06, "Full-pretrain/Loss": 1.8656728267669678, "Full-pretrain/Loss (Raw)": 2.0273542404174805, "Full-pretrain/Step": 7112, "Full-pretrain/Step Time": 17.620266165584326} +{"Full-pretrain/Learning Rate": 7.99805281812474e-06, "Full-pretrain/Loss": 1.8566296100616455, "Full-pretrain/Loss (Raw)": 1.901583194732666, "Full-pretrain/Step": 7113, "Full-pretrain/Step Time": 17.615849159657955} +{"Full-pretrain/Learning Rate": 7.991828861461407e-06, "Full-pretrain/Loss": 1.8590894937515259, "Full-pretrain/Loss (Raw)": 1.949051856994629, "Full-pretrain/Step": 7114, "Full-pretrain/Step Time": 17.62176333554089} +{"Full-pretrain/Learning Rate": 7.985606866684637e-06, "Full-pretrain/Loss": 1.8516755104064941, "Full-pretrain/Loss (Raw)": 1.7144335508346558, "Full-pretrain/Step": 7115, "Full-pretrain/Step Time": 17.622850190848112} +{"Full-pretrain/Learning Rate": 7.979386834512145e-06, "Full-pretrain/Loss": 1.84638512134552, "Full-pretrain/Loss (Raw)": 1.7993495464324951, "Full-pretrain/Step": 7116, "Full-pretrain/Step Time": 17.61965474486351} +{"Full-pretrain/Learning Rate": 7.97316876566139e-06, "Full-pretrain/Loss": 1.8493214845657349, "Full-pretrain/Loss (Raw)": 1.8585317134857178, "Full-pretrain/Step": 7117, "Full-pretrain/Step Time": 17.61563198827207} +{"Full-pretrain/Learning Rate": 7.966952660849636e-06, "Full-pretrain/Loss": 1.850886583328247, "Full-pretrain/Loss (Raw)": 1.9685897827148438, "Full-pretrain/Step": 7118, "Full-pretrain/Step Time": 17.619240380823612} +{"Full-pretrain/Learning Rate": 7.960738520793914e-06, "Full-pretrain/Loss": 1.8557922840118408, "Full-pretrain/Loss (Raw)": 1.8746718168258667, "Full-pretrain/Step": 7119, "Full-pretrain/Step Time": 17.616610208526254} +{"Full-pretrain/Learning Rate": 7.954526346211008e-06, "Full-pretrain/Loss": 1.8562126159667969, "Full-pretrain/Loss (Raw)": 2.0645246505737305, "Full-pretrain/Step": 7120, "Full-pretrain/Step Time": 17.60913658887148} +{"Full-pretrain/Learning Rate": 7.948316137817497e-06, "Full-pretrain/Loss": 1.8649359941482544, "Full-pretrain/Loss (Raw)": 1.9128886461257935, "Full-pretrain/Step": 7121, "Full-pretrain/Step Time": 17.611698117107153} +{"Full-pretrain/Learning Rate": 7.942107896329728e-06, "Full-pretrain/Loss": 1.853783130645752, "Full-pretrain/Loss (Raw)": 1.7013678550720215, "Full-pretrain/Step": 7122, "Full-pretrain/Step Time": 17.615526227280498} +{"Full-pretrain/Learning Rate": 7.935901622463817e-06, "Full-pretrain/Loss": 1.8453233242034912, "Full-pretrain/Loss (Raw)": 1.7458254098892212, "Full-pretrain/Step": 7123, "Full-pretrain/Step Time": 17.616274448111653} +{"Full-pretrain/Learning Rate": 7.929697316935666e-06, "Full-pretrain/Loss": 1.854677677154541, "Full-pretrain/Loss (Raw)": 2.141895294189453, "Full-pretrain/Step": 7124, "Full-pretrain/Step Time": 17.60972841270268} +{"Full-pretrain/Learning Rate": 7.923494980460924e-06, "Full-pretrain/Loss": 1.849183440208435, "Full-pretrain/Loss (Raw)": 1.860124945640564, "Full-pretrain/Step": 7125, "Full-pretrain/Step Time": 17.607636472210288} +{"Full-pretrain/Learning Rate": 7.917294613755034e-06, "Full-pretrain/Loss": 1.861818790435791, "Full-pretrain/Loss (Raw)": 2.2012455463409424, "Full-pretrain/Step": 7126, "Full-pretrain/Step Time": 17.60179833509028} +{"Full-pretrain/Learning Rate": 7.911096217533206e-06, "Full-pretrain/Loss": 1.8630871772766113, "Full-pretrain/Loss (Raw)": 1.8101155757904053, "Full-pretrain/Step": 7127, "Full-pretrain/Step Time": 17.610710287466645} +{"Full-pretrain/Learning Rate": 7.904899792510426e-06, "Full-pretrain/Loss": 1.8612539768218994, "Full-pretrain/Loss (Raw)": 1.8637775182724, "Full-pretrain/Step": 7128, "Full-pretrain/Step Time": 17.6048313844949} +{"Full-pretrain/Learning Rate": 7.898705339401455e-06, "Full-pretrain/Loss": 1.879786491394043, "Full-pretrain/Loss (Raw)": 2.096648693084717, "Full-pretrain/Step": 7129, "Full-pretrain/Step Time": 17.602377206087112} +{"Full-pretrain/Learning Rate": 7.892512858920803e-06, "Full-pretrain/Loss": 1.869281530380249, "Full-pretrain/Loss (Raw)": 1.825112223625183, "Full-pretrain/Step": 7130, "Full-pretrain/Step Time": 17.600230652838945} +{"Full-pretrain/Learning Rate": 7.886322351782783e-06, "Full-pretrain/Loss": 1.8701457977294922, "Full-pretrain/Loss (Raw)": 2.093160629272461, "Full-pretrain/Step": 7131, "Full-pretrain/Step Time": 17.613133419305086} +{"Full-pretrain/Learning Rate": 7.880133818701472e-06, "Full-pretrain/Loss": 1.8766640424728394, "Full-pretrain/Loss (Raw)": 1.8739039897918701, "Full-pretrain/Step": 7132, "Full-pretrain/Step Time": 17.609069723635912} +{"Full-pretrain/Learning Rate": 7.873947260390702e-06, "Full-pretrain/Loss": 1.889721155166626, "Full-pretrain/Loss (Raw)": 2.000272274017334, "Full-pretrain/Step": 7133, "Full-pretrain/Step Time": 17.608877455815673} +{"Full-pretrain/Learning Rate": 7.867762677564095e-06, "Full-pretrain/Loss": 1.8976080417633057, "Full-pretrain/Loss (Raw)": 1.812631607055664, "Full-pretrain/Step": 7134, "Full-pretrain/Step Time": 17.612771874293685} +{"Full-pretrain/Learning Rate": 7.861580070935052e-06, "Full-pretrain/Loss": 1.8948290348052979, "Full-pretrain/Loss (Raw)": 1.8212953805923462, "Full-pretrain/Step": 7135, "Full-pretrain/Step Time": 17.61906947940588} +{"Full-pretrain/Learning Rate": 7.855399441216716e-06, "Full-pretrain/Loss": 1.899083137512207, "Full-pretrain/Loss (Raw)": 1.861802101135254, "Full-pretrain/Step": 7136, "Full-pretrain/Step Time": 17.60967362113297} +{"Full-pretrain/Learning Rate": 7.84922078912203e-06, "Full-pretrain/Loss": 1.9229167699813843, "Full-pretrain/Loss (Raw)": 2.0952095985412598, "Full-pretrain/Step": 7137, "Full-pretrain/Step Time": 17.613667212426662} +{"Full-pretrain/Learning Rate": 7.843044115363698e-06, "Full-pretrain/Loss": 1.937049388885498, "Full-pretrain/Loss (Raw)": 2.199484348297119, "Full-pretrain/Step": 7138, "Full-pretrain/Step Time": 17.616137949749827} +{"Full-pretrain/Learning Rate": 7.8368694206542e-06, "Full-pretrain/Loss": 1.9314614534378052, "Full-pretrain/Loss (Raw)": 1.8973816633224487, "Full-pretrain/Step": 7139, "Full-pretrain/Step Time": 17.621304469183087} +{"Full-pretrain/Learning Rate": 7.83069670570579e-06, "Full-pretrain/Loss": 1.9323166608810425, "Full-pretrain/Loss (Raw)": 1.9521121978759766, "Full-pretrain/Step": 7140, "Full-pretrain/Step Time": 17.61145720258355} +{"Full-pretrain/Learning Rate": 7.824525971230472e-06, "Full-pretrain/Loss": 1.9280858039855957, "Full-pretrain/Loss (Raw)": 1.8506780862808228, "Full-pretrain/Step": 7141, "Full-pretrain/Step Time": 17.609385622665286} +{"Full-pretrain/Learning Rate": 7.818357217940048e-06, "Full-pretrain/Loss": 1.9226794242858887, "Full-pretrain/Loss (Raw)": 2.069077968597412, "Full-pretrain/Step": 7142, "Full-pretrain/Step Time": 17.60573779977858} +{"Full-pretrain/Learning Rate": 7.81219044654608e-06, "Full-pretrain/Loss": 1.9257409572601318, "Full-pretrain/Loss (Raw)": 1.7796058654785156, "Full-pretrain/Step": 7143, "Full-pretrain/Step Time": 17.611956449225545} +{"Full-pretrain/Learning Rate": 7.806025657759904e-06, "Full-pretrain/Loss": 1.9140632152557373, "Full-pretrain/Loss (Raw)": 1.6536705493927002, "Full-pretrain/Step": 7144, "Full-pretrain/Step Time": 17.612231636419892} +{"Full-pretrain/Learning Rate": 7.799862852292636e-06, "Full-pretrain/Loss": 1.9204171895980835, "Full-pretrain/Loss (Raw)": 2.1049084663391113, "Full-pretrain/Step": 7145, "Full-pretrain/Step Time": 17.61091616563499} +{"Full-pretrain/Learning Rate": 7.793702030855135e-06, "Full-pretrain/Loss": 1.9275670051574707, "Full-pretrain/Loss (Raw)": 2.1778478622436523, "Full-pretrain/Step": 7146, "Full-pretrain/Step Time": 17.612270824611187} +{"Full-pretrain/Learning Rate": 7.787543194158057e-06, "Full-pretrain/Loss": 1.9379091262817383, "Full-pretrain/Loss (Raw)": 2.045379638671875, "Full-pretrain/Step": 7147, "Full-pretrain/Step Time": 17.61244378425181} +{"Full-pretrain/Learning Rate": 7.78138634291183e-06, "Full-pretrain/Loss": 1.935179352760315, "Full-pretrain/Loss (Raw)": 1.7119948863983154, "Full-pretrain/Step": 7148, "Full-pretrain/Step Time": 17.609523756429553} +{"Full-pretrain/Learning Rate": 7.77523147782663e-06, "Full-pretrain/Loss": 1.9348163604736328, "Full-pretrain/Loss (Raw)": 1.8469157218933105, "Full-pretrain/Step": 7149, "Full-pretrain/Step Time": 17.608501913025975} +{"Full-pretrain/Learning Rate": 7.769078599612434e-06, "Full-pretrain/Loss": 1.9286998510360718, "Full-pretrain/Loss (Raw)": 1.7728633880615234, "Full-pretrain/Step": 7150, "Full-pretrain/Step Time": 17.608429802581668} +{"Full-pretrain/Learning Rate": 7.762927708978959e-06, "Full-pretrain/Loss": 1.9305791854858398, "Full-pretrain/Loss (Raw)": 1.934812068939209, "Full-pretrain/Step": 7151, "Full-pretrain/Step Time": 17.61429937928915} +{"Full-pretrain/Learning Rate": 7.756778806635715e-06, "Full-pretrain/Loss": 1.92813241481781, "Full-pretrain/Loss (Raw)": 1.98622465133667, "Full-pretrain/Step": 7152, "Full-pretrain/Step Time": 17.61857009679079} +{"Full-pretrain/Learning Rate": 7.750631893291974e-06, "Full-pretrain/Loss": 1.9316601753234863, "Full-pretrain/Loss (Raw)": 2.0257797241210938, "Full-pretrain/Step": 7153, "Full-pretrain/Step Time": 17.617877962067723} +{"Full-pretrain/Learning Rate": 7.744486969656784e-06, "Full-pretrain/Loss": 1.9440279006958008, "Full-pretrain/Loss (Raw)": 2.0971341133117676, "Full-pretrain/Step": 7154, "Full-pretrain/Step Time": 17.61216022260487} +{"Full-pretrain/Learning Rate": 7.738344036438958e-06, "Full-pretrain/Loss": 1.9528292417526245, "Full-pretrain/Loss (Raw)": 2.0274691581726074, "Full-pretrain/Step": 7155, "Full-pretrain/Step Time": 17.613558273762465} +{"Full-pretrain/Learning Rate": 7.732203094347087e-06, "Full-pretrain/Loss": 1.9542038440704346, "Full-pretrain/Loss (Raw)": 2.185882329940796, "Full-pretrain/Step": 7156, "Full-pretrain/Step Time": 17.612491944804788} +{"Full-pretrain/Learning Rate": 7.726064144089515e-06, "Full-pretrain/Loss": 1.9502954483032227, "Full-pretrain/Loss (Raw)": 1.735058069229126, "Full-pretrain/Step": 7157, "Full-pretrain/Step Time": 17.61134297773242} +{"Full-pretrain/Learning Rate": 7.719927186374373e-06, "Full-pretrain/Loss": 1.9431126117706299, "Full-pretrain/Loss (Raw)": 1.9713903665542603, "Full-pretrain/Step": 7158, "Full-pretrain/Step Time": 17.615453952923417} +{"Full-pretrain/Learning Rate": 7.713792221909558e-06, "Full-pretrain/Loss": 1.9403648376464844, "Full-pretrain/Loss (Raw)": 1.7221895456314087, "Full-pretrain/Step": 7159, "Full-pretrain/Step Time": 17.61977543309331} +{"Full-pretrain/Learning Rate": 7.707659251402735e-06, "Full-pretrain/Loss": 1.948026418685913, "Full-pretrain/Loss (Raw)": 2.1089491844177246, "Full-pretrain/Step": 7160, "Full-pretrain/Step Time": 17.615527717396617} +{"Full-pretrain/Learning Rate": 7.701528275561348e-06, "Full-pretrain/Loss": 1.9495861530303955, "Full-pretrain/Loss (Raw)": 2.1465561389923096, "Full-pretrain/Step": 7161, "Full-pretrain/Step Time": 17.615796832367778} +{"Full-pretrain/Learning Rate": 7.695399295092587e-06, "Full-pretrain/Loss": 1.955020546913147, "Full-pretrain/Loss (Raw)": 1.9990154504776, "Full-pretrain/Step": 7162, "Full-pretrain/Step Time": 17.61264012940228} +{"Full-pretrain/Learning Rate": 7.689272310703438e-06, "Full-pretrain/Loss": 1.9567726850509644, "Full-pretrain/Loss (Raw)": 2.149230480194092, "Full-pretrain/Step": 7163, "Full-pretrain/Step Time": 17.61373833194375} +{"Full-pretrain/Learning Rate": 7.683147323100643e-06, "Full-pretrain/Loss": 1.9587533473968506, "Full-pretrain/Loss (Raw)": 1.9372848272323608, "Full-pretrain/Step": 7164, "Full-pretrain/Step Time": 17.61585278250277} +{"Full-pretrain/Learning Rate": 7.677024332990725e-06, "Full-pretrain/Loss": 1.9579076766967773, "Full-pretrain/Loss (Raw)": 1.9732121229171753, "Full-pretrain/Step": 7165, "Full-pretrain/Step Time": 17.617918303236365} +{"Full-pretrain/Learning Rate": 7.670903341079957e-06, "Full-pretrain/Loss": 1.959778070449829, "Full-pretrain/Loss (Raw)": 1.872481346130371, "Full-pretrain/Step": 7166, "Full-pretrain/Step Time": 17.61964632384479} +{"Full-pretrain/Learning Rate": 7.664784348074404e-06, "Full-pretrain/Loss": 1.9631125926971436, "Full-pretrain/Loss (Raw)": 1.9280034303665161, "Full-pretrain/Step": 7167, "Full-pretrain/Step Time": 17.62164012528956} +{"Full-pretrain/Learning Rate": 7.65866735467988e-06, "Full-pretrain/Loss": 1.957335114479065, "Full-pretrain/Loss (Raw)": 1.6769202947616577, "Full-pretrain/Step": 7168, "Full-pretrain/Step Time": 17.627943754196167} +{"Full-pretrain/Learning Rate": 7.652552361601981e-06, "Full-pretrain/Loss": 1.9449958801269531, "Full-pretrain/Loss (Raw)": 1.7003531455993652, "Full-pretrain/Step": 7169, "Full-pretrain/Step Time": 17.62907279841602} +{"Full-pretrain/Learning Rate": 7.64643936954607e-06, "Full-pretrain/Loss": 1.943101406097412, "Full-pretrain/Loss (Raw)": 2.138861656188965, "Full-pretrain/Step": 7170, "Full-pretrain/Step Time": 17.62774294242263} +{"Full-pretrain/Learning Rate": 7.640328379217291e-06, "Full-pretrain/Loss": 1.9495368003845215, "Full-pretrain/Loss (Raw)": 2.1033143997192383, "Full-pretrain/Step": 7171, "Full-pretrain/Step Time": 17.624113956466317} +{"Full-pretrain/Learning Rate": 7.634219391320522e-06, "Full-pretrain/Loss": 1.940456748008728, "Full-pretrain/Loss (Raw)": 1.6615512371063232, "Full-pretrain/Step": 7172, "Full-pretrain/Step Time": 17.631369549781084} +{"Full-pretrain/Learning Rate": 7.628112406560442e-06, "Full-pretrain/Loss": 1.9422944784164429, "Full-pretrain/Loss (Raw)": 1.9094849824905396, "Full-pretrain/Step": 7173, "Full-pretrain/Step Time": 17.62765546515584} +{"Full-pretrain/Learning Rate": 7.622007425641492e-06, "Full-pretrain/Loss": 1.943160057067871, "Full-pretrain/Loss (Raw)": 2.096775531768799, "Full-pretrain/Step": 7174, "Full-pretrain/Step Time": 17.63011022657156} +{"Full-pretrain/Learning Rate": 7.615904449267877e-06, "Full-pretrain/Loss": 1.9531664848327637, "Full-pretrain/Loss (Raw)": 2.0998127460479736, "Full-pretrain/Step": 7175, "Full-pretrain/Step Time": 17.62648948840797} +{"Full-pretrain/Learning Rate": 7.609803478143576e-06, "Full-pretrain/Loss": 1.9507551193237305, "Full-pretrain/Loss (Raw)": 1.5765089988708496, "Full-pretrain/Step": 7176, "Full-pretrain/Step Time": 17.631169160827994} +{"Full-pretrain/Learning Rate": 7.603704512972343e-06, "Full-pretrain/Loss": 1.9463506937026978, "Full-pretrain/Loss (Raw)": 1.963964819908142, "Full-pretrain/Step": 7177, "Full-pretrain/Step Time": 17.636460250243545} +{"Full-pretrain/Learning Rate": 7.59760755445767e-06, "Full-pretrain/Loss": 1.943640112876892, "Full-pretrain/Loss (Raw)": 2.0911076068878174, "Full-pretrain/Step": 7178, "Full-pretrain/Step Time": 17.633501334115863} +{"Full-pretrain/Learning Rate": 7.59151260330285e-06, "Full-pretrain/Loss": 1.9419869184494019, "Full-pretrain/Loss (Raw)": 1.9924798011779785, "Full-pretrain/Step": 7179, "Full-pretrain/Step Time": 17.628737948834896} +{"Full-pretrain/Learning Rate": 7.585419660210935e-06, "Full-pretrain/Loss": 1.9434125423431396, "Full-pretrain/Loss (Raw)": 1.7576130628585815, "Full-pretrain/Step": 7180, "Full-pretrain/Step Time": 17.638397553935647} +{"Full-pretrain/Learning Rate": 7.579328725884749e-06, "Full-pretrain/Loss": 1.9496092796325684, "Full-pretrain/Loss (Raw)": 2.045210361480713, "Full-pretrain/Step": 7181, "Full-pretrain/Step Time": 17.638298615813255} +{"Full-pretrain/Learning Rate": 7.573239801026863e-06, "Full-pretrain/Loss": 1.956557035446167, "Full-pretrain/Loss (Raw)": 1.9951921701431274, "Full-pretrain/Step": 7182, "Full-pretrain/Step Time": 17.63801966421306} +{"Full-pretrain/Learning Rate": 7.5671528863396515e-06, "Full-pretrain/Loss": 1.951885461807251, "Full-pretrain/Loss (Raw)": 1.7853214740753174, "Full-pretrain/Step": 7183, "Full-pretrain/Step Time": 17.63527169264853} +{"Full-pretrain/Learning Rate": 7.561067982525222e-06, "Full-pretrain/Loss": 1.943570613861084, "Full-pretrain/Loss (Raw)": 1.7201498746871948, "Full-pretrain/Step": 7184, "Full-pretrain/Step Time": 17.638267097994685} +{"Full-pretrain/Learning Rate": 7.554985090285468e-06, "Full-pretrain/Loss": 1.9413074254989624, "Full-pretrain/Loss (Raw)": 1.9533597230911255, "Full-pretrain/Step": 7185, "Full-pretrain/Step Time": 17.634198212996125} +{"Full-pretrain/Learning Rate": 7.548904210322058e-06, "Full-pretrain/Loss": 1.9402220249176025, "Full-pretrain/Loss (Raw)": 2.062399387359619, "Full-pretrain/Step": 7186, "Full-pretrain/Step Time": 17.63656514696777} +{"Full-pretrain/Learning Rate": 7.542825343336418e-06, "Full-pretrain/Loss": 1.9292356967926025, "Full-pretrain/Loss (Raw)": 1.6759061813354492, "Full-pretrain/Step": 7187, "Full-pretrain/Step Time": 17.638403955847025} +{"Full-pretrain/Learning Rate": 7.536748490029736e-06, "Full-pretrain/Loss": 1.9178757667541504, "Full-pretrain/Loss (Raw)": 1.8223633766174316, "Full-pretrain/Step": 7188, "Full-pretrain/Step Time": 17.637753637507558} +{"Full-pretrain/Learning Rate": 7.530673651102976e-06, "Full-pretrain/Loss": 1.9254060983657837, "Full-pretrain/Loss (Raw)": 1.9760313034057617, "Full-pretrain/Step": 7189, "Full-pretrain/Step Time": 17.63468457572162} +{"Full-pretrain/Learning Rate": 7.5246008272568725e-06, "Full-pretrain/Loss": 1.9215338230133057, "Full-pretrain/Loss (Raw)": 1.8474781513214111, "Full-pretrain/Step": 7190, "Full-pretrain/Step Time": 17.631900023669004} +{"Full-pretrain/Learning Rate": 7.518530019191921e-06, "Full-pretrain/Loss": 1.9247571229934692, "Full-pretrain/Loss (Raw)": 1.8253339529037476, "Full-pretrain/Step": 7191, "Full-pretrain/Step Time": 17.63583890348673} +{"Full-pretrain/Learning Rate": 7.512461227608397e-06, "Full-pretrain/Loss": 1.9244399070739746, "Full-pretrain/Loss (Raw)": 2.0988011360168457, "Full-pretrain/Step": 7192, "Full-pretrain/Step Time": 17.637881070375443} +{"Full-pretrain/Learning Rate": 7.506394453206317e-06, "Full-pretrain/Loss": 1.9214906692504883, "Full-pretrain/Loss (Raw)": 2.052177906036377, "Full-pretrain/Step": 7193, "Full-pretrain/Step Time": 17.633225824683905} +{"Full-pretrain/Learning Rate": 7.500329696685488e-06, "Full-pretrain/Loss": 1.9206628799438477, "Full-pretrain/Loss (Raw)": 1.9725253582000732, "Full-pretrain/Step": 7194, "Full-pretrain/Step Time": 17.629157396033406} +{"Full-pretrain/Learning Rate": 7.49426695874548e-06, "Full-pretrain/Loss": 1.9102370738983154, "Full-pretrain/Loss (Raw)": 1.8156086206436157, "Full-pretrain/Step": 7195, "Full-pretrain/Step Time": 17.63119411841035} +{"Full-pretrain/Learning Rate": 7.488206240085627e-06, "Full-pretrain/Loss": 1.9139771461486816, "Full-pretrain/Loss (Raw)": 2.0569682121276855, "Full-pretrain/Step": 7196, "Full-pretrain/Step Time": 17.6298061683774} +{"Full-pretrain/Learning Rate": 7.482147541405035e-06, "Full-pretrain/Loss": 1.9101825952529907, "Full-pretrain/Loss (Raw)": 1.8517855405807495, "Full-pretrain/Step": 7197, "Full-pretrain/Step Time": 17.63424900174141} +{"Full-pretrain/Learning Rate": 7.4760908634025624e-06, "Full-pretrain/Loss": 1.90834641456604, "Full-pretrain/Loss (Raw)": 1.8137242794036865, "Full-pretrain/Step": 7198, "Full-pretrain/Step Time": 17.630230540409684} +{"Full-pretrain/Learning Rate": 7.4700362067768595e-06, "Full-pretrain/Loss": 1.9117965698242188, "Full-pretrain/Loss (Raw)": 2.0384061336517334, "Full-pretrain/Step": 7199, "Full-pretrain/Step Time": 17.634896045550704} +{"Full-pretrain/Learning Rate": 7.46398357222631e-06, "Full-pretrain/Loss": 1.9257688522338867, "Full-pretrain/Loss (Raw)": 2.1240334510803223, "Full-pretrain/Step": 7200, "Full-pretrain/Step Time": 17.632204880937934} +{"Full-pretrain/Learning Rate": 7.457932960449093e-06, "Full-pretrain/Loss": 1.937520146369934, "Full-pretrain/Loss (Raw)": 2.076395034790039, "Full-pretrain/Step": 7201, "Full-pretrain/Step Time": 17.641328521072865} +{"Full-pretrain/Learning Rate": 7.4518843721431446e-06, "Full-pretrain/Loss": 1.9260859489440918, "Full-pretrain/Loss (Raw)": 1.7729653120040894, "Full-pretrain/Step": 7202, "Full-pretrain/Step Time": 17.632543785497546} +{"Full-pretrain/Learning Rate": 7.445837808006173e-06, "Full-pretrain/Loss": 1.9174495935440063, "Full-pretrain/Loss (Raw)": 1.8269524574279785, "Full-pretrain/Step": 7203, "Full-pretrain/Step Time": 17.63557095453143} +{"Full-pretrain/Learning Rate": 7.439793268735635e-06, "Full-pretrain/Loss": 1.9240479469299316, "Full-pretrain/Loss (Raw)": 1.8726998567581177, "Full-pretrain/Step": 7204, "Full-pretrain/Step Time": 17.62805405445397} +{"Full-pretrain/Learning Rate": 7.433750755028773e-06, "Full-pretrain/Loss": 1.9225739240646362, "Full-pretrain/Loss (Raw)": 1.8623123168945312, "Full-pretrain/Step": 7205, "Full-pretrain/Step Time": 17.633081138134003} +{"Full-pretrain/Learning Rate": 7.4277102675825885e-06, "Full-pretrain/Loss": 1.9214355945587158, "Full-pretrain/Loss (Raw)": 2.0603485107421875, "Full-pretrain/Step": 7206, "Full-pretrain/Step Time": 17.630046792328358} +{"Full-pretrain/Learning Rate": 7.4216718070938465e-06, "Full-pretrain/Loss": 1.9131596088409424, "Full-pretrain/Loss (Raw)": 1.834982991218567, "Full-pretrain/Step": 7207, "Full-pretrain/Step Time": 17.633835462853312} +{"Full-pretrain/Learning Rate": 7.415635374259094e-06, "Full-pretrain/Loss": 1.9182474613189697, "Full-pretrain/Loss (Raw)": 1.7393207550048828, "Full-pretrain/Step": 7208, "Full-pretrain/Step Time": 17.636411549523473} +{"Full-pretrain/Learning Rate": 7.409600969774613e-06, "Full-pretrain/Loss": 1.9158620834350586, "Full-pretrain/Loss (Raw)": 1.8876328468322754, "Full-pretrain/Step": 7209, "Full-pretrain/Step Time": 17.633002180606127} +{"Full-pretrain/Learning Rate": 7.4035685943364795e-06, "Full-pretrain/Loss": 1.9134517908096313, "Full-pretrain/Loss (Raw)": 2.0139780044555664, "Full-pretrain/Step": 7210, "Full-pretrain/Step Time": 17.630864284932613} +{"Full-pretrain/Learning Rate": 7.397538248640526e-06, "Full-pretrain/Loss": 1.9144225120544434, "Full-pretrain/Loss (Raw)": 2.0235424041748047, "Full-pretrain/Step": 7211, "Full-pretrain/Step Time": 17.636976022273302} +{"Full-pretrain/Learning Rate": 7.391509933382345e-06, "Full-pretrain/Loss": 1.93158757686615, "Full-pretrain/Loss (Raw)": 2.3068923950195312, "Full-pretrain/Step": 7212, "Full-pretrain/Step Time": 17.63762121461332} +{"Full-pretrain/Learning Rate": 7.385483649257319e-06, "Full-pretrain/Loss": 1.926851511001587, "Full-pretrain/Loss (Raw)": 1.8936583995819092, "Full-pretrain/Step": 7213, "Full-pretrain/Step Time": 17.63286678493023} +{"Full-pretrain/Learning Rate": 7.3794593969605505e-06, "Full-pretrain/Loss": 1.9276065826416016, "Full-pretrain/Loss (Raw)": 2.019357919692993, "Full-pretrain/Step": 7214, "Full-pretrain/Step Time": 17.634641936048865} +{"Full-pretrain/Learning Rate": 7.373437177186951e-06, "Full-pretrain/Loss": 1.927072525024414, "Full-pretrain/Loss (Raw)": 1.76822829246521, "Full-pretrain/Step": 7215, "Full-pretrain/Step Time": 17.636156849563122} +{"Full-pretrain/Learning Rate": 7.367416990631188e-06, "Full-pretrain/Loss": 1.9517821073532104, "Full-pretrain/Loss (Raw)": 2.5108585357666016, "Full-pretrain/Step": 7216, "Full-pretrain/Step Time": 17.636671571061015} +{"Full-pretrain/Learning Rate": 7.361398837987668e-06, "Full-pretrain/Loss": 1.9576756954193115, "Full-pretrain/Loss (Raw)": 2.1419544219970703, "Full-pretrain/Step": 7217, "Full-pretrain/Step Time": 17.63303443044424} +{"Full-pretrain/Learning Rate": 7.355382719950593e-06, "Full-pretrain/Loss": 1.9607537984848022, "Full-pretrain/Loss (Raw)": 2.1609017848968506, "Full-pretrain/Step": 7218, "Full-pretrain/Step Time": 17.636752681806684} +{"Full-pretrain/Learning Rate": 7.34936863721393e-06, "Full-pretrain/Loss": 1.976650595664978, "Full-pretrain/Loss (Raw)": 2.1846024990081787, "Full-pretrain/Step": 7219, "Full-pretrain/Step Time": 17.638524185866117} +{"Full-pretrain/Learning Rate": 7.343356590471384e-06, "Full-pretrain/Loss": 1.977570652961731, "Full-pretrain/Loss (Raw)": 1.8518059253692627, "Full-pretrain/Step": 7220, "Full-pretrain/Step Time": 17.634884543716908} +{"Full-pretrain/Learning Rate": 7.337346580416449e-06, "Full-pretrain/Loss": 1.9769463539123535, "Full-pretrain/Loss (Raw)": 1.956050157546997, "Full-pretrain/Step": 7221, "Full-pretrain/Step Time": 17.63121491484344} +{"Full-pretrain/Learning Rate": 7.33133860774238e-06, "Full-pretrain/Loss": 1.9857971668243408, "Full-pretrain/Loss (Raw)": 2.130709648132324, "Full-pretrain/Step": 7222, "Full-pretrain/Step Time": 17.63195742852986} +{"Full-pretrain/Learning Rate": 7.325332673142193e-06, "Full-pretrain/Loss": 1.9868946075439453, "Full-pretrain/Loss (Raw)": 1.8604496717453003, "Full-pretrain/Step": 7223, "Full-pretrain/Step Time": 17.64131004549563} +{"Full-pretrain/Learning Rate": 7.319328777308679e-06, "Full-pretrain/Loss": 1.9842569828033447, "Full-pretrain/Loss (Raw)": 2.014397144317627, "Full-pretrain/Step": 7224, "Full-pretrain/Step Time": 17.638934649527073} +{"Full-pretrain/Learning Rate": 7.313326920934368e-06, "Full-pretrain/Loss": 1.9868953227996826, "Full-pretrain/Loss (Raw)": 2.136601448059082, "Full-pretrain/Step": 7225, "Full-pretrain/Step Time": 17.627939281985164} +{"Full-pretrain/Learning Rate": 7.3073271047115834e-06, "Full-pretrain/Loss": 1.98819899559021, "Full-pretrain/Loss (Raw)": 2.01424503326416, "Full-pretrain/Step": 7226, "Full-pretrain/Step Time": 17.626331759616733} +{"Full-pretrain/Learning Rate": 7.3013293293323985e-06, "Full-pretrain/Loss": 1.989261507987976, "Full-pretrain/Loss (Raw)": 1.8496098518371582, "Full-pretrain/Step": 7227, "Full-pretrain/Step Time": 17.62910104729235} +{"Full-pretrain/Learning Rate": 7.295333595488657e-06, "Full-pretrain/Loss": 1.9821361303329468, "Full-pretrain/Loss (Raw)": 1.828955888748169, "Full-pretrain/Step": 7228, "Full-pretrain/Step Time": 17.627596342936158} +{"Full-pretrain/Learning Rate": 7.28933990387197e-06, "Full-pretrain/Loss": 1.967766523361206, "Full-pretrain/Loss (Raw)": 1.3919543027877808, "Full-pretrain/Step": 7229, "Full-pretrain/Step Time": 17.629685629159212} +{"Full-pretrain/Learning Rate": 7.283348255173691e-06, "Full-pretrain/Loss": 1.9789340496063232, "Full-pretrain/Loss (Raw)": 2.171085834503174, "Full-pretrain/Step": 7230, "Full-pretrain/Step Time": 17.624757256358862} +{"Full-pretrain/Learning Rate": 7.277358650084967e-06, "Full-pretrain/Loss": 1.9820821285247803, "Full-pretrain/Loss (Raw)": 2.1391441822052, "Full-pretrain/Step": 7231, "Full-pretrain/Step Time": 17.627010736614466} +{"Full-pretrain/Learning Rate": 7.271371089296702e-06, "Full-pretrain/Loss": 1.972076416015625, "Full-pretrain/Loss (Raw)": 1.8038501739501953, "Full-pretrain/Step": 7232, "Full-pretrain/Step Time": 17.631423372775316} +{"Full-pretrain/Learning Rate": 7.2653855734995445e-06, "Full-pretrain/Loss": 1.9687449932098389, "Full-pretrain/Loss (Raw)": 1.969792366027832, "Full-pretrain/Step": 7233, "Full-pretrain/Step Time": 17.631409849971533} +{"Full-pretrain/Learning Rate": 7.25940210338393e-06, "Full-pretrain/Loss": 1.9746829271316528, "Full-pretrain/Loss (Raw)": 1.9629786014556885, "Full-pretrain/Step": 7234, "Full-pretrain/Step Time": 17.62542884796858} +{"Full-pretrain/Learning Rate": 7.253420679640055e-06, "Full-pretrain/Loss": 1.9782958030700684, "Full-pretrain/Loss (Raw)": 1.9425604343414307, "Full-pretrain/Step": 7235, "Full-pretrain/Step Time": 17.62708451412618} +{"Full-pretrain/Learning Rate": 7.247441302957858e-06, "Full-pretrain/Loss": 1.9867422580718994, "Full-pretrain/Loss (Raw)": 2.1429920196533203, "Full-pretrain/Step": 7236, "Full-pretrain/Step Time": 17.629933174699545} +{"Full-pretrain/Learning Rate": 7.241463974027071e-06, "Full-pretrain/Loss": 1.990128993988037, "Full-pretrain/Loss (Raw)": 1.9706854820251465, "Full-pretrain/Step": 7237, "Full-pretrain/Step Time": 17.631090588867664} +{"Full-pretrain/Learning Rate": 7.2354886935371705e-06, "Full-pretrain/Loss": 1.9788610935211182, "Full-pretrain/Loss (Raw)": 1.6997789144515991, "Full-pretrain/Step": 7238, "Full-pretrain/Step Time": 17.630965230986476} +{"Full-pretrain/Learning Rate": 7.229515462177408e-06, "Full-pretrain/Loss": 1.967971682548523, "Full-pretrain/Loss (Raw)": 1.48651921749115, "Full-pretrain/Step": 7239, "Full-pretrain/Step Time": 17.62456865236163} +{"Full-pretrain/Learning Rate": 7.223544280636801e-06, "Full-pretrain/Loss": 1.9763171672821045, "Full-pretrain/Loss (Raw)": 2.006378173828125, "Full-pretrain/Step": 7240, "Full-pretrain/Step Time": 17.625134671106935} +{"Full-pretrain/Learning Rate": 7.217575149604105e-06, "Full-pretrain/Loss": 1.9754793643951416, "Full-pretrain/Loss (Raw)": 1.8608230352401733, "Full-pretrain/Step": 7241, "Full-pretrain/Step Time": 17.62626896612346} +{"Full-pretrain/Learning Rate": 7.211608069767867e-06, "Full-pretrain/Loss": 1.974466323852539, "Full-pretrain/Loss (Raw)": 1.9815629720687866, "Full-pretrain/Step": 7242, "Full-pretrain/Step Time": 17.625313388183713} +{"Full-pretrain/Learning Rate": 7.205643041816387e-06, "Full-pretrain/Loss": 1.9729770421981812, "Full-pretrain/Loss (Raw)": 1.975880742073059, "Full-pretrain/Step": 7243, "Full-pretrain/Step Time": 17.620137287303805} +{"Full-pretrain/Learning Rate": 7.199680066437728e-06, "Full-pretrain/Loss": 1.9620832204818726, "Full-pretrain/Loss (Raw)": 1.9582915306091309, "Full-pretrain/Step": 7244, "Full-pretrain/Step Time": 17.625695906579494} +{"Full-pretrain/Learning Rate": 7.193719144319727e-06, "Full-pretrain/Loss": 1.9581849575042725, "Full-pretrain/Loss (Raw)": 1.7689101696014404, "Full-pretrain/Step": 7245, "Full-pretrain/Step Time": 17.626584246754646} +{"Full-pretrain/Learning Rate": 7.187760276149955e-06, "Full-pretrain/Loss": 1.9514412879943848, "Full-pretrain/Loss (Raw)": 1.8035664558410645, "Full-pretrain/Step": 7246, "Full-pretrain/Step Time": 17.627289609983563} +{"Full-pretrain/Learning Rate": 7.181803462615777e-06, "Full-pretrain/Loss": 1.9522854089736938, "Full-pretrain/Loss (Raw)": 1.795235276222229, "Full-pretrain/Step": 7247, "Full-pretrain/Step Time": 17.62130176834762} +{"Full-pretrain/Learning Rate": 7.175848704404309e-06, "Full-pretrain/Loss": 1.926194429397583, "Full-pretrain/Loss (Raw)": 1.675950050354004, "Full-pretrain/Step": 7248, "Full-pretrain/Step Time": 17.630021896213293} +{"Full-pretrain/Learning Rate": 7.1698960022024335e-06, "Full-pretrain/Loss": 1.919947862625122, "Full-pretrain/Loss (Raw)": 1.9420644044876099, "Full-pretrain/Step": 7249, "Full-pretrain/Step Time": 17.6248278003186} +{"Full-pretrain/Learning Rate": 7.163945356696783e-06, "Full-pretrain/Loss": 1.9092528820037842, "Full-pretrain/Loss (Raw)": 1.8186630010604858, "Full-pretrain/Step": 7250, "Full-pretrain/Step Time": 17.627059295773506} +{"Full-pretrain/Learning Rate": 7.157996768573774e-06, "Full-pretrain/Loss": 1.8930200338363647, "Full-pretrain/Loss (Raw)": 1.665149450302124, "Full-pretrain/Step": 7251, "Full-pretrain/Step Time": 17.620033172890544} +{"Full-pretrain/Learning Rate": 7.152050238519561e-06, "Full-pretrain/Loss": 1.8876869678497314, "Full-pretrain/Loss (Raw)": 1.6811470985412598, "Full-pretrain/Step": 7252, "Full-pretrain/Step Time": 17.632288904860616} +{"Full-pretrain/Learning Rate": 7.146105767220082e-06, "Full-pretrain/Loss": 1.8887996673583984, "Full-pretrain/Loss (Raw)": 1.9916584491729736, "Full-pretrain/Step": 7253, "Full-pretrain/Step Time": 17.63157340325415} +{"Full-pretrain/Learning Rate": 7.140163355361027e-06, "Full-pretrain/Loss": 1.8825002908706665, "Full-pretrain/Loss (Raw)": 1.929128646850586, "Full-pretrain/Step": 7254, "Full-pretrain/Step Time": 17.64169531315565} +{"Full-pretrain/Learning Rate": 7.134223003627852e-06, "Full-pretrain/Loss": 1.8859165906906128, "Full-pretrain/Loss (Raw)": 1.9697717428207397, "Full-pretrain/Step": 7255, "Full-pretrain/Step Time": 17.63187804631889} +{"Full-pretrain/Learning Rate": 7.128284712705782e-06, "Full-pretrain/Loss": 1.8757305145263672, "Full-pretrain/Loss (Raw)": 1.6884433031082153, "Full-pretrain/Step": 7256, "Full-pretrain/Step Time": 17.63778095319867} +{"Full-pretrain/Learning Rate": 7.122348483279784e-06, "Full-pretrain/Loss": 1.8761812448501587, "Full-pretrain/Loss (Raw)": 2.1510229110717773, "Full-pretrain/Step": 7257, "Full-pretrain/Step Time": 17.63899863138795} +{"Full-pretrain/Learning Rate": 7.1164143160346055e-06, "Full-pretrain/Loss": 1.8752390146255493, "Full-pretrain/Loss (Raw)": 1.9840927124023438, "Full-pretrain/Step": 7258, "Full-pretrain/Step Time": 17.645112618803978} +{"Full-pretrain/Learning Rate": 7.110482211654751e-06, "Full-pretrain/Loss": 1.873202919960022, "Full-pretrain/Loss (Raw)": 1.7844570875167847, "Full-pretrain/Step": 7259, "Full-pretrain/Step Time": 17.63253542035818} +{"Full-pretrain/Learning Rate": 7.104552170824485e-06, "Full-pretrain/Loss": 1.8695987462997437, "Full-pretrain/Loss (Raw)": 1.7136187553405762, "Full-pretrain/Step": 7260, "Full-pretrain/Step Time": 17.637709537521005} +{"Full-pretrain/Learning Rate": 7.0986241942278455e-06, "Full-pretrain/Loss": 1.8862519264221191, "Full-pretrain/Loss (Raw)": 1.9248565435409546, "Full-pretrain/Step": 7261, "Full-pretrain/Step Time": 17.637619096785784} +{"Full-pretrain/Learning Rate": 7.092698282548607e-06, "Full-pretrain/Loss": 1.8796350955963135, "Full-pretrain/Loss (Raw)": 1.959349274635315, "Full-pretrain/Step": 7262, "Full-pretrain/Step Time": 17.63713694922626} +{"Full-pretrain/Learning Rate": 7.086774436470328e-06, "Full-pretrain/Loss": 1.86539626121521, "Full-pretrain/Loss (Raw)": 1.6835026741027832, "Full-pretrain/Step": 7263, "Full-pretrain/Step Time": 17.63457772321999} +{"Full-pretrain/Learning Rate": 7.080852656676323e-06, "Full-pretrain/Loss": 1.8642497062683105, "Full-pretrain/Loss (Raw)": 1.7671570777893066, "Full-pretrain/Step": 7264, "Full-pretrain/Step Time": 17.634766122326255} +{"Full-pretrain/Learning Rate": 7.074932943849677e-06, "Full-pretrain/Loss": 1.860967755317688, "Full-pretrain/Loss (Raw)": 1.8647712469100952, "Full-pretrain/Step": 7265, "Full-pretrain/Step Time": 17.632945807650685} +{"Full-pretrain/Learning Rate": 7.069015298673206e-06, "Full-pretrain/Loss": 1.8645557165145874, "Full-pretrain/Loss (Raw)": 2.0777926445007324, "Full-pretrain/Step": 7266, "Full-pretrain/Step Time": 17.640175892040133} +{"Full-pretrain/Learning Rate": 7.063099721829528e-06, "Full-pretrain/Loss": 1.871220588684082, "Full-pretrain/Loss (Raw)": 2.155837297439575, "Full-pretrain/Step": 7267, "Full-pretrain/Step Time": 17.63366600871086} +{"Full-pretrain/Learning Rate": 7.057186214000985e-06, "Full-pretrain/Loss": 1.858662486076355, "Full-pretrain/Loss (Raw)": 1.7411320209503174, "Full-pretrain/Step": 7268, "Full-pretrain/Step Time": 17.636095590889454} +{"Full-pretrain/Learning Rate": 7.0512747758697066e-06, "Full-pretrain/Loss": 1.863957166671753, "Full-pretrain/Loss (Raw)": 2.1401147842407227, "Full-pretrain/Step": 7269, "Full-pretrain/Step Time": 17.63673485442996} +{"Full-pretrain/Learning Rate": 7.045365408117574e-06, "Full-pretrain/Loss": 1.8772913217544556, "Full-pretrain/Loss (Raw)": 2.1264710426330566, "Full-pretrain/Step": 7270, "Full-pretrain/Step Time": 17.63945384696126} +{"Full-pretrain/Learning Rate": 7.039458111426242e-06, "Full-pretrain/Loss": 1.8912811279296875, "Full-pretrain/Loss (Raw)": 1.9341936111450195, "Full-pretrain/Step": 7271, "Full-pretrain/Step Time": 17.627291325479746} +{"Full-pretrain/Learning Rate": 7.033552886477096e-06, "Full-pretrain/Loss": 1.8947057723999023, "Full-pretrain/Loss (Raw)": 2.1159653663635254, "Full-pretrain/Step": 7272, "Full-pretrain/Step Time": 17.627953618764877} +{"Full-pretrain/Learning Rate": 7.0276497339513105e-06, "Full-pretrain/Loss": 1.9018256664276123, "Full-pretrain/Loss (Raw)": 2.0886611938476562, "Full-pretrain/Step": 7273, "Full-pretrain/Step Time": 17.625119483098388} +{"Full-pretrain/Learning Rate": 7.021748654529814e-06, "Full-pretrain/Loss": 1.9010803699493408, "Full-pretrain/Loss (Raw)": 1.9577152729034424, "Full-pretrain/Step": 7274, "Full-pretrain/Step Time": 17.6285267341882} +{"Full-pretrain/Learning Rate": 7.015849648893288e-06, "Full-pretrain/Loss": 1.8944274187088013, "Full-pretrain/Loss (Raw)": 1.762984037399292, "Full-pretrain/Step": 7275, "Full-pretrain/Step Time": 17.629854956641793} +{"Full-pretrain/Learning Rate": 7.009952717722191e-06, "Full-pretrain/Loss": 1.8933771848678589, "Full-pretrain/Loss (Raw)": 1.9246855974197388, "Full-pretrain/Step": 7276, "Full-pretrain/Step Time": 17.629550317302346} +{"Full-pretrain/Learning Rate": 7.004057861696728e-06, "Full-pretrain/Loss": 1.895712971687317, "Full-pretrain/Loss (Raw)": 1.8436548709869385, "Full-pretrain/Step": 7277, "Full-pretrain/Step Time": 17.630694527179003} +{"Full-pretrain/Learning Rate": 6.998165081496863e-06, "Full-pretrain/Loss": 1.9040789604187012, "Full-pretrain/Loss (Raw)": 2.0712788105010986, "Full-pretrain/Step": 7278, "Full-pretrain/Step Time": 17.631084071472287} +{"Full-pretrain/Learning Rate": 6.992274377802327e-06, "Full-pretrain/Loss": 1.9060556888580322, "Full-pretrain/Loss (Raw)": 1.8584907054901123, "Full-pretrain/Step": 7279, "Full-pretrain/Step Time": 17.623751873150468} +{"Full-pretrain/Learning Rate": 6.986385751292615e-06, "Full-pretrain/Loss": 1.9121222496032715, "Full-pretrain/Loss (Raw)": 1.870077133178711, "Full-pretrain/Step": 7280, "Full-pretrain/Step Time": 17.619940077885985} +{"Full-pretrain/Learning Rate": 6.980499202646981e-06, "Full-pretrain/Loss": 1.911945104598999, "Full-pretrain/Loss (Raw)": 1.9363970756530762, "Full-pretrain/Step": 7281, "Full-pretrain/Step Time": 17.628247022628784} +{"Full-pretrain/Learning Rate": 6.974614732544427e-06, "Full-pretrain/Loss": 1.9150669574737549, "Full-pretrain/Loss (Raw)": 1.9185642004013062, "Full-pretrain/Step": 7282, "Full-pretrain/Step Time": 17.62659747339785} +{"Full-pretrain/Learning Rate": 6.9687323416637335e-06, "Full-pretrain/Loss": 1.9246187210083008, "Full-pretrain/Loss (Raw)": 1.9708051681518555, "Full-pretrain/Step": 7283, "Full-pretrain/Step Time": 17.628130055963993} +{"Full-pretrain/Learning Rate": 6.962852030683423e-06, "Full-pretrain/Loss": 1.935380220413208, "Full-pretrain/Loss (Raw)": 2.025513172149658, "Full-pretrain/Step": 7284, "Full-pretrain/Step Time": 17.631704611703753} +{"Full-pretrain/Learning Rate": 6.95697380028179e-06, "Full-pretrain/Loss": 1.9268109798431396, "Full-pretrain/Loss (Raw)": 1.7174427509307861, "Full-pretrain/Step": 7285, "Full-pretrain/Step Time": 17.633388876914978} +{"Full-pretrain/Learning Rate": 6.951097651136889e-06, "Full-pretrain/Loss": 1.9299211502075195, "Full-pretrain/Loss (Raw)": 2.0286569595336914, "Full-pretrain/Step": 7286, "Full-pretrain/Step Time": 17.635966742411256} +{"Full-pretrain/Learning Rate": 6.9452235839265385e-06, "Full-pretrain/Loss": 1.9196083545684814, "Full-pretrain/Loss (Raw)": 1.6397639513015747, "Full-pretrain/Step": 7287, "Full-pretrain/Step Time": 17.631642976775765} +{"Full-pretrain/Learning Rate": 6.9393515993282976e-06, "Full-pretrain/Loss": 1.934838056564331, "Full-pretrain/Loss (Raw)": 2.1757895946502686, "Full-pretrain/Step": 7288, "Full-pretrain/Step Time": 17.63093053176999} +{"Full-pretrain/Learning Rate": 6.9334816980195005e-06, "Full-pretrain/Loss": 1.9332423210144043, "Full-pretrain/Loss (Raw)": 2.0999603271484375, "Full-pretrain/Step": 7289, "Full-pretrain/Step Time": 17.634281126782298} +{"Full-pretrain/Learning Rate": 6.927613880677239e-06, "Full-pretrain/Loss": 1.9396662712097168, "Full-pretrain/Loss (Raw)": 2.1896615028381348, "Full-pretrain/Step": 7290, "Full-pretrain/Step Time": 17.640031047165394} +{"Full-pretrain/Learning Rate": 6.921748147978368e-06, "Full-pretrain/Loss": 1.9445799589157104, "Full-pretrain/Loss (Raw)": 1.9416933059692383, "Full-pretrain/Step": 7291, "Full-pretrain/Step Time": 17.63556207716465} +{"Full-pretrain/Learning Rate": 6.915884500599501e-06, "Full-pretrain/Loss": 1.9524269104003906, "Full-pretrain/Loss (Raw)": 1.9647190570831299, "Full-pretrain/Step": 7292, "Full-pretrain/Step Time": 17.62843542546034} +{"Full-pretrain/Learning Rate": 6.910022939216995e-06, "Full-pretrain/Loss": 1.9597468376159668, "Full-pretrain/Loss (Raw)": 2.159095048904419, "Full-pretrain/Step": 7293, "Full-pretrain/Step Time": 17.62345248274505} +{"Full-pretrain/Learning Rate": 6.904163464506985e-06, "Full-pretrain/Loss": 1.9521286487579346, "Full-pretrain/Loss (Raw)": 1.715570330619812, "Full-pretrain/Step": 7294, "Full-pretrain/Step Time": 17.624756002798676} +{"Full-pretrain/Learning Rate": 6.8983060771453614e-06, "Full-pretrain/Loss": 1.9666006565093994, "Full-pretrain/Loss (Raw)": 2.1466052532196045, "Full-pretrain/Step": 7295, "Full-pretrain/Step Time": 17.629648476839066} +{"Full-pretrain/Learning Rate": 6.892450777807769e-06, "Full-pretrain/Loss": 1.972473382949829, "Full-pretrain/Loss (Raw)": 1.9550851583480835, "Full-pretrain/Step": 7296, "Full-pretrain/Step Time": 17.621808752417564} +{"Full-pretrain/Learning Rate": 6.886597567169617e-06, "Full-pretrain/Loss": 1.979013442993164, "Full-pretrain/Loss (Raw)": 2.074052333831787, "Full-pretrain/Step": 7297, "Full-pretrain/Step Time": 17.621721774339676} +{"Full-pretrain/Learning Rate": 6.880746445906075e-06, "Full-pretrain/Loss": 1.9845768213272095, "Full-pretrain/Loss (Raw)": 2.255824565887451, "Full-pretrain/Step": 7298, "Full-pretrain/Step Time": 17.626449208706617} +{"Full-pretrain/Learning Rate": 6.874897414692058e-06, "Full-pretrain/Loss": 1.978101372718811, "Full-pretrain/Loss (Raw)": 1.9486192464828491, "Full-pretrain/Step": 7299, "Full-pretrain/Step Time": 17.635997381061316} +{"Full-pretrain/Learning Rate": 6.869050474202263e-06, "Full-pretrain/Loss": 1.9853525161743164, "Full-pretrain/Loss (Raw)": 1.9731743335723877, "Full-pretrain/Step": 7300, "Full-pretrain/Step Time": 17.63292732834816} +{"Full-pretrain/Learning Rate": 6.863205625111113e-06, "Full-pretrain/Loss": 1.9806132316589355, "Full-pretrain/Loss (Raw)": 1.9884536266326904, "Full-pretrain/Step": 7301, "Full-pretrain/Step Time": 17.62909794598818} +{"Full-pretrain/Learning Rate": 6.857362868092823e-06, "Full-pretrain/Loss": 1.9690606594085693, "Full-pretrain/Loss (Raw)": 1.7567906379699707, "Full-pretrain/Step": 7302, "Full-pretrain/Step Time": 17.62844675593078} +{"Full-pretrain/Learning Rate": 6.851522203821359e-06, "Full-pretrain/Loss": 1.964867353439331, "Full-pretrain/Loss (Raw)": 1.8000035285949707, "Full-pretrain/Step": 7303, "Full-pretrain/Step Time": 17.63253204524517} +{"Full-pretrain/Learning Rate": 6.8456836329704205e-06, "Full-pretrain/Loss": 1.956494688987732, "Full-pretrain/Loss (Raw)": 1.8480448722839355, "Full-pretrain/Step": 7304, "Full-pretrain/Step Time": 17.628085607662797} +{"Full-pretrain/Learning Rate": 6.839847156213497e-06, "Full-pretrain/Loss": 1.9438300132751465, "Full-pretrain/Loss (Raw)": 1.683388590812683, "Full-pretrain/Step": 7305, "Full-pretrain/Step Time": 17.625465342774987} +{"Full-pretrain/Learning Rate": 6.834012774223822e-06, "Full-pretrain/Loss": 1.936365008354187, "Full-pretrain/Loss (Raw)": 1.7188352346420288, "Full-pretrain/Step": 7306, "Full-pretrain/Step Time": 17.62432443164289} +{"Full-pretrain/Learning Rate": 6.8281804876743875e-06, "Full-pretrain/Loss": 1.9419691562652588, "Full-pretrain/Loss (Raw)": 1.9423134326934814, "Full-pretrain/Step": 7307, "Full-pretrain/Step Time": 17.630461525171995} +{"Full-pretrain/Learning Rate": 6.822350297237959e-06, "Full-pretrain/Loss": 1.9380362033843994, "Full-pretrain/Loss (Raw)": 1.7988322973251343, "Full-pretrain/Step": 7308, "Full-pretrain/Step Time": 17.620253263041377} +{"Full-pretrain/Learning Rate": 6.816522203587025e-06, "Full-pretrain/Loss": 1.9344637393951416, "Full-pretrain/Loss (Raw)": 1.729338526725769, "Full-pretrain/Step": 7309, "Full-pretrain/Step Time": 17.622330840677023} +{"Full-pretrain/Learning Rate": 6.810696207393865e-06, "Full-pretrain/Loss": 1.9264469146728516, "Full-pretrain/Loss (Raw)": 1.8147375583648682, "Full-pretrain/Step": 7310, "Full-pretrain/Step Time": 17.618565695360303} +{"Full-pretrain/Learning Rate": 6.804872309330506e-06, "Full-pretrain/Loss": 1.9334200620651245, "Full-pretrain/Loss (Raw)": 2.081629991531372, "Full-pretrain/Step": 7311, "Full-pretrain/Step Time": 17.61979760043323} +{"Full-pretrain/Learning Rate": 6.799050510068733e-06, "Full-pretrain/Loss": 1.9341315031051636, "Full-pretrain/Loss (Raw)": 1.8928461074829102, "Full-pretrain/Step": 7312, "Full-pretrain/Step Time": 17.620032789185643} +{"Full-pretrain/Learning Rate": 6.793230810280094e-06, "Full-pretrain/Loss": 1.9471020698547363, "Full-pretrain/Loss (Raw)": 2.3514552116394043, "Full-pretrain/Step": 7313, "Full-pretrain/Step Time": 17.620490711182356} +{"Full-pretrain/Learning Rate": 6.7874132106358734e-06, "Full-pretrain/Loss": 1.9518153667449951, "Full-pretrain/Loss (Raw)": 2.069387435913086, "Full-pretrain/Step": 7314, "Full-pretrain/Step Time": 17.623096792027354} +{"Full-pretrain/Learning Rate": 6.781597711807141e-06, "Full-pretrain/Loss": 1.9419584274291992, "Full-pretrain/Loss (Raw)": 1.6553874015808105, "Full-pretrain/Step": 7315, "Full-pretrain/Step Time": 17.62634073384106} +{"Full-pretrain/Learning Rate": 6.775784314464717e-06, "Full-pretrain/Loss": 1.9429376125335693, "Full-pretrain/Loss (Raw)": 2.0568456649780273, "Full-pretrain/Step": 7316, "Full-pretrain/Step Time": 17.628962045535445} +{"Full-pretrain/Learning Rate": 6.76997301927916e-06, "Full-pretrain/Loss": 1.9440603256225586, "Full-pretrain/Loss (Raw)": 1.7533693313598633, "Full-pretrain/Step": 7317, "Full-pretrain/Step Time": 17.633159540593624} +{"Full-pretrain/Learning Rate": 6.764163826920808e-06, "Full-pretrain/Loss": 1.9456067085266113, "Full-pretrain/Loss (Raw)": 2.0781402587890625, "Full-pretrain/Step": 7318, "Full-pretrain/Step Time": 17.635062647983432} +{"Full-pretrain/Learning Rate": 6.75835673805976e-06, "Full-pretrain/Loss": 1.9469925165176392, "Full-pretrain/Loss (Raw)": 1.684112310409546, "Full-pretrain/Step": 7319, "Full-pretrain/Step Time": 17.633385583758354} +{"Full-pretrain/Learning Rate": 6.752551753365843e-06, "Full-pretrain/Loss": 1.9401230812072754, "Full-pretrain/Loss (Raw)": 1.9559667110443115, "Full-pretrain/Step": 7320, "Full-pretrain/Step Time": 17.63872961141169} +{"Full-pretrain/Learning Rate": 6.746748873508668e-06, "Full-pretrain/Loss": 1.9370863437652588, "Full-pretrain/Loss (Raw)": 2.0027828216552734, "Full-pretrain/Step": 7321, "Full-pretrain/Step Time": 17.635254615917802} +{"Full-pretrain/Learning Rate": 6.740948099157596e-06, "Full-pretrain/Loss": 1.9276469945907593, "Full-pretrain/Loss (Raw)": 1.887605905532837, "Full-pretrain/Step": 7322, "Full-pretrain/Step Time": 17.639429019764066} +{"Full-pretrain/Learning Rate": 6.7351494309817434e-06, "Full-pretrain/Loss": 1.9307751655578613, "Full-pretrain/Loss (Raw)": 2.0417919158935547, "Full-pretrain/Step": 7323, "Full-pretrain/Step Time": 17.637933751568198} +{"Full-pretrain/Learning Rate": 6.729352869649994e-06, "Full-pretrain/Loss": 1.9258482456207275, "Full-pretrain/Loss (Raw)": 1.807058572769165, "Full-pretrain/Step": 7324, "Full-pretrain/Step Time": 17.642522102221847} +{"Full-pretrain/Learning Rate": 6.723558415830963e-06, "Full-pretrain/Loss": 1.9238977432250977, "Full-pretrain/Loss (Raw)": 2.096682548522949, "Full-pretrain/Step": 7325, "Full-pretrain/Step Time": 17.63693831115961} +{"Full-pretrain/Learning Rate": 6.717766070193043e-06, "Full-pretrain/Loss": 1.9384087324142456, "Full-pretrain/Loss (Raw)": 2.1799206733703613, "Full-pretrain/Step": 7326, "Full-pretrain/Step Time": 17.631750168278813} +{"Full-pretrain/Learning Rate": 6.7119758334043856e-06, "Full-pretrain/Loss": 1.9369947910308838, "Full-pretrain/Loss (Raw)": 2.101357936859131, "Full-pretrain/Step": 7327, "Full-pretrain/Step Time": 17.629471438005567} +{"Full-pretrain/Learning Rate": 6.706187706132888e-06, "Full-pretrain/Loss": 1.942521095275879, "Full-pretrain/Loss (Raw)": 2.1319265365600586, "Full-pretrain/Step": 7328, "Full-pretrain/Step Time": 17.634906252846122} +{"Full-pretrain/Learning Rate": 6.700401689046218e-06, "Full-pretrain/Loss": 1.9443559646606445, "Full-pretrain/Loss (Raw)": 2.1327714920043945, "Full-pretrain/Step": 7329, "Full-pretrain/Step Time": 17.62729367427528} +{"Full-pretrain/Learning Rate": 6.6946177828117716e-06, "Full-pretrain/Loss": 1.9357645511627197, "Full-pretrain/Loss (Raw)": 1.9808945655822754, "Full-pretrain/Step": 7330, "Full-pretrain/Step Time": 17.626751709729433} +{"Full-pretrain/Learning Rate": 6.688835988096734e-06, "Full-pretrain/Loss": 1.9390714168548584, "Full-pretrain/Loss (Raw)": 2.0544397830963135, "Full-pretrain/Step": 7331, "Full-pretrain/Step Time": 17.625820411369205} +{"Full-pretrain/Learning Rate": 6.683056305568036e-06, "Full-pretrain/Loss": 1.922577142715454, "Full-pretrain/Loss (Raw)": 1.4453556537628174, "Full-pretrain/Step": 7332, "Full-pretrain/Step Time": 17.63778313808143} +{"Full-pretrain/Learning Rate": 6.6772787358923476e-06, "Full-pretrain/Loss": 1.9218552112579346, "Full-pretrain/Loss (Raw)": 1.9653557538986206, "Full-pretrain/Step": 7333, "Full-pretrain/Step Time": 17.636211536824703} +{"Full-pretrain/Learning Rate": 6.671503279736122e-06, "Full-pretrain/Loss": 1.9294564723968506, "Full-pretrain/Loss (Raw)": 2.000030755996704, "Full-pretrain/Step": 7334, "Full-pretrain/Step Time": 17.630101775750518} +{"Full-pretrain/Learning Rate": 6.665729937765555e-06, "Full-pretrain/Loss": 1.955225944519043, "Full-pretrain/Loss (Raw)": 2.6246297359466553, "Full-pretrain/Step": 7335, "Full-pretrain/Step Time": 17.627747770398855} +{"Full-pretrain/Learning Rate": 6.659958710646591e-06, "Full-pretrain/Loss": 1.9626129865646362, "Full-pretrain/Loss (Raw)": 2.0844268798828125, "Full-pretrain/Step": 7336, "Full-pretrain/Step Time": 17.63271938636899} +{"Full-pretrain/Learning Rate": 6.654189599044947e-06, "Full-pretrain/Loss": 1.9760971069335938, "Full-pretrain/Loss (Raw)": 2.1148767471313477, "Full-pretrain/Step": 7337, "Full-pretrain/Step Time": 17.631647530943155} +{"Full-pretrain/Learning Rate": 6.648422603626081e-06, "Full-pretrain/Loss": 1.9825968742370605, "Full-pretrain/Loss (Raw)": 1.9268279075622559, "Full-pretrain/Step": 7338, "Full-pretrain/Step Time": 17.628951443359256} +{"Full-pretrain/Learning Rate": 6.64265772505522e-06, "Full-pretrain/Loss": 1.979552149772644, "Full-pretrain/Loss (Raw)": 1.8448832035064697, "Full-pretrain/Step": 7339, "Full-pretrain/Step Time": 17.625664796680212} +{"Full-pretrain/Learning Rate": 6.636894963997348e-06, "Full-pretrain/Loss": 1.9781074523925781, "Full-pretrain/Loss (Raw)": 1.75260329246521, "Full-pretrain/Step": 7340, "Full-pretrain/Step Time": 17.627030484378338} +{"Full-pretrain/Learning Rate": 6.63113432111718e-06, "Full-pretrain/Loss": 1.9828338623046875, "Full-pretrain/Loss (Raw)": 1.8805832862854004, "Full-pretrain/Step": 7341, "Full-pretrain/Step Time": 17.634722197428346} +{"Full-pretrain/Learning Rate": 6.625375797079214e-06, "Full-pretrain/Loss": 1.9883439540863037, "Full-pretrain/Loss (Raw)": 1.9910591840744019, "Full-pretrain/Step": 7342, "Full-pretrain/Step Time": 17.629108091816306} +{"Full-pretrain/Learning Rate": 6.619619392547693e-06, "Full-pretrain/Loss": 1.9772369861602783, "Full-pretrain/Loss (Raw)": 1.7262053489685059, "Full-pretrain/Step": 7343, "Full-pretrain/Step Time": 17.62513126246631} +{"Full-pretrain/Learning Rate": 6.6138651081866144e-06, "Full-pretrain/Loss": 1.9817733764648438, "Full-pretrain/Loss (Raw)": 2.0380167961120605, "Full-pretrain/Step": 7344, "Full-pretrain/Step Time": 17.629241600632668} +{"Full-pretrain/Learning Rate": 6.608112944659742e-06, "Full-pretrain/Loss": 1.9685802459716797, "Full-pretrain/Loss (Raw)": 1.9292738437652588, "Full-pretrain/Step": 7345, "Full-pretrain/Step Time": 17.629314677789807} +{"Full-pretrain/Learning Rate": 6.602362902630571e-06, "Full-pretrain/Loss": 1.9682281017303467, "Full-pretrain/Loss (Raw)": 2.0581154823303223, "Full-pretrain/Step": 7346, "Full-pretrain/Step Time": 17.620198357850313} +{"Full-pretrain/Learning Rate": 6.596614982762373e-06, "Full-pretrain/Loss": 1.977396845817566, "Full-pretrain/Loss (Raw)": 1.9487884044647217, "Full-pretrain/Step": 7347, "Full-pretrain/Step Time": 17.62295944057405} +{"Full-pretrain/Learning Rate": 6.590869185718168e-06, "Full-pretrain/Loss": 1.977856159210205, "Full-pretrain/Loss (Raw)": 2.0715439319610596, "Full-pretrain/Step": 7348, "Full-pretrain/Step Time": 17.621867790818214} +{"Full-pretrain/Learning Rate": 6.5851255121607415e-06, "Full-pretrain/Loss": 1.977654218673706, "Full-pretrain/Loss (Raw)": 1.74690842628479, "Full-pretrain/Step": 7349, "Full-pretrain/Step Time": 17.63162659853697} +{"Full-pretrain/Learning Rate": 6.579383962752611e-06, "Full-pretrain/Loss": 1.9750375747680664, "Full-pretrain/Loss (Raw)": 1.9944045543670654, "Full-pretrain/Step": 7350, "Full-pretrain/Step Time": 17.62190960906446} +{"Full-pretrain/Learning Rate": 6.5736445381560705e-06, "Full-pretrain/Loss": 1.9710596799850464, "Full-pretrain/Loss (Raw)": 1.55682373046875, "Full-pretrain/Step": 7351, "Full-pretrain/Step Time": 17.619837326928973} +{"Full-pretrain/Learning Rate": 6.567907239033153e-06, "Full-pretrain/Loss": 1.9741363525390625, "Full-pretrain/Loss (Raw)": 2.054419755935669, "Full-pretrain/Step": 7352, "Full-pretrain/Step Time": 17.624903397634625} +{"Full-pretrain/Learning Rate": 6.562172066045655e-06, "Full-pretrain/Loss": 1.9755499362945557, "Full-pretrain/Loss (Raw)": 2.048015594482422, "Full-pretrain/Step": 7353, "Full-pretrain/Step Time": 17.6340896114707} +{"Full-pretrain/Learning Rate": 6.556439019855132e-06, "Full-pretrain/Loss": 1.9794466495513916, "Full-pretrain/Loss (Raw)": 2.0123000144958496, "Full-pretrain/Step": 7354, "Full-pretrain/Step Time": 17.63024210371077} +{"Full-pretrain/Learning Rate": 6.550708101122885e-06, "Full-pretrain/Loss": 1.9773850440979004, "Full-pretrain/Loss (Raw)": 1.9758225679397583, "Full-pretrain/Step": 7355, "Full-pretrain/Step Time": 17.630348714068532} +{"Full-pretrain/Learning Rate": 6.544979310509983e-06, "Full-pretrain/Loss": 1.9770548343658447, "Full-pretrain/Loss (Raw)": 1.7964887619018555, "Full-pretrain/Step": 7356, "Full-pretrain/Step Time": 17.632639046758413} +{"Full-pretrain/Learning Rate": 6.539252648677224e-06, "Full-pretrain/Loss": 1.9738541841506958, "Full-pretrain/Loss (Raw)": 1.9942620992660522, "Full-pretrain/Step": 7357, "Full-pretrain/Step Time": 17.63713035173714} +{"Full-pretrain/Learning Rate": 6.533528116285184e-06, "Full-pretrain/Loss": 1.9625213146209717, "Full-pretrain/Loss (Raw)": 1.8172717094421387, "Full-pretrain/Step": 7358, "Full-pretrain/Step Time": 17.635225471109152} +{"Full-pretrain/Learning Rate": 6.527805713994189e-06, "Full-pretrain/Loss": 1.9569143056869507, "Full-pretrain/Loss (Raw)": 1.9219317436218262, "Full-pretrain/Step": 7359, "Full-pretrain/Step Time": 17.64208896830678} +{"Full-pretrain/Learning Rate": 6.52208544246431e-06, "Full-pretrain/Loss": 1.9458788633346558, "Full-pretrain/Loss (Raw)": 1.7787925004959106, "Full-pretrain/Step": 7360, "Full-pretrain/Step Time": 17.637309005483985} +{"Full-pretrain/Learning Rate": 6.5163673023553915e-06, "Full-pretrain/Loss": 1.9356772899627686, "Full-pretrain/Loss (Raw)": 1.8063228130340576, "Full-pretrain/Step": 7361, "Full-pretrain/Step Time": 17.639944640919566} +{"Full-pretrain/Learning Rate": 6.5106512943269995e-06, "Full-pretrain/Loss": 1.937862753868103, "Full-pretrain/Loss (Raw)": 2.050827741622925, "Full-pretrain/Step": 7362, "Full-pretrain/Step Time": 17.6405986584723} +{"Full-pretrain/Learning Rate": 6.504937419038485e-06, "Full-pretrain/Loss": 1.9293938875198364, "Full-pretrain/Loss (Raw)": 1.783435583114624, "Full-pretrain/Step": 7363, "Full-pretrain/Step Time": 17.63771764561534} +{"Full-pretrain/Learning Rate": 6.49922567714894e-06, "Full-pretrain/Loss": 1.9439241886138916, "Full-pretrain/Loss (Raw)": 1.9103275537490845, "Full-pretrain/Step": 7364, "Full-pretrain/Step Time": 17.637758515775204} +{"Full-pretrain/Learning Rate": 6.493516069317218e-06, "Full-pretrain/Loss": 1.94427490234375, "Full-pretrain/Loss (Raw)": 1.9765790700912476, "Full-pretrain/Step": 7365, "Full-pretrain/Step Time": 17.64483318850398} +{"Full-pretrain/Learning Rate": 6.487808596201905e-06, "Full-pretrain/Loss": 1.9419893026351929, "Full-pretrain/Loss (Raw)": 1.9268887042999268, "Full-pretrain/Step": 7366, "Full-pretrain/Step Time": 17.638827059417963} +{"Full-pretrain/Learning Rate": 6.482103258461372e-06, "Full-pretrain/Loss": 1.9202566146850586, "Full-pretrain/Loss (Raw)": 1.929182767868042, "Full-pretrain/Step": 7367, "Full-pretrain/Step Time": 17.642525270581245} +{"Full-pretrain/Learning Rate": 6.476400056753715e-06, "Full-pretrain/Loss": 1.9164626598358154, "Full-pretrain/Loss (Raw)": 1.9630200862884521, "Full-pretrain/Step": 7368, "Full-pretrain/Step Time": 17.645992336794734} +{"Full-pretrain/Learning Rate": 6.470698991736801e-06, "Full-pretrain/Loss": 1.916574239730835, "Full-pretrain/Loss (Raw)": 2.1184496879577637, "Full-pretrain/Step": 7369, "Full-pretrain/Step Time": 17.65109994262457} +{"Full-pretrain/Learning Rate": 6.4650000640682465e-06, "Full-pretrain/Loss": 1.911893367767334, "Full-pretrain/Loss (Raw)": 1.7770410776138306, "Full-pretrain/Step": 7370, "Full-pretrain/Step Time": 17.643640153110027} +{"Full-pretrain/Learning Rate": 6.459303274405429e-06, "Full-pretrain/Loss": 1.9176722764968872, "Full-pretrain/Loss (Raw)": 2.029804229736328, "Full-pretrain/Step": 7371, "Full-pretrain/Step Time": 17.649450501427054} +{"Full-pretrain/Learning Rate": 6.453608623405455e-06, "Full-pretrain/Loss": 1.9228615760803223, "Full-pretrain/Loss (Raw)": 1.91866135597229, "Full-pretrain/Step": 7372, "Full-pretrain/Step Time": 17.644592495635152} +{"Full-pretrain/Learning Rate": 6.44791611172521e-06, "Full-pretrain/Loss": 1.916982889175415, "Full-pretrain/Loss (Raw)": 1.6924676895141602, "Full-pretrain/Step": 7373, "Full-pretrain/Step Time": 17.64634562470019} +{"Full-pretrain/Learning Rate": 6.442225740021321e-06, "Full-pretrain/Loss": 1.9199151992797852, "Full-pretrain/Loss (Raw)": 2.0848891735076904, "Full-pretrain/Step": 7374, "Full-pretrain/Step Time": 17.64257111772895} +{"Full-pretrain/Learning Rate": 6.436537508950171e-06, "Full-pretrain/Loss": 1.9246500730514526, "Full-pretrain/Loss (Raw)": 1.8777235746383667, "Full-pretrain/Step": 7375, "Full-pretrain/Step Time": 17.646593859419227} +{"Full-pretrain/Learning Rate": 6.430851419167896e-06, "Full-pretrain/Loss": 1.9068493843078613, "Full-pretrain/Loss (Raw)": 1.4683952331542969, "Full-pretrain/Step": 7376, "Full-pretrain/Step Time": 17.64607339538634} +{"Full-pretrain/Learning Rate": 6.42516747133039e-06, "Full-pretrain/Loss": 1.905153512954712, "Full-pretrain/Loss (Raw)": 1.8750061988830566, "Full-pretrain/Step": 7377, "Full-pretrain/Step Time": 17.65038617886603} +{"Full-pretrain/Learning Rate": 6.419485666093283e-06, "Full-pretrain/Loss": 1.88672935962677, "Full-pretrain/Loss (Raw)": 1.4685420989990234, "Full-pretrain/Step": 7378, "Full-pretrain/Step Time": 17.645618544891477} +{"Full-pretrain/Learning Rate": 6.413806004111975e-06, "Full-pretrain/Loss": 1.893499493598938, "Full-pretrain/Loss (Raw)": 2.1654319763183594, "Full-pretrain/Step": 7379, "Full-pretrain/Step Time": 17.64999246969819} +{"Full-pretrain/Learning Rate": 6.408128486041612e-06, "Full-pretrain/Loss": 1.8960249423980713, "Full-pretrain/Loss (Raw)": 2.1523566246032715, "Full-pretrain/Step": 7380, "Full-pretrain/Step Time": 17.640841886401176} +{"Full-pretrain/Learning Rate": 6.402453112537094e-06, "Full-pretrain/Loss": 1.8982782363891602, "Full-pretrain/Loss (Raw)": 1.8190160989761353, "Full-pretrain/Step": 7381, "Full-pretrain/Step Time": 17.64968940988183} +{"Full-pretrain/Learning Rate": 6.396779884253082e-06, "Full-pretrain/Loss": 1.8958388566970825, "Full-pretrain/Loss (Raw)": 1.9163451194763184, "Full-pretrain/Step": 7382, "Full-pretrain/Step Time": 17.64257663860917} +{"Full-pretrain/Learning Rate": 6.391108801843965e-06, "Full-pretrain/Loss": 1.9036420583724976, "Full-pretrain/Loss (Raw)": 1.806525707244873, "Full-pretrain/Step": 7383, "Full-pretrain/Step Time": 17.647556111216545} +{"Full-pretrain/Learning Rate": 6.385439865963916e-06, "Full-pretrain/Loss": 1.9005745649337769, "Full-pretrain/Loss (Raw)": 1.95625901222229, "Full-pretrain/Step": 7384, "Full-pretrain/Step Time": 17.640499990433455} +{"Full-pretrain/Learning Rate": 6.379773077266829e-06, "Full-pretrain/Loss": 1.9005945920944214, "Full-pretrain/Loss (Raw)": 2.0486598014831543, "Full-pretrain/Step": 7385, "Full-pretrain/Step Time": 17.643454438075423} +{"Full-pretrain/Learning Rate": 6.374108436406373e-06, "Full-pretrain/Loss": 1.898188591003418, "Full-pretrain/Loss (Raw)": 1.9353067874908447, "Full-pretrain/Step": 7386, "Full-pretrain/Step Time": 17.639490449801087} +{"Full-pretrain/Learning Rate": 6.368445944035972e-06, "Full-pretrain/Loss": 1.9048144817352295, "Full-pretrain/Loss (Raw)": 2.187851667404175, "Full-pretrain/Step": 7387, "Full-pretrain/Step Time": 17.644814340397716} +{"Full-pretrain/Learning Rate": 6.3627856008087764e-06, "Full-pretrain/Loss": 1.9062716960906982, "Full-pretrain/Loss (Raw)": 1.84312105178833, "Full-pretrain/Step": 7388, "Full-pretrain/Step Time": 17.63961672410369} +{"Full-pretrain/Learning Rate": 6.357127407377711e-06, "Full-pretrain/Loss": 1.9030739068984985, "Full-pretrain/Loss (Raw)": 1.8919326066970825, "Full-pretrain/Step": 7389, "Full-pretrain/Step Time": 17.639832369983196} +{"Full-pretrain/Learning Rate": 6.3514713643954475e-06, "Full-pretrain/Loss": 1.916186809539795, "Full-pretrain/Loss (Raw)": 2.2368850708007812, "Full-pretrain/Step": 7390, "Full-pretrain/Step Time": 17.639187393710017} +{"Full-pretrain/Learning Rate": 6.345817472514409e-06, "Full-pretrain/Loss": 1.9053423404693604, "Full-pretrain/Loss (Raw)": 1.5749046802520752, "Full-pretrain/Step": 7391, "Full-pretrain/Step Time": 17.63992157764733} +{"Full-pretrain/Learning Rate": 6.340165732386777e-06, "Full-pretrain/Loss": 1.909290075302124, "Full-pretrain/Loss (Raw)": 1.9051227569580078, "Full-pretrain/Step": 7392, "Full-pretrain/Step Time": 17.640703659504652} +{"Full-pretrain/Learning Rate": 6.334516144664465e-06, "Full-pretrain/Loss": 1.9172122478485107, "Full-pretrain/Loss (Raw)": 2.059828281402588, "Full-pretrain/Step": 7393, "Full-pretrain/Step Time": 17.640672981739044} +{"Full-pretrain/Learning Rate": 6.328868709999153e-06, "Full-pretrain/Loss": 1.9162013530731201, "Full-pretrain/Loss (Raw)": 2.0184783935546875, "Full-pretrain/Step": 7394, "Full-pretrain/Step Time": 17.636363722383976} +{"Full-pretrain/Learning Rate": 6.323223429042275e-06, "Full-pretrain/Loss": 1.9255040884017944, "Full-pretrain/Loss (Raw)": 2.081127166748047, "Full-pretrain/Step": 7395, "Full-pretrain/Step Time": 17.637711253017187} +{"Full-pretrain/Learning Rate": 6.317580302445012e-06, "Full-pretrain/Loss": 1.9275710582733154, "Full-pretrain/Loss (Raw)": 1.9764704704284668, "Full-pretrain/Step": 7396, "Full-pretrain/Step Time": 17.640108471736312} +{"Full-pretrain/Learning Rate": 6.311939330858293e-06, "Full-pretrain/Loss": 1.9212980270385742, "Full-pretrain/Loss (Raw)": 1.7758443355560303, "Full-pretrain/Step": 7397, "Full-pretrain/Step Time": 17.640753395855427} +{"Full-pretrain/Learning Rate": 6.3063005149328146e-06, "Full-pretrain/Loss": 1.9256937503814697, "Full-pretrain/Loss (Raw)": 2.067547559738159, "Full-pretrain/Step": 7398, "Full-pretrain/Step Time": 17.6422199588269} +{"Full-pretrain/Learning Rate": 6.300663855318995e-06, "Full-pretrain/Loss": 1.9240357875823975, "Full-pretrain/Loss (Raw)": 1.8761317729949951, "Full-pretrain/Step": 7399, "Full-pretrain/Step Time": 17.64549993351102} +{"Full-pretrain/Learning Rate": 6.295029352667034e-06, "Full-pretrain/Loss": 1.9206393957138062, "Full-pretrain/Loss (Raw)": 1.8543343544006348, "Full-pretrain/Step": 7400, "Full-pretrain/Step Time": 17.646381245926023} +{"Full-pretrain/Learning Rate": 6.289397007626857e-06, "Full-pretrain/Loss": 1.9243139028549194, "Full-pretrain/Loss (Raw)": 2.2360353469848633, "Full-pretrain/Step": 7401, "Full-pretrain/Step Time": 17.64722187258303} +{"Full-pretrain/Learning Rate": 6.2837668208481606e-06, "Full-pretrain/Loss": 1.9238739013671875, "Full-pretrain/Loss (Raw)": 1.762960433959961, "Full-pretrain/Step": 7402, "Full-pretrain/Step Time": 17.64304897375405} +{"Full-pretrain/Learning Rate": 6.27813879298039e-06, "Full-pretrain/Loss": 1.9263213872909546, "Full-pretrain/Loss (Raw)": 2.108123302459717, "Full-pretrain/Step": 7403, "Full-pretrain/Step Time": 17.640944035723805} +{"Full-pretrain/Learning Rate": 6.272512924672724e-06, "Full-pretrain/Loss": 1.9269025325775146, "Full-pretrain/Loss (Raw)": 1.9372578859329224, "Full-pretrain/Step": 7404, "Full-pretrain/Step Time": 17.644586576148868} +{"Full-pretrain/Learning Rate": 6.266889216574112e-06, "Full-pretrain/Loss": 1.9284151792526245, "Full-pretrain/Loss (Raw)": 1.7408732175827026, "Full-pretrain/Step": 7405, "Full-pretrain/Step Time": 17.642175883054733} +{"Full-pretrain/Learning Rate": 6.261267669333243e-06, "Full-pretrain/Loss": 1.9268198013305664, "Full-pretrain/Loss (Raw)": 2.0338380336761475, "Full-pretrain/Step": 7406, "Full-pretrain/Step Time": 17.644964948296547} +{"Full-pretrain/Learning Rate": 6.255648283598564e-06, "Full-pretrain/Loss": 1.9245681762695312, "Full-pretrain/Loss (Raw)": 1.8056704998016357, "Full-pretrain/Step": 7407, "Full-pretrain/Step Time": 17.64689333923161} +{"Full-pretrain/Learning Rate": 6.250031060018277e-06, "Full-pretrain/Loss": 1.939738392829895, "Full-pretrain/Loss (Raw)": 1.9538429975509644, "Full-pretrain/Step": 7408, "Full-pretrain/Step Time": 17.64671652764082} +{"Full-pretrain/Learning Rate": 6.244415999240311e-06, "Full-pretrain/Loss": 1.942596435546875, "Full-pretrain/Loss (Raw)": 1.9664647579193115, "Full-pretrain/Step": 7409, "Full-pretrain/Step Time": 17.640184758231044} +{"Full-pretrain/Learning Rate": 6.238803101912366e-06, "Full-pretrain/Loss": 1.9636270999908447, "Full-pretrain/Loss (Raw)": 2.141519069671631, "Full-pretrain/Step": 7410, "Full-pretrain/Step Time": 17.642323885113} +{"Full-pretrain/Learning Rate": 6.23319236868189e-06, "Full-pretrain/Loss": 1.957679271697998, "Full-pretrain/Loss (Raw)": 1.9751052856445312, "Full-pretrain/Step": 7411, "Full-pretrain/Step Time": 17.635141720995307} +{"Full-pretrain/Learning Rate": 6.22758380019608e-06, "Full-pretrain/Loss": 1.9527148008346558, "Full-pretrain/Loss (Raw)": 1.993491768836975, "Full-pretrain/Step": 7412, "Full-pretrain/Step Time": 17.637957472354174} +{"Full-pretrain/Learning Rate": 6.221977397101889e-06, "Full-pretrain/Loss": 1.9553433656692505, "Full-pretrain/Loss (Raw)": 1.903128981590271, "Full-pretrain/Step": 7413, "Full-pretrain/Step Time": 17.634921053424478} +{"Full-pretrain/Learning Rate": 6.216373160045999e-06, "Full-pretrain/Loss": 1.9578564167022705, "Full-pretrain/Loss (Raw)": 1.9967625141143799, "Full-pretrain/Step": 7414, "Full-pretrain/Step Time": 17.631925869733095} +{"Full-pretrain/Learning Rate": 6.210771089674864e-06, "Full-pretrain/Loss": 1.9583628177642822, "Full-pretrain/Loss (Raw)": 1.8227330446243286, "Full-pretrain/Step": 7415, "Full-pretrain/Step Time": 17.63004257902503} +{"Full-pretrain/Learning Rate": 6.205171186634689e-06, "Full-pretrain/Loss": 1.9510815143585205, "Full-pretrain/Loss (Raw)": 1.7232561111450195, "Full-pretrain/Step": 7416, "Full-pretrain/Step Time": 17.632421975955367} +{"Full-pretrain/Learning Rate": 6.199573451571403e-06, "Full-pretrain/Loss": 1.9523508548736572, "Full-pretrain/Loss (Raw)": 2.08927583694458, "Full-pretrain/Step": 7417, "Full-pretrain/Step Time": 17.634223079308867} +{"Full-pretrain/Learning Rate": 6.193977885130714e-06, "Full-pretrain/Loss": 1.9506160020828247, "Full-pretrain/Loss (Raw)": 1.8797907829284668, "Full-pretrain/Step": 7418, "Full-pretrain/Step Time": 17.637896040454507} +{"Full-pretrain/Learning Rate": 6.188384487958074e-06, "Full-pretrain/Loss": 1.9320011138916016, "Full-pretrain/Loss (Raw)": 1.5921783447265625, "Full-pretrain/Step": 7419, "Full-pretrain/Step Time": 17.635042341426015} +{"Full-pretrain/Learning Rate": 6.182793260698666e-06, "Full-pretrain/Loss": 1.9412623643875122, "Full-pretrain/Loss (Raw)": 2.139479160308838, "Full-pretrain/Step": 7420, "Full-pretrain/Step Time": 17.646808210760355} +{"Full-pretrain/Learning Rate": 6.1772042039974415e-06, "Full-pretrain/Loss": 1.9460980892181396, "Full-pretrain/Loss (Raw)": 2.046678304672241, "Full-pretrain/Step": 7421, "Full-pretrain/Step Time": 17.647697715088725} +{"Full-pretrain/Learning Rate": 6.171617318499098e-06, "Full-pretrain/Loss": 1.9307646751403809, "Full-pretrain/Loss (Raw)": 1.7462158203125, "Full-pretrain/Step": 7422, "Full-pretrain/Step Time": 17.649761710315943} +{"Full-pretrain/Learning Rate": 6.166032604848079e-06, "Full-pretrain/Loss": 1.948398470878601, "Full-pretrain/Loss (Raw)": 2.13918399810791, "Full-pretrain/Step": 7423, "Full-pretrain/Step Time": 17.640634667128325} +{"Full-pretrain/Learning Rate": 6.160450063688589e-06, "Full-pretrain/Loss": 1.9358346462249756, "Full-pretrain/Loss (Raw)": 1.5030784606933594, "Full-pretrain/Step": 7424, "Full-pretrain/Step Time": 17.6477055195719} +{"Full-pretrain/Learning Rate": 6.154869695664556e-06, "Full-pretrain/Loss": 1.9304583072662354, "Full-pretrain/Loss (Raw)": 1.8877902030944824, "Full-pretrain/Step": 7425, "Full-pretrain/Step Time": 17.650973178446293} +{"Full-pretrain/Learning Rate": 6.1492915014196795e-06, "Full-pretrain/Loss": 1.9261186122894287, "Full-pretrain/Loss (Raw)": 1.8796058893203735, "Full-pretrain/Step": 7426, "Full-pretrain/Step Time": 17.651214146986604} +{"Full-pretrain/Learning Rate": 6.143715481597404e-06, "Full-pretrain/Loss": 1.9235209226608276, "Full-pretrain/Loss (Raw)": 1.9980003833770752, "Full-pretrain/Step": 7427, "Full-pretrain/Step Time": 17.639976672828197} +{"Full-pretrain/Learning Rate": 6.138141636840922e-06, "Full-pretrain/Loss": 1.9216842651367188, "Full-pretrain/Loss (Raw)": 1.917697787284851, "Full-pretrain/Step": 7428, "Full-pretrain/Step Time": 17.637829296290874} +{"Full-pretrain/Learning Rate": 6.132569967793181e-06, "Full-pretrain/Loss": 1.932253122329712, "Full-pretrain/Loss (Raw)": 2.114048957824707, "Full-pretrain/Step": 7429, "Full-pretrain/Step Time": 17.642659524455667} +{"Full-pretrain/Learning Rate": 6.127000475096856e-06, "Full-pretrain/Loss": 1.9231152534484863, "Full-pretrain/Loss (Raw)": 1.7751333713531494, "Full-pretrain/Step": 7430, "Full-pretrain/Step Time": 17.63755924999714} +{"Full-pretrain/Learning Rate": 6.121433159394394e-06, "Full-pretrain/Loss": 1.9240813255310059, "Full-pretrain/Loss (Raw)": 1.9070463180541992, "Full-pretrain/Step": 7431, "Full-pretrain/Step Time": 17.640262538567185} +{"Full-pretrain/Learning Rate": 6.115868021327981e-06, "Full-pretrain/Loss": 1.9256376028060913, "Full-pretrain/Loss (Raw)": 1.9041353464126587, "Full-pretrain/Step": 7432, "Full-pretrain/Step Time": 17.642285408452153} +{"Full-pretrain/Learning Rate": 6.1103050615395644e-06, "Full-pretrain/Loss": 1.9169501066207886, "Full-pretrain/Loss (Raw)": 1.9580360651016235, "Full-pretrain/Step": 7433, "Full-pretrain/Step Time": 17.65092097967863} +{"Full-pretrain/Learning Rate": 6.104744280670813e-06, "Full-pretrain/Loss": 1.9291527271270752, "Full-pretrain/Loss (Raw)": 2.1534461975097656, "Full-pretrain/Step": 7434, "Full-pretrain/Step Time": 17.649830488488078} +{"Full-pretrain/Learning Rate": 6.099185679363176e-06, "Full-pretrain/Loss": 1.9197688102722168, "Full-pretrain/Loss (Raw)": 1.8078382015228271, "Full-pretrain/Step": 7435, "Full-pretrain/Step Time": 17.64876239746809} +{"Full-pretrain/Learning Rate": 6.093629258257821e-06, "Full-pretrain/Loss": 1.9224127531051636, "Full-pretrain/Loss (Raw)": 2.0218608379364014, "Full-pretrain/Step": 7436, "Full-pretrain/Step Time": 17.651404980570078} +{"Full-pretrain/Learning Rate": 6.0880750179956895e-06, "Full-pretrain/Loss": 1.9323008060455322, "Full-pretrain/Loss (Raw)": 2.05729341506958, "Full-pretrain/Step": 7437, "Full-pretrain/Step Time": 17.652428574860096} +{"Full-pretrain/Learning Rate": 6.082522959217454e-06, "Full-pretrain/Loss": 1.9279987812042236, "Full-pretrain/Loss (Raw)": 1.8961697816848755, "Full-pretrain/Step": 7438, "Full-pretrain/Step Time": 17.65584892220795} +{"Full-pretrain/Learning Rate": 6.0769730825635505e-06, "Full-pretrain/Loss": 1.9338011741638184, "Full-pretrain/Loss (Raw)": 1.9913530349731445, "Full-pretrain/Step": 7439, "Full-pretrain/Step Time": 17.650632239878178} +{"Full-pretrain/Learning Rate": 6.07142538867416e-06, "Full-pretrain/Loss": 1.9336669445037842, "Full-pretrain/Loss (Raw)": 1.9495418071746826, "Full-pretrain/Step": 7440, "Full-pretrain/Step Time": 17.64952552318573} +{"Full-pretrain/Learning Rate": 6.065879878189187e-06, "Full-pretrain/Loss": 1.9266619682312012, "Full-pretrain/Loss (Raw)": 1.7423077821731567, "Full-pretrain/Step": 7441, "Full-pretrain/Step Time": 17.65732621960342} +{"Full-pretrain/Learning Rate": 6.060336551748319e-06, "Full-pretrain/Loss": 1.910157561302185, "Full-pretrain/Loss (Raw)": 1.6133767366409302, "Full-pretrain/Step": 7442, "Full-pretrain/Step Time": 17.656605683267117} +{"Full-pretrain/Learning Rate": 6.054795409990974e-06, "Full-pretrain/Loss": 1.9174813032150269, "Full-pretrain/Loss (Raw)": 2.2094669342041016, "Full-pretrain/Step": 7443, "Full-pretrain/Step Time": 17.6521626599133} +{"Full-pretrain/Learning Rate": 6.04925645355632e-06, "Full-pretrain/Loss": 1.916349172592163, "Full-pretrain/Loss (Raw)": 1.9572609663009644, "Full-pretrain/Step": 7444, "Full-pretrain/Step Time": 17.649997878819704} +{"Full-pretrain/Learning Rate": 6.043719683083282e-06, "Full-pretrain/Loss": 1.913132667541504, "Full-pretrain/Loss (Raw)": 1.8002026081085205, "Full-pretrain/Step": 7445, "Full-pretrain/Step Time": 17.64687499590218} +{"Full-pretrain/Learning Rate": 6.038185099210511e-06, "Full-pretrain/Loss": 1.9237043857574463, "Full-pretrain/Loss (Raw)": 2.335057020187378, "Full-pretrain/Step": 7446, "Full-pretrain/Step Time": 17.647101124748588} +{"Full-pretrain/Learning Rate": 6.032652702576424e-06, "Full-pretrain/Loss": 1.92428457736969, "Full-pretrain/Loss (Raw)": 1.8413007259368896, "Full-pretrain/Step": 7447, "Full-pretrain/Step Time": 17.646121514961123} +{"Full-pretrain/Learning Rate": 6.027122493819182e-06, "Full-pretrain/Loss": 1.9296177625656128, "Full-pretrain/Loss (Raw)": 1.8939160108566284, "Full-pretrain/Step": 7448, "Full-pretrain/Step Time": 17.645852575078607} +{"Full-pretrain/Learning Rate": 6.0215944735767e-06, "Full-pretrain/Loss": 1.925363540649414, "Full-pretrain/Loss (Raw)": 1.9531404972076416, "Full-pretrain/Step": 7449, "Full-pretrain/Step Time": 17.64821496233344} +{"Full-pretrain/Learning Rate": 6.016068642486619e-06, "Full-pretrain/Loss": 1.9278900623321533, "Full-pretrain/Loss (Raw)": 1.9606420993804932, "Full-pretrain/Step": 7450, "Full-pretrain/Step Time": 17.64791789278388} +{"Full-pretrain/Learning Rate": 6.010545001186354e-06, "Full-pretrain/Loss": 1.9385825395584106, "Full-pretrain/Loss (Raw)": 1.9343348741531372, "Full-pretrain/Step": 7451, "Full-pretrain/Step Time": 17.650086661800742} +{"Full-pretrain/Learning Rate": 6.005023550313043e-06, "Full-pretrain/Loss": 1.9334776401519775, "Full-pretrain/Loss (Raw)": 1.9761247634887695, "Full-pretrain/Step": 7452, "Full-pretrain/Step Time": 17.65121318027377} +{"Full-pretrain/Learning Rate": 5.999504290503593e-06, "Full-pretrain/Loss": 1.9244951009750366, "Full-pretrain/Loss (Raw)": 1.7592344284057617, "Full-pretrain/Step": 7453, "Full-pretrain/Step Time": 17.656977865844965} +{"Full-pretrain/Learning Rate": 5.9939872223946455e-06, "Full-pretrain/Loss": 1.9286129474639893, "Full-pretrain/Loss (Raw)": 1.8779903650283813, "Full-pretrain/Step": 7454, "Full-pretrain/Step Time": 17.66080266982317} +{"Full-pretrain/Learning Rate": 5.988472346622589e-06, "Full-pretrain/Loss": 1.9237664937973022, "Full-pretrain/Loss (Raw)": 1.9840940237045288, "Full-pretrain/Step": 7455, "Full-pretrain/Step Time": 17.66020887903869} +{"Full-pretrain/Learning Rate": 5.982959663823576e-06, "Full-pretrain/Loss": 1.938288688659668, "Full-pretrain/Loss (Raw)": 1.967790126800537, "Full-pretrain/Step": 7456, "Full-pretrain/Step Time": 17.655335690826178} +{"Full-pretrain/Learning Rate": 5.977449174633476e-06, "Full-pretrain/Loss": 1.9280259609222412, "Full-pretrain/Loss (Raw)": 1.559382438659668, "Full-pretrain/Step": 7457, "Full-pretrain/Step Time": 17.658900065347552} +{"Full-pretrain/Learning Rate": 5.971940879687929e-06, "Full-pretrain/Loss": 1.9309518337249756, "Full-pretrain/Loss (Raw)": 1.973235011100769, "Full-pretrain/Step": 7458, "Full-pretrain/Step Time": 17.6628990881145} +{"Full-pretrain/Learning Rate": 5.966434779622313e-06, "Full-pretrain/Loss": 1.9318615198135376, "Full-pretrain/Loss (Raw)": 2.027109146118164, "Full-pretrain/Step": 7459, "Full-pretrain/Step Time": 17.660531179979444} +{"Full-pretrain/Learning Rate": 5.9609308750717575e-06, "Full-pretrain/Loss": 1.9326250553131104, "Full-pretrain/Loss (Raw)": 1.9421300888061523, "Full-pretrain/Step": 7460, "Full-pretrain/Step Time": 17.66204447299242} +{"Full-pretrain/Learning Rate": 5.95542916667114e-06, "Full-pretrain/Loss": 1.9281526803970337, "Full-pretrain/Loss (Raw)": 1.9709339141845703, "Full-pretrain/Step": 7461, "Full-pretrain/Step Time": 17.658951027318835} +{"Full-pretrain/Learning Rate": 5.94992965505507e-06, "Full-pretrain/Loss": 1.9346811771392822, "Full-pretrain/Loss (Raw)": 1.9840432405471802, "Full-pretrain/Step": 7462, "Full-pretrain/Step Time": 17.664418837055564} +{"Full-pretrain/Learning Rate": 5.944432340857919e-06, "Full-pretrain/Loss": 1.931627631187439, "Full-pretrain/Loss (Raw)": 1.809334635734558, "Full-pretrain/Step": 7463, "Full-pretrain/Step Time": 17.664284024387598} +{"Full-pretrain/Learning Rate": 5.9389372247138e-06, "Full-pretrain/Loss": 1.9262913465499878, "Full-pretrain/Loss (Raw)": 1.7333757877349854, "Full-pretrain/Step": 7464, "Full-pretrain/Step Time": 17.66191458143294} +{"Full-pretrain/Learning Rate": 5.9334443072565745e-06, "Full-pretrain/Loss": 1.9326980113983154, "Full-pretrain/Loss (Raw)": 2.1630516052246094, "Full-pretrain/Step": 7465, "Full-pretrain/Step Time": 17.666849406436086} +{"Full-pretrain/Learning Rate": 5.927953589119856e-06, "Full-pretrain/Loss": 1.9273455142974854, "Full-pretrain/Loss (Raw)": 1.9821672439575195, "Full-pretrain/Step": 7466, "Full-pretrain/Step Time": 17.665656462311745} +{"Full-pretrain/Learning Rate": 5.92246507093698e-06, "Full-pretrain/Loss": 1.9357125759124756, "Full-pretrain/Loss (Raw)": 2.0755810737609863, "Full-pretrain/Step": 7467, "Full-pretrain/Step Time": 17.665963854640722} +{"Full-pretrain/Learning Rate": 5.916978753341063e-06, "Full-pretrain/Loss": 1.9253461360931396, "Full-pretrain/Loss (Raw)": 1.6901353597640991, "Full-pretrain/Step": 7468, "Full-pretrain/Step Time": 17.66361214220524} +{"Full-pretrain/Learning Rate": 5.911494636964931e-06, "Full-pretrain/Loss": 1.9267632961273193, "Full-pretrain/Loss (Raw)": 2.1026415824890137, "Full-pretrain/Step": 7469, "Full-pretrain/Step Time": 17.660296581685543} +{"Full-pretrain/Learning Rate": 5.906012722441184e-06, "Full-pretrain/Loss": 1.9320173263549805, "Full-pretrain/Loss (Raw)": 2.0643019676208496, "Full-pretrain/Step": 7470, "Full-pretrain/Step Time": 17.660190863534808} +{"Full-pretrain/Learning Rate": 5.900533010402168e-06, "Full-pretrain/Loss": 1.9296215772628784, "Full-pretrain/Loss (Raw)": 1.9146859645843506, "Full-pretrain/Step": 7471, "Full-pretrain/Step Time": 17.660873591899872} +{"Full-pretrain/Learning Rate": 5.895055501479952e-06, "Full-pretrain/Loss": 1.9305137395858765, "Full-pretrain/Loss (Raw)": 1.9780919551849365, "Full-pretrain/Step": 7472, "Full-pretrain/Step Time": 17.6597040258348} +{"Full-pretrain/Learning Rate": 5.889580196306366e-06, "Full-pretrain/Loss": 1.9401230812072754, "Full-pretrain/Loss (Raw)": 2.04980206489563, "Full-pretrain/Step": 7473, "Full-pretrain/Step Time": 17.663688791915774} +{"Full-pretrain/Learning Rate": 5.884107095512992e-06, "Full-pretrain/Loss": 1.9495471715927124, "Full-pretrain/Loss (Raw)": 1.9149501323699951, "Full-pretrain/Step": 7474, "Full-pretrain/Step Time": 17.665948029607534} +{"Full-pretrain/Learning Rate": 5.878636199731144e-06, "Full-pretrain/Loss": 1.9409983158111572, "Full-pretrain/Loss (Raw)": 1.9359039068222046, "Full-pretrain/Step": 7475, "Full-pretrain/Step Time": 17.661715080961585} +{"Full-pretrain/Learning Rate": 5.873167509591893e-06, "Full-pretrain/Loss": 1.939112901687622, "Full-pretrain/Loss (Raw)": 1.8969268798828125, "Full-pretrain/Step": 7476, "Full-pretrain/Step Time": 17.662994289770722} +{"Full-pretrain/Learning Rate": 5.8677010257260525e-06, "Full-pretrain/Loss": 1.9323668479919434, "Full-pretrain/Loss (Raw)": 1.58432936668396, "Full-pretrain/Step": 7477, "Full-pretrain/Step Time": 17.657597102224827} +{"Full-pretrain/Learning Rate": 5.862236748764169e-06, "Full-pretrain/Loss": 1.9106659889221191, "Full-pretrain/Loss (Raw)": 1.6406282186508179, "Full-pretrain/Step": 7478, "Full-pretrain/Step Time": 17.665112072601914} +{"Full-pretrain/Learning Rate": 5.856774679336552e-06, "Full-pretrain/Loss": 1.9106996059417725, "Full-pretrain/Loss (Raw)": 1.8423783779144287, "Full-pretrain/Step": 7479, "Full-pretrain/Step Time": 17.662708846852183} +{"Full-pretrain/Learning Rate": 5.8513148180732476e-06, "Full-pretrain/Loss": 1.9106611013412476, "Full-pretrain/Loss (Raw)": 1.8926827907562256, "Full-pretrain/Step": 7480, "Full-pretrain/Step Time": 17.659205187112093} +{"Full-pretrain/Learning Rate": 5.845857165604049e-06, "Full-pretrain/Loss": 1.9114925861358643, "Full-pretrain/Loss (Raw)": 1.9797509908676147, "Full-pretrain/Step": 7481, "Full-pretrain/Step Time": 17.65850562788546} +{"Full-pretrain/Learning Rate": 5.840401722558503e-06, "Full-pretrain/Loss": 1.9099020957946777, "Full-pretrain/Loss (Raw)": 1.9097450971603394, "Full-pretrain/Step": 7482, "Full-pretrain/Step Time": 17.66017302684486} +{"Full-pretrain/Learning Rate": 5.834948489565878e-06, "Full-pretrain/Loss": 1.914320945739746, "Full-pretrain/Loss (Raw)": 2.075737476348877, "Full-pretrain/Step": 7483, "Full-pretrain/Step Time": 17.657207638025284} +{"Full-pretrain/Learning Rate": 5.829497467255218e-06, "Full-pretrain/Loss": 1.9113621711730957, "Full-pretrain/Loss (Raw)": 1.8814442157745361, "Full-pretrain/Step": 7484, "Full-pretrain/Step Time": 17.65827484987676} +{"Full-pretrain/Learning Rate": 5.82404865625528e-06, "Full-pretrain/Loss": 1.927936315536499, "Full-pretrain/Loss (Raw)": 2.2896056175231934, "Full-pretrain/Step": 7485, "Full-pretrain/Step Time": 17.65117879398167} +{"Full-pretrain/Learning Rate": 5.818602057194589e-06, "Full-pretrain/Loss": 1.935842752456665, "Full-pretrain/Loss (Raw)": 2.1309962272644043, "Full-pretrain/Step": 7486, "Full-pretrain/Step Time": 17.654066674411297} +{"Full-pretrain/Learning Rate": 5.813157670701419e-06, "Full-pretrain/Loss": 1.9361796379089355, "Full-pretrain/Loss (Raw)": 1.9948757886886597, "Full-pretrain/Step": 7487, "Full-pretrain/Step Time": 17.646956166252494} +{"Full-pretrain/Learning Rate": 5.807715497403762e-06, "Full-pretrain/Loss": 1.93302321434021, "Full-pretrain/Loss (Raw)": 1.866782784461975, "Full-pretrain/Step": 7488, "Full-pretrain/Step Time": 17.648792922496796} +{"Full-pretrain/Learning Rate": 5.802275537929375e-06, "Full-pretrain/Loss": 1.9439595937728882, "Full-pretrain/Loss (Raw)": 1.9093464612960815, "Full-pretrain/Step": 7489, "Full-pretrain/Step Time": 17.641947032883763} +{"Full-pretrain/Learning Rate": 5.79683779290576e-06, "Full-pretrain/Loss": 1.936893105506897, "Full-pretrain/Loss (Raw)": 1.7471076250076294, "Full-pretrain/Step": 7490, "Full-pretrain/Step Time": 17.64232444576919} +{"Full-pretrain/Learning Rate": 5.791402262960158e-06, "Full-pretrain/Loss": 1.916632056236267, "Full-pretrain/Loss (Raw)": 1.3787564039230347, "Full-pretrain/Step": 7491, "Full-pretrain/Step Time": 17.645303204655647} +{"Full-pretrain/Learning Rate": 5.785968948719561e-06, "Full-pretrain/Loss": 1.919393539428711, "Full-pretrain/Loss (Raw)": 2.0304977893829346, "Full-pretrain/Step": 7492, "Full-pretrain/Step Time": 17.63936947658658} +{"Full-pretrain/Learning Rate": 5.780537850810686e-06, "Full-pretrain/Loss": 1.930738925933838, "Full-pretrain/Loss (Raw)": 2.333986282348633, "Full-pretrain/Step": 7493, "Full-pretrain/Step Time": 17.636753000319004} +{"Full-pretrain/Learning Rate": 5.775108969860016e-06, "Full-pretrain/Loss": 1.922790765762329, "Full-pretrain/Loss (Raw)": 1.7297052145004272, "Full-pretrain/Step": 7494, "Full-pretrain/Step Time": 17.634772760793567} +{"Full-pretrain/Learning Rate": 5.76968230649377e-06, "Full-pretrain/Loss": 1.927194595336914, "Full-pretrain/Loss (Raw)": 1.9502516984939575, "Full-pretrain/Step": 7495, "Full-pretrain/Step Time": 17.635979548096657} +{"Full-pretrain/Learning Rate": 5.764257861337913e-06, "Full-pretrain/Loss": 1.9302396774291992, "Full-pretrain/Loss (Raw)": 1.8308236598968506, "Full-pretrain/Step": 7496, "Full-pretrain/Step Time": 17.627313148230314} +{"Full-pretrain/Learning Rate": 5.758835635018151e-06, "Full-pretrain/Loss": 1.9275617599487305, "Full-pretrain/Loss (Raw)": 2.0773582458496094, "Full-pretrain/Step": 7497, "Full-pretrain/Step Time": 17.623210914433002} +{"Full-pretrain/Learning Rate": 5.753415628159945e-06, "Full-pretrain/Loss": 1.9217872619628906, "Full-pretrain/Loss (Raw)": 1.797383427619934, "Full-pretrain/Step": 7498, "Full-pretrain/Step Time": 17.622476547956467} +{"Full-pretrain/Learning Rate": 5.747997841388472e-06, "Full-pretrain/Loss": 1.9112727642059326, "Full-pretrain/Loss (Raw)": 1.7391109466552734, "Full-pretrain/Step": 7499, "Full-pretrain/Step Time": 17.621030757203698} +{"Full-pretrain/Learning Rate": 5.742582275328692e-06, "Full-pretrain/Loss": 1.9226878881454468, "Full-pretrain/Loss (Raw)": 2.055424213409424, "Full-pretrain/Step": 7500, "Full-pretrain/Step Time": 17.619272420182824} +{"Full-pretrain/Learning Rate": 5.737168930605272e-06, "Full-pretrain/Loss": 1.9240320920944214, "Full-pretrain/Loss (Raw)": 2.1456549167633057, "Full-pretrain/Step": 7501, "Full-pretrain/Step Time": 17.619876036420465} +{"Full-pretrain/Learning Rate": 5.731757807842647e-06, "Full-pretrain/Loss": 1.9144171476364136, "Full-pretrain/Loss (Raw)": 1.7566239833831787, "Full-pretrain/Step": 7502, "Full-pretrain/Step Time": 17.62222722545266} +{"Full-pretrain/Learning Rate": 5.726348907664994e-06, "Full-pretrain/Loss": 1.9087655544281006, "Full-pretrain/Loss (Raw)": 1.7338333129882812, "Full-pretrain/Step": 7503, "Full-pretrain/Step Time": 17.622671572491527} +{"Full-pretrain/Learning Rate": 5.7209422306962135e-06, "Full-pretrain/Loss": 1.9014639854431152, "Full-pretrain/Loss (Raw)": 1.7444413900375366, "Full-pretrain/Step": 7504, "Full-pretrain/Step Time": 17.62181863747537} +{"Full-pretrain/Learning Rate": 5.715537777559971e-06, "Full-pretrain/Loss": 1.9008492231369019, "Full-pretrain/Loss (Raw)": 2.030130624771118, "Full-pretrain/Step": 7505, "Full-pretrain/Step Time": 17.615835551172495} +{"Full-pretrain/Learning Rate": 5.7101355488796695e-06, "Full-pretrain/Loss": 1.9055322408676147, "Full-pretrain/Loss (Raw)": 2.064807415008545, "Full-pretrain/Step": 7506, "Full-pretrain/Step Time": 17.61452518031001} +{"Full-pretrain/Learning Rate": 5.704735545278453e-06, "Full-pretrain/Loss": 1.9091665744781494, "Full-pretrain/Loss (Raw)": 2.0521998405456543, "Full-pretrain/Step": 7507, "Full-pretrain/Step Time": 17.611655885353684} +{"Full-pretrain/Learning Rate": 5.69933776737922e-06, "Full-pretrain/Loss": 1.9116644859313965, "Full-pretrain/Loss (Raw)": 1.9768590927124023, "Full-pretrain/Step": 7508, "Full-pretrain/Step Time": 17.613334538415074} +{"Full-pretrain/Learning Rate": 5.693942215804585e-06, "Full-pretrain/Loss": 1.9223518371582031, "Full-pretrain/Loss (Raw)": 1.9263262748718262, "Full-pretrain/Step": 7509, "Full-pretrain/Step Time": 17.606857907027006} +{"Full-pretrain/Learning Rate": 5.6885488911769285e-06, "Full-pretrain/Loss": 1.935044527053833, "Full-pretrain/Loss (Raw)": 2.0467963218688965, "Full-pretrain/Step": 7510, "Full-pretrain/Step Time": 17.60464010387659} +{"Full-pretrain/Learning Rate": 5.683157794118371e-06, "Full-pretrain/Loss": 1.9312026500701904, "Full-pretrain/Loss (Raw)": 1.7194364070892334, "Full-pretrain/Step": 7511, "Full-pretrain/Step Time": 17.60345585271716} +{"Full-pretrain/Learning Rate": 5.677768925250776e-06, "Full-pretrain/Loss": 1.9307217597961426, "Full-pretrain/Loss (Raw)": 1.8772956132888794, "Full-pretrain/Step": 7512, "Full-pretrain/Step Time": 17.605875423178077} +{"Full-pretrain/Learning Rate": 5.672382285195751e-06, "Full-pretrain/Loss": 1.933184266090393, "Full-pretrain/Loss (Raw)": 2.0585498809814453, "Full-pretrain/Step": 7513, "Full-pretrain/Step Time": 17.604884408414364} +{"Full-pretrain/Learning Rate": 5.666997874574629e-06, "Full-pretrain/Loss": 1.9400118589401245, "Full-pretrain/Loss (Raw)": 2.128227949142456, "Full-pretrain/Step": 7514, "Full-pretrain/Step Time": 17.604952968657017} +{"Full-pretrain/Learning Rate": 5.66161569400851e-06, "Full-pretrain/Loss": 1.935608148574829, "Full-pretrain/Loss (Raw)": 1.9348236322402954, "Full-pretrain/Step": 7515, "Full-pretrain/Step Time": 17.5999716501683} +{"Full-pretrain/Learning Rate": 5.656235744118224e-06, "Full-pretrain/Loss": 1.9367263317108154, "Full-pretrain/Loss (Raw)": 1.9172242879867554, "Full-pretrain/Step": 7516, "Full-pretrain/Step Time": 17.599572841078043} +{"Full-pretrain/Learning Rate": 5.6508580255243524e-06, "Full-pretrain/Loss": 1.929602026939392, "Full-pretrain/Loss (Raw)": 2.06162691116333, "Full-pretrain/Step": 7517, "Full-pretrain/Step Time": 17.60010644979775} +{"Full-pretrain/Learning Rate": 5.645482538847202e-06, "Full-pretrain/Loss": 1.9130637645721436, "Full-pretrain/Loss (Raw)": 1.6017732620239258, "Full-pretrain/Step": 7518, "Full-pretrain/Step Time": 17.60119822062552} +{"Full-pretrain/Learning Rate": 5.640109284706849e-06, "Full-pretrain/Loss": 1.912761926651001, "Full-pretrain/Loss (Raw)": 1.9852172136306763, "Full-pretrain/Step": 7519, "Full-pretrain/Step Time": 17.599075485020876} +{"Full-pretrain/Learning Rate": 5.634738263723075e-06, "Full-pretrain/Loss": 1.917602777481079, "Full-pretrain/Loss (Raw)": 2.0216894149780273, "Full-pretrain/Step": 7520, "Full-pretrain/Step Time": 17.59635105729103} +{"Full-pretrain/Learning Rate": 5.6293694765154395e-06, "Full-pretrain/Loss": 1.9165602922439575, "Full-pretrain/Loss (Raw)": 1.8759872913360596, "Full-pretrain/Step": 7521, "Full-pretrain/Step Time": 17.59806029126048} +{"Full-pretrain/Learning Rate": 5.624002923703226e-06, "Full-pretrain/Loss": 1.9191235303878784, "Full-pretrain/Loss (Raw)": 1.829131007194519, "Full-pretrain/Step": 7522, "Full-pretrain/Step Time": 17.599681930616498} +{"Full-pretrain/Learning Rate": 5.618638605905469e-06, "Full-pretrain/Loss": 1.9364850521087646, "Full-pretrain/Loss (Raw)": 1.934326410293579, "Full-pretrain/Step": 7523, "Full-pretrain/Step Time": 17.60263194143772} +{"Full-pretrain/Learning Rate": 5.61327652374094e-06, "Full-pretrain/Loss": 1.9378970861434937, "Full-pretrain/Loss (Raw)": 2.0756800174713135, "Full-pretrain/Step": 7524, "Full-pretrain/Step Time": 17.59862119704485} +{"Full-pretrain/Learning Rate": 5.607916677828149e-06, "Full-pretrain/Loss": 1.9301810264587402, "Full-pretrain/Loss (Raw)": 2.087074041366577, "Full-pretrain/Step": 7525, "Full-pretrain/Step Time": 17.60262650065124} +{"Full-pretrain/Learning Rate": 5.602559068785352e-06, "Full-pretrain/Loss": 1.9375463724136353, "Full-pretrain/Loss (Raw)": 1.9653955698013306, "Full-pretrain/Step": 7526, "Full-pretrain/Step Time": 17.598140131682158} +{"Full-pretrain/Learning Rate": 5.597203697230549e-06, "Full-pretrain/Loss": 1.9298014640808105, "Full-pretrain/Loss (Raw)": 1.7024145126342773, "Full-pretrain/Step": 7527, "Full-pretrain/Step Time": 17.599596494808793} +{"Full-pretrain/Learning Rate": 5.591850563781481e-06, "Full-pretrain/Loss": 1.9348167181015015, "Full-pretrain/Loss (Raw)": 1.9913084506988525, "Full-pretrain/Step": 7528, "Full-pretrain/Step Time": 17.596789026632905} +{"Full-pretrain/Learning Rate": 5.586499669055637e-06, "Full-pretrain/Loss": 1.9339821338653564, "Full-pretrain/Loss (Raw)": 2.050652503967285, "Full-pretrain/Step": 7529, "Full-pretrain/Step Time": 17.599846756085753} +{"Full-pretrain/Learning Rate": 5.581151013670227e-06, "Full-pretrain/Loss": 1.926076889038086, "Full-pretrain/Loss (Raw)": 1.5444185733795166, "Full-pretrain/Step": 7530, "Full-pretrain/Step Time": 17.596066566184163} +{"Full-pretrain/Learning Rate": 5.5758045982422235e-06, "Full-pretrain/Loss": 1.933241605758667, "Full-pretrain/Loss (Raw)": 1.968380093574524, "Full-pretrain/Step": 7531, "Full-pretrain/Step Time": 17.59755554422736} +{"Full-pretrain/Learning Rate": 5.570460423388332e-06, "Full-pretrain/Loss": 1.9319781064987183, "Full-pretrain/Loss (Raw)": 2.0149927139282227, "Full-pretrain/Step": 7532, "Full-pretrain/Step Time": 17.593161709606647} +{"Full-pretrain/Learning Rate": 5.565118489725013e-06, "Full-pretrain/Loss": 1.913581132888794, "Full-pretrain/Loss (Raw)": 1.5569498538970947, "Full-pretrain/Step": 7533, "Full-pretrain/Step Time": 17.598496543243527} +{"Full-pretrain/Learning Rate": 5.559778797868437e-06, "Full-pretrain/Loss": 1.926311731338501, "Full-pretrain/Loss (Raw)": 2.16400408744812, "Full-pretrain/Step": 7534, "Full-pretrain/Step Time": 17.596186749637127} +{"Full-pretrain/Learning Rate": 5.554441348434553e-06, "Full-pretrain/Loss": 1.9311103820800781, "Full-pretrain/Loss (Raw)": 1.88739013671875, "Full-pretrain/Step": 7535, "Full-pretrain/Step Time": 17.59987752698362} +{"Full-pretrain/Learning Rate": 5.549106142039018e-06, "Full-pretrain/Loss": 1.9358887672424316, "Full-pretrain/Loss (Raw)": 1.8973493576049805, "Full-pretrain/Step": 7536, "Full-pretrain/Step Time": 17.59812181815505} +{"Full-pretrain/Learning Rate": 5.543773179297254e-06, "Full-pretrain/Loss": 1.9287093877792358, "Full-pretrain/Loss (Raw)": 1.800392985343933, "Full-pretrain/Step": 7537, "Full-pretrain/Step Time": 17.601089423522353} +{"Full-pretrain/Learning Rate": 5.538442460824417e-06, "Full-pretrain/Loss": 1.9056622982025146, "Full-pretrain/Loss (Raw)": 1.3273017406463623, "Full-pretrain/Step": 7538, "Full-pretrain/Step Time": 17.60258740745485} +{"Full-pretrain/Learning Rate": 5.5331139872354e-06, "Full-pretrain/Loss": 1.9139958620071411, "Full-pretrain/Loss (Raw)": 2.318871021270752, "Full-pretrain/Step": 7539, "Full-pretrain/Step Time": 17.6060229819268} +{"Full-pretrain/Learning Rate": 5.527787759144854e-06, "Full-pretrain/Loss": 1.914461612701416, "Full-pretrain/Loss (Raw)": 1.9917649030685425, "Full-pretrain/Step": 7540, "Full-pretrain/Step Time": 17.60641978122294} +{"Full-pretrain/Learning Rate": 5.5224637771671385e-06, "Full-pretrain/Loss": 1.8996086120605469, "Full-pretrain/Loss (Raw)": 1.4510310888290405, "Full-pretrain/Step": 7541, "Full-pretrain/Step Time": 17.606819603592157} +{"Full-pretrain/Learning Rate": 5.517142041916382e-06, "Full-pretrain/Loss": 1.9018545150756836, "Full-pretrain/Loss (Raw)": 2.1186602115631104, "Full-pretrain/Step": 7542, "Full-pretrain/Step Time": 17.608721766620874} +{"Full-pretrain/Learning Rate": 5.511822554006443e-06, "Full-pretrain/Loss": 1.9057393074035645, "Full-pretrain/Loss (Raw)": 1.8437504768371582, "Full-pretrain/Step": 7543, "Full-pretrain/Step Time": 17.60727733746171} +{"Full-pretrain/Learning Rate": 5.506505314050925e-06, "Full-pretrain/Loss": 1.9048101902008057, "Full-pretrain/Loss (Raw)": 1.8475675582885742, "Full-pretrain/Step": 7544, "Full-pretrain/Step Time": 17.611932203173637} +{"Full-pretrain/Learning Rate": 5.5011903226631745e-06, "Full-pretrain/Loss": 1.884009838104248, "Full-pretrain/Loss (Raw)": 1.3929369449615479, "Full-pretrain/Step": 7545, "Full-pretrain/Step Time": 17.611441545188427} +{"Full-pretrain/Learning Rate": 5.4958775804562625e-06, "Full-pretrain/Loss": 1.879088282585144, "Full-pretrain/Loss (Raw)": 1.970739722251892, "Full-pretrain/Step": 7546, "Full-pretrain/Step Time": 17.604959312826395} +{"Full-pretrain/Learning Rate": 5.490567088043016e-06, "Full-pretrain/Loss": 1.874450922012329, "Full-pretrain/Loss (Raw)": 1.786426067352295, "Full-pretrain/Step": 7547, "Full-pretrain/Step Time": 17.602270003408194} +{"Full-pretrain/Learning Rate": 5.485258846036001e-06, "Full-pretrain/Loss": 1.8507099151611328, "Full-pretrain/Loss (Raw)": 1.1575154066085815, "Full-pretrain/Step": 7548, "Full-pretrain/Step Time": 17.59670710377395} +{"Full-pretrain/Learning Rate": 5.479952855047527e-06, "Full-pretrain/Loss": 1.8442997932434082, "Full-pretrain/Loss (Raw)": 1.856501579284668, "Full-pretrain/Step": 7549, "Full-pretrain/Step Time": 17.602125320583582} +{"Full-pretrain/Learning Rate": 5.4746491156896225e-06, "Full-pretrain/Loss": 1.8591409921646118, "Full-pretrain/Loss (Raw)": 2.0766916275024414, "Full-pretrain/Step": 7550, "Full-pretrain/Step Time": 17.60228657722473} +{"Full-pretrain/Learning Rate": 5.4693476285740815e-06, "Full-pretrain/Loss": 1.8555059432983398, "Full-pretrain/Loss (Raw)": 1.868896722793579, "Full-pretrain/Step": 7551, "Full-pretrain/Step Time": 17.60020143724978} +{"Full-pretrain/Learning Rate": 5.464048394312438e-06, "Full-pretrain/Loss": 1.8331868648529053, "Full-pretrain/Loss (Raw)": 1.307478904724121, "Full-pretrain/Step": 7552, "Full-pretrain/Step Time": 17.598260270431638} +{"Full-pretrain/Learning Rate": 5.458751413515936e-06, "Full-pretrain/Loss": 1.834623098373413, "Full-pretrain/Loss (Raw)": 1.921947956085205, "Full-pretrain/Step": 7553, "Full-pretrain/Step Time": 17.593231549486518} +{"Full-pretrain/Learning Rate": 5.453456686795591e-06, "Full-pretrain/Loss": 1.836746335029602, "Full-pretrain/Loss (Raw)": 1.8970692157745361, "Full-pretrain/Step": 7554, "Full-pretrain/Step Time": 17.595420813187957} +{"Full-pretrain/Learning Rate": 5.448164214762158e-06, "Full-pretrain/Loss": 1.8381937742233276, "Full-pretrain/Loss (Raw)": 1.9806442260742188, "Full-pretrain/Step": 7555, "Full-pretrain/Step Time": 17.594259141013026} +{"Full-pretrain/Learning Rate": 5.442873998026102e-06, "Full-pretrain/Loss": 1.8351311683654785, "Full-pretrain/Loss (Raw)": 1.9776806831359863, "Full-pretrain/Step": 7556, "Full-pretrain/Step Time": 17.59978210553527} +{"Full-pretrain/Learning Rate": 5.437586037197659e-06, "Full-pretrain/Loss": 1.8297619819641113, "Full-pretrain/Loss (Raw)": 1.9152599573135376, "Full-pretrain/Step": 7557, "Full-pretrain/Step Time": 17.600411830469966} +{"Full-pretrain/Learning Rate": 5.432300332886791e-06, "Full-pretrain/Loss": 1.830716609954834, "Full-pretrain/Loss (Raw)": 1.99594247341156, "Full-pretrain/Step": 7558, "Full-pretrain/Step Time": 17.60406201519072} +{"Full-pretrain/Learning Rate": 5.427016885703207e-06, "Full-pretrain/Loss": 1.8413573503494263, "Full-pretrain/Loss (Raw)": 2.0429153442382812, "Full-pretrain/Step": 7559, "Full-pretrain/Step Time": 17.600453600287437} +{"Full-pretrain/Learning Rate": 5.421735696256342e-06, "Full-pretrain/Loss": 1.8392795324325562, "Full-pretrain/Loss (Raw)": 1.9248204231262207, "Full-pretrain/Step": 7560, "Full-pretrain/Step Time": 17.60141179896891} +{"Full-pretrain/Learning Rate": 5.416456765155392e-06, "Full-pretrain/Loss": 1.8300926685333252, "Full-pretrain/Loss (Raw)": 1.7566745281219482, "Full-pretrain/Step": 7561, "Full-pretrain/Step Time": 17.589727295562625} +{"Full-pretrain/Learning Rate": 5.411180093009266e-06, "Full-pretrain/Loss": 1.8424904346466064, "Full-pretrain/Loss (Raw)": 1.941148042678833, "Full-pretrain/Step": 7562, "Full-pretrain/Step Time": 17.59215690009296} +{"Full-pretrain/Learning Rate": 5.4059056804266315e-06, "Full-pretrain/Loss": 1.8427155017852783, "Full-pretrain/Loss (Raw)": 1.9755805730819702, "Full-pretrain/Step": 7563, "Full-pretrain/Step Time": 17.589609310030937} +{"Full-pretrain/Learning Rate": 5.400633528015891e-06, "Full-pretrain/Loss": 1.8338829278945923, "Full-pretrain/Loss (Raw)": 1.7323487997055054, "Full-pretrain/Step": 7564, "Full-pretrain/Step Time": 17.59041707403958} +{"Full-pretrain/Learning Rate": 5.395363636385186e-06, "Full-pretrain/Loss": 1.8552277088165283, "Full-pretrain/Loss (Raw)": 2.2399823665618896, "Full-pretrain/Step": 7565, "Full-pretrain/Step Time": 17.588671462610364} +{"Full-pretrain/Learning Rate": 5.390096006142404e-06, "Full-pretrain/Loss": 1.842188835144043, "Full-pretrain/Loss (Raw)": 1.746759057044983, "Full-pretrain/Step": 7566, "Full-pretrain/Step Time": 17.582875851541758} +{"Full-pretrain/Learning Rate": 5.384830637895147e-06, "Full-pretrain/Loss": 1.8432798385620117, "Full-pretrain/Loss (Raw)": 1.9223055839538574, "Full-pretrain/Step": 7567, "Full-pretrain/Step Time": 17.591905338689685} +{"Full-pretrain/Learning Rate": 5.37956753225079e-06, "Full-pretrain/Loss": 1.848501205444336, "Full-pretrain/Loss (Raw)": 2.0644335746765137, "Full-pretrain/Step": 7568, "Full-pretrain/Step Time": 17.58921428769827} +{"Full-pretrain/Learning Rate": 5.374306689816419e-06, "Full-pretrain/Loss": 1.8530216217041016, "Full-pretrain/Loss (Raw)": 1.9450459480285645, "Full-pretrain/Step": 7569, "Full-pretrain/Step Time": 17.5859984010458} +{"Full-pretrain/Learning Rate": 5.369048111198871e-06, "Full-pretrain/Loss": 1.88446044921875, "Full-pretrain/Loss (Raw)": 2.333343029022217, "Full-pretrain/Step": 7570, "Full-pretrain/Step Time": 17.57635961472988} +{"Full-pretrain/Learning Rate": 5.363791797004733e-06, "Full-pretrain/Loss": 1.8713483810424805, "Full-pretrain/Loss (Raw)": 1.8992860317230225, "Full-pretrain/Step": 7571, "Full-pretrain/Step Time": 17.58248914964497} +{"Full-pretrain/Learning Rate": 5.3585377478403035e-06, "Full-pretrain/Loss": 1.8629869222640991, "Full-pretrain/Loss (Raw)": 1.7241970300674438, "Full-pretrain/Step": 7572, "Full-pretrain/Step Time": 17.58692630380392} +{"Full-pretrain/Learning Rate": 5.353285964311642e-06, "Full-pretrain/Loss": 1.8754502534866333, "Full-pretrain/Loss (Raw)": 1.8498592376708984, "Full-pretrain/Step": 7573, "Full-pretrain/Step Time": 17.584986839443445} +{"Full-pretrain/Learning Rate": 5.34803644702454e-06, "Full-pretrain/Loss": 1.8690613508224487, "Full-pretrain/Loss (Raw)": 1.914214849472046, "Full-pretrain/Step": 7574, "Full-pretrain/Step Time": 17.578751910477877} +{"Full-pretrain/Learning Rate": 5.342789196584527e-06, "Full-pretrain/Loss": 1.8736140727996826, "Full-pretrain/Loss (Raw)": 1.9894397258758545, "Full-pretrain/Step": 7575, "Full-pretrain/Step Time": 17.579842496663332} +{"Full-pretrain/Learning Rate": 5.337544213596873e-06, "Full-pretrain/Loss": 1.870168685913086, "Full-pretrain/Loss (Raw)": 1.7373104095458984, "Full-pretrain/Step": 7576, "Full-pretrain/Step Time": 17.583868766203523} +{"Full-pretrain/Learning Rate": 5.332301498666592e-06, "Full-pretrain/Loss": 1.8894429206848145, "Full-pretrain/Loss (Raw)": 2.009713888168335, "Full-pretrain/Step": 7577, "Full-pretrain/Step Time": 17.58463467285037} +{"Full-pretrain/Learning Rate": 5.327061052398413e-06, "Full-pretrain/Loss": 1.881361484527588, "Full-pretrain/Loss (Raw)": 1.7121353149414062, "Full-pretrain/Step": 7578, "Full-pretrain/Step Time": 17.577274084091187} +{"Full-pretrain/Learning Rate": 5.321822875396829e-06, "Full-pretrain/Loss": 1.886875867843628, "Full-pretrain/Loss (Raw)": 1.9628863334655762, "Full-pretrain/Step": 7579, "Full-pretrain/Step Time": 17.58265700004995} +{"Full-pretrain/Learning Rate": 5.31658696826606e-06, "Full-pretrain/Loss": 1.9171555042266846, "Full-pretrain/Loss (Raw)": 2.1264607906341553, "Full-pretrain/Step": 7580, "Full-pretrain/Step Time": 17.57692636922002} +{"Full-pretrain/Learning Rate": 5.311353331610067e-06, "Full-pretrain/Loss": 1.9149036407470703, "Full-pretrain/Loss (Raw)": 1.784445881843567, "Full-pretrain/Step": 7581, "Full-pretrain/Step Time": 17.580944364890456} +{"Full-pretrain/Learning Rate": 5.306121966032557e-06, "Full-pretrain/Loss": 1.9144879579544067, "Full-pretrain/Loss (Raw)": 2.063387870788574, "Full-pretrain/Step": 7582, "Full-pretrain/Step Time": 17.575236840173602} +{"Full-pretrain/Learning Rate": 5.300892872136947e-06, "Full-pretrain/Loss": 1.921971321105957, "Full-pretrain/Loss (Raw)": 2.1083645820617676, "Full-pretrain/Step": 7583, "Full-pretrain/Step Time": 17.577122988179326} +{"Full-pretrain/Learning Rate": 5.295666050526432e-06, "Full-pretrain/Loss": 1.9449870586395264, "Full-pretrain/Loss (Raw)": 2.043980836868286, "Full-pretrain/Step": 7584, "Full-pretrain/Step Time": 17.581402841955423} +{"Full-pretrain/Learning Rate": 5.290441501803903e-06, "Full-pretrain/Loss": 1.943988561630249, "Full-pretrain/Loss (Raw)": 1.8899956941604614, "Full-pretrain/Step": 7585, "Full-pretrain/Step Time": 17.5796557944268} +{"Full-pretrain/Learning Rate": 5.2852192265720216e-06, "Full-pretrain/Loss": 1.9421498775482178, "Full-pretrain/Loss (Raw)": 1.8382328748703003, "Full-pretrain/Step": 7586, "Full-pretrain/Step Time": 17.58306824043393} +{"Full-pretrain/Learning Rate": 5.279999225433182e-06, "Full-pretrain/Loss": 1.9358669519424438, "Full-pretrain/Loss (Raw)": 1.7795910835266113, "Full-pretrain/Step": 7587, "Full-pretrain/Step Time": 17.58271484822035} +{"Full-pretrain/Learning Rate": 5.274781498989495e-06, "Full-pretrain/Loss": 1.9318755865097046, "Full-pretrain/Loss (Raw)": 1.84995698928833, "Full-pretrain/Step": 7588, "Full-pretrain/Step Time": 17.5792340002954} +{"Full-pretrain/Learning Rate": 5.2695660478428305e-06, "Full-pretrain/Loss": 1.929063081741333, "Full-pretrain/Loss (Raw)": 1.8252594470977783, "Full-pretrain/Step": 7589, "Full-pretrain/Step Time": 17.584243148565292} +{"Full-pretrain/Learning Rate": 5.264352872594786e-06, "Full-pretrain/Loss": 1.9303979873657227, "Full-pretrain/Loss (Raw)": 2.038658618927002, "Full-pretrain/Step": 7590, "Full-pretrain/Step Time": 17.580097971484065} +{"Full-pretrain/Learning Rate": 5.259141973846704e-06, "Full-pretrain/Loss": 1.9232732057571411, "Full-pretrain/Loss (Raw)": 1.814923882484436, "Full-pretrain/Step": 7591, "Full-pretrain/Step Time": 17.578591337427497} +{"Full-pretrain/Learning Rate": 5.253933352199664e-06, "Full-pretrain/Loss": 1.9257745742797852, "Full-pretrain/Loss (Raw)": 2.0048651695251465, "Full-pretrain/Step": 7592, "Full-pretrain/Step Time": 17.582292748615146} +{"Full-pretrain/Learning Rate": 5.248727008254467e-06, "Full-pretrain/Loss": 1.9348552227020264, "Full-pretrain/Loss (Raw)": 2.0472521781921387, "Full-pretrain/Step": 7593, "Full-pretrain/Step Time": 17.579833844676614} +{"Full-pretrain/Learning Rate": 5.243522942611667e-06, "Full-pretrain/Loss": 1.93130624294281, "Full-pretrain/Loss (Raw)": 1.8275814056396484, "Full-pretrain/Step": 7594, "Full-pretrain/Step Time": 17.583497639745474} +{"Full-pretrain/Learning Rate": 5.238321155871554e-06, "Full-pretrain/Loss": 1.926575779914856, "Full-pretrain/Loss (Raw)": 1.8242082595825195, "Full-pretrain/Step": 7595, "Full-pretrain/Step Time": 17.57902473397553} +{"Full-pretrain/Learning Rate": 5.233121648634151e-06, "Full-pretrain/Loss": 1.926497220993042, "Full-pretrain/Loss (Raw)": 1.7298312187194824, "Full-pretrain/Step": 7596, "Full-pretrain/Step Time": 17.580619806423783} +{"Full-pretrain/Learning Rate": 5.2279244214992166e-06, "Full-pretrain/Loss": 1.9272016286849976, "Full-pretrain/Loss (Raw)": 2.2625246047973633, "Full-pretrain/Step": 7597, "Full-pretrain/Step Time": 17.58068692497909} +{"Full-pretrain/Learning Rate": 5.222729475066263e-06, "Full-pretrain/Loss": 1.9325851202011108, "Full-pretrain/Loss (Raw)": 1.9190304279327393, "Full-pretrain/Step": 7598, "Full-pretrain/Step Time": 17.58410370349884} +{"Full-pretrain/Learning Rate": 5.217536809934503e-06, "Full-pretrain/Loss": 1.9338229894638062, "Full-pretrain/Loss (Raw)": 1.9619182348251343, "Full-pretrain/Step": 7599, "Full-pretrain/Step Time": 17.58197768777609} +{"Full-pretrain/Learning Rate": 5.212346426702922e-06, "Full-pretrain/Loss": 1.9233896732330322, "Full-pretrain/Loss (Raw)": 1.73056960105896, "Full-pretrain/Step": 7600, "Full-pretrain/Step Time": 17.584661489352584} +{"Full-pretrain/Learning Rate": 5.207158325970235e-06, "Full-pretrain/Loss": 1.9246991872787476, "Full-pretrain/Loss (Raw)": 1.9869484901428223, "Full-pretrain/Step": 7601, "Full-pretrain/Step Time": 17.581659987568855} +{"Full-pretrain/Learning Rate": 5.201972508334871e-06, "Full-pretrain/Loss": 1.9126224517822266, "Full-pretrain/Loss (Raw)": 1.9468858242034912, "Full-pretrain/Step": 7602, "Full-pretrain/Step Time": 17.586454635486007} +{"Full-pretrain/Learning Rate": 5.196788974395026e-06, "Full-pretrain/Loss": 1.9077274799346924, "Full-pretrain/Loss (Raw)": 1.742646336555481, "Full-pretrain/Step": 7603, "Full-pretrain/Step Time": 17.588847506791353} +{"Full-pretrain/Learning Rate": 5.1916077247486095e-06, "Full-pretrain/Loss": 1.9075062274932861, "Full-pretrain/Loss (Raw)": 1.7171193361282349, "Full-pretrain/Step": 7604, "Full-pretrain/Step Time": 17.58998537622392} +{"Full-pretrain/Learning Rate": 5.186428759993278e-06, "Full-pretrain/Loss": 1.914072036743164, "Full-pretrain/Loss (Raw)": 2.0599660873413086, "Full-pretrain/Step": 7605, "Full-pretrain/Step Time": 17.589571300894022} +{"Full-pretrain/Learning Rate": 5.181252080726429e-06, "Full-pretrain/Loss": 1.923532247543335, "Full-pretrain/Loss (Raw)": 2.2169418334960938, "Full-pretrain/Step": 7606, "Full-pretrain/Step Time": 17.585668589919806} +{"Full-pretrain/Learning Rate": 5.176077687545186e-06, "Full-pretrain/Loss": 1.9211852550506592, "Full-pretrain/Loss (Raw)": 1.914334774017334, "Full-pretrain/Step": 7607, "Full-pretrain/Step Time": 17.588819060474634} +{"Full-pretrain/Learning Rate": 5.1709055810464205e-06, "Full-pretrain/Loss": 1.9277541637420654, "Full-pretrain/Loss (Raw)": 1.9475196599960327, "Full-pretrain/Step": 7608, "Full-pretrain/Step Time": 17.587429786100984} +{"Full-pretrain/Learning Rate": 5.165735761826724e-06, "Full-pretrain/Loss": 1.927929401397705, "Full-pretrain/Loss (Raw)": 2.015320301055908, "Full-pretrain/Step": 7609, "Full-pretrain/Step Time": 17.5923108253628} +{"Full-pretrain/Learning Rate": 5.160568230482435e-06, "Full-pretrain/Loss": 1.9343363046646118, "Full-pretrain/Loss (Raw)": 1.917154312133789, "Full-pretrain/Step": 7610, "Full-pretrain/Step Time": 17.59258677996695} +{"Full-pretrain/Learning Rate": 5.155402987609628e-06, "Full-pretrain/Loss": 1.9307914972305298, "Full-pretrain/Loss (Raw)": 1.8494528532028198, "Full-pretrain/Step": 7611, "Full-pretrain/Step Time": 17.591216761618853} +{"Full-pretrain/Learning Rate": 5.150240033804116e-06, "Full-pretrain/Loss": 1.9348118305206299, "Full-pretrain/Loss (Raw)": 2.255113363265991, "Full-pretrain/Step": 7612, "Full-pretrain/Step Time": 17.592994460836053} +{"Full-pretrain/Learning Rate": 5.145079369661443e-06, "Full-pretrain/Loss": 1.9397850036621094, "Full-pretrain/Loss (Raw)": 1.9435853958129883, "Full-pretrain/Step": 7613, "Full-pretrain/Step Time": 17.597286408767104} +{"Full-pretrain/Learning Rate": 5.139920995776884e-06, "Full-pretrain/Loss": 1.9318130016326904, "Full-pretrain/Loss (Raw)": 1.8082784414291382, "Full-pretrain/Step": 7614, "Full-pretrain/Step Time": 17.591753302142024} +{"Full-pretrain/Learning Rate": 5.134764912745457e-06, "Full-pretrain/Loss": 1.932775616645813, "Full-pretrain/Loss (Raw)": 2.139172077178955, "Full-pretrain/Step": 7615, "Full-pretrain/Step Time": 17.5929071046412} +{"Full-pretrain/Learning Rate": 5.1296111211619146e-06, "Full-pretrain/Loss": 1.9307658672332764, "Full-pretrain/Loss (Raw)": 1.979666829109192, "Full-pretrain/Step": 7616, "Full-pretrain/Step Time": 17.593746587634087} +{"Full-pretrain/Learning Rate": 5.1244596216207555e-06, "Full-pretrain/Loss": 1.930053472518921, "Full-pretrain/Loss (Raw)": 1.867199182510376, "Full-pretrain/Step": 7617, "Full-pretrain/Step Time": 17.599029906094074} +{"Full-pretrain/Learning Rate": 5.1193104147161885e-06, "Full-pretrain/Loss": 1.9253442287445068, "Full-pretrain/Loss (Raw)": 1.687534213066101, "Full-pretrain/Step": 7618, "Full-pretrain/Step Time": 17.59415783919394} +{"Full-pretrain/Learning Rate": 5.114163501042182e-06, "Full-pretrain/Loss": 1.9325721263885498, "Full-pretrain/Loss (Raw)": 2.010885715484619, "Full-pretrain/Step": 7619, "Full-pretrain/Step Time": 17.58951124176383} +{"Full-pretrain/Learning Rate": 5.109018881192423e-06, "Full-pretrain/Loss": 1.9336949586868286, "Full-pretrain/Loss (Raw)": 1.8858901262283325, "Full-pretrain/Step": 7620, "Full-pretrain/Step Time": 17.59070648625493} +{"Full-pretrain/Learning Rate": 5.103876555760345e-06, "Full-pretrain/Loss": 1.9327433109283447, "Full-pretrain/Loss (Raw)": 1.7948040962219238, "Full-pretrain/Step": 7621, "Full-pretrain/Step Time": 17.591254932805896} +{"Full-pretrain/Learning Rate": 5.098736525339115e-06, "Full-pretrain/Loss": 1.9357608556747437, "Full-pretrain/Loss (Raw)": 2.135220527648926, "Full-pretrain/Step": 7622, "Full-pretrain/Step Time": 17.594215666875243} +{"Full-pretrain/Learning Rate": 5.093598790521634e-06, "Full-pretrain/Loss": 1.942072868347168, "Full-pretrain/Loss (Raw)": 2.0169076919555664, "Full-pretrain/Step": 7623, "Full-pretrain/Step Time": 17.59086547419429} +{"Full-pretrain/Learning Rate": 5.088463351900541e-06, "Full-pretrain/Loss": 1.930687427520752, "Full-pretrain/Loss (Raw)": 1.6405342817306519, "Full-pretrain/Step": 7624, "Full-pretrain/Step Time": 17.594744050875306} +{"Full-pretrain/Learning Rate": 5.0833302100681965e-06, "Full-pretrain/Loss": 1.9240773916244507, "Full-pretrain/Loss (Raw)": 1.835728645324707, "Full-pretrain/Step": 7625, "Full-pretrain/Step Time": 17.601409351453185} +{"Full-pretrain/Learning Rate": 5.078199365616715e-06, "Full-pretrain/Loss": 1.9289593696594238, "Full-pretrain/Loss (Raw)": 1.983803629875183, "Full-pretrain/Step": 7626, "Full-pretrain/Step Time": 17.602030901238322} +{"Full-pretrain/Learning Rate": 5.073070819137934e-06, "Full-pretrain/Loss": 1.931037425994873, "Full-pretrain/Loss (Raw)": 1.8907067775726318, "Full-pretrain/Step": 7627, "Full-pretrain/Step Time": 17.602710800245404} +{"Full-pretrain/Learning Rate": 5.067944571223432e-06, "Full-pretrain/Loss": 1.9392712116241455, "Full-pretrain/Loss (Raw)": 1.993315577507019, "Full-pretrain/Step": 7628, "Full-pretrain/Step Time": 17.60075961612165} +{"Full-pretrain/Learning Rate": 5.062820622464526e-06, "Full-pretrain/Loss": 1.9276453256607056, "Full-pretrain/Loss (Raw)": 1.8904948234558105, "Full-pretrain/Step": 7629, "Full-pretrain/Step Time": 17.60502770356834} +{"Full-pretrain/Learning Rate": 5.057698973452249e-06, "Full-pretrain/Loss": 1.9304049015045166, "Full-pretrain/Loss (Raw)": 2.007338047027588, "Full-pretrain/Step": 7630, "Full-pretrain/Step Time": 17.601100511848927} +{"Full-pretrain/Learning Rate": 5.052579624777384e-06, "Full-pretrain/Loss": 1.9285649061203003, "Full-pretrain/Loss (Raw)": 1.9030396938323975, "Full-pretrain/Step": 7631, "Full-pretrain/Step Time": 17.600845457985997} +{"Full-pretrain/Learning Rate": 5.047462577030451e-06, "Full-pretrain/Loss": 1.932124376296997, "Full-pretrain/Loss (Raw)": 1.8444726467132568, "Full-pretrain/Step": 7632, "Full-pretrain/Step Time": 17.60186887346208} +{"Full-pretrain/Learning Rate": 5.042347830801705e-06, "Full-pretrain/Loss": 1.931471586227417, "Full-pretrain/Loss (Raw)": 1.9660580158233643, "Full-pretrain/Step": 7633, "Full-pretrain/Step Time": 17.6085945982486} +{"Full-pretrain/Learning Rate": 5.037235386681116e-06, "Full-pretrain/Loss": 1.9313920736312866, "Full-pretrain/Loss (Raw)": 1.9443432092666626, "Full-pretrain/Step": 7634, "Full-pretrain/Step Time": 17.616060996428132} +{"Full-pretrain/Learning Rate": 5.032125245258409e-06, "Full-pretrain/Loss": 1.9349195957183838, "Full-pretrain/Loss (Raw)": 1.8555246591567993, "Full-pretrain/Step": 7635, "Full-pretrain/Step Time": 17.61262816004455} +{"Full-pretrain/Learning Rate": 5.027017407123047e-06, "Full-pretrain/Loss": 1.9451475143432617, "Full-pretrain/Loss (Raw)": 2.044414520263672, "Full-pretrain/Step": 7636, "Full-pretrain/Step Time": 17.62041804380715} +{"Full-pretrain/Learning Rate": 5.021911872864199e-06, "Full-pretrain/Loss": 1.939673662185669, "Full-pretrain/Loss (Raw)": 1.8847993612289429, "Full-pretrain/Step": 7637, "Full-pretrain/Step Time": 17.62780114635825} +{"Full-pretrain/Learning Rate": 5.016808643070798e-06, "Full-pretrain/Loss": 1.9280470609664917, "Full-pretrain/Loss (Raw)": 1.8448936939239502, "Full-pretrain/Step": 7638, "Full-pretrain/Step Time": 17.628152053803205} +{"Full-pretrain/Learning Rate": 5.011707718331496e-06, "Full-pretrain/Loss": 1.9277080297470093, "Full-pretrain/Loss (Raw)": 1.903484582901001, "Full-pretrain/Step": 7639, "Full-pretrain/Step Time": 17.62650628760457} +{"Full-pretrain/Learning Rate": 5.0066090992346905e-06, "Full-pretrain/Loss": 1.9175233840942383, "Full-pretrain/Loss (Raw)": 1.6216084957122803, "Full-pretrain/Step": 7640, "Full-pretrain/Step Time": 17.630341524258256} +{"Full-pretrain/Learning Rate": 5.001512786368492e-06, "Full-pretrain/Loss": 1.9091238975524902, "Full-pretrain/Loss (Raw)": 1.7465386390686035, "Full-pretrain/Step": 7641, "Full-pretrain/Step Time": 17.62930404022336} +{"Full-pretrain/Learning Rate": 4.996418780320766e-06, "Full-pretrain/Loss": 1.903942346572876, "Full-pretrain/Loss (Raw)": 1.751346468925476, "Full-pretrain/Step": 7642, "Full-pretrain/Step Time": 17.62993540428579} +{"Full-pretrain/Learning Rate": 4.991327081679106e-06, "Full-pretrain/Loss": 1.9034192562103271, "Full-pretrain/Loss (Raw)": 1.8327131271362305, "Full-pretrain/Step": 7643, "Full-pretrain/Step Time": 17.629470329731703} +{"Full-pretrain/Learning Rate": 4.986237691030835e-06, "Full-pretrain/Loss": 1.8989031314849854, "Full-pretrain/Loss (Raw)": 2.110600233078003, "Full-pretrain/Step": 7644, "Full-pretrain/Step Time": 17.629751266911626} +{"Full-pretrain/Learning Rate": 4.981150608963017e-06, "Full-pretrain/Loss": 1.900759220123291, "Full-pretrain/Loss (Raw)": 2.0029804706573486, "Full-pretrain/Step": 7645, "Full-pretrain/Step Time": 17.62915377318859} +{"Full-pretrain/Learning Rate": 4.9760658360624355e-06, "Full-pretrain/Loss": 1.9038946628570557, "Full-pretrain/Loss (Raw)": 1.9086120128631592, "Full-pretrain/Step": 7646, "Full-pretrain/Step Time": 17.63178418017924} +{"Full-pretrain/Learning Rate": 4.9709833729156246e-06, "Full-pretrain/Loss": 1.8882107734680176, "Full-pretrain/Loss (Raw)": 1.6372878551483154, "Full-pretrain/Step": 7647, "Full-pretrain/Step Time": 17.63041675835848} +{"Full-pretrain/Learning Rate": 4.965903220108842e-06, "Full-pretrain/Loss": 1.8897593021392822, "Full-pretrain/Loss (Raw)": 2.02921724319458, "Full-pretrain/Step": 7648, "Full-pretrain/Step Time": 17.63605766557157} +{"Full-pretrain/Learning Rate": 4.960825378228082e-06, "Full-pretrain/Loss": 1.891198754310608, "Full-pretrain/Loss (Raw)": 1.9132612943649292, "Full-pretrain/Step": 7649, "Full-pretrain/Step Time": 17.63425735756755} +{"Full-pretrain/Learning Rate": 4.9557498478590785e-06, "Full-pretrain/Loss": 1.8933970928192139, "Full-pretrain/Loss (Raw)": 1.7578816413879395, "Full-pretrain/Step": 7650, "Full-pretrain/Step Time": 17.6332587916404} +{"Full-pretrain/Learning Rate": 4.950676629587281e-06, "Full-pretrain/Loss": 1.8960702419281006, "Full-pretrain/Loss (Raw)": 2.0964269638061523, "Full-pretrain/Step": 7651, "Full-pretrain/Step Time": 17.630113430321217} +{"Full-pretrain/Learning Rate": 4.945605723997896e-06, "Full-pretrain/Loss": 1.8939275741577148, "Full-pretrain/Loss (Raw)": 1.8173208236694336, "Full-pretrain/Step": 7652, "Full-pretrain/Step Time": 17.63439677283168} +{"Full-pretrain/Learning Rate": 4.9405371316758345e-06, "Full-pretrain/Loss": 1.9032620191574097, "Full-pretrain/Loss (Raw)": 2.0935091972351074, "Full-pretrain/Step": 7653, "Full-pretrain/Step Time": 17.62866559624672} +{"Full-pretrain/Learning Rate": 4.935470853205765e-06, "Full-pretrain/Loss": 1.8910778760910034, "Full-pretrain/Loss (Raw)": 1.7453298568725586, "Full-pretrain/Step": 7654, "Full-pretrain/Step Time": 17.6369051579386} +{"Full-pretrain/Learning Rate": 4.93040688917209e-06, "Full-pretrain/Loss": 1.8809661865234375, "Full-pretrain/Loss (Raw)": 1.693327784538269, "Full-pretrain/Step": 7655, "Full-pretrain/Step Time": 17.635147096589208} +{"Full-pretrain/Learning Rate": 4.9253452401589185e-06, "Full-pretrain/Loss": 1.886789321899414, "Full-pretrain/Loss (Raw)": 1.8268756866455078, "Full-pretrain/Step": 7656, "Full-pretrain/Step Time": 17.6369553450495} +{"Full-pretrain/Learning Rate": 4.920285906750122e-06, "Full-pretrain/Loss": 1.8877012729644775, "Full-pretrain/Loss (Raw)": 1.8649156093597412, "Full-pretrain/Step": 7657, "Full-pretrain/Step Time": 17.63529753871262} +{"Full-pretrain/Learning Rate": 4.9152288895292855e-06, "Full-pretrain/Loss": 1.8900705575942993, "Full-pretrain/Loss (Raw)": 2.059619426727295, "Full-pretrain/Step": 7658, "Full-pretrain/Step Time": 17.63734599389136} +{"Full-pretrain/Learning Rate": 4.910174189079742e-06, "Full-pretrain/Loss": 1.8906211853027344, "Full-pretrain/Loss (Raw)": 1.908327579498291, "Full-pretrain/Step": 7659, "Full-pretrain/Step Time": 17.637391505762935} +{"Full-pretrain/Learning Rate": 4.9051218059845446e-06, "Full-pretrain/Loss": 1.8973770141601562, "Full-pretrain/Loss (Raw)": 2.2094974517822266, "Full-pretrain/Step": 7660, "Full-pretrain/Step Time": 17.63795450143516} +{"Full-pretrain/Learning Rate": 4.900071740826489e-06, "Full-pretrain/Loss": 1.8905080556869507, "Full-pretrain/Loss (Raw)": 1.6706892251968384, "Full-pretrain/Step": 7661, "Full-pretrain/Step Time": 17.631779614835978} +{"Full-pretrain/Learning Rate": 4.8950239941880914e-06, "Full-pretrain/Loss": 1.890178918838501, "Full-pretrain/Loss (Raw)": 1.99680495262146, "Full-pretrain/Step": 7662, "Full-pretrain/Step Time": 17.635769737884402} +{"Full-pretrain/Learning Rate": 4.88997856665161e-06, "Full-pretrain/Loss": 1.8839149475097656, "Full-pretrain/Loss (Raw)": 1.7025951147079468, "Full-pretrain/Step": 7663, "Full-pretrain/Step Time": 17.636734806001186} +{"Full-pretrain/Learning Rate": 4.884935458799031e-06, "Full-pretrain/Loss": 1.8779975175857544, "Full-pretrain/Loss (Raw)": 1.655112385749817, "Full-pretrain/Step": 7664, "Full-pretrain/Step Time": 17.63683944568038} +{"Full-pretrain/Learning Rate": 4.879894671212082e-06, "Full-pretrain/Loss": 1.877464771270752, "Full-pretrain/Loss (Raw)": 1.9490101337432861, "Full-pretrain/Step": 7665, "Full-pretrain/Step Time": 17.630957514047623} +{"Full-pretrain/Learning Rate": 4.874856204472217e-06, "Full-pretrain/Loss": 1.8787205219268799, "Full-pretrain/Loss (Raw)": 1.9845294952392578, "Full-pretrain/Step": 7666, "Full-pretrain/Step Time": 17.63158051110804} +{"Full-pretrain/Learning Rate": 4.869820059160607e-06, "Full-pretrain/Loss": 1.8774906396865845, "Full-pretrain/Loss (Raw)": 1.8161674737930298, "Full-pretrain/Step": 7667, "Full-pretrain/Step Time": 17.63242875225842} +{"Full-pretrain/Learning Rate": 4.864786235858187e-06, "Full-pretrain/Loss": 1.8815391063690186, "Full-pretrain/Loss (Raw)": 2.1739678382873535, "Full-pretrain/Step": 7668, "Full-pretrain/Step Time": 17.625542547553778} +{"Full-pretrain/Learning Rate": 4.859754735145594e-06, "Full-pretrain/Loss": 1.8845834732055664, "Full-pretrain/Loss (Raw)": 1.9822206497192383, "Full-pretrain/Step": 7669, "Full-pretrain/Step Time": 17.62909833714366} +{"Full-pretrain/Learning Rate": 4.854725557603215e-06, "Full-pretrain/Loss": 1.8895022869110107, "Full-pretrain/Loss (Raw)": 2.002296209335327, "Full-pretrain/Step": 7670, "Full-pretrain/Step Time": 17.631670523434877} +{"Full-pretrain/Learning Rate": 4.8496987038111674e-06, "Full-pretrain/Loss": 1.8890339136123657, "Full-pretrain/Loss (Raw)": 1.888493537902832, "Full-pretrain/Step": 7671, "Full-pretrain/Step Time": 17.630251988768578} +{"Full-pretrain/Learning Rate": 4.844674174349287e-06, "Full-pretrain/Loss": 1.896841049194336, "Full-pretrain/Loss (Raw)": 1.871436357498169, "Full-pretrain/Step": 7672, "Full-pretrain/Step Time": 17.629191663116217} +{"Full-pretrain/Learning Rate": 4.83965196979716e-06, "Full-pretrain/Loss": 1.9028544425964355, "Full-pretrain/Loss (Raw)": 1.938966989517212, "Full-pretrain/Step": 7673, "Full-pretrain/Step Time": 17.62782140634954} +{"Full-pretrain/Learning Rate": 4.83463209073409e-06, "Full-pretrain/Loss": 1.904602289199829, "Full-pretrain/Loss (Raw)": 1.8072788715362549, "Full-pretrain/Step": 7674, "Full-pretrain/Step Time": 17.627576434984803} +{"Full-pretrain/Learning Rate": 4.829614537739124e-06, "Full-pretrain/Loss": 1.9147460460662842, "Full-pretrain/Loss (Raw)": 2.157313346862793, "Full-pretrain/Step": 7675, "Full-pretrain/Step Time": 17.630694765597582} +{"Full-pretrain/Learning Rate": 4.824599311391031e-06, "Full-pretrain/Loss": 1.8965685367584229, "Full-pretrain/Loss (Raw)": 1.528923749923706, "Full-pretrain/Step": 7676, "Full-pretrain/Step Time": 17.63448260165751} +{"Full-pretrain/Learning Rate": 4.819586412268326e-06, "Full-pretrain/Loss": 1.8974628448486328, "Full-pretrain/Loss (Raw)": 2.0315935611724854, "Full-pretrain/Step": 7677, "Full-pretrain/Step Time": 17.62846465408802} +{"Full-pretrain/Learning Rate": 4.814575840949228e-06, "Full-pretrain/Loss": 1.8932020664215088, "Full-pretrain/Loss (Raw)": 1.7722656726837158, "Full-pretrain/Step": 7678, "Full-pretrain/Step Time": 17.631539791822433} +{"Full-pretrain/Learning Rate": 4.809567598011714e-06, "Full-pretrain/Loss": 1.8994197845458984, "Full-pretrain/Loss (Raw)": 1.836256504058838, "Full-pretrain/Step": 7679, "Full-pretrain/Step Time": 17.634570933878422} +{"Full-pretrain/Learning Rate": 4.8045616840334816e-06, "Full-pretrain/Loss": 1.8884665966033936, "Full-pretrain/Loss (Raw)": 1.6787132024765015, "Full-pretrain/Step": 7680, "Full-pretrain/Step Time": 17.633432149887085} +{"Full-pretrain/Learning Rate": 4.799558099591961e-06, "Full-pretrain/Loss": 1.894735336303711, "Full-pretrain/Loss (Raw)": 2.113861560821533, "Full-pretrain/Step": 7681, "Full-pretrain/Step Time": 17.635449731722474} +{"Full-pretrain/Learning Rate": 4.794556845264322e-06, "Full-pretrain/Loss": 1.897548794746399, "Full-pretrain/Loss (Raw)": 1.8479138612747192, "Full-pretrain/Step": 7682, "Full-pretrain/Step Time": 17.632564906030893} +{"Full-pretrain/Learning Rate": 4.789557921627444e-06, "Full-pretrain/Loss": 1.8924546241760254, "Full-pretrain/Loss (Raw)": 1.9334158897399902, "Full-pretrain/Step": 7683, "Full-pretrain/Step Time": 17.63319660909474} +{"Full-pretrain/Learning Rate": 4.7845613292579585e-06, "Full-pretrain/Loss": 1.8980358839035034, "Full-pretrain/Loss (Raw)": 1.9959168434143066, "Full-pretrain/Step": 7684, "Full-pretrain/Step Time": 17.63199650682509} +{"Full-pretrain/Learning Rate": 4.779567068732224e-06, "Full-pretrain/Loss": 1.8910245895385742, "Full-pretrain/Loss (Raw)": 1.8691468238830566, "Full-pretrain/Step": 7685, "Full-pretrain/Step Time": 17.633286388590932} +{"Full-pretrain/Learning Rate": 4.7745751406263165e-06, "Full-pretrain/Loss": 1.8978135585784912, "Full-pretrain/Loss (Raw)": 1.9625823497772217, "Full-pretrain/Step": 7686, "Full-pretrain/Step Time": 17.62980197556317} +{"Full-pretrain/Learning Rate": 4.769585545516065e-06, "Full-pretrain/Loss": 1.9057104587554932, "Full-pretrain/Loss (Raw)": 1.9460272789001465, "Full-pretrain/Step": 7687, "Full-pretrain/Step Time": 17.62833745777607} +{"Full-pretrain/Learning Rate": 4.764598283977004e-06, "Full-pretrain/Loss": 1.9124376773834229, "Full-pretrain/Loss (Raw)": 2.042145252227783, "Full-pretrain/Step": 7688, "Full-pretrain/Step Time": 17.626648362725973} +{"Full-pretrain/Learning Rate": 4.759613356584422e-06, "Full-pretrain/Loss": 1.9144173860549927, "Full-pretrain/Loss (Raw)": 1.9282671213150024, "Full-pretrain/Step": 7689, "Full-pretrain/Step Time": 17.632580200210214} +{"Full-pretrain/Learning Rate": 4.754630763913323e-06, "Full-pretrain/Loss": 1.9173011779785156, "Full-pretrain/Loss (Raw)": 2.15190052986145, "Full-pretrain/Step": 7690, "Full-pretrain/Step Time": 17.630498971790075} +{"Full-pretrain/Learning Rate": 4.749650506538453e-06, "Full-pretrain/Loss": 1.913527488708496, "Full-pretrain/Loss (Raw)": 1.7875677347183228, "Full-pretrain/Step": 7691, "Full-pretrain/Step Time": 17.635386012494564} +{"Full-pretrain/Learning Rate": 4.7446725850342875e-06, "Full-pretrain/Loss": 1.9059900045394897, "Full-pretrain/Loss (Raw)": 1.968298316001892, "Full-pretrain/Step": 7692, "Full-pretrain/Step Time": 17.634340217337012} +{"Full-pretrain/Learning Rate": 4.739696999975013e-06, "Full-pretrain/Loss": 1.9073883295059204, "Full-pretrain/Loss (Raw)": 1.7154361009597778, "Full-pretrain/Step": 7693, "Full-pretrain/Step Time": 17.632430233061314} +{"Full-pretrain/Learning Rate": 4.734723751934572e-06, "Full-pretrain/Loss": 1.895503044128418, "Full-pretrain/Loss (Raw)": 1.6164727210998535, "Full-pretrain/Step": 7694, "Full-pretrain/Step Time": 17.636376788839698} +{"Full-pretrain/Learning Rate": 4.729752841486623e-06, "Full-pretrain/Loss": 1.89548659324646, "Full-pretrain/Loss (Raw)": 1.702072024345398, "Full-pretrain/Step": 7695, "Full-pretrain/Step Time": 17.635046247392893} +{"Full-pretrain/Learning Rate": 4.72478426920456e-06, "Full-pretrain/Loss": 1.9083895683288574, "Full-pretrain/Loss (Raw)": 2.068007469177246, "Full-pretrain/Step": 7696, "Full-pretrain/Step Time": 17.635488159954548} +{"Full-pretrain/Learning Rate": 4.719818035661508e-06, "Full-pretrain/Loss": 1.9104373455047607, "Full-pretrain/Loss (Raw)": 2.014535903930664, "Full-pretrain/Step": 7697, "Full-pretrain/Step Time": 17.637873040512204} +{"Full-pretrain/Learning Rate": 4.714854141430322e-06, "Full-pretrain/Loss": 1.9075568914413452, "Full-pretrain/Loss (Raw)": 1.8923553228378296, "Full-pretrain/Step": 7698, "Full-pretrain/Step Time": 17.641934536397457} +{"Full-pretrain/Learning Rate": 4.709892587083578e-06, "Full-pretrain/Loss": 1.9107334613800049, "Full-pretrain/Loss (Raw)": 1.9178224802017212, "Full-pretrain/Step": 7699, "Full-pretrain/Step Time": 17.635992294177413} +{"Full-pretrain/Learning Rate": 4.704933373193593e-06, "Full-pretrain/Loss": 1.9140191078186035, "Full-pretrain/Loss (Raw)": 2.279109239578247, "Full-pretrain/Step": 7700, "Full-pretrain/Step Time": 17.631295459344983} +{"Full-pretrain/Learning Rate": 4.699976500332418e-06, "Full-pretrain/Loss": 1.9154930114746094, "Full-pretrain/Loss (Raw)": 2.029383659362793, "Full-pretrain/Step": 7701, "Full-pretrain/Step Time": 17.64615091122687} +{"Full-pretrain/Learning Rate": 4.695021969071811e-06, "Full-pretrain/Loss": 1.9107863903045654, "Full-pretrain/Loss (Raw)": 1.851681113243103, "Full-pretrain/Step": 7702, "Full-pretrain/Step Time": 17.641765551641583} +{"Full-pretrain/Learning Rate": 4.690069779983294e-06, "Full-pretrain/Loss": 1.904677391052246, "Full-pretrain/Loss (Raw)": 1.6930105686187744, "Full-pretrain/Step": 7703, "Full-pretrain/Step Time": 17.643066143617034} +{"Full-pretrain/Learning Rate": 4.685119933638082e-06, "Full-pretrain/Loss": 1.9147975444793701, "Full-pretrain/Loss (Raw)": 2.195277690887451, "Full-pretrain/Step": 7704, "Full-pretrain/Step Time": 17.635473996400833} +{"Full-pretrain/Learning Rate": 4.680172430607146e-06, "Full-pretrain/Loss": 1.905469536781311, "Full-pretrain/Loss (Raw)": 1.64047110080719, "Full-pretrain/Step": 7705, "Full-pretrain/Step Time": 17.642483623698354} +{"Full-pretrain/Learning Rate": 4.675227271461182e-06, "Full-pretrain/Loss": 1.9174989461898804, "Full-pretrain/Loss (Raw)": 2.192220687866211, "Full-pretrain/Step": 7706, "Full-pretrain/Step Time": 17.644544461742043} +{"Full-pretrain/Learning Rate": 4.670284456770607e-06, "Full-pretrain/Loss": 1.907935619354248, "Full-pretrain/Loss (Raw)": 1.851288080215454, "Full-pretrain/Step": 7707, "Full-pretrain/Step Time": 17.633752277120948} +{"Full-pretrain/Learning Rate": 4.665343987105583e-06, "Full-pretrain/Loss": 1.92525053024292, "Full-pretrain/Loss (Raw)": 2.082998514175415, "Full-pretrain/Step": 7708, "Full-pretrain/Step Time": 17.640754278749228} +{"Full-pretrain/Learning Rate": 4.660405863035977e-06, "Full-pretrain/Loss": 1.924121618270874, "Full-pretrain/Loss (Raw)": 1.995469093322754, "Full-pretrain/Step": 7709, "Full-pretrain/Step Time": 17.63642682507634} +{"Full-pretrain/Learning Rate": 4.655470085131408e-06, "Full-pretrain/Loss": 1.9299519062042236, "Full-pretrain/Loss (Raw)": 1.9588351249694824, "Full-pretrain/Step": 7710, "Full-pretrain/Step Time": 17.64008388109505} +{"Full-pretrain/Learning Rate": 4.650536653961215e-06, "Full-pretrain/Loss": 1.914370059967041, "Full-pretrain/Loss (Raw)": 1.3376338481903076, "Full-pretrain/Step": 7711, "Full-pretrain/Step Time": 17.641015015542507} +{"Full-pretrain/Learning Rate": 4.645605570094466e-06, "Full-pretrain/Loss": 1.924590826034546, "Full-pretrain/Loss (Raw)": 2.00577974319458, "Full-pretrain/Step": 7712, "Full-pretrain/Step Time": 17.639107471331954} +{"Full-pretrain/Learning Rate": 4.640676834099969e-06, "Full-pretrain/Loss": 1.9150047302246094, "Full-pretrain/Loss (Raw)": 1.807106614112854, "Full-pretrain/Step": 7713, "Full-pretrain/Step Time": 17.63828483968973} +{"Full-pretrain/Learning Rate": 4.635750446546239e-06, "Full-pretrain/Loss": 1.931760311126709, "Full-pretrain/Loss (Raw)": 2.384091854095459, "Full-pretrain/Step": 7714, "Full-pretrain/Step Time": 17.63681184872985} +{"Full-pretrain/Learning Rate": 4.630826408001537e-06, "Full-pretrain/Loss": 1.9230406284332275, "Full-pretrain/Loss (Raw)": 1.6543856859207153, "Full-pretrain/Step": 7715, "Full-pretrain/Step Time": 17.63522164709866} +{"Full-pretrain/Learning Rate": 4.62590471903385e-06, "Full-pretrain/Loss": 1.9159281253814697, "Full-pretrain/Loss (Raw)": 1.768317699432373, "Full-pretrain/Step": 7716, "Full-pretrain/Step Time": 17.634244296699762} +{"Full-pretrain/Learning Rate": 4.620985380210901e-06, "Full-pretrain/Loss": 1.9351897239685059, "Full-pretrain/Loss (Raw)": 2.4855189323425293, "Full-pretrain/Step": 7717, "Full-pretrain/Step Time": 17.63089832291007} +{"Full-pretrain/Learning Rate": 4.61606839210012e-06, "Full-pretrain/Loss": 1.9367021322250366, "Full-pretrain/Loss (Raw)": 2.0109806060791016, "Full-pretrain/Step": 7718, "Full-pretrain/Step Time": 17.633977895602584} +{"Full-pretrain/Learning Rate": 4.611153755268688e-06, "Full-pretrain/Loss": 1.9356321096420288, "Full-pretrain/Loss (Raw)": 1.9117854833602905, "Full-pretrain/Step": 7719, "Full-pretrain/Step Time": 17.635737458243966} +{"Full-pretrain/Learning Rate": 4.606241470283512e-06, "Full-pretrain/Loss": 1.9340487718582153, "Full-pretrain/Loss (Raw)": 1.991479516029358, "Full-pretrain/Step": 7720, "Full-pretrain/Step Time": 17.631620412692428} +{"Full-pretrain/Learning Rate": 4.601331537711207e-06, "Full-pretrain/Loss": 1.9365301132202148, "Full-pretrain/Loss (Raw)": 2.007669448852539, "Full-pretrain/Step": 7721, "Full-pretrain/Step Time": 17.63408957608044} +{"Full-pretrain/Learning Rate": 4.59642395811814e-06, "Full-pretrain/Loss": 1.9256842136383057, "Full-pretrain/Loss (Raw)": 1.804830551147461, "Full-pretrain/Step": 7722, "Full-pretrain/Step Time": 17.63596686720848} +{"Full-pretrain/Learning Rate": 4.591518732070402e-06, "Full-pretrain/Loss": 1.9376842975616455, "Full-pretrain/Loss (Raw)": 2.1715705394744873, "Full-pretrain/Step": 7723, "Full-pretrain/Step Time": 17.630772536620498} +{"Full-pretrain/Learning Rate": 4.586615860133811e-06, "Full-pretrain/Loss": 1.9236118793487549, "Full-pretrain/Loss (Raw)": 1.5179810523986816, "Full-pretrain/Step": 7724, "Full-pretrain/Step Time": 17.631340604275465} +{"Full-pretrain/Learning Rate": 4.581715342873899e-06, "Full-pretrain/Loss": 1.9354033470153809, "Full-pretrain/Loss (Raw)": 2.0927600860595703, "Full-pretrain/Step": 7725, "Full-pretrain/Step Time": 17.63608335517347} +{"Full-pretrain/Learning Rate": 4.57681718085595e-06, "Full-pretrain/Loss": 1.941650629043579, "Full-pretrain/Loss (Raw)": 1.8163914680480957, "Full-pretrain/Step": 7726, "Full-pretrain/Step Time": 17.633167868480086} +{"Full-pretrain/Learning Rate": 4.571921374644958e-06, "Full-pretrain/Loss": 1.9476385116577148, "Full-pretrain/Loss (Raw)": 1.8936822414398193, "Full-pretrain/Step": 7727, "Full-pretrain/Step Time": 17.637011349201202} +{"Full-pretrain/Learning Rate": 4.5670279248056585e-06, "Full-pretrain/Loss": 1.9454498291015625, "Full-pretrain/Loss (Raw)": 1.9979699850082397, "Full-pretrain/Step": 7728, "Full-pretrain/Step Time": 17.633343759924173} +{"Full-pretrain/Learning Rate": 4.562136831902514e-06, "Full-pretrain/Loss": 1.9396202564239502, "Full-pretrain/Loss (Raw)": 1.8279863595962524, "Full-pretrain/Step": 7729, "Full-pretrain/Step Time": 17.636637467890978} +{"Full-pretrain/Learning Rate": 4.557248096499697e-06, "Full-pretrain/Loss": 1.9361013174057007, "Full-pretrain/Loss (Raw)": 1.7797527313232422, "Full-pretrain/Step": 7730, "Full-pretrain/Step Time": 17.63683184608817} +{"Full-pretrain/Learning Rate": 4.552361719161127e-06, "Full-pretrain/Loss": 1.929189920425415, "Full-pretrain/Loss (Raw)": 1.6966590881347656, "Full-pretrain/Step": 7731, "Full-pretrain/Step Time": 17.63597950525582} +{"Full-pretrain/Learning Rate": 4.547477700450448e-06, "Full-pretrain/Loss": 1.9196014404296875, "Full-pretrain/Loss (Raw)": 1.9722750186920166, "Full-pretrain/Step": 7732, "Full-pretrain/Step Time": 17.64043720625341} +{"Full-pretrain/Learning Rate": 4.542596040931029e-06, "Full-pretrain/Loss": 1.9157869815826416, "Full-pretrain/Loss (Raw)": 1.9073247909545898, "Full-pretrain/Step": 7733, "Full-pretrain/Step Time": 17.637759493663907} +{"Full-pretrain/Learning Rate": 4.537716741165973e-06, "Full-pretrain/Loss": 1.9009071588516235, "Full-pretrain/Loss (Raw)": 1.3755226135253906, "Full-pretrain/Step": 7734, "Full-pretrain/Step Time": 17.63918797299266} +{"Full-pretrain/Learning Rate": 4.532839801718095e-06, "Full-pretrain/Loss": 1.9127142429351807, "Full-pretrain/Loss (Raw)": 2.070836305618286, "Full-pretrain/Step": 7735, "Full-pretrain/Step Time": 17.636304626241326} +{"Full-pretrain/Learning Rate": 4.527965223149957e-06, "Full-pretrain/Loss": 1.9064924716949463, "Full-pretrain/Loss (Raw)": 1.9961854219436646, "Full-pretrain/Step": 7736, "Full-pretrain/Step Time": 17.640976920723915} +{"Full-pretrain/Learning Rate": 4.523093006023832e-06, "Full-pretrain/Loss": 1.9124817848205566, "Full-pretrain/Loss (Raw)": 1.832127332687378, "Full-pretrain/Step": 7737, "Full-pretrain/Step Time": 17.629023855552077} +{"Full-pretrain/Learning Rate": 4.518223150901732e-06, "Full-pretrain/Loss": 1.8933073282241821, "Full-pretrain/Loss (Raw)": 1.5786354541778564, "Full-pretrain/Step": 7738, "Full-pretrain/Step Time": 17.634796775877476} +{"Full-pretrain/Learning Rate": 4.513355658345392e-06, "Full-pretrain/Loss": 1.8982484340667725, "Full-pretrain/Loss (Raw)": 2.0094058513641357, "Full-pretrain/Step": 7739, "Full-pretrain/Step Time": 17.632888574153185} +{"Full-pretrain/Learning Rate": 4.508490528916287e-06, "Full-pretrain/Loss": 1.8937318325042725, "Full-pretrain/Loss (Raw)": 1.9384677410125732, "Full-pretrain/Step": 7740, "Full-pretrain/Step Time": 17.62841702438891} +{"Full-pretrain/Learning Rate": 4.503627763175589e-06, "Full-pretrain/Loss": 1.8930422067642212, "Full-pretrain/Loss (Raw)": 1.973400592803955, "Full-pretrain/Step": 7741, "Full-pretrain/Step Time": 17.632141694426537} +{"Full-pretrain/Learning Rate": 4.498767361684228e-06, "Full-pretrain/Loss": 1.8860816955566406, "Full-pretrain/Loss (Raw)": 1.7360942363739014, "Full-pretrain/Step": 7742, "Full-pretrain/Step Time": 17.636386098340154} +{"Full-pretrain/Learning Rate": 4.493909325002846e-06, "Full-pretrain/Loss": 1.9069547653198242, "Full-pretrain/Loss (Raw)": 2.005573272705078, "Full-pretrain/Step": 7743, "Full-pretrain/Step Time": 17.635767260566354} +{"Full-pretrain/Learning Rate": 4.489053653691816e-06, "Full-pretrain/Loss": 1.9034037590026855, "Full-pretrain/Loss (Raw)": 1.8921475410461426, "Full-pretrain/Step": 7744, "Full-pretrain/Step Time": 17.63753443211317} +{"Full-pretrain/Learning Rate": 4.484200348311246e-06, "Full-pretrain/Loss": 1.9100685119628906, "Full-pretrain/Loss (Raw)": 2.020383358001709, "Full-pretrain/Step": 7745, "Full-pretrain/Step Time": 17.634681595489383} +{"Full-pretrain/Learning Rate": 4.4793494094209496e-06, "Full-pretrain/Loss": 1.9021496772766113, "Full-pretrain/Loss (Raw)": 2.1306869983673096, "Full-pretrain/Step": 7746, "Full-pretrain/Step Time": 17.638023557141423} +{"Full-pretrain/Learning Rate": 4.4745008375804866e-06, "Full-pretrain/Loss": 1.9003164768218994, "Full-pretrain/Loss (Raw)": 1.5957239866256714, "Full-pretrain/Step": 7747, "Full-pretrain/Step Time": 17.64036352559924} +{"Full-pretrain/Learning Rate": 4.469654633349141e-06, "Full-pretrain/Loss": 1.9077322483062744, "Full-pretrain/Loss (Raw)": 2.005620241165161, "Full-pretrain/Step": 7748, "Full-pretrain/Step Time": 17.64232274889946} +{"Full-pretrain/Learning Rate": 4.464810797285918e-06, "Full-pretrain/Loss": 1.891249418258667, "Full-pretrain/Loss (Raw)": 1.9580724239349365, "Full-pretrain/Step": 7749, "Full-pretrain/Step Time": 17.641480596736073} +{"Full-pretrain/Learning Rate": 4.459969329949559e-06, "Full-pretrain/Loss": 1.8725829124450684, "Full-pretrain/Loss (Raw)": 1.4136488437652588, "Full-pretrain/Step": 7750, "Full-pretrain/Step Time": 17.63942366465926} +{"Full-pretrain/Learning Rate": 4.455130231898513e-06, "Full-pretrain/Loss": 1.8682688474655151, "Full-pretrain/Loss (Raw)": 1.7737388610839844, "Full-pretrain/Step": 7751, "Full-pretrain/Step Time": 17.646666795015335} +{"Full-pretrain/Learning Rate": 4.45029350369098e-06, "Full-pretrain/Loss": 1.8676364421844482, "Full-pretrain/Loss (Raw)": 1.971239447593689, "Full-pretrain/Step": 7752, "Full-pretrain/Step Time": 17.64256141707301} +{"Full-pretrain/Learning Rate": 4.445459145884864e-06, "Full-pretrain/Loss": 1.869386911392212, "Full-pretrain/Loss (Raw)": 2.063685417175293, "Full-pretrain/Step": 7753, "Full-pretrain/Step Time": 17.636489929631352} +{"Full-pretrain/Learning Rate": 4.4406271590378135e-06, "Full-pretrain/Loss": 1.8882231712341309, "Full-pretrain/Loss (Raw)": 2.407592535018921, "Full-pretrain/Step": 7754, "Full-pretrain/Step Time": 17.636282917112112} +{"Full-pretrain/Learning Rate": 4.435797543707201e-06, "Full-pretrain/Loss": 1.8929284811019897, "Full-pretrain/Loss (Raw)": 2.3221397399902344, "Full-pretrain/Step": 7755, "Full-pretrain/Step Time": 17.634781137108803} +{"Full-pretrain/Learning Rate": 4.430970300450107e-06, "Full-pretrain/Loss": 1.905090570449829, "Full-pretrain/Loss (Raw)": 1.907169222831726, "Full-pretrain/Step": 7756, "Full-pretrain/Step Time": 17.64065930992365} +{"Full-pretrain/Learning Rate": 4.426145429823361e-06, "Full-pretrain/Loss": 1.9009839296340942, "Full-pretrain/Loss (Raw)": 1.961343765258789, "Full-pretrain/Step": 7757, "Full-pretrain/Step Time": 17.632652148604393} +{"Full-pretrain/Learning Rate": 4.421322932383512e-06, "Full-pretrain/Loss": 1.8972883224487305, "Full-pretrain/Loss (Raw)": 1.6981346607208252, "Full-pretrain/Step": 7758, "Full-pretrain/Step Time": 17.63479471951723} +{"Full-pretrain/Learning Rate": 4.4165028086868285e-06, "Full-pretrain/Loss": 1.891331434249878, "Full-pretrain/Loss (Raw)": 1.703062891960144, "Full-pretrain/Step": 7759, "Full-pretrain/Step Time": 17.63801397383213} +{"Full-pretrain/Learning Rate": 4.411685059289314e-06, "Full-pretrain/Loss": 1.8928289413452148, "Full-pretrain/Loss (Raw)": 2.045891761779785, "Full-pretrain/Step": 7760, "Full-pretrain/Step Time": 17.630394792184234} +{"Full-pretrain/Learning Rate": 4.4068696847466975e-06, "Full-pretrain/Loss": 1.8963879346847534, "Full-pretrain/Loss (Raw)": 1.9418697357177734, "Full-pretrain/Step": 7761, "Full-pretrain/Step Time": 17.634120017290115} +{"Full-pretrain/Learning Rate": 4.40205668561442e-06, "Full-pretrain/Loss": 1.9111895561218262, "Full-pretrain/Loss (Raw)": 2.2534074783325195, "Full-pretrain/Step": 7762, "Full-pretrain/Step Time": 17.62331203185022} +{"Full-pretrain/Learning Rate": 4.397246062447666e-06, "Full-pretrain/Loss": 1.9274375438690186, "Full-pretrain/Loss (Raw)": 2.2165937423706055, "Full-pretrain/Step": 7763, "Full-pretrain/Step Time": 17.62985760718584} +{"Full-pretrain/Learning Rate": 4.3924378158013365e-06, "Full-pretrain/Loss": 1.9236338138580322, "Full-pretrain/Loss (Raw)": 1.8505566120147705, "Full-pretrain/Step": 7764, "Full-pretrain/Step Time": 17.622646309435368} +{"Full-pretrain/Learning Rate": 4.387631946230064e-06, "Full-pretrain/Loss": 1.9309120178222656, "Full-pretrain/Loss (Raw)": 2.1402244567871094, "Full-pretrain/Step": 7765, "Full-pretrain/Step Time": 17.621735084801912} +{"Full-pretrain/Learning Rate": 4.38282845428821e-06, "Full-pretrain/Loss": 1.9533252716064453, "Full-pretrain/Loss (Raw)": 2.092749834060669, "Full-pretrain/Step": 7766, "Full-pretrain/Step Time": 17.617773169651628} +{"Full-pretrain/Learning Rate": 4.378027340529842e-06, "Full-pretrain/Loss": 1.9449501037597656, "Full-pretrain/Loss (Raw)": 1.8028273582458496, "Full-pretrain/Step": 7767, "Full-pretrain/Step Time": 17.616410115733743} +{"Full-pretrain/Learning Rate": 4.373228605508772e-06, "Full-pretrain/Loss": 1.9495028257369995, "Full-pretrain/Loss (Raw)": 2.141875743865967, "Full-pretrain/Step": 7768, "Full-pretrain/Step Time": 17.615900579839945} +{"Full-pretrain/Learning Rate": 4.368432249778539e-06, "Full-pretrain/Loss": 1.9507184028625488, "Full-pretrain/Loss (Raw)": 1.8710227012634277, "Full-pretrain/Step": 7769, "Full-pretrain/Step Time": 17.617850832641125} +{"Full-pretrain/Learning Rate": 4.363638273892393e-06, "Full-pretrain/Loss": 1.9560251235961914, "Full-pretrain/Loss (Raw)": 1.7484517097473145, "Full-pretrain/Step": 7770, "Full-pretrain/Step Time": 17.616163475438952} +{"Full-pretrain/Learning Rate": 4.358846678403322e-06, "Full-pretrain/Loss": 1.9446080923080444, "Full-pretrain/Loss (Raw)": 1.6440614461898804, "Full-pretrain/Step": 7771, "Full-pretrain/Step Time": 17.622996039688587} +{"Full-pretrain/Learning Rate": 4.354057463864028e-06, "Full-pretrain/Loss": 1.93967604637146, "Full-pretrain/Loss (Raw)": 1.7806470394134521, "Full-pretrain/Step": 7772, "Full-pretrain/Step Time": 17.62720146588981} +{"Full-pretrain/Learning Rate": 4.349270630826952e-06, "Full-pretrain/Loss": 1.9375535249710083, "Full-pretrain/Loss (Raw)": 1.9054769277572632, "Full-pretrain/Step": 7773, "Full-pretrain/Step Time": 17.62612957134843} +{"Full-pretrain/Learning Rate": 4.344486179844248e-06, "Full-pretrain/Loss": 1.9535843133926392, "Full-pretrain/Loss (Raw)": 2.249080181121826, "Full-pretrain/Step": 7774, "Full-pretrain/Step Time": 17.625314138829708} +{"Full-pretrain/Learning Rate": 4.339704111467807e-06, "Full-pretrain/Loss": 1.9436113834381104, "Full-pretrain/Loss (Raw)": 1.6864383220672607, "Full-pretrain/Step": 7775, "Full-pretrain/Step Time": 17.621448896825314} +{"Full-pretrain/Learning Rate": 4.334924426249243e-06, "Full-pretrain/Loss": 1.950490117073059, "Full-pretrain/Loss (Raw)": 2.1122679710388184, "Full-pretrain/Step": 7776, "Full-pretrain/Step Time": 17.617924271151423} +{"Full-pretrain/Learning Rate": 4.330147124739875e-06, "Full-pretrain/Loss": 1.9435195922851562, "Full-pretrain/Loss (Raw)": 1.7973253726959229, "Full-pretrain/Step": 7777, "Full-pretrain/Step Time": 17.62009953148663} +{"Full-pretrain/Learning Rate": 4.325372207490774e-06, "Full-pretrain/Loss": 1.9391248226165771, "Full-pretrain/Loss (Raw)": 1.9900566339492798, "Full-pretrain/Step": 7778, "Full-pretrain/Step Time": 17.62548701837659} +{"Full-pretrain/Learning Rate": 4.320599675052725e-06, "Full-pretrain/Loss": 1.9490654468536377, "Full-pretrain/Loss (Raw)": 1.9138201475143433, "Full-pretrain/Step": 7779, "Full-pretrain/Step Time": 17.6204517763108} +{"Full-pretrain/Learning Rate": 4.315829527976234e-06, "Full-pretrain/Loss": 1.953100323677063, "Full-pretrain/Loss (Raw)": 2.134737014770508, "Full-pretrain/Step": 7780, "Full-pretrain/Step Time": 17.624968415126204} +{"Full-pretrain/Learning Rate": 4.3110617668115386e-06, "Full-pretrain/Loss": 1.950876235961914, "Full-pretrain/Loss (Raw)": 1.8869014978408813, "Full-pretrain/Step": 7781, "Full-pretrain/Step Time": 17.62558057717979} +{"Full-pretrain/Learning Rate": 4.306296392108605e-06, "Full-pretrain/Loss": 1.9665014743804932, "Full-pretrain/Loss (Raw)": 1.9136569499969482, "Full-pretrain/Step": 7782, "Full-pretrain/Step Time": 17.623835917562246} +{"Full-pretrain/Learning Rate": 4.301533404417102e-06, "Full-pretrain/Loss": 1.9721332788467407, "Full-pretrain/Loss (Raw)": 1.9539552927017212, "Full-pretrain/Step": 7783, "Full-pretrain/Step Time": 17.62350981682539} +{"Full-pretrain/Learning Rate": 4.296772804286447e-06, "Full-pretrain/Loss": 1.96268892288208, "Full-pretrain/Loss (Raw)": 1.6690171957015991, "Full-pretrain/Step": 7784, "Full-pretrain/Step Time": 17.618658212944865} +{"Full-pretrain/Learning Rate": 4.2920145922657805e-06, "Full-pretrain/Loss": 1.9513001441955566, "Full-pretrain/Loss (Raw)": 1.6992523670196533, "Full-pretrain/Step": 7785, "Full-pretrain/Step Time": 17.624239021912217} +{"Full-pretrain/Learning Rate": 4.2872587689039484e-06, "Full-pretrain/Loss": 1.9442873001098633, "Full-pretrain/Loss (Raw)": 2.183176040649414, "Full-pretrain/Step": 7786, "Full-pretrain/Step Time": 17.62552283704281} +{"Full-pretrain/Learning Rate": 4.282505334749542e-06, "Full-pretrain/Loss": 1.9346354007720947, "Full-pretrain/Loss (Raw)": 2.01328182220459, "Full-pretrain/Step": 7787, "Full-pretrain/Step Time": 17.62707561440766} +{"Full-pretrain/Learning Rate": 4.2777542903508605e-06, "Full-pretrain/Loss": 1.931770920753479, "Full-pretrain/Loss (Raw)": 1.815505862236023, "Full-pretrain/Step": 7788, "Full-pretrain/Step Time": 17.625035412609577} +{"Full-pretrain/Learning Rate": 4.273005636255939e-06, "Full-pretrain/Loss": 1.938089370727539, "Full-pretrain/Loss (Raw)": 2.1635313034057617, "Full-pretrain/Step": 7789, "Full-pretrain/Step Time": 17.628964273259044} +{"Full-pretrain/Learning Rate": 4.268259373012535e-06, "Full-pretrain/Loss": 1.9494507312774658, "Full-pretrain/Loss (Raw)": 2.061699151992798, "Full-pretrain/Step": 7790, "Full-pretrain/Step Time": 17.6266203019768} +{"Full-pretrain/Learning Rate": 4.263515501168122e-06, "Full-pretrain/Loss": 1.9590502977371216, "Full-pretrain/Loss (Raw)": 2.010251522064209, "Full-pretrain/Step": 7791, "Full-pretrain/Step Time": 17.619060188531876} +{"Full-pretrain/Learning Rate": 4.2587740212699175e-06, "Full-pretrain/Loss": 1.9469484090805054, "Full-pretrain/Loss (Raw)": 1.6586318016052246, "Full-pretrain/Step": 7792, "Full-pretrain/Step Time": 17.624048674479127} +{"Full-pretrain/Learning Rate": 4.2540349338648366e-06, "Full-pretrain/Loss": 1.9454729557037354, "Full-pretrain/Loss (Raw)": 1.894654631614685, "Full-pretrain/Step": 7793, "Full-pretrain/Step Time": 17.631498822942376} +{"Full-pretrain/Learning Rate": 4.249298239499533e-06, "Full-pretrain/Loss": 1.9368046522140503, "Full-pretrain/Loss (Raw)": 1.9760205745697021, "Full-pretrain/Step": 7794, "Full-pretrain/Step Time": 17.63697942532599} +{"Full-pretrain/Learning Rate": 4.2445639387203865e-06, "Full-pretrain/Loss": 1.9288501739501953, "Full-pretrain/Loss (Raw)": 1.962050437927246, "Full-pretrain/Step": 7795, "Full-pretrain/Step Time": 17.63158834911883} +{"Full-pretrain/Learning Rate": 4.239832032073493e-06, "Full-pretrain/Loss": 1.9345448017120361, "Full-pretrain/Loss (Raw)": 2.0327847003936768, "Full-pretrain/Step": 7796, "Full-pretrain/Step Time": 17.628040121868253} +{"Full-pretrain/Learning Rate": 4.235102520104681e-06, "Full-pretrain/Loss": 1.9234938621520996, "Full-pretrain/Loss (Raw)": 1.786595344543457, "Full-pretrain/Step": 7797, "Full-pretrain/Step Time": 17.632190562784672} +{"Full-pretrain/Learning Rate": 4.230375403359502e-06, "Full-pretrain/Loss": 1.915083408355713, "Full-pretrain/Loss (Raw)": 1.8236148357391357, "Full-pretrain/Step": 7798, "Full-pretrain/Step Time": 17.626276465132833} +{"Full-pretrain/Learning Rate": 4.225650682383214e-06, "Full-pretrain/Loss": 1.9284745454788208, "Full-pretrain/Loss (Raw)": 2.2313427925109863, "Full-pretrain/Step": 7799, "Full-pretrain/Step Time": 17.633332885801792} +{"Full-pretrain/Learning Rate": 4.220928357720822e-06, "Full-pretrain/Loss": 1.9218671321868896, "Full-pretrain/Loss (Raw)": 1.9304416179656982, "Full-pretrain/Step": 7800, "Full-pretrain/Step Time": 17.623977096751332} +{"Full-pretrain/Learning Rate": 4.216208429917046e-06, "Full-pretrain/Loss": 1.9240552186965942, "Full-pretrain/Loss (Raw)": 1.9410393238067627, "Full-pretrain/Step": 7801, "Full-pretrain/Step Time": 17.628113394603133} +{"Full-pretrain/Learning Rate": 4.211490899516315e-06, "Full-pretrain/Loss": 1.9211723804473877, "Full-pretrain/Loss (Raw)": 1.6561989784240723, "Full-pretrain/Step": 7802, "Full-pretrain/Step Time": 17.635112004354596} +{"Full-pretrain/Learning Rate": 4.2067757670628126e-06, "Full-pretrain/Loss": 1.933470368385315, "Full-pretrain/Loss (Raw)": 2.0376007556915283, "Full-pretrain/Step": 7803, "Full-pretrain/Step Time": 17.639274738729} +{"Full-pretrain/Learning Rate": 4.2020630331004115e-06, "Full-pretrain/Loss": 1.9344013929367065, "Full-pretrain/Loss (Raw)": 1.810438871383667, "Full-pretrain/Step": 7804, "Full-pretrain/Step Time": 17.63118056766689} +{"Full-pretrain/Learning Rate": 4.1973526981727295e-06, "Full-pretrain/Loss": 1.923454761505127, "Full-pretrain/Loss (Raw)": 1.5551884174346924, "Full-pretrain/Step": 7805, "Full-pretrain/Step Time": 17.62880718894303} +{"Full-pretrain/Learning Rate": 4.192644762823106e-06, "Full-pretrain/Loss": 1.9162640571594238, "Full-pretrain/Loss (Raw)": 2.0189766883850098, "Full-pretrain/Step": 7806, "Full-pretrain/Step Time": 17.630221312865615} +{"Full-pretrain/Learning Rate": 4.187939227594595e-06, "Full-pretrain/Loss": 1.9186590909957886, "Full-pretrain/Loss (Raw)": 1.7630770206451416, "Full-pretrain/Step": 7807, "Full-pretrain/Step Time": 17.62942359596491} +{"Full-pretrain/Learning Rate": 4.183236093029985e-06, "Full-pretrain/Loss": 1.919910192489624, "Full-pretrain/Loss (Raw)": 2.1522998809814453, "Full-pretrain/Step": 7808, "Full-pretrain/Step Time": 17.620731370523572} +{"Full-pretrain/Learning Rate": 4.17853535967177e-06, "Full-pretrain/Loss": 1.929181456565857, "Full-pretrain/Loss (Raw)": 2.0940093994140625, "Full-pretrain/Step": 7809, "Full-pretrain/Step Time": 17.623203808441758} +{"Full-pretrain/Learning Rate": 4.173837028062186e-06, "Full-pretrain/Loss": 1.9300973415374756, "Full-pretrain/Loss (Raw)": 2.0193676948547363, "Full-pretrain/Step": 7810, "Full-pretrain/Step Time": 17.62627800181508} +{"Full-pretrain/Learning Rate": 4.169141098743182e-06, "Full-pretrain/Loss": 1.9351506233215332, "Full-pretrain/Loss (Raw)": 2.075521230697632, "Full-pretrain/Step": 7811, "Full-pretrain/Step Time": 17.625268548727036} +{"Full-pretrain/Learning Rate": 4.16444757225643e-06, "Full-pretrain/Loss": 1.929521083831787, "Full-pretrain/Loss (Raw)": 1.9545930624008179, "Full-pretrain/Step": 7812, "Full-pretrain/Step Time": 17.621712198480964} +{"Full-pretrain/Learning Rate": 4.159756449143337e-06, "Full-pretrain/Loss": 1.9259095191955566, "Full-pretrain/Loss (Raw)": 1.7713319063186646, "Full-pretrain/Step": 7813, "Full-pretrain/Step Time": 17.62064679339528} +{"Full-pretrain/Learning Rate": 4.155067729945005e-06, "Full-pretrain/Loss": 1.9221558570861816, "Full-pretrain/Loss (Raw)": 1.7935415506362915, "Full-pretrain/Step": 7814, "Full-pretrain/Step Time": 17.626766443252563} +{"Full-pretrain/Learning Rate": 4.150381415202287e-06, "Full-pretrain/Loss": 1.9173383712768555, "Full-pretrain/Loss (Raw)": 1.799791693687439, "Full-pretrain/Step": 7815, "Full-pretrain/Step Time": 17.62966172210872} +{"Full-pretrain/Learning Rate": 4.145697505455745e-06, "Full-pretrain/Loss": 1.9224317073822021, "Full-pretrain/Loss (Raw)": 1.8320033550262451, "Full-pretrain/Step": 7816, "Full-pretrain/Step Time": 17.627868263050914} +{"Full-pretrain/Learning Rate": 4.141016001245668e-06, "Full-pretrain/Loss": 1.9302880764007568, "Full-pretrain/Loss (Raw)": 1.9506551027297974, "Full-pretrain/Step": 7817, "Full-pretrain/Step Time": 17.62712275236845} +{"Full-pretrain/Learning Rate": 4.13633690311207e-06, "Full-pretrain/Loss": 1.9261696338653564, "Full-pretrain/Loss (Raw)": 2.0513904094696045, "Full-pretrain/Step": 7818, "Full-pretrain/Step Time": 17.6337606087327} +{"Full-pretrain/Learning Rate": 4.131660211594671e-06, "Full-pretrain/Loss": 1.9200246334075928, "Full-pretrain/Loss (Raw)": 1.8166372776031494, "Full-pretrain/Step": 7819, "Full-pretrain/Step Time": 17.631792647764087} +{"Full-pretrain/Learning Rate": 4.12698592723294e-06, "Full-pretrain/Loss": 1.9238088130950928, "Full-pretrain/Loss (Raw)": 1.9366021156311035, "Full-pretrain/Step": 7820, "Full-pretrain/Step Time": 17.6288459636271} +{"Full-pretrain/Learning Rate": 4.122314050566043e-06, "Full-pretrain/Loss": 1.9180753231048584, "Full-pretrain/Loss (Raw)": 1.9800597429275513, "Full-pretrain/Step": 7821, "Full-pretrain/Step Time": 17.629917254671454} +{"Full-pretrain/Learning Rate": 4.1176445821328795e-06, "Full-pretrain/Loss": 1.9191412925720215, "Full-pretrain/Loss (Raw)": 2.095811128616333, "Full-pretrain/Step": 7822, "Full-pretrain/Step Time": 17.634822469204664} +{"Full-pretrain/Learning Rate": 4.1129775224720775e-06, "Full-pretrain/Loss": 1.9204403162002563, "Full-pretrain/Loss (Raw)": 2.051816463470459, "Full-pretrain/Step": 7823, "Full-pretrain/Step Time": 17.635646609589458} +{"Full-pretrain/Learning Rate": 4.108312872121983e-06, "Full-pretrain/Loss": 1.9346857070922852, "Full-pretrain/Loss (Raw)": 2.11448335647583, "Full-pretrain/Step": 7824, "Full-pretrain/Step Time": 17.632409993559122} +{"Full-pretrain/Learning Rate": 4.103650631620651e-06, "Full-pretrain/Loss": 1.9397257566452026, "Full-pretrain/Loss (Raw)": 2.055936813354492, "Full-pretrain/Step": 7825, "Full-pretrain/Step Time": 17.631310841068625} +{"Full-pretrain/Learning Rate": 4.098990801505875e-06, "Full-pretrain/Loss": 1.9457050561904907, "Full-pretrain/Loss (Raw)": 2.1673617362976074, "Full-pretrain/Step": 7826, "Full-pretrain/Step Time": 17.638931661844254} +{"Full-pretrain/Learning Rate": 4.094333382315166e-06, "Full-pretrain/Loss": 1.9419567584991455, "Full-pretrain/Loss (Raw)": 1.8421008586883545, "Full-pretrain/Step": 7827, "Full-pretrain/Step Time": 17.638494443148375} +{"Full-pretrain/Learning Rate": 4.0896783745857535e-06, "Full-pretrain/Loss": 1.9436147212982178, "Full-pretrain/Loss (Raw)": 2.085838794708252, "Full-pretrain/Step": 7828, "Full-pretrain/Step Time": 17.637880390509963} +{"Full-pretrain/Learning Rate": 4.085025778854598e-06, "Full-pretrain/Loss": 1.944108009338379, "Full-pretrain/Loss (Raw)": 1.8023844957351685, "Full-pretrain/Step": 7829, "Full-pretrain/Step Time": 17.628717053681612} +{"Full-pretrain/Learning Rate": 4.0803755956583644e-06, "Full-pretrain/Loss": 1.9462518692016602, "Full-pretrain/Loss (Raw)": 1.8922169208526611, "Full-pretrain/Step": 7830, "Full-pretrain/Step Time": 17.63673768006265} +{"Full-pretrain/Learning Rate": 4.0757278255334514e-06, "Full-pretrain/Loss": 1.9294061660766602, "Full-pretrain/Loss (Raw)": 1.6922776699066162, "Full-pretrain/Step": 7831, "Full-pretrain/Step Time": 17.63349956832826} +{"Full-pretrain/Learning Rate": 4.071082469015982e-06, "Full-pretrain/Loss": 1.927276611328125, "Full-pretrain/Loss (Raw)": 1.8622982501983643, "Full-pretrain/Step": 7832, "Full-pretrain/Step Time": 17.633402725681663} +{"Full-pretrain/Learning Rate": 4.066439526641796e-06, "Full-pretrain/Loss": 1.9304299354553223, "Full-pretrain/Loss (Raw)": 2.0419440269470215, "Full-pretrain/Step": 7833, "Full-pretrain/Step Time": 17.627604020759463} +{"Full-pretrain/Learning Rate": 4.061798998946459e-06, "Full-pretrain/Loss": 1.9432185888290405, "Full-pretrain/Loss (Raw)": 2.065436840057373, "Full-pretrain/Step": 7834, "Full-pretrain/Step Time": 17.6334220841527} +{"Full-pretrain/Learning Rate": 4.057160886465244e-06, "Full-pretrain/Loss": 1.9374933242797852, "Full-pretrain/Loss (Raw)": 1.8543927669525146, "Full-pretrain/Step": 7835, "Full-pretrain/Step Time": 17.638020718470216} +{"Full-pretrain/Learning Rate": 4.052525189733167e-06, "Full-pretrain/Loss": 1.9423925876617432, "Full-pretrain/Loss (Raw)": 1.9672162532806396, "Full-pretrain/Step": 7836, "Full-pretrain/Step Time": 17.633084900677204} +{"Full-pretrain/Learning Rate": 4.04789190928494e-06, "Full-pretrain/Loss": 1.9531067609786987, "Full-pretrain/Loss (Raw)": 1.8980422019958496, "Full-pretrain/Step": 7837, "Full-pretrain/Step Time": 17.626290298998356} +{"Full-pretrain/Learning Rate": 4.04326104565502e-06, "Full-pretrain/Loss": 1.9521578550338745, "Full-pretrain/Loss (Raw)": 1.9886106252670288, "Full-pretrain/Step": 7838, "Full-pretrain/Step Time": 17.63637224957347} +{"Full-pretrain/Learning Rate": 4.03863259937757e-06, "Full-pretrain/Loss": 1.9564874172210693, "Full-pretrain/Loss (Raw)": 1.9016215801239014, "Full-pretrain/Step": 7839, "Full-pretrain/Step Time": 17.6327993478626} +{"Full-pretrain/Learning Rate": 4.034006570986492e-06, "Full-pretrain/Loss": 1.9579713344573975, "Full-pretrain/Loss (Raw)": 2.1997857093811035, "Full-pretrain/Step": 7840, "Full-pretrain/Step Time": 17.628762597218156} +{"Full-pretrain/Learning Rate": 4.029382961015385e-06, "Full-pretrain/Loss": 1.959270715713501, "Full-pretrain/Loss (Raw)": 2.135591506958008, "Full-pretrain/Step": 7841, "Full-pretrain/Step Time": 17.63013937138021} +{"Full-pretrain/Learning Rate": 4.024761769997578e-06, "Full-pretrain/Loss": 1.952256202697754, "Full-pretrain/Loss (Raw)": 1.7948992252349854, "Full-pretrain/Step": 7842, "Full-pretrain/Step Time": 17.629770807921886} +{"Full-pretrain/Learning Rate": 4.020142998466133e-06, "Full-pretrain/Loss": 1.949152946472168, "Full-pretrain/Loss (Raw)": 1.976217269897461, "Full-pretrain/Step": 7843, "Full-pretrain/Step Time": 17.63101813942194} +{"Full-pretrain/Learning Rate": 4.015526646953821e-06, "Full-pretrain/Loss": 1.9479076862335205, "Full-pretrain/Loss (Raw)": 1.914745569229126, "Full-pretrain/Step": 7844, "Full-pretrain/Step Time": 17.62667817622423} +{"Full-pretrain/Learning Rate": 4.010912715993142e-06, "Full-pretrain/Loss": 1.9503049850463867, "Full-pretrain/Loss (Raw)": 1.8480428457260132, "Full-pretrain/Step": 7845, "Full-pretrain/Step Time": 17.62393370643258} +{"Full-pretrain/Learning Rate": 4.006301206116297e-06, "Full-pretrain/Loss": 1.9545159339904785, "Full-pretrain/Loss (Raw)": 1.9282972812652588, "Full-pretrain/Step": 7846, "Full-pretrain/Step Time": 17.620586870238185} +{"Full-pretrain/Learning Rate": 4.0016921178552325e-06, "Full-pretrain/Loss": 1.949946641921997, "Full-pretrain/Loss (Raw)": 1.6535738706588745, "Full-pretrain/Step": 7847, "Full-pretrain/Step Time": 17.630427431315184} +{"Full-pretrain/Learning Rate": 3.9970854517416e-06, "Full-pretrain/Loss": 1.9427372217178345, "Full-pretrain/Loss (Raw)": 1.6013004779815674, "Full-pretrain/Step": 7848, "Full-pretrain/Step Time": 17.630281193181872} +{"Full-pretrain/Learning Rate": 3.992481208306781e-06, "Full-pretrain/Loss": 1.9380862712860107, "Full-pretrain/Loss (Raw)": 1.8018269538879395, "Full-pretrain/Step": 7849, "Full-pretrain/Step Time": 17.623830134049058} +{"Full-pretrain/Learning Rate": 3.987879388081881e-06, "Full-pretrain/Loss": 1.9413142204284668, "Full-pretrain/Loss (Raw)": 2.1546857357025146, "Full-pretrain/Step": 7850, "Full-pretrain/Step Time": 17.62311189621687} +{"Full-pretrain/Learning Rate": 3.983279991597699e-06, "Full-pretrain/Loss": 1.9448959827423096, "Full-pretrain/Loss (Raw)": 1.9312504529953003, "Full-pretrain/Step": 7851, "Full-pretrain/Step Time": 17.634254455566406} +{"Full-pretrain/Learning Rate": 3.978683019384785e-06, "Full-pretrain/Loss": 1.9411301612854004, "Full-pretrain/Loss (Raw)": 1.8161001205444336, "Full-pretrain/Step": 7852, "Full-pretrain/Step Time": 17.63382826372981} +{"Full-pretrain/Learning Rate": 3.974088471973406e-06, "Full-pretrain/Loss": 1.9384196996688843, "Full-pretrain/Loss (Raw)": 1.8933229446411133, "Full-pretrain/Step": 7853, "Full-pretrain/Step Time": 17.62047901377082} +{"Full-pretrain/Learning Rate": 3.969496349893522e-06, "Full-pretrain/Loss": 1.9397799968719482, "Full-pretrain/Loss (Raw)": 2.139343738555908, "Full-pretrain/Step": 7854, "Full-pretrain/Step Time": 17.622970655560493} +{"Full-pretrain/Learning Rate": 3.964906653674855e-06, "Full-pretrain/Loss": 1.9303936958312988, "Full-pretrain/Loss (Raw)": 1.7514551877975464, "Full-pretrain/Step": 7855, "Full-pretrain/Step Time": 17.62466032616794} +{"Full-pretrain/Learning Rate": 3.960319383846803e-06, "Full-pretrain/Loss": 1.926616907119751, "Full-pretrain/Loss (Raw)": 1.9936230182647705, "Full-pretrain/Step": 7856, "Full-pretrain/Step Time": 17.628961881622672} +{"Full-pretrain/Learning Rate": 3.955734540938519e-06, "Full-pretrain/Loss": 1.9203391075134277, "Full-pretrain/Loss (Raw)": 1.8550479412078857, "Full-pretrain/Step": 7857, "Full-pretrain/Step Time": 17.62267952784896} +{"Full-pretrain/Learning Rate": 3.951152125478858e-06, "Full-pretrain/Loss": 1.921151876449585, "Full-pretrain/Loss (Raw)": 2.1933698654174805, "Full-pretrain/Step": 7858, "Full-pretrain/Step Time": 17.614667791873217} +{"Full-pretrain/Learning Rate": 3.946572137996404e-06, "Full-pretrain/Loss": 1.9279975891113281, "Full-pretrain/Loss (Raw)": 2.0611672401428223, "Full-pretrain/Step": 7859, "Full-pretrain/Step Time": 17.61968645453453} +{"Full-pretrain/Learning Rate": 3.9419945790194534e-06, "Full-pretrain/Loss": 1.9147289991378784, "Full-pretrain/Loss (Raw)": 1.6612422466278076, "Full-pretrain/Step": 7860, "Full-pretrain/Step Time": 17.62174743041396} +{"Full-pretrain/Learning Rate": 3.937419449076035e-06, "Full-pretrain/Loss": 1.9252150058746338, "Full-pretrain/Loss (Raw)": 2.137934923171997, "Full-pretrain/Step": 7861, "Full-pretrain/Step Time": 17.622095052152872} +{"Full-pretrain/Learning Rate": 3.932846748693875e-06, "Full-pretrain/Loss": 1.9217064380645752, "Full-pretrain/Loss (Raw)": 1.7799434661865234, "Full-pretrain/Step": 7862, "Full-pretrain/Step Time": 17.619537003338337} +{"Full-pretrain/Learning Rate": 3.928276478400439e-06, "Full-pretrain/Loss": 1.9297215938568115, "Full-pretrain/Loss (Raw)": 1.9487600326538086, "Full-pretrain/Step": 7863, "Full-pretrain/Step Time": 17.62334014289081} +{"Full-pretrain/Learning Rate": 3.923708638722906e-06, "Full-pretrain/Loss": 1.9397265911102295, "Full-pretrain/Loss (Raw)": 2.1824588775634766, "Full-pretrain/Step": 7864, "Full-pretrain/Step Time": 17.62831444479525} +{"Full-pretrain/Learning Rate": 3.919143230188174e-06, "Full-pretrain/Loss": 1.9388383626937866, "Full-pretrain/Loss (Raw)": 2.0135233402252197, "Full-pretrain/Step": 7865, "Full-pretrain/Step Time": 17.62971563078463} +{"Full-pretrain/Learning Rate": 3.9145802533228695e-06, "Full-pretrain/Loss": 1.9306941032409668, "Full-pretrain/Loss (Raw)": 1.804816484451294, "Full-pretrain/Step": 7866, "Full-pretrain/Step Time": 17.62324552051723} +{"Full-pretrain/Learning Rate": 3.910019708653317e-06, "Full-pretrain/Loss": 1.9304685592651367, "Full-pretrain/Loss (Raw)": 1.8471773862838745, "Full-pretrain/Step": 7867, "Full-pretrain/Step Time": 17.626259710639715} +{"Full-pretrain/Learning Rate": 3.905461596705579e-06, "Full-pretrain/Loss": 1.9283082485198975, "Full-pretrain/Loss (Raw)": 1.8980867862701416, "Full-pretrain/Step": 7868, "Full-pretrain/Step Time": 17.63161540403962} +{"Full-pretrain/Learning Rate": 3.900905918005438e-06, "Full-pretrain/Loss": 1.9278488159179688, "Full-pretrain/Loss (Raw)": 1.8833379745483398, "Full-pretrain/Step": 7869, "Full-pretrain/Step Time": 17.623726533725858} +{"Full-pretrain/Learning Rate": 3.89635267307838e-06, "Full-pretrain/Loss": 1.9127421379089355, "Full-pretrain/Loss (Raw)": 1.505197286605835, "Full-pretrain/Step": 7870, "Full-pretrain/Step Time": 17.626328349113464} +{"Full-pretrain/Learning Rate": 3.891801862449629e-06, "Full-pretrain/Loss": 1.9106884002685547, "Full-pretrain/Loss (Raw)": 1.835900902748108, "Full-pretrain/Step": 7871, "Full-pretrain/Step Time": 17.623519126325846} +{"Full-pretrain/Learning Rate": 3.88725348664411e-06, "Full-pretrain/Loss": 1.9027949571609497, "Full-pretrain/Loss (Raw)": 1.9471971988677979, "Full-pretrain/Step": 7872, "Full-pretrain/Step Time": 17.623657254502177} +{"Full-pretrain/Learning Rate": 3.882707546186481e-06, "Full-pretrain/Loss": 1.9018774032592773, "Full-pretrain/Loss (Raw)": 2.1062278747558594, "Full-pretrain/Step": 7873, "Full-pretrain/Step Time": 17.624968336895108} +{"Full-pretrain/Learning Rate": 3.878164041601118e-06, "Full-pretrain/Loss": 1.9074822664260864, "Full-pretrain/Loss (Raw)": 1.9742563962936401, "Full-pretrain/Step": 7874, "Full-pretrain/Step Time": 17.624614419415593} +{"Full-pretrain/Learning Rate": 3.8736229734121085e-06, "Full-pretrain/Loss": 1.9078233242034912, "Full-pretrain/Loss (Raw)": 1.9871325492858887, "Full-pretrain/Step": 7875, "Full-pretrain/Step Time": 17.624374432489276} +{"Full-pretrain/Learning Rate": 3.86908434214327e-06, "Full-pretrain/Loss": 1.9113367795944214, "Full-pretrain/Loss (Raw)": 2.0271759033203125, "Full-pretrain/Step": 7876, "Full-pretrain/Step Time": 17.6266644988209} +{"Full-pretrain/Learning Rate": 3.8645481483181225e-06, "Full-pretrain/Loss": 1.9150649309158325, "Full-pretrain/Loss (Raw)": 1.9673446416854858, "Full-pretrain/Step": 7877, "Full-pretrain/Step Time": 17.62754693441093} +{"Full-pretrain/Learning Rate": 3.860014392459918e-06, "Full-pretrain/Loss": 1.9137686491012573, "Full-pretrain/Loss (Raw)": 1.8868154287338257, "Full-pretrain/Step": 7878, "Full-pretrain/Step Time": 17.624244809150696} +{"Full-pretrain/Learning Rate": 3.855483075091623e-06, "Full-pretrain/Loss": 1.925171136856079, "Full-pretrain/Loss (Raw)": 2.018454074859619, "Full-pretrain/Step": 7879, "Full-pretrain/Step Time": 17.622330082580447} +{"Full-pretrain/Learning Rate": 3.8509541967359254e-06, "Full-pretrain/Loss": 1.9194636344909668, "Full-pretrain/Loss (Raw)": 1.4186594486236572, "Full-pretrain/Step": 7880, "Full-pretrain/Step Time": 17.63084185682237} +{"Full-pretrain/Learning Rate": 3.8464277579152275e-06, "Full-pretrain/Loss": 1.9196174144744873, "Full-pretrain/Loss (Raw)": 1.8067501783370972, "Full-pretrain/Step": 7881, "Full-pretrain/Step Time": 17.62823018990457} +{"Full-pretrain/Learning Rate": 3.841903759151661e-06, "Full-pretrain/Loss": 1.9059525728225708, "Full-pretrain/Loss (Raw)": 1.717406988143921, "Full-pretrain/Step": 7882, "Full-pretrain/Step Time": 17.626527478918433} +{"Full-pretrain/Learning Rate": 3.837382200967055e-06, "Full-pretrain/Loss": 1.905001163482666, "Full-pretrain/Loss (Raw)": 1.9008052349090576, "Full-pretrain/Step": 7883, "Full-pretrain/Step Time": 17.628907894715667} +{"Full-pretrain/Learning Rate": 3.832863083882974e-06, "Full-pretrain/Loss": 1.8928251266479492, "Full-pretrain/Loss (Raw)": 1.4264689683914185, "Full-pretrain/Step": 7884, "Full-pretrain/Step Time": 17.621354550123215} +{"Full-pretrain/Learning Rate": 3.828346408420705e-06, "Full-pretrain/Loss": 1.9001445770263672, "Full-pretrain/Loss (Raw)": 2.127544403076172, "Full-pretrain/Step": 7885, "Full-pretrain/Step Time": 17.62690868973732} +{"Full-pretrain/Learning Rate": 3.82383217510123e-06, "Full-pretrain/Loss": 1.8908896446228027, "Full-pretrain/Loss (Raw)": 1.843182921409607, "Full-pretrain/Step": 7886, "Full-pretrain/Step Time": 17.626574493944645} +{"Full-pretrain/Learning Rate": 3.8193203844452795e-06, "Full-pretrain/Loss": 1.889473795890808, "Full-pretrain/Loss (Raw)": 1.7061516046524048, "Full-pretrain/Step": 7887, "Full-pretrain/Step Time": 17.623237213119864} +{"Full-pretrain/Learning Rate": 3.814811036973271e-06, "Full-pretrain/Loss": 1.8821814060211182, "Full-pretrain/Loss (Raw)": 1.7602651119232178, "Full-pretrain/Step": 7888, "Full-pretrain/Step Time": 17.631227552890778} +{"Full-pretrain/Learning Rate": 3.8103041332053668e-06, "Full-pretrain/Loss": 1.877502202987671, "Full-pretrain/Loss (Raw)": 1.7053134441375732, "Full-pretrain/Step": 7889, "Full-pretrain/Step Time": 17.627436006441712} +{"Full-pretrain/Learning Rate": 3.805799673661431e-06, "Full-pretrain/Loss": 1.8632700443267822, "Full-pretrain/Loss (Raw)": 1.7379425764083862, "Full-pretrain/Step": 7890, "Full-pretrain/Step Time": 17.631368862465024} +{"Full-pretrain/Learning Rate": 3.8012976588610582e-06, "Full-pretrain/Loss": 1.8701276779174805, "Full-pretrain/Loss (Raw)": 2.280611515045166, "Full-pretrain/Step": 7891, "Full-pretrain/Step Time": 17.629692705348134} +{"Full-pretrain/Learning Rate": 3.7967980893235555e-06, "Full-pretrain/Loss": 1.883088231086731, "Full-pretrain/Loss (Raw)": 2.0759780406951904, "Full-pretrain/Step": 7892, "Full-pretrain/Step Time": 17.62769148312509} +{"Full-pretrain/Learning Rate": 3.7923009655679353e-06, "Full-pretrain/Loss": 1.8790066242218018, "Full-pretrain/Loss (Raw)": 2.007326364517212, "Full-pretrain/Step": 7893, "Full-pretrain/Step Time": 17.623935736715794} +{"Full-pretrain/Learning Rate": 3.7878062881129467e-06, "Full-pretrain/Loss": 1.8870047330856323, "Full-pretrain/Loss (Raw)": 2.0358810424804688, "Full-pretrain/Step": 7894, "Full-pretrain/Step Time": 17.627243706956506} +{"Full-pretrain/Learning Rate": 3.783314057477047e-06, "Full-pretrain/Loss": 1.8674530982971191, "Full-pretrain/Loss (Raw)": 1.3231102228164673, "Full-pretrain/Step": 7895, "Full-pretrain/Step Time": 17.629760479554534} +{"Full-pretrain/Learning Rate": 3.7788242741784164e-06, "Full-pretrain/Loss": 1.8637404441833496, "Full-pretrain/Loss (Raw)": 2.0636510848999023, "Full-pretrain/Step": 7896, "Full-pretrain/Step Time": 17.62524875998497} +{"Full-pretrain/Learning Rate": 3.7743369387349514e-06, "Full-pretrain/Loss": 1.8484046459197998, "Full-pretrain/Loss (Raw)": 1.5227775573730469, "Full-pretrain/Step": 7897, "Full-pretrain/Step Time": 17.628466865047812} +{"Full-pretrain/Learning Rate": 3.7698520516642576e-06, "Full-pretrain/Loss": 1.854248046875, "Full-pretrain/Loss (Raw)": 1.9918086528778076, "Full-pretrain/Step": 7898, "Full-pretrain/Step Time": 17.622766494750977} +{"Full-pretrain/Learning Rate": 3.7653696134836687e-06, "Full-pretrain/Loss": 1.860034465789795, "Full-pretrain/Loss (Raw)": 2.0323405265808105, "Full-pretrain/Step": 7899, "Full-pretrain/Step Time": 17.62580214627087} +{"Full-pretrain/Learning Rate": 3.7608896247102315e-06, "Full-pretrain/Loss": 1.8668088912963867, "Full-pretrain/Loss (Raw)": 2.114867687225342, "Full-pretrain/Step": 7900, "Full-pretrain/Step Time": 17.626007856801152} +{"Full-pretrain/Learning Rate": 3.7564120858607136e-06, "Full-pretrain/Loss": 1.8692049980163574, "Full-pretrain/Loss (Raw)": 1.960014820098877, "Full-pretrain/Step": 7901, "Full-pretrain/Step Time": 17.631182802841067} +{"Full-pretrain/Learning Rate": 3.7519369974515993e-06, "Full-pretrain/Loss": 1.879065990447998, "Full-pretrain/Loss (Raw)": 1.820744276046753, "Full-pretrain/Step": 7902, "Full-pretrain/Step Time": 17.621961606666446} +{"Full-pretrain/Learning Rate": 3.747464359999081e-06, "Full-pretrain/Loss": 1.8844579458236694, "Full-pretrain/Loss (Raw)": 2.00844407081604, "Full-pretrain/Step": 7903, "Full-pretrain/Step Time": 17.630275206640363} +{"Full-pretrain/Learning Rate": 3.7429941740190877e-06, "Full-pretrain/Loss": 1.8923087120056152, "Full-pretrain/Loss (Raw)": 2.198420763015747, "Full-pretrain/Step": 7904, "Full-pretrain/Step Time": 17.632902858778834} +{"Full-pretrain/Learning Rate": 3.7385264400272373e-06, "Full-pretrain/Loss": 1.8901970386505127, "Full-pretrain/Loss (Raw)": 2.0386576652526855, "Full-pretrain/Step": 7905, "Full-pretrain/Step Time": 17.630340680480003} +{"Full-pretrain/Learning Rate": 3.734061158538893e-06, "Full-pretrain/Loss": 1.8943967819213867, "Full-pretrain/Loss (Raw)": 2.1086485385894775, "Full-pretrain/Step": 7906, "Full-pretrain/Step Time": 17.625408068299294} +{"Full-pretrain/Learning Rate": 3.7295983300691174e-06, "Full-pretrain/Loss": 1.8929798603057861, "Full-pretrain/Loss (Raw)": 1.9417873620986938, "Full-pretrain/Step": 7907, "Full-pretrain/Step Time": 17.63124193623662} +{"Full-pretrain/Learning Rate": 3.725137955132707e-06, "Full-pretrain/Loss": 1.890822410583496, "Full-pretrain/Loss (Raw)": 1.9581398963928223, "Full-pretrain/Step": 7908, "Full-pretrain/Step Time": 17.623004157096148} +{"Full-pretrain/Learning Rate": 3.7206800342441534e-06, "Full-pretrain/Loss": 1.8883142471313477, "Full-pretrain/Loss (Raw)": 1.8870859146118164, "Full-pretrain/Step": 7909, "Full-pretrain/Step Time": 17.62668241560459} +{"Full-pretrain/Learning Rate": 3.7162245679176784e-06, "Full-pretrain/Loss": 1.8910577297210693, "Full-pretrain/Loss (Raw)": 1.974607229232788, "Full-pretrain/Step": 7910, "Full-pretrain/Step Time": 17.62673802115023} +{"Full-pretrain/Learning Rate": 3.711771556667218e-06, "Full-pretrain/Loss": 1.8833684921264648, "Full-pretrain/Loss (Raw)": 1.7723956108093262, "Full-pretrain/Step": 7911, "Full-pretrain/Step Time": 17.62574164941907} +{"Full-pretrain/Learning Rate": 3.707321001006428e-06, "Full-pretrain/Loss": 1.9035481214523315, "Full-pretrain/Loss (Raw)": 2.0644073486328125, "Full-pretrain/Step": 7912, "Full-pretrain/Step Time": 17.632731454446912} +{"Full-pretrain/Learning Rate": 3.702872901448684e-06, "Full-pretrain/Loss": 1.9113469123840332, "Full-pretrain/Loss (Raw)": 2.0563154220581055, "Full-pretrain/Step": 7913, "Full-pretrain/Step Time": 17.630396688356996} +{"Full-pretrain/Learning Rate": 3.698427258507062e-06, "Full-pretrain/Loss": 1.9152030944824219, "Full-pretrain/Loss (Raw)": 1.8408045768737793, "Full-pretrain/Step": 7914, "Full-pretrain/Step Time": 17.6349776443094} +{"Full-pretrain/Learning Rate": 3.6939840726943675e-06, "Full-pretrain/Loss": 1.9082633256912231, "Full-pretrain/Loss (Raw)": 1.6787298917770386, "Full-pretrain/Step": 7915, "Full-pretrain/Step Time": 17.63954345136881} +{"Full-pretrain/Learning Rate": 3.6895433445231247e-06, "Full-pretrain/Loss": 1.92134428024292, "Full-pretrain/Loss (Raw)": 1.8450591564178467, "Full-pretrain/Step": 7916, "Full-pretrain/Step Time": 17.641687981784344} +{"Full-pretrain/Learning Rate": 3.6851050745055652e-06, "Full-pretrain/Loss": 1.914665699005127, "Full-pretrain/Loss (Raw)": 1.9138318300247192, "Full-pretrain/Step": 7917, "Full-pretrain/Step Time": 17.636249292641878} +{"Full-pretrain/Learning Rate": 3.680669263153655e-06, "Full-pretrain/Loss": 1.9218004941940308, "Full-pretrain/Loss (Raw)": 2.0714950561523438, "Full-pretrain/Step": 7918, "Full-pretrain/Step Time": 17.638860758394003} +{"Full-pretrain/Learning Rate": 3.6762359109790452e-06, "Full-pretrain/Loss": 1.9264276027679443, "Full-pretrain/Loss (Raw)": 1.8542206287384033, "Full-pretrain/Step": 7919, "Full-pretrain/Step Time": 17.64007930085063} +{"Full-pretrain/Learning Rate": 3.6718050184931353e-06, "Full-pretrain/Loss": 1.9382555484771729, "Full-pretrain/Loss (Raw)": 2.1387577056884766, "Full-pretrain/Step": 7920, "Full-pretrain/Step Time": 17.637141574174166} +{"Full-pretrain/Learning Rate": 3.667376586207014e-06, "Full-pretrain/Loss": 1.9414265155792236, "Full-pretrain/Loss (Raw)": 1.8067858219146729, "Full-pretrain/Step": 7921, "Full-pretrain/Step Time": 17.635171892121434} +{"Full-pretrain/Learning Rate": 3.662950614631508e-06, "Full-pretrain/Loss": 1.955322504043579, "Full-pretrain/Loss (Raw)": 2.1826159954071045, "Full-pretrain/Step": 7922, "Full-pretrain/Step Time": 17.627268739044666} +{"Full-pretrain/Learning Rate": 3.6585271042771486e-06, "Full-pretrain/Loss": 1.9404317140579224, "Full-pretrain/Loss (Raw)": 1.804105281829834, "Full-pretrain/Step": 7923, "Full-pretrain/Step Time": 17.632359171286225} +{"Full-pretrain/Learning Rate": 3.654106055654197e-06, "Full-pretrain/Loss": 1.9372377395629883, "Full-pretrain/Loss (Raw)": 1.9737712144851685, "Full-pretrain/Step": 7924, "Full-pretrain/Step Time": 17.63795778527856} +{"Full-pretrain/Learning Rate": 3.6496874692726003e-06, "Full-pretrain/Loss": 1.9317207336425781, "Full-pretrain/Loss (Raw)": 1.8307844400405884, "Full-pretrain/Step": 7925, "Full-pretrain/Step Time": 17.634377608075738} +{"Full-pretrain/Learning Rate": 3.645271345642054e-06, "Full-pretrain/Loss": 1.921454668045044, "Full-pretrain/Loss (Raw)": 1.7073650360107422, "Full-pretrain/Step": 7926, "Full-pretrain/Step Time": 17.637297600507736} +{"Full-pretrain/Learning Rate": 3.6408576852719533e-06, "Full-pretrain/Loss": 1.9422035217285156, "Full-pretrain/Loss (Raw)": 1.9870760440826416, "Full-pretrain/Step": 7927, "Full-pretrain/Step Time": 17.633636260405183} +{"Full-pretrain/Learning Rate": 3.6364464886714105e-06, "Full-pretrain/Loss": 1.9324860572814941, "Full-pretrain/Loss (Raw)": 1.7526911497116089, "Full-pretrain/Step": 7928, "Full-pretrain/Step Time": 17.638597324490547} +{"Full-pretrain/Learning Rate": 3.632037756349266e-06, "Full-pretrain/Loss": 1.945225477218628, "Full-pretrain/Loss (Raw)": 1.9304335117340088, "Full-pretrain/Step": 7929, "Full-pretrain/Step Time": 17.634977474808693} +{"Full-pretrain/Learning Rate": 3.6276314888140513e-06, "Full-pretrain/Loss": 1.9427164793014526, "Full-pretrain/Loss (Raw)": 1.9115220308303833, "Full-pretrain/Step": 7930, "Full-pretrain/Step Time": 17.627685448154807} +{"Full-pretrain/Learning Rate": 3.6232276865740323e-06, "Full-pretrain/Loss": 1.9386119842529297, "Full-pretrain/Loss (Raw)": 1.900997281074524, "Full-pretrain/Step": 7931, "Full-pretrain/Step Time": 17.624468255788088} +{"Full-pretrain/Learning Rate": 3.618826350137186e-06, "Full-pretrain/Loss": 1.9330235719680786, "Full-pretrain/Loss (Raw)": 1.9360407590866089, "Full-pretrain/Step": 7932, "Full-pretrain/Step Time": 17.62628190778196} +{"Full-pretrain/Learning Rate": 3.6144274800112065e-06, "Full-pretrain/Loss": 1.9272522926330566, "Full-pretrain/Loss (Raw)": 1.7753338813781738, "Full-pretrain/Step": 7933, "Full-pretrain/Step Time": 17.63191944733262} +{"Full-pretrain/Learning Rate": 3.6100310767035102e-06, "Full-pretrain/Loss": 1.9260810613632202, "Full-pretrain/Loss (Raw)": 1.7832624912261963, "Full-pretrain/Step": 7934, "Full-pretrain/Step Time": 17.624263105913997} +{"Full-pretrain/Learning Rate": 3.605637140721205e-06, "Full-pretrain/Loss": 1.924334168434143, "Full-pretrain/Loss (Raw)": 1.952543020248413, "Full-pretrain/Step": 7935, "Full-pretrain/Step Time": 17.625667864456773} +{"Full-pretrain/Learning Rate": 3.6012456725711437e-06, "Full-pretrain/Loss": 1.9097213745117188, "Full-pretrain/Loss (Raw)": 1.7308120727539062, "Full-pretrain/Step": 7936, "Full-pretrain/Step Time": 17.630977543070912} +{"Full-pretrain/Learning Rate": 3.596856672759866e-06, "Full-pretrain/Loss": 1.899156093597412, "Full-pretrain/Loss (Raw)": 1.700567364692688, "Full-pretrain/Step": 7937, "Full-pretrain/Step Time": 17.62731653265655} +{"Full-pretrain/Learning Rate": 3.5924701417936495e-06, "Full-pretrain/Loss": 1.8783164024353027, "Full-pretrain/Loss (Raw)": 1.4417808055877686, "Full-pretrain/Step": 7938, "Full-pretrain/Step Time": 17.621422823518515} +{"Full-pretrain/Learning Rate": 3.588086080178482e-06, "Full-pretrain/Loss": 1.8784550428390503, "Full-pretrain/Loss (Raw)": 1.9462233781814575, "Full-pretrain/Step": 7939, "Full-pretrain/Step Time": 17.626099031418562} +{"Full-pretrain/Learning Rate": 3.5837044884200642e-06, "Full-pretrain/Loss": 1.8797630071640015, "Full-pretrain/Loss (Raw)": 1.999993085861206, "Full-pretrain/Step": 7940, "Full-pretrain/Step Time": 17.626595171168447} +{"Full-pretrain/Learning Rate": 3.579325367023803e-06, "Full-pretrain/Loss": 1.888677954673767, "Full-pretrain/Loss (Raw)": 2.1723642349243164, "Full-pretrain/Step": 7941, "Full-pretrain/Step Time": 17.624578334391117} +{"Full-pretrain/Learning Rate": 3.5749487164948303e-06, "Full-pretrain/Loss": 1.8865514993667603, "Full-pretrain/Loss (Raw)": 1.906559705734253, "Full-pretrain/Step": 7942, "Full-pretrain/Step Time": 17.624092649668455} +{"Full-pretrain/Learning Rate": 3.570574537337998e-06, "Full-pretrain/Loss": 1.8782483339309692, "Full-pretrain/Loss (Raw)": 1.5066959857940674, "Full-pretrain/Step": 7943, "Full-pretrain/Step Time": 17.620111774653196} +{"Full-pretrain/Learning Rate": 3.5662028300578576e-06, "Full-pretrain/Loss": 1.8751493692398071, "Full-pretrain/Loss (Raw)": 1.9652395248413086, "Full-pretrain/Step": 7944, "Full-pretrain/Step Time": 17.62130645662546} +{"Full-pretrain/Learning Rate": 3.561833595158698e-06, "Full-pretrain/Loss": 1.8634649515151978, "Full-pretrain/Loss (Raw)": 1.6824138164520264, "Full-pretrain/Step": 7945, "Full-pretrain/Step Time": 17.620066506788135} +{"Full-pretrain/Learning Rate": 3.5574668331444904e-06, "Full-pretrain/Loss": 1.8722901344299316, "Full-pretrain/Loss (Raw)": 2.1232075691223145, "Full-pretrain/Step": 7946, "Full-pretrain/Step Time": 17.615009671077132} +{"Full-pretrain/Learning Rate": 3.5531025445189494e-06, "Full-pretrain/Loss": 1.8874144554138184, "Full-pretrain/Loss (Raw)": 2.162713050842285, "Full-pretrain/Step": 7947, "Full-pretrain/Step Time": 17.608334319666028} +{"Full-pretrain/Learning Rate": 3.5487407297854937e-06, "Full-pretrain/Loss": 1.8964545726776123, "Full-pretrain/Loss (Raw)": 2.1343393325805664, "Full-pretrain/Step": 7948, "Full-pretrain/Step Time": 17.6124569773674} +{"Full-pretrain/Learning Rate": 3.544381389447254e-06, "Full-pretrain/Loss": 1.9018263816833496, "Full-pretrain/Loss (Raw)": 2.085733652114868, "Full-pretrain/Step": 7949, "Full-pretrain/Step Time": 17.615634128451347} +{"Full-pretrain/Learning Rate": 3.5400245240070905e-06, "Full-pretrain/Loss": 1.890789270401001, "Full-pretrain/Loss (Raw)": 1.7183071374893188, "Full-pretrain/Step": 7950, "Full-pretrain/Step Time": 17.611483715474606} +{"Full-pretrain/Learning Rate": 3.5356701339675474e-06, "Full-pretrain/Loss": 1.8866117000579834, "Full-pretrain/Loss (Raw)": 1.7205383777618408, "Full-pretrain/Step": 7951, "Full-pretrain/Step Time": 17.608191082254052} +{"Full-pretrain/Learning Rate": 3.531318219830912e-06, "Full-pretrain/Loss": 1.8639800548553467, "Full-pretrain/Loss (Raw)": 1.4145454168319702, "Full-pretrain/Step": 7952, "Full-pretrain/Step Time": 17.611739236861467} +{"Full-pretrain/Learning Rate": 3.5269687820991824e-06, "Full-pretrain/Loss": 1.8721938133239746, "Full-pretrain/Loss (Raw)": 2.069624423980713, "Full-pretrain/Step": 7953, "Full-pretrain/Step Time": 17.607082828879356} +{"Full-pretrain/Learning Rate": 3.5226218212740497e-06, "Full-pretrain/Loss": 1.8629863262176514, "Full-pretrain/Loss (Raw)": 1.8879778385162354, "Full-pretrain/Step": 7954, "Full-pretrain/Step Time": 17.602252323180437} +{"Full-pretrain/Learning Rate": 3.518277337856951e-06, "Full-pretrain/Loss": 1.8622926473617554, "Full-pretrain/Loss (Raw)": 1.7819074392318726, "Full-pretrain/Step": 7955, "Full-pretrain/Step Time": 17.6050946675241} +{"Full-pretrain/Learning Rate": 3.5139353323490053e-06, "Full-pretrain/Loss": 1.8680943250656128, "Full-pretrain/Loss (Raw)": 2.1594247817993164, "Full-pretrain/Step": 7956, "Full-pretrain/Step Time": 17.603918202221394} +{"Full-pretrain/Learning Rate": 3.5095958052510675e-06, "Full-pretrain/Loss": 1.8632434606552124, "Full-pretrain/Loss (Raw)": 1.675557255744934, "Full-pretrain/Step": 7957, "Full-pretrain/Step Time": 17.601056108251214} +{"Full-pretrain/Learning Rate": 3.5052587570637006e-06, "Full-pretrain/Loss": 1.8690911531448364, "Full-pretrain/Loss (Raw)": 1.894491195678711, "Full-pretrain/Step": 7958, "Full-pretrain/Step Time": 17.603185949847102} +{"Full-pretrain/Learning Rate": 3.500924188287183e-06, "Full-pretrain/Loss": 1.8667834997177124, "Full-pretrain/Loss (Raw)": 1.9132308959960938, "Full-pretrain/Step": 7959, "Full-pretrain/Step Time": 17.60712344571948} +{"Full-pretrain/Learning Rate": 3.4965920994215056e-06, "Full-pretrain/Loss": 1.8595870733261108, "Full-pretrain/Loss (Raw)": 1.5224058628082275, "Full-pretrain/Step": 7960, "Full-pretrain/Step Time": 17.60746626742184} +{"Full-pretrain/Learning Rate": 3.4922624909663774e-06, "Full-pretrain/Loss": 1.8693733215332031, "Full-pretrain/Loss (Raw)": 2.243593692779541, "Full-pretrain/Step": 7961, "Full-pretrain/Step Time": 17.603466045111418} +{"Full-pretrain/Learning Rate": 3.4879353634212076e-06, "Full-pretrain/Loss": 1.8821775913238525, "Full-pretrain/Loss (Raw)": 2.3212573528289795, "Full-pretrain/Step": 7962, "Full-pretrain/Step Time": 17.601299818605185} +{"Full-pretrain/Learning Rate": 3.4836107172851352e-06, "Full-pretrain/Loss": 1.8891098499298096, "Full-pretrain/Loss (Raw)": 2.1228299140930176, "Full-pretrain/Step": 7963, "Full-pretrain/Step Time": 17.598788114264607} +{"Full-pretrain/Learning Rate": 3.479288553057003e-06, "Full-pretrain/Loss": 1.8926048278808594, "Full-pretrain/Loss (Raw)": 2.0478806495666504, "Full-pretrain/Step": 7964, "Full-pretrain/Step Time": 17.600828666239977} +{"Full-pretrain/Learning Rate": 3.4749688712353735e-06, "Full-pretrain/Loss": 1.9050709009170532, "Full-pretrain/Loss (Raw)": 2.1742477416992188, "Full-pretrain/Step": 7965, "Full-pretrain/Step Time": 17.606608597561717} +{"Full-pretrain/Learning Rate": 3.4706516723185256e-06, "Full-pretrain/Loss": 1.9040969610214233, "Full-pretrain/Loss (Raw)": 1.7520946264266968, "Full-pretrain/Step": 7966, "Full-pretrain/Step Time": 17.596440056338906} +{"Full-pretrain/Learning Rate": 3.466336956804436e-06, "Full-pretrain/Loss": 1.9063502550125122, "Full-pretrain/Loss (Raw)": 2.024648427963257, "Full-pretrain/Step": 7967, "Full-pretrain/Step Time": 17.603298846632242} +{"Full-pretrain/Learning Rate": 3.4620247251908127e-06, "Full-pretrain/Loss": 1.9204635620117188, "Full-pretrain/Loss (Raw)": 2.1824357509613037, "Full-pretrain/Step": 7968, "Full-pretrain/Step Time": 17.598840719088912} +{"Full-pretrain/Learning Rate": 3.4577149779750713e-06, "Full-pretrain/Loss": 1.9268958568572998, "Full-pretrain/Loss (Raw)": 1.9064010381698608, "Full-pretrain/Step": 7969, "Full-pretrain/Step Time": 17.60233379341662} +{"Full-pretrain/Learning Rate": 3.4534077156543333e-06, "Full-pretrain/Loss": 1.9411442279815674, "Full-pretrain/Loss (Raw)": 1.897729754447937, "Full-pretrain/Step": 7970, "Full-pretrain/Step Time": 17.60122805275023} +{"Full-pretrain/Learning Rate": 3.4491029387254486e-06, "Full-pretrain/Loss": 1.9473797082901, "Full-pretrain/Loss (Raw)": 2.145759344100952, "Full-pretrain/Step": 7971, "Full-pretrain/Step Time": 17.60690370760858} +{"Full-pretrain/Learning Rate": 3.444800647684959e-06, "Full-pretrain/Loss": 1.9469819068908691, "Full-pretrain/Loss (Raw)": 1.9872623682022095, "Full-pretrain/Step": 7972, "Full-pretrain/Step Time": 17.60514198616147} +{"Full-pretrain/Learning Rate": 3.440500843029143e-06, "Full-pretrain/Loss": 1.9398419857025146, "Full-pretrain/Loss (Raw)": 1.943888783454895, "Full-pretrain/Step": 7973, "Full-pretrain/Step Time": 17.608005829155445} +{"Full-pretrain/Learning Rate": 3.4362035252539754e-06, "Full-pretrain/Loss": 1.9462380409240723, "Full-pretrain/Loss (Raw)": 2.111232280731201, "Full-pretrain/Step": 7974, "Full-pretrain/Step Time": 17.614331636577845} +{"Full-pretrain/Learning Rate": 3.4319086948551544e-06, "Full-pretrain/Loss": 1.952837347984314, "Full-pretrain/Loss (Raw)": 1.7178736925125122, "Full-pretrain/Step": 7975, "Full-pretrain/Step Time": 17.603078136220574} +{"Full-pretrain/Learning Rate": 3.427616352328089e-06, "Full-pretrain/Loss": 1.9375289678573608, "Full-pretrain/Loss (Raw)": 1.4753713607788086, "Full-pretrain/Step": 7976, "Full-pretrain/Step Time": 17.60140604712069} +{"Full-pretrain/Learning Rate": 3.4233264981678947e-06, "Full-pretrain/Loss": 1.9393539428710938, "Full-pretrain/Loss (Raw)": 1.740816354751587, "Full-pretrain/Step": 7977, "Full-pretrain/Step Time": 17.601080808788538} +{"Full-pretrain/Learning Rate": 3.4190391328694034e-06, "Full-pretrain/Loss": 1.9311575889587402, "Full-pretrain/Loss (Raw)": 1.8609247207641602, "Full-pretrain/Step": 7978, "Full-pretrain/Step Time": 17.60520327836275} +{"Full-pretrain/Learning Rate": 3.4147542569271635e-06, "Full-pretrain/Loss": 1.9250901937484741, "Full-pretrain/Loss (Raw)": 1.9685540199279785, "Full-pretrain/Step": 7979, "Full-pretrain/Step Time": 17.60468058474362} +{"Full-pretrain/Learning Rate": 3.4104718708354354e-06, "Full-pretrain/Loss": 1.915459394454956, "Full-pretrain/Loss (Raw)": 1.8261582851409912, "Full-pretrain/Step": 7980, "Full-pretrain/Step Time": 17.602866588160396} +{"Full-pretrain/Learning Rate": 3.406191975088191e-06, "Full-pretrain/Loss": 1.9084341526031494, "Full-pretrain/Loss (Raw)": 1.8609212636947632, "Full-pretrain/Step": 7981, "Full-pretrain/Step Time": 17.607578981667757} +{"Full-pretrain/Learning Rate": 3.4019145701791184e-06, "Full-pretrain/Loss": 1.9181878566741943, "Full-pretrain/Loss (Raw)": 2.030431032180786, "Full-pretrain/Step": 7982, "Full-pretrain/Step Time": 17.61085028387606} +{"Full-pretrain/Learning Rate": 3.397639656601606e-06, "Full-pretrain/Loss": 1.9275771379470825, "Full-pretrain/Loss (Raw)": 2.0209906101226807, "Full-pretrain/Step": 7983, "Full-pretrain/Step Time": 17.609657008200884} +{"Full-pretrain/Learning Rate": 3.3933672348487655e-06, "Full-pretrain/Loss": 1.9485626220703125, "Full-pretrain/Loss (Raw)": 2.0860867500305176, "Full-pretrain/Step": 7984, "Full-pretrain/Step Time": 17.60356247611344} +{"Full-pretrain/Learning Rate": 3.3890973054134217e-06, "Full-pretrain/Loss": 1.9372153282165527, "Full-pretrain/Loss (Raw)": 1.7065058946609497, "Full-pretrain/Step": 7985, "Full-pretrain/Step Time": 17.60785449296236} +{"Full-pretrain/Learning Rate": 3.3848298687881143e-06, "Full-pretrain/Loss": 1.9346137046813965, "Full-pretrain/Loss (Raw)": 1.8047287464141846, "Full-pretrain/Step": 7986, "Full-pretrain/Step Time": 17.615304371342063} +{"Full-pretrain/Learning Rate": 3.3805649254650825e-06, "Full-pretrain/Loss": 1.9402010440826416, "Full-pretrain/Loss (Raw)": 1.960699200630188, "Full-pretrain/Step": 7987, "Full-pretrain/Step Time": 17.607806550338864} +{"Full-pretrain/Learning Rate": 3.376302475936291e-06, "Full-pretrain/Loss": 1.9309537410736084, "Full-pretrain/Loss (Raw)": 1.8635094165802002, "Full-pretrain/Step": 7988, "Full-pretrain/Step Time": 17.60424468666315} +{"Full-pretrain/Learning Rate": 3.3720425206934055e-06, "Full-pretrain/Loss": 1.9350690841674805, "Full-pretrain/Loss (Raw)": 1.8072509765625, "Full-pretrain/Step": 7989, "Full-pretrain/Step Time": 17.60495026782155} +{"Full-pretrain/Learning Rate": 3.3677850602278156e-06, "Full-pretrain/Loss": 1.9317514896392822, "Full-pretrain/Loss (Raw)": 1.7883296012878418, "Full-pretrain/Step": 7990, "Full-pretrain/Step Time": 17.60769384354353} +{"Full-pretrain/Learning Rate": 3.3635300950306174e-06, "Full-pretrain/Loss": 1.9330813884735107, "Full-pretrain/Loss (Raw)": 1.9557846784591675, "Full-pretrain/Step": 7991, "Full-pretrain/Step Time": 17.60522734373808} +{"Full-pretrain/Learning Rate": 3.3592776255926217e-06, "Full-pretrain/Loss": 1.9459915161132812, "Full-pretrain/Loss (Raw)": 1.9355264902114868, "Full-pretrain/Step": 7992, "Full-pretrain/Step Time": 17.596478519961238} +{"Full-pretrain/Learning Rate": 3.355027652404344e-06, "Full-pretrain/Loss": 1.9355602264404297, "Full-pretrain/Loss (Raw)": 1.9097962379455566, "Full-pretrain/Step": 7993, "Full-pretrain/Step Time": 17.597326766699553} +{"Full-pretrain/Learning Rate": 3.3507801759560198e-06, "Full-pretrain/Loss": 1.928694248199463, "Full-pretrain/Loss (Raw)": 2.101543426513672, "Full-pretrain/Step": 7994, "Full-pretrain/Step Time": 17.60111477598548} +{"Full-pretrain/Learning Rate": 3.3465351967375936e-06, "Full-pretrain/Loss": 1.9417879581451416, "Full-pretrain/Loss (Raw)": 2.5418343544006348, "Full-pretrain/Step": 7995, "Full-pretrain/Step Time": 17.601461205631495} +{"Full-pretrain/Learning Rate": 3.3422927152387236e-06, "Full-pretrain/Loss": 1.930955410003662, "Full-pretrain/Loss (Raw)": 1.701233148574829, "Full-pretrain/Step": 7996, "Full-pretrain/Step Time": 17.59374462068081} +{"Full-pretrain/Learning Rate": 3.338052731948782e-06, "Full-pretrain/Loss": 1.9204604625701904, "Full-pretrain/Loss (Raw)": 1.8384121656417847, "Full-pretrain/Step": 7997, "Full-pretrain/Step Time": 17.602659549564123} +{"Full-pretrain/Learning Rate": 3.333815247356839e-06, "Full-pretrain/Loss": 1.927579402923584, "Full-pretrain/Loss (Raw)": 1.9799034595489502, "Full-pretrain/Step": 7998, "Full-pretrain/Step Time": 17.597563438117504} +{"Full-pretrain/Learning Rate": 3.3295802619516954e-06, "Full-pretrain/Loss": 1.9250657558441162, "Full-pretrain/Loss (Raw)": 1.9442119598388672, "Full-pretrain/Step": 7999, "Full-pretrain/Step Time": 17.601717298850417} +{"Full-pretrain/Learning Rate": 3.3253477762218517e-06, "Full-pretrain/Loss": 1.9116466045379639, "Full-pretrain/Loss (Raw)": 1.753021001815796, "Full-pretrain/Step": 8000, "Full-pretrain/Step Time": 17.593577595427632} +{"Full-pretrain/Learning Rate": 3.321117790655526e-06, "Full-pretrain/Loss": 1.916351079940796, "Full-pretrain/Loss (Raw)": 2.056946277618408, "Full-pretrain/Step": 8001, "Full-pretrain/Step Time": 17.601440373808146} +{"Full-pretrain/Learning Rate": 3.3168903057406497e-06, "Full-pretrain/Loss": 1.9218828678131104, "Full-pretrain/Loss (Raw)": 2.0747437477111816, "Full-pretrain/Step": 8002, "Full-pretrain/Step Time": 17.59973736666143} +{"Full-pretrain/Learning Rate": 3.31266532196485e-06, "Full-pretrain/Loss": 1.9195359945297241, "Full-pretrain/Loss (Raw)": 2.0706627368927, "Full-pretrain/Step": 8003, "Full-pretrain/Step Time": 17.596625577658415} +{"Full-pretrain/Learning Rate": 3.3084428398154924e-06, "Full-pretrain/Loss": 1.9187657833099365, "Full-pretrain/Loss (Raw)": 1.9626163244247437, "Full-pretrain/Step": 8004, "Full-pretrain/Step Time": 17.591758938506246} +{"Full-pretrain/Learning Rate": 3.304222859779621e-06, "Full-pretrain/Loss": 1.9123519659042358, "Full-pretrain/Loss (Raw)": 1.7386460304260254, "Full-pretrain/Step": 8005, "Full-pretrain/Step Time": 17.591351320967078} +{"Full-pretrain/Learning Rate": 3.3000053823440207e-06, "Full-pretrain/Loss": 1.9140985012054443, "Full-pretrain/Loss (Raw)": 2.1671204566955566, "Full-pretrain/Step": 8006, "Full-pretrain/Step Time": 17.600933885201812} +{"Full-pretrain/Learning Rate": 3.2957904079951725e-06, "Full-pretrain/Loss": 1.9141461849212646, "Full-pretrain/Loss (Raw)": 1.7193983793258667, "Full-pretrain/Step": 8007, "Full-pretrain/Step Time": 17.598780488595366} +{"Full-pretrain/Learning Rate": 3.291577937219281e-06, "Full-pretrain/Loss": 1.9343520402908325, "Full-pretrain/Loss (Raw)": 2.121957540512085, "Full-pretrain/Step": 8008, "Full-pretrain/Step Time": 17.59223659336567} +{"Full-pretrain/Learning Rate": 3.287367970502239e-06, "Full-pretrain/Loss": 1.9501330852508545, "Full-pretrain/Loss (Raw)": 2.2458112239837646, "Full-pretrain/Step": 8009, "Full-pretrain/Step Time": 17.595461739227176} +{"Full-pretrain/Learning Rate": 3.283160508329669e-06, "Full-pretrain/Loss": 1.9531328678131104, "Full-pretrain/Loss (Raw)": 1.9569177627563477, "Full-pretrain/Step": 8010, "Full-pretrain/Step Time": 17.59922155737877} +{"Full-pretrain/Learning Rate": 3.2789555511869047e-06, "Full-pretrain/Loss": 1.9573264122009277, "Full-pretrain/Loss (Raw)": 2.1027450561523438, "Full-pretrain/Step": 8011, "Full-pretrain/Step Time": 17.600182984024286} +{"Full-pretrain/Learning Rate": 3.274753099558983e-06, "Full-pretrain/Loss": 1.9596055746078491, "Full-pretrain/Loss (Raw)": 1.8990895748138428, "Full-pretrain/Step": 8012, "Full-pretrain/Step Time": 17.601974193006754} +{"Full-pretrain/Learning Rate": 3.2705531539306638e-06, "Full-pretrain/Loss": 1.963294267654419, "Full-pretrain/Loss (Raw)": 1.9789620637893677, "Full-pretrain/Step": 8013, "Full-pretrain/Step Time": 17.601024633273482} +{"Full-pretrain/Learning Rate": 3.2663557147863954e-06, "Full-pretrain/Loss": 1.9515995979309082, "Full-pretrain/Loss (Raw)": 1.6561992168426514, "Full-pretrain/Step": 8014, "Full-pretrain/Step Time": 17.60339042544365} +{"Full-pretrain/Learning Rate": 3.2621607826103572e-06, "Full-pretrain/Loss": 1.9441940784454346, "Full-pretrain/Loss (Raw)": 1.784015417098999, "Full-pretrain/Step": 8015, "Full-pretrain/Step Time": 17.601871646940708} +{"Full-pretrain/Learning Rate": 3.2579683578864347e-06, "Full-pretrain/Loss": 1.9424264430999756, "Full-pretrain/Loss (Raw)": 2.0295233726501465, "Full-pretrain/Step": 8016, "Full-pretrain/Step Time": 17.597868686541915} +{"Full-pretrain/Learning Rate": 3.253778441098221e-06, "Full-pretrain/Loss": 1.9524481296539307, "Full-pretrain/Loss (Raw)": 2.0271992683410645, "Full-pretrain/Step": 8017, "Full-pretrain/Step Time": 17.597138231620193} +{"Full-pretrain/Learning Rate": 3.2495910327290267e-06, "Full-pretrain/Loss": 1.940248727798462, "Full-pretrain/Loss (Raw)": 1.4143469333648682, "Full-pretrain/Step": 8018, "Full-pretrain/Step Time": 17.596729699522257} +{"Full-pretrain/Learning Rate": 3.245406133261858e-06, "Full-pretrain/Loss": 1.9290744066238403, "Full-pretrain/Loss (Raw)": 1.6031219959259033, "Full-pretrain/Step": 8019, "Full-pretrain/Step Time": 17.59958221949637} +{"Full-pretrain/Learning Rate": 3.241223743179453e-06, "Full-pretrain/Loss": 1.9331607818603516, "Full-pretrain/Loss (Raw)": 1.994273066520691, "Full-pretrain/Step": 8020, "Full-pretrain/Step Time": 17.603194925934076} +{"Full-pretrain/Learning Rate": 3.237043862964237e-06, "Full-pretrain/Loss": 1.936440110206604, "Full-pretrain/Loss (Raw)": 1.9121912717819214, "Full-pretrain/Step": 8021, "Full-pretrain/Step Time": 17.60155998170376} +{"Full-pretrain/Learning Rate": 3.2328664930983633e-06, "Full-pretrain/Loss": 1.9416251182556152, "Full-pretrain/Loss (Raw)": 1.954245924949646, "Full-pretrain/Step": 8022, "Full-pretrain/Step Time": 17.604943798854947} +{"Full-pretrain/Learning Rate": 3.228691634063688e-06, "Full-pretrain/Loss": 1.9404489994049072, "Full-pretrain/Loss (Raw)": 1.9181501865386963, "Full-pretrain/Step": 8023, "Full-pretrain/Step Time": 17.607153804972768} +{"Full-pretrain/Learning Rate": 3.22451928634179e-06, "Full-pretrain/Loss": 1.9427597522735596, "Full-pretrain/Loss (Raw)": 2.0094728469848633, "Full-pretrain/Step": 8024, "Full-pretrain/Step Time": 17.60842278972268} +{"Full-pretrain/Learning Rate": 3.2203494504139343e-06, "Full-pretrain/Loss": 1.9396030902862549, "Full-pretrain/Loss (Raw)": 1.8087856769561768, "Full-pretrain/Step": 8025, "Full-pretrain/Step Time": 17.60621335543692} +{"Full-pretrain/Learning Rate": 3.2161821267611137e-06, "Full-pretrain/Loss": 1.9439244270324707, "Full-pretrain/Loss (Raw)": 2.2398219108581543, "Full-pretrain/Step": 8026, "Full-pretrain/Step Time": 17.609163403511047} +{"Full-pretrain/Learning Rate": 3.21201731586403e-06, "Full-pretrain/Loss": 1.9189705848693848, "Full-pretrain/Loss (Raw)": 1.7433143854141235, "Full-pretrain/Step": 8027, "Full-pretrain/Step Time": 17.605560794472694} +{"Full-pretrain/Learning Rate": 3.207855018203093e-06, "Full-pretrain/Loss": 1.9253162145614624, "Full-pretrain/Loss (Raw)": 1.9042903184890747, "Full-pretrain/Step": 8028, "Full-pretrain/Step Time": 17.60002068988979} +{"Full-pretrain/Learning Rate": 3.2036952342584274e-06, "Full-pretrain/Loss": 1.914478063583374, "Full-pretrain/Loss (Raw)": 1.4915904998779297, "Full-pretrain/Step": 8029, "Full-pretrain/Step Time": 17.604307437315583} +{"Full-pretrain/Learning Rate": 3.1995379645098496e-06, "Full-pretrain/Loss": 1.9218392372131348, "Full-pretrain/Loss (Raw)": 2.215463638305664, "Full-pretrain/Step": 8030, "Full-pretrain/Step Time": 17.60742810368538} +{"Full-pretrain/Learning Rate": 3.195383209436906e-06, "Full-pretrain/Loss": 1.9210429191589355, "Full-pretrain/Loss (Raw)": 1.9187290668487549, "Full-pretrain/Step": 8031, "Full-pretrain/Step Time": 17.612178625538945} +{"Full-pretrain/Learning Rate": 3.1912309695188463e-06, "Full-pretrain/Loss": 1.9289703369140625, "Full-pretrain/Loss (Raw)": 2.006697177886963, "Full-pretrain/Step": 8032, "Full-pretrain/Step Time": 17.608334997668862} +{"Full-pretrain/Learning Rate": 3.1870812452346328e-06, "Full-pretrain/Loss": 1.9261788129806519, "Full-pretrain/Loss (Raw)": 1.9676185846328735, "Full-pretrain/Step": 8033, "Full-pretrain/Step Time": 17.6039425060153} +{"Full-pretrain/Learning Rate": 3.1829340370629347e-06, "Full-pretrain/Loss": 1.9198870658874512, "Full-pretrain/Loss (Raw)": 1.8734065294265747, "Full-pretrain/Step": 8034, "Full-pretrain/Step Time": 17.603453738614917} +{"Full-pretrain/Learning Rate": 3.178789345482125e-06, "Full-pretrain/Loss": 1.915542721748352, "Full-pretrain/Loss (Raw)": 1.9316463470458984, "Full-pretrain/Step": 8035, "Full-pretrain/Step Time": 17.60556354187429} +{"Full-pretrain/Learning Rate": 3.1746471709702964e-06, "Full-pretrain/Loss": 1.924370288848877, "Full-pretrain/Loss (Raw)": 2.2450978755950928, "Full-pretrain/Step": 8036, "Full-pretrain/Step Time": 17.605184253305197} +{"Full-pretrain/Learning Rate": 3.17050751400525e-06, "Full-pretrain/Loss": 1.936659336090088, "Full-pretrain/Loss (Raw)": 2.131894111633301, "Full-pretrain/Step": 8037, "Full-pretrain/Step Time": 17.60132121294737} +{"Full-pretrain/Learning Rate": 3.1663703750644843e-06, "Full-pretrain/Loss": 1.9288578033447266, "Full-pretrain/Loss (Raw)": 1.917472243309021, "Full-pretrain/Step": 8038, "Full-pretrain/Step Time": 17.59366498887539} +{"Full-pretrain/Learning Rate": 3.162235754625226e-06, "Full-pretrain/Loss": 1.935331106185913, "Full-pretrain/Loss (Raw)": 1.9265432357788086, "Full-pretrain/Step": 8039, "Full-pretrain/Step Time": 17.597543129697442} +{"Full-pretrain/Learning Rate": 3.1581036531644014e-06, "Full-pretrain/Loss": 1.9267315864562988, "Full-pretrain/Loss (Raw)": 1.8467724323272705, "Full-pretrain/Step": 8040, "Full-pretrain/Step Time": 17.59419241733849} +{"Full-pretrain/Learning Rate": 3.1539740711586415e-06, "Full-pretrain/Loss": 1.9068247079849243, "Full-pretrain/Loss (Raw)": 1.6087913513183594, "Full-pretrain/Step": 8041, "Full-pretrain/Step Time": 17.587182538583875} +{"Full-pretrain/Learning Rate": 3.1498470090842947e-06, "Full-pretrain/Loss": 1.9092984199523926, "Full-pretrain/Loss (Raw)": 2.0360753536224365, "Full-pretrain/Step": 8042, "Full-pretrain/Step Time": 17.58145264349878} +{"Full-pretrain/Learning Rate": 3.1457224674174167e-06, "Full-pretrain/Loss": 1.9063947200775146, "Full-pretrain/Loss (Raw)": 2.009829044342041, "Full-pretrain/Step": 8043, "Full-pretrain/Step Time": 17.57357789762318} +{"Full-pretrain/Learning Rate": 3.141600446633772e-06, "Full-pretrain/Loss": 1.905713677406311, "Full-pretrain/Loss (Raw)": 1.8772962093353271, "Full-pretrain/Step": 8044, "Full-pretrain/Step Time": 17.579272577539086} +{"Full-pretrain/Learning Rate": 3.1374809472088373e-06, "Full-pretrain/Loss": 1.90072500705719, "Full-pretrain/Loss (Raw)": 1.8193249702453613, "Full-pretrain/Step": 8045, "Full-pretrain/Step Time": 17.578322960063815} +{"Full-pretrain/Learning Rate": 3.133363969617789e-06, "Full-pretrain/Loss": 1.9083969593048096, "Full-pretrain/Loss (Raw)": 1.9017003774642944, "Full-pretrain/Step": 8046, "Full-pretrain/Step Time": 17.57363821193576} +{"Full-pretrain/Learning Rate": 3.1292495143355223e-06, "Full-pretrain/Loss": 1.917982578277588, "Full-pretrain/Loss (Raw)": 2.0907583236694336, "Full-pretrain/Step": 8047, "Full-pretrain/Step Time": 17.57073120959103} +{"Full-pretrain/Learning Rate": 3.1251375818366375e-06, "Full-pretrain/Loss": 1.9178624153137207, "Full-pretrain/Loss (Raw)": 2.025676727294922, "Full-pretrain/Step": 8048, "Full-pretrain/Step Time": 17.57635740749538} +{"Full-pretrain/Learning Rate": 3.121028172595447e-06, "Full-pretrain/Loss": 1.9154480695724487, "Full-pretrain/Loss (Raw)": 1.9499403238296509, "Full-pretrain/Step": 8049, "Full-pretrain/Step Time": 17.57568801008165} +{"Full-pretrain/Learning Rate": 3.116921287085972e-06, "Full-pretrain/Loss": 1.9302958250045776, "Full-pretrain/Loss (Raw)": 1.8894743919372559, "Full-pretrain/Step": 8050, "Full-pretrain/Step Time": 17.581475514918566} +{"Full-pretrain/Learning Rate": 3.112816925781931e-06, "Full-pretrain/Loss": 1.9451556205749512, "Full-pretrain/Loss (Raw)": 2.0786385536193848, "Full-pretrain/Step": 8051, "Full-pretrain/Step Time": 17.576019551604986} +{"Full-pretrain/Learning Rate": 3.1087150891567663e-06, "Full-pretrain/Loss": 1.9410679340362549, "Full-pretrain/Loss (Raw)": 1.8634672164916992, "Full-pretrain/Step": 8052, "Full-pretrain/Step Time": 17.580364525318146} +{"Full-pretrain/Learning Rate": 3.1046157776836283e-06, "Full-pretrain/Loss": 1.9362351894378662, "Full-pretrain/Loss (Raw)": 1.7575397491455078, "Full-pretrain/Step": 8053, "Full-pretrain/Step Time": 17.582339705899358} +{"Full-pretrain/Learning Rate": 3.1005189918353606e-06, "Full-pretrain/Loss": 1.9328824281692505, "Full-pretrain/Loss (Raw)": 1.8469597101211548, "Full-pretrain/Step": 8054, "Full-pretrain/Step Time": 17.580615324899554} +{"Full-pretrain/Learning Rate": 3.096424732084535e-06, "Full-pretrain/Loss": 1.924767255783081, "Full-pretrain/Loss (Raw)": 1.6584614515304565, "Full-pretrain/Step": 8055, "Full-pretrain/Step Time": 17.578236557543278} +{"Full-pretrain/Learning Rate": 3.092332998903416e-06, "Full-pretrain/Loss": 1.9263956546783447, "Full-pretrain/Loss (Raw)": 2.061587333679199, "Full-pretrain/Step": 8056, "Full-pretrain/Step Time": 17.58312550932169} +{"Full-pretrain/Learning Rate": 3.088243792763984e-06, "Full-pretrain/Loss": 1.9351017475128174, "Full-pretrain/Loss (Raw)": 2.08737850189209, "Full-pretrain/Step": 8057, "Full-pretrain/Step Time": 17.580698739737272} +{"Full-pretrain/Learning Rate": 3.084157114137931e-06, "Full-pretrain/Loss": 1.9324626922607422, "Full-pretrain/Loss (Raw)": 2.1553711891174316, "Full-pretrain/Step": 8058, "Full-pretrain/Step Time": 17.577963324263692} +{"Full-pretrain/Learning Rate": 3.080072963496655e-06, "Full-pretrain/Loss": 1.9437942504882812, "Full-pretrain/Loss (Raw)": 2.105923652648926, "Full-pretrain/Step": 8059, "Full-pretrain/Step Time": 17.576796108856797} +{"Full-pretrain/Learning Rate": 3.075991341311257e-06, "Full-pretrain/Loss": 1.940420389175415, "Full-pretrain/Loss (Raw)": 1.7963300943374634, "Full-pretrain/Step": 8060, "Full-pretrain/Step Time": 17.579716766253114} +{"Full-pretrain/Learning Rate": 3.0719122480525607e-06, "Full-pretrain/Loss": 1.948350429534912, "Full-pretrain/Loss (Raw)": 1.745352029800415, "Full-pretrain/Step": 8061, "Full-pretrain/Step Time": 17.576794058084488} +{"Full-pretrain/Learning Rate": 3.0678356841910753e-06, "Full-pretrain/Loss": 1.9432356357574463, "Full-pretrain/Loss (Raw)": 2.0517897605895996, "Full-pretrain/Step": 8062, "Full-pretrain/Step Time": 17.573322393000126} +{"Full-pretrain/Learning Rate": 3.0637616501970336e-06, "Full-pretrain/Loss": 1.943195104598999, "Full-pretrain/Loss (Raw)": 1.917428731918335, "Full-pretrain/Step": 8063, "Full-pretrain/Step Time": 17.57116574048996} +{"Full-pretrain/Learning Rate": 3.0596901465403784e-06, "Full-pretrain/Loss": 1.9429810047149658, "Full-pretrain/Loss (Raw)": 1.9998456239700317, "Full-pretrain/Step": 8064, "Full-pretrain/Step Time": 17.573730094358325} +{"Full-pretrain/Learning Rate": 3.0556211736907537e-06, "Full-pretrain/Loss": 1.9404910802841187, "Full-pretrain/Loss (Raw)": 1.8879423141479492, "Full-pretrain/Step": 8065, "Full-pretrain/Step Time": 17.579374384135008} +{"Full-pretrain/Learning Rate": 3.05155473211752e-06, "Full-pretrain/Loss": 1.9499356746673584, "Full-pretrain/Loss (Raw)": 2.1756348609924316, "Full-pretrain/Step": 8066, "Full-pretrain/Step Time": 17.5821751113981} +{"Full-pretrain/Learning Rate": 3.047490822289731e-06, "Full-pretrain/Loss": 1.957283616065979, "Full-pretrain/Loss (Raw)": 2.166778087615967, "Full-pretrain/Step": 8067, "Full-pretrain/Step Time": 17.575827008113265} +{"Full-pretrain/Learning Rate": 3.04342944467616e-06, "Full-pretrain/Loss": 1.9515355825424194, "Full-pretrain/Loss (Raw)": 2.061160087585449, "Full-pretrain/Step": 8068, "Full-pretrain/Step Time": 17.577666325494647} +{"Full-pretrain/Learning Rate": 3.0393705997452863e-06, "Full-pretrain/Loss": 1.9479060173034668, "Full-pretrain/Loss (Raw)": 2.015746593475342, "Full-pretrain/Step": 8069, "Full-pretrain/Step Time": 17.58225733973086} +{"Full-pretrain/Learning Rate": 3.035314287965302e-06, "Full-pretrain/Loss": 1.9453306198120117, "Full-pretrain/Loss (Raw)": 1.8350597620010376, "Full-pretrain/Step": 8070, "Full-pretrain/Step Time": 17.578792698681355} +{"Full-pretrain/Learning Rate": 3.0312605098040904e-06, "Full-pretrain/Loss": 1.9473278522491455, "Full-pretrain/Loss (Raw)": 1.990455985069275, "Full-pretrain/Step": 8071, "Full-pretrain/Step Time": 17.580153511837125} +{"Full-pretrain/Learning Rate": 3.027209265729264e-06, "Full-pretrain/Loss": 1.9453656673431396, "Full-pretrain/Loss (Raw)": 1.7839834690093994, "Full-pretrain/Step": 8072, "Full-pretrain/Step Time": 17.58346259407699} +{"Full-pretrain/Learning Rate": 3.0231605562081213e-06, "Full-pretrain/Loss": 1.958698034286499, "Full-pretrain/Loss (Raw)": 2.035423994064331, "Full-pretrain/Step": 8073, "Full-pretrain/Step Time": 17.585423117503524} +{"Full-pretrain/Learning Rate": 3.0191143817076854e-06, "Full-pretrain/Loss": 1.9589121341705322, "Full-pretrain/Loss (Raw)": 2.042929172515869, "Full-pretrain/Step": 8074, "Full-pretrain/Step Time": 17.5887918677181} +{"Full-pretrain/Learning Rate": 3.015070742694681e-06, "Full-pretrain/Loss": 1.9541468620300293, "Full-pretrain/Loss (Raw)": 1.85733962059021, "Full-pretrain/Step": 8075, "Full-pretrain/Step Time": 17.589246906340122} +{"Full-pretrain/Learning Rate": 3.011029639635546e-06, "Full-pretrain/Loss": 1.9545204639434814, "Full-pretrain/Loss (Raw)": 1.889253854751587, "Full-pretrain/Step": 8076, "Full-pretrain/Step Time": 17.590789748355746} +{"Full-pretrain/Learning Rate": 3.0069910729964068e-06, "Full-pretrain/Loss": 1.9555552005767822, "Full-pretrain/Loss (Raw)": 1.8524329662322998, "Full-pretrain/Step": 8077, "Full-pretrain/Step Time": 17.590808629989624} +{"Full-pretrain/Learning Rate": 3.002955043243122e-06, "Full-pretrain/Loss": 1.9591586589813232, "Full-pretrain/Loss (Raw)": 2.0170116424560547, "Full-pretrain/Step": 8078, "Full-pretrain/Step Time": 17.590978676453233} +{"Full-pretrain/Learning Rate": 2.998921550841241e-06, "Full-pretrain/Loss": 1.9587268829345703, "Full-pretrain/Loss (Raw)": 2.0769410133361816, "Full-pretrain/Step": 8079, "Full-pretrain/Step Time": 17.58867460116744} +{"Full-pretrain/Learning Rate": 2.994890596256028e-06, "Full-pretrain/Loss": 1.9530158042907715, "Full-pretrain/Loss (Raw)": 1.8429256677627563, "Full-pretrain/Step": 8080, "Full-pretrain/Step Time": 17.60333774611354} +{"Full-pretrain/Learning Rate": 2.99086217995245e-06, "Full-pretrain/Loss": 1.95294189453125, "Full-pretrain/Loss (Raw)": 1.9475747346878052, "Full-pretrain/Step": 8081, "Full-pretrain/Step Time": 17.604655427858233} +{"Full-pretrain/Learning Rate": 2.9868363023951935e-06, "Full-pretrain/Loss": 1.9501467943191528, "Full-pretrain/Loss (Raw)": 1.8000283241271973, "Full-pretrain/Step": 8082, "Full-pretrain/Step Time": 17.603601528331637} +{"Full-pretrain/Learning Rate": 2.9828129640486257e-06, "Full-pretrain/Loss": 1.955115795135498, "Full-pretrain/Loss (Raw)": 2.237650156021118, "Full-pretrain/Step": 8083, "Full-pretrain/Step Time": 17.596402518451214} +{"Full-pretrain/Learning Rate": 2.9787921653768454e-06, "Full-pretrain/Loss": 1.9504849910736084, "Full-pretrain/Loss (Raw)": 1.7152786254882812, "Full-pretrain/Step": 8084, "Full-pretrain/Step Time": 17.60071536898613} +{"Full-pretrain/Learning Rate": 2.97477390684365e-06, "Full-pretrain/Loss": 1.9586026668548584, "Full-pretrain/Loss (Raw)": 2.017305850982666, "Full-pretrain/Step": 8085, "Full-pretrain/Step Time": 17.605769457295537} +{"Full-pretrain/Learning Rate": 2.970758188912551e-06, "Full-pretrain/Loss": 1.9633604288101196, "Full-pretrain/Loss (Raw)": 1.9992101192474365, "Full-pretrain/Step": 8086, "Full-pretrain/Step Time": 17.603209249675274} +{"Full-pretrain/Learning Rate": 2.9667450120467453e-06, "Full-pretrain/Loss": 1.958789587020874, "Full-pretrain/Loss (Raw)": 1.5121960639953613, "Full-pretrain/Step": 8087, "Full-pretrain/Step Time": 17.599045388400555} +{"Full-pretrain/Learning Rate": 2.962734376709167e-06, "Full-pretrain/Loss": 1.9616366624832153, "Full-pretrain/Loss (Raw)": 2.152690887451172, "Full-pretrain/Step": 8088, "Full-pretrain/Step Time": 17.600859446451068} +{"Full-pretrain/Learning Rate": 2.958726283362426e-06, "Full-pretrain/Loss": 1.9601958990097046, "Full-pretrain/Loss (Raw)": 2.0412745475769043, "Full-pretrain/Step": 8089, "Full-pretrain/Step Time": 17.60282396711409} +{"Full-pretrain/Learning Rate": 2.954720732468866e-06, "Full-pretrain/Loss": 1.9519069194793701, "Full-pretrain/Loss (Raw)": 1.890127182006836, "Full-pretrain/Step": 8090, "Full-pretrain/Step Time": 17.602365942671895} +{"Full-pretrain/Learning Rate": 2.9507177244905205e-06, "Full-pretrain/Loss": 1.9559781551361084, "Full-pretrain/Loss (Raw)": 2.2361981868743896, "Full-pretrain/Step": 8091, "Full-pretrain/Step Time": 17.60473777167499} +{"Full-pretrain/Learning Rate": 2.9467172598891395e-06, "Full-pretrain/Loss": 1.960892677307129, "Full-pretrain/Loss (Raw)": 1.9535959959030151, "Full-pretrain/Step": 8092, "Full-pretrain/Step Time": 17.599687695503235} +{"Full-pretrain/Learning Rate": 2.942719339126171e-06, "Full-pretrain/Loss": 1.970552682876587, "Full-pretrain/Loss (Raw)": 2.0544722080230713, "Full-pretrain/Step": 8093, "Full-pretrain/Step Time": 17.59954383596778} +{"Full-pretrain/Learning Rate": 2.9387239626627734e-06, "Full-pretrain/Loss": 1.9675040245056152, "Full-pretrain/Loss (Raw)": 1.9542325735092163, "Full-pretrain/Step": 8094, "Full-pretrain/Step Time": 17.60040389560163} +{"Full-pretrain/Learning Rate": 2.934731130959814e-06, "Full-pretrain/Loss": 1.9691388607025146, "Full-pretrain/Loss (Raw)": 1.9697462320327759, "Full-pretrain/Step": 8095, "Full-pretrain/Step Time": 17.596228066831827} +{"Full-pretrain/Learning Rate": 2.930740844477867e-06, "Full-pretrain/Loss": 1.9709184169769287, "Full-pretrain/Loss (Raw)": 2.0567898750305176, "Full-pretrain/Step": 8096, "Full-pretrain/Step Time": 17.601613242179155} +{"Full-pretrain/Learning Rate": 2.92675310367721e-06, "Full-pretrain/Loss": 1.9813203811645508, "Full-pretrain/Loss (Raw)": 2.22080659866333, "Full-pretrain/Step": 8097, "Full-pretrain/Step Time": 17.597251733765006} +{"Full-pretrain/Learning Rate": 2.9227679090178205e-06, "Full-pretrain/Loss": 1.986727237701416, "Full-pretrain/Loss (Raw)": 2.3486547470092773, "Full-pretrain/Step": 8098, "Full-pretrain/Step Time": 17.598756274208426} +{"Full-pretrain/Learning Rate": 2.9187852609593946e-06, "Full-pretrain/Loss": 1.983698844909668, "Full-pretrain/Loss (Raw)": 2.0698652267456055, "Full-pretrain/Step": 8099, "Full-pretrain/Step Time": 17.591752344742417} +{"Full-pretrain/Learning Rate": 2.9148051599613314e-06, "Full-pretrain/Loss": 1.9822897911071777, "Full-pretrain/Loss (Raw)": 2.0160694122314453, "Full-pretrain/Step": 8100, "Full-pretrain/Step Time": 17.595637995749712} +{"Full-pretrain/Learning Rate": 2.910827606482727e-06, "Full-pretrain/Loss": 1.9838005304336548, "Full-pretrain/Loss (Raw)": 2.0640952587127686, "Full-pretrain/Step": 8101, "Full-pretrain/Step Time": 17.59727542102337} +{"Full-pretrain/Learning Rate": 2.906852600982404e-06, "Full-pretrain/Loss": 1.9765574932098389, "Full-pretrain/Loss (Raw)": 1.6032829284667969, "Full-pretrain/Step": 8102, "Full-pretrain/Step Time": 17.591640699654818} +{"Full-pretrain/Learning Rate": 2.9028801439188625e-06, "Full-pretrain/Loss": 1.9797155857086182, "Full-pretrain/Loss (Raw)": 2.091510772705078, "Full-pretrain/Step": 8103, "Full-pretrain/Step Time": 17.586004672572017} +{"Full-pretrain/Learning Rate": 2.8989102357503376e-06, "Full-pretrain/Loss": 1.983544111251831, "Full-pretrain/Loss (Raw)": 1.9064974784851074, "Full-pretrain/Step": 8104, "Full-pretrain/Step Time": 17.59157652594149} +{"Full-pretrain/Learning Rate": 2.8949428769347446e-06, "Full-pretrain/Loss": 1.9775155782699585, "Full-pretrain/Loss (Raw)": 1.8425121307373047, "Full-pretrain/Step": 8105, "Full-pretrain/Step Time": 17.59407783485949} +{"Full-pretrain/Learning Rate": 2.8909780679297225e-06, "Full-pretrain/Loss": 1.9702692031860352, "Full-pretrain/Loss (Raw)": 1.811047077178955, "Full-pretrain/Step": 8106, "Full-pretrain/Step Time": 17.588338498026133} +{"Full-pretrain/Learning Rate": 2.887015809192611e-06, "Full-pretrain/Loss": 1.9823682308197021, "Full-pretrain/Loss (Raw)": 2.2445085048675537, "Full-pretrain/Step": 8107, "Full-pretrain/Step Time": 17.579568672925234} +{"Full-pretrain/Learning Rate": 2.883056101180459e-06, "Full-pretrain/Loss": 1.9795384407043457, "Full-pretrain/Loss (Raw)": 1.7986993789672852, "Full-pretrain/Step": 8108, "Full-pretrain/Step Time": 17.58057216927409} +{"Full-pretrain/Learning Rate": 2.879098944350009e-06, "Full-pretrain/Loss": 1.9884556531906128, "Full-pretrain/Loss (Raw)": 2.1377806663513184, "Full-pretrain/Step": 8109, "Full-pretrain/Step Time": 17.585297361016273} +{"Full-pretrain/Learning Rate": 2.8751443391577203e-06, "Full-pretrain/Loss": 1.9799175262451172, "Full-pretrain/Loss (Raw)": 1.7437958717346191, "Full-pretrain/Step": 8110, "Full-pretrain/Step Time": 17.58405265584588} +{"Full-pretrain/Learning Rate": 2.8711922860597593e-06, "Full-pretrain/Loss": 1.9786291122436523, "Full-pretrain/Loss (Raw)": 2.035707950592041, "Full-pretrain/Step": 8111, "Full-pretrain/Step Time": 17.57970943674445} +{"Full-pretrain/Learning Rate": 2.8672427855119894e-06, "Full-pretrain/Loss": 1.9844086170196533, "Full-pretrain/Loss (Raw)": 2.0278725624084473, "Full-pretrain/Step": 8112, "Full-pretrain/Step Time": 17.583475878462195} +{"Full-pretrain/Learning Rate": 2.8632958379699927e-06, "Full-pretrain/Loss": 1.991047978401184, "Full-pretrain/Loss (Raw)": 2.160031318664551, "Full-pretrain/Step": 8113, "Full-pretrain/Step Time": 17.585845885798335} +{"Full-pretrain/Learning Rate": 2.8593514438890354e-06, "Full-pretrain/Loss": 1.989159345626831, "Full-pretrain/Loss (Raw)": 1.7395925521850586, "Full-pretrain/Step": 8114, "Full-pretrain/Step Time": 17.58540153503418} +{"Full-pretrain/Learning Rate": 2.8554096037241103e-06, "Full-pretrain/Loss": 1.9875916242599487, "Full-pretrain/Loss (Raw)": 2.1874821186065674, "Full-pretrain/Step": 8115, "Full-pretrain/Step Time": 17.58755441196263} +{"Full-pretrain/Learning Rate": 2.8514703179299024e-06, "Full-pretrain/Loss": 1.9916242361068726, "Full-pretrain/Loss (Raw)": 1.844322681427002, "Full-pretrain/Step": 8116, "Full-pretrain/Step Time": 17.582907920703292} +{"Full-pretrain/Learning Rate": 2.8475335869608127e-06, "Full-pretrain/Loss": 1.994086742401123, "Full-pretrain/Loss (Raw)": 2.0961074829101562, "Full-pretrain/Step": 8117, "Full-pretrain/Step Time": 17.585474018007517} +{"Full-pretrain/Learning Rate": 2.843599411270942e-06, "Full-pretrain/Loss": 1.9845294952392578, "Full-pretrain/Loss (Raw)": 1.6933791637420654, "Full-pretrain/Step": 8118, "Full-pretrain/Step Time": 17.588311407715082} +{"Full-pretrain/Learning Rate": 2.8396677913140877e-06, "Full-pretrain/Loss": 1.9995744228363037, "Full-pretrain/Loss (Raw)": 1.9936342239379883, "Full-pretrain/Step": 8119, "Full-pretrain/Step Time": 17.584665903821588} +{"Full-pretrain/Learning Rate": 2.8357387275437657e-06, "Full-pretrain/Loss": 2.01436185836792, "Full-pretrain/Loss (Raw)": 2.6258857250213623, "Full-pretrain/Step": 8120, "Full-pretrain/Step Time": 17.581474907696247} +{"Full-pretrain/Learning Rate": 2.831812220413199e-06, "Full-pretrain/Loss": 2.011348247528076, "Full-pretrain/Loss (Raw)": 1.9448459148406982, "Full-pretrain/Step": 8121, "Full-pretrain/Step Time": 17.58504543453455} +{"Full-pretrain/Learning Rate": 2.827888270375295e-06, "Full-pretrain/Loss": 2.013157367706299, "Full-pretrain/Loss (Raw)": 1.9480128288269043, "Full-pretrain/Step": 8122, "Full-pretrain/Step Time": 17.588843720033765} +{"Full-pretrain/Learning Rate": 2.823966877882689e-06, "Full-pretrain/Loss": 2.0017125606536865, "Full-pretrain/Loss (Raw)": 1.869969367980957, "Full-pretrain/Step": 8123, "Full-pretrain/Step Time": 17.585032718256116} +{"Full-pretrain/Learning Rate": 2.8200480433877158e-06, "Full-pretrain/Loss": 2.0015995502471924, "Full-pretrain/Loss (Raw)": 1.9499742984771729, "Full-pretrain/Step": 8124, "Full-pretrain/Step Time": 17.5839062333107} +{"Full-pretrain/Learning Rate": 2.8161317673424005e-06, "Full-pretrain/Loss": 1.9881246089935303, "Full-pretrain/Loss (Raw)": 1.623277187347412, "Full-pretrain/Step": 8125, "Full-pretrain/Step Time": 17.58525858260691} +{"Full-pretrain/Learning Rate": 2.8122180501984895e-06, "Full-pretrain/Loss": 1.988715410232544, "Full-pretrain/Loss (Raw)": 1.9731370210647583, "Full-pretrain/Step": 8126, "Full-pretrain/Step Time": 17.582512574270368} +{"Full-pretrain/Learning Rate": 2.8083068924074308e-06, "Full-pretrain/Loss": 1.997407078742981, "Full-pretrain/Loss (Raw)": 2.24787974357605, "Full-pretrain/Step": 8127, "Full-pretrain/Step Time": 17.577241895720363} +{"Full-pretrain/Learning Rate": 2.804398294420371e-06, "Full-pretrain/Loss": 1.9855239391326904, "Full-pretrain/Loss (Raw)": 1.6765276193618774, "Full-pretrain/Step": 8128, "Full-pretrain/Step Time": 17.585259633138776} +{"Full-pretrain/Learning Rate": 2.8004922566881753e-06, "Full-pretrain/Loss": 1.9683971405029297, "Full-pretrain/Loss (Raw)": 1.6727497577667236, "Full-pretrain/Step": 8129, "Full-pretrain/Step Time": 17.58126480318606} +{"Full-pretrain/Learning Rate": 2.7965887796613884e-06, "Full-pretrain/Loss": 1.9544169902801514, "Full-pretrain/Loss (Raw)": 1.9012925624847412, "Full-pretrain/Step": 8130, "Full-pretrain/Step Time": 17.587572254240513} +{"Full-pretrain/Learning Rate": 2.792687863790286e-06, "Full-pretrain/Loss": 1.9502397775650024, "Full-pretrain/Loss (Raw)": 1.936189889907837, "Full-pretrain/Step": 8131, "Full-pretrain/Step Time": 17.587963216006756} +{"Full-pretrain/Learning Rate": 2.7887895095248308e-06, "Full-pretrain/Loss": 1.9442617893218994, "Full-pretrain/Loss (Raw)": 1.8247742652893066, "Full-pretrain/Step": 8132, "Full-pretrain/Step Time": 17.590521136298776} +{"Full-pretrain/Learning Rate": 2.7848937173147017e-06, "Full-pretrain/Loss": 1.9407891035079956, "Full-pretrain/Loss (Raw)": 1.9529703855514526, "Full-pretrain/Step": 8133, "Full-pretrain/Step Time": 17.591287875548005} +{"Full-pretrain/Learning Rate": 2.781000487609281e-06, "Full-pretrain/Loss": 1.949040412902832, "Full-pretrain/Loss (Raw)": 1.8673272132873535, "Full-pretrain/Step": 8134, "Full-pretrain/Step Time": 17.589503990486264} +{"Full-pretrain/Learning Rate": 2.77710982085764e-06, "Full-pretrain/Loss": 1.9403733015060425, "Full-pretrain/Loss (Raw)": 1.8141603469848633, "Full-pretrain/Step": 8135, "Full-pretrain/Step Time": 17.58533152192831} +{"Full-pretrain/Learning Rate": 2.773221717508573e-06, "Full-pretrain/Loss": 1.9457552433013916, "Full-pretrain/Loss (Raw)": 2.0787172317504883, "Full-pretrain/Step": 8136, "Full-pretrain/Step Time": 17.586639000102878} +{"Full-pretrain/Learning Rate": 2.769336178010573e-06, "Full-pretrain/Loss": 1.9453284740447998, "Full-pretrain/Loss (Raw)": 1.8288583755493164, "Full-pretrain/Step": 8137, "Full-pretrain/Step Time": 17.593622272834182} +{"Full-pretrain/Learning Rate": 2.7654532028118297e-06, "Full-pretrain/Loss": 1.9395488500595093, "Full-pretrain/Loss (Raw)": 1.6261001825332642, "Full-pretrain/Step": 8138, "Full-pretrain/Step Time": 17.597331330180168} +{"Full-pretrain/Learning Rate": 2.7615727923602426e-06, "Full-pretrain/Loss": 1.92857825756073, "Full-pretrain/Loss (Raw)": 1.8934497833251953, "Full-pretrain/Step": 8139, "Full-pretrain/Step Time": 17.591862354427576} +{"Full-pretrain/Learning Rate": 2.757694947103426e-06, "Full-pretrain/Loss": 1.9351778030395508, "Full-pretrain/Loss (Raw)": 2.0098819732666016, "Full-pretrain/Step": 8140, "Full-pretrain/Step Time": 17.587511252611876} +{"Full-pretrain/Learning Rate": 2.7538196674886746e-06, "Full-pretrain/Loss": 1.935560941696167, "Full-pretrain/Loss (Raw)": 2.150042772293091, "Full-pretrain/Step": 8141, "Full-pretrain/Step Time": 17.58615728467703} +{"Full-pretrain/Learning Rate": 2.7499469539630092e-06, "Full-pretrain/Loss": 1.937260627746582, "Full-pretrain/Loss (Raw)": 1.798184871673584, "Full-pretrain/Step": 8142, "Full-pretrain/Step Time": 17.583432588726282} +{"Full-pretrain/Learning Rate": 2.746076806973141e-06, "Full-pretrain/Loss": 1.9347878694534302, "Full-pretrain/Loss (Raw)": 1.956581473350525, "Full-pretrain/Step": 8143, "Full-pretrain/Step Time": 17.58663234114647} +{"Full-pretrain/Learning Rate": 2.742209226965492e-06, "Full-pretrain/Loss": 1.9210412502288818, "Full-pretrain/Loss (Raw)": 1.5879805088043213, "Full-pretrain/Step": 8144, "Full-pretrain/Step Time": 17.58235930837691} +{"Full-pretrain/Learning Rate": 2.738344214386193e-06, "Full-pretrain/Loss": 1.915148377418518, "Full-pretrain/Loss (Raw)": 1.9714579582214355, "Full-pretrain/Step": 8145, "Full-pretrain/Step Time": 17.583401510491967} +{"Full-pretrain/Learning Rate": 2.7344817696810603e-06, "Full-pretrain/Loss": 1.9198408126831055, "Full-pretrain/Loss (Raw)": 1.889752745628357, "Full-pretrain/Step": 8146, "Full-pretrain/Step Time": 17.585935907438397} +{"Full-pretrain/Learning Rate": 2.7306218932956317e-06, "Full-pretrain/Loss": 1.916105031967163, "Full-pretrain/Loss (Raw)": 2.067934989929199, "Full-pretrain/Step": 8147, "Full-pretrain/Step Time": 17.582207709550858} +{"Full-pretrain/Learning Rate": 2.72676458567514e-06, "Full-pretrain/Loss": 1.922537088394165, "Full-pretrain/Loss (Raw)": 2.05015230178833, "Full-pretrain/Step": 8148, "Full-pretrain/Step Time": 17.57787825167179} +{"Full-pretrain/Learning Rate": 2.7229098472645263e-06, "Full-pretrain/Loss": 1.918443202972412, "Full-pretrain/Loss (Raw)": 1.9651002883911133, "Full-pretrain/Step": 8149, "Full-pretrain/Step Time": 17.580754904076457} +{"Full-pretrain/Learning Rate": 2.7190576785084408e-06, "Full-pretrain/Loss": 1.9258017539978027, "Full-pretrain/Loss (Raw)": 1.928852915763855, "Full-pretrain/Step": 8150, "Full-pretrain/Step Time": 17.578880025073886} +{"Full-pretrain/Learning Rate": 2.7152080798512144e-06, "Full-pretrain/Loss": 1.9279526472091675, "Full-pretrain/Loss (Raw)": 2.06246280670166, "Full-pretrain/Step": 8151, "Full-pretrain/Step Time": 17.579475473612547} +{"Full-pretrain/Learning Rate": 2.711361051736905e-06, "Full-pretrain/Loss": 1.9133280515670776, "Full-pretrain/Loss (Raw)": 2.157899856567383, "Full-pretrain/Step": 8152, "Full-pretrain/Step Time": 17.578428886830807} +{"Full-pretrain/Learning Rate": 2.707516594609269e-06, "Full-pretrain/Loss": 1.9098365306854248, "Full-pretrain/Loss (Raw)": 1.8331140279769897, "Full-pretrain/Step": 8153, "Full-pretrain/Step Time": 17.581603415310383} +{"Full-pretrain/Learning Rate": 2.7036747089117575e-06, "Full-pretrain/Loss": 1.9062002897262573, "Full-pretrain/Loss (Raw)": 1.8316562175750732, "Full-pretrain/Step": 8154, "Full-pretrain/Step Time": 17.587190967053175} +{"Full-pretrain/Learning Rate": 2.69983539508753e-06, "Full-pretrain/Loss": 1.903228998184204, "Full-pretrain/Loss (Raw)": 1.7748860120773315, "Full-pretrain/Step": 8155, "Full-pretrain/Step Time": 17.583005655556917} +{"Full-pretrain/Learning Rate": 2.6959986535794597e-06, "Full-pretrain/Loss": 1.9119927883148193, "Full-pretrain/Loss (Raw)": 2.230414390563965, "Full-pretrain/Step": 8156, "Full-pretrain/Step Time": 17.586021242663264} +{"Full-pretrain/Learning Rate": 2.692164484830101e-06, "Full-pretrain/Loss": 1.9187051057815552, "Full-pretrain/Loss (Raw)": 1.8380720615386963, "Full-pretrain/Step": 8157, "Full-pretrain/Step Time": 17.579902594909072} +{"Full-pretrain/Learning Rate": 2.6883328892817307e-06, "Full-pretrain/Loss": 1.94527006149292, "Full-pretrain/Loss (Raw)": 2.8232150077819824, "Full-pretrain/Step": 8158, "Full-pretrain/Step Time": 17.58977423235774} +{"Full-pretrain/Learning Rate": 2.6845038673763173e-06, "Full-pretrain/Loss": 1.9289608001708984, "Full-pretrain/Loss (Raw)": 1.7259823083877563, "Full-pretrain/Step": 8159, "Full-pretrain/Step Time": 17.57954108156264} +{"Full-pretrain/Learning Rate": 2.680677419555544e-06, "Full-pretrain/Loss": 1.9348680973052979, "Full-pretrain/Loss (Raw)": 1.8655614852905273, "Full-pretrain/Step": 8160, "Full-pretrain/Step Time": 17.583402877673507} +{"Full-pretrain/Learning Rate": 2.676853546260791e-06, "Full-pretrain/Loss": 1.9387259483337402, "Full-pretrain/Loss (Raw)": 1.796202301979065, "Full-pretrain/Step": 8161, "Full-pretrain/Step Time": 17.590512396767735} +{"Full-pretrain/Learning Rate": 2.67303224793313e-06, "Full-pretrain/Loss": 1.9362869262695312, "Full-pretrain/Loss (Raw)": 1.823244333267212, "Full-pretrain/Step": 8162, "Full-pretrain/Step Time": 17.59426841326058} +{"Full-pretrain/Learning Rate": 2.669213525013356e-06, "Full-pretrain/Loss": 1.9388976097106934, "Full-pretrain/Loss (Raw)": 2.0197315216064453, "Full-pretrain/Step": 8163, "Full-pretrain/Step Time": 17.591853629797697} +{"Full-pretrain/Learning Rate": 2.6653973779419528e-06, "Full-pretrain/Loss": 1.9466657638549805, "Full-pretrain/Loss (Raw)": 2.0733518600463867, "Full-pretrain/Step": 8164, "Full-pretrain/Step Time": 17.589911177754402} +{"Full-pretrain/Learning Rate": 2.6615838071591125e-06, "Full-pretrain/Loss": 1.9337384700775146, "Full-pretrain/Loss (Raw)": 1.5392985343933105, "Full-pretrain/Step": 8165, "Full-pretrain/Step Time": 17.592833910137415} +{"Full-pretrain/Learning Rate": 2.6577728131047337e-06, "Full-pretrain/Loss": 1.9482645988464355, "Full-pretrain/Loss (Raw)": 2.332162618637085, "Full-pretrain/Step": 8166, "Full-pretrain/Step Time": 17.59973456710577} +{"Full-pretrain/Learning Rate": 2.6539643962184057e-06, "Full-pretrain/Loss": 1.9577522277832031, "Full-pretrain/Loss (Raw)": 2.1177666187286377, "Full-pretrain/Step": 8167, "Full-pretrain/Step Time": 17.594665026292205} +{"Full-pretrain/Learning Rate": 2.6501585569394333e-06, "Full-pretrain/Loss": 1.9573371410369873, "Full-pretrain/Loss (Raw)": 2.065431594848633, "Full-pretrain/Step": 8168, "Full-pretrain/Step Time": 17.5977383852005} +{"Full-pretrain/Learning Rate": 2.646355295706815e-06, "Full-pretrain/Loss": 1.963435411453247, "Full-pretrain/Loss (Raw)": 2.0240061283111572, "Full-pretrain/Step": 8169, "Full-pretrain/Step Time": 17.603486286476254} +{"Full-pretrain/Learning Rate": 2.642554612959261e-06, "Full-pretrain/Loss": 1.9733270406723022, "Full-pretrain/Loss (Raw)": 1.9426283836364746, "Full-pretrain/Step": 8170, "Full-pretrain/Step Time": 17.606336748227477} +{"Full-pretrain/Learning Rate": 2.6387565091351735e-06, "Full-pretrain/Loss": 1.9732704162597656, "Full-pretrain/Loss (Raw)": 1.8916375637054443, "Full-pretrain/Step": 8171, "Full-pretrain/Step Time": 17.6071699205786} +{"Full-pretrain/Learning Rate": 2.6349609846726688e-06, "Full-pretrain/Loss": 1.9669177532196045, "Full-pretrain/Loss (Raw)": 1.8066022396087646, "Full-pretrain/Step": 8172, "Full-pretrain/Step Time": 17.60699432902038} +{"Full-pretrain/Learning Rate": 2.631168040009549e-06, "Full-pretrain/Loss": 1.9649885892868042, "Full-pretrain/Loss (Raw)": 2.0883073806762695, "Full-pretrain/Step": 8173, "Full-pretrain/Step Time": 17.610358161851764} +{"Full-pretrain/Learning Rate": 2.627377675583337e-06, "Full-pretrain/Loss": 1.969214916229248, "Full-pretrain/Loss (Raw)": 1.9334280490875244, "Full-pretrain/Step": 8174, "Full-pretrain/Step Time": 17.614212723448873} +{"Full-pretrain/Learning Rate": 2.6235898918312434e-06, "Full-pretrain/Loss": 1.9678444862365723, "Full-pretrain/Loss (Raw)": 1.9127299785614014, "Full-pretrain/Step": 8175, "Full-pretrain/Step Time": 17.62119884043932} +{"Full-pretrain/Learning Rate": 2.6198046891902003e-06, "Full-pretrain/Loss": 1.973365306854248, "Full-pretrain/Loss (Raw)": 1.764644980430603, "Full-pretrain/Step": 8176, "Full-pretrain/Step Time": 17.61492809280753} +{"Full-pretrain/Learning Rate": 2.6160220680968155e-06, "Full-pretrain/Loss": 1.9808332920074463, "Full-pretrain/Loss (Raw)": 2.2104310989379883, "Full-pretrain/Step": 8177, "Full-pretrain/Step Time": 17.6162445563823} +{"Full-pretrain/Learning Rate": 2.6122420289874216e-06, "Full-pretrain/Loss": 1.978784441947937, "Full-pretrain/Loss (Raw)": 1.8241922855377197, "Full-pretrain/Step": 8178, "Full-pretrain/Step Time": 17.610424840822816} +{"Full-pretrain/Learning Rate": 2.608464572298039e-06, "Full-pretrain/Loss": 1.9781949520111084, "Full-pretrain/Loss (Raw)": 2.049071788787842, "Full-pretrain/Step": 8179, "Full-pretrain/Step Time": 17.6150094345212} +{"Full-pretrain/Learning Rate": 2.6046896984643993e-06, "Full-pretrain/Loss": 1.9680728912353516, "Full-pretrain/Loss (Raw)": 1.726245403289795, "Full-pretrain/Step": 8180, "Full-pretrain/Step Time": 17.61343222297728} +{"Full-pretrain/Learning Rate": 2.6009174079219324e-06, "Full-pretrain/Loss": 1.9774547815322876, "Full-pretrain/Loss (Raw)": 2.2653186321258545, "Full-pretrain/Step": 8181, "Full-pretrain/Step Time": 17.608866807073355} +{"Full-pretrain/Learning Rate": 2.597147701105779e-06, "Full-pretrain/Loss": 1.9818456172943115, "Full-pretrain/Loss (Raw)": 2.0693626403808594, "Full-pretrain/Step": 8182, "Full-pretrain/Step Time": 17.606017408892512} +{"Full-pretrain/Learning Rate": 2.5933805784507576e-06, "Full-pretrain/Loss": 1.9725509881973267, "Full-pretrain/Loss (Raw)": 1.765031099319458, "Full-pretrain/Step": 8183, "Full-pretrain/Step Time": 17.60610608011484} +{"Full-pretrain/Learning Rate": 2.5896160403914126e-06, "Full-pretrain/Loss": 1.970963954925537, "Full-pretrain/Loss (Raw)": 2.1071221828460693, "Full-pretrain/Step": 8184, "Full-pretrain/Step Time": 17.603793101385236} +{"Full-pretrain/Learning Rate": 2.58585408736198e-06, "Full-pretrain/Loss": 1.9763044118881226, "Full-pretrain/Loss (Raw)": 2.0040016174316406, "Full-pretrain/Step": 8185, "Full-pretrain/Step Time": 17.60176465846598} +{"Full-pretrain/Learning Rate": 2.5820947197964103e-06, "Full-pretrain/Loss": 1.9769771099090576, "Full-pretrain/Loss (Raw)": 1.8531875610351562, "Full-pretrain/Step": 8186, "Full-pretrain/Step Time": 17.60380589030683} +{"Full-pretrain/Learning Rate": 2.5783379381283277e-06, "Full-pretrain/Loss": 1.974376916885376, "Full-pretrain/Loss (Raw)": 1.6916745901107788, "Full-pretrain/Step": 8187, "Full-pretrain/Step Time": 17.61115567944944} +{"Full-pretrain/Learning Rate": 2.5745837427910923e-06, "Full-pretrain/Loss": 1.9691622257232666, "Full-pretrain/Loss (Raw)": 2.063549518585205, "Full-pretrain/Step": 8188, "Full-pretrain/Step Time": 17.608432106673717} +{"Full-pretrain/Learning Rate": 2.570832134217735e-06, "Full-pretrain/Loss": 1.9677226543426514, "Full-pretrain/Loss (Raw)": 1.7920010089874268, "Full-pretrain/Step": 8189, "Full-pretrain/Step Time": 17.608359795063734} +{"Full-pretrain/Learning Rate": 2.5670831128410094e-06, "Full-pretrain/Loss": 1.9320738315582275, "Full-pretrain/Loss (Raw)": 1.6824573278427124, "Full-pretrain/Step": 8190, "Full-pretrain/Step Time": 17.61491161212325} +{"Full-pretrain/Learning Rate": 2.5633366790933615e-06, "Full-pretrain/Loss": 1.9357248544692993, "Full-pretrain/Loss (Raw)": 1.8428115844726562, "Full-pretrain/Step": 8191, "Full-pretrain/Step Time": 17.617240903899074} +{"Full-pretrain/Learning Rate": 2.5595928334069487e-06, "Full-pretrain/Loss": 1.9427112340927124, "Full-pretrain/Loss (Raw)": 2.089127779006958, "Full-pretrain/Step": 8192, "Full-pretrain/Step Time": 17.61299385689199} +{"Full-pretrain/Learning Rate": 2.5558515762136137e-06, "Full-pretrain/Loss": 1.9392949342727661, "Full-pretrain/Loss (Raw)": 1.6868809461593628, "Full-pretrain/Step": 8193, "Full-pretrain/Step Time": 17.615687815472484} +{"Full-pretrain/Learning Rate": 2.552112907944909e-06, "Full-pretrain/Loss": 1.9435468912124634, "Full-pretrain/Loss (Raw)": 1.959307312965393, "Full-pretrain/Step": 8194, "Full-pretrain/Step Time": 17.610240519046783} +{"Full-pretrain/Learning Rate": 2.5483768290320925e-06, "Full-pretrain/Loss": 1.9449074268341064, "Full-pretrain/Loss (Raw)": 2.063267946243286, "Full-pretrain/Step": 8195, "Full-pretrain/Step Time": 17.619932375848293} +{"Full-pretrain/Learning Rate": 2.5446433399061194e-06, "Full-pretrain/Loss": 1.9439184665679932, "Full-pretrain/Loss (Raw)": 2.0417051315307617, "Full-pretrain/Step": 8196, "Full-pretrain/Step Time": 17.617732491344213} +{"Full-pretrain/Learning Rate": 2.5409124409976506e-06, "Full-pretrain/Loss": 1.949162483215332, "Full-pretrain/Loss (Raw)": 1.7071068286895752, "Full-pretrain/Step": 8197, "Full-pretrain/Step Time": 17.612243682146072} +{"Full-pretrain/Learning Rate": 2.537184132737033e-06, "Full-pretrain/Loss": 1.9425009489059448, "Full-pretrain/Loss (Raw)": 2.118993043899536, "Full-pretrain/Step": 8198, "Full-pretrain/Step Time": 17.615944530814886} +{"Full-pretrain/Learning Rate": 2.533458415554335e-06, "Full-pretrain/Loss": 1.9293341636657715, "Full-pretrain/Loss (Raw)": 1.6964261531829834, "Full-pretrain/Step": 8199, "Full-pretrain/Step Time": 17.61900175921619} +{"Full-pretrain/Learning Rate": 2.5297352898793092e-06, "Full-pretrain/Loss": 1.926132082939148, "Full-pretrain/Loss (Raw)": 1.962966799736023, "Full-pretrain/Step": 8200, "Full-pretrain/Step Time": 17.617965010926127} +{"Full-pretrain/Learning Rate": 2.5260147561414234e-06, "Full-pretrain/Loss": 1.9189047813415527, "Full-pretrain/Loss (Raw)": 1.7927354574203491, "Full-pretrain/Step": 8201, "Full-pretrain/Step Time": 17.618095749989152} +{"Full-pretrain/Learning Rate": 2.5222968147698365e-06, "Full-pretrain/Loss": 1.9217259883880615, "Full-pretrain/Loss (Raw)": 2.032905101776123, "Full-pretrain/Step": 8202, "Full-pretrain/Step Time": 17.61569901742041} +{"Full-pretrain/Learning Rate": 2.51858146619342e-06, "Full-pretrain/Loss": 1.9170188903808594, "Full-pretrain/Loss (Raw)": 1.7410123348236084, "Full-pretrain/Step": 8203, "Full-pretrain/Step Time": 17.61900066025555} +{"Full-pretrain/Learning Rate": 2.514868710840723e-06, "Full-pretrain/Loss": 1.9233973026275635, "Full-pretrain/Loss (Raw)": 2.0107107162475586, "Full-pretrain/Step": 8204, "Full-pretrain/Step Time": 17.61527535505593} +{"Full-pretrain/Learning Rate": 2.511158549140025e-06, "Full-pretrain/Loss": 1.9299001693725586, "Full-pretrain/Loss (Raw)": 2.2963993549346924, "Full-pretrain/Step": 8205, "Full-pretrain/Step Time": 17.61099678836763} +{"Full-pretrain/Learning Rate": 2.50745098151928e-06, "Full-pretrain/Loss": 1.933105707168579, "Full-pretrain/Loss (Raw)": 2.0360021591186523, "Full-pretrain/Step": 8206, "Full-pretrain/Step Time": 17.611920539289713} +{"Full-pretrain/Learning Rate": 2.5037460084061602e-06, "Full-pretrain/Loss": 1.9283161163330078, "Full-pretrain/Loss (Raw)": 1.759462833404541, "Full-pretrain/Step": 8207, "Full-pretrain/Step Time": 17.61815626733005} +{"Full-pretrain/Learning Rate": 2.5000436302280355e-06, "Full-pretrain/Loss": 1.9418779611587524, "Full-pretrain/Loss (Raw)": 2.19862699508667, "Full-pretrain/Step": 8208, "Full-pretrain/Step Time": 17.60189693979919} +{"Full-pretrain/Learning Rate": 2.4963438474119694e-06, "Full-pretrain/Loss": 1.9369113445281982, "Full-pretrain/Loss (Raw)": 2.051497459411621, "Full-pretrain/Step": 8209, "Full-pretrain/Step Time": 17.604355856776237} +{"Full-pretrain/Learning Rate": 2.4926466603847286e-06, "Full-pretrain/Loss": 1.942117691040039, "Full-pretrain/Loss (Raw)": 1.9907944202423096, "Full-pretrain/Step": 8210, "Full-pretrain/Step Time": 17.60494190081954} +{"Full-pretrain/Learning Rate": 2.488952069572789e-06, "Full-pretrain/Loss": 1.9346150159835815, "Full-pretrain/Loss (Raw)": 1.8089878559112549, "Full-pretrain/Step": 8211, "Full-pretrain/Step Time": 17.612967744469643} +{"Full-pretrain/Learning Rate": 2.4852600754023155e-06, "Full-pretrain/Loss": 1.9367759227752686, "Full-pretrain/Loss (Raw)": 1.7953920364379883, "Full-pretrain/Step": 8212, "Full-pretrain/Step Time": 17.60957965813577} +{"Full-pretrain/Learning Rate": 2.481570678299186e-06, "Full-pretrain/Loss": 1.9267812967300415, "Full-pretrain/Loss (Raw)": 1.945492148399353, "Full-pretrain/Step": 8213, "Full-pretrain/Step Time": 17.60722222737968} +{"Full-pretrain/Learning Rate": 2.477883878688958e-06, "Full-pretrain/Loss": 1.9208180904388428, "Full-pretrain/Loss (Raw)": 1.8785384893417358, "Full-pretrain/Step": 8214, "Full-pretrain/Step Time": 17.60234258323908} +{"Full-pretrain/Learning Rate": 2.4741996769969134e-06, "Full-pretrain/Loss": 1.919649362564087, "Full-pretrain/Loss (Raw)": 1.7276362180709839, "Full-pretrain/Step": 8215, "Full-pretrain/Step Time": 17.606947837397456} +{"Full-pretrain/Learning Rate": 2.4705180736480176e-06, "Full-pretrain/Loss": 1.9254896640777588, "Full-pretrain/Loss (Raw)": 2.2940077781677246, "Full-pretrain/Step": 8216, "Full-pretrain/Step Time": 17.601614993065596} +{"Full-pretrain/Learning Rate": 2.4668390690669452e-06, "Full-pretrain/Loss": 1.9177932739257812, "Full-pretrain/Loss (Raw)": 1.757718563079834, "Full-pretrain/Step": 8217, "Full-pretrain/Step Time": 17.60625266842544} +{"Full-pretrain/Learning Rate": 2.4631626636780704e-06, "Full-pretrain/Loss": 1.9204957485198975, "Full-pretrain/Loss (Raw)": 1.939669132232666, "Full-pretrain/Step": 8218, "Full-pretrain/Step Time": 17.609470022842288} +{"Full-pretrain/Learning Rate": 2.459488857905459e-06, "Full-pretrain/Loss": 1.929641604423523, "Full-pretrain/Loss (Raw)": 1.984340786933899, "Full-pretrain/Step": 8219, "Full-pretrain/Step Time": 17.61186602152884} +{"Full-pretrain/Learning Rate": 2.455817652172887e-06, "Full-pretrain/Loss": 1.915924072265625, "Full-pretrain/Loss (Raw)": 1.6245869398117065, "Full-pretrain/Step": 8220, "Full-pretrain/Step Time": 17.618126448243856} +{"Full-pretrain/Learning Rate": 2.4521490469038316e-06, "Full-pretrain/Loss": 1.921935796737671, "Full-pretrain/Loss (Raw)": 1.9843800067901611, "Full-pretrain/Step": 8221, "Full-pretrain/Step Time": 17.621317306533456} +{"Full-pretrain/Learning Rate": 2.4484830425214543e-06, "Full-pretrain/Loss": 1.9307162761688232, "Full-pretrain/Loss (Raw)": 1.9634337425231934, "Full-pretrain/Step": 8222, "Full-pretrain/Step Time": 17.62291452102363} +{"Full-pretrain/Learning Rate": 2.444819639448631e-06, "Full-pretrain/Loss": 1.9261620044708252, "Full-pretrain/Loss (Raw)": 1.6970716714859009, "Full-pretrain/Step": 8223, "Full-pretrain/Step Time": 17.61938945017755} +{"Full-pretrain/Learning Rate": 2.441158838107943e-06, "Full-pretrain/Loss": 1.9204500913619995, "Full-pretrain/Loss (Raw)": 1.9063446521759033, "Full-pretrain/Step": 8224, "Full-pretrain/Step Time": 17.621176570653915} +{"Full-pretrain/Learning Rate": 2.4375006389216497e-06, "Full-pretrain/Loss": 1.9307892322540283, "Full-pretrain/Loss (Raw)": 2.0177345275878906, "Full-pretrain/Step": 8225, "Full-pretrain/Step Time": 17.62191248871386} +{"Full-pretrain/Learning Rate": 2.4338450423117306e-06, "Full-pretrain/Loss": 1.9351556301116943, "Full-pretrain/Loss (Raw)": 2.099030017852783, "Full-pretrain/Step": 8226, "Full-pretrain/Step Time": 17.624786177650094} +{"Full-pretrain/Learning Rate": 2.430192048699853e-06, "Full-pretrain/Loss": 1.9343376159667969, "Full-pretrain/Loss (Raw)": 2.0370965003967285, "Full-pretrain/Step": 8227, "Full-pretrain/Step Time": 17.62471796013415} +{"Full-pretrain/Learning Rate": 2.426541658507392e-06, "Full-pretrain/Loss": 1.9313565492630005, "Full-pretrain/Loss (Raw)": 1.9463070631027222, "Full-pretrain/Step": 8228, "Full-pretrain/Step Time": 17.62531218677759} +{"Full-pretrain/Learning Rate": 2.422893872155421e-06, "Full-pretrain/Loss": 1.9347753524780273, "Full-pretrain/Loss (Raw)": 1.8165130615234375, "Full-pretrain/Step": 8229, "Full-pretrain/Step Time": 17.625806590542197} +{"Full-pretrain/Learning Rate": 2.4192486900647043e-06, "Full-pretrain/Loss": 1.9159929752349854, "Full-pretrain/Loss (Raw)": 1.5179518461227417, "Full-pretrain/Step": 8230, "Full-pretrain/Step Time": 17.63078634440899} +{"Full-pretrain/Learning Rate": 2.415606112655716e-06, "Full-pretrain/Loss": 1.922952651977539, "Full-pretrain/Loss (Raw)": 1.9191412925720215, "Full-pretrain/Step": 8231, "Full-pretrain/Step Time": 17.63515250198543} +{"Full-pretrain/Learning Rate": 2.411966140348626e-06, "Full-pretrain/Loss": 1.9049124717712402, "Full-pretrain/Loss (Raw)": 1.3856748342514038, "Full-pretrain/Step": 8232, "Full-pretrain/Step Time": 17.63087248802185} +{"Full-pretrain/Learning Rate": 2.4083287735633036e-06, "Full-pretrain/Loss": 1.9038984775543213, "Full-pretrain/Loss (Raw)": 1.7602938413619995, "Full-pretrain/Step": 8233, "Full-pretrain/Step Time": 17.634112548083067} +{"Full-pretrain/Learning Rate": 2.404694012719322e-06, "Full-pretrain/Loss": 1.893007516860962, "Full-pretrain/Loss (Raw)": 1.6843920946121216, "Full-pretrain/Step": 8234, "Full-pretrain/Step Time": 17.636680375784636} +{"Full-pretrain/Learning Rate": 2.4010618582359424e-06, "Full-pretrain/Loss": 1.8948307037353516, "Full-pretrain/Loss (Raw)": 1.7993550300598145, "Full-pretrain/Step": 8235, "Full-pretrain/Step Time": 17.641401138156652} +{"Full-pretrain/Learning Rate": 2.397432310532133e-06, "Full-pretrain/Loss": 1.892213225364685, "Full-pretrain/Loss (Raw)": 1.9269498586654663, "Full-pretrain/Step": 8236, "Full-pretrain/Step Time": 17.638967614620924} +{"Full-pretrain/Learning Rate": 2.3938053700265694e-06, "Full-pretrain/Loss": 1.879725456237793, "Full-pretrain/Loss (Raw)": 1.896791696548462, "Full-pretrain/Step": 8237, "Full-pretrain/Step Time": 17.634266637265682} +{"Full-pretrain/Learning Rate": 2.3901810371376066e-06, "Full-pretrain/Loss": 1.8697431087493896, "Full-pretrain/Loss (Raw)": 1.7165658473968506, "Full-pretrain/Step": 8238, "Full-pretrain/Step Time": 17.637538257986307} +{"Full-pretrain/Learning Rate": 2.386559312283318e-06, "Full-pretrain/Loss": 1.8778096437454224, "Full-pretrain/Loss (Raw)": 2.0175909996032715, "Full-pretrain/Step": 8239, "Full-pretrain/Step Time": 17.63924557901919} +{"Full-pretrain/Learning Rate": 2.3829401958814694e-06, "Full-pretrain/Loss": 1.8786834478378296, "Full-pretrain/Loss (Raw)": 2.226590156555176, "Full-pretrain/Step": 8240, "Full-pretrain/Step Time": 17.636015908792615} +{"Full-pretrain/Learning Rate": 2.379323688349516e-06, "Full-pretrain/Loss": 1.8716862201690674, "Full-pretrain/Loss (Raw)": 1.8275840282440186, "Full-pretrain/Step": 8241, "Full-pretrain/Step Time": 17.631580471992493} +{"Full-pretrain/Learning Rate": 2.3757097901046244e-06, "Full-pretrain/Loss": 1.868481159210205, "Full-pretrain/Loss (Raw)": 1.888232946395874, "Full-pretrain/Step": 8242, "Full-pretrain/Step Time": 17.627597026526928} +{"Full-pretrain/Learning Rate": 2.3720985015636577e-06, "Full-pretrain/Loss": 1.876632809638977, "Full-pretrain/Loss (Raw)": 2.06984281539917, "Full-pretrain/Step": 8243, "Full-pretrain/Step Time": 17.63513358682394} +{"Full-pretrain/Learning Rate": 2.3684898231431802e-06, "Full-pretrain/Loss": 1.8788790702819824, "Full-pretrain/Loss (Raw)": 1.8672704696655273, "Full-pretrain/Step": 8244, "Full-pretrain/Step Time": 17.635419750586152} +{"Full-pretrain/Learning Rate": 2.3648837552594505e-06, "Full-pretrain/Loss": 1.8805584907531738, "Full-pretrain/Loss (Raw)": 1.9992375373840332, "Full-pretrain/Step": 8245, "Full-pretrain/Step Time": 17.63364406861365} +{"Full-pretrain/Learning Rate": 2.3612802983284193e-06, "Full-pretrain/Loss": 1.8686619997024536, "Full-pretrain/Loss (Raw)": 1.4978479146957397, "Full-pretrain/Step": 8246, "Full-pretrain/Step Time": 17.63101378828287} +{"Full-pretrain/Learning Rate": 2.3576794527657516e-06, "Full-pretrain/Loss": 1.8685073852539062, "Full-pretrain/Loss (Raw)": 1.7226922512054443, "Full-pretrain/Step": 8247, "Full-pretrain/Step Time": 17.63101217150688} +{"Full-pretrain/Learning Rate": 2.3540812189868005e-06, "Full-pretrain/Loss": 1.8549582958221436, "Full-pretrain/Loss (Raw)": 1.860435962677002, "Full-pretrain/Step": 8248, "Full-pretrain/Step Time": 17.63282233849168} +{"Full-pretrain/Learning Rate": 2.3504855974066236e-06, "Full-pretrain/Loss": 1.852097749710083, "Full-pretrain/Loss (Raw)": 1.666182279586792, "Full-pretrain/Step": 8249, "Full-pretrain/Step Time": 17.629854509606957} +{"Full-pretrain/Learning Rate": 2.346892588439981e-06, "Full-pretrain/Loss": 1.8517735004425049, "Full-pretrain/Loss (Raw)": 1.9292927980422974, "Full-pretrain/Step": 8250, "Full-pretrain/Step Time": 17.625393772497773} +{"Full-pretrain/Learning Rate": 2.3433021925013092e-06, "Full-pretrain/Loss": 1.8546435832977295, "Full-pretrain/Loss (Raw)": 2.0761795043945312, "Full-pretrain/Step": 8251, "Full-pretrain/Step Time": 17.627372939139605} +{"Full-pretrain/Learning Rate": 2.3397144100047673e-06, "Full-pretrain/Loss": 1.85921311378479, "Full-pretrain/Loss (Raw)": 1.7708148956298828, "Full-pretrain/Step": 8252, "Full-pretrain/Step Time": 17.629053181037307} +{"Full-pretrain/Learning Rate": 2.3361292413642043e-06, "Full-pretrain/Loss": 1.8600871562957764, "Full-pretrain/Loss (Raw)": 2.0123488903045654, "Full-pretrain/Step": 8253, "Full-pretrain/Step Time": 17.62395003810525} +{"Full-pretrain/Learning Rate": 2.3325466869931756e-06, "Full-pretrain/Loss": 1.8705482482910156, "Full-pretrain/Loss (Raw)": 2.298186779022217, "Full-pretrain/Step": 8254, "Full-pretrain/Step Time": 17.625454261898994} +{"Full-pretrain/Learning Rate": 2.3289667473049143e-06, "Full-pretrain/Loss": 1.8784842491149902, "Full-pretrain/Loss (Raw)": 1.9510245323181152, "Full-pretrain/Step": 8255, "Full-pretrain/Step Time": 17.62856850773096} +{"Full-pretrain/Learning Rate": 2.325389422712379e-06, "Full-pretrain/Loss": 1.8872671127319336, "Full-pretrain/Loss (Raw)": 2.1873972415924072, "Full-pretrain/Step": 8256, "Full-pretrain/Step Time": 17.62949452921748} +{"Full-pretrain/Learning Rate": 2.321814713628198e-06, "Full-pretrain/Loss": 1.8875844478607178, "Full-pretrain/Loss (Raw)": 2.027888536453247, "Full-pretrain/Step": 8257, "Full-pretrain/Step Time": 17.627626257017255} +{"Full-pretrain/Learning Rate": 2.3182426204647197e-06, "Full-pretrain/Loss": 1.886886477470398, "Full-pretrain/Loss (Raw)": 2.076692581176758, "Full-pretrain/Step": 8258, "Full-pretrain/Step Time": 17.620716558769345} +{"Full-pretrain/Learning Rate": 2.3146731436339857e-06, "Full-pretrain/Loss": 1.8722069263458252, "Full-pretrain/Loss (Raw)": 1.5673508644104004, "Full-pretrain/Step": 8259, "Full-pretrain/Step Time": 17.620501833036542} +{"Full-pretrain/Learning Rate": 2.3111062835477315e-06, "Full-pretrain/Loss": 1.868802785873413, "Full-pretrain/Loss (Raw)": 1.837372064590454, "Full-pretrain/Step": 8260, "Full-pretrain/Step Time": 17.621527832001448} +{"Full-pretrain/Learning Rate": 2.3075420406173997e-06, "Full-pretrain/Loss": 1.8729839324951172, "Full-pretrain/Loss (Raw)": 1.9503116607666016, "Full-pretrain/Step": 8261, "Full-pretrain/Step Time": 17.625941084697843} +{"Full-pretrain/Learning Rate": 2.3039804152541146e-06, "Full-pretrain/Loss": 1.8851944208145142, "Full-pretrain/Loss (Raw)": 1.9086878299713135, "Full-pretrain/Step": 8262, "Full-pretrain/Step Time": 17.622007597237825} +{"Full-pretrain/Learning Rate": 2.300421407868711e-06, "Full-pretrain/Loss": 1.8852922916412354, "Full-pretrain/Loss (Raw)": 1.9222736358642578, "Full-pretrain/Step": 8263, "Full-pretrain/Step Time": 17.62436236999929} +{"Full-pretrain/Learning Rate": 2.2968650188717218e-06, "Full-pretrain/Loss": 1.9031445980072021, "Full-pretrain/Loss (Raw)": 1.9569464921951294, "Full-pretrain/Step": 8264, "Full-pretrain/Step Time": 17.627358816564083} +{"Full-pretrain/Learning Rate": 2.2933112486733716e-06, "Full-pretrain/Loss": 1.9085444211959839, "Full-pretrain/Loss (Raw)": 1.9330898523330688, "Full-pretrain/Step": 8265, "Full-pretrain/Step Time": 17.627964155748487} +{"Full-pretrain/Learning Rate": 2.2897600976835963e-06, "Full-pretrain/Loss": 1.918444275856018, "Full-pretrain/Loss (Raw)": 2.0011885166168213, "Full-pretrain/Step": 8266, "Full-pretrain/Step Time": 17.619945663958788} +{"Full-pretrain/Learning Rate": 2.2862115663120076e-06, "Full-pretrain/Loss": 1.9198592901229858, "Full-pretrain/Loss (Raw)": 1.844635248184204, "Full-pretrain/Step": 8267, "Full-pretrain/Step Time": 17.62388540431857} +{"Full-pretrain/Learning Rate": 2.2826656549679332e-06, "Full-pretrain/Loss": 1.917078971862793, "Full-pretrain/Loss (Raw)": 1.8379782438278198, "Full-pretrain/Step": 8268, "Full-pretrain/Step Time": 17.63156273588538} +{"Full-pretrain/Learning Rate": 2.279122364060393e-06, "Full-pretrain/Loss": 1.9279460906982422, "Full-pretrain/Loss (Raw)": 2.244539976119995, "Full-pretrain/Step": 8269, "Full-pretrain/Step Time": 17.631367621943355} +{"Full-pretrain/Learning Rate": 2.275581693998108e-06, "Full-pretrain/Loss": 1.9337557554244995, "Full-pretrain/Loss (Raw)": 1.9024757146835327, "Full-pretrain/Step": 8270, "Full-pretrain/Step Time": 17.629047714173794} +{"Full-pretrain/Learning Rate": 2.272043645189481e-06, "Full-pretrain/Loss": 1.9337478876113892, "Full-pretrain/Loss (Raw)": 2.0173392295837402, "Full-pretrain/Step": 8271, "Full-pretrain/Step Time": 17.625707730650902} +{"Full-pretrain/Learning Rate": 2.268508218042639e-06, "Full-pretrain/Loss": 1.9253828525543213, "Full-pretrain/Loss (Raw)": 1.9589070081710815, "Full-pretrain/Step": 8272, "Full-pretrain/Step Time": 17.62984713539481} +{"Full-pretrain/Learning Rate": 2.264975412965381e-06, "Full-pretrain/Loss": 1.9362967014312744, "Full-pretrain/Loss (Raw)": 2.1768276691436768, "Full-pretrain/Step": 8273, "Full-pretrain/Step Time": 17.632348274812102} +{"Full-pretrain/Learning Rate": 2.2614452303652195e-06, "Full-pretrain/Loss": 1.938774585723877, "Full-pretrain/Loss (Raw)": 1.9675260782241821, "Full-pretrain/Step": 8274, "Full-pretrain/Step Time": 17.633368818089366} +{"Full-pretrain/Learning Rate": 2.257917670649359e-06, "Full-pretrain/Loss": 1.9328728914260864, "Full-pretrain/Loss (Raw)": 1.8809888362884521, "Full-pretrain/Step": 8275, "Full-pretrain/Step Time": 17.62949712201953} +{"Full-pretrain/Learning Rate": 2.2543927342247086e-06, "Full-pretrain/Loss": 1.9361538887023926, "Full-pretrain/Loss (Raw)": 1.9722599983215332, "Full-pretrain/Step": 8276, "Full-pretrain/Step Time": 17.634065283462405} +{"Full-pretrain/Learning Rate": 2.250870421497858e-06, "Full-pretrain/Loss": 1.941877841949463, "Full-pretrain/Loss (Raw)": 2.182405948638916, "Full-pretrain/Step": 8277, "Full-pretrain/Step Time": 17.63638507388532} +{"Full-pretrain/Learning Rate": 2.2473507328751086e-06, "Full-pretrain/Loss": 1.9546082019805908, "Full-pretrain/Loss (Raw)": 1.9052187204360962, "Full-pretrain/Step": 8278, "Full-pretrain/Step Time": 17.637181002646685} +{"Full-pretrain/Learning Rate": 2.24383366876246e-06, "Full-pretrain/Loss": 1.9656169414520264, "Full-pretrain/Loss (Raw)": 2.0749714374542236, "Full-pretrain/Step": 8279, "Full-pretrain/Step Time": 17.626757951453328} +{"Full-pretrain/Learning Rate": 2.2403192295655962e-06, "Full-pretrain/Loss": 1.971766471862793, "Full-pretrain/Loss (Raw)": 2.057224750518799, "Full-pretrain/Step": 8280, "Full-pretrain/Step Time": 17.628762912005186} +{"Full-pretrain/Learning Rate": 2.236807415689912e-06, "Full-pretrain/Loss": 1.9869481325149536, "Full-pretrain/Loss (Raw)": 2.1519935131073, "Full-pretrain/Step": 8281, "Full-pretrain/Step Time": 17.628183964639902} +{"Full-pretrain/Learning Rate": 2.2332982275405005e-06, "Full-pretrain/Loss": 1.986741542816162, "Full-pretrain/Loss (Raw)": 1.9226830005645752, "Full-pretrain/Step": 8282, "Full-pretrain/Step Time": 17.635734541341662} +{"Full-pretrain/Learning Rate": 2.2297916655221297e-06, "Full-pretrain/Loss": 1.974304437637329, "Full-pretrain/Loss (Raw)": 1.6781938076019287, "Full-pretrain/Step": 8283, "Full-pretrain/Step Time": 17.63319501839578} +{"Full-pretrain/Learning Rate": 2.226287730039289e-06, "Full-pretrain/Loss": 1.9867624044418335, "Full-pretrain/Loss (Raw)": 2.16947078704834, "Full-pretrain/Step": 8284, "Full-pretrain/Step Time": 17.632196974009275} +{"Full-pretrain/Learning Rate": 2.2227864214961562e-06, "Full-pretrain/Loss": 1.9867174625396729, "Full-pretrain/Loss (Raw)": 2.010909080505371, "Full-pretrain/Step": 8285, "Full-pretrain/Step Time": 17.63219726085663} +{"Full-pretrain/Learning Rate": 2.219287740296605e-06, "Full-pretrain/Loss": 1.9776326417922974, "Full-pretrain/Loss (Raw)": 2.007473945617676, "Full-pretrain/Step": 8286, "Full-pretrain/Step Time": 17.632055148482323} +{"Full-pretrain/Learning Rate": 2.2157916868442125e-06, "Full-pretrain/Loss": 1.9790573120117188, "Full-pretrain/Loss (Raw)": 1.9966139793395996, "Full-pretrain/Step": 8287, "Full-pretrain/Step Time": 17.631099704653025} +{"Full-pretrain/Learning Rate": 2.2122982615422365e-06, "Full-pretrain/Loss": 1.9671990871429443, "Full-pretrain/Loss (Raw)": 1.8079313039779663, "Full-pretrain/Step": 8288, "Full-pretrain/Step Time": 17.62691307067871} +{"Full-pretrain/Learning Rate": 2.2088074647936524e-06, "Full-pretrain/Loss": 1.972550392150879, "Full-pretrain/Loss (Raw)": 2.199130058288574, "Full-pretrain/Step": 8289, "Full-pretrain/Step Time": 17.628355050459504} +{"Full-pretrain/Learning Rate": 2.205319297001113e-06, "Full-pretrain/Loss": 1.969387412071228, "Full-pretrain/Loss (Raw)": 1.975480556488037, "Full-pretrain/Step": 8290, "Full-pretrain/Step Time": 17.621389212086797} +{"Full-pretrain/Learning Rate": 2.201833758566982e-06, "Full-pretrain/Loss": 1.9762001037597656, "Full-pretrain/Loss (Raw)": 1.7853535413742065, "Full-pretrain/Step": 8291, "Full-pretrain/Step Time": 17.619284307584167} +{"Full-pretrain/Learning Rate": 2.1983508498933185e-06, "Full-pretrain/Loss": 1.9762983322143555, "Full-pretrain/Loss (Raw)": 1.8405158519744873, "Full-pretrain/Step": 8292, "Full-pretrain/Step Time": 17.623053876683116} +{"Full-pretrain/Learning Rate": 2.1948705713818683e-06, "Full-pretrain/Loss": 1.9752187728881836, "Full-pretrain/Loss (Raw)": 1.9157651662826538, "Full-pretrain/Step": 8293, "Full-pretrain/Step Time": 17.62284736149013} +{"Full-pretrain/Learning Rate": 2.191392923434085e-06, "Full-pretrain/Loss": 1.9722838401794434, "Full-pretrain/Loss (Raw)": 1.8147733211517334, "Full-pretrain/Step": 8294, "Full-pretrain/Step Time": 17.622218258678913} +{"Full-pretrain/Learning Rate": 2.1879179064511117e-06, "Full-pretrain/Loss": 1.9727243185043335, "Full-pretrain/Loss (Raw)": 1.9363665580749512, "Full-pretrain/Step": 8295, "Full-pretrain/Step Time": 17.62322884425521} +{"Full-pretrain/Learning Rate": 2.184445520833789e-06, "Full-pretrain/Loss": 1.9712464809417725, "Full-pretrain/Loss (Raw)": 1.909653902053833, "Full-pretrain/Step": 8296, "Full-pretrain/Step Time": 17.61965630017221} +{"Full-pretrain/Learning Rate": 2.1809757669826653e-06, "Full-pretrain/Loss": 1.963831901550293, "Full-pretrain/Loss (Raw)": 1.6958250999450684, "Full-pretrain/Step": 8297, "Full-pretrain/Step Time": 17.623114805668592} +{"Full-pretrain/Learning Rate": 2.1775086452979598e-06, "Full-pretrain/Loss": 1.9627275466918945, "Full-pretrain/Loss (Raw)": 1.9658503532409668, "Full-pretrain/Step": 8298, "Full-pretrain/Step Time": 17.622798092663288} +{"Full-pretrain/Learning Rate": 2.1740441561796137e-06, "Full-pretrain/Loss": 1.9635132551193237, "Full-pretrain/Loss (Raw)": 1.8697766065597534, "Full-pretrain/Step": 8299, "Full-pretrain/Step Time": 17.620572458952665} +{"Full-pretrain/Learning Rate": 2.1705823000272518e-06, "Full-pretrain/Loss": 1.965608835220337, "Full-pretrain/Loss (Raw)": 1.9050366878509521, "Full-pretrain/Step": 8300, "Full-pretrain/Step Time": 17.616325419396162} +{"Full-pretrain/Learning Rate": 2.167123077240199e-06, "Full-pretrain/Loss": 1.9581499099731445, "Full-pretrain/Loss (Raw)": 2.005852460861206, "Full-pretrain/Step": 8301, "Full-pretrain/Step Time": 17.62227221019566} +{"Full-pretrain/Learning Rate": 2.163666488217475e-06, "Full-pretrain/Loss": 1.9563488960266113, "Full-pretrain/Loss (Raw)": 1.8448420763015747, "Full-pretrain/Step": 8302, "Full-pretrain/Step Time": 17.624725172296166} +{"Full-pretrain/Learning Rate": 2.1602125333578025e-06, "Full-pretrain/Loss": 1.9535268545150757, "Full-pretrain/Loss (Raw)": 1.9270375967025757, "Full-pretrain/Step": 8303, "Full-pretrain/Step Time": 17.615936944261193} +{"Full-pretrain/Learning Rate": 2.15676121305958e-06, "Full-pretrain/Loss": 1.9357712268829346, "Full-pretrain/Loss (Raw)": 1.3907235860824585, "Full-pretrain/Step": 8304, "Full-pretrain/Step Time": 17.62206471711397} +{"Full-pretrain/Learning Rate": 2.1533125277209326e-06, "Full-pretrain/Loss": 1.931950569152832, "Full-pretrain/Loss (Raw)": 2.054567337036133, "Full-pretrain/Step": 8305, "Full-pretrain/Step Time": 17.62615542858839} +{"Full-pretrain/Learning Rate": 2.149866477739648e-06, "Full-pretrain/Loss": 1.9360969066619873, "Full-pretrain/Loss (Raw)": 2.1002087593078613, "Full-pretrain/Step": 8306, "Full-pretrain/Step Time": 17.628213491290808} +{"Full-pretrain/Learning Rate": 2.1464230635132366e-06, "Full-pretrain/Loss": 1.9407639503479004, "Full-pretrain/Loss (Raw)": 2.0303359031677246, "Full-pretrain/Step": 8307, "Full-pretrain/Step Time": 17.62569816224277} +{"Full-pretrain/Learning Rate": 2.142982285438899e-06, "Full-pretrain/Loss": 1.9432318210601807, "Full-pretrain/Loss (Raw)": 2.0512313842773438, "Full-pretrain/Step": 8308, "Full-pretrain/Step Time": 17.624470552429557} +{"Full-pretrain/Learning Rate": 2.1395441439135163e-06, "Full-pretrain/Loss": 1.9398504495620728, "Full-pretrain/Loss (Raw)": 2.074202060699463, "Full-pretrain/Step": 8309, "Full-pretrain/Step Time": 17.621741600334644} +{"Full-pretrain/Learning Rate": 2.136108639333684e-06, "Full-pretrain/Loss": 1.9380192756652832, "Full-pretrain/Loss (Raw)": 1.8466237783432007, "Full-pretrain/Step": 8310, "Full-pretrain/Step Time": 17.626568153500557} +{"Full-pretrain/Learning Rate": 2.1326757720956827e-06, "Full-pretrain/Loss": 1.9396750926971436, "Full-pretrain/Loss (Raw)": 2.127953290939331, "Full-pretrain/Step": 8311, "Full-pretrain/Step Time": 17.631249664351344} +{"Full-pretrain/Learning Rate": 2.129245542595498e-06, "Full-pretrain/Loss": 1.9364819526672363, "Full-pretrain/Loss (Raw)": 1.9550459384918213, "Full-pretrain/Step": 8312, "Full-pretrain/Step Time": 17.629904137924314} +{"Full-pretrain/Learning Rate": 2.125817951228806e-06, "Full-pretrain/Loss": 1.9253958463668823, "Full-pretrain/Loss (Raw)": 1.7972389459609985, "Full-pretrain/Step": 8313, "Full-pretrain/Step Time": 17.634648017585278} +{"Full-pretrain/Learning Rate": 2.1223929983909705e-06, "Full-pretrain/Loss": 1.9261094331741333, "Full-pretrain/Loss (Raw)": 1.9455188512802124, "Full-pretrain/Step": 8314, "Full-pretrain/Step Time": 17.639537999406457} +{"Full-pretrain/Learning Rate": 2.118970684477062e-06, "Full-pretrain/Loss": 1.934004306793213, "Full-pretrain/Loss (Raw)": 1.930829405784607, "Full-pretrain/Step": 8315, "Full-pretrain/Step Time": 17.63580707460642} +{"Full-pretrain/Learning Rate": 2.1155510098818445e-06, "Full-pretrain/Loss": 1.9236764907836914, "Full-pretrain/Loss (Raw)": 1.8389792442321777, "Full-pretrain/Step": 8316, "Full-pretrain/Step Time": 17.637433987110853} +{"Full-pretrain/Learning Rate": 2.112133974999775e-06, "Full-pretrain/Loss": 1.926965594291687, "Full-pretrain/Loss (Raw)": 2.1161625385284424, "Full-pretrain/Step": 8317, "Full-pretrain/Step Time": 17.634772228077054} +{"Full-pretrain/Learning Rate": 2.108719580225013e-06, "Full-pretrain/Loss": 1.9204607009887695, "Full-pretrain/Loss (Raw)": 1.7993202209472656, "Full-pretrain/Step": 8318, "Full-pretrain/Step Time": 17.641027888283134} +{"Full-pretrain/Learning Rate": 2.1053078259513996e-06, "Full-pretrain/Loss": 1.9127509593963623, "Full-pretrain/Loss (Raw)": 1.7498986721038818, "Full-pretrain/Step": 8319, "Full-pretrain/Step Time": 17.6421790830791} +{"Full-pretrain/Learning Rate": 2.101898712572484e-06, "Full-pretrain/Loss": 1.9150333404541016, "Full-pretrain/Loss (Raw)": 1.8809661865234375, "Full-pretrain/Step": 8320, "Full-pretrain/Step Time": 17.647512804716825} +{"Full-pretrain/Learning Rate": 2.098492240481506e-06, "Full-pretrain/Loss": 1.913771629333496, "Full-pretrain/Loss (Raw)": 2.158759593963623, "Full-pretrain/Step": 8321, "Full-pretrain/Step Time": 17.637925073504448} +{"Full-pretrain/Learning Rate": 2.095088410071397e-06, "Full-pretrain/Loss": 1.912461519241333, "Full-pretrain/Loss (Raw)": 1.9335585832595825, "Full-pretrain/Step": 8322, "Full-pretrain/Step Time": 17.648096730932593} +{"Full-pretrain/Learning Rate": 2.091687221734789e-06, "Full-pretrain/Loss": 1.9157845973968506, "Full-pretrain/Loss (Raw)": 1.8916863203048706, "Full-pretrain/Step": 8323, "Full-pretrain/Step Time": 17.640089688822627} +{"Full-pretrain/Learning Rate": 2.088288675864017e-06, "Full-pretrain/Loss": 1.9121289253234863, "Full-pretrain/Loss (Raw)": 1.7235333919525146, "Full-pretrain/Step": 8324, "Full-pretrain/Step Time": 17.642787516117096} +{"Full-pretrain/Learning Rate": 2.084892772851088e-06, "Full-pretrain/Loss": 1.9100759029388428, "Full-pretrain/Loss (Raw)": 1.8500702381134033, "Full-pretrain/Step": 8325, "Full-pretrain/Step Time": 17.643491193652153} +{"Full-pretrain/Learning Rate": 2.0814995130877256e-06, "Full-pretrain/Loss": 1.9061216115951538, "Full-pretrain/Loss (Raw)": 1.6882367134094238, "Full-pretrain/Step": 8326, "Full-pretrain/Step Time": 17.646101204678416} +{"Full-pretrain/Learning Rate": 2.078108896965339e-06, "Full-pretrain/Loss": 1.908811092376709, "Full-pretrain/Loss (Raw)": 2.022429943084717, "Full-pretrain/Step": 8327, "Full-pretrain/Step Time": 17.6466976236552} +{"Full-pretrain/Learning Rate": 2.074720924875037e-06, "Full-pretrain/Loss": 1.8995966911315918, "Full-pretrain/Loss (Raw)": 1.614794373512268, "Full-pretrain/Step": 8328, "Full-pretrain/Step Time": 17.642456881701946} +{"Full-pretrain/Learning Rate": 2.071335597207624e-06, "Full-pretrain/Loss": 1.8990405797958374, "Full-pretrain/Loss (Raw)": 1.6780271530151367, "Full-pretrain/Step": 8329, "Full-pretrain/Step Time": 17.64002864435315} +{"Full-pretrain/Learning Rate": 2.067952914353588e-06, "Full-pretrain/Loss": 1.891869306564331, "Full-pretrain/Loss (Raw)": 1.7363697290420532, "Full-pretrain/Step": 8330, "Full-pretrain/Step Time": 17.641212424263358} +{"Full-pretrain/Learning Rate": 2.0645728767031246e-06, "Full-pretrain/Loss": 1.8896093368530273, "Full-pretrain/Loss (Raw)": 1.797457218170166, "Full-pretrain/Step": 8331, "Full-pretrain/Step Time": 17.639992268756032} +{"Full-pretrain/Learning Rate": 2.0611954846461167e-06, "Full-pretrain/Loss": 1.8919472694396973, "Full-pretrain/Loss (Raw)": 1.9798492193222046, "Full-pretrain/Step": 8332, "Full-pretrain/Step Time": 17.64042448438704} +{"Full-pretrain/Learning Rate": 2.0578207385721526e-06, "Full-pretrain/Loss": 1.8820364475250244, "Full-pretrain/Loss (Raw)": 1.6887110471725464, "Full-pretrain/Step": 8333, "Full-pretrain/Step Time": 17.64372807368636} +{"Full-pretrain/Learning Rate": 2.054448638870507e-06, "Full-pretrain/Loss": 1.8876996040344238, "Full-pretrain/Loss (Raw)": 2.0260586738586426, "Full-pretrain/Step": 8334, "Full-pretrain/Step Time": 17.643840247765183} +{"Full-pretrain/Learning Rate": 2.0510791859301408e-06, "Full-pretrain/Loss": 1.8983405828475952, "Full-pretrain/Loss (Raw)": 2.2675490379333496, "Full-pretrain/Step": 8335, "Full-pretrain/Step Time": 17.640329966321588} +{"Full-pretrain/Learning Rate": 2.047712380139727e-06, "Full-pretrain/Loss": 1.9149054288864136, "Full-pretrain/Loss (Raw)": 1.92079758644104, "Full-pretrain/Step": 8336, "Full-pretrain/Step Time": 17.639691974967718} +{"Full-pretrain/Learning Rate": 2.0443482218876265e-06, "Full-pretrain/Loss": 1.9163691997528076, "Full-pretrain/Loss (Raw)": 2.101409673690796, "Full-pretrain/Step": 8337, "Full-pretrain/Step Time": 17.643981333822012} +{"Full-pretrain/Learning Rate": 2.040986711561893e-06, "Full-pretrain/Loss": 1.9069099426269531, "Full-pretrain/Loss (Raw)": 1.7975108623504639, "Full-pretrain/Step": 8338, "Full-pretrain/Step Time": 17.645101191475987} +{"Full-pretrain/Learning Rate": 2.0376278495502693e-06, "Full-pretrain/Loss": 1.9054553508758545, "Full-pretrain/Loss (Raw)": 1.9837901592254639, "Full-pretrain/Step": 8339, "Full-pretrain/Step Time": 17.646555352956057} +{"Full-pretrain/Learning Rate": 2.0342716362402094e-06, "Full-pretrain/Loss": 1.905574083328247, "Full-pretrain/Loss (Raw)": 2.0550293922424316, "Full-pretrain/Step": 8340, "Full-pretrain/Step Time": 17.6480061840266} +{"Full-pretrain/Learning Rate": 2.030918072018842e-06, "Full-pretrain/Loss": 1.9034020900726318, "Full-pretrain/Loss (Raw)": 2.004697799682617, "Full-pretrain/Step": 8341, "Full-pretrain/Step Time": 17.646784756332636} +{"Full-pretrain/Learning Rate": 2.027567157273e-06, "Full-pretrain/Loss": 1.9013292789459229, "Full-pretrain/Loss (Raw)": 1.7802977561950684, "Full-pretrain/Step": 8342, "Full-pretrain/Step Time": 17.65432714857161} +{"Full-pretrain/Learning Rate": 2.0242188923892154e-06, "Full-pretrain/Loss": 1.9018875360488892, "Full-pretrain/Loss (Raw)": 2.145814895629883, "Full-pretrain/Step": 8343, "Full-pretrain/Step Time": 17.657026890665293} +{"Full-pretrain/Learning Rate": 2.0208732777537072e-06, "Full-pretrain/Loss": 1.8925247192382812, "Full-pretrain/Loss (Raw)": 1.6554365158081055, "Full-pretrain/Step": 8344, "Full-pretrain/Step Time": 17.658697485923767} +{"Full-pretrain/Learning Rate": 2.0175303137523943e-06, "Full-pretrain/Loss": 1.9065711498260498, "Full-pretrain/Loss (Raw)": 2.2467246055603027, "Full-pretrain/Step": 8345, "Full-pretrain/Step Time": 17.655505234375596} +{"Full-pretrain/Learning Rate": 2.01419000077088e-06, "Full-pretrain/Loss": 1.9013676643371582, "Full-pretrain/Loss (Raw)": 1.7790067195892334, "Full-pretrain/Step": 8346, "Full-pretrain/Step Time": 17.65484927035868} +{"Full-pretrain/Learning Rate": 2.0108523391944717e-06, "Full-pretrain/Loss": 1.9069534540176392, "Full-pretrain/Loss (Raw)": 2.1095757484436035, "Full-pretrain/Step": 8347, "Full-pretrain/Step Time": 17.650224586948752} +{"Full-pretrain/Learning Rate": 2.007517329408165e-06, "Full-pretrain/Loss": 1.90838623046875, "Full-pretrain/Loss (Raw)": 1.8848291635513306, "Full-pretrain/Step": 8348, "Full-pretrain/Step Time": 17.6550110001117} +{"Full-pretrain/Learning Rate": 2.004184971796658e-06, "Full-pretrain/Loss": 1.9027087688446045, "Full-pretrain/Loss (Raw)": 1.9344826936721802, "Full-pretrain/Step": 8349, "Full-pretrain/Step Time": 17.65158729068935} +{"Full-pretrain/Learning Rate": 2.0008552667443335e-06, "Full-pretrain/Loss": 1.9039478302001953, "Full-pretrain/Loss (Raw)": 1.8389718532562256, "Full-pretrain/Step": 8350, "Full-pretrain/Step Time": 17.649289758875966} +{"Full-pretrain/Learning Rate": 1.997528214635269e-06, "Full-pretrain/Loss": 1.905900001525879, "Full-pretrain/Loss (Raw)": 1.8123670816421509, "Full-pretrain/Step": 8351, "Full-pretrain/Step Time": 17.655574904754758} +{"Full-pretrain/Learning Rate": 1.9942038158532407e-06, "Full-pretrain/Loss": 1.911033272743225, "Full-pretrain/Loss (Raw)": 2.0452308654785156, "Full-pretrain/Step": 8352, "Full-pretrain/Step Time": 17.65510617569089} +{"Full-pretrain/Learning Rate": 1.990882070781719e-06, "Full-pretrain/Loss": 1.896579384803772, "Full-pretrain/Loss (Raw)": 1.6962354183197021, "Full-pretrain/Step": 8353, "Full-pretrain/Step Time": 17.658713752403855} +{"Full-pretrain/Learning Rate": 1.9875629798038668e-06, "Full-pretrain/Loss": 1.88214111328125, "Full-pretrain/Loss (Raw)": 1.4715303182601929, "Full-pretrain/Step": 8354, "Full-pretrain/Step Time": 17.6565566547215} +{"Full-pretrain/Learning Rate": 1.9842465433025343e-06, "Full-pretrain/Loss": 1.883802890777588, "Full-pretrain/Loss (Raw)": 1.9448661804199219, "Full-pretrain/Step": 8355, "Full-pretrain/Step Time": 17.654198732227087} +{"Full-pretrain/Learning Rate": 1.9809327616602784e-06, "Full-pretrain/Loss": 1.8881287574768066, "Full-pretrain/Loss (Raw)": 1.8619608879089355, "Full-pretrain/Step": 8356, "Full-pretrain/Step Time": 17.65628561936319} +{"Full-pretrain/Learning Rate": 1.977621635259336e-06, "Full-pretrain/Loss": 1.8909045457839966, "Full-pretrain/Loss (Raw)": 1.9388964176177979, "Full-pretrain/Step": 8357, "Full-pretrain/Step Time": 17.653044255450368} +{"Full-pretrain/Learning Rate": 1.9743131644816477e-06, "Full-pretrain/Loss": 1.8948414325714111, "Full-pretrain/Loss (Raw)": 1.8142157793045044, "Full-pretrain/Step": 8358, "Full-pretrain/Step Time": 17.650004932656884} +{"Full-pretrain/Learning Rate": 1.971007349708842e-06, "Full-pretrain/Loss": 1.8992621898651123, "Full-pretrain/Loss (Raw)": 2.1638925075531006, "Full-pretrain/Step": 8359, "Full-pretrain/Step Time": 17.652622988447547} +{"Full-pretrain/Learning Rate": 1.9677041913222476e-06, "Full-pretrain/Loss": 1.906832218170166, "Full-pretrain/Loss (Raw)": 1.85703706741333, "Full-pretrain/Step": 8360, "Full-pretrain/Step Time": 17.655085131525993} +{"Full-pretrain/Learning Rate": 1.964403689702882e-06, "Full-pretrain/Loss": 1.9006922245025635, "Full-pretrain/Loss (Raw)": 1.4815495014190674, "Full-pretrain/Step": 8361, "Full-pretrain/Step Time": 17.651713794097304} +{"Full-pretrain/Learning Rate": 1.9611058452314535e-06, "Full-pretrain/Loss": 1.895169734954834, "Full-pretrain/Loss (Raw)": 1.5596472024917603, "Full-pretrain/Step": 8362, "Full-pretrain/Step Time": 17.648189501836896} +{"Full-pretrain/Learning Rate": 1.95781065828837e-06, "Full-pretrain/Loss": 1.9094034433364868, "Full-pretrain/Loss (Raw)": 2.2529373168945312, "Full-pretrain/Step": 8363, "Full-pretrain/Step Time": 17.646359788253903} +{"Full-pretrain/Learning Rate": 1.9545181292537267e-06, "Full-pretrain/Loss": 1.9037492275238037, "Full-pretrain/Loss (Raw)": 1.798911452293396, "Full-pretrain/Step": 8364, "Full-pretrain/Step Time": 17.64980221912265} +{"Full-pretrain/Learning Rate": 1.9512282585073205e-06, "Full-pretrain/Loss": 1.9127299785614014, "Full-pretrain/Loss (Raw)": 1.9760982990264893, "Full-pretrain/Step": 8365, "Full-pretrain/Step Time": 17.650919619947672} +{"Full-pretrain/Learning Rate": 1.947941046428639e-06, "Full-pretrain/Loss": 1.917697548866272, "Full-pretrain/Loss (Raw)": 2.1850197315216064, "Full-pretrain/Step": 8366, "Full-pretrain/Step Time": 17.647772887721658} +{"Full-pretrain/Learning Rate": 1.9446564933968513e-06, "Full-pretrain/Loss": 1.9105583429336548, "Full-pretrain/Loss (Raw)": 2.039095640182495, "Full-pretrain/Step": 8367, "Full-pretrain/Step Time": 17.648266712203622} +{"Full-pretrain/Learning Rate": 1.941374599790838e-06, "Full-pretrain/Loss": 1.9125871658325195, "Full-pretrain/Loss (Raw)": 1.9857237339019775, "Full-pretrain/Step": 8368, "Full-pretrain/Step Time": 17.651235833764076} +{"Full-pretrain/Learning Rate": 1.9380953659891563e-06, "Full-pretrain/Loss": 1.9040932655334473, "Full-pretrain/Loss (Raw)": 1.8296003341674805, "Full-pretrain/Step": 8369, "Full-pretrain/Step Time": 17.65485388599336} +{"Full-pretrain/Learning Rate": 1.9348187923700772e-06, "Full-pretrain/Loss": 1.8991833925247192, "Full-pretrain/Loss (Raw)": 1.6403933763504028, "Full-pretrain/Step": 8370, "Full-pretrain/Step Time": 17.658377435058355} +{"Full-pretrain/Learning Rate": 1.9315448793115395e-06, "Full-pretrain/Loss": 1.898039698600769, "Full-pretrain/Loss (Raw)": 1.9471927881240845, "Full-pretrain/Step": 8371, "Full-pretrain/Step Time": 17.64721398241818} +{"Full-pretrain/Learning Rate": 1.9282736271911935e-06, "Full-pretrain/Loss": 1.898945689201355, "Full-pretrain/Loss (Raw)": 2.084023952484131, "Full-pretrain/Step": 8372, "Full-pretrain/Step Time": 17.64866608195007} +{"Full-pretrain/Learning Rate": 1.925005036386382e-06, "Full-pretrain/Loss": 1.8890318870544434, "Full-pretrain/Loss (Raw)": 1.6874537467956543, "Full-pretrain/Step": 8373, "Full-pretrain/Step Time": 17.65034900419414} +{"Full-pretrain/Learning Rate": 1.921739107274123e-06, "Full-pretrain/Loss": 1.8973489999771118, "Full-pretrain/Loss (Raw)": 2.046444892883301, "Full-pretrain/Step": 8374, "Full-pretrain/Step Time": 17.650625241920352} +{"Full-pretrain/Learning Rate": 1.9184758402311514e-06, "Full-pretrain/Loss": 1.8815228939056396, "Full-pretrain/Loss (Raw)": 1.6393811702728271, "Full-pretrain/Step": 8375, "Full-pretrain/Step Time": 17.649928582832217} +{"Full-pretrain/Learning Rate": 1.915215235633883e-06, "Full-pretrain/Loss": 1.8871736526489258, "Full-pretrain/Loss (Raw)": 1.8362585306167603, "Full-pretrain/Step": 8376, "Full-pretrain/Step Time": 17.65462440997362} +{"Full-pretrain/Learning Rate": 1.9119572938584184e-06, "Full-pretrain/Loss": 1.877217173576355, "Full-pretrain/Loss (Raw)": 1.9281190633773804, "Full-pretrain/Step": 8377, "Full-pretrain/Step Time": 17.651716243475676} +{"Full-pretrain/Learning Rate": 1.9087020152805698e-06, "Full-pretrain/Loss": 1.876511573791504, "Full-pretrain/Loss (Raw)": 1.7564295530319214, "Full-pretrain/Step": 8378, "Full-pretrain/Step Time": 17.6512578073889} +{"Full-pretrain/Learning Rate": 1.9054494002758245e-06, "Full-pretrain/Loss": 1.8746225833892822, "Full-pretrain/Loss (Raw)": 2.049123525619507, "Full-pretrain/Step": 8379, "Full-pretrain/Step Time": 17.650999726727605} +{"Full-pretrain/Learning Rate": 1.9021994492193773e-06, "Full-pretrain/Loss": 1.8778151273727417, "Full-pretrain/Loss (Raw)": 1.9869929552078247, "Full-pretrain/Step": 8380, "Full-pretrain/Step Time": 17.655328515917063} +{"Full-pretrain/Learning Rate": 1.8989521624861089e-06, "Full-pretrain/Loss": 1.879844307899475, "Full-pretrain/Loss (Raw)": 1.9994168281555176, "Full-pretrain/Step": 8381, "Full-pretrain/Step Time": 17.65548704750836} +{"Full-pretrain/Learning Rate": 1.895707540450592e-06, "Full-pretrain/Loss": 1.8800714015960693, "Full-pretrain/Loss (Raw)": 1.8462404012680054, "Full-pretrain/Step": 8382, "Full-pretrain/Step Time": 17.658565985038877} +{"Full-pretrain/Learning Rate": 1.8924655834870853e-06, "Full-pretrain/Loss": 1.8817059993743896, "Full-pretrain/Loss (Raw)": 1.8646703958511353, "Full-pretrain/Step": 8383, "Full-pretrain/Step Time": 17.654785526916385} +{"Full-pretrain/Learning Rate": 1.8892262919695563e-06, "Full-pretrain/Loss": 1.8716950416564941, "Full-pretrain/Loss (Raw)": 1.7248809337615967, "Full-pretrain/Step": 8384, "Full-pretrain/Step Time": 17.649904185906053} +{"Full-pretrain/Learning Rate": 1.885989666271651e-06, "Full-pretrain/Loss": 1.8846969604492188, "Full-pretrain/Loss (Raw)": 2.1122961044311523, "Full-pretrain/Step": 8385, "Full-pretrain/Step Time": 17.650630988180637} +{"Full-pretrain/Learning Rate": 1.8827557067667146e-06, "Full-pretrain/Loss": 1.9015998840332031, "Full-pretrain/Loss (Raw)": 2.0124266147613525, "Full-pretrain/Step": 8386, "Full-pretrain/Step Time": 17.65424489416182} +{"Full-pretrain/Learning Rate": 1.8795244138277878e-06, "Full-pretrain/Loss": 1.8958337306976318, "Full-pretrain/Loss (Raw)": 1.7603459358215332, "Full-pretrain/Step": 8387, "Full-pretrain/Step Time": 17.654707320034504} +{"Full-pretrain/Learning Rate": 1.8762957878275893e-06, "Full-pretrain/Loss": 1.902367353439331, "Full-pretrain/Loss (Raw)": 2.071040630340576, "Full-pretrain/Step": 8388, "Full-pretrain/Step Time": 17.652335742488503} +{"Full-pretrain/Learning Rate": 1.8730698291385518e-06, "Full-pretrain/Loss": 1.9056134223937988, "Full-pretrain/Loss (Raw)": 2.0427699089050293, "Full-pretrain/Step": 8389, "Full-pretrain/Step Time": 17.648629028350115} +{"Full-pretrain/Learning Rate": 1.8698465381327774e-06, "Full-pretrain/Loss": 1.9274691343307495, "Full-pretrain/Loss (Raw)": 2.513598680496216, "Full-pretrain/Step": 8390, "Full-pretrain/Step Time": 17.651193242520094} +{"Full-pretrain/Learning Rate": 1.8666259151820769e-06, "Full-pretrain/Loss": 1.9243141412734985, "Full-pretrain/Loss (Raw)": 2.0629310607910156, "Full-pretrain/Step": 8391, "Full-pretrain/Step Time": 17.65420839935541} +{"Full-pretrain/Learning Rate": 1.8634079606579507e-06, "Full-pretrain/Loss": 1.9279255867004395, "Full-pretrain/Loss (Raw)": 1.9726064205169678, "Full-pretrain/Step": 8392, "Full-pretrain/Step Time": 17.65022704936564} +{"Full-pretrain/Learning Rate": 1.8601926749315796e-06, "Full-pretrain/Loss": 1.9468963146209717, "Full-pretrain/Loss (Raw)": 2.0886130332946777, "Full-pretrain/Step": 8393, "Full-pretrain/Step Time": 17.64260113425553} +{"Full-pretrain/Learning Rate": 1.8569800583738556e-06, "Full-pretrain/Loss": 1.9587773084640503, "Full-pretrain/Loss (Raw)": 1.9398361444473267, "Full-pretrain/Step": 8394, "Full-pretrain/Step Time": 17.653534699231386} +{"Full-pretrain/Learning Rate": 1.8537701113553462e-06, "Full-pretrain/Loss": 1.9517204761505127, "Full-pretrain/Loss (Raw)": 2.0271215438842773, "Full-pretrain/Step": 8395, "Full-pretrain/Step Time": 17.65657903626561} +{"Full-pretrain/Learning Rate": 1.8505628342463193e-06, "Full-pretrain/Loss": 1.9580917358398438, "Full-pretrain/Loss (Raw)": 2.0027899742126465, "Full-pretrain/Step": 8396, "Full-pretrain/Step Time": 17.650109255686402} +{"Full-pretrain/Learning Rate": 1.84735822741674e-06, "Full-pretrain/Loss": 1.953730583190918, "Full-pretrain/Loss (Raw)": 1.8365414142608643, "Full-pretrain/Step": 8397, "Full-pretrain/Step Time": 17.650155747309327} +{"Full-pretrain/Learning Rate": 1.8441562912362487e-06, "Full-pretrain/Loss": 1.944680094718933, "Full-pretrain/Loss (Raw)": 1.895404577255249, "Full-pretrain/Step": 8398, "Full-pretrain/Step Time": 17.656521167606115} +{"Full-pretrain/Learning Rate": 1.8409570260741916e-06, "Full-pretrain/Loss": 1.944657325744629, "Full-pretrain/Loss (Raw)": 2.03836727142334, "Full-pretrain/Step": 8399, "Full-pretrain/Step Time": 17.659480784088373} +{"Full-pretrain/Learning Rate": 1.837760432299601e-06, "Full-pretrain/Loss": 1.9595470428466797, "Full-pretrain/Loss (Raw)": 2.4621901512145996, "Full-pretrain/Step": 8400, "Full-pretrain/Step Time": 17.66107663884759} +{"Full-pretrain/Learning Rate": 1.8345665102812076e-06, "Full-pretrain/Loss": 1.9591177701950073, "Full-pretrain/Loss (Raw)": 1.8158665895462036, "Full-pretrain/Step": 8401, "Full-pretrain/Step Time": 17.65799544379115} +{"Full-pretrain/Learning Rate": 1.8313752603874246e-06, "Full-pretrain/Loss": 1.9707494974136353, "Full-pretrain/Loss (Raw)": 2.012610673904419, "Full-pretrain/Step": 8402, "Full-pretrain/Step Time": 17.655107844620943} +{"Full-pretrain/Learning Rate": 1.8281866829863687e-06, "Full-pretrain/Loss": 1.9636602401733398, "Full-pretrain/Loss (Raw)": 1.7203357219696045, "Full-pretrain/Step": 8403, "Full-pretrain/Step Time": 17.657249035313725} +{"Full-pretrain/Learning Rate": 1.825000778445829e-06, "Full-pretrain/Loss": 1.9576689004898071, "Full-pretrain/Loss (Raw)": 1.8923008441925049, "Full-pretrain/Step": 8404, "Full-pretrain/Step Time": 17.66088962368667} +{"Full-pretrain/Learning Rate": 1.8218175471333116e-06, "Full-pretrain/Loss": 1.9573493003845215, "Full-pretrain/Loss (Raw)": 1.6772260665893555, "Full-pretrain/Step": 8405, "Full-pretrain/Step Time": 17.65587786398828} +{"Full-pretrain/Learning Rate": 1.8186369894159921e-06, "Full-pretrain/Loss": 1.9514729976654053, "Full-pretrain/Loss (Raw)": 1.8584034442901611, "Full-pretrain/Step": 8406, "Full-pretrain/Step Time": 17.6579618640244} +{"Full-pretrain/Learning Rate": 1.8154591056607467e-06, "Full-pretrain/Loss": 1.9474198818206787, "Full-pretrain/Loss (Raw)": 1.5096802711486816, "Full-pretrain/Step": 8407, "Full-pretrain/Step Time": 17.6705965064466} +{"Full-pretrain/Learning Rate": 1.8122838962341515e-06, "Full-pretrain/Loss": 1.9461108446121216, "Full-pretrain/Loss (Raw)": 1.7943705320358276, "Full-pretrain/Step": 8408, "Full-pretrain/Step Time": 17.667674208059907} +{"Full-pretrain/Learning Rate": 1.8091113615024553e-06, "Full-pretrain/Loss": 1.9437448978424072, "Full-pretrain/Loss (Raw)": 1.852407693862915, "Full-pretrain/Step": 8409, "Full-pretrain/Step Time": 17.6690454762429} +{"Full-pretrain/Learning Rate": 1.8059415018316123e-06, "Full-pretrain/Loss": 1.9463328123092651, "Full-pretrain/Loss (Raw)": 1.8392444849014282, "Full-pretrain/Step": 8410, "Full-pretrain/Step Time": 17.65918301232159} +{"Full-pretrain/Learning Rate": 1.8027743175872664e-06, "Full-pretrain/Loss": 1.9403667449951172, "Full-pretrain/Loss (Raw)": 1.8582046031951904, "Full-pretrain/Step": 8411, "Full-pretrain/Step Time": 17.663147939369082} +{"Full-pretrain/Learning Rate": 1.799609809134753e-06, "Full-pretrain/Loss": 1.945281744003296, "Full-pretrain/Loss (Raw)": 2.1442768573760986, "Full-pretrain/Step": 8412, "Full-pretrain/Step Time": 17.66744109801948} +{"Full-pretrain/Learning Rate": 1.796447976839097e-06, "Full-pretrain/Loss": 1.9384914636611938, "Full-pretrain/Loss (Raw)": 1.7821251153945923, "Full-pretrain/Step": 8413, "Full-pretrain/Step Time": 17.66667602956295} +{"Full-pretrain/Learning Rate": 1.7932888210650117e-06, "Full-pretrain/Loss": 1.9488908052444458, "Full-pretrain/Loss (Raw)": 2.179021120071411, "Full-pretrain/Step": 8414, "Full-pretrain/Step Time": 17.66328932158649} +{"Full-pretrain/Learning Rate": 1.7901323421769035e-06, "Full-pretrain/Loss": 1.9460326433181763, "Full-pretrain/Loss (Raw)": 1.7732059955596924, "Full-pretrain/Step": 8415, "Full-pretrain/Step Time": 17.6695578917861} +{"Full-pretrain/Learning Rate": 1.7869785405388723e-06, "Full-pretrain/Loss": 1.9465121030807495, "Full-pretrain/Loss (Raw)": 1.7402268648147583, "Full-pretrain/Step": 8416, "Full-pretrain/Step Time": 17.670892713591456} +{"Full-pretrain/Learning Rate": 1.783827416514708e-06, "Full-pretrain/Loss": 1.939705491065979, "Full-pretrain/Loss (Raw)": 1.8944849967956543, "Full-pretrain/Step": 8417, "Full-pretrain/Step Time": 17.669589914381504} +{"Full-pretrain/Learning Rate": 1.7806789704678973e-06, "Full-pretrain/Loss": 1.9397305250167847, "Full-pretrain/Loss (Raw)": 2.013225793838501, "Full-pretrain/Step": 8418, "Full-pretrain/Step Time": 17.67505308613181} +{"Full-pretrain/Learning Rate": 1.7775332027616053e-06, "Full-pretrain/Loss": 1.9484816789627075, "Full-pretrain/Loss (Raw)": 2.0403828620910645, "Full-pretrain/Step": 8419, "Full-pretrain/Step Time": 17.682808719575405} +{"Full-pretrain/Learning Rate": 1.774390113758695e-06, "Full-pretrain/Loss": 1.9421360492706299, "Full-pretrain/Loss (Raw)": 1.8679795265197754, "Full-pretrain/Step": 8420, "Full-pretrain/Step Time": 17.68420180492103} +{"Full-pretrain/Learning Rate": 1.7712497038217258e-06, "Full-pretrain/Loss": 1.9409823417663574, "Full-pretrain/Loss (Raw)": 2.005856513977051, "Full-pretrain/Step": 8421, "Full-pretrain/Step Time": 17.68760566972196} +{"Full-pretrain/Learning Rate": 1.7681119733129414e-06, "Full-pretrain/Loss": 1.9224694967269897, "Full-pretrain/Loss (Raw)": 1.9211846590042114, "Full-pretrain/Step": 8422, "Full-pretrain/Step Time": 17.6865725684911} +{"Full-pretrain/Learning Rate": 1.7649769225942747e-06, "Full-pretrain/Loss": 1.9210891723632812, "Full-pretrain/Loss (Raw)": 2.0187625885009766, "Full-pretrain/Step": 8423, "Full-pretrain/Step Time": 17.689486695453525} +{"Full-pretrain/Learning Rate": 1.7618445520273558e-06, "Full-pretrain/Loss": 1.9255056381225586, "Full-pretrain/Loss (Raw)": 2.113931655883789, "Full-pretrain/Step": 8424, "Full-pretrain/Step Time": 17.684978015720844} +{"Full-pretrain/Learning Rate": 1.7587148619735011e-06, "Full-pretrain/Loss": 1.9161651134490967, "Full-pretrain/Loss (Raw)": 1.7897148132324219, "Full-pretrain/Step": 8425, "Full-pretrain/Step Time": 17.684903068467975} +{"Full-pretrain/Learning Rate": 1.7555878527937164e-06, "Full-pretrain/Loss": 1.9233547449111938, "Full-pretrain/Loss (Raw)": 2.1699061393737793, "Full-pretrain/Step": 8426, "Full-pretrain/Step Time": 17.686165129765868} +{"Full-pretrain/Learning Rate": 1.7524635248487048e-06, "Full-pretrain/Loss": 1.9185271263122559, "Full-pretrain/Loss (Raw)": 1.872633695602417, "Full-pretrain/Step": 8427, "Full-pretrain/Step Time": 17.688804792240262} +{"Full-pretrain/Learning Rate": 1.7493418784988586e-06, "Full-pretrain/Loss": 1.922540545463562, "Full-pretrain/Loss (Raw)": 2.1312224864959717, "Full-pretrain/Step": 8428, "Full-pretrain/Step Time": 17.686570078134537} +{"Full-pretrain/Learning Rate": 1.7462229141042562e-06, "Full-pretrain/Loss": 1.9159075021743774, "Full-pretrain/Loss (Raw)": 1.624284267425537, "Full-pretrain/Step": 8429, "Full-pretrain/Step Time": 17.68741975352168} +{"Full-pretrain/Learning Rate": 1.7431066320246658e-06, "Full-pretrain/Loss": 1.9254950284957886, "Full-pretrain/Loss (Raw)": 2.20220685005188, "Full-pretrain/Step": 8430, "Full-pretrain/Step Time": 17.6806909032166} +{"Full-pretrain/Learning Rate": 1.7399930326195523e-06, "Full-pretrain/Loss": 1.9157582521438599, "Full-pretrain/Loss (Raw)": 1.7267887592315674, "Full-pretrain/Step": 8431, "Full-pretrain/Step Time": 17.69201106391847} +{"Full-pretrain/Learning Rate": 1.7368821162480703e-06, "Full-pretrain/Loss": 1.8905640840530396, "Full-pretrain/Loss (Raw)": 1.6559752225875854, "Full-pretrain/Step": 8432, "Full-pretrain/Step Time": 17.68186871148646} +{"Full-pretrain/Learning Rate": 1.7337738832690603e-06, "Full-pretrain/Loss": 1.8944575786590576, "Full-pretrain/Loss (Raw)": 1.9404628276824951, "Full-pretrain/Step": 8433, "Full-pretrain/Step Time": 17.67976040765643} +{"Full-pretrain/Learning Rate": 1.730668334041058e-06, "Full-pretrain/Loss": 1.89591383934021, "Full-pretrain/Loss (Raw)": 2.059206485748291, "Full-pretrain/Step": 8434, "Full-pretrain/Step Time": 17.67779523693025} +{"Full-pretrain/Learning Rate": 1.7275654689222847e-06, "Full-pretrain/Loss": 1.9054937362670898, "Full-pretrain/Loss (Raw)": 2.026895523071289, "Full-pretrain/Step": 8435, "Full-pretrain/Step Time": 17.682561924681067} +{"Full-pretrain/Learning Rate": 1.7244652882706546e-06, "Full-pretrain/Loss": 1.9134304523468018, "Full-pretrain/Loss (Raw)": 2.1462764739990234, "Full-pretrain/Step": 8436, "Full-pretrain/Step Time": 17.676254577934742} +{"Full-pretrain/Learning Rate": 1.7213677924437733e-06, "Full-pretrain/Loss": 1.928480863571167, "Full-pretrain/Loss (Raw)": 2.158836841583252, "Full-pretrain/Step": 8437, "Full-pretrain/Step Time": 17.67650348134339} +{"Full-pretrain/Learning Rate": 1.7182729817989436e-06, "Full-pretrain/Loss": 1.9281206130981445, "Full-pretrain/Loss (Raw)": 1.846876859664917, "Full-pretrain/Step": 8438, "Full-pretrain/Step Time": 17.67986204661429} +{"Full-pretrain/Learning Rate": 1.7151808566931354e-06, "Full-pretrain/Loss": 1.9454472064971924, "Full-pretrain/Loss (Raw)": 2.0641298294067383, "Full-pretrain/Step": 8439, "Full-pretrain/Step Time": 17.685299076139927} +{"Full-pretrain/Learning Rate": 1.7120914174830387e-06, "Full-pretrain/Loss": 1.9512925148010254, "Full-pretrain/Loss (Raw)": 1.9814238548278809, "Full-pretrain/Step": 8440, "Full-pretrain/Step Time": 17.684399340301752} +{"Full-pretrain/Learning Rate": 1.7090046645250101e-06, "Full-pretrain/Loss": 1.9511020183563232, "Full-pretrain/Loss (Raw)": 1.8463091850280762, "Full-pretrain/Step": 8441, "Full-pretrain/Step Time": 17.681916143745184} +{"Full-pretrain/Learning Rate": 1.7059205981751065e-06, "Full-pretrain/Loss": 1.9525201320648193, "Full-pretrain/Loss (Raw)": 1.8846228122711182, "Full-pretrain/Step": 8442, "Full-pretrain/Step Time": 17.682978162541986} +{"Full-pretrain/Learning Rate": 1.7028392187890762e-06, "Full-pretrain/Loss": 1.9597032070159912, "Full-pretrain/Loss (Raw)": 2.0880627632141113, "Full-pretrain/Step": 8443, "Full-pretrain/Step Time": 17.68737106397748} +{"Full-pretrain/Learning Rate": 1.699760526722355e-06, "Full-pretrain/Loss": 1.9534258842468262, "Full-pretrain/Loss (Raw)": 1.9434031248092651, "Full-pretrain/Step": 8444, "Full-pretrain/Step Time": 17.68602478504181} +{"Full-pretrain/Learning Rate": 1.6966845223300747e-06, "Full-pretrain/Loss": 1.9518218040466309, "Full-pretrain/Loss (Raw)": 1.7307968139648438, "Full-pretrain/Step": 8445, "Full-pretrain/Step Time": 17.693710369989276} +{"Full-pretrain/Learning Rate": 1.6936112059670383e-06, "Full-pretrain/Loss": 1.9408754110336304, "Full-pretrain/Loss (Raw)": 1.8287372589111328, "Full-pretrain/Step": 8446, "Full-pretrain/Step Time": 17.688888374716043} +{"Full-pretrain/Learning Rate": 1.690540577987762e-06, "Full-pretrain/Loss": 1.9361658096313477, "Full-pretrain/Loss (Raw)": 1.6224945783615112, "Full-pretrain/Step": 8447, "Full-pretrain/Step Time": 17.69030386209488} +{"Full-pretrain/Learning Rate": 1.6874726387464347e-06, "Full-pretrain/Loss": 1.9441845417022705, "Full-pretrain/Loss (Raw)": 1.9968270063400269, "Full-pretrain/Step": 8448, "Full-pretrain/Step Time": 17.688544442877173} +{"Full-pretrain/Learning Rate": 1.684407388596948e-06, "Full-pretrain/Loss": 1.9490180015563965, "Full-pretrain/Loss (Raw)": 2.049156904220581, "Full-pretrain/Step": 8449, "Full-pretrain/Step Time": 17.68860339745879} +{"Full-pretrain/Learning Rate": 1.6813448278928807e-06, "Full-pretrain/Loss": 1.9441860914230347, "Full-pretrain/Loss (Raw)": 1.8586065769195557, "Full-pretrain/Step": 8450, "Full-pretrain/Step Time": 17.685540022328496} +{"Full-pretrain/Learning Rate": 1.678284956987486e-06, "Full-pretrain/Loss": 1.944068193435669, "Full-pretrain/Loss (Raw)": 2.0366079807281494, "Full-pretrain/Step": 8451, "Full-pretrain/Step Time": 17.689299311488867} +{"Full-pretrain/Learning Rate": 1.6752277762337288e-06, "Full-pretrain/Loss": 1.941559076309204, "Full-pretrain/Loss (Raw)": 1.7876899242401123, "Full-pretrain/Step": 8452, "Full-pretrain/Step Time": 17.684193190187216} +{"Full-pretrain/Learning Rate": 1.6721732859842466e-06, "Full-pretrain/Loss": 1.936732292175293, "Full-pretrain/Loss (Raw)": 1.8513984680175781, "Full-pretrain/Step": 8453, "Full-pretrain/Step Time": 17.685891542583704} +{"Full-pretrain/Learning Rate": 1.6691214865913851e-06, "Full-pretrain/Loss": 1.9331787824630737, "Full-pretrain/Loss (Raw)": 1.807471513748169, "Full-pretrain/Step": 8454, "Full-pretrain/Step Time": 17.683390721678734} +{"Full-pretrain/Learning Rate": 1.6660723784071575e-06, "Full-pretrain/Loss": 1.9285316467285156, "Full-pretrain/Loss (Raw)": 1.870055913925171, "Full-pretrain/Step": 8455, "Full-pretrain/Step Time": 17.68596268258989} +{"Full-pretrain/Learning Rate": 1.6630259617832794e-06, "Full-pretrain/Loss": 1.9311985969543457, "Full-pretrain/Loss (Raw)": 2.1992712020874023, "Full-pretrain/Step": 8456, "Full-pretrain/Step Time": 17.686314940452576} +{"Full-pretrain/Learning Rate": 1.6599822370711586e-06, "Full-pretrain/Loss": 1.9278978109359741, "Full-pretrain/Loss (Raw)": 1.6840943098068237, "Full-pretrain/Step": 8457, "Full-pretrain/Step Time": 17.687585776671767} +{"Full-pretrain/Learning Rate": 1.6569412046218814e-06, "Full-pretrain/Loss": 1.9215110540390015, "Full-pretrain/Loss (Raw)": 1.9655272960662842, "Full-pretrain/Step": 8458, "Full-pretrain/Step Time": 17.685427583754063} +{"Full-pretrain/Learning Rate": 1.653902864786233e-06, "Full-pretrain/Loss": 1.9190990924835205, "Full-pretrain/Loss (Raw)": 1.7954504489898682, "Full-pretrain/Step": 8459, "Full-pretrain/Step Time": 17.688167741522193} +{"Full-pretrain/Learning Rate": 1.6508672179146894e-06, "Full-pretrain/Loss": 1.9149240255355835, "Full-pretrain/Loss (Raw)": 1.9976201057434082, "Full-pretrain/Step": 8460, "Full-pretrain/Step Time": 17.687310803681612} +{"Full-pretrain/Learning Rate": 1.6478342643574008e-06, "Full-pretrain/Loss": 1.9276604652404785, "Full-pretrain/Loss (Raw)": 2.0318503379821777, "Full-pretrain/Step": 8461, "Full-pretrain/Step Time": 17.684151142835617} +{"Full-pretrain/Learning Rate": 1.644804004464226e-06, "Full-pretrain/Loss": 1.9246506690979004, "Full-pretrain/Loss (Raw)": 2.105893850326538, "Full-pretrain/Step": 8462, "Full-pretrain/Step Time": 17.683419156819582} +{"Full-pretrain/Learning Rate": 1.6417764385846996e-06, "Full-pretrain/Loss": 1.9271022081375122, "Full-pretrain/Loss (Raw)": 1.8052400350570679, "Full-pretrain/Step": 8463, "Full-pretrain/Step Time": 17.681310411542654} +{"Full-pretrain/Learning Rate": 1.638751567068053e-06, "Full-pretrain/Loss": 1.9363701343536377, "Full-pretrain/Loss (Raw)": 1.9525446891784668, "Full-pretrain/Step": 8464, "Full-pretrain/Step Time": 17.68799608759582} +{"Full-pretrain/Learning Rate": 1.6357293902632049e-06, "Full-pretrain/Loss": 1.9370834827423096, "Full-pretrain/Loss (Raw)": 1.9632959365844727, "Full-pretrain/Step": 8465, "Full-pretrain/Step Time": 17.683184193447232} +{"Full-pretrain/Learning Rate": 1.632709908518762e-06, "Full-pretrain/Loss": 1.9315922260284424, "Full-pretrain/Loss (Raw)": 1.8834843635559082, "Full-pretrain/Step": 8466, "Full-pretrain/Step Time": 17.68338335864246} +{"Full-pretrain/Learning Rate": 1.629693122183018e-06, "Full-pretrain/Loss": 1.9335479736328125, "Full-pretrain/Loss (Raw)": 2.0894811153411865, "Full-pretrain/Step": 8467, "Full-pretrain/Step Time": 17.681109502911568} +{"Full-pretrain/Learning Rate": 1.626679031603956e-06, "Full-pretrain/Loss": 1.9276930093765259, "Full-pretrain/Loss (Raw)": 1.9589139223098755, "Full-pretrain/Step": 8468, "Full-pretrain/Step Time": 17.683601493015885} +{"Full-pretrain/Learning Rate": 1.6236676371292558e-06, "Full-pretrain/Loss": 1.9199806451797485, "Full-pretrain/Loss (Raw)": 1.9120423793792725, "Full-pretrain/Step": 8469, "Full-pretrain/Step Time": 17.68723256699741} +{"Full-pretrain/Learning Rate": 1.6206589391062787e-06, "Full-pretrain/Loss": 1.9237275123596191, "Full-pretrain/Loss (Raw)": 1.9667760133743286, "Full-pretrain/Step": 8470, "Full-pretrain/Step Time": 17.684319119900465} +{"Full-pretrain/Learning Rate": 1.6176529378820832e-06, "Full-pretrain/Loss": 1.9131436347961426, "Full-pretrain/Loss (Raw)": 1.7254430055618286, "Full-pretrain/Step": 8471, "Full-pretrain/Step Time": 17.679684640839696} +{"Full-pretrain/Learning Rate": 1.6146496338033973e-06, "Full-pretrain/Loss": 1.9125056266784668, "Full-pretrain/Loss (Raw)": 1.9610121250152588, "Full-pretrain/Step": 8472, "Full-pretrain/Step Time": 17.68565265648067} +{"Full-pretrain/Learning Rate": 1.6116490272166607e-06, "Full-pretrain/Loss": 1.9133495092391968, "Full-pretrain/Loss (Raw)": 1.873311996459961, "Full-pretrain/Step": 8473, "Full-pretrain/Step Time": 17.688458604738116} +{"Full-pretrain/Learning Rate": 1.6086511184679881e-06, "Full-pretrain/Loss": 1.9161245822906494, "Full-pretrain/Loss (Raw)": 1.9734280109405518, "Full-pretrain/Step": 8474, "Full-pretrain/Step Time": 17.687557006254792} +{"Full-pretrain/Learning Rate": 1.605655907903189e-06, "Full-pretrain/Loss": 1.91827392578125, "Full-pretrain/Loss (Raw)": 2.1568377017974854, "Full-pretrain/Step": 8475, "Full-pretrain/Step Time": 17.6852770652622} +{"Full-pretrain/Learning Rate": 1.6026633958677622e-06, "Full-pretrain/Loss": 1.9199100732803345, "Full-pretrain/Loss (Raw)": 1.9957611560821533, "Full-pretrain/Step": 8476, "Full-pretrain/Step Time": 17.685375787317753} +{"Full-pretrain/Learning Rate": 1.5996735827068871e-06, "Full-pretrain/Loss": 1.9143145084381104, "Full-pretrain/Loss (Raw)": 1.5517404079437256, "Full-pretrain/Step": 8477, "Full-pretrain/Step Time": 17.6825687084347} +{"Full-pretrain/Learning Rate": 1.5966864687654403e-06, "Full-pretrain/Loss": 1.9152107238769531, "Full-pretrain/Loss (Raw)": 1.8574140071868896, "Full-pretrain/Step": 8478, "Full-pretrain/Step Time": 17.684753505513072} +{"Full-pretrain/Learning Rate": 1.5937020543879855e-06, "Full-pretrain/Loss": 1.9226182699203491, "Full-pretrain/Loss (Raw)": 1.85953688621521, "Full-pretrain/Step": 8479, "Full-pretrain/Step Time": 17.680230164900422} +{"Full-pretrain/Learning Rate": 1.590720339918772e-06, "Full-pretrain/Loss": 1.919025182723999, "Full-pretrain/Loss (Raw)": 1.8818479776382446, "Full-pretrain/Step": 8480, "Full-pretrain/Step Time": 17.68628195859492} +{"Full-pretrain/Learning Rate": 1.5877413257017415e-06, "Full-pretrain/Loss": 1.912109613418579, "Full-pretrain/Loss (Raw)": 1.8278613090515137, "Full-pretrain/Step": 8481, "Full-pretrain/Step Time": 17.686410158872604} +{"Full-pretrain/Learning Rate": 1.5847650120805247e-06, "Full-pretrain/Loss": 1.9243545532226562, "Full-pretrain/Loss (Raw)": 2.2504427433013916, "Full-pretrain/Step": 8482, "Full-pretrain/Step Time": 17.682555774226785} +{"Full-pretrain/Learning Rate": 1.5817913993984302e-06, "Full-pretrain/Loss": 1.9164924621582031, "Full-pretrain/Loss (Raw)": 1.7850229740142822, "Full-pretrain/Step": 8483, "Full-pretrain/Step Time": 17.681924233213067} +{"Full-pretrain/Learning Rate": 1.5788204879984696e-06, "Full-pretrain/Loss": 1.922357439994812, "Full-pretrain/Loss (Raw)": 1.9753673076629639, "Full-pretrain/Step": 8484, "Full-pretrain/Step Time": 17.681322816759348} +{"Full-pretrain/Learning Rate": 1.5758522782233358e-06, "Full-pretrain/Loss": 1.9177324771881104, "Full-pretrain/Loss (Raw)": 1.7033989429473877, "Full-pretrain/Step": 8485, "Full-pretrain/Step Time": 17.68556108698249} +{"Full-pretrain/Learning Rate": 1.5728867704154077e-06, "Full-pretrain/Loss": 1.9213857650756836, "Full-pretrain/Loss (Raw)": 1.9243794679641724, "Full-pretrain/Step": 8486, "Full-pretrain/Step Time": 17.685168696567416} +{"Full-pretrain/Learning Rate": 1.569923964916764e-06, "Full-pretrain/Loss": 1.9211448431015015, "Full-pretrain/Loss (Raw)": 1.8623452186584473, "Full-pretrain/Step": 8487, "Full-pretrain/Step Time": 17.683857256546617} +{"Full-pretrain/Learning Rate": 1.5669638620691513e-06, "Full-pretrain/Loss": 1.9174095392227173, "Full-pretrain/Loss (Raw)": 2.079740524291992, "Full-pretrain/Step": 8488, "Full-pretrain/Step Time": 17.6828004270792} +{"Full-pretrain/Learning Rate": 1.5640064622140265e-06, "Full-pretrain/Loss": 1.9191932678222656, "Full-pretrain/Loss (Raw)": 1.741172194480896, "Full-pretrain/Step": 8489, "Full-pretrain/Step Time": 17.68552789092064} +{"Full-pretrain/Learning Rate": 1.5610517656925172e-06, "Full-pretrain/Loss": 1.9186277389526367, "Full-pretrain/Loss (Raw)": 1.9474326372146606, "Full-pretrain/Step": 8490, "Full-pretrain/Step Time": 17.68707691319287} +{"Full-pretrain/Learning Rate": 1.5580997728454477e-06, "Full-pretrain/Loss": 1.9263381958007812, "Full-pretrain/Loss (Raw)": 2.042186737060547, "Full-pretrain/Step": 8491, "Full-pretrain/Step Time": 17.686761170625687} +{"Full-pretrain/Learning Rate": 1.5551504840133375e-06, "Full-pretrain/Loss": 1.9129493236541748, "Full-pretrain/Loss (Raw)": 1.5691721439361572, "Full-pretrain/Step": 8492, "Full-pretrain/Step Time": 17.6861084792763} +{"Full-pretrain/Learning Rate": 1.5522038995363751e-06, "Full-pretrain/Loss": 1.9063475131988525, "Full-pretrain/Loss (Raw)": 1.820591688156128, "Full-pretrain/Step": 8493, "Full-pretrain/Step Time": 17.682736188173294} +{"Full-pretrain/Learning Rate": 1.5492600197544532e-06, "Full-pretrain/Loss": 1.9070653915405273, "Full-pretrain/Loss (Raw)": 2.128870964050293, "Full-pretrain/Step": 8494, "Full-pretrain/Step Time": 17.682586390525103} +{"Full-pretrain/Learning Rate": 1.546318845007147e-06, "Full-pretrain/Loss": 1.9094923734664917, "Full-pretrain/Loss (Raw)": 1.8829002380371094, "Full-pretrain/Step": 8495, "Full-pretrain/Step Time": 17.685902090743184} +{"Full-pretrain/Learning Rate": 1.5433803756337185e-06, "Full-pretrain/Loss": 1.9166038036346436, "Full-pretrain/Loss (Raw)": 2.1801133155822754, "Full-pretrain/Step": 8496, "Full-pretrain/Step Time": 17.68445516563952} +{"Full-pretrain/Learning Rate": 1.5404446119731242e-06, "Full-pretrain/Loss": 1.9116250276565552, "Full-pretrain/Loss (Raw)": 1.8039720058441162, "Full-pretrain/Step": 8497, "Full-pretrain/Step Time": 17.683872539550066} +{"Full-pretrain/Learning Rate": 1.5375115543639962e-06, "Full-pretrain/Loss": 1.9048535823822021, "Full-pretrain/Loss (Raw)": 1.666800856590271, "Full-pretrain/Step": 8498, "Full-pretrain/Step Time": 17.685359939932823} +{"Full-pretrain/Learning Rate": 1.5345812031446667e-06, "Full-pretrain/Loss": 1.9012606143951416, "Full-pretrain/Loss (Raw)": 1.974500298500061, "Full-pretrain/Step": 8499, "Full-pretrain/Step Time": 17.687885036692023} +{"Full-pretrain/Learning Rate": 1.5316535586531483e-06, "Full-pretrain/Loss": 1.8998677730560303, "Full-pretrain/Loss (Raw)": 1.9143463373184204, "Full-pretrain/Step": 8500, "Full-pretrain/Step Time": 17.68893115967512} +{"Full-pretrain/Learning Rate": 1.5287286212271434e-06, "Full-pretrain/Loss": 1.8958594799041748, "Full-pretrain/Loss (Raw)": 1.7837777137756348, "Full-pretrain/Step": 8501, "Full-pretrain/Step Time": 17.689008181914687} +{"Full-pretrain/Learning Rate": 1.525806391204046e-06, "Full-pretrain/Loss": 1.8934110403060913, "Full-pretrain/Loss (Raw)": 1.8884258270263672, "Full-pretrain/Step": 8502, "Full-pretrain/Step Time": 17.690384078770876} +{"Full-pretrain/Learning Rate": 1.5228868689209335e-06, "Full-pretrain/Loss": 1.9073516130447388, "Full-pretrain/Loss (Raw)": 2.1715402603149414, "Full-pretrain/Step": 8503, "Full-pretrain/Step Time": 17.691804321482778} +{"Full-pretrain/Learning Rate": 1.5199700547145674e-06, "Full-pretrain/Loss": 1.9067542552947998, "Full-pretrain/Loss (Raw)": 1.9418994188308716, "Full-pretrain/Step": 8504, "Full-pretrain/Step Time": 17.690995287150145} +{"Full-pretrain/Learning Rate": 1.5170559489214032e-06, "Full-pretrain/Loss": 1.9095399379730225, "Full-pretrain/Loss (Raw)": 1.962450623512268, "Full-pretrain/Step": 8505, "Full-pretrain/Step Time": 17.697417130693793} +{"Full-pretrain/Learning Rate": 1.514144551877586e-06, "Full-pretrain/Loss": 1.9028027057647705, "Full-pretrain/Loss (Raw)": 1.7578362226486206, "Full-pretrain/Step": 8506, "Full-pretrain/Step Time": 17.701530339196324} +{"Full-pretrain/Learning Rate": 1.5112358639189388e-06, "Full-pretrain/Loss": 1.888234257698059, "Full-pretrain/Loss (Raw)": 1.6906495094299316, "Full-pretrain/Step": 8507, "Full-pretrain/Step Time": 17.70645627938211} +{"Full-pretrain/Learning Rate": 1.5083298853809852e-06, "Full-pretrain/Loss": 1.884530782699585, "Full-pretrain/Loss (Raw)": 1.8772473335266113, "Full-pretrain/Step": 8508, "Full-pretrain/Step Time": 17.704301368445158} +{"Full-pretrain/Learning Rate": 1.5054266165989177e-06, "Full-pretrain/Loss": 1.8928518295288086, "Full-pretrain/Loss (Raw)": 1.8180155754089355, "Full-pretrain/Step": 8509, "Full-pretrain/Step Time": 17.706982869654894} +{"Full-pretrain/Learning Rate": 1.5025260579076328e-06, "Full-pretrain/Loss": 1.8948237895965576, "Full-pretrain/Loss (Raw)": 1.9205173254013062, "Full-pretrain/Step": 8510, "Full-pretrain/Step Time": 17.70690480619669} +{"Full-pretrain/Learning Rate": 1.4996282096417125e-06, "Full-pretrain/Loss": 1.89960515499115, "Full-pretrain/Loss (Raw)": 2.012540578842163, "Full-pretrain/Step": 8511, "Full-pretrain/Step Time": 17.70879060216248} +{"Full-pretrain/Learning Rate": 1.4967330721354172e-06, "Full-pretrain/Loss": 1.9005705118179321, "Full-pretrain/Loss (Raw)": 1.9127380847930908, "Full-pretrain/Step": 8512, "Full-pretrain/Step Time": 17.708356050774455} +{"Full-pretrain/Learning Rate": 1.4938406457227077e-06, "Full-pretrain/Loss": 1.8988807201385498, "Full-pretrain/Loss (Raw)": 1.773785948753357, "Full-pretrain/Step": 8513, "Full-pretrain/Step Time": 17.707224952057004} +{"Full-pretrain/Learning Rate": 1.4909509307372144e-06, "Full-pretrain/Loss": 1.8936192989349365, "Full-pretrain/Loss (Raw)": 2.0820775032043457, "Full-pretrain/Step": 8514, "Full-pretrain/Step Time": 17.70587608218193} +{"Full-pretrain/Learning Rate": 1.4880639275122704e-06, "Full-pretrain/Loss": 1.9020212888717651, "Full-pretrain/Loss (Raw)": 2.053889036178589, "Full-pretrain/Step": 8515, "Full-pretrain/Step Time": 17.711615534499288} +{"Full-pretrain/Learning Rate": 1.4851796363808872e-06, "Full-pretrain/Loss": 1.896986484527588, "Full-pretrain/Loss (Raw)": 1.814253807067871, "Full-pretrain/Step": 8516, "Full-pretrain/Step Time": 17.71462757885456} +{"Full-pretrain/Learning Rate": 1.4822980576757712e-06, "Full-pretrain/Loss": 1.9068703651428223, "Full-pretrain/Loss (Raw)": 2.0196805000305176, "Full-pretrain/Step": 8517, "Full-pretrain/Step Time": 17.710188306868076} +{"Full-pretrain/Learning Rate": 1.4794191917293142e-06, "Full-pretrain/Loss": 1.8995630741119385, "Full-pretrain/Loss (Raw)": 1.6905460357666016, "Full-pretrain/Step": 8518, "Full-pretrain/Step Time": 17.703558173030615} +{"Full-pretrain/Learning Rate": 1.4765430388735817e-06, "Full-pretrain/Loss": 1.895972728729248, "Full-pretrain/Loss (Raw)": 1.7474578619003296, "Full-pretrain/Step": 8519, "Full-pretrain/Step Time": 17.703490814194083} +{"Full-pretrain/Learning Rate": 1.4736695994403444e-06, "Full-pretrain/Loss": 1.8970777988433838, "Full-pretrain/Loss (Raw)": 2.1151041984558105, "Full-pretrain/Step": 8520, "Full-pretrain/Step Time": 17.707572588697076} +{"Full-pretrain/Learning Rate": 1.4707988737610506e-06, "Full-pretrain/Loss": 1.8990178108215332, "Full-pretrain/Loss (Raw)": 1.8032490015029907, "Full-pretrain/Step": 8521, "Full-pretrain/Step Time": 17.704855423420668} +{"Full-pretrain/Learning Rate": 1.4679308621668442e-06, "Full-pretrain/Loss": 1.897782802581787, "Full-pretrain/Loss (Raw)": 1.9079118967056274, "Full-pretrain/Step": 8522, "Full-pretrain/Step Time": 17.698825204744935} +{"Full-pretrain/Learning Rate": 1.4650655649885353e-06, "Full-pretrain/Loss": 1.893958330154419, "Full-pretrain/Loss (Raw)": 1.9198050498962402, "Full-pretrain/Step": 8523, "Full-pretrain/Step Time": 17.69861694611609} +{"Full-pretrain/Learning Rate": 1.4622029825566486e-06, "Full-pretrain/Loss": 1.906649112701416, "Full-pretrain/Loss (Raw)": 1.9752819538116455, "Full-pretrain/Step": 8524, "Full-pretrain/Step Time": 17.710217878222466} +{"Full-pretrain/Learning Rate": 1.4593431152013725e-06, "Full-pretrain/Loss": 1.90756094455719, "Full-pretrain/Loss (Raw)": 1.849764108657837, "Full-pretrain/Step": 8525, "Full-pretrain/Step Time": 17.705892523750663} +{"Full-pretrain/Learning Rate": 1.4564859632525962e-06, "Full-pretrain/Loss": 1.8979827165603638, "Full-pretrain/Loss (Raw)": 1.8223694562911987, "Full-pretrain/Step": 8526, "Full-pretrain/Step Time": 17.70460009947419} +{"Full-pretrain/Learning Rate": 1.4536315270398864e-06, "Full-pretrain/Loss": 1.9032645225524902, "Full-pretrain/Loss (Raw)": 2.0519163608551025, "Full-pretrain/Step": 8527, "Full-pretrain/Step Time": 17.703084675595164} +{"Full-pretrain/Learning Rate": 1.4507798068925078e-06, "Full-pretrain/Loss": 1.8996880054473877, "Full-pretrain/Loss (Raw)": 2.0656661987304688, "Full-pretrain/Step": 8528, "Full-pretrain/Step Time": 17.705936808139086} +{"Full-pretrain/Learning Rate": 1.4479308031394078e-06, "Full-pretrain/Loss": 1.8945707082748413, "Full-pretrain/Loss (Raw)": 1.6402173042297363, "Full-pretrain/Step": 8529, "Full-pretrain/Step Time": 17.70225925371051} +{"Full-pretrain/Learning Rate": 1.4450845161092074e-06, "Full-pretrain/Loss": 1.9026002883911133, "Full-pretrain/Loss (Raw)": 1.9237492084503174, "Full-pretrain/Step": 8530, "Full-pretrain/Step Time": 17.703317860141397} +{"Full-pretrain/Learning Rate": 1.44224094613023e-06, "Full-pretrain/Loss": 1.9001158475875854, "Full-pretrain/Loss (Raw)": 1.89499831199646, "Full-pretrain/Step": 8531, "Full-pretrain/Step Time": 17.714109499007463} +{"Full-pretrain/Learning Rate": 1.4394000935304825e-06, "Full-pretrain/Loss": 1.891870141029358, "Full-pretrain/Loss (Raw)": 1.6504822969436646, "Full-pretrain/Step": 8532, "Full-pretrain/Step Time": 17.709098843857646} +{"Full-pretrain/Learning Rate": 1.4365619586376528e-06, "Full-pretrain/Loss": 1.8995423316955566, "Full-pretrain/Loss (Raw)": 2.0292880535125732, "Full-pretrain/Step": 8533, "Full-pretrain/Step Time": 17.71089380979538} +{"Full-pretrain/Learning Rate": 1.4337265417791235e-06, "Full-pretrain/Loss": 1.9123955965042114, "Full-pretrain/Loss (Raw)": 2.2997303009033203, "Full-pretrain/Step": 8534, "Full-pretrain/Step Time": 17.70655968785286} +{"Full-pretrain/Learning Rate": 1.4308938432819524e-06, "Full-pretrain/Loss": 1.9031481742858887, "Full-pretrain/Loss (Raw)": 1.8756213188171387, "Full-pretrain/Step": 8535, "Full-pretrain/Step Time": 17.70596309006214} +{"Full-pretrain/Learning Rate": 1.428063863472895e-06, "Full-pretrain/Loss": 1.9045331478118896, "Full-pretrain/Loss (Raw)": 1.9862217903137207, "Full-pretrain/Step": 8536, "Full-pretrain/Step Time": 17.705815875902772} +{"Full-pretrain/Learning Rate": 1.425236602678387e-06, "Full-pretrain/Loss": 1.9051175117492676, "Full-pretrain/Loss (Raw)": 1.9811456203460693, "Full-pretrain/Step": 8537, "Full-pretrain/Step Time": 17.702385999262333} +{"Full-pretrain/Learning Rate": 1.4224120612245566e-06, "Full-pretrain/Loss": 1.9087750911712646, "Full-pretrain/Loss (Raw)": 1.8748822212219238, "Full-pretrain/Step": 8538, "Full-pretrain/Step Time": 17.704461803659797} +{"Full-pretrain/Learning Rate": 1.4195902394372045e-06, "Full-pretrain/Loss": 1.91032874584198, "Full-pretrain/Loss (Raw)": 1.740365743637085, "Full-pretrain/Step": 8539, "Full-pretrain/Step Time": 17.704722424969077} +{"Full-pretrain/Learning Rate": 1.4167711376418313e-06, "Full-pretrain/Loss": 1.9041194915771484, "Full-pretrain/Loss (Raw)": 1.6785515546798706, "Full-pretrain/Step": 8540, "Full-pretrain/Step Time": 17.699655843898654} +{"Full-pretrain/Learning Rate": 1.4139547561636213e-06, "Full-pretrain/Loss": 1.9073021411895752, "Full-pretrain/Loss (Raw)": 1.9198582172393799, "Full-pretrain/Step": 8541, "Full-pretrain/Step Time": 17.696831058710814} +{"Full-pretrain/Learning Rate": 1.4111410953274424e-06, "Full-pretrain/Loss": 1.8941798210144043, "Full-pretrain/Loss (Raw)": 1.5006057024002075, "Full-pretrain/Step": 8542, "Full-pretrain/Step Time": 17.696159668266773} +{"Full-pretrain/Learning Rate": 1.4083301554578433e-06, "Full-pretrain/Loss": 1.881274700164795, "Full-pretrain/Loss (Raw)": 1.5995770692825317, "Full-pretrain/Step": 8543, "Full-pretrain/Step Time": 17.6926937289536} +{"Full-pretrain/Learning Rate": 1.405521936879073e-06, "Full-pretrain/Loss": 1.8862180709838867, "Full-pretrain/Loss (Raw)": 2.0709269046783447, "Full-pretrain/Step": 8544, "Full-pretrain/Step Time": 17.69294578768313} +{"Full-pretrain/Learning Rate": 1.402716439915061e-06, "Full-pretrain/Loss": 1.8914618492126465, "Full-pretrain/Loss (Raw)": 1.941585659980774, "Full-pretrain/Step": 8545, "Full-pretrain/Step Time": 17.690162427723408} +{"Full-pretrain/Learning Rate": 1.3999136648894074e-06, "Full-pretrain/Loss": 1.878747820854187, "Full-pretrain/Loss (Raw)": 1.6752278804779053, "Full-pretrain/Step": 8546, "Full-pretrain/Step Time": 17.685477098450065} +{"Full-pretrain/Learning Rate": 1.3971136121254225e-06, "Full-pretrain/Loss": 1.8764376640319824, "Full-pretrain/Loss (Raw)": 1.9799662828445435, "Full-pretrain/Step": 8547, "Full-pretrain/Step Time": 17.679288361221552} +{"Full-pretrain/Learning Rate": 1.3943162819460841e-06, "Full-pretrain/Loss": 1.876997470855713, "Full-pretrain/Loss (Raw)": 1.8321688175201416, "Full-pretrain/Step": 8548, "Full-pretrain/Step Time": 17.683269448578358} +{"Full-pretrain/Learning Rate": 1.3915216746740705e-06, "Full-pretrain/Loss": 1.8754997253417969, "Full-pretrain/Loss (Raw)": 1.97174870967865, "Full-pretrain/Step": 8549, "Full-pretrain/Step Time": 17.678648153319955} +{"Full-pretrain/Learning Rate": 1.3887297906317375e-06, "Full-pretrain/Loss": 1.8802907466888428, "Full-pretrain/Loss (Raw)": 1.8438596725463867, "Full-pretrain/Step": 8550, "Full-pretrain/Step Time": 17.67651216685772} +{"Full-pretrain/Learning Rate": 1.385940630141122e-06, "Full-pretrain/Loss": 1.8908690214157104, "Full-pretrain/Loss (Raw)": 2.08596134185791, "Full-pretrain/Step": 8551, "Full-pretrain/Step Time": 17.67604940570891} +{"Full-pretrain/Learning Rate": 1.3831541935239556e-06, "Full-pretrain/Loss": 1.8853225708007812, "Full-pretrain/Loss (Raw)": 1.9376161098480225, "Full-pretrain/Step": 8552, "Full-pretrain/Step Time": 17.677145382389426} +{"Full-pretrain/Learning Rate": 1.3803704811016532e-06, "Full-pretrain/Loss": 1.8883976936340332, "Full-pretrain/Loss (Raw)": 1.901653528213501, "Full-pretrain/Step": 8553, "Full-pretrain/Step Time": 17.677939280867577} +{"Full-pretrain/Learning Rate": 1.3775894931953165e-06, "Full-pretrain/Loss": 1.887398362159729, "Full-pretrain/Loss (Raw)": 1.875934362411499, "Full-pretrain/Step": 8554, "Full-pretrain/Step Time": 17.675207825377584} +{"Full-pretrain/Learning Rate": 1.3748112301257332e-06, "Full-pretrain/Loss": 1.8876510858535767, "Full-pretrain/Loss (Raw)": 1.927891492843628, "Full-pretrain/Step": 8555, "Full-pretrain/Step Time": 17.673540100455284} +{"Full-pretrain/Learning Rate": 1.3720356922133666e-06, "Full-pretrain/Loss": 1.8739774227142334, "Full-pretrain/Loss (Raw)": 1.5377254486083984, "Full-pretrain/Step": 8556, "Full-pretrain/Step Time": 17.677076989784837} +{"Full-pretrain/Learning Rate": 1.3692628797783852e-06, "Full-pretrain/Loss": 1.885467290878296, "Full-pretrain/Loss (Raw)": 2.217439651489258, "Full-pretrain/Step": 8557, "Full-pretrain/Step Time": 17.672539500519633} +{"Full-pretrain/Learning Rate": 1.3664927931406225e-06, "Full-pretrain/Loss": 1.880893349647522, "Full-pretrain/Loss (Raw)": 1.676001787185669, "Full-pretrain/Step": 8558, "Full-pretrain/Step Time": 17.674576507881284} +{"Full-pretrain/Learning Rate": 1.3637254326196115e-06, "Full-pretrain/Loss": 1.8767539262771606, "Full-pretrain/Loss (Raw)": 1.9194550514221191, "Full-pretrain/Step": 8559, "Full-pretrain/Step Time": 17.66705133393407} +{"Full-pretrain/Learning Rate": 1.3609607985345662e-06, "Full-pretrain/Loss": 1.8729605674743652, "Full-pretrain/Loss (Raw)": 1.9442801475524902, "Full-pretrain/Step": 8560, "Full-pretrain/Step Time": 17.669153625145555} +{"Full-pretrain/Learning Rate": 1.3581988912043847e-06, "Full-pretrain/Loss": 1.8784886598587036, "Full-pretrain/Loss (Raw)": 1.8171157836914062, "Full-pretrain/Step": 8561, "Full-pretrain/Step Time": 17.66564785502851} +{"Full-pretrain/Learning Rate": 1.3554397109476507e-06, "Full-pretrain/Loss": 1.86703360080719, "Full-pretrain/Loss (Raw)": 1.5571866035461426, "Full-pretrain/Step": 8562, "Full-pretrain/Step Time": 17.668734965845942} +{"Full-pretrain/Learning Rate": 1.3526832580826376e-06, "Full-pretrain/Loss": 1.8765811920166016, "Full-pretrain/Loss (Raw)": 2.2005233764648438, "Full-pretrain/Step": 8563, "Full-pretrain/Step Time": 17.664903704077005} +{"Full-pretrain/Learning Rate": 1.349929532927302e-06, "Full-pretrain/Loss": 1.8809494972229004, "Full-pretrain/Loss (Raw)": 1.790266513824463, "Full-pretrain/Step": 8564, "Full-pretrain/Step Time": 17.67194069735706} +{"Full-pretrain/Learning Rate": 1.3471785357992816e-06, "Full-pretrain/Loss": 1.8670196533203125, "Full-pretrain/Loss (Raw)": 1.583533525466919, "Full-pretrain/Step": 8565, "Full-pretrain/Step Time": 17.67586720176041} +{"Full-pretrain/Learning Rate": 1.3444302670159088e-06, "Full-pretrain/Loss": 1.8580539226531982, "Full-pretrain/Loss (Raw)": 2.0128250122070312, "Full-pretrain/Step": 8566, "Full-pretrain/Step Time": 17.673786899074912} +{"Full-pretrain/Learning Rate": 1.341684726894188e-06, "Full-pretrain/Loss": 1.8613338470458984, "Full-pretrain/Loss (Raw)": 1.9805843830108643, "Full-pretrain/Step": 8567, "Full-pretrain/Step Time": 17.664540447294712} +{"Full-pretrain/Learning Rate": 1.3389419157508216e-06, "Full-pretrain/Loss": 1.8575183153152466, "Full-pretrain/Loss (Raw)": 1.8641223907470703, "Full-pretrain/Step": 8568, "Full-pretrain/Step Time": 17.66255503334105} +{"Full-pretrain/Learning Rate": 1.336201833902187e-06, "Full-pretrain/Loss": 1.8547099828720093, "Full-pretrain/Loss (Raw)": 1.8912795782089233, "Full-pretrain/Step": 8569, "Full-pretrain/Step Time": 17.666325509548187} +{"Full-pretrain/Learning Rate": 1.3334644816643566e-06, "Full-pretrain/Loss": 1.856428623199463, "Full-pretrain/Loss (Raw)": 1.9298759698867798, "Full-pretrain/Step": 8570, "Full-pretrain/Step Time": 17.659444050863385} +{"Full-pretrain/Learning Rate": 1.330729859353086e-06, "Full-pretrain/Loss": 1.8552138805389404, "Full-pretrain/Loss (Raw)": 1.7014946937561035, "Full-pretrain/Step": 8571, "Full-pretrain/Step Time": 17.655012199655175} +{"Full-pretrain/Learning Rate": 1.3279979672838032e-06, "Full-pretrain/Loss": 1.8643007278442383, "Full-pretrain/Loss (Raw)": 1.969330072402954, "Full-pretrain/Step": 8572, "Full-pretrain/Step Time": 17.655989233404398} +{"Full-pretrain/Learning Rate": 1.3252688057716373e-06, "Full-pretrain/Loss": 1.8760305643081665, "Full-pretrain/Loss (Raw)": 2.2952146530151367, "Full-pretrain/Step": 8573, "Full-pretrain/Step Time": 17.653452454134822} +{"Full-pretrain/Learning Rate": 1.3225423751313942e-06, "Full-pretrain/Loss": 1.878396987915039, "Full-pretrain/Loss (Raw)": 1.5763291120529175, "Full-pretrain/Step": 8574, "Full-pretrain/Step Time": 17.654333414509892} +{"Full-pretrain/Learning Rate": 1.3198186756775672e-06, "Full-pretrain/Loss": 1.8879196643829346, "Full-pretrain/Loss (Raw)": 1.904304027557373, "Full-pretrain/Step": 8575, "Full-pretrain/Step Time": 17.644861767068505} +{"Full-pretrain/Learning Rate": 1.317097707724338e-06, "Full-pretrain/Loss": 1.880122423171997, "Full-pretrain/Loss (Raw)": 1.8214154243469238, "Full-pretrain/Step": 8576, "Full-pretrain/Step Time": 17.647179055958986} +{"Full-pretrain/Learning Rate": 1.3143794715855584e-06, "Full-pretrain/Loss": 1.8796454668045044, "Full-pretrain/Loss (Raw)": 1.9263226985931396, "Full-pretrain/Step": 8577, "Full-pretrain/Step Time": 17.654247764497995} +{"Full-pretrain/Learning Rate": 1.311663967574786e-06, "Full-pretrain/Loss": 1.8860044479370117, "Full-pretrain/Loss (Raw)": 1.8787134885787964, "Full-pretrain/Step": 8578, "Full-pretrain/Step Time": 17.649570900946856} +{"Full-pretrain/Learning Rate": 1.3089511960052508e-06, "Full-pretrain/Loss": 1.8811018466949463, "Full-pretrain/Loss (Raw)": 1.823087453842163, "Full-pretrain/Step": 8579, "Full-pretrain/Step Time": 17.648187467828393} +{"Full-pretrain/Learning Rate": 1.3062411571898692e-06, "Full-pretrain/Loss": 1.8871307373046875, "Full-pretrain/Loss (Raw)": 2.0250892639160156, "Full-pretrain/Step": 8580, "Full-pretrain/Step Time": 17.6505814678967} +{"Full-pretrain/Learning Rate": 1.303533851441241e-06, "Full-pretrain/Loss": 1.882865309715271, "Full-pretrain/Loss (Raw)": 1.835258960723877, "Full-pretrain/Step": 8581, "Full-pretrain/Step Time": 17.65174415335059} +{"Full-pretrain/Learning Rate": 1.3008292790716608e-06, "Full-pretrain/Loss": 1.8846676349639893, "Full-pretrain/Loss (Raw)": 1.9015296697616577, "Full-pretrain/Step": 8582, "Full-pretrain/Step Time": 17.65356321260333} +{"Full-pretrain/Learning Rate": 1.2981274403930933e-06, "Full-pretrain/Loss": 1.8809267282485962, "Full-pretrain/Loss (Raw)": 1.9662543535232544, "Full-pretrain/Step": 8583, "Full-pretrain/Step Time": 17.647979352623224} +{"Full-pretrain/Learning Rate": 1.2954283357171943e-06, "Full-pretrain/Loss": 1.8817217350006104, "Full-pretrain/Loss (Raw)": 1.9630576372146606, "Full-pretrain/Step": 8584, "Full-pretrain/Step Time": 17.648301294073462} +{"Full-pretrain/Learning Rate": 1.2927319653553065e-06, "Full-pretrain/Loss": 1.8826074600219727, "Full-pretrain/Loss (Raw)": 1.9300001859664917, "Full-pretrain/Step": 8585, "Full-pretrain/Step Time": 17.649654110893607} +{"Full-pretrain/Learning Rate": 1.2900383296184536e-06, "Full-pretrain/Loss": 1.8687570095062256, "Full-pretrain/Loss (Raw)": 1.432715892791748, "Full-pretrain/Step": 8586, "Full-pretrain/Step Time": 17.652787629514933} +{"Full-pretrain/Learning Rate": 1.2873474288173538e-06, "Full-pretrain/Loss": 1.8629814386367798, "Full-pretrain/Loss (Raw)": 1.7430732250213623, "Full-pretrain/Step": 8587, "Full-pretrain/Step Time": 17.651334021240473} +{"Full-pretrain/Learning Rate": 1.2846592632623889e-06, "Full-pretrain/Loss": 1.8821017742156982, "Full-pretrain/Loss (Raw)": 2.149576187133789, "Full-pretrain/Step": 8588, "Full-pretrain/Step Time": 17.653791163116693} +{"Full-pretrain/Learning Rate": 1.2819738332636443e-06, "Full-pretrain/Loss": 1.8719420433044434, "Full-pretrain/Loss (Raw)": 1.8923298120498657, "Full-pretrain/Step": 8589, "Full-pretrain/Step Time": 17.65482585132122} +{"Full-pretrain/Learning Rate": 1.2792911391308864e-06, "Full-pretrain/Loss": 1.8683347702026367, "Full-pretrain/Loss (Raw)": 1.5605642795562744, "Full-pretrain/Step": 8590, "Full-pretrain/Step Time": 17.65566067956388} +{"Full-pretrain/Learning Rate": 1.2766111811735564e-06, "Full-pretrain/Loss": 1.8676635026931763, "Full-pretrain/Loss (Raw)": 1.8979780673980713, "Full-pretrain/Step": 8591, "Full-pretrain/Step Time": 17.654613273218274} +{"Full-pretrain/Learning Rate": 1.2739339597007932e-06, "Full-pretrain/Loss": 1.8739302158355713, "Full-pretrain/Loss (Raw)": 2.1448147296905518, "Full-pretrain/Step": 8592, "Full-pretrain/Step Time": 17.648192642256618} +{"Full-pretrain/Learning Rate": 1.2712594750214052e-06, "Full-pretrain/Loss": 1.8747003078460693, "Full-pretrain/Loss (Raw)": 1.8417569398880005, "Full-pretrain/Step": 8593, "Full-pretrain/Step Time": 17.648173233494163} +{"Full-pretrain/Learning Rate": 1.2685877274438985e-06, "Full-pretrain/Loss": 1.8772568702697754, "Full-pretrain/Loss (Raw)": 1.638995885848999, "Full-pretrain/Step": 8594, "Full-pretrain/Step Time": 17.646467737853527} +{"Full-pretrain/Learning Rate": 1.2659187172764597e-06, "Full-pretrain/Loss": 1.866591453552246, "Full-pretrain/Loss (Raw)": 1.8592332601547241, "Full-pretrain/Step": 8595, "Full-pretrain/Step Time": 17.644336842000484} +{"Full-pretrain/Learning Rate": 1.263252444826954e-06, "Full-pretrain/Loss": 1.8735169172286987, "Full-pretrain/Loss (Raw)": 2.0118823051452637, "Full-pretrain/Step": 8596, "Full-pretrain/Step Time": 17.639167303219438} +{"Full-pretrain/Learning Rate": 1.2605889104029406e-06, "Full-pretrain/Loss": 1.878422737121582, "Full-pretrain/Loss (Raw)": 1.7405176162719727, "Full-pretrain/Step": 8597, "Full-pretrain/Step Time": 17.63338152691722} +{"Full-pretrain/Learning Rate": 1.2579281143116518e-06, "Full-pretrain/Loss": 1.8687368631362915, "Full-pretrain/Loss (Raw)": 1.7028776407241821, "Full-pretrain/Step": 8598, "Full-pretrain/Step Time": 17.637964798137546} +{"Full-pretrain/Learning Rate": 1.2552700568600085e-06, "Full-pretrain/Loss": 1.8513108491897583, "Full-pretrain/Loss (Raw)": 1.4229533672332764, "Full-pretrain/Step": 8599, "Full-pretrain/Step Time": 17.6396867018193} +{"Full-pretrain/Learning Rate": 1.2526147383546239e-06, "Full-pretrain/Loss": 1.8487231731414795, "Full-pretrain/Loss (Raw)": 1.7813140153884888, "Full-pretrain/Step": 8600, "Full-pretrain/Step Time": 17.63335480540991} +{"Full-pretrain/Learning Rate": 1.2499621591017807e-06, "Full-pretrain/Loss": 1.8477277755737305, "Full-pretrain/Loss (Raw)": 1.8594282865524292, "Full-pretrain/Step": 8601, "Full-pretrain/Step Time": 17.631353402510285} +{"Full-pretrain/Learning Rate": 1.2473123194074565e-06, "Full-pretrain/Loss": 1.841200828552246, "Full-pretrain/Loss (Raw)": 1.721014142036438, "Full-pretrain/Step": 8602, "Full-pretrain/Step Time": 17.633947361260653} +{"Full-pretrain/Learning Rate": 1.2446652195773123e-06, "Full-pretrain/Loss": 1.853987216949463, "Full-pretrain/Loss (Raw)": 2.1106581687927246, "Full-pretrain/Step": 8603, "Full-pretrain/Step Time": 17.63686603307724} +{"Full-pretrain/Learning Rate": 1.2420208599166844e-06, "Full-pretrain/Loss": 1.8446848392486572, "Full-pretrain/Loss (Raw)": 1.6716538667678833, "Full-pretrain/Step": 8604, "Full-pretrain/Step Time": 17.627858012914658} +{"Full-pretrain/Learning Rate": 1.2393792407306009e-06, "Full-pretrain/Loss": 1.8301904201507568, "Full-pretrain/Loss (Raw)": 1.8313963413238525, "Full-pretrain/Step": 8605, "Full-pretrain/Step Time": 17.632894724607468} +{"Full-pretrain/Learning Rate": 1.236740362323774e-06, "Full-pretrain/Loss": 1.8399684429168701, "Full-pretrain/Loss (Raw)": 1.8892250061035156, "Full-pretrain/Step": 8606, "Full-pretrain/Step Time": 17.631164556369185} +{"Full-pretrain/Learning Rate": 1.234104225000593e-06, "Full-pretrain/Loss": 1.8374414443969727, "Full-pretrain/Loss (Raw)": 1.823439359664917, "Full-pretrain/Step": 8607, "Full-pretrain/Step Time": 17.635206108912826} +{"Full-pretrain/Learning Rate": 1.2314708290651427e-06, "Full-pretrain/Loss": 1.8461906909942627, "Full-pretrain/Loss (Raw)": 2.101393938064575, "Full-pretrain/Step": 8608, "Full-pretrain/Step Time": 17.626523992046714} +{"Full-pretrain/Learning Rate": 1.228840174821172e-06, "Full-pretrain/Loss": 1.8516294956207275, "Full-pretrain/Loss (Raw)": 2.1003642082214355, "Full-pretrain/Step": 8609, "Full-pretrain/Step Time": 17.61791041865945} +{"Full-pretrain/Learning Rate": 1.2262122625721377e-06, "Full-pretrain/Loss": 1.8556066751480103, "Full-pretrain/Loss (Raw)": 2.0059802532196045, "Full-pretrain/Step": 8610, "Full-pretrain/Step Time": 17.62420977652073} +{"Full-pretrain/Learning Rate": 1.2235870926211619e-06, "Full-pretrain/Loss": 1.862142562866211, "Full-pretrain/Loss (Raw)": 2.032238006591797, "Full-pretrain/Step": 8611, "Full-pretrain/Step Time": 17.629014864563942} +{"Full-pretrain/Learning Rate": 1.22096466527106e-06, "Full-pretrain/Loss": 1.8660976886749268, "Full-pretrain/Loss (Raw)": 2.151654005050659, "Full-pretrain/Step": 8612, "Full-pretrain/Step Time": 17.625729536637664} +{"Full-pretrain/Learning Rate": 1.218344980824329e-06, "Full-pretrain/Loss": 1.8641695976257324, "Full-pretrain/Loss (Raw)": 1.7735564708709717, "Full-pretrain/Step": 8613, "Full-pretrain/Step Time": 17.62301379442215} +{"Full-pretrain/Learning Rate": 1.2157280395831473e-06, "Full-pretrain/Loss": 1.867824912071228, "Full-pretrain/Loss (Raw)": 2.0184991359710693, "Full-pretrain/Step": 8614, "Full-pretrain/Step Time": 17.623263908550143} +{"Full-pretrain/Learning Rate": 1.2131138418493754e-06, "Full-pretrain/Loss": 1.8742055892944336, "Full-pretrain/Loss (Raw)": 2.1704354286193848, "Full-pretrain/Step": 8615, "Full-pretrain/Step Time": 17.62423120997846} +{"Full-pretrain/Learning Rate": 1.2105023879245614e-06, "Full-pretrain/Loss": 1.8668444156646729, "Full-pretrain/Loss (Raw)": 1.7275036573410034, "Full-pretrain/Step": 8616, "Full-pretrain/Step Time": 17.622494254261255} +{"Full-pretrain/Learning Rate": 1.2078936781099392e-06, "Full-pretrain/Loss": 1.8546332120895386, "Full-pretrain/Loss (Raw)": 1.539239525794983, "Full-pretrain/Step": 8617, "Full-pretrain/Step Time": 17.621305422857404} +{"Full-pretrain/Learning Rate": 1.205287712706421e-06, "Full-pretrain/Loss": 1.8683973550796509, "Full-pretrain/Loss (Raw)": 1.873168706893921, "Full-pretrain/Step": 8618, "Full-pretrain/Step Time": 17.620710549876094} +{"Full-pretrain/Learning Rate": 1.2026844920146024e-06, "Full-pretrain/Loss": 1.8790256977081299, "Full-pretrain/Loss (Raw)": 2.083178997039795, "Full-pretrain/Step": 8619, "Full-pretrain/Step Time": 17.6209579911083} +{"Full-pretrain/Learning Rate": 1.2000840163347627e-06, "Full-pretrain/Loss": 1.8810510635375977, "Full-pretrain/Loss (Raw)": 2.214387893676758, "Full-pretrain/Step": 8620, "Full-pretrain/Step Time": 17.620725190266967} +{"Full-pretrain/Learning Rate": 1.19748628596687e-06, "Full-pretrain/Loss": 1.8825032711029053, "Full-pretrain/Loss (Raw)": 1.938800573348999, "Full-pretrain/Step": 8621, "Full-pretrain/Step Time": 17.62164862267673} +{"Full-pretrain/Learning Rate": 1.1948913012105712e-06, "Full-pretrain/Loss": 1.8967350721359253, "Full-pretrain/Loss (Raw)": 2.0159826278686523, "Full-pretrain/Step": 8622, "Full-pretrain/Step Time": 17.62156836874783} +{"Full-pretrain/Learning Rate": 1.1922990623651902e-06, "Full-pretrain/Loss": 1.9033896923065186, "Full-pretrain/Loss (Raw)": 2.110926628112793, "Full-pretrain/Step": 8623, "Full-pretrain/Step Time": 17.62315595522523} +{"Full-pretrain/Learning Rate": 1.1897095697297522e-06, "Full-pretrain/Loss": 1.8940716981887817, "Full-pretrain/Loss (Raw)": 1.8466355800628662, "Full-pretrain/Step": 8624, "Full-pretrain/Step Time": 17.630187455564737} +{"Full-pretrain/Learning Rate": 1.187122823602943e-06, "Full-pretrain/Loss": 1.891592264175415, "Full-pretrain/Loss (Raw)": 1.7624183893203735, "Full-pretrain/Step": 8625, "Full-pretrain/Step Time": 17.62724945694208} +{"Full-pretrain/Learning Rate": 1.1845388242831462e-06, "Full-pretrain/Loss": 1.9018110036849976, "Full-pretrain/Loss (Raw)": 1.9659943580627441, "Full-pretrain/Step": 8626, "Full-pretrain/Step Time": 17.62127973139286} +{"Full-pretrain/Learning Rate": 1.181957572068429e-06, "Full-pretrain/Loss": 1.901465654373169, "Full-pretrain/Loss (Raw)": 1.8481817245483398, "Full-pretrain/Step": 8627, "Full-pretrain/Step Time": 17.625663205981255} +{"Full-pretrain/Learning Rate": 1.1793790672565335e-06, "Full-pretrain/Loss": 1.8965590000152588, "Full-pretrain/Loss (Raw)": 1.8548691272735596, "Full-pretrain/Step": 8628, "Full-pretrain/Step Time": 17.625977033749223} +{"Full-pretrain/Learning Rate": 1.176803310144897e-06, "Full-pretrain/Loss": 1.8983874320983887, "Full-pretrain/Loss (Raw)": 1.7990251779556274, "Full-pretrain/Step": 8629, "Full-pretrain/Step Time": 17.62678474932909} +{"Full-pretrain/Learning Rate": 1.1742303010306211e-06, "Full-pretrain/Loss": 1.898549199104309, "Full-pretrain/Loss (Raw)": 1.708057165145874, "Full-pretrain/Step": 8630, "Full-pretrain/Step Time": 17.62271667830646} +{"Full-pretrain/Learning Rate": 1.1716600402105093e-06, "Full-pretrain/Loss": 1.9142045974731445, "Full-pretrain/Loss (Raw)": 1.9239248037338257, "Full-pretrain/Step": 8631, "Full-pretrain/Step Time": 17.624798499047756} +{"Full-pretrain/Learning Rate": 1.1690925279810362e-06, "Full-pretrain/Loss": 1.9230897426605225, "Full-pretrain/Loss (Raw)": 2.0656380653381348, "Full-pretrain/Step": 8632, "Full-pretrain/Step Time": 17.625688817352057} +{"Full-pretrain/Learning Rate": 1.1665277646383671e-06, "Full-pretrain/Loss": 1.9243501424789429, "Full-pretrain/Loss (Raw)": 1.8997619152069092, "Full-pretrain/Step": 8633, "Full-pretrain/Step Time": 17.624363424256444} +{"Full-pretrain/Learning Rate": 1.1639657504783462e-06, "Full-pretrain/Loss": 1.927628517150879, "Full-pretrain/Loss (Raw)": 1.8259214162826538, "Full-pretrain/Step": 8634, "Full-pretrain/Step Time": 17.61841611377895} +{"Full-pretrain/Learning Rate": 1.1614064857964985e-06, "Full-pretrain/Loss": 1.9227304458618164, "Full-pretrain/Loss (Raw)": 1.9539190530776978, "Full-pretrain/Step": 8635, "Full-pretrain/Step Time": 17.61896389722824} +{"Full-pretrain/Learning Rate": 1.158849970888032e-06, "Full-pretrain/Loss": 1.916837453842163, "Full-pretrain/Loss (Raw)": 1.4830830097198486, "Full-pretrain/Step": 8636, "Full-pretrain/Step Time": 17.617645865306258} +{"Full-pretrain/Learning Rate": 1.1562962060478439e-06, "Full-pretrain/Loss": 1.9351940155029297, "Full-pretrain/Loss (Raw)": 2.418801784515381, "Full-pretrain/Step": 8637, "Full-pretrain/Step Time": 17.617732293903828} +{"Full-pretrain/Learning Rate": 1.15374519157051e-06, "Full-pretrain/Loss": 1.9398136138916016, "Full-pretrain/Loss (Raw)": 2.037050724029541, "Full-pretrain/Step": 8638, "Full-pretrain/Step Time": 17.61300741508603} +{"Full-pretrain/Learning Rate": 1.151196927750292e-06, "Full-pretrain/Loss": 1.9417390823364258, "Full-pretrain/Loss (Raw)": 1.8850560188293457, "Full-pretrain/Step": 8639, "Full-pretrain/Step Time": 17.616559272632003} +{"Full-pretrain/Learning Rate": 1.1486514148811216e-06, "Full-pretrain/Loss": 1.9346617460250854, "Full-pretrain/Loss (Raw)": 1.8749208450317383, "Full-pretrain/Step": 8640, "Full-pretrain/Step Time": 17.61972433514893} +{"Full-pretrain/Learning Rate": 1.1461086532566335e-06, "Full-pretrain/Loss": 1.9190198183059692, "Full-pretrain/Loss (Raw)": 1.5998218059539795, "Full-pretrain/Step": 8641, "Full-pretrain/Step Time": 17.621122382581234} +{"Full-pretrain/Learning Rate": 1.143568643170126e-06, "Full-pretrain/Loss": 1.9141517877578735, "Full-pretrain/Loss (Raw)": 1.8502013683319092, "Full-pretrain/Step": 8642, "Full-pretrain/Step Time": 17.6240314822644} +{"Full-pretrain/Learning Rate": 1.1410313849145926e-06, "Full-pretrain/Loss": 1.9163997173309326, "Full-pretrain/Loss (Raw)": 2.1041746139526367, "Full-pretrain/Step": 8643, "Full-pretrain/Step Time": 17.622627845034003} +{"Full-pretrain/Learning Rate": 1.1384968787827022e-06, "Full-pretrain/Loss": 1.9083116054534912, "Full-pretrain/Loss (Raw)": 1.892834186553955, "Full-pretrain/Step": 8644, "Full-pretrain/Step Time": 17.619607465341687} +{"Full-pretrain/Learning Rate": 1.135965125066818e-06, "Full-pretrain/Loss": 1.9194858074188232, "Full-pretrain/Loss (Raw)": 2.131131410598755, "Full-pretrain/Step": 8645, "Full-pretrain/Step Time": 17.623607575893402} +{"Full-pretrain/Learning Rate": 1.1334361240589647e-06, "Full-pretrain/Loss": 1.9168744087219238, "Full-pretrain/Loss (Raw)": 1.9349347352981567, "Full-pretrain/Step": 8646, "Full-pretrain/Step Time": 17.636327363550663} +{"Full-pretrain/Learning Rate": 1.1309098760508646e-06, "Full-pretrain/Loss": 1.9197804927825928, "Full-pretrain/Loss (Raw)": 2.2634294033050537, "Full-pretrain/Step": 8647, "Full-pretrain/Step Time": 17.631798001006246} +{"Full-pretrain/Learning Rate": 1.1283863813339263e-06, "Full-pretrain/Loss": 1.9241058826446533, "Full-pretrain/Loss (Raw)": 1.865914225578308, "Full-pretrain/Step": 8648, "Full-pretrain/Step Time": 17.63183349557221} +{"Full-pretrain/Learning Rate": 1.1258656401992278e-06, "Full-pretrain/Loss": 1.9369924068450928, "Full-pretrain/Loss (Raw)": 1.9516109228134155, "Full-pretrain/Step": 8649, "Full-pretrain/Step Time": 17.632568132132292} +{"Full-pretrain/Learning Rate": 1.1233476529375426e-06, "Full-pretrain/Loss": 1.942620038986206, "Full-pretrain/Loss (Raw)": 2.053255081176758, "Full-pretrain/Step": 8650, "Full-pretrain/Step Time": 17.635864816606045} +{"Full-pretrain/Learning Rate": 1.12083241983931e-06, "Full-pretrain/Loss": 1.9306831359863281, "Full-pretrain/Loss (Raw)": 1.7011942863464355, "Full-pretrain/Step": 8651, "Full-pretrain/Step Time": 17.63599115423858} +{"Full-pretrain/Learning Rate": 1.1183199411946649e-06, "Full-pretrain/Loss": 1.9252160787582397, "Full-pretrain/Loss (Raw)": 2.0394437313079834, "Full-pretrain/Step": 8652, "Full-pretrain/Step Time": 17.627601535990834} +{"Full-pretrain/Learning Rate": 1.1158102172934254e-06, "Full-pretrain/Loss": 1.9304773807525635, "Full-pretrain/Loss (Raw)": 2.1071605682373047, "Full-pretrain/Step": 8653, "Full-pretrain/Step Time": 17.633878502994776} +{"Full-pretrain/Learning Rate": 1.1133032484250821e-06, "Full-pretrain/Loss": 1.9175692796707153, "Full-pretrain/Loss (Raw)": 1.6029233932495117, "Full-pretrain/Step": 8654, "Full-pretrain/Step Time": 17.634091839194298} +{"Full-pretrain/Learning Rate": 1.1107990348788178e-06, "Full-pretrain/Loss": 1.917548418045044, "Full-pretrain/Loss (Raw)": 2.1102609634399414, "Full-pretrain/Step": 8655, "Full-pretrain/Step Time": 17.6376243121922} +{"Full-pretrain/Learning Rate": 1.1082975769434845e-06, "Full-pretrain/Loss": 1.929109811782837, "Full-pretrain/Loss (Raw)": 2.2165956497192383, "Full-pretrain/Step": 8656, "Full-pretrain/Step Time": 17.629604252055287} +{"Full-pretrain/Learning Rate": 1.1057988749076348e-06, "Full-pretrain/Loss": 1.9271960258483887, "Full-pretrain/Loss (Raw)": 1.701182246208191, "Full-pretrain/Step": 8657, "Full-pretrain/Step Time": 17.636595584452152} +{"Full-pretrain/Learning Rate": 1.1033029290594855e-06, "Full-pretrain/Loss": 1.919524073600769, "Full-pretrain/Loss (Raw)": 1.7204875946044922, "Full-pretrain/Step": 8658, "Full-pretrain/Step Time": 17.63913999311626} +{"Full-pretrain/Learning Rate": 1.100809739686945e-06, "Full-pretrain/Loss": 1.9225959777832031, "Full-pretrain/Loss (Raw)": 1.9464856386184692, "Full-pretrain/Step": 8659, "Full-pretrain/Step Time": 17.632174687460065} +{"Full-pretrain/Learning Rate": 1.0983193070776053e-06, "Full-pretrain/Loss": 1.9221093654632568, "Full-pretrain/Loss (Raw)": 1.8392950296401978, "Full-pretrain/Step": 8660, "Full-pretrain/Step Time": 17.63338352367282} +{"Full-pretrain/Learning Rate": 1.095831631518729e-06, "Full-pretrain/Loss": 1.923140048980713, "Full-pretrain/Loss (Raw)": 1.8320107460021973, "Full-pretrain/Step": 8661, "Full-pretrain/Step Time": 17.635552514344454} +{"Full-pretrain/Learning Rate": 1.0933467132972746e-06, "Full-pretrain/Loss": 1.9289110898971558, "Full-pretrain/Loss (Raw)": 1.8927278518676758, "Full-pretrain/Step": 8662, "Full-pretrain/Step Time": 17.63616793975234} +{"Full-pretrain/Learning Rate": 1.0908645526998745e-06, "Full-pretrain/Loss": 1.9278450012207031, "Full-pretrain/Loss (Raw)": 1.88981294631958, "Full-pretrain/Step": 8663, "Full-pretrain/Step Time": 17.63468312472105} +{"Full-pretrain/Learning Rate": 1.0883851500128494e-06, "Full-pretrain/Loss": 1.9280182123184204, "Full-pretrain/Loss (Raw)": 2.0711803436279297, "Full-pretrain/Step": 8664, "Full-pretrain/Step Time": 17.639303650707006} +{"Full-pretrain/Learning Rate": 1.0859085055221902e-06, "Full-pretrain/Loss": 1.924543857574463, "Full-pretrain/Loss (Raw)": 1.7885831594467163, "Full-pretrain/Step": 8665, "Full-pretrain/Step Time": 17.6410256549716} +{"Full-pretrain/Learning Rate": 1.0834346195135874e-06, "Full-pretrain/Loss": 1.9243026971817017, "Full-pretrain/Loss (Raw)": 1.818202257156372, "Full-pretrain/Step": 8666, "Full-pretrain/Step Time": 17.639847928658128} +{"Full-pretrain/Learning Rate": 1.080963492272391e-06, "Full-pretrain/Loss": 1.9225986003875732, "Full-pretrain/Loss (Raw)": 1.8993864059448242, "Full-pretrain/Step": 8667, "Full-pretrain/Step Time": 17.639425767585635} +{"Full-pretrain/Learning Rate": 1.0784951240836505e-06, "Full-pretrain/Loss": 1.925346851348877, "Full-pretrain/Loss (Raw)": 1.571030855178833, "Full-pretrain/Step": 8668, "Full-pretrain/Step Time": 17.64257686212659} +{"Full-pretrain/Learning Rate": 1.076029515232091e-06, "Full-pretrain/Loss": 1.9116907119750977, "Full-pretrain/Loss (Raw)": 1.9818028211593628, "Full-pretrain/Step": 8669, "Full-pretrain/Step Time": 17.642751233652234} +{"Full-pretrain/Learning Rate": 1.0735666660021182e-06, "Full-pretrain/Loss": 1.8945097923278809, "Full-pretrain/Loss (Raw)": 1.487264633178711, "Full-pretrain/Step": 8670, "Full-pretrain/Step Time": 17.641958449035883} +{"Full-pretrain/Learning Rate": 1.0711065766778272e-06, "Full-pretrain/Loss": 1.8943215608596802, "Full-pretrain/Loss (Raw)": 1.8790309429168701, "Full-pretrain/Step": 8671, "Full-pretrain/Step Time": 17.64163661748171} +{"Full-pretrain/Learning Rate": 1.06864924754298e-06, "Full-pretrain/Loss": 1.8942087888717651, "Full-pretrain/Loss (Raw)": 1.871313452720642, "Full-pretrain/Step": 8672, "Full-pretrain/Step Time": 17.645253805443645} +{"Full-pretrain/Learning Rate": 1.0661946788810301e-06, "Full-pretrain/Loss": 1.8981932401657104, "Full-pretrain/Loss (Raw)": 1.7273231744766235, "Full-pretrain/Step": 8673, "Full-pretrain/Step Time": 17.64595367014408} +{"Full-pretrain/Learning Rate": 1.0637428709751178e-06, "Full-pretrain/Loss": 1.8998849391937256, "Full-pretrain/Loss (Raw)": 1.9043375253677368, "Full-pretrain/Step": 8674, "Full-pretrain/Step Time": 17.649723332375288} +{"Full-pretrain/Learning Rate": 1.0612938241080506e-06, "Full-pretrain/Loss": 1.897566795349121, "Full-pretrain/Loss (Raw)": 2.0299935340881348, "Full-pretrain/Step": 8675, "Full-pretrain/Step Time": 17.65122831054032} +{"Full-pretrain/Learning Rate": 1.0588475385623297e-06, "Full-pretrain/Loss": 1.8932820558547974, "Full-pretrain/Loss (Raw)": 1.7557220458984375, "Full-pretrain/Step": 8676, "Full-pretrain/Step Time": 17.650235017761588} +{"Full-pretrain/Learning Rate": 1.0564040146201299e-06, "Full-pretrain/Loss": 1.887446403503418, "Full-pretrain/Loss (Raw)": 1.9443899393081665, "Full-pretrain/Step": 8677, "Full-pretrain/Step Time": 17.65370993129909} +{"Full-pretrain/Learning Rate": 1.0539632525633113e-06, "Full-pretrain/Loss": 1.8893418312072754, "Full-pretrain/Loss (Raw)": 1.995589017868042, "Full-pretrain/Step": 8678, "Full-pretrain/Step Time": 17.655675522983074} +{"Full-pretrain/Learning Rate": 1.0515252526734186e-06, "Full-pretrain/Loss": 1.8738152980804443, "Full-pretrain/Loss (Raw)": 1.7665780782699585, "Full-pretrain/Step": 8679, "Full-pretrain/Step Time": 17.657461654394865} +{"Full-pretrain/Learning Rate": 1.0490900152316713e-06, "Full-pretrain/Loss": 1.8932266235351562, "Full-pretrain/Loss (Raw)": 2.4870786666870117, "Full-pretrain/Step": 8680, "Full-pretrain/Step Time": 17.661609649658203} +{"Full-pretrain/Learning Rate": 1.046657540518975e-06, "Full-pretrain/Loss": 1.891836404800415, "Full-pretrain/Loss (Raw)": 1.9071260690689087, "Full-pretrain/Step": 8681, "Full-pretrain/Step Time": 17.653429908677936} +{"Full-pretrain/Learning Rate": 1.0442278288159136e-06, "Full-pretrain/Loss": 1.885406494140625, "Full-pretrain/Loss (Raw)": 1.8474981784820557, "Full-pretrain/Step": 8682, "Full-pretrain/Step Time": 17.65636958926916} +{"Full-pretrain/Learning Rate": 1.041800880402749e-06, "Full-pretrain/Loss": 1.8881909847259521, "Full-pretrain/Loss (Raw)": 1.7902922630310059, "Full-pretrain/Step": 8683, "Full-pretrain/Step Time": 17.65755874849856} +{"Full-pretrain/Learning Rate": 1.0393766955594382e-06, "Full-pretrain/Loss": 1.8787739276885986, "Full-pretrain/Loss (Raw)": 1.7381033897399902, "Full-pretrain/Step": 8684, "Full-pretrain/Step Time": 17.661579051986337} +{"Full-pretrain/Learning Rate": 1.0369552745656013e-06, "Full-pretrain/Loss": 1.8749659061431885, "Full-pretrain/Loss (Raw)": 1.9853031635284424, "Full-pretrain/Step": 8685, "Full-pretrain/Step Time": 17.660874370485544} +{"Full-pretrain/Learning Rate": 1.0345366177005544e-06, "Full-pretrain/Loss": 1.8964710235595703, "Full-pretrain/Loss (Raw)": 2.2910876274108887, "Full-pretrain/Step": 8686, "Full-pretrain/Step Time": 17.66151331551373} +{"Full-pretrain/Learning Rate": 1.0321207252432907e-06, "Full-pretrain/Loss": 1.8927907943725586, "Full-pretrain/Loss (Raw)": 1.9924921989440918, "Full-pretrain/Step": 8687, "Full-pretrain/Step Time": 17.66271948069334} +{"Full-pretrain/Learning Rate": 1.0297075974724735e-06, "Full-pretrain/Loss": 1.896090030670166, "Full-pretrain/Loss (Raw)": 2.3221704959869385, "Full-pretrain/Step": 8688, "Full-pretrain/Step Time": 17.669015049934387} +{"Full-pretrain/Learning Rate": 1.0272972346664606e-06, "Full-pretrain/Loss": 1.9035978317260742, "Full-pretrain/Loss (Raw)": 1.9414339065551758, "Full-pretrain/Step": 8689, "Full-pretrain/Step Time": 17.666483283042908} +{"Full-pretrain/Learning Rate": 1.0248896371032907e-06, "Full-pretrain/Loss": 1.8993310928344727, "Full-pretrain/Loss (Raw)": 1.5839519500732422, "Full-pretrain/Step": 8690, "Full-pretrain/Step Time": 17.66469194740057} +{"Full-pretrain/Learning Rate": 1.022484805060675e-06, "Full-pretrain/Loss": 1.8976237773895264, "Full-pretrain/Loss (Raw)": 1.8918471336364746, "Full-pretrain/Step": 8691, "Full-pretrain/Step Time": 17.66347101330757} +{"Full-pretrain/Learning Rate": 1.020082738816011e-06, "Full-pretrain/Loss": 1.899276852607727, "Full-pretrain/Loss (Raw)": 1.8921961784362793, "Full-pretrain/Step": 8692, "Full-pretrain/Step Time": 17.665457332506776} +{"Full-pretrain/Learning Rate": 1.0176834386463745e-06, "Full-pretrain/Loss": 1.9045028686523438, "Full-pretrain/Loss (Raw)": 1.999241828918457, "Full-pretrain/Step": 8693, "Full-pretrain/Step Time": 17.66607723198831} +{"Full-pretrain/Learning Rate": 1.0152869048285246e-06, "Full-pretrain/Loss": 1.9055447578430176, "Full-pretrain/Loss (Raw)": 1.92606782913208, "Full-pretrain/Step": 8694, "Full-pretrain/Step Time": 17.662918427959085} +{"Full-pretrain/Learning Rate": 1.0128931376389011e-06, "Full-pretrain/Loss": 1.9010980129241943, "Full-pretrain/Loss (Raw)": 1.7475156784057617, "Full-pretrain/Step": 8695, "Full-pretrain/Step Time": 17.661259852349758} +{"Full-pretrain/Learning Rate": 1.010502137353625e-06, "Full-pretrain/Loss": 1.8931877613067627, "Full-pretrain/Loss (Raw)": 1.8180562257766724, "Full-pretrain/Step": 8696, "Full-pretrain/Step Time": 17.66397670842707} +{"Full-pretrain/Learning Rate": 1.0081139042485006e-06, "Full-pretrain/Loss": 1.8784840106964111, "Full-pretrain/Loss (Raw)": 1.318060278892517, "Full-pretrain/Step": 8697, "Full-pretrain/Step Time": 17.665087012574077} +{"Full-pretrain/Learning Rate": 1.0057284385990018e-06, "Full-pretrain/Loss": 1.8904935121536255, "Full-pretrain/Loss (Raw)": 2.2025070190429688, "Full-pretrain/Step": 8698, "Full-pretrain/Step Time": 17.66764833033085} +{"Full-pretrain/Learning Rate": 1.0033457406802948e-06, "Full-pretrain/Loss": 1.901052474975586, "Full-pretrain/Loss (Raw)": 2.2372727394104004, "Full-pretrain/Step": 8699, "Full-pretrain/Step Time": 17.66052539087832} +{"Full-pretrain/Learning Rate": 1.0009658107672237e-06, "Full-pretrain/Loss": 1.9265427589416504, "Full-pretrain/Loss (Raw)": 2.3867228031158447, "Full-pretrain/Step": 8700, "Full-pretrain/Step Time": 17.660743994638324} +{"Full-pretrain/Learning Rate": 9.985886491343132e-07, "Full-pretrain/Loss": 1.9219861030578613, "Full-pretrain/Loss (Raw)": 1.8359864950180054, "Full-pretrain/Step": 8701, "Full-pretrain/Step Time": 17.670387042686343} +{"Full-pretrain/Learning Rate": 9.962142560557692e-07, "Full-pretrain/Loss": 1.9413912296295166, "Full-pretrain/Loss (Raw)": 2.1082284450531006, "Full-pretrain/Step": 8702, "Full-pretrain/Step Time": 17.66448674723506} +{"Full-pretrain/Learning Rate": 9.93842631805475e-07, "Full-pretrain/Loss": 1.943657398223877, "Full-pretrain/Loss (Raw)": 1.9515491724014282, "Full-pretrain/Step": 8703, "Full-pretrain/Step Time": 17.668856697157025} +{"Full-pretrain/Learning Rate": 9.914737766569953e-07, "Full-pretrain/Loss": 1.9470798969268799, "Full-pretrain/Loss (Raw)": 1.9808318614959717, "Full-pretrain/Step": 8704, "Full-pretrain/Step Time": 17.664447268471122} +{"Full-pretrain/Learning Rate": 9.891076908835783e-07, "Full-pretrain/Loss": 1.950007677078247, "Full-pretrain/Loss (Raw)": 1.8210158348083496, "Full-pretrain/Step": 8705, "Full-pretrain/Step Time": 17.667766842991114} +{"Full-pretrain/Learning Rate": 9.867443747581555e-07, "Full-pretrain/Loss": 1.9550387859344482, "Full-pretrain/Loss (Raw)": 2.0653343200683594, "Full-pretrain/Step": 8706, "Full-pretrain/Step Time": 17.668248668313026} +{"Full-pretrain/Learning Rate": 9.843838285533258e-07, "Full-pretrain/Loss": 1.9504814147949219, "Full-pretrain/Loss (Raw)": 1.8841561079025269, "Full-pretrain/Step": 8707, "Full-pretrain/Step Time": 17.668545324355364} +{"Full-pretrain/Learning Rate": 9.820260525413849e-07, "Full-pretrain/Loss": 1.9330084323883057, "Full-pretrain/Loss (Raw)": 1.1965842247009277, "Full-pretrain/Step": 8708, "Full-pretrain/Step Time": 17.66475798562169} +{"Full-pretrain/Learning Rate": 9.79671046994296e-07, "Full-pretrain/Loss": 1.934493064880371, "Full-pretrain/Loss (Raw)": 1.9919016361236572, "Full-pretrain/Step": 8709, "Full-pretrain/Step Time": 17.67053539864719} +{"Full-pretrain/Learning Rate": 9.773188121837085e-07, "Full-pretrain/Loss": 1.9274468421936035, "Full-pretrain/Loss (Raw)": 1.7701054811477661, "Full-pretrain/Step": 8710, "Full-pretrain/Step Time": 17.667127408087254} +{"Full-pretrain/Learning Rate": 9.749693483809552e-07, "Full-pretrain/Loss": 1.9329509735107422, "Full-pretrain/Loss (Raw)": 1.942711591720581, "Full-pretrain/Step": 8711, "Full-pretrain/Step Time": 17.666008537635207} +{"Full-pretrain/Learning Rate": 9.726226558570444e-07, "Full-pretrain/Loss": 1.9236935377120972, "Full-pretrain/Loss (Raw)": 2.1908414363861084, "Full-pretrain/Step": 8712, "Full-pretrain/Step Time": 17.66281888447702} +{"Full-pretrain/Learning Rate": 9.702787348826708e-07, "Full-pretrain/Loss": 1.9406700134277344, "Full-pretrain/Loss (Raw)": 2.450376272201538, "Full-pretrain/Step": 8713, "Full-pretrain/Step Time": 17.663543386384845} +{"Full-pretrain/Learning Rate": 9.679375857281959e-07, "Full-pretrain/Loss": 1.943188190460205, "Full-pretrain/Loss (Raw)": 1.9280743598937988, "Full-pretrain/Step": 8714, "Full-pretrain/Step Time": 17.66102435439825} +{"Full-pretrain/Learning Rate": 9.655992086636755e-07, "Full-pretrain/Loss": 1.9415998458862305, "Full-pretrain/Loss (Raw)": 1.7394652366638184, "Full-pretrain/Step": 8715, "Full-pretrain/Step Time": 17.655132533982396} +{"Full-pretrain/Learning Rate": 9.63263603958839e-07, "Full-pretrain/Loss": 1.9467296600341797, "Full-pretrain/Loss (Raw)": 1.902259349822998, "Full-pretrain/Step": 8716, "Full-pretrain/Step Time": 17.651062352582812} +{"Full-pretrain/Learning Rate": 9.609307718831006e-07, "Full-pretrain/Loss": 1.9480421543121338, "Full-pretrain/Loss (Raw)": 2.0273027420043945, "Full-pretrain/Step": 8717, "Full-pretrain/Step Time": 17.651746451854706} +{"Full-pretrain/Learning Rate": 9.586007127055512e-07, "Full-pretrain/Loss": 1.933351755142212, "Full-pretrain/Loss (Raw)": 1.8209933042526245, "Full-pretrain/Step": 8718, "Full-pretrain/Step Time": 17.656038638204336} +{"Full-pretrain/Learning Rate": 9.562734266949592e-07, "Full-pretrain/Loss": 1.9230372905731201, "Full-pretrain/Loss (Raw)": 1.6624276638031006, "Full-pretrain/Step": 8719, "Full-pretrain/Step Time": 17.65566297248006} +{"Full-pretrain/Learning Rate": 9.53948914119776e-07, "Full-pretrain/Loss": 1.8986496925354004, "Full-pretrain/Loss (Raw)": 1.54176926612854, "Full-pretrain/Step": 8720, "Full-pretrain/Step Time": 17.657896392047405} +{"Full-pretrain/Learning Rate": 9.516271752481376e-07, "Full-pretrain/Loss": 1.8992154598236084, "Full-pretrain/Loss (Raw)": 1.9595401287078857, "Full-pretrain/Step": 8721, "Full-pretrain/Step Time": 17.65972540155053} +{"Full-pretrain/Learning Rate": 9.493082103478517e-07, "Full-pretrain/Loss": 1.9063084125518799, "Full-pretrain/Loss (Raw)": 1.810927152633667, "Full-pretrain/Step": 8722, "Full-pretrain/Step Time": 17.65807688049972} +{"Full-pretrain/Learning Rate": 9.469920196864158e-07, "Full-pretrain/Loss": 1.9050796031951904, "Full-pretrain/Loss (Raw)": 1.8525211811065674, "Full-pretrain/Step": 8723, "Full-pretrain/Step Time": 17.652183251455426} +{"Full-pretrain/Learning Rate": 9.446786035309934e-07, "Full-pretrain/Loss": 1.900132179260254, "Full-pretrain/Loss (Raw)": 1.7338848114013672, "Full-pretrain/Step": 8724, "Full-pretrain/Step Time": 17.653684487566352} +{"Full-pretrain/Learning Rate": 9.423679621484438e-07, "Full-pretrain/Loss": 1.8999652862548828, "Full-pretrain/Loss (Raw)": 1.9938991069793701, "Full-pretrain/Step": 8725, "Full-pretrain/Step Time": 17.65745110064745} +{"Full-pretrain/Learning Rate": 9.400600958052924e-07, "Full-pretrain/Loss": 1.8967642784118652, "Full-pretrain/Loss (Raw)": 1.8236377239227295, "Full-pretrain/Step": 8726, "Full-pretrain/Step Time": 17.656858026981354} +{"Full-pretrain/Learning Rate": 9.377550047677541e-07, "Full-pretrain/Loss": 1.9075725078582764, "Full-pretrain/Loss (Raw)": 2.0933730602264404, "Full-pretrain/Step": 8727, "Full-pretrain/Step Time": 17.647313253954053} +{"Full-pretrain/Learning Rate": 9.354526893017191e-07, "Full-pretrain/Loss": 1.9068331718444824, "Full-pretrain/Loss (Raw)": 1.7944024801254272, "Full-pretrain/Step": 8728, "Full-pretrain/Step Time": 17.650690507143736} +{"Full-pretrain/Learning Rate": 9.331531496727635e-07, "Full-pretrain/Loss": 1.9198861122131348, "Full-pretrain/Loss (Raw)": 1.7357546091079712, "Full-pretrain/Step": 8729, "Full-pretrain/Step Time": 17.65249107964337} +{"Full-pretrain/Learning Rate": 9.308563861461311e-07, "Full-pretrain/Loss": 1.9080418348312378, "Full-pretrain/Loss (Raw)": 1.8234893083572388, "Full-pretrain/Step": 8730, "Full-pretrain/Step Time": 17.646646983921528} +{"Full-pretrain/Learning Rate": 9.285623989867543e-07, "Full-pretrain/Loss": 1.8883559703826904, "Full-pretrain/Loss (Raw)": 1.60732102394104, "Full-pretrain/Step": 8731, "Full-pretrain/Step Time": 17.645471528172493} +{"Full-pretrain/Learning Rate": 9.262711884592462e-07, "Full-pretrain/Loss": 1.871586561203003, "Full-pretrain/Loss (Raw)": 1.8501050472259521, "Full-pretrain/Step": 8732, "Full-pretrain/Step Time": 17.647263577207923} +{"Full-pretrain/Learning Rate": 9.239827548278985e-07, "Full-pretrain/Loss": 1.8690292835235596, "Full-pretrain/Loss (Raw)": 1.754152536392212, "Full-pretrain/Step": 8733, "Full-pretrain/Step Time": 17.64404588751495} +{"Full-pretrain/Learning Rate": 9.216970983566802e-07, "Full-pretrain/Loss": 1.8571531772613525, "Full-pretrain/Loss (Raw)": 1.728191614151001, "Full-pretrain/Step": 8734, "Full-pretrain/Step Time": 17.648032562807202} +{"Full-pretrain/Learning Rate": 9.194142193092392e-07, "Full-pretrain/Loss": 1.8490214347839355, "Full-pretrain/Loss (Raw)": 1.6913341283798218, "Full-pretrain/Step": 8735, "Full-pretrain/Step Time": 17.645618768408895} +{"Full-pretrain/Learning Rate": 9.171341179489034e-07, "Full-pretrain/Loss": 1.8474723100662231, "Full-pretrain/Loss (Raw)": 1.931260108947754, "Full-pretrain/Step": 8736, "Full-pretrain/Step Time": 17.644367584958673} +{"Full-pretrain/Learning Rate": 9.148567945386849e-07, "Full-pretrain/Loss": 1.8363279104232788, "Full-pretrain/Loss (Raw)": 1.4643977880477905, "Full-pretrain/Step": 8737, "Full-pretrain/Step Time": 17.651264676824212} +{"Full-pretrain/Learning Rate": 9.125822493412678e-07, "Full-pretrain/Loss": 1.8215947151184082, "Full-pretrain/Loss (Raw)": 1.5938720703125, "Full-pretrain/Step": 8738, "Full-pretrain/Step Time": 17.655830204486847} +{"Full-pretrain/Learning Rate": 9.103104826190312e-07, "Full-pretrain/Loss": 1.816937804222107, "Full-pretrain/Loss (Raw)": 1.7351341247558594, "Full-pretrain/Step": 8739, "Full-pretrain/Step Time": 17.65019467100501} +{"Full-pretrain/Learning Rate": 9.080414946340071e-07, "Full-pretrain/Loss": 1.8301284313201904, "Full-pretrain/Loss (Raw)": 1.6186838150024414, "Full-pretrain/Step": 8740, "Full-pretrain/Step Time": 17.64900598488748} +{"Full-pretrain/Learning Rate": 9.057752856479363e-07, "Full-pretrain/Loss": 1.83026123046875, "Full-pretrain/Loss (Raw)": 1.996152639389038, "Full-pretrain/Step": 8741, "Full-pretrain/Step Time": 17.647174693644047} +{"Full-pretrain/Learning Rate": 9.03511855922215e-07, "Full-pretrain/Loss": 1.8357715606689453, "Full-pretrain/Loss (Raw)": 1.9464333057403564, "Full-pretrain/Step": 8742, "Full-pretrain/Step Time": 17.652120742946863} +{"Full-pretrain/Learning Rate": 9.012512057179345e-07, "Full-pretrain/Loss": 1.8367043733596802, "Full-pretrain/Loss (Raw)": 1.972564697265625, "Full-pretrain/Step": 8743, "Full-pretrain/Step Time": 17.648393915966153} +{"Full-pretrain/Learning Rate": 8.989933352958558e-07, "Full-pretrain/Loss": 1.8219175338745117, "Full-pretrain/Loss (Raw)": 1.7176613807678223, "Full-pretrain/Step": 8744, "Full-pretrain/Step Time": 17.648742236196995} +{"Full-pretrain/Learning Rate": 8.967382449164314e-07, "Full-pretrain/Loss": 1.8036577701568604, "Full-pretrain/Loss (Raw)": 1.8660647869110107, "Full-pretrain/Step": 8745, "Full-pretrain/Step Time": 17.64582802541554} +{"Full-pretrain/Learning Rate": 8.944859348397755e-07, "Full-pretrain/Loss": 1.7955989837646484, "Full-pretrain/Loss (Raw)": 1.6701889038085938, "Full-pretrain/Step": 8746, "Full-pretrain/Step Time": 17.648166358470917} +{"Full-pretrain/Learning Rate": 8.922364053256971e-07, "Full-pretrain/Loss": 1.8026163578033447, "Full-pretrain/Loss (Raw)": 1.9640238285064697, "Full-pretrain/Step": 8747, "Full-pretrain/Step Time": 17.64828547462821} +{"Full-pretrain/Learning Rate": 8.899896566336746e-07, "Full-pretrain/Loss": 1.807342529296875, "Full-pretrain/Loss (Raw)": 2.0534989833831787, "Full-pretrain/Step": 8748, "Full-pretrain/Step Time": 17.647220192477107} +{"Full-pretrain/Learning Rate": 8.877456890228758e-07, "Full-pretrain/Loss": 1.8041679859161377, "Full-pretrain/Loss (Raw)": 1.9257147312164307, "Full-pretrain/Step": 8749, "Full-pretrain/Step Time": 17.65154094994068} +{"Full-pretrain/Learning Rate": 8.85504502752138e-07, "Full-pretrain/Loss": 1.7984199523925781, "Full-pretrain/Loss (Raw)": 1.6370558738708496, "Full-pretrain/Step": 8750, "Full-pretrain/Step Time": 17.647170243784785} +{"Full-pretrain/Learning Rate": 8.832660980799795e-07, "Full-pretrain/Loss": 1.7993547916412354, "Full-pretrain/Loss (Raw)": 1.6923458576202393, "Full-pretrain/Step": 8751, "Full-pretrain/Step Time": 17.643421521410346} +{"Full-pretrain/Learning Rate": 8.81030475264602e-07, "Full-pretrain/Loss": 1.8095897436141968, "Full-pretrain/Loss (Raw)": 1.8692855834960938, "Full-pretrain/Step": 8752, "Full-pretrain/Step Time": 17.640211582183838} +{"Full-pretrain/Learning Rate": 8.787976345638826e-07, "Full-pretrain/Loss": 1.8105230331420898, "Full-pretrain/Loss (Raw)": 1.9894044399261475, "Full-pretrain/Step": 8753, "Full-pretrain/Step Time": 17.644362242892385} +{"Full-pretrain/Learning Rate": 8.76567576235382e-07, "Full-pretrain/Loss": 1.8226797580718994, "Full-pretrain/Loss (Raw)": 2.1999433040618896, "Full-pretrain/Step": 8754, "Full-pretrain/Step Time": 17.64423399977386} +{"Full-pretrain/Learning Rate": 8.743403005363332e-07, "Full-pretrain/Loss": 1.829991102218628, "Full-pretrain/Loss (Raw)": 2.0864856243133545, "Full-pretrain/Step": 8755, "Full-pretrain/Step Time": 17.642588274553418} +{"Full-pretrain/Learning Rate": 8.721158077236503e-07, "Full-pretrain/Loss": 1.8348572254180908, "Full-pretrain/Loss (Raw)": 1.8896002769470215, "Full-pretrain/Step": 8756, "Full-pretrain/Step Time": 17.645051427185535} +{"Full-pretrain/Learning Rate": 8.698940980539332e-07, "Full-pretrain/Loss": 1.8422902822494507, "Full-pretrain/Loss (Raw)": 2.231755256652832, "Full-pretrain/Step": 8757, "Full-pretrain/Step Time": 17.642354499548674} +{"Full-pretrain/Learning Rate": 8.676751717834497e-07, "Full-pretrain/Loss": 1.8434076309204102, "Full-pretrain/Loss (Raw)": 1.85939359664917, "Full-pretrain/Step": 8758, "Full-pretrain/Step Time": 17.641969168558717} +{"Full-pretrain/Learning Rate": 8.65459029168153e-07, "Full-pretrain/Loss": 1.821467638015747, "Full-pretrain/Loss (Raw)": 1.3912944793701172, "Full-pretrain/Step": 8759, "Full-pretrain/Step Time": 17.64586234278977} +{"Full-pretrain/Learning Rate": 8.632456704636805e-07, "Full-pretrain/Loss": 1.8189282417297363, "Full-pretrain/Loss (Raw)": 1.7131401300430298, "Full-pretrain/Step": 8760, "Full-pretrain/Step Time": 17.64290643669665} +{"Full-pretrain/Learning Rate": 8.610350959253332e-07, "Full-pretrain/Loss": 1.8229119777679443, "Full-pretrain/Loss (Raw)": 1.8632349967956543, "Full-pretrain/Step": 8761, "Full-pretrain/Step Time": 17.64116115681827} +{"Full-pretrain/Learning Rate": 8.588273058081048e-07, "Full-pretrain/Loss": 1.8250701427459717, "Full-pretrain/Loss (Raw)": 1.892548680305481, "Full-pretrain/Step": 8762, "Full-pretrain/Step Time": 17.641778253018856} +{"Full-pretrain/Learning Rate": 8.566223003666635e-07, "Full-pretrain/Loss": 1.823854684829712, "Full-pretrain/Loss (Raw)": 1.5684261322021484, "Full-pretrain/Step": 8763, "Full-pretrain/Step Time": 17.63866768963635} +{"Full-pretrain/Learning Rate": 8.544200798553559e-07, "Full-pretrain/Loss": 1.826237678527832, "Full-pretrain/Loss (Raw)": 1.9263616800308228, "Full-pretrain/Step": 8764, "Full-pretrain/Step Time": 17.64579932577908} +{"Full-pretrain/Learning Rate": 8.522206445282038e-07, "Full-pretrain/Loss": 1.827115535736084, "Full-pretrain/Loss (Raw)": 1.7822442054748535, "Full-pretrain/Step": 8765, "Full-pretrain/Step Time": 17.642349721863866} +{"Full-pretrain/Learning Rate": 8.50023994638921e-07, "Full-pretrain/Loss": 1.835810899734497, "Full-pretrain/Loss (Raw)": 2.0064427852630615, "Full-pretrain/Step": 8766, "Full-pretrain/Step Time": 17.644961470738053} +{"Full-pretrain/Learning Rate": 8.47830130440877e-07, "Full-pretrain/Loss": 1.8512275218963623, "Full-pretrain/Loss (Raw)": 2.184663772583008, "Full-pretrain/Step": 8767, "Full-pretrain/Step Time": 17.645585911348462} +{"Full-pretrain/Learning Rate": 8.456390521871415e-07, "Full-pretrain/Loss": 1.8412950038909912, "Full-pretrain/Loss (Raw)": 1.6134214401245117, "Full-pretrain/Step": 8768, "Full-pretrain/Step Time": 17.65068037994206} +{"Full-pretrain/Learning Rate": 8.434507601304542e-07, "Full-pretrain/Loss": 1.8577035665512085, "Full-pretrain/Loss (Raw)": 1.9894729852676392, "Full-pretrain/Step": 8769, "Full-pretrain/Step Time": 17.649646386504173} +{"Full-pretrain/Learning Rate": 8.412652545232324e-07, "Full-pretrain/Loss": 1.8556815385818481, "Full-pretrain/Loss (Raw)": 1.5291694402694702, "Full-pretrain/Step": 8770, "Full-pretrain/Step Time": 17.644211309030652} +{"Full-pretrain/Learning Rate": 8.390825356175747e-07, "Full-pretrain/Loss": 1.8626947402954102, "Full-pretrain/Loss (Raw)": 1.959552526473999, "Full-pretrain/Step": 8771, "Full-pretrain/Step Time": 17.64131575077772} +{"Full-pretrain/Learning Rate": 8.369026036652516e-07, "Full-pretrain/Loss": 1.8687068223953247, "Full-pretrain/Loss (Raw)": 1.8110737800598145, "Full-pretrain/Step": 8772, "Full-pretrain/Step Time": 17.64639661461115} +{"Full-pretrain/Learning Rate": 8.347254589177234e-07, "Full-pretrain/Loss": 1.859297752380371, "Full-pretrain/Loss (Raw)": 1.6950576305389404, "Full-pretrain/Step": 8773, "Full-pretrain/Step Time": 17.646122166886926} +{"Full-pretrain/Learning Rate": 8.32551101626125e-07, "Full-pretrain/Loss": 1.8623356819152832, "Full-pretrain/Loss (Raw)": 2.043652057647705, "Full-pretrain/Step": 8774, "Full-pretrain/Step Time": 17.63564645498991} +{"Full-pretrain/Learning Rate": 8.303795320412616e-07, "Full-pretrain/Loss": 1.865721583366394, "Full-pretrain/Loss (Raw)": 2.0809130668640137, "Full-pretrain/Step": 8775, "Full-pretrain/Step Time": 17.636922949925065} +{"Full-pretrain/Learning Rate": 8.282107504136271e-07, "Full-pretrain/Loss": 1.8766841888427734, "Full-pretrain/Loss (Raw)": 2.068467378616333, "Full-pretrain/Step": 8776, "Full-pretrain/Step Time": 17.632947199046612} +{"Full-pretrain/Learning Rate": 8.260447569933827e-07, "Full-pretrain/Loss": 1.8749363422393799, "Full-pretrain/Loss (Raw)": 1.8101308345794678, "Full-pretrain/Step": 8777, "Full-pretrain/Step Time": 17.6357187833637} +{"Full-pretrain/Learning Rate": 8.238815520303839e-07, "Full-pretrain/Loss": 1.8726763725280762, "Full-pretrain/Loss (Raw)": 1.5978721380233765, "Full-pretrain/Step": 8778, "Full-pretrain/Step Time": 17.63657896593213} +{"Full-pretrain/Learning Rate": 8.217211357741505e-07, "Full-pretrain/Loss": 1.8739638328552246, "Full-pretrain/Loss (Raw)": 2.005218982696533, "Full-pretrain/Step": 8779, "Full-pretrain/Step Time": 17.633442850783467} +{"Full-pretrain/Learning Rate": 8.195635084738862e-07, "Full-pretrain/Loss": 1.8680071830749512, "Full-pretrain/Loss (Raw)": 1.86288583278656, "Full-pretrain/Step": 8780, "Full-pretrain/Step Time": 17.630578443408012} +{"Full-pretrain/Learning Rate": 8.174086703784778e-07, "Full-pretrain/Loss": 1.8671424388885498, "Full-pretrain/Loss (Raw)": 1.8980450630187988, "Full-pretrain/Step": 8781, "Full-pretrain/Step Time": 17.63116754963994} +{"Full-pretrain/Learning Rate": 8.152566217364793e-07, "Full-pretrain/Loss": 1.8737118244171143, "Full-pretrain/Loss (Raw)": 1.8472752571105957, "Full-pretrain/Step": 8782, "Full-pretrain/Step Time": 17.62686286866665} +{"Full-pretrain/Learning Rate": 8.131073627961283e-07, "Full-pretrain/Loss": 1.8893324136734009, "Full-pretrain/Loss (Raw)": 2.192203998565674, "Full-pretrain/Step": 8783, "Full-pretrain/Step Time": 17.62242187745869} +{"Full-pretrain/Learning Rate": 8.109608938053431e-07, "Full-pretrain/Loss": 1.8948991298675537, "Full-pretrain/Loss (Raw)": 2.047421932220459, "Full-pretrain/Step": 8784, "Full-pretrain/Step Time": 17.62872314080596} +{"Full-pretrain/Learning Rate": 8.088172150117202e-07, "Full-pretrain/Loss": 1.890033483505249, "Full-pretrain/Loss (Raw)": 1.8337022066116333, "Full-pretrain/Step": 8785, "Full-pretrain/Step Time": 17.62295284308493} +{"Full-pretrain/Learning Rate": 8.066763266625282e-07, "Full-pretrain/Loss": 1.8840241432189941, "Full-pretrain/Loss (Raw)": 2.007643938064575, "Full-pretrain/Step": 8786, "Full-pretrain/Step Time": 17.621854692697525} +{"Full-pretrain/Learning Rate": 8.045382290047227e-07, "Full-pretrain/Loss": 1.8802573680877686, "Full-pretrain/Loss (Raw)": 1.965950608253479, "Full-pretrain/Step": 8787, "Full-pretrain/Step Time": 17.622148636728525} +{"Full-pretrain/Learning Rate": 8.024029222849283e-07, "Full-pretrain/Loss": 1.8723876476287842, "Full-pretrain/Loss (Raw)": 1.6377696990966797, "Full-pretrain/Step": 8788, "Full-pretrain/Step Time": 17.6223664842546} +{"Full-pretrain/Learning Rate": 8.002704067494509e-07, "Full-pretrain/Loss": 1.8537945747375488, "Full-pretrain/Loss (Raw)": 1.6367738246917725, "Full-pretrain/Step": 8789, "Full-pretrain/Step Time": 17.62149938195944} +{"Full-pretrain/Learning Rate": 7.981406826442828e-07, "Full-pretrain/Loss": 1.8549206256866455, "Full-pretrain/Loss (Raw)": 1.8954304456710815, "Full-pretrain/Step": 8790, "Full-pretrain/Step Time": 17.621457681059837} +{"Full-pretrain/Learning Rate": 7.960137502150772e-07, "Full-pretrain/Loss": 1.8778818845748901, "Full-pretrain/Loss (Raw)": 2.1260533332824707, "Full-pretrain/Step": 8791, "Full-pretrain/Step Time": 17.616528943181038} +{"Full-pretrain/Learning Rate": 7.938896097071824e-07, "Full-pretrain/Loss": 1.8853309154510498, "Full-pretrain/Loss (Raw)": 1.9515119791030884, "Full-pretrain/Step": 8792, "Full-pretrain/Step Time": 17.612276785075665} +{"Full-pretrain/Learning Rate": 7.917682613656136e-07, "Full-pretrain/Loss": 1.8804991245269775, "Full-pretrain/Loss (Raw)": 1.7086162567138672, "Full-pretrain/Step": 8793, "Full-pretrain/Step Time": 17.613111075013876} +{"Full-pretrain/Learning Rate": 7.896497054350665e-07, "Full-pretrain/Loss": 1.8815081119537354, "Full-pretrain/Loss (Raw)": 1.9248380661010742, "Full-pretrain/Step": 8794, "Full-pretrain/Step Time": 17.61023577488959} +{"Full-pretrain/Learning Rate": 7.875339421599182e-07, "Full-pretrain/Loss": 1.8902835845947266, "Full-pretrain/Loss (Raw)": 1.8492352962493896, "Full-pretrain/Step": 8795, "Full-pretrain/Step Time": 17.609040927141905} +{"Full-pretrain/Learning Rate": 7.854209717842231e-07, "Full-pretrain/Loss": 1.8924989700317383, "Full-pretrain/Loss (Raw)": 1.9972566366195679, "Full-pretrain/Step": 8796, "Full-pretrain/Step Time": 17.60782629624009} +{"Full-pretrain/Learning Rate": 7.833107945517087e-07, "Full-pretrain/Loss": 1.8967740535736084, "Full-pretrain/Loss (Raw)": 1.9190478324890137, "Full-pretrain/Step": 8797, "Full-pretrain/Step Time": 17.619277769699693} +{"Full-pretrain/Learning Rate": 7.81203410705783e-07, "Full-pretrain/Loss": 1.898949384689331, "Full-pretrain/Loss (Raw)": 2.076054096221924, "Full-pretrain/Step": 8798, "Full-pretrain/Step Time": 17.615825014188886} +{"Full-pretrain/Learning Rate": 7.790988204895323e-07, "Full-pretrain/Loss": 1.9011050462722778, "Full-pretrain/Loss (Raw)": 2.2536427974700928, "Full-pretrain/Step": 8799, "Full-pretrain/Step Time": 17.6136276088655} +{"Full-pretrain/Learning Rate": 7.769970241457203e-07, "Full-pretrain/Loss": 1.9109042882919312, "Full-pretrain/Loss (Raw)": 1.9269983768463135, "Full-pretrain/Step": 8800, "Full-pretrain/Step Time": 17.615930115804076} +{"Full-pretrain/Learning Rate": 7.748980219167895e-07, "Full-pretrain/Loss": 1.9109714031219482, "Full-pretrain/Loss (Raw)": 1.991622805595398, "Full-pretrain/Step": 8801, "Full-pretrain/Step Time": 17.61536510847509} +{"Full-pretrain/Learning Rate": 7.728018140448628e-07, "Full-pretrain/Loss": 1.9266217947006226, "Full-pretrain/Loss (Raw)": 2.0299792289733887, "Full-pretrain/Step": 8802, "Full-pretrain/Step Time": 17.611656229943037} +{"Full-pretrain/Learning Rate": 7.707084007717274e-07, "Full-pretrain/Loss": 1.929232120513916, "Full-pretrain/Loss (Raw)": 2.043081760406494, "Full-pretrain/Step": 8803, "Full-pretrain/Step Time": 17.605248177424073} +{"Full-pretrain/Learning Rate": 7.686177823388651e-07, "Full-pretrain/Loss": 1.9281342029571533, "Full-pretrain/Loss (Raw)": 1.7759387493133545, "Full-pretrain/Step": 8804, "Full-pretrain/Step Time": 17.605930540710688} +{"Full-pretrain/Learning Rate": 7.665299589874248e-07, "Full-pretrain/Loss": 1.9305295944213867, "Full-pretrain/Loss (Raw)": 1.7717158794403076, "Full-pretrain/Step": 8805, "Full-pretrain/Step Time": 17.604272769764066} +{"Full-pretrain/Learning Rate": 7.644449309582385e-07, "Full-pretrain/Loss": 1.9204027652740479, "Full-pretrain/Loss (Raw)": 1.719590425491333, "Full-pretrain/Step": 8806, "Full-pretrain/Step Time": 17.604115705937147} +{"Full-pretrain/Learning Rate": 7.623626984918142e-07, "Full-pretrain/Loss": 1.9212532043457031, "Full-pretrain/Loss (Raw)": 2.108124256134033, "Full-pretrain/Step": 8807, "Full-pretrain/Step Time": 17.60802024230361} +{"Full-pretrain/Learning Rate": 7.602832618283346e-07, "Full-pretrain/Loss": 1.9105051755905151, "Full-pretrain/Loss (Raw)": 1.724534034729004, "Full-pretrain/Step": 8808, "Full-pretrain/Step Time": 17.6054560393095} +{"Full-pretrain/Learning Rate": 7.582066212076632e-07, "Full-pretrain/Loss": 1.900040864944458, "Full-pretrain/Loss (Raw)": 1.47527015209198, "Full-pretrain/Step": 8809, "Full-pretrain/Step Time": 17.60962489619851} +{"Full-pretrain/Learning Rate": 7.561327768693366e-07, "Full-pretrain/Loss": 1.913438320159912, "Full-pretrain/Loss (Raw)": 2.02659273147583, "Full-pretrain/Step": 8810, "Full-pretrain/Step Time": 17.61260531656444} +{"Full-pretrain/Learning Rate": 7.540617290525743e-07, "Full-pretrain/Loss": 1.9136834144592285, "Full-pretrain/Loss (Raw)": 2.0130581855773926, "Full-pretrain/Step": 8811, "Full-pretrain/Step Time": 17.610619992017746} +{"Full-pretrain/Learning Rate": 7.519934779962684e-07, "Full-pretrain/Loss": 1.9144713878631592, "Full-pretrain/Loss (Raw)": 1.8881053924560547, "Full-pretrain/Step": 8812, "Full-pretrain/Step Time": 17.605334237217903} +{"Full-pretrain/Learning Rate": 7.499280239389978e-07, "Full-pretrain/Loss": 1.9136497974395752, "Full-pretrain/Loss (Raw)": 1.871753215789795, "Full-pretrain/Step": 8813, "Full-pretrain/Step Time": 17.603186678141356} +{"Full-pretrain/Learning Rate": 7.478653671190078e-07, "Full-pretrain/Loss": 1.9198888540267944, "Full-pretrain/Loss (Raw)": 2.0469284057617188, "Full-pretrain/Step": 8814, "Full-pretrain/Step Time": 17.60172407887876} +{"Full-pretrain/Learning Rate": 7.458055077742221e-07, "Full-pretrain/Loss": 1.9259415864944458, "Full-pretrain/Loss (Raw)": 2.385887861251831, "Full-pretrain/Step": 8815, "Full-pretrain/Step Time": 17.604020366445184} +{"Full-pretrain/Learning Rate": 7.437484461422478e-07, "Full-pretrain/Loss": 1.9167019128799438, "Full-pretrain/Loss (Raw)": 1.751753807067871, "Full-pretrain/Step": 8816, "Full-pretrain/Step Time": 17.598689476028085} +{"Full-pretrain/Learning Rate": 7.416941824603646e-07, "Full-pretrain/Loss": 1.9222527742385864, "Full-pretrain/Loss (Raw)": 2.0113282203674316, "Full-pretrain/Step": 8817, "Full-pretrain/Step Time": 17.602687971666455} +{"Full-pretrain/Learning Rate": 7.396427169655384e-07, "Full-pretrain/Loss": 1.917239785194397, "Full-pretrain/Loss (Raw)": 1.8472301959991455, "Full-pretrain/Step": 8818, "Full-pretrain/Step Time": 17.603970436379313} +{"Full-pretrain/Learning Rate": 7.37594049894394e-07, "Full-pretrain/Loss": 1.9262031316757202, "Full-pretrain/Loss (Raw)": 2.2527754306793213, "Full-pretrain/Step": 8819, "Full-pretrain/Step Time": 17.606988944113255} +{"Full-pretrain/Learning Rate": 7.355481814832505e-07, "Full-pretrain/Loss": 1.9293005466461182, "Full-pretrain/Loss (Raw)": 1.7368892431259155, "Full-pretrain/Step": 8820, "Full-pretrain/Step Time": 17.60164976865053} +{"Full-pretrain/Learning Rate": 7.335051119680969e-07, "Full-pretrain/Loss": 1.9320745468139648, "Full-pretrain/Loss (Raw)": 1.7255370616912842, "Full-pretrain/Step": 8821, "Full-pretrain/Step Time": 17.604257687926292} +{"Full-pretrain/Learning Rate": 7.314648415846004e-07, "Full-pretrain/Loss": 1.923424482345581, "Full-pretrain/Loss (Raw)": 1.6186299324035645, "Full-pretrain/Step": 8822, "Full-pretrain/Step Time": 17.604402154684067} +{"Full-pretrain/Learning Rate": 7.294273705681087e-07, "Full-pretrain/Loss": 1.926213026046753, "Full-pretrain/Loss (Raw)": 2.215285539627075, "Full-pretrain/Step": 8823, "Full-pretrain/Step Time": 17.60869264230132} +{"Full-pretrain/Learning Rate": 7.273926991536367e-07, "Full-pretrain/Loss": 1.9292322397232056, "Full-pretrain/Loss (Raw)": 2.048129081726074, "Full-pretrain/Step": 8824, "Full-pretrain/Step Time": 17.60991644486785} +{"Full-pretrain/Learning Rate": 7.253608275758911e-07, "Full-pretrain/Loss": 1.9320993423461914, "Full-pretrain/Loss (Raw)": 1.8003652095794678, "Full-pretrain/Step": 8825, "Full-pretrain/Step Time": 17.610148360952735} +{"Full-pretrain/Learning Rate": 7.233317560692426e-07, "Full-pretrain/Loss": 1.940753698348999, "Full-pretrain/Loss (Raw)": 2.2017743587493896, "Full-pretrain/Step": 8826, "Full-pretrain/Step Time": 17.608715809881687} +{"Full-pretrain/Learning Rate": 7.213054848677403e-07, "Full-pretrain/Loss": 1.949995756149292, "Full-pretrain/Loss (Raw)": 2.1449813842773438, "Full-pretrain/Step": 8827, "Full-pretrain/Step Time": 17.617060359567404} +{"Full-pretrain/Learning Rate": 7.192820142051221e-07, "Full-pretrain/Loss": 1.942814588546753, "Full-pretrain/Loss (Raw)": 1.7674651145935059, "Full-pretrain/Step": 8828, "Full-pretrain/Step Time": 17.616638142615557} +{"Full-pretrain/Learning Rate": 7.172613443147902e-07, "Full-pretrain/Loss": 1.9451708793640137, "Full-pretrain/Loss (Raw)": 1.9944474697113037, "Full-pretrain/Step": 8829, "Full-pretrain/Step Time": 17.609291039407253} +{"Full-pretrain/Learning Rate": 7.152434754298276e-07, "Full-pretrain/Loss": 1.940021276473999, "Full-pretrain/Loss (Raw)": 1.9112629890441895, "Full-pretrain/Step": 8830, "Full-pretrain/Step Time": 17.61029153689742} +{"Full-pretrain/Learning Rate": 7.132284077829954e-07, "Full-pretrain/Loss": 1.9293217658996582, "Full-pretrain/Loss (Raw)": 1.9112623929977417, "Full-pretrain/Step": 8831, "Full-pretrain/Step Time": 17.61762573570013} +{"Full-pretrain/Learning Rate": 7.112161416067325e-07, "Full-pretrain/Loss": 1.9288685321807861, "Full-pretrain/Loss (Raw)": 1.9124925136566162, "Full-pretrain/Step": 8832, "Full-pretrain/Step Time": 17.61880054883659} +{"Full-pretrain/Learning Rate": 7.092066771331507e-07, "Full-pretrain/Loss": 1.9371017217636108, "Full-pretrain/Loss (Raw)": 2.255084991455078, "Full-pretrain/Step": 8833, "Full-pretrain/Step Time": 17.608633067458868} +{"Full-pretrain/Learning Rate": 7.07200014594045e-07, "Full-pretrain/Loss": 1.9261488914489746, "Full-pretrain/Loss (Raw)": 1.6794888973236084, "Full-pretrain/Step": 8834, "Full-pretrain/Step Time": 17.613533591851592} +{"Full-pretrain/Learning Rate": 7.051961542208801e-07, "Full-pretrain/Loss": 1.9242336750030518, "Full-pretrain/Loss (Raw)": 1.9817917346954346, "Full-pretrain/Step": 8835, "Full-pretrain/Step Time": 17.614493997767568} +{"Full-pretrain/Learning Rate": 7.031950962447992e-07, "Full-pretrain/Loss": 1.934804916381836, "Full-pretrain/Loss (Raw)": 2.1142194271087646, "Full-pretrain/Step": 8836, "Full-pretrain/Step Time": 17.616549227386713} +{"Full-pretrain/Learning Rate": 7.011968408966257e-07, "Full-pretrain/Loss": 1.9427545070648193, "Full-pretrain/Loss (Raw)": 2.026104211807251, "Full-pretrain/Step": 8837, "Full-pretrain/Step Time": 17.613644115626812} +{"Full-pretrain/Learning Rate": 6.99201388406856e-07, "Full-pretrain/Loss": 1.9514331817626953, "Full-pretrain/Loss (Raw)": 1.9973093271255493, "Full-pretrain/Step": 8838, "Full-pretrain/Step Time": 17.62089833058417} +{"Full-pretrain/Learning Rate": 6.972087390056697e-07, "Full-pretrain/Loss": 1.941270112991333, "Full-pretrain/Loss (Raw)": 1.7829010486602783, "Full-pretrain/Step": 8839, "Full-pretrain/Step Time": 17.623187076300383} +{"Full-pretrain/Learning Rate": 6.952188929229136e-07, "Full-pretrain/Loss": 1.9438883066177368, "Full-pretrain/Loss (Raw)": 1.8083195686340332, "Full-pretrain/Step": 8840, "Full-pretrain/Step Time": 17.631513057276607} +{"Full-pretrain/Learning Rate": 6.93231850388118e-07, "Full-pretrain/Loss": 1.9592349529266357, "Full-pretrain/Loss (Raw)": 1.9663598537445068, "Full-pretrain/Step": 8841, "Full-pretrain/Step Time": 17.62657110579312} +{"Full-pretrain/Learning Rate": 6.912476116304828e-07, "Full-pretrain/Loss": 1.9525926113128662, "Full-pretrain/Loss (Raw)": 1.8140404224395752, "Full-pretrain/Step": 8842, "Full-pretrain/Step Time": 17.62394225783646} +{"Full-pretrain/Learning Rate": 6.892661768788944e-07, "Full-pretrain/Loss": 1.9553501605987549, "Full-pretrain/Loss (Raw)": 2.1013009548187256, "Full-pretrain/Step": 8843, "Full-pretrain/Step Time": 17.629001127555966} +{"Full-pretrain/Learning Rate": 6.872875463619088e-07, "Full-pretrain/Loss": 1.9621202945709229, "Full-pretrain/Loss (Raw)": 2.1047511100769043, "Full-pretrain/Step": 8844, "Full-pretrain/Step Time": 17.638719966635108} +{"Full-pretrain/Learning Rate": 6.853117203077658e-07, "Full-pretrain/Loss": 1.9634430408477783, "Full-pretrain/Loss (Raw)": 1.9140782356262207, "Full-pretrain/Step": 8845, "Full-pretrain/Step Time": 17.636261463165283} +{"Full-pretrain/Learning Rate": 6.833386989443636e-07, "Full-pretrain/Loss": 1.9616531133651733, "Full-pretrain/Loss (Raw)": 1.9896509647369385, "Full-pretrain/Step": 8846, "Full-pretrain/Step Time": 17.629581646993756} +{"Full-pretrain/Learning Rate": 6.813684824993005e-07, "Full-pretrain/Loss": 1.9425928592681885, "Full-pretrain/Loss (Raw)": 1.7759628295898438, "Full-pretrain/Step": 8847, "Full-pretrain/Step Time": 17.6315799318254} +{"Full-pretrain/Learning Rate": 6.794010711998366e-07, "Full-pretrain/Loss": 1.9482924938201904, "Full-pretrain/Loss (Raw)": 1.9341421127319336, "Full-pretrain/Step": 8848, "Full-pretrain/Step Time": 17.63647322356701} +{"Full-pretrain/Learning Rate": 6.774364652729098e-07, "Full-pretrain/Loss": 1.9443199634552002, "Full-pretrain/Loss (Raw)": 1.8842074871063232, "Full-pretrain/Step": 8849, "Full-pretrain/Step Time": 17.63127608038485} +{"Full-pretrain/Learning Rate": 6.754746649451444e-07, "Full-pretrain/Loss": 1.951567530632019, "Full-pretrain/Loss (Raw)": 2.0791494846343994, "Full-pretrain/Step": 8850, "Full-pretrain/Step Time": 17.631913892924786} +{"Full-pretrain/Learning Rate": 6.735156704428258e-07, "Full-pretrain/Loss": 1.9459667205810547, "Full-pretrain/Loss (Raw)": 2.0735514163970947, "Full-pretrain/Step": 8851, "Full-pretrain/Step Time": 17.641590164974332} +{"Full-pretrain/Learning Rate": 6.715594819919236e-07, "Full-pretrain/Loss": 1.9588842391967773, "Full-pretrain/Loss (Raw)": 2.1502490043640137, "Full-pretrain/Step": 8852, "Full-pretrain/Step Time": 17.641829408705235} +{"Full-pretrain/Learning Rate": 6.696060998180875e-07, "Full-pretrain/Loss": 1.962332010269165, "Full-pretrain/Loss (Raw)": 1.835863471031189, "Full-pretrain/Step": 8853, "Full-pretrain/Step Time": 17.644783249124885} +{"Full-pretrain/Learning Rate": 6.676555241466347e-07, "Full-pretrain/Loss": 1.968968152999878, "Full-pretrain/Loss (Raw)": 1.8309892416000366, "Full-pretrain/Step": 8854, "Full-pretrain/Step Time": 17.633401157334447} +{"Full-pretrain/Learning Rate": 6.657077552025714e-07, "Full-pretrain/Loss": 1.965815782546997, "Full-pretrain/Loss (Raw)": 2.1144070625305176, "Full-pretrain/Step": 8855, "Full-pretrain/Step Time": 17.640361290425062} +{"Full-pretrain/Learning Rate": 6.637627932105623e-07, "Full-pretrain/Loss": 1.9436999559402466, "Full-pretrain/Loss (Raw)": 1.3404231071472168, "Full-pretrain/Step": 8856, "Full-pretrain/Step Time": 17.642514197155833} +{"Full-pretrain/Learning Rate": 6.618206383949638e-07, "Full-pretrain/Loss": 1.9497276544570923, "Full-pretrain/Loss (Raw)": 1.9932506084442139, "Full-pretrain/Step": 8857, "Full-pretrain/Step Time": 17.640337757766247} +{"Full-pretrain/Learning Rate": 6.598812909798052e-07, "Full-pretrain/Loss": 1.9299542903900146, "Full-pretrain/Loss (Raw)": 1.569025993347168, "Full-pretrain/Step": 8858, "Full-pretrain/Step Time": 17.639688152819872} +{"Full-pretrain/Learning Rate": 6.579447511887826e-07, "Full-pretrain/Loss": 1.9247417449951172, "Full-pretrain/Loss (Raw)": 1.9781808853149414, "Full-pretrain/Step": 8859, "Full-pretrain/Step Time": 17.642707761377096} +{"Full-pretrain/Learning Rate": 6.560110192452812e-07, "Full-pretrain/Loss": 1.9289422035217285, "Full-pretrain/Loss (Raw)": 1.9018813371658325, "Full-pretrain/Step": 8860, "Full-pretrain/Step Time": 17.643955631181598} +{"Full-pretrain/Learning Rate": 6.540800953723503e-07, "Full-pretrain/Loss": 1.9263231754302979, "Full-pretrain/Loss (Raw)": 1.9106388092041016, "Full-pretrain/Step": 8861, "Full-pretrain/Step Time": 17.644421027973294} +{"Full-pretrain/Learning Rate": 6.521519797927256e-07, "Full-pretrain/Loss": 1.9267547130584717, "Full-pretrain/Loss (Raw)": 1.925071120262146, "Full-pretrain/Step": 8862, "Full-pretrain/Step Time": 17.64533601887524} +{"Full-pretrain/Learning Rate": 6.502266727288126e-07, "Full-pretrain/Loss": 1.9324090480804443, "Full-pretrain/Loss (Raw)": 2.092203140258789, "Full-pretrain/Step": 8863, "Full-pretrain/Step Time": 17.6462237033993} +{"Full-pretrain/Learning Rate": 6.483041744026946e-07, "Full-pretrain/Loss": 1.9366226196289062, "Full-pretrain/Loss (Raw)": 2.047325611114502, "Full-pretrain/Step": 8864, "Full-pretrain/Step Time": 17.648227291181684} +{"Full-pretrain/Learning Rate": 6.463844850361361e-07, "Full-pretrain/Loss": 1.918299674987793, "Full-pretrain/Loss (Raw)": 1.6687541007995605, "Full-pretrain/Step": 8865, "Full-pretrain/Step Time": 17.647542448714375} +{"Full-pretrain/Learning Rate": 6.444676048505682e-07, "Full-pretrain/Loss": 1.9204986095428467, "Full-pretrain/Loss (Raw)": 1.7498505115509033, "Full-pretrain/Step": 8866, "Full-pretrain/Step Time": 17.638281248509884} +{"Full-pretrain/Learning Rate": 6.425535340671002e-07, "Full-pretrain/Loss": 1.9213314056396484, "Full-pretrain/Loss (Raw)": 2.008441925048828, "Full-pretrain/Step": 8867, "Full-pretrain/Step Time": 17.642394127324224} +{"Full-pretrain/Learning Rate": 6.406422729065248e-07, "Full-pretrain/Loss": 1.91796875, "Full-pretrain/Loss (Raw)": 2.0066118240356445, "Full-pretrain/Step": 8868, "Full-pretrain/Step Time": 17.647488014772534} +{"Full-pretrain/Learning Rate": 6.387338215893019e-07, "Full-pretrain/Loss": 1.9080486297607422, "Full-pretrain/Loss (Raw)": 1.7086608409881592, "Full-pretrain/Step": 8869, "Full-pretrain/Step Time": 17.647626414895058} +{"Full-pretrain/Learning Rate": 6.368281803355691e-07, "Full-pretrain/Loss": 1.8949213027954102, "Full-pretrain/Loss (Raw)": 1.5772340297698975, "Full-pretrain/Step": 8870, "Full-pretrain/Step Time": 17.643959064036608} +{"Full-pretrain/Learning Rate": 6.349253493651508e-07, "Full-pretrain/Loss": 1.8980942964553833, "Full-pretrain/Loss (Raw)": 1.884439468383789, "Full-pretrain/Step": 8871, "Full-pretrain/Step Time": 17.648401144891977} +{"Full-pretrain/Learning Rate": 6.33025328897524e-07, "Full-pretrain/Loss": 1.9092944860458374, "Full-pretrain/Loss (Raw)": 2.1667227745056152, "Full-pretrain/Step": 8872, "Full-pretrain/Step Time": 17.650894297286868} +{"Full-pretrain/Learning Rate": 6.311281191518636e-07, "Full-pretrain/Loss": 1.902612566947937, "Full-pretrain/Loss (Raw)": 1.7525415420532227, "Full-pretrain/Step": 8873, "Full-pretrain/Step Time": 17.64636933989823} +{"Full-pretrain/Learning Rate": 6.292337203470139e-07, "Full-pretrain/Loss": 1.8963701725006104, "Full-pretrain/Loss (Raw)": 1.6142820119857788, "Full-pretrain/Step": 8874, "Full-pretrain/Step Time": 17.650169115513563} +{"Full-pretrain/Learning Rate": 6.273421327014889e-07, "Full-pretrain/Loss": 1.8883987665176392, "Full-pretrain/Loss (Raw)": 1.8462172746658325, "Full-pretrain/Step": 8875, "Full-pretrain/Step Time": 17.65058534219861} +{"Full-pretrain/Learning Rate": 6.254533564334863e-07, "Full-pretrain/Loss": 1.8695003986358643, "Full-pretrain/Loss (Raw)": 1.5000057220458984, "Full-pretrain/Step": 8876, "Full-pretrain/Step Time": 17.649529665708542} +{"Full-pretrain/Learning Rate": 6.235673917608681e-07, "Full-pretrain/Loss": 1.867058277130127, "Full-pretrain/Loss (Raw)": 1.8359289169311523, "Full-pretrain/Step": 8877, "Full-pretrain/Step Time": 17.649821426719427} +{"Full-pretrain/Learning Rate": 6.216842389011852e-07, "Full-pretrain/Loss": 1.8704946041107178, "Full-pretrain/Loss (Raw)": 2.099614143371582, "Full-pretrain/Step": 8878, "Full-pretrain/Step Time": 17.65474558994174} +{"Full-pretrain/Learning Rate": 6.198038980716608e-07, "Full-pretrain/Loss": 1.8765549659729004, "Full-pretrain/Loss (Raw)": 1.9698926210403442, "Full-pretrain/Step": 8879, "Full-pretrain/Step Time": 17.656323172152042} +{"Full-pretrain/Learning Rate": 6.179263694891857e-07, "Full-pretrain/Loss": 1.8810850381851196, "Full-pretrain/Loss (Raw)": 2.0791051387786865, "Full-pretrain/Step": 8880, "Full-pretrain/Step Time": 17.65136832371354} +{"Full-pretrain/Learning Rate": 6.160516533703392e-07, "Full-pretrain/Loss": 1.8873673677444458, "Full-pretrain/Loss (Raw)": 2.0852408409118652, "Full-pretrain/Step": 8881, "Full-pretrain/Step Time": 17.64807366207242} +{"Full-pretrain/Learning Rate": 6.14179749931365e-07, "Full-pretrain/Loss": 1.884127140045166, "Full-pretrain/Loss (Raw)": 1.9754624366760254, "Full-pretrain/Step": 8882, "Full-pretrain/Step Time": 17.649857522919774} +{"Full-pretrain/Learning Rate": 6.12310659388185e-07, "Full-pretrain/Loss": 1.873466968536377, "Full-pretrain/Loss (Raw)": 1.7324280738830566, "Full-pretrain/Step": 8883, "Full-pretrain/Step Time": 17.650897976011038} +{"Full-pretrain/Learning Rate": 6.104443819563987e-07, "Full-pretrain/Loss": 1.8753430843353271, "Full-pretrain/Loss (Raw)": 2.210283041000366, "Full-pretrain/Step": 8884, "Full-pretrain/Step Time": 17.646481726318598} +{"Full-pretrain/Learning Rate": 6.085809178512841e-07, "Full-pretrain/Loss": 1.8818597793579102, "Full-pretrain/Loss (Raw)": 2.0443975925445557, "Full-pretrain/Step": 8885, "Full-pretrain/Step Time": 17.644890444353223} +{"Full-pretrain/Learning Rate": 6.067202672877886e-07, "Full-pretrain/Loss": 1.8728973865509033, "Full-pretrain/Loss (Raw)": 1.544193983078003, "Full-pretrain/Step": 8886, "Full-pretrain/Step Time": 17.649271292611957} +{"Full-pretrain/Learning Rate": 6.048624304805378e-07, "Full-pretrain/Loss": 1.8735973834991455, "Full-pretrain/Loss (Raw)": 2.1368050575256348, "Full-pretrain/Step": 8887, "Full-pretrain/Step Time": 17.640886144712567} +{"Full-pretrain/Learning Rate": 6.030074076438325e-07, "Full-pretrain/Loss": 1.8880294561386108, "Full-pretrain/Loss (Raw)": 1.8022522926330566, "Full-pretrain/Step": 8888, "Full-pretrain/Step Time": 17.643274838104844} +{"Full-pretrain/Learning Rate": 6.011551989916486e-07, "Full-pretrain/Loss": 1.883979320526123, "Full-pretrain/Loss (Raw)": 1.8636445999145508, "Full-pretrain/Step": 8889, "Full-pretrain/Step Time": 17.64078276231885} +{"Full-pretrain/Learning Rate": 5.993058047376376e-07, "Full-pretrain/Loss": 1.885716199874878, "Full-pretrain/Loss (Raw)": 1.6246079206466675, "Full-pretrain/Step": 8890, "Full-pretrain/Step Time": 17.642027216032147} +{"Full-pretrain/Learning Rate": 5.974592250951316e-07, "Full-pretrain/Loss": 1.878555178642273, "Full-pretrain/Loss (Raw)": 1.7490262985229492, "Full-pretrain/Step": 8891, "Full-pretrain/Step Time": 17.646073274314404} +{"Full-pretrain/Learning Rate": 5.956154602771241e-07, "Full-pretrain/Loss": 1.8759928941726685, "Full-pretrain/Loss (Raw)": 1.8198885917663574, "Full-pretrain/Step": 8892, "Full-pretrain/Step Time": 17.64559186808765} +{"Full-pretrain/Learning Rate": 5.937745104962978e-07, "Full-pretrain/Loss": 1.8620166778564453, "Full-pretrain/Loss (Raw)": 1.4634039402008057, "Full-pretrain/Step": 8893, "Full-pretrain/Step Time": 17.64364742487669} +{"Full-pretrain/Learning Rate": 5.919363759650049e-07, "Full-pretrain/Loss": 1.8665300607681274, "Full-pretrain/Loss (Raw)": 2.0694961547851562, "Full-pretrain/Step": 8894, "Full-pretrain/Step Time": 17.641528071835637} +{"Full-pretrain/Learning Rate": 5.90101056895273e-07, "Full-pretrain/Loss": 1.8553599119186401, "Full-pretrain/Loss (Raw)": 1.7347586154937744, "Full-pretrain/Step": 8895, "Full-pretrain/Step Time": 17.64754462055862} +{"Full-pretrain/Learning Rate": 5.882685534988053e-07, "Full-pretrain/Loss": 1.8532031774520874, "Full-pretrain/Loss (Raw)": 1.978309988975525, "Full-pretrain/Step": 8896, "Full-pretrain/Step Time": 17.639013849198818} +{"Full-pretrain/Learning Rate": 5.864388659869823e-07, "Full-pretrain/Loss": 1.8617422580718994, "Full-pretrain/Loss (Raw)": 1.942006230354309, "Full-pretrain/Step": 8897, "Full-pretrain/Step Time": 17.64047622308135} +{"Full-pretrain/Learning Rate": 5.846119945708578e-07, "Full-pretrain/Loss": 1.8632601499557495, "Full-pretrain/Loss (Raw)": 1.7984217405319214, "Full-pretrain/Step": 8898, "Full-pretrain/Step Time": 17.641335554420948} +{"Full-pretrain/Learning Rate": 5.827879394611574e-07, "Full-pretrain/Loss": 1.8511817455291748, "Full-pretrain/Loss (Raw)": 1.621935486793518, "Full-pretrain/Step": 8899, "Full-pretrain/Step Time": 17.64143257960677} +{"Full-pretrain/Learning Rate": 5.80966700868285e-07, "Full-pretrain/Loss": 1.8521677255630493, "Full-pretrain/Loss (Raw)": 2.0381600856781006, "Full-pretrain/Step": 8900, "Full-pretrain/Step Time": 17.63755325973034} +{"Full-pretrain/Learning Rate": 5.791482790023256e-07, "Full-pretrain/Loss": 1.8581349849700928, "Full-pretrain/Loss (Raw)": 1.8996163606643677, "Full-pretrain/Step": 8901, "Full-pretrain/Step Time": 17.638360423967242} +{"Full-pretrain/Learning Rate": 5.773326740730306e-07, "Full-pretrain/Loss": 1.872022032737732, "Full-pretrain/Loss (Raw)": 2.021615505218506, "Full-pretrain/Step": 8902, "Full-pretrain/Step Time": 17.63693891093135} +{"Full-pretrain/Learning Rate": 5.75519886289827e-07, "Full-pretrain/Loss": 1.8707714080810547, "Full-pretrain/Loss (Raw)": 1.844421625137329, "Full-pretrain/Step": 8903, "Full-pretrain/Step Time": 17.63474960811436} +{"Full-pretrain/Learning Rate": 5.737099158618225e-07, "Full-pretrain/Loss": 1.8633415699005127, "Full-pretrain/Loss (Raw)": 1.9289650917053223, "Full-pretrain/Step": 8904, "Full-pretrain/Step Time": 17.640683671459556} +{"Full-pretrain/Learning Rate": 5.719027629977947e-07, "Full-pretrain/Loss": 1.8668739795684814, "Full-pretrain/Loss (Raw)": 1.8655779361724854, "Full-pretrain/Step": 8905, "Full-pretrain/Step Time": 17.637305604293942} +{"Full-pretrain/Learning Rate": 5.700984279061988e-07, "Full-pretrain/Loss": 1.8745476007461548, "Full-pretrain/Loss (Raw)": 1.8598384857177734, "Full-pretrain/Step": 8906, "Full-pretrain/Step Time": 17.633728720247746} +{"Full-pretrain/Learning Rate": 5.68296910795163e-07, "Full-pretrain/Loss": 1.8816711902618408, "Full-pretrain/Loss (Raw)": 2.0741727352142334, "Full-pretrain/Step": 8907, "Full-pretrain/Step Time": 17.634004190564156} +{"Full-pretrain/Learning Rate": 5.664982118724932e-07, "Full-pretrain/Loss": 1.8947832584381104, "Full-pretrain/Loss (Raw)": 1.9195913076400757, "Full-pretrain/Step": 8908, "Full-pretrain/Step Time": 17.63914304971695} +{"Full-pretrain/Learning Rate": 5.647023313456706e-07, "Full-pretrain/Loss": 1.8958183526992798, "Full-pretrain/Loss (Raw)": 1.8690516948699951, "Full-pretrain/Step": 8909, "Full-pretrain/Step Time": 17.63912831246853} +{"Full-pretrain/Learning Rate": 5.629092694218435e-07, "Full-pretrain/Loss": 1.8898205757141113, "Full-pretrain/Loss (Raw)": 1.907687783241272, "Full-pretrain/Step": 8910, "Full-pretrain/Step Time": 17.637834472581744} +{"Full-pretrain/Learning Rate": 5.611190263078464e-07, "Full-pretrain/Loss": 1.8932229280471802, "Full-pretrain/Loss (Raw)": 2.0787668228149414, "Full-pretrain/Step": 8911, "Full-pretrain/Step Time": 17.638763189315796} +{"Full-pretrain/Learning Rate": 5.593316022101779e-07, "Full-pretrain/Loss": 1.890524983406067, "Full-pretrain/Loss (Raw)": 1.992769718170166, "Full-pretrain/Step": 8912, "Full-pretrain/Step Time": 17.63204364851117} +{"Full-pretrain/Learning Rate": 5.575469973350262e-07, "Full-pretrain/Loss": 1.8868541717529297, "Full-pretrain/Loss (Raw)": 1.9677760601043701, "Full-pretrain/Step": 8913, "Full-pretrain/Step Time": 17.638711219653487} +{"Full-pretrain/Learning Rate": 5.557652118882345e-07, "Full-pretrain/Loss": 1.883798599243164, "Full-pretrain/Loss (Raw)": 1.8776836395263672, "Full-pretrain/Step": 8914, "Full-pretrain/Step Time": 17.63510972261429} +{"Full-pretrain/Learning Rate": 5.539862460753331e-07, "Full-pretrain/Loss": 1.887915849685669, "Full-pretrain/Loss (Raw)": 1.864179253578186, "Full-pretrain/Step": 8915, "Full-pretrain/Step Time": 17.630576675757766} +{"Full-pretrain/Learning Rate": 5.522101001015301e-07, "Full-pretrain/Loss": 1.8881549835205078, "Full-pretrain/Loss (Raw)": 2.2179346084594727, "Full-pretrain/Step": 8916, "Full-pretrain/Step Time": 17.628777410835028} +{"Full-pretrain/Learning Rate": 5.504367741717004e-07, "Full-pretrain/Loss": 1.8799149990081787, "Full-pretrain/Loss (Raw)": 1.780720591545105, "Full-pretrain/Step": 8917, "Full-pretrain/Step Time": 17.63675880432129} +{"Full-pretrain/Learning Rate": 5.48666268490397e-07, "Full-pretrain/Loss": 1.8961141109466553, "Full-pretrain/Loss (Raw)": 2.0625619888305664, "Full-pretrain/Step": 8918, "Full-pretrain/Step Time": 17.636346392333508} +{"Full-pretrain/Learning Rate": 5.468985832618456e-07, "Full-pretrain/Loss": 1.8876301050186157, "Full-pretrain/Loss (Raw)": 1.8653192520141602, "Full-pretrain/Step": 8919, "Full-pretrain/Step Time": 17.63648896291852} +{"Full-pretrain/Learning Rate": 5.451337186899496e-07, "Full-pretrain/Loss": 1.8936357498168945, "Full-pretrain/Loss (Raw)": 1.994431495666504, "Full-pretrain/Step": 8920, "Full-pretrain/Step Time": 17.636314038187265} +{"Full-pretrain/Learning Rate": 5.433716749782853e-07, "Full-pretrain/Loss": 1.9000141620635986, "Full-pretrain/Loss (Raw)": 2.0677552223205566, "Full-pretrain/Step": 8921, "Full-pretrain/Step Time": 17.62921069562435} +{"Full-pretrain/Learning Rate": 5.416124523301036e-07, "Full-pretrain/Loss": 1.907420039176941, "Full-pretrain/Loss (Raw)": 1.861595869064331, "Full-pretrain/Step": 8922, "Full-pretrain/Step Time": 17.636935280635953} +{"Full-pretrain/Learning Rate": 5.398560509483313e-07, "Full-pretrain/Loss": 1.906153917312622, "Full-pretrain/Loss (Raw)": 1.7085095643997192, "Full-pretrain/Step": 8923, "Full-pretrain/Step Time": 17.631884833797812} +{"Full-pretrain/Learning Rate": 5.381024710355675e-07, "Full-pretrain/Loss": 1.9133288860321045, "Full-pretrain/Loss (Raw)": 2.049487590789795, "Full-pretrain/Step": 8924, "Full-pretrain/Step Time": 17.634873704984784} +{"Full-pretrain/Learning Rate": 5.363517127940864e-07, "Full-pretrain/Loss": 1.9195985794067383, "Full-pretrain/Loss (Raw)": 1.6640342473983765, "Full-pretrain/Step": 8925, "Full-pretrain/Step Time": 17.621014347299933} +{"Full-pretrain/Learning Rate": 5.346037764258377e-07, "Full-pretrain/Loss": 1.9080753326416016, "Full-pretrain/Loss (Raw)": 1.70075261592865, "Full-pretrain/Step": 8926, "Full-pretrain/Step Time": 17.628990679979324} +{"Full-pretrain/Learning Rate": 5.328586621324461e-07, "Full-pretrain/Loss": 1.9155861139297485, "Full-pretrain/Loss (Raw)": 1.975104570388794, "Full-pretrain/Step": 8927, "Full-pretrain/Step Time": 17.6315997838974} +{"Full-pretrain/Learning Rate": 5.311163701152088e-07, "Full-pretrain/Loss": 1.9198845624923706, "Full-pretrain/Loss (Raw)": 2.115861177444458, "Full-pretrain/Step": 8928, "Full-pretrain/Step Time": 17.631947696208954} +{"Full-pretrain/Learning Rate": 5.293769005751015e-07, "Full-pretrain/Loss": 1.907510757446289, "Full-pretrain/Loss (Raw)": 1.5460460186004639, "Full-pretrain/Step": 8929, "Full-pretrain/Step Time": 17.631973896175623} +{"Full-pretrain/Learning Rate": 5.276402537127662e-07, "Full-pretrain/Loss": 1.9121625423431396, "Full-pretrain/Loss (Raw)": 1.947274088859558, "Full-pretrain/Step": 8930, "Full-pretrain/Step Time": 17.63739399239421} +{"Full-pretrain/Learning Rate": 5.259064297285287e-07, "Full-pretrain/Loss": 1.918521523475647, "Full-pretrain/Loss (Raw)": 1.825424313545227, "Full-pretrain/Step": 8931, "Full-pretrain/Step Time": 17.6417157612741} +{"Full-pretrain/Learning Rate": 5.241754288223822e-07, "Full-pretrain/Loss": 1.9102532863616943, "Full-pretrain/Loss (Raw)": 1.773578405380249, "Full-pretrain/Step": 8932, "Full-pretrain/Step Time": 17.639782525599003} +{"Full-pretrain/Learning Rate": 5.224472511939998e-07, "Full-pretrain/Loss": 1.9081332683563232, "Full-pretrain/Loss (Raw)": 1.8317762613296509, "Full-pretrain/Step": 8933, "Full-pretrain/Step Time": 17.639523623511195} +{"Full-pretrain/Learning Rate": 5.207218970427253e-07, "Full-pretrain/Loss": 1.9045684337615967, "Full-pretrain/Loss (Raw)": 1.90753972530365, "Full-pretrain/Step": 8934, "Full-pretrain/Step Time": 17.64198857359588} +{"Full-pretrain/Learning Rate": 5.189993665675768e-07, "Full-pretrain/Loss": 1.9055578708648682, "Full-pretrain/Loss (Raw)": 1.876081109046936, "Full-pretrain/Step": 8935, "Full-pretrain/Step Time": 17.636081295087934} +{"Full-pretrain/Learning Rate": 5.172796599672485e-07, "Full-pretrain/Loss": 1.908219337463379, "Full-pretrain/Loss (Raw)": 2.0141355991363525, "Full-pretrain/Step": 8936, "Full-pretrain/Step Time": 17.635068219155073} +{"Full-pretrain/Learning Rate": 5.155627774401067e-07, "Full-pretrain/Loss": 1.9183087348937988, "Full-pretrain/Loss (Raw)": 2.1884374618530273, "Full-pretrain/Step": 8937, "Full-pretrain/Step Time": 17.635950945317745} +{"Full-pretrain/Learning Rate": 5.138487191841956e-07, "Full-pretrain/Loss": 1.918966293334961, "Full-pretrain/Loss (Raw)": 1.8808820247650146, "Full-pretrain/Step": 8938, "Full-pretrain/Step Time": 17.630195973441005} +{"Full-pretrain/Learning Rate": 5.121374853972294e-07, "Full-pretrain/Loss": 1.9111874103546143, "Full-pretrain/Loss (Raw)": 1.8252482414245605, "Full-pretrain/Step": 8939, "Full-pretrain/Step Time": 17.63190477900207} +{"Full-pretrain/Learning Rate": 5.104290762766001e-07, "Full-pretrain/Loss": 1.9115376472473145, "Full-pretrain/Loss (Raw)": 1.930796504020691, "Full-pretrain/Step": 8940, "Full-pretrain/Step Time": 17.62934349104762} +{"Full-pretrain/Learning Rate": 5.087234920193668e-07, "Full-pretrain/Loss": 1.9080431461334229, "Full-pretrain/Loss (Raw)": 1.7572290897369385, "Full-pretrain/Step": 8941, "Full-pretrain/Step Time": 17.634848637506366} +{"Full-pretrain/Learning Rate": 5.070207328222748e-07, "Full-pretrain/Loss": 1.9148306846618652, "Full-pretrain/Loss (Raw)": 2.1248903274536133, "Full-pretrain/Step": 8942, "Full-pretrain/Step Time": 17.63540001027286} +{"Full-pretrain/Learning Rate": 5.053207988817338e-07, "Full-pretrain/Loss": 1.9067354202270508, "Full-pretrain/Loss (Raw)": 1.8197154998779297, "Full-pretrain/Step": 8943, "Full-pretrain/Step Time": 17.63485903479159} +{"Full-pretrain/Learning Rate": 5.036236903938285e-07, "Full-pretrain/Loss": 1.9009745121002197, "Full-pretrain/Loss (Raw)": 1.8084205389022827, "Full-pretrain/Step": 8944, "Full-pretrain/Step Time": 17.635268341749907} +{"Full-pretrain/Learning Rate": 5.019294075543246e-07, "Full-pretrain/Loss": 1.907921314239502, "Full-pretrain/Loss (Raw)": 2.1900739669799805, "Full-pretrain/Step": 8945, "Full-pretrain/Step Time": 17.628298077732325} +{"Full-pretrain/Learning Rate": 5.002379505586518e-07, "Full-pretrain/Loss": 1.9127147197723389, "Full-pretrain/Loss (Raw)": 2.0310750007629395, "Full-pretrain/Step": 8946, "Full-pretrain/Step Time": 17.630979131907225} +{"Full-pretrain/Learning Rate": 4.985493196019237e-07, "Full-pretrain/Loss": 1.9164960384368896, "Full-pretrain/Loss (Raw)": 1.9851797819137573, "Full-pretrain/Step": 8947, "Full-pretrain/Step Time": 17.631287522614002} +{"Full-pretrain/Learning Rate": 4.968635148789174e-07, "Full-pretrain/Loss": 1.9094306230545044, "Full-pretrain/Loss (Raw)": 1.9918389320373535, "Full-pretrain/Step": 8948, "Full-pretrain/Step Time": 17.629789074882865} +{"Full-pretrain/Learning Rate": 4.951805365840972e-07, "Full-pretrain/Loss": 1.9051270484924316, "Full-pretrain/Loss (Raw)": 1.6430094242095947, "Full-pretrain/Step": 8949, "Full-pretrain/Step Time": 17.625263992697} +{"Full-pretrain/Learning Rate": 4.93500384911591e-07, "Full-pretrain/Loss": 1.9047636985778809, "Full-pretrain/Loss (Raw)": 2.050934076309204, "Full-pretrain/Step": 8950, "Full-pretrain/Step Time": 17.620763316750526} +{"Full-pretrain/Learning Rate": 4.918230600552021e-07, "Full-pretrain/Loss": 1.9142930507659912, "Full-pretrain/Loss (Raw)": 2.1702592372894287, "Full-pretrain/Step": 8951, "Full-pretrain/Step Time": 17.620645763352513} +{"Full-pretrain/Learning Rate": 4.90148562208409e-07, "Full-pretrain/Loss": 1.9048027992248535, "Full-pretrain/Loss (Raw)": 1.6907426118850708, "Full-pretrain/Step": 8952, "Full-pretrain/Step Time": 17.62125893495977} +{"Full-pretrain/Learning Rate": 4.884768915643657e-07, "Full-pretrain/Loss": 1.8986623287200928, "Full-pretrain/Loss (Raw)": 1.8712619543075562, "Full-pretrain/Step": 8953, "Full-pretrain/Step Time": 17.611009452492} +{"Full-pretrain/Learning Rate": 4.86808048315901e-07, "Full-pretrain/Loss": 1.8965094089508057, "Full-pretrain/Loss (Raw)": 1.7927032709121704, "Full-pretrain/Step": 8954, "Full-pretrain/Step Time": 17.612012200057507} +{"Full-pretrain/Learning Rate": 4.85142032655514e-07, "Full-pretrain/Loss": 1.8965098857879639, "Full-pretrain/Loss (Raw)": 1.7085258960723877, "Full-pretrain/Step": 8955, "Full-pretrain/Step Time": 17.61547694541514} +{"Full-pretrain/Learning Rate": 4.834788447753758e-07, "Full-pretrain/Loss": 1.8953615427017212, "Full-pretrain/Loss (Raw)": 2.01273775100708, "Full-pretrain/Step": 8956, "Full-pretrain/Step Time": 17.61692035011947} +{"Full-pretrain/Learning Rate": 4.818184848673385e-07, "Full-pretrain/Loss": 1.9021985530853271, "Full-pretrain/Loss (Raw)": 1.8828188180923462, "Full-pretrain/Step": 8957, "Full-pretrain/Step Time": 17.61185951344669} +{"Full-pretrain/Learning Rate": 4.80160953122924e-07, "Full-pretrain/Loss": 1.9028546810150146, "Full-pretrain/Loss (Raw)": 1.7217497825622559, "Full-pretrain/Step": 8958, "Full-pretrain/Step Time": 17.61057599261403} +{"Full-pretrain/Learning Rate": 4.785062497333265e-07, "Full-pretrain/Loss": 1.9013566970825195, "Full-pretrain/Loss (Raw)": 1.9271653890609741, "Full-pretrain/Step": 8959, "Full-pretrain/Step Time": 17.60813700594008} +{"Full-pretrain/Learning Rate": 4.768543748894155e-07, "Full-pretrain/Loss": 1.882663607597351, "Full-pretrain/Loss (Raw)": 1.517685055732727, "Full-pretrain/Step": 8960, "Full-pretrain/Step Time": 17.61634059995413} +{"Full-pretrain/Learning Rate": 4.752053287817332e-07, "Full-pretrain/Loss": 1.8955968618392944, "Full-pretrain/Loss (Raw)": 1.959909200668335, "Full-pretrain/Step": 8961, "Full-pretrain/Step Time": 17.615850791335106} +{"Full-pretrain/Learning Rate": 4.735591116004967e-07, "Full-pretrain/Loss": 1.9010000228881836, "Full-pretrain/Loss (Raw)": 2.120175838470459, "Full-pretrain/Step": 8962, "Full-pretrain/Step Time": 17.61023516766727} +{"Full-pretrain/Learning Rate": 4.719157235355959e-07, "Full-pretrain/Loss": 1.9005486965179443, "Full-pretrain/Loss (Raw)": 1.8109841346740723, "Full-pretrain/Step": 8963, "Full-pretrain/Step Time": 17.612382367253304} +{"Full-pretrain/Learning Rate": 4.702751647765985e-07, "Full-pretrain/Loss": 1.9128016233444214, "Full-pretrain/Loss (Raw)": 2.165670394897461, "Full-pretrain/Step": 8964, "Full-pretrain/Step Time": 17.61564858071506} +{"Full-pretrain/Learning Rate": 4.686374355127421e-07, "Full-pretrain/Loss": 1.920910120010376, "Full-pretrain/Loss (Raw)": 2.091249465942383, "Full-pretrain/Step": 8965, "Full-pretrain/Step Time": 17.610445706173778} +{"Full-pretrain/Learning Rate": 4.670025359329366e-07, "Full-pretrain/Loss": 1.9127578735351562, "Full-pretrain/Loss (Raw)": 1.6466643810272217, "Full-pretrain/Step": 8966, "Full-pretrain/Step Time": 17.599449371919036} +{"Full-pretrain/Learning Rate": 4.653704662257674e-07, "Full-pretrain/Loss": 1.914384365081787, "Full-pretrain/Loss (Raw)": 1.9281325340270996, "Full-pretrain/Step": 8967, "Full-pretrain/Step Time": 17.598441882058978} +{"Full-pretrain/Learning Rate": 4.637412265794894e-07, "Full-pretrain/Loss": 1.9153584241867065, "Full-pretrain/Loss (Raw)": 2.0453033447265625, "Full-pretrain/Step": 8968, "Full-pretrain/Step Time": 17.603264974430203} +{"Full-pretrain/Learning Rate": 4.621148171820411e-07, "Full-pretrain/Loss": 1.9108999967575073, "Full-pretrain/Loss (Raw)": 2.0457682609558105, "Full-pretrain/Step": 8969, "Full-pretrain/Step Time": 17.600931372493505} +{"Full-pretrain/Learning Rate": 4.6049123822102245e-07, "Full-pretrain/Loss": 1.915932536125183, "Full-pretrain/Loss (Raw)": 2.041921615600586, "Full-pretrain/Step": 8970, "Full-pretrain/Step Time": 17.599398851394653} +{"Full-pretrain/Learning Rate": 4.5887048988371986e-07, "Full-pretrain/Loss": 1.915324091911316, "Full-pretrain/Loss (Raw)": 1.805777668952942, "Full-pretrain/Step": 8971, "Full-pretrain/Step Time": 17.596846824511886} +{"Full-pretrain/Learning Rate": 4.572525723570809e-07, "Full-pretrain/Loss": 1.9233856201171875, "Full-pretrain/Loss (Raw)": 2.188765048980713, "Full-pretrain/Step": 8972, "Full-pretrain/Step Time": 17.600832030177116} +{"Full-pretrain/Learning Rate": 4.5563748582773124e-07, "Full-pretrain/Loss": 1.9275389909744263, "Full-pretrain/Loss (Raw)": 1.8901386260986328, "Full-pretrain/Step": 8973, "Full-pretrain/Step Time": 17.602295078337193} +{"Full-pretrain/Learning Rate": 4.540252304819748e-07, "Full-pretrain/Loss": 1.9197627305984497, "Full-pretrain/Loss (Raw)": 1.8760476112365723, "Full-pretrain/Step": 8974, "Full-pretrain/Step Time": 17.603429978713393} +{"Full-pretrain/Learning Rate": 4.524158065057793e-07, "Full-pretrain/Loss": 1.920273780822754, "Full-pretrain/Loss (Raw)": 1.836069941520691, "Full-pretrain/Step": 8975, "Full-pretrain/Step Time": 17.600315058603883} +{"Full-pretrain/Learning Rate": 4.508092140847936e-07, "Full-pretrain/Loss": 1.9381005764007568, "Full-pretrain/Loss (Raw)": 2.378877639770508, "Full-pretrain/Step": 8976, "Full-pretrain/Step Time": 17.597463715821505} +{"Full-pretrain/Learning Rate": 4.4920545340433886e-07, "Full-pretrain/Loss": 1.9313201904296875, "Full-pretrain/Loss (Raw)": 1.9731035232543945, "Full-pretrain/Step": 8977, "Full-pretrain/Step Time": 17.599858935922384} +{"Full-pretrain/Learning Rate": 4.4760452464940874e-07, "Full-pretrain/Loss": 1.925276279449463, "Full-pretrain/Loss (Raw)": 1.8376675844192505, "Full-pretrain/Step": 8978, "Full-pretrain/Step Time": 17.599982023239136} +{"Full-pretrain/Learning Rate": 4.4600642800466664e-07, "Full-pretrain/Loss": 1.9291554689407349, "Full-pretrain/Loss (Raw)": 2.1093173027038574, "Full-pretrain/Step": 8979, "Full-pretrain/Step Time": 17.59827812574804} +{"Full-pretrain/Learning Rate": 4.4441116365445125e-07, "Full-pretrain/Loss": 1.923830509185791, "Full-pretrain/Loss (Raw)": 1.8214411735534668, "Full-pretrain/Step": 8980, "Full-pretrain/Step Time": 17.602753348648548} +{"Full-pretrain/Learning Rate": 4.4281873178278475e-07, "Full-pretrain/Loss": 1.936159372329712, "Full-pretrain/Loss (Raw)": 2.0375306606292725, "Full-pretrain/Step": 8981, "Full-pretrain/Step Time": 17.598496278747916} +{"Full-pretrain/Learning Rate": 4.412291325733453e-07, "Full-pretrain/Loss": 1.9375553131103516, "Full-pretrain/Loss (Raw)": 2.09560489654541, "Full-pretrain/Step": 8982, "Full-pretrain/Step Time": 17.60187539458275} +{"Full-pretrain/Learning Rate": 4.3964236620949173e-07, "Full-pretrain/Loss": 1.9320179224014282, "Full-pretrain/Loss (Raw)": 1.9930634498596191, "Full-pretrain/Step": 8983, "Full-pretrain/Step Time": 17.602144852280617} +{"Full-pretrain/Learning Rate": 4.3805843287426376e-07, "Full-pretrain/Loss": 1.9328162670135498, "Full-pretrain/Loss (Raw)": 1.716288447380066, "Full-pretrain/Step": 8984, "Full-pretrain/Step Time": 17.604253977537155} +{"Full-pretrain/Learning Rate": 4.364773327503624e-07, "Full-pretrain/Loss": 1.9355813264846802, "Full-pretrain/Loss (Raw)": 1.9597442150115967, "Full-pretrain/Step": 8985, "Full-pretrain/Step Time": 17.59985239058733} +{"Full-pretrain/Learning Rate": 4.3489906602016686e-07, "Full-pretrain/Loss": 1.9340746402740479, "Full-pretrain/Loss (Raw)": 1.744490623474121, "Full-pretrain/Step": 8986, "Full-pretrain/Step Time": 17.599326822906733} +{"Full-pretrain/Learning Rate": 4.333236328657342e-07, "Full-pretrain/Loss": 1.9390349388122559, "Full-pretrain/Loss (Raw)": 1.867255449295044, "Full-pretrain/Step": 8987, "Full-pretrain/Step Time": 17.592327125370502} +{"Full-pretrain/Learning Rate": 4.3175103346878575e-07, "Full-pretrain/Loss": 1.938405156135559, "Full-pretrain/Loss (Raw)": 1.992581844329834, "Full-pretrain/Step": 8988, "Full-pretrain/Step Time": 17.598306335508823} +{"Full-pretrain/Learning Rate": 4.301812680107209e-07, "Full-pretrain/Loss": 1.9326835870742798, "Full-pretrain/Loss (Raw)": 1.6997284889221191, "Full-pretrain/Step": 8989, "Full-pretrain/Step Time": 17.597024163231254} +{"Full-pretrain/Learning Rate": 4.286143366726142e-07, "Full-pretrain/Loss": 1.938018798828125, "Full-pretrain/Loss (Raw)": 1.8924775123596191, "Full-pretrain/Step": 8990, "Full-pretrain/Step Time": 17.592977499589324} +{"Full-pretrain/Learning Rate": 4.2705023963520993e-07, "Full-pretrain/Loss": 1.942291498184204, "Full-pretrain/Loss (Raw)": 2.063892364501953, "Full-pretrain/Step": 8991, "Full-pretrain/Step Time": 17.588588766753674} +{"Full-pretrain/Learning Rate": 4.254889770789222e-07, "Full-pretrain/Loss": 1.955592155456543, "Full-pretrain/Loss (Raw)": 1.943303108215332, "Full-pretrain/Step": 8992, "Full-pretrain/Step Time": 17.59491748176515} +{"Full-pretrain/Learning Rate": 4.2393054918384855e-07, "Full-pretrain/Loss": 1.9541847705841064, "Full-pretrain/Loss (Raw)": 1.914874792098999, "Full-pretrain/Step": 8993, "Full-pretrain/Step Time": 17.591774854809046} +{"Full-pretrain/Learning Rate": 4.223749561297452e-07, "Full-pretrain/Loss": 1.9436430931091309, "Full-pretrain/Loss (Raw)": 1.7828434705734253, "Full-pretrain/Step": 8994, "Full-pretrain/Step Time": 17.594197442755103} +{"Full-pretrain/Learning Rate": 4.208221980960547e-07, "Full-pretrain/Loss": 1.9442545175552368, "Full-pretrain/Loss (Raw)": 1.8305493593215942, "Full-pretrain/Step": 8995, "Full-pretrain/Step Time": 17.589941600337625} +{"Full-pretrain/Learning Rate": 4.192722752618866e-07, "Full-pretrain/Loss": 1.9396172761917114, "Full-pretrain/Loss (Raw)": 2.0172760486602783, "Full-pretrain/Step": 8996, "Full-pretrain/Step Time": 17.589725092053413} +{"Full-pretrain/Learning Rate": 4.177251878060229e-07, "Full-pretrain/Loss": 1.927216649055481, "Full-pretrain/Loss (Raw)": 1.6944319009780884, "Full-pretrain/Step": 8997, "Full-pretrain/Step Time": 17.59944692440331} +{"Full-pretrain/Learning Rate": 4.1618093590692073e-07, "Full-pretrain/Loss": 1.93741774559021, "Full-pretrain/Loss (Raw)": 1.9730961322784424, "Full-pretrain/Step": 8998, "Full-pretrain/Step Time": 17.59408071450889} +{"Full-pretrain/Learning Rate": 4.146395197427072e-07, "Full-pretrain/Loss": 1.9399125576019287, "Full-pretrain/Loss (Raw)": 2.0079703330993652, "Full-pretrain/Step": 8999, "Full-pretrain/Step Time": 17.590241027995944} +{"Full-pretrain/Learning Rate": 4.1310093949118443e-07, "Full-pretrain/Loss": 1.934565782546997, "Full-pretrain/Loss (Raw)": 1.8742055892944336, "Full-pretrain/Step": 9000, "Full-pretrain/Step Time": 17.59084495343268} +{"Full-pretrain/Learning Rate": 4.115651953298272e-07, "Full-pretrain/Loss": 1.93497896194458, "Full-pretrain/Loss (Raw)": 2.058990955352783, "Full-pretrain/Step": 9001, "Full-pretrain/Step Time": 17.59659610129893} +{"Full-pretrain/Learning Rate": 4.1003228743578814e-07, "Full-pretrain/Loss": 1.936437964439392, "Full-pretrain/Loss (Raw)": 2.0886080265045166, "Full-pretrain/Step": 9002, "Full-pretrain/Step Time": 17.593285888433456} +{"Full-pretrain/Learning Rate": 4.0850221598587867e-07, "Full-pretrain/Loss": 1.9405487775802612, "Full-pretrain/Loss (Raw)": 1.9373254776000977, "Full-pretrain/Step": 9003, "Full-pretrain/Step Time": 17.588721027597785} +{"Full-pretrain/Learning Rate": 4.069749811565965e-07, "Full-pretrain/Loss": 1.9357692003250122, "Full-pretrain/Loss (Raw)": 2.035818099975586, "Full-pretrain/Step": 9004, "Full-pretrain/Step Time": 17.589129338040948} +{"Full-pretrain/Learning Rate": 4.05450583124109e-07, "Full-pretrain/Loss": 1.9418326616287231, "Full-pretrain/Loss (Raw)": 2.084170341491699, "Full-pretrain/Step": 9005, "Full-pretrain/Step Time": 17.591086268424988} +{"Full-pretrain/Learning Rate": 4.039290220642533e-07, "Full-pretrain/Loss": 1.9411089420318604, "Full-pretrain/Loss (Raw)": 1.8528859615325928, "Full-pretrain/Step": 9006, "Full-pretrain/Step Time": 17.58711234666407} +{"Full-pretrain/Learning Rate": 4.024102981525446e-07, "Full-pretrain/Loss": 1.9544838666915894, "Full-pretrain/Loss (Raw)": 2.2640695571899414, "Full-pretrain/Step": 9007, "Full-pretrain/Step Time": 17.584784135222435} +{"Full-pretrain/Learning Rate": 4.008944115641594e-07, "Full-pretrain/Loss": 1.936328411102295, "Full-pretrain/Loss (Raw)": 1.797900915145874, "Full-pretrain/Step": 9008, "Full-pretrain/Step Time": 17.59061286598444} +{"Full-pretrain/Learning Rate": 3.993813624739634e-07, "Full-pretrain/Loss": 1.941413402557373, "Full-pretrain/Loss (Raw)": 2.1358256340026855, "Full-pretrain/Step": 9009, "Full-pretrain/Step Time": 17.59452079795301} +{"Full-pretrain/Learning Rate": 3.978711510564781e-07, "Full-pretrain/Loss": 1.9454779624938965, "Full-pretrain/Loss (Raw)": 1.967734456062317, "Full-pretrain/Step": 9010, "Full-pretrain/Step Time": 17.595080627128482} +{"Full-pretrain/Learning Rate": 3.963637774859114e-07, "Full-pretrain/Loss": 1.9307663440704346, "Full-pretrain/Loss (Raw)": 1.638543725013733, "Full-pretrain/Step": 9011, "Full-pretrain/Step Time": 17.589379576966166} +{"Full-pretrain/Learning Rate": 3.9485924193613523e-07, "Full-pretrain/Loss": 1.9271284341812134, "Full-pretrain/Loss (Raw)": 1.7050286531448364, "Full-pretrain/Step": 9012, "Full-pretrain/Step Time": 17.592773739248514} +{"Full-pretrain/Learning Rate": 3.933575445807025e-07, "Full-pretrain/Loss": 1.9213080406188965, "Full-pretrain/Loss (Raw)": 1.8512760400772095, "Full-pretrain/Step": 9013, "Full-pretrain/Step Time": 17.590304259210825} +{"Full-pretrain/Learning Rate": 3.9185868559282466e-07, "Full-pretrain/Loss": 1.9160935878753662, "Full-pretrain/Loss (Raw)": 1.9287431240081787, "Full-pretrain/Step": 9014, "Full-pretrain/Step Time": 17.589750315994024} +{"Full-pretrain/Learning Rate": 3.903626651454023e-07, "Full-pretrain/Loss": 1.9144946336746216, "Full-pretrain/Loss (Raw)": 1.9418973922729492, "Full-pretrain/Step": 9015, "Full-pretrain/Step Time": 17.59833275154233} +{"Full-pretrain/Learning Rate": 3.8886948341099737e-07, "Full-pretrain/Loss": 1.9162869453430176, "Full-pretrain/Loss (Raw)": 1.7736455202102661, "Full-pretrain/Step": 9016, "Full-pretrain/Step Time": 17.60195992514491} +{"Full-pretrain/Learning Rate": 3.873791405618471e-07, "Full-pretrain/Loss": 1.9239635467529297, "Full-pretrain/Loss (Raw)": 2.205393075942993, "Full-pretrain/Step": 9017, "Full-pretrain/Step Time": 17.603055940940976} +{"Full-pretrain/Learning Rate": 3.8589163676986674e-07, "Full-pretrain/Loss": 1.9139543771743774, "Full-pretrain/Loss (Raw)": 1.4241979122161865, "Full-pretrain/Step": 9018, "Full-pretrain/Step Time": 17.603363294154406} +{"Full-pretrain/Learning Rate": 3.844069722066329e-07, "Full-pretrain/Loss": 1.9132354259490967, "Full-pretrain/Loss (Raw)": 1.8442484140396118, "Full-pretrain/Step": 9019, "Full-pretrain/Step Time": 17.599052948877215} +{"Full-pretrain/Learning Rate": 3.8292514704340586e-07, "Full-pretrain/Loss": 1.9153411388397217, "Full-pretrain/Loss (Raw)": 2.0599660873413086, "Full-pretrain/Step": 9020, "Full-pretrain/Step Time": 17.59771317243576} +{"Full-pretrain/Learning Rate": 3.8144616145111277e-07, "Full-pretrain/Loss": 1.9273544549942017, "Full-pretrain/Loss (Raw)": 2.0841517448425293, "Full-pretrain/Step": 9021, "Full-pretrain/Step Time": 17.5970600489527} +{"Full-pretrain/Learning Rate": 3.799700156003505e-07, "Full-pretrain/Loss": 1.9133498668670654, "Full-pretrain/Loss (Raw)": 1.444329857826233, "Full-pretrain/Step": 9022, "Full-pretrain/Step Time": 17.601512825116515} +{"Full-pretrain/Learning Rate": 3.784967096613995e-07, "Full-pretrain/Loss": 1.8987300395965576, "Full-pretrain/Loss (Raw)": 1.5960607528686523, "Full-pretrain/Step": 9023, "Full-pretrain/Step Time": 17.594147058203816} +{"Full-pretrain/Learning Rate": 3.7702624380419607e-07, "Full-pretrain/Loss": 1.9023077487945557, "Full-pretrain/Loss (Raw)": 2.0577878952026367, "Full-pretrain/Step": 9024, "Full-pretrain/Step Time": 17.59820356592536} +{"Full-pretrain/Learning Rate": 3.755586181983628e-07, "Full-pretrain/Loss": 1.899979591369629, "Full-pretrain/Loss (Raw)": 1.8403773307800293, "Full-pretrain/Step": 9025, "Full-pretrain/Step Time": 17.598617792129517} +{"Full-pretrain/Learning Rate": 3.7409383301319213e-07, "Full-pretrain/Loss": 1.9066210985183716, "Full-pretrain/Loss (Raw)": 1.9953703880310059, "Full-pretrain/Step": 9026, "Full-pretrain/Step Time": 17.600826289504766} +{"Full-pretrain/Learning Rate": 3.726318884176433e-07, "Full-pretrain/Loss": 1.9135884046554565, "Full-pretrain/Loss (Raw)": 2.0535011291503906, "Full-pretrain/Step": 9027, "Full-pretrain/Step Time": 17.605441980063915} +{"Full-pretrain/Learning Rate": 3.711727845803481e-07, "Full-pretrain/Loss": 1.9155762195587158, "Full-pretrain/Loss (Raw)": 2.0808849334716797, "Full-pretrain/Step": 9028, "Full-pretrain/Step Time": 17.60574841313064} +{"Full-pretrain/Learning Rate": 3.697165216696219e-07, "Full-pretrain/Loss": 1.9198780059814453, "Full-pretrain/Loss (Raw)": 1.8320887088775635, "Full-pretrain/Step": 9029, "Full-pretrain/Step Time": 17.60407537780702} +{"Full-pretrain/Learning Rate": 3.682630998534359e-07, "Full-pretrain/Loss": 1.9165725708007812, "Full-pretrain/Loss (Raw)": 1.867325782775879, "Full-pretrain/Step": 9030, "Full-pretrain/Step Time": 17.608022272586823} +{"Full-pretrain/Learning Rate": 3.668125192994448e-07, "Full-pretrain/Loss": 1.915246844291687, "Full-pretrain/Loss (Raw)": 1.9655470848083496, "Full-pretrain/Step": 9031, "Full-pretrain/Step Time": 17.61158712953329} +{"Full-pretrain/Learning Rate": 3.653647801749732e-07, "Full-pretrain/Loss": 1.9108996391296387, "Full-pretrain/Loss (Raw)": 1.735093355178833, "Full-pretrain/Step": 9032, "Full-pretrain/Step Time": 17.604892440140247} +{"Full-pretrain/Learning Rate": 3.63919882647018e-07, "Full-pretrain/Loss": 1.9010038375854492, "Full-pretrain/Loss (Raw)": 1.742323637008667, "Full-pretrain/Step": 9033, "Full-pretrain/Step Time": 17.608576081693172} +{"Full-pretrain/Learning Rate": 3.6247782688224596e-07, "Full-pretrain/Loss": 1.8962299823760986, "Full-pretrain/Loss (Raw)": 1.9358481168746948, "Full-pretrain/Step": 9034, "Full-pretrain/Step Time": 17.607543542981148} +{"Full-pretrain/Learning Rate": 3.6103861304699895e-07, "Full-pretrain/Loss": 1.8779211044311523, "Full-pretrain/Loss (Raw)": 1.3514440059661865, "Full-pretrain/Step": 9035, "Full-pretrain/Step Time": 17.60915474034846} +{"Full-pretrain/Learning Rate": 3.5960224130728857e-07, "Full-pretrain/Loss": 1.8781719207763672, "Full-pretrain/Loss (Raw)": 2.04384183883667, "Full-pretrain/Step": 9036, "Full-pretrain/Step Time": 17.61064667068422} +{"Full-pretrain/Learning Rate": 3.581687118287991e-07, "Full-pretrain/Loss": 1.871488094329834, "Full-pretrain/Loss (Raw)": 1.8702846765518188, "Full-pretrain/Step": 9037, "Full-pretrain/Step Time": 17.603675911203027} +{"Full-pretrain/Learning Rate": 3.5673802477689257e-07, "Full-pretrain/Loss": 1.8750383853912354, "Full-pretrain/Loss (Raw)": 1.9664958715438843, "Full-pretrain/Step": 9038, "Full-pretrain/Step Time": 17.60595159418881} +{"Full-pretrain/Learning Rate": 3.553101803165926e-07, "Full-pretrain/Loss": 1.8603804111480713, "Full-pretrain/Loss (Raw)": 1.7950127124786377, "Full-pretrain/Step": 9039, "Full-pretrain/Step Time": 17.608763387426734} +{"Full-pretrain/Learning Rate": 3.538851786126035e-07, "Full-pretrain/Loss": 1.8640401363372803, "Full-pretrain/Loss (Raw)": 1.9150161743164062, "Full-pretrain/Step": 9040, "Full-pretrain/Step Time": 17.613086519762874} +{"Full-pretrain/Learning Rate": 3.5246301982929387e-07, "Full-pretrain/Loss": 1.8697985410690308, "Full-pretrain/Loss (Raw)": 2.320091485977173, "Full-pretrain/Step": 9041, "Full-pretrain/Step Time": 17.60694227553904} +{"Full-pretrain/Learning Rate": 3.510437041307185e-07, "Full-pretrain/Loss": 1.8666268587112427, "Full-pretrain/Loss (Raw)": 1.8662431240081787, "Full-pretrain/Step": 9042, "Full-pretrain/Step Time": 17.607857063412666} +{"Full-pretrain/Learning Rate": 3.496272316805882e-07, "Full-pretrain/Loss": 1.8736027479171753, "Full-pretrain/Loss (Raw)": 1.8617701530456543, "Full-pretrain/Step": 9043, "Full-pretrain/Step Time": 17.607124725356698} +{"Full-pretrain/Learning Rate": 3.4821360264229165e-07, "Full-pretrain/Loss": 1.8758563995361328, "Full-pretrain/Loss (Raw)": 1.7771456241607666, "Full-pretrain/Step": 9044, "Full-pretrain/Step Time": 17.607558842748404} +{"Full-pretrain/Learning Rate": 3.4680281717889564e-07, "Full-pretrain/Loss": 1.8819032907485962, "Full-pretrain/Loss (Raw)": 2.0447778701782227, "Full-pretrain/Step": 9045, "Full-pretrain/Step Time": 17.598772685974836} +{"Full-pretrain/Learning Rate": 3.453948754531283e-07, "Full-pretrain/Loss": 1.87332022190094, "Full-pretrain/Loss (Raw)": 1.6540868282318115, "Full-pretrain/Step": 9046, "Full-pretrain/Step Time": 17.59722345881164} +{"Full-pretrain/Learning Rate": 3.439897776273987e-07, "Full-pretrain/Loss": 1.8739811182022095, "Full-pretrain/Loss (Raw)": 1.9630440473556519, "Full-pretrain/Step": 9047, "Full-pretrain/Step Time": 17.603303549811244} +{"Full-pretrain/Learning Rate": 3.4258752386378267e-07, "Full-pretrain/Loss": 1.8799998760223389, "Full-pretrain/Loss (Raw)": 1.9662449359893799, "Full-pretrain/Step": 9048, "Full-pretrain/Step Time": 17.606514623388648} +{"Full-pretrain/Learning Rate": 3.4118811432403144e-07, "Full-pretrain/Loss": 1.8719797134399414, "Full-pretrain/Loss (Raw)": 1.948746919631958, "Full-pretrain/Step": 9049, "Full-pretrain/Step Time": 17.608782729133964} +{"Full-pretrain/Learning Rate": 3.397915491695686e-07, "Full-pretrain/Loss": 1.8945446014404297, "Full-pretrain/Loss (Raw)": 2.1462795734405518, "Full-pretrain/Step": 9050, "Full-pretrain/Step Time": 17.60184731706977} +{"Full-pretrain/Learning Rate": 3.3839782856147916e-07, "Full-pretrain/Loss": 1.9067437648773193, "Full-pretrain/Loss (Raw)": 2.234619140625, "Full-pretrain/Step": 9051, "Full-pretrain/Step Time": 17.607596388086677} +{"Full-pretrain/Learning Rate": 3.370069526605374e-07, "Full-pretrain/Loss": 1.9051029682159424, "Full-pretrain/Loss (Raw)": 2.007462739944458, "Full-pretrain/Step": 9052, "Full-pretrain/Step Time": 17.608802003785968} +{"Full-pretrain/Learning Rate": 3.3561892162717325e-07, "Full-pretrain/Loss": 1.9024322032928467, "Full-pretrain/Loss (Raw)": 1.9986813068389893, "Full-pretrain/Step": 9053, "Full-pretrain/Step Time": 17.610608408227563} +{"Full-pretrain/Learning Rate": 3.342337356215003e-07, "Full-pretrain/Loss": 1.9183186292648315, "Full-pretrain/Loss (Raw)": 1.9526989459991455, "Full-pretrain/Step": 9054, "Full-pretrain/Step Time": 17.60711905360222} +{"Full-pretrain/Learning Rate": 3.328513948032991e-07, "Full-pretrain/Loss": 1.9179408550262451, "Full-pretrain/Loss (Raw)": 1.5839694738388062, "Full-pretrain/Step": 9055, "Full-pretrain/Step Time": 17.61002827435732} +{"Full-pretrain/Learning Rate": 3.314718993320198e-07, "Full-pretrain/Loss": 1.9139163494110107, "Full-pretrain/Loss (Raw)": 1.929005742073059, "Full-pretrain/Step": 9056, "Full-pretrain/Step Time": 17.605848021805286} +{"Full-pretrain/Learning Rate": 3.3009524936678527e-07, "Full-pretrain/Loss": 1.922669529914856, "Full-pretrain/Loss (Raw)": 2.1204802989959717, "Full-pretrain/Step": 9057, "Full-pretrain/Step Time": 17.605178870260715} +{"Full-pretrain/Learning Rate": 3.287214450663989e-07, "Full-pretrain/Loss": 1.9223469495773315, "Full-pretrain/Loss (Raw)": 1.9850473403930664, "Full-pretrain/Step": 9058, "Full-pretrain/Step Time": 17.60138166323304} +{"Full-pretrain/Learning Rate": 3.273504865893201e-07, "Full-pretrain/Loss": 1.9175174236297607, "Full-pretrain/Loss (Raw)": 1.8989564180374146, "Full-pretrain/Step": 9059, "Full-pretrain/Step Time": 17.60184988938272} +{"Full-pretrain/Learning Rate": 3.259823740936946e-07, "Full-pretrain/Loss": 1.905961036682129, "Full-pretrain/Loss (Raw)": 1.711079716682434, "Full-pretrain/Step": 9060, "Full-pretrain/Step Time": 17.598787834867835} +{"Full-pretrain/Learning Rate": 3.2461710773732947e-07, "Full-pretrain/Loss": 1.9127717018127441, "Full-pretrain/Loss (Raw)": 2.0500283241271973, "Full-pretrain/Step": 9061, "Full-pretrain/Step Time": 17.598583322018385} +{"Full-pretrain/Learning Rate": 3.2325468767770984e-07, "Full-pretrain/Loss": 1.9154211282730103, "Full-pretrain/Loss (Raw)": 1.9521082639694214, "Full-pretrain/Step": 9062, "Full-pretrain/Step Time": 17.592041596770287} +{"Full-pretrain/Learning Rate": 3.218951140719906e-07, "Full-pretrain/Loss": 1.9149458408355713, "Full-pretrain/Loss (Raw)": 1.9503365755081177, "Full-pretrain/Step": 9063, "Full-pretrain/Step Time": 17.59563886374235} +{"Full-pretrain/Learning Rate": 3.2053838707699626e-07, "Full-pretrain/Loss": 1.9134571552276611, "Full-pretrain/Loss (Raw)": 1.687459111213684, "Full-pretrain/Step": 9064, "Full-pretrain/Step Time": 17.597304401919246} +{"Full-pretrain/Learning Rate": 3.191845068492266e-07, "Full-pretrain/Loss": 1.9203391075134277, "Full-pretrain/Loss (Raw)": 1.9625463485717773, "Full-pretrain/Step": 9065, "Full-pretrain/Step Time": 17.59613304771483} +{"Full-pretrain/Learning Rate": 3.178334735448513e-07, "Full-pretrain/Loss": 1.9205623865127563, "Full-pretrain/Loss (Raw)": 1.9429916143417358, "Full-pretrain/Step": 9066, "Full-pretrain/Step Time": 17.595054326578975} +{"Full-pretrain/Learning Rate": 3.164852873197094e-07, "Full-pretrain/Loss": 1.9364948272705078, "Full-pretrain/Loss (Raw)": 1.8612830638885498, "Full-pretrain/Step": 9067, "Full-pretrain/Step Time": 17.595148015767336} +{"Full-pretrain/Learning Rate": 3.151399483293155e-07, "Full-pretrain/Loss": 1.9349464178085327, "Full-pretrain/Loss (Raw)": 1.9942916631698608, "Full-pretrain/Step": 9068, "Full-pretrain/Step Time": 17.599954372271895} +{"Full-pretrain/Learning Rate": 3.1379745672885375e-07, "Full-pretrain/Loss": 1.9285472631454468, "Full-pretrain/Loss (Raw)": 1.6655123233795166, "Full-pretrain/Step": 9069, "Full-pretrain/Step Time": 17.594864200800657} +{"Full-pretrain/Learning Rate": 3.1245781267318085e-07, "Full-pretrain/Loss": 1.9147655963897705, "Full-pretrain/Loss (Raw)": 1.5254806280136108, "Full-pretrain/Step": 9070, "Full-pretrain/Step Time": 17.598444551229477} +{"Full-pretrain/Learning Rate": 3.111210163168232e-07, "Full-pretrain/Loss": 1.918595314025879, "Full-pretrain/Loss (Raw)": 1.917568325996399, "Full-pretrain/Step": 9071, "Full-pretrain/Step Time": 17.599631551653147} +{"Full-pretrain/Learning Rate": 3.097870678139797e-07, "Full-pretrain/Loss": 1.915358304977417, "Full-pretrain/Loss (Raw)": 1.8114314079284668, "Full-pretrain/Step": 9072, "Full-pretrain/Step Time": 17.60341160558164} +{"Full-pretrain/Learning Rate": 3.084559673185217e-07, "Full-pretrain/Loss": 1.9080810546875, "Full-pretrain/Loss (Raw)": 2.087216854095459, "Full-pretrain/Step": 9073, "Full-pretrain/Step Time": 17.607085259631276} +{"Full-pretrain/Learning Rate": 3.0712771498399017e-07, "Full-pretrain/Loss": 1.9079502820968628, "Full-pretrain/Loss (Raw)": 1.8620586395263672, "Full-pretrain/Step": 9074, "Full-pretrain/Step Time": 17.605646582320333} +{"Full-pretrain/Learning Rate": 3.058023109636016e-07, "Full-pretrain/Loss": 1.9150285720825195, "Full-pretrain/Loss (Raw)": 2.0882742404937744, "Full-pretrain/Step": 9075, "Full-pretrain/Step Time": 17.604319280013442} +{"Full-pretrain/Learning Rate": 3.0447975541023356e-07, "Full-pretrain/Loss": 1.9221200942993164, "Full-pretrain/Loss (Raw)": 2.004077672958374, "Full-pretrain/Step": 9076, "Full-pretrain/Step Time": 17.608815358951688} +{"Full-pretrain/Learning Rate": 3.031600484764502e-07, "Full-pretrain/Loss": 1.9184229373931885, "Full-pretrain/Loss (Raw)": 1.926466464996338, "Full-pretrain/Step": 9077, "Full-pretrain/Step Time": 17.607850080356002} +{"Full-pretrain/Learning Rate": 3.0184319031447696e-07, "Full-pretrain/Loss": 1.9240773916244507, "Full-pretrain/Loss (Raw)": 1.8350287675857544, "Full-pretrain/Step": 9078, "Full-pretrain/Step Time": 17.61789862625301} +{"Full-pretrain/Learning Rate": 3.00529181076209e-07, "Full-pretrain/Loss": 1.925491452217102, "Full-pretrain/Loss (Raw)": 2.008293628692627, "Full-pretrain/Step": 9079, "Full-pretrain/Step Time": 17.61899896711111} +{"Full-pretrain/Learning Rate": 2.9921802091322224e-07, "Full-pretrain/Loss": 1.9288694858551025, "Full-pretrain/Loss (Raw)": 2.0743422508239746, "Full-pretrain/Step": 9080, "Full-pretrain/Step Time": 17.61989344470203} +{"Full-pretrain/Learning Rate": 2.9790970997675695e-07, "Full-pretrain/Loss": 1.9308886528015137, "Full-pretrain/Loss (Raw)": 2.013361930847168, "Full-pretrain/Step": 9081, "Full-pretrain/Step Time": 17.628087861463428} +{"Full-pretrain/Learning Rate": 2.966042484177228e-07, "Full-pretrain/Loss": 1.9314603805541992, "Full-pretrain/Loss (Raw)": 2.1645748615264893, "Full-pretrain/Step": 9082, "Full-pretrain/Step Time": 17.624272791668773} +{"Full-pretrain/Learning Rate": 2.953016363867078e-07, "Full-pretrain/Loss": 1.9244976043701172, "Full-pretrain/Loss (Raw)": 2.0118117332458496, "Full-pretrain/Step": 9083, "Full-pretrain/Step Time": 17.62425903044641} +{"Full-pretrain/Learning Rate": 2.940018740339695e-07, "Full-pretrain/Loss": 1.9238197803497314, "Full-pretrain/Loss (Raw)": 1.9857710599899292, "Full-pretrain/Step": 9084, "Full-pretrain/Step Time": 17.621618174016476} +{"Full-pretrain/Learning Rate": 2.927049615094296e-07, "Full-pretrain/Loss": 1.92738938331604, "Full-pretrain/Loss (Raw)": 2.1129071712493896, "Full-pretrain/Step": 9085, "Full-pretrain/Step Time": 17.62542953528464} +{"Full-pretrain/Learning Rate": 2.9141089896269346e-07, "Full-pretrain/Loss": 1.9309699535369873, "Full-pretrain/Loss (Raw)": 2.067275047302246, "Full-pretrain/Step": 9086, "Full-pretrain/Step Time": 17.625470308586955} +{"Full-pretrain/Learning Rate": 2.90119686543025e-07, "Full-pretrain/Loss": 1.9426636695861816, "Full-pretrain/Loss (Raw)": 1.9581712484359741, "Full-pretrain/Step": 9087, "Full-pretrain/Step Time": 17.628830209374428} +{"Full-pretrain/Learning Rate": 2.888313243993662e-07, "Full-pretrain/Loss": 1.9415249824523926, "Full-pretrain/Loss (Raw)": 1.8925647735595703, "Full-pretrain/Step": 9088, "Full-pretrain/Step Time": 17.625723265111446} +{"Full-pretrain/Learning Rate": 2.875458126803315e-07, "Full-pretrain/Loss": 1.9433515071868896, "Full-pretrain/Loss (Raw)": 2.1789298057556152, "Full-pretrain/Step": 9089, "Full-pretrain/Step Time": 17.623494766652584} +{"Full-pretrain/Learning Rate": 2.8626315153420236e-07, "Full-pretrain/Loss": 1.9383995532989502, "Full-pretrain/Loss (Raw)": 1.8265881538391113, "Full-pretrain/Step": 9090, "Full-pretrain/Step Time": 17.626608531922102} +{"Full-pretrain/Learning Rate": 2.8498334110893256e-07, "Full-pretrain/Loss": 1.9371747970581055, "Full-pretrain/Loss (Raw)": 1.8597609996795654, "Full-pretrain/Step": 9091, "Full-pretrain/Step Time": 17.626581110060215} +{"Full-pretrain/Learning Rate": 2.8370638155215123e-07, "Full-pretrain/Loss": 1.9485517740249634, "Full-pretrain/Loss (Raw)": 2.0751428604125977, "Full-pretrain/Step": 9092, "Full-pretrain/Step Time": 17.623189330101013} +{"Full-pretrain/Learning Rate": 2.8243227301115173e-07, "Full-pretrain/Loss": 1.942314624786377, "Full-pretrain/Loss (Raw)": 1.8504390716552734, "Full-pretrain/Step": 9093, "Full-pretrain/Step Time": 17.62467984482646} +{"Full-pretrain/Learning Rate": 2.8116101563290253e-07, "Full-pretrain/Loss": 1.9425132274627686, "Full-pretrain/Loss (Raw)": 1.9584629535675049, "Full-pretrain/Step": 9094, "Full-pretrain/Step Time": 17.630542039871216} +{"Full-pretrain/Learning Rate": 2.7989260956404193e-07, "Full-pretrain/Loss": 1.9430675506591797, "Full-pretrain/Loss (Raw)": 1.9680761098861694, "Full-pretrain/Step": 9095, "Full-pretrain/Step Time": 17.63086044229567} +{"Full-pretrain/Learning Rate": 2.786270549508835e-07, "Full-pretrain/Loss": 1.949522852897644, "Full-pretrain/Loss (Raw)": 1.894030213356018, "Full-pretrain/Step": 9096, "Full-pretrain/Step Time": 17.62684865295887} +{"Full-pretrain/Learning Rate": 2.7736435193940755e-07, "Full-pretrain/Loss": 1.957468867301941, "Full-pretrain/Loss (Raw)": 2.216817617416382, "Full-pretrain/Step": 9097, "Full-pretrain/Step Time": 17.63262073136866} +{"Full-pretrain/Learning Rate": 2.7610450067526436e-07, "Full-pretrain/Loss": 1.9490370750427246, "Full-pretrain/Loss (Raw)": 1.6731717586517334, "Full-pretrain/Step": 9098, "Full-pretrain/Step Time": 17.642583779990673} +{"Full-pretrain/Learning Rate": 2.7484750130377655e-07, "Full-pretrain/Loss": 1.948449969291687, "Full-pretrain/Loss (Raw)": 1.842496633529663, "Full-pretrain/Step": 9099, "Full-pretrain/Step Time": 17.64465106278658} +{"Full-pretrain/Learning Rate": 2.73593353969942e-07, "Full-pretrain/Loss": 1.9526057243347168, "Full-pretrain/Loss (Raw)": 2.1272811889648438, "Full-pretrain/Step": 9100, "Full-pretrain/Step Time": 17.630876258015633} +{"Full-pretrain/Learning Rate": 2.7234205881842554e-07, "Full-pretrain/Loss": 1.964881181716919, "Full-pretrain/Loss (Raw)": 2.0583229064941406, "Full-pretrain/Step": 9101, "Full-pretrain/Step Time": 17.633784549310803} +{"Full-pretrain/Learning Rate": 2.7109361599356177e-07, "Full-pretrain/Loss": 1.964210033416748, "Full-pretrain/Loss (Raw)": 1.5040061473846436, "Full-pretrain/Step": 9102, "Full-pretrain/Step Time": 17.634515192359686} +{"Full-pretrain/Learning Rate": 2.698480256393604e-07, "Full-pretrain/Loss": 1.9622888565063477, "Full-pretrain/Loss (Raw)": 1.8560900688171387, "Full-pretrain/Step": 9103, "Full-pretrain/Step Time": 17.641497004777193} +{"Full-pretrain/Learning Rate": 2.6860528789949544e-07, "Full-pretrain/Loss": 1.9661366939544678, "Full-pretrain/Loss (Raw)": 1.9345660209655762, "Full-pretrain/Step": 9104, "Full-pretrain/Step Time": 17.638109523802996} +{"Full-pretrain/Learning Rate": 2.673654029173217e-07, "Full-pretrain/Loss": 1.95802640914917, "Full-pretrain/Loss (Raw)": 1.827684760093689, "Full-pretrain/Step": 9105, "Full-pretrain/Step Time": 17.64142812974751} +{"Full-pretrain/Learning Rate": 2.6612837083585527e-07, "Full-pretrain/Loss": 1.9591445922851562, "Full-pretrain/Loss (Raw)": 1.897838830947876, "Full-pretrain/Step": 9106, "Full-pretrain/Step Time": 17.641705291345716} +{"Full-pretrain/Learning Rate": 2.648941917977904e-07, "Full-pretrain/Loss": 1.9634369611740112, "Full-pretrain/Loss (Raw)": 2.2256312370300293, "Full-pretrain/Step": 9107, "Full-pretrain/Step Time": 17.639353854581714} +{"Full-pretrain/Learning Rate": 2.6366286594549093e-07, "Full-pretrain/Loss": 1.9711287021636963, "Full-pretrain/Loss (Raw)": 2.250211238861084, "Full-pretrain/Step": 9108, "Full-pretrain/Step Time": 17.64088132046163} +{"Full-pretrain/Learning Rate": 2.624343934209822e-07, "Full-pretrain/Loss": 1.9604233503341675, "Full-pretrain/Loss (Raw)": 1.5838954448699951, "Full-pretrain/Step": 9109, "Full-pretrain/Step Time": 17.64240833185613} +{"Full-pretrain/Learning Rate": 2.6120877436597577e-07, "Full-pretrain/Loss": 1.9704525470733643, "Full-pretrain/Loss (Raw)": 2.1559643745422363, "Full-pretrain/Step": 9110, "Full-pretrain/Step Time": 17.64565054886043} +{"Full-pretrain/Learning Rate": 2.59986008921842e-07, "Full-pretrain/Loss": 1.9638983011245728, "Full-pretrain/Loss (Raw)": 1.7985551357269287, "Full-pretrain/Step": 9111, "Full-pretrain/Step Time": 17.64604769833386} +{"Full-pretrain/Learning Rate": 2.587660972296263e-07, "Full-pretrain/Loss": 1.950823426246643, "Full-pretrain/Loss (Raw)": 1.6559443473815918, "Full-pretrain/Step": 9112, "Full-pretrain/Step Time": 17.641927905380726} +{"Full-pretrain/Learning Rate": 2.575490394300495e-07, "Full-pretrain/Loss": 1.9317011833190918, "Full-pretrain/Loss (Raw)": 1.4014506340026855, "Full-pretrain/Step": 9113, "Full-pretrain/Step Time": 17.64506276138127} +{"Full-pretrain/Learning Rate": 2.5633483566349645e-07, "Full-pretrain/Loss": 1.9327425956726074, "Full-pretrain/Loss (Raw)": 2.1979024410247803, "Full-pretrain/Step": 9114, "Full-pretrain/Step Time": 17.65113476291299} +{"Full-pretrain/Learning Rate": 2.551234860700219e-07, "Full-pretrain/Loss": 1.9287890195846558, "Full-pretrain/Loss (Raw)": 1.8852972984313965, "Full-pretrain/Step": 9115, "Full-pretrain/Step Time": 17.656247237697244} +{"Full-pretrain/Learning Rate": 2.5391499078935845e-07, "Full-pretrain/Loss": 1.9298017024993896, "Full-pretrain/Loss (Raw)": 2.0181779861450195, "Full-pretrain/Step": 9116, "Full-pretrain/Step Time": 17.65062036924064} +{"Full-pretrain/Learning Rate": 2.527093499609029e-07, "Full-pretrain/Loss": 1.9229304790496826, "Full-pretrain/Loss (Raw)": 1.8930296897888184, "Full-pretrain/Step": 9117, "Full-pretrain/Step Time": 17.65664231777191} +{"Full-pretrain/Learning Rate": 2.515065637237302e-07, "Full-pretrain/Loss": 1.9160282611846924, "Full-pretrain/Loss (Raw)": 1.846400260925293, "Full-pretrain/Step": 9118, "Full-pretrain/Step Time": 17.65918766334653} +{"Full-pretrain/Learning Rate": 2.5030663221657646e-07, "Full-pretrain/Loss": 1.9132018089294434, "Full-pretrain/Loss (Raw)": 1.8677268028259277, "Full-pretrain/Step": 9119, "Full-pretrain/Step Time": 17.663035994395614} +{"Full-pretrain/Learning Rate": 2.491095555778533e-07, "Full-pretrain/Loss": 1.9166414737701416, "Full-pretrain/Loss (Raw)": 2.002636432647705, "Full-pretrain/Step": 9120, "Full-pretrain/Step Time": 17.656864596530795} +{"Full-pretrain/Learning Rate": 2.479153339456447e-07, "Full-pretrain/Loss": 1.9065942764282227, "Full-pretrain/Loss (Raw)": 1.8574182987213135, "Full-pretrain/Step": 9121, "Full-pretrain/Step Time": 17.657315991818905} +{"Full-pretrain/Learning Rate": 2.467239674577071e-07, "Full-pretrain/Loss": 1.910928726196289, "Full-pretrain/Loss (Raw)": 1.9652893543243408, "Full-pretrain/Step": 9122, "Full-pretrain/Step Time": 17.657938901335} +{"Full-pretrain/Learning Rate": 2.4553545625145835e-07, "Full-pretrain/Loss": 1.906404972076416, "Full-pretrain/Loss (Raw)": 1.7149975299835205, "Full-pretrain/Step": 9123, "Full-pretrain/Step Time": 17.662957137450576} +{"Full-pretrain/Learning Rate": 2.4434980046399713e-07, "Full-pretrain/Loss": 1.8906211853027344, "Full-pretrain/Loss (Raw)": 1.5700676441192627, "Full-pretrain/Step": 9124, "Full-pretrain/Step Time": 17.65845070593059} +{"Full-pretrain/Learning Rate": 2.431670002320863e-07, "Full-pretrain/Loss": 1.8952202796936035, "Full-pretrain/Loss (Raw)": 1.997607946395874, "Full-pretrain/Step": 9125, "Full-pretrain/Step Time": 17.65147978812456} +{"Full-pretrain/Learning Rate": 2.419870556921611e-07, "Full-pretrain/Loss": 1.8939279317855835, "Full-pretrain/Loss (Raw)": 1.9171078205108643, "Full-pretrain/Step": 9126, "Full-pretrain/Step Time": 17.655740762129426} +{"Full-pretrain/Learning Rate": 2.4080996698032934e-07, "Full-pretrain/Loss": 1.8971391916275024, "Full-pretrain/Loss (Raw)": 2.070836067199707, "Full-pretrain/Step": 9127, "Full-pretrain/Step Time": 17.65479601547122} +{"Full-pretrain/Learning Rate": 2.3963573423236573e-07, "Full-pretrain/Loss": 1.8928046226501465, "Full-pretrain/Loss (Raw)": 1.7553250789642334, "Full-pretrain/Step": 9128, "Full-pretrain/Step Time": 17.656094413250685} +{"Full-pretrain/Learning Rate": 2.384643575837203e-07, "Full-pretrain/Loss": 1.8850791454315186, "Full-pretrain/Loss (Raw)": 1.9696033000946045, "Full-pretrain/Step": 9129, "Full-pretrain/Step Time": 17.658070923760533} +{"Full-pretrain/Learning Rate": 2.3729583716950998e-07, "Full-pretrain/Loss": 1.8989688158035278, "Full-pretrain/Loss (Raw)": 2.11763858795166, "Full-pretrain/Step": 9130, "Full-pretrain/Step Time": 17.6556756477803} +{"Full-pretrain/Learning Rate": 2.3613017312451858e-07, "Full-pretrain/Loss": 1.9027342796325684, "Full-pretrain/Loss (Raw)": 1.9629961252212524, "Full-pretrain/Step": 9131, "Full-pretrain/Step Time": 17.657921815291047} +{"Full-pretrain/Learning Rate": 2.3496736558321354e-07, "Full-pretrain/Loss": 1.9035382270812988, "Full-pretrain/Loss (Raw)": 2.153003215789795, "Full-pretrain/Step": 9132, "Full-pretrain/Step Time": 17.656875958666205} +{"Full-pretrain/Learning Rate": 2.3380741467971534e-07, "Full-pretrain/Loss": 1.900201678276062, "Full-pretrain/Loss (Raw)": 1.951553225517273, "Full-pretrain/Step": 9133, "Full-pretrain/Step Time": 17.653742149472237} +{"Full-pretrain/Learning Rate": 2.3265032054783365e-07, "Full-pretrain/Loss": 1.9117176532745361, "Full-pretrain/Loss (Raw)": 1.8725173473358154, "Full-pretrain/Step": 9134, "Full-pretrain/Step Time": 17.65724451467395} +{"Full-pretrain/Learning Rate": 2.3149608332103113e-07, "Full-pretrain/Loss": 1.9149751663208008, "Full-pretrain/Loss (Raw)": 1.960329532623291, "Full-pretrain/Step": 9135, "Full-pretrain/Step Time": 17.657780192792416} +{"Full-pretrain/Learning Rate": 2.303447031324485e-07, "Full-pretrain/Loss": 1.917175531387329, "Full-pretrain/Loss (Raw)": 2.0049800872802734, "Full-pretrain/Step": 9136, "Full-pretrain/Step Time": 17.652172479778528} +{"Full-pretrain/Learning Rate": 2.2919618011490174e-07, "Full-pretrain/Loss": 1.9235725402832031, "Full-pretrain/Loss (Raw)": 2.0323843955993652, "Full-pretrain/Step": 9137, "Full-pretrain/Step Time": 17.65290253981948} +{"Full-pretrain/Learning Rate": 2.28050514400871e-07, "Full-pretrain/Loss": 1.9286829233169556, "Full-pretrain/Loss (Raw)": 2.061372995376587, "Full-pretrain/Step": 9138, "Full-pretrain/Step Time": 17.652214784175158} +{"Full-pretrain/Learning Rate": 2.269077061225089e-07, "Full-pretrain/Loss": 1.9141287803649902, "Full-pretrain/Loss (Raw)": 1.759898066520691, "Full-pretrain/Step": 9139, "Full-pretrain/Step Time": 17.651349890977144} +{"Full-pretrain/Learning Rate": 2.2576775541163498e-07, "Full-pretrain/Loss": 1.9063427448272705, "Full-pretrain/Loss (Raw)": 2.001063108444214, "Full-pretrain/Step": 9140, "Full-pretrain/Step Time": 17.646406944841146} +{"Full-pretrain/Learning Rate": 2.2463066239974684e-07, "Full-pretrain/Loss": 1.9056437015533447, "Full-pretrain/Loss (Raw)": 1.5615234375, "Full-pretrain/Step": 9141, "Full-pretrain/Step Time": 17.652260176837444} +{"Full-pretrain/Learning Rate": 2.2349642721800346e-07, "Full-pretrain/Loss": 1.899418830871582, "Full-pretrain/Loss (Raw)": 1.956766128540039, "Full-pretrain/Step": 9142, "Full-pretrain/Step Time": 17.651755528524518} +{"Full-pretrain/Learning Rate": 2.2236504999723906e-07, "Full-pretrain/Loss": 1.9058648347854614, "Full-pretrain/Loss (Raw)": 2.0048301219940186, "Full-pretrain/Step": 9143, "Full-pretrain/Step Time": 17.649226240813732} +{"Full-pretrain/Learning Rate": 2.2123653086796038e-07, "Full-pretrain/Loss": 1.9148310422897339, "Full-pretrain/Loss (Raw)": 1.942863941192627, "Full-pretrain/Step": 9144, "Full-pretrain/Step Time": 17.638738237321377} +{"Full-pretrain/Learning Rate": 2.2011086996034103e-07, "Full-pretrain/Loss": 1.9291398525238037, "Full-pretrain/Loss (Raw)": 1.8593311309814453, "Full-pretrain/Step": 9145, "Full-pretrain/Step Time": 17.644595336169004} +{"Full-pretrain/Learning Rate": 2.1898806740422163e-07, "Full-pretrain/Loss": 1.9204537868499756, "Full-pretrain/Loss (Raw)": 1.9199471473693848, "Full-pretrain/Step": 9146, "Full-pretrain/Step Time": 17.64593749679625} +{"Full-pretrain/Learning Rate": 2.1786812332912076e-07, "Full-pretrain/Loss": 1.9243988990783691, "Full-pretrain/Loss (Raw)": 2.0115442276000977, "Full-pretrain/Step": 9147, "Full-pretrain/Step Time": 17.643926994875073} +{"Full-pretrain/Learning Rate": 2.1675103786422402e-07, "Full-pretrain/Loss": 1.9076809883117676, "Full-pretrain/Loss (Raw)": 1.4832017421722412, "Full-pretrain/Step": 9148, "Full-pretrain/Step Time": 17.640195973217487} +{"Full-pretrain/Learning Rate": 2.1563681113838387e-07, "Full-pretrain/Loss": 1.9057399034500122, "Full-pretrain/Loss (Raw)": 1.8309178352355957, "Full-pretrain/Step": 9149, "Full-pretrain/Step Time": 17.64404726214707} +{"Full-pretrain/Learning Rate": 2.145254432801308e-07, "Full-pretrain/Loss": 1.9045614004135132, "Full-pretrain/Loss (Raw)": 1.8086843490600586, "Full-pretrain/Step": 9150, "Full-pretrain/Step Time": 17.64625160396099} +{"Full-pretrain/Learning Rate": 2.1341693441765398e-07, "Full-pretrain/Loss": 1.9034720659255981, "Full-pretrain/Loss (Raw)": 1.832869529724121, "Full-pretrain/Step": 9151, "Full-pretrain/Step Time": 17.643824802711606} +{"Full-pretrain/Learning Rate": 2.123112846788261e-07, "Full-pretrain/Loss": 1.901930809020996, "Full-pretrain/Loss (Raw)": 1.9533171653747559, "Full-pretrain/Step": 9152, "Full-pretrain/Step Time": 17.641568763181567} +{"Full-pretrain/Learning Rate": 2.112084941911785e-07, "Full-pretrain/Loss": 1.895936369895935, "Full-pretrain/Loss (Raw)": 1.6655964851379395, "Full-pretrain/Step": 9153, "Full-pretrain/Step Time": 17.638517362996936} +{"Full-pretrain/Learning Rate": 2.101085630819205e-07, "Full-pretrain/Loss": 1.8919073343276978, "Full-pretrain/Loss (Raw)": 1.836360216140747, "Full-pretrain/Step": 9154, "Full-pretrain/Step Time": 17.642592325806618} +{"Full-pretrain/Learning Rate": 2.0901149147792841e-07, "Full-pretrain/Loss": 1.8945732116699219, "Full-pretrain/Loss (Raw)": 1.8003038167953491, "Full-pretrain/Step": 9155, "Full-pretrain/Step Time": 17.637443650513887} +{"Full-pretrain/Learning Rate": 2.0791727950574823e-07, "Full-pretrain/Loss": 1.9046456813812256, "Full-pretrain/Loss (Raw)": 1.8923888206481934, "Full-pretrain/Step": 9156, "Full-pretrain/Step Time": 17.64196807332337} +{"Full-pretrain/Learning Rate": 2.0682592729159567e-07, "Full-pretrain/Loss": 1.9002436399459839, "Full-pretrain/Loss (Raw)": 1.8567419052124023, "Full-pretrain/Step": 9157, "Full-pretrain/Step Time": 17.644184255972505} +{"Full-pretrain/Learning Rate": 2.0573743496136167e-07, "Full-pretrain/Loss": 1.8992226123809814, "Full-pretrain/Loss (Raw)": 1.8844355344772339, "Full-pretrain/Step": 9158, "Full-pretrain/Step Time": 17.644604260101914} +{"Full-pretrain/Learning Rate": 2.0465180264060135e-07, "Full-pretrain/Loss": 1.8945575952529907, "Full-pretrain/Loss (Raw)": 1.9215552806854248, "Full-pretrain/Step": 9159, "Full-pretrain/Step Time": 17.643512789160013} +{"Full-pretrain/Learning Rate": 2.0356903045453958e-07, "Full-pretrain/Loss": 1.8994805812835693, "Full-pretrain/Loss (Raw)": 1.912862777709961, "Full-pretrain/Step": 9160, "Full-pretrain/Step Time": 17.64467214792967} +{"Full-pretrain/Learning Rate": 2.0248911852807916e-07, "Full-pretrain/Loss": 1.8948715925216675, "Full-pretrain/Loss (Raw)": 1.822113275527954, "Full-pretrain/Step": 9161, "Full-pretrain/Step Time": 17.644690046086907} +{"Full-pretrain/Learning Rate": 2.0141206698578163e-07, "Full-pretrain/Loss": 1.8900834321975708, "Full-pretrain/Loss (Raw)": 1.964416742324829, "Full-pretrain/Step": 9162, "Full-pretrain/Step Time": 17.646588690578938} +{"Full-pretrain/Learning Rate": 2.0033787595188925e-07, "Full-pretrain/Loss": 1.8881559371948242, "Full-pretrain/Loss (Raw)": 1.9013149738311768, "Full-pretrain/Step": 9163, "Full-pretrain/Step Time": 17.648033902049065} +{"Full-pretrain/Learning Rate": 1.9926654555030566e-07, "Full-pretrain/Loss": 1.8795031309127808, "Full-pretrain/Loss (Raw)": 1.8761156797409058, "Full-pretrain/Step": 9164, "Full-pretrain/Step Time": 17.645252278074622} +{"Full-pretrain/Learning Rate": 1.981980759046126e-07, "Full-pretrain/Loss": 1.8807536363601685, "Full-pretrain/Loss (Raw)": 1.991570234298706, "Full-pretrain/Step": 9165, "Full-pretrain/Step Time": 17.648262530565262} +{"Full-pretrain/Learning Rate": 1.9713246713805588e-07, "Full-pretrain/Loss": 1.878067135810852, "Full-pretrain/Loss (Raw)": 1.786547064781189, "Full-pretrain/Step": 9166, "Full-pretrain/Step Time": 17.651650495827198} +{"Full-pretrain/Learning Rate": 1.960697193735511e-07, "Full-pretrain/Loss": 1.885815143585205, "Full-pretrain/Loss (Raw)": 2.2082629203796387, "Full-pretrain/Step": 9167, "Full-pretrain/Step Time": 17.649752451106906} +{"Full-pretrain/Learning Rate": 1.9500983273368633e-07, "Full-pretrain/Loss": 1.886894702911377, "Full-pretrain/Loss (Raw)": 2.039527416229248, "Full-pretrain/Step": 9168, "Full-pretrain/Step Time": 17.65444170869887} +{"Full-pretrain/Learning Rate": 1.9395280734072208e-07, "Full-pretrain/Loss": 1.8828344345092773, "Full-pretrain/Loss (Raw)": 1.902456283569336, "Full-pretrain/Step": 9169, "Full-pretrain/Step Time": 17.652624543756247} +{"Full-pretrain/Learning Rate": 1.9289864331658303e-07, "Full-pretrain/Loss": 1.8843739032745361, "Full-pretrain/Loss (Raw)": 2.110635757446289, "Full-pretrain/Step": 9170, "Full-pretrain/Step Time": 17.65897050127387} +{"Full-pretrain/Learning Rate": 1.9184734078286914e-07, "Full-pretrain/Loss": 1.8939895629882812, "Full-pretrain/Loss (Raw)": 2.067598581314087, "Full-pretrain/Step": 9171, "Full-pretrain/Step Time": 17.65803198516369} +{"Full-pretrain/Learning Rate": 1.9079889986084453e-07, "Full-pretrain/Loss": 1.8959712982177734, "Full-pretrain/Loss (Raw)": 2.064481019973755, "Full-pretrain/Step": 9172, "Full-pretrain/Step Time": 17.66140593215823} +{"Full-pretrain/Learning Rate": 1.8975332067145134e-07, "Full-pretrain/Loss": 1.8954362869262695, "Full-pretrain/Loss (Raw)": 1.544402837753296, "Full-pretrain/Step": 9173, "Full-pretrain/Step Time": 17.658755159005523} +{"Full-pretrain/Learning Rate": 1.8871060333529033e-07, "Full-pretrain/Loss": 1.8907744884490967, "Full-pretrain/Loss (Raw)": 1.8075900077819824, "Full-pretrain/Step": 9174, "Full-pretrain/Step Time": 17.666963262483478} +{"Full-pretrain/Learning Rate": 1.8767074797264306e-07, "Full-pretrain/Loss": 1.8929556608200073, "Full-pretrain/Loss (Raw)": 2.07462477684021, "Full-pretrain/Step": 9175, "Full-pretrain/Step Time": 17.65711022168398} +{"Full-pretrain/Learning Rate": 1.8663375470345523e-07, "Full-pretrain/Loss": 1.892366886138916, "Full-pretrain/Loss (Raw)": 1.9240243434906006, "Full-pretrain/Step": 9176, "Full-pretrain/Step Time": 17.658455861732364} +{"Full-pretrain/Learning Rate": 1.8559962364734507e-07, "Full-pretrain/Loss": 1.8947125673294067, "Full-pretrain/Loss (Raw)": 1.9343910217285156, "Full-pretrain/Step": 9177, "Full-pretrain/Step Time": 17.657251048833132} +{"Full-pretrain/Learning Rate": 1.845683549235977e-07, "Full-pretrain/Loss": 1.8907172679901123, "Full-pretrain/Loss (Raw)": 1.7920970916748047, "Full-pretrain/Step": 9178, "Full-pretrain/Step Time": 17.662398297339678} +{"Full-pretrain/Learning Rate": 1.8353994865116797e-07, "Full-pretrain/Loss": 1.8830257654190063, "Full-pretrain/Loss (Raw)": 1.7654170989990234, "Full-pretrain/Step": 9179, "Full-pretrain/Step Time": 17.660902582108974} +{"Full-pretrain/Learning Rate": 1.8251440494868598e-07, "Full-pretrain/Loss": 1.8963040113449097, "Full-pretrain/Loss (Raw)": 1.9081088304519653, "Full-pretrain/Step": 9180, "Full-pretrain/Step Time": 17.65745732933283} +{"Full-pretrain/Learning Rate": 1.8149172393444603e-07, "Full-pretrain/Loss": 1.903829574584961, "Full-pretrain/Loss (Raw)": 2.071732997894287, "Full-pretrain/Step": 9181, "Full-pretrain/Step Time": 17.659955330193043} +{"Full-pretrain/Learning Rate": 1.8047190572641204e-07, "Full-pretrain/Loss": 1.9103593826293945, "Full-pretrain/Loss (Raw)": 2.017638921737671, "Full-pretrain/Step": 9182, "Full-pretrain/Step Time": 17.660940382629633} +{"Full-pretrain/Learning Rate": 1.794549504422205e-07, "Full-pretrain/Loss": 1.9156017303466797, "Full-pretrain/Loss (Raw)": 2.000624418258667, "Full-pretrain/Step": 9183, "Full-pretrain/Step Time": 17.652932738885283} +{"Full-pretrain/Learning Rate": 1.7844085819918032e-07, "Full-pretrain/Loss": 1.9106147289276123, "Full-pretrain/Loss (Raw)": 1.7937332391738892, "Full-pretrain/Step": 9184, "Full-pretrain/Step Time": 17.657236767932773} +{"Full-pretrain/Learning Rate": 1.7742962911426464e-07, "Full-pretrain/Loss": 1.9225878715515137, "Full-pretrain/Loss (Raw)": 2.048734188079834, "Full-pretrain/Step": 9185, "Full-pretrain/Step Time": 17.65706610120833} +{"Full-pretrain/Learning Rate": 1.7642126330411624e-07, "Full-pretrain/Loss": 1.9255821704864502, "Full-pretrain/Loss (Raw)": 1.93218195438385, "Full-pretrain/Step": 9186, "Full-pretrain/Step Time": 17.66283810324967} +{"Full-pretrain/Learning Rate": 1.7541576088505318e-07, "Full-pretrain/Loss": 1.9264445304870605, "Full-pretrain/Loss (Raw)": 1.827897548675537, "Full-pretrain/Step": 9187, "Full-pretrain/Step Time": 17.658274890854955} +{"Full-pretrain/Learning Rate": 1.7441312197305494e-07, "Full-pretrain/Loss": 1.9291889667510986, "Full-pretrain/Loss (Raw)": 1.9802119731903076, "Full-pretrain/Step": 9188, "Full-pretrain/Step Time": 17.670194583013654} +{"Full-pretrain/Learning Rate": 1.7341334668378172e-07, "Full-pretrain/Loss": 1.9345377683639526, "Full-pretrain/Loss (Raw)": 2.027902603149414, "Full-pretrain/Step": 9189, "Full-pretrain/Step Time": 17.663845516741276} +{"Full-pretrain/Learning Rate": 1.7241643513255247e-07, "Full-pretrain/Loss": 1.9348666667938232, "Full-pretrain/Loss (Raw)": 1.894958734512329, "Full-pretrain/Step": 9190, "Full-pretrain/Step Time": 17.670087793841958} +{"Full-pretrain/Learning Rate": 1.7142238743436401e-07, "Full-pretrain/Loss": 1.9343024492263794, "Full-pretrain/Loss (Raw)": 1.903501272201538, "Full-pretrain/Step": 9191, "Full-pretrain/Step Time": 17.6617818698287} +{"Full-pretrain/Learning Rate": 1.7043120370387744e-07, "Full-pretrain/Loss": 1.92803955078125, "Full-pretrain/Loss (Raw)": 1.712449073791504, "Full-pretrain/Step": 9192, "Full-pretrain/Step Time": 17.667147658765316} +{"Full-pretrain/Learning Rate": 1.694428840554263e-07, "Full-pretrain/Loss": 1.9233319759368896, "Full-pretrain/Loss (Raw)": 1.6714718341827393, "Full-pretrain/Step": 9193, "Full-pretrain/Step Time": 17.66391621902585} +{"Full-pretrain/Learning Rate": 1.6845742860301382e-07, "Full-pretrain/Loss": 1.9301421642303467, "Full-pretrain/Loss (Raw)": 2.182344913482666, "Full-pretrain/Step": 9194, "Full-pretrain/Step Time": 17.664234075695276} +{"Full-pretrain/Learning Rate": 1.6747483746030746e-07, "Full-pretrain/Loss": 1.9434280395507812, "Full-pretrain/Loss (Raw)": 2.326462984085083, "Full-pretrain/Step": 9195, "Full-pretrain/Step Time": 17.668192664161325} +{"Full-pretrain/Learning Rate": 1.664951107406526e-07, "Full-pretrain/Loss": 1.9396536350250244, "Full-pretrain/Loss (Raw)": 1.755332589149475, "Full-pretrain/Step": 9196, "Full-pretrain/Step Time": 17.666169887408614} +{"Full-pretrain/Learning Rate": 1.6551824855705888e-07, "Full-pretrain/Loss": 1.931471347808838, "Full-pretrain/Loss (Raw)": 1.729739785194397, "Full-pretrain/Step": 9197, "Full-pretrain/Step Time": 17.663082737475634} +{"Full-pretrain/Learning Rate": 1.645442510222084e-07, "Full-pretrain/Loss": 1.9416967630386353, "Full-pretrain/Loss (Raw)": 2.113759994506836, "Full-pretrain/Step": 9198, "Full-pretrain/Step Time": 17.664669442921877} +{"Full-pretrain/Learning Rate": 1.635731182484529e-07, "Full-pretrain/Loss": 1.941104769706726, "Full-pretrain/Loss (Raw)": 2.1893200874328613, "Full-pretrain/Step": 9199, "Full-pretrain/Step Time": 17.664023634046316} +{"Full-pretrain/Learning Rate": 1.626048503478056e-07, "Full-pretrain/Loss": 1.9354498386383057, "Full-pretrain/Loss (Raw)": 1.858566164970398, "Full-pretrain/Step": 9200, "Full-pretrain/Step Time": 17.666000513359904} +{"Full-pretrain/Learning Rate": 1.6163944743196323e-07, "Full-pretrain/Loss": 1.9374897480010986, "Full-pretrain/Loss (Raw)": 1.9677354097366333, "Full-pretrain/Step": 9201, "Full-pretrain/Step Time": 17.664540752768517} +{"Full-pretrain/Learning Rate": 1.6067690961228398e-07, "Full-pretrain/Loss": 1.928959608078003, "Full-pretrain/Loss (Raw)": 1.837669849395752, "Full-pretrain/Step": 9202, "Full-pretrain/Step Time": 17.661826683208346} +{"Full-pretrain/Learning Rate": 1.5971723699979013e-07, "Full-pretrain/Loss": 1.9223164319992065, "Full-pretrain/Loss (Raw)": 1.8550196886062622, "Full-pretrain/Step": 9203, "Full-pretrain/Step Time": 17.659416060894728} +{"Full-pretrain/Learning Rate": 1.5876042970518478e-07, "Full-pretrain/Loss": 1.9178640842437744, "Full-pretrain/Loss (Raw)": 1.9220057725906372, "Full-pretrain/Step": 9204, "Full-pretrain/Step Time": 17.659125668928027} +{"Full-pretrain/Learning Rate": 1.5780648783883523e-07, "Full-pretrain/Loss": 1.9282984733581543, "Full-pretrain/Loss (Raw)": 1.878301739692688, "Full-pretrain/Step": 9205, "Full-pretrain/Step Time": 17.66607599519193} +{"Full-pretrain/Learning Rate": 1.5685541151077566e-07, "Full-pretrain/Loss": 1.9337854385375977, "Full-pretrain/Loss (Raw)": 1.9831715822219849, "Full-pretrain/Step": 9206, "Full-pretrain/Step Time": 17.659378420561552} +{"Full-pretrain/Learning Rate": 1.5590720083071275e-07, "Full-pretrain/Loss": 1.9348889589309692, "Full-pretrain/Loss (Raw)": 2.1099400520324707, "Full-pretrain/Step": 9207, "Full-pretrain/Step Time": 17.65800255164504} +{"Full-pretrain/Learning Rate": 1.549618559080257e-07, "Full-pretrain/Loss": 1.935618281364441, "Full-pretrain/Loss (Raw)": 1.9473603963851929, "Full-pretrain/Step": 9208, "Full-pretrain/Step Time": 17.649705156683922} +{"Full-pretrain/Learning Rate": 1.5401937685175781e-07, "Full-pretrain/Loss": 1.9418978691101074, "Full-pretrain/Loss (Raw)": 2.1353416442871094, "Full-pretrain/Step": 9209, "Full-pretrain/Step Time": 17.650269120931625} +{"Full-pretrain/Learning Rate": 1.5307976377062216e-07, "Full-pretrain/Loss": 1.9478962421417236, "Full-pretrain/Loss (Raw)": 1.9840421676635742, "Full-pretrain/Step": 9210, "Full-pretrain/Step Time": 17.657810961827636} +{"Full-pretrain/Learning Rate": 1.5214301677300425e-07, "Full-pretrain/Loss": 1.9448018074035645, "Full-pretrain/Loss (Raw)": 1.666398048400879, "Full-pretrain/Step": 9211, "Full-pretrain/Step Time": 17.657181780785322} +{"Full-pretrain/Learning Rate": 1.512091359669565e-07, "Full-pretrain/Loss": 1.9454233646392822, "Full-pretrain/Loss (Raw)": 1.9279956817626953, "Full-pretrain/Step": 9212, "Full-pretrain/Step Time": 17.65726206637919} +{"Full-pretrain/Learning Rate": 1.502781214602039e-07, "Full-pretrain/Loss": 1.9431531429290771, "Full-pretrain/Loss (Raw)": 1.9990894794464111, "Full-pretrain/Step": 9213, "Full-pretrain/Step Time": 17.66184316202998} +{"Full-pretrain/Learning Rate": 1.4934997336013557e-07, "Full-pretrain/Loss": 1.9405231475830078, "Full-pretrain/Loss (Raw)": 1.9334770441055298, "Full-pretrain/Step": 9214, "Full-pretrain/Step Time": 17.66633260436356} +{"Full-pretrain/Learning Rate": 1.484246917738158e-07, "Full-pretrain/Loss": 1.9397609233856201, "Full-pretrain/Loss (Raw)": 1.9762341976165771, "Full-pretrain/Step": 9215, "Full-pretrain/Step Time": 17.661057664081454} +{"Full-pretrain/Learning Rate": 1.4750227680797312e-07, "Full-pretrain/Loss": 1.9588019847869873, "Full-pretrain/Loss (Raw)": 2.4030489921569824, "Full-pretrain/Step": 9216, "Full-pretrain/Step Time": 17.651508200913668} +{"Full-pretrain/Learning Rate": 1.4658272856900857e-07, "Full-pretrain/Loss": 1.948911190032959, "Full-pretrain/Loss (Raw)": 1.7322251796722412, "Full-pretrain/Step": 9217, "Full-pretrain/Step Time": 17.65683090314269} +{"Full-pretrain/Learning Rate": 1.4566604716299282e-07, "Full-pretrain/Loss": 1.9584167003631592, "Full-pretrain/Loss (Raw)": 2.236360549926758, "Full-pretrain/Step": 9218, "Full-pretrain/Step Time": 17.659965751692653} +{"Full-pretrain/Learning Rate": 1.447522326956663e-07, "Full-pretrain/Loss": 1.9568026065826416, "Full-pretrain/Loss (Raw)": 1.776242733001709, "Full-pretrain/Step": 9219, "Full-pretrain/Step Time": 17.658463809639215} +{"Full-pretrain/Learning Rate": 1.4384128527243356e-07, "Full-pretrain/Loss": 1.9529154300689697, "Full-pretrain/Loss (Raw)": 1.855823278427124, "Full-pretrain/Step": 9220, "Full-pretrain/Step Time": 17.656414380297065} +{"Full-pretrain/Learning Rate": 1.4293320499837171e-07, "Full-pretrain/Loss": 1.9483827352523804, "Full-pretrain/Loss (Raw)": 1.8828554153442383, "Full-pretrain/Step": 9221, "Full-pretrain/Step Time": 17.655295193195343} +{"Full-pretrain/Learning Rate": 1.4202799197823025e-07, "Full-pretrain/Loss": 1.9379055500030518, "Full-pretrain/Loss (Raw)": 1.5596911907196045, "Full-pretrain/Step": 9222, "Full-pretrain/Step Time": 17.65630672685802} +{"Full-pretrain/Learning Rate": 1.4112564631642568e-07, "Full-pretrain/Loss": 1.928391456604004, "Full-pretrain/Loss (Raw)": 1.5990468263626099, "Full-pretrain/Step": 9223, "Full-pretrain/Step Time": 17.657034520059824} +{"Full-pretrain/Learning Rate": 1.4022616811704137e-07, "Full-pretrain/Loss": 1.936303973197937, "Full-pretrain/Loss (Raw)": 1.9656518697738647, "Full-pretrain/Step": 9224, "Full-pretrain/Step Time": 17.655082911252975} +{"Full-pretrain/Learning Rate": 1.3932955748383049e-07, "Full-pretrain/Loss": 1.9387813806533813, "Full-pretrain/Loss (Raw)": 1.7507480382919312, "Full-pretrain/Step": 9225, "Full-pretrain/Step Time": 17.654538080096245} +{"Full-pretrain/Learning Rate": 1.3843581452022137e-07, "Full-pretrain/Loss": 1.9214105606079102, "Full-pretrain/Loss (Raw)": 1.6264797449111938, "Full-pretrain/Step": 9226, "Full-pretrain/Step Time": 17.653556495904922} +{"Full-pretrain/Learning Rate": 1.3754493932930102e-07, "Full-pretrain/Loss": 1.8949744701385498, "Full-pretrain/Loss (Raw)": 1.4805055856704712, "Full-pretrain/Step": 9227, "Full-pretrain/Step Time": 17.654643898829818} +{"Full-pretrain/Learning Rate": 1.3665693201383723e-07, "Full-pretrain/Loss": 1.9029203653335571, "Full-pretrain/Loss (Raw)": 2.0096068382263184, "Full-pretrain/Step": 9228, "Full-pretrain/Step Time": 17.655987080186605} +{"Full-pretrain/Learning Rate": 1.3577179267625638e-07, "Full-pretrain/Loss": 1.9150108098983765, "Full-pretrain/Loss (Raw)": 2.116630792617798, "Full-pretrain/Step": 9229, "Full-pretrain/Step Time": 17.65533723309636} +{"Full-pretrain/Learning Rate": 1.3488952141866294e-07, "Full-pretrain/Loss": 1.9100356101989746, "Full-pretrain/Loss (Raw)": 1.9545588493347168, "Full-pretrain/Step": 9230, "Full-pretrain/Step Time": 17.656694075092673} +{"Full-pretrain/Learning Rate": 1.3401011834282552e-07, "Full-pretrain/Loss": 1.9105753898620605, "Full-pretrain/Loss (Raw)": 2.2065911293029785, "Full-pretrain/Step": 9231, "Full-pretrain/Step Time": 17.651912601664662} +{"Full-pretrain/Learning Rate": 1.3313358355017959e-07, "Full-pretrain/Loss": 1.9117608070373535, "Full-pretrain/Loss (Raw)": 1.8965001106262207, "Full-pretrain/Step": 9232, "Full-pretrain/Step Time": 17.656467828899622} +{"Full-pretrain/Learning Rate": 1.3225991714183872e-07, "Full-pretrain/Loss": 1.9166890382766724, "Full-pretrain/Loss (Raw)": 2.1254353523254395, "Full-pretrain/Step": 9233, "Full-pretrain/Step Time": 17.652632586658} +{"Full-pretrain/Learning Rate": 1.3138911921857788e-07, "Full-pretrain/Loss": 1.9157493114471436, "Full-pretrain/Loss (Raw)": 1.8075993061065674, "Full-pretrain/Step": 9234, "Full-pretrain/Step Time": 17.65318200737238} +{"Full-pretrain/Learning Rate": 1.3052118988083894e-07, "Full-pretrain/Loss": 1.9129348993301392, "Full-pretrain/Loss (Raw)": 1.7649562358856201, "Full-pretrain/Step": 9235, "Full-pretrain/Step Time": 17.654221311211586} +{"Full-pretrain/Learning Rate": 1.296561292287446e-07, "Full-pretrain/Loss": 1.906660795211792, "Full-pretrain/Loss (Raw)": 1.7212350368499756, "Full-pretrain/Step": 9236, "Full-pretrain/Step Time": 17.650910140946507} +{"Full-pretrain/Learning Rate": 1.2879393736207336e-07, "Full-pretrain/Loss": 1.9085237979888916, "Full-pretrain/Loss (Raw)": 1.9379183053970337, "Full-pretrain/Step": 9237, "Full-pretrain/Step Time": 17.648210246115923} +{"Full-pretrain/Learning Rate": 1.2793461438028176e-07, "Full-pretrain/Loss": 1.9022634029388428, "Full-pretrain/Loss (Raw)": 1.7828400135040283, "Full-pretrain/Step": 9238, "Full-pretrain/Step Time": 17.648266803473234} +{"Full-pretrain/Learning Rate": 1.270781603824933e-07, "Full-pretrain/Loss": 1.8945178985595703, "Full-pretrain/Loss (Raw)": 1.8620800971984863, "Full-pretrain/Step": 9239, "Full-pretrain/Step Time": 17.649695018306375} +{"Full-pretrain/Learning Rate": 1.2622457546749567e-07, "Full-pretrain/Loss": 1.8962457180023193, "Full-pretrain/Loss (Raw)": 2.002653121948242, "Full-pretrain/Step": 9240, "Full-pretrain/Step Time": 17.650726044550538} +{"Full-pretrain/Learning Rate": 1.2537385973375448e-07, "Full-pretrain/Loss": 1.8908963203430176, "Full-pretrain/Loss (Raw)": 1.9641584157943726, "Full-pretrain/Step": 9241, "Full-pretrain/Step Time": 17.649781934916973} +{"Full-pretrain/Learning Rate": 1.2452601327939406e-07, "Full-pretrain/Loss": 1.8774906396865845, "Full-pretrain/Loss (Raw)": 1.555064082145691, "Full-pretrain/Step": 9242, "Full-pretrain/Step Time": 17.64884228631854} +{"Full-pretrain/Learning Rate": 1.236810362022195e-07, "Full-pretrain/Loss": 1.8776090145111084, "Full-pretrain/Loss (Raw)": 1.670183777809143, "Full-pretrain/Step": 9243, "Full-pretrain/Step Time": 17.64780167862773} +{"Full-pretrain/Learning Rate": 1.228389285996917e-07, "Full-pretrain/Loss": 1.8812097311019897, "Full-pretrain/Loss (Raw)": 2.0432186126708984, "Full-pretrain/Step": 9244, "Full-pretrain/Step Time": 17.651752972975373} +{"Full-pretrain/Learning Rate": 1.2199969056895523e-07, "Full-pretrain/Loss": 1.879422664642334, "Full-pretrain/Loss (Raw)": 1.9419033527374268, "Full-pretrain/Step": 9245, "Full-pretrain/Step Time": 17.645790249109268} +{"Full-pretrain/Learning Rate": 1.2116332220680758e-07, "Full-pretrain/Loss": 1.878409743309021, "Full-pretrain/Loss (Raw)": 1.9010646343231201, "Full-pretrain/Step": 9246, "Full-pretrain/Step Time": 17.647308269515634} +{"Full-pretrain/Learning Rate": 1.2032982360973e-07, "Full-pretrain/Loss": 1.874649167060852, "Full-pretrain/Loss (Raw)": 1.855894923210144, "Full-pretrain/Step": 9247, "Full-pretrain/Step Time": 17.642754705622792} +{"Full-pretrain/Learning Rate": 1.1949919487386218e-07, "Full-pretrain/Loss": 1.8525983095169067, "Full-pretrain/Loss (Raw)": 1.697422742843628, "Full-pretrain/Step": 9248, "Full-pretrain/Step Time": 17.647672498598695} +{"Full-pretrain/Learning Rate": 1.1867143609502195e-07, "Full-pretrain/Loss": 1.8619074821472168, "Full-pretrain/Loss (Raw)": 2.0301170349121094, "Full-pretrain/Step": 9249, "Full-pretrain/Step Time": 17.656008725985885} +{"Full-pretrain/Learning Rate": 1.1784654736868572e-07, "Full-pretrain/Loss": 1.8564759492874146, "Full-pretrain/Loss (Raw)": 2.062553882598877, "Full-pretrain/Step": 9250, "Full-pretrain/Step Time": 17.64935263246298} +{"Full-pretrain/Learning Rate": 1.1702452879000514e-07, "Full-pretrain/Loss": 1.864161729812622, "Full-pretrain/Loss (Raw)": 2.022188663482666, "Full-pretrain/Step": 9251, "Full-pretrain/Step Time": 17.646786630153656} +{"Full-pretrain/Learning Rate": 1.1620538045380158e-07, "Full-pretrain/Loss": 1.872744083404541, "Full-pretrain/Loss (Raw)": 2.13045597076416, "Full-pretrain/Step": 9252, "Full-pretrain/Step Time": 17.652672071009874} +{"Full-pretrain/Learning Rate": 1.1538910245456058e-07, "Full-pretrain/Loss": 1.8745226860046387, "Full-pretrain/Loss (Raw)": 1.9397714138031006, "Full-pretrain/Step": 9253, "Full-pretrain/Step Time": 17.655631635338068} +{"Full-pretrain/Learning Rate": 1.1457569488644294e-07, "Full-pretrain/Loss": 1.881909966468811, "Full-pretrain/Loss (Raw)": 1.7960858345031738, "Full-pretrain/Step": 9254, "Full-pretrain/Step Time": 17.653531288728118} +{"Full-pretrain/Learning Rate": 1.1376515784327634e-07, "Full-pretrain/Loss": 1.8875739574432373, "Full-pretrain/Loss (Raw)": 1.7802932262420654, "Full-pretrain/Step": 9255, "Full-pretrain/Step Time": 17.65346265025437} +{"Full-pretrain/Learning Rate": 1.1295749141854994e-07, "Full-pretrain/Loss": 1.8867156505584717, "Full-pretrain/Loss (Raw)": 1.9381868839263916, "Full-pretrain/Step": 9256, "Full-pretrain/Step Time": 17.65450469776988} +{"Full-pretrain/Learning Rate": 1.1215269570543085e-07, "Full-pretrain/Loss": 1.8854470252990723, "Full-pretrain/Loss (Raw)": 1.7101495265960693, "Full-pretrain/Step": 9257, "Full-pretrain/Step Time": 17.65570991486311} +{"Full-pretrain/Learning Rate": 1.1135077079675315e-07, "Full-pretrain/Loss": 1.8970415592193604, "Full-pretrain/Loss (Raw)": 1.9975076913833618, "Full-pretrain/Step": 9258, "Full-pretrain/Step Time": 17.655046198517084} +{"Full-pretrain/Learning Rate": 1.1055171678501785e-07, "Full-pretrain/Loss": 1.9112671613693237, "Full-pretrain/Loss (Raw)": 1.935722827911377, "Full-pretrain/Step": 9259, "Full-pretrain/Step Time": 17.65486989170313} +{"Full-pretrain/Learning Rate": 1.0975553376239566e-07, "Full-pretrain/Loss": 1.8973562717437744, "Full-pretrain/Loss (Raw)": 1.5644586086273193, "Full-pretrain/Step": 9260, "Full-pretrain/Step Time": 17.663150779902935} +{"Full-pretrain/Learning Rate": 1.0896222182072424e-07, "Full-pretrain/Loss": 1.8928658962249756, "Full-pretrain/Loss (Raw)": 1.9729379415512085, "Full-pretrain/Step": 9261, "Full-pretrain/Step Time": 17.666071623563766} +{"Full-pretrain/Learning Rate": 1.0817178105151371e-07, "Full-pretrain/Loss": 1.894853115081787, "Full-pretrain/Loss (Raw)": 2.018153190612793, "Full-pretrain/Step": 9262, "Full-pretrain/Step Time": 17.659979866817594} +{"Full-pretrain/Learning Rate": 1.0738421154594114e-07, "Full-pretrain/Loss": 1.8802688121795654, "Full-pretrain/Loss (Raw)": 1.7398884296417236, "Full-pretrain/Step": 9263, "Full-pretrain/Step Time": 17.661875063553452} +{"Full-pretrain/Learning Rate": 1.0659951339485053e-07, "Full-pretrain/Loss": 1.8825587034225464, "Full-pretrain/Loss (Raw)": 1.9697823524475098, "Full-pretrain/Step": 9264, "Full-pretrain/Step Time": 17.663659101352096} +{"Full-pretrain/Learning Rate": 1.0581768668875836e-07, "Full-pretrain/Loss": 1.879504919052124, "Full-pretrain/Loss (Raw)": 2.027710437774658, "Full-pretrain/Step": 9265, "Full-pretrain/Step Time": 17.661187510937452} +{"Full-pretrain/Learning Rate": 1.0503873151785082e-07, "Full-pretrain/Loss": 1.8760384321212769, "Full-pretrain/Loss (Raw)": 1.6966742277145386, "Full-pretrain/Step": 9266, "Full-pretrain/Step Time": 17.661349149420857} +{"Full-pretrain/Learning Rate": 1.0426264797197272e-07, "Full-pretrain/Loss": 1.8780195713043213, "Full-pretrain/Loss (Raw)": 1.828352451324463, "Full-pretrain/Step": 9267, "Full-pretrain/Step Time": 17.668609131127596} +{"Full-pretrain/Learning Rate": 1.0348943614064965e-07, "Full-pretrain/Loss": 1.8841608762741089, "Full-pretrain/Loss (Raw)": 1.917755126953125, "Full-pretrain/Step": 9268, "Full-pretrain/Step Time": 17.67490143701434} +{"Full-pretrain/Learning Rate": 1.027190961130714e-07, "Full-pretrain/Loss": 1.8812865018844604, "Full-pretrain/Loss (Raw)": 1.8459376096725464, "Full-pretrain/Step": 9269, "Full-pretrain/Step Time": 17.670015500858426} +{"Full-pretrain/Learning Rate": 1.0195162797809743e-07, "Full-pretrain/Loss": 1.8785581588745117, "Full-pretrain/Loss (Raw)": 1.6955342292785645, "Full-pretrain/Step": 9270, "Full-pretrain/Step Time": 17.66996826417744} +{"Full-pretrain/Learning Rate": 1.0118703182425137e-07, "Full-pretrain/Loss": 1.8831391334533691, "Full-pretrain/Loss (Raw)": 2.0086708068847656, "Full-pretrain/Step": 9271, "Full-pretrain/Step Time": 17.666359405964613} +{"Full-pretrain/Learning Rate": 1.0042530773973213e-07, "Full-pretrain/Loss": 1.8760038614273071, "Full-pretrain/Loss (Raw)": 1.77432382106781, "Full-pretrain/Step": 9272, "Full-pretrain/Step Time": 17.67272720299661} +{"Full-pretrain/Learning Rate": 9.966645581240274e-08, "Full-pretrain/Loss": 1.8795028924942017, "Full-pretrain/Loss (Raw)": 2.07612681388855, "Full-pretrain/Step": 9273, "Full-pretrain/Step Time": 17.66923438385129} +{"Full-pretrain/Learning Rate": 9.891047612979876e-08, "Full-pretrain/Loss": 1.8946127891540527, "Full-pretrain/Loss (Raw)": 2.0385806560516357, "Full-pretrain/Step": 9274, "Full-pretrain/Step Time": 17.670052375644445} +{"Full-pretrain/Learning Rate": 9.815736877911985e-08, "Full-pretrain/Loss": 1.9057395458221436, "Full-pretrain/Loss (Raw)": 2.026240110397339, "Full-pretrain/Step": 9275, "Full-pretrain/Step Time": 17.668729532510042} +{"Full-pretrain/Learning Rate": 9.740713384723543e-08, "Full-pretrain/Loss": 1.9041171073913574, "Full-pretrain/Loss (Raw)": 1.9913036823272705, "Full-pretrain/Step": 9276, "Full-pretrain/Step Time": 17.6694809589535} +{"Full-pretrain/Learning Rate": 9.665977142068738e-08, "Full-pretrain/Loss": 1.8992201089859009, "Full-pretrain/Loss (Raw)": 1.7851966619491577, "Full-pretrain/Step": 9277, "Full-pretrain/Step Time": 17.668677393347025} +{"Full-pretrain/Learning Rate": 9.591528158568453e-08, "Full-pretrain/Loss": 1.9008044004440308, "Full-pretrain/Loss (Raw)": 1.9517641067504883, "Full-pretrain/Step": 9278, "Full-pretrain/Step Time": 17.66562595590949} +{"Full-pretrain/Learning Rate": 9.51736644281026e-08, "Full-pretrain/Loss": 1.8975913524627686, "Full-pretrain/Loss (Raw)": 1.7530750036239624, "Full-pretrain/Step": 9279, "Full-pretrain/Step Time": 17.662112057209015} +{"Full-pretrain/Learning Rate": 9.443492003348431e-08, "Full-pretrain/Loss": 1.9016480445861816, "Full-pretrain/Loss (Raw)": 1.8272372484207153, "Full-pretrain/Step": 9280, "Full-pretrain/Step Time": 17.662868270650506} +{"Full-pretrain/Learning Rate": 9.369904848704758e-08, "Full-pretrain/Loss": 1.8988080024719238, "Full-pretrain/Loss (Raw)": 1.9392374753952026, "Full-pretrain/Step": 9281, "Full-pretrain/Step Time": 17.66716025955975} +{"Full-pretrain/Learning Rate": 9.296604987366898e-08, "Full-pretrain/Loss": 1.8910062313079834, "Full-pretrain/Loss (Raw)": 1.8128960132598877, "Full-pretrain/Step": 9282, "Full-pretrain/Step Time": 17.663718780502677} +{"Full-pretrain/Learning Rate": 9.223592427790584e-08, "Full-pretrain/Loss": 1.8843268156051636, "Full-pretrain/Loss (Raw)": 1.8084487915039062, "Full-pretrain/Step": 9283, "Full-pretrain/Step Time": 17.6661919914186} +{"Full-pretrain/Learning Rate": 9.150867178397693e-08, "Full-pretrain/Loss": 1.8801136016845703, "Full-pretrain/Loss (Raw)": 1.9956320524215698, "Full-pretrain/Step": 9284, "Full-pretrain/Step Time": 17.660699363797903} +{"Full-pretrain/Learning Rate": 9.078429247576791e-08, "Full-pretrain/Loss": 1.888436198234558, "Full-pretrain/Loss (Raw)": 2.2060940265655518, "Full-pretrain/Step": 9285, "Full-pretrain/Step Time": 17.658035326749086} +{"Full-pretrain/Learning Rate": 9.006278643683696e-08, "Full-pretrain/Loss": 1.8799173831939697, "Full-pretrain/Loss (Raw)": 1.5234830379486084, "Full-pretrain/Step": 9286, "Full-pretrain/Step Time": 17.65931787341833} +{"Full-pretrain/Learning Rate": 8.934415375041195e-08, "Full-pretrain/Loss": 1.8725054264068604, "Full-pretrain/Loss (Raw)": 1.5431116819381714, "Full-pretrain/Step": 9287, "Full-pretrain/Step Time": 17.662072895094752} +{"Full-pretrain/Learning Rate": 8.86283944993821e-08, "Full-pretrain/Loss": 1.8766613006591797, "Full-pretrain/Loss (Raw)": 2.0711750984191895, "Full-pretrain/Step": 9288, "Full-pretrain/Step Time": 17.664645057171583} +{"Full-pretrain/Learning Rate": 8.791550876631193e-08, "Full-pretrain/Loss": 1.8774826526641846, "Full-pretrain/Loss (Raw)": 1.7364355325698853, "Full-pretrain/Step": 9289, "Full-pretrain/Step Time": 17.66612215898931} +{"Full-pretrain/Learning Rate": 8.720549663343291e-08, "Full-pretrain/Loss": 1.8847432136535645, "Full-pretrain/Loss (Raw)": 2.2298457622528076, "Full-pretrain/Step": 9290, "Full-pretrain/Step Time": 17.663241593167186} +{"Full-pretrain/Learning Rate": 8.649835818264618e-08, "Full-pretrain/Loss": 1.878237247467041, "Full-pretrain/Loss (Raw)": 1.7275274991989136, "Full-pretrain/Step": 9291, "Full-pretrain/Step Time": 17.661507746204734} +{"Full-pretrain/Learning Rate": 8.579409349551981e-08, "Full-pretrain/Loss": 1.893377661705017, "Full-pretrain/Loss (Raw)": 2.048954486846924, "Full-pretrain/Step": 9292, "Full-pretrain/Step Time": 17.664130859076977} +{"Full-pretrain/Learning Rate": 8.509270265328884e-08, "Full-pretrain/Loss": 1.8955752849578857, "Full-pretrain/Loss (Raw)": 2.0432610511779785, "Full-pretrain/Step": 9293, "Full-pretrain/Step Time": 17.66893282905221} +{"Full-pretrain/Learning Rate": 8.439418573685797e-08, "Full-pretrain/Loss": 1.8842973709106445, "Full-pretrain/Loss (Raw)": 1.6572624444961548, "Full-pretrain/Step": 9294, "Full-pretrain/Step Time": 17.6669381596148} +{"Full-pretrain/Learning Rate": 8.369854282680168e-08, "Full-pretrain/Loss": 1.887765645980835, "Full-pretrain/Loss (Raw)": 1.850867748260498, "Full-pretrain/Step": 9295, "Full-pretrain/Step Time": 17.666558692231774} +{"Full-pretrain/Learning Rate": 8.300577400336407e-08, "Full-pretrain/Loss": 1.8804419040679932, "Full-pretrain/Loss (Raw)": 1.7354289293289185, "Full-pretrain/Step": 9296, "Full-pretrain/Step Time": 17.665274016559124} +{"Full-pretrain/Learning Rate": 8.231587934645068e-08, "Full-pretrain/Loss": 1.8802251815795898, "Full-pretrain/Loss (Raw)": 2.020771026611328, "Full-pretrain/Step": 9297, "Full-pretrain/Step Time": 17.667874842882156} +{"Full-pretrain/Learning Rate": 8.162885893564786e-08, "Full-pretrain/Loss": 1.8938977718353271, "Full-pretrain/Loss (Raw)": 2.1341991424560547, "Full-pretrain/Step": 9298, "Full-pretrain/Step Time": 17.66372751444578} +{"Full-pretrain/Learning Rate": 8.0944712850195e-08, "Full-pretrain/Loss": 1.8985397815704346, "Full-pretrain/Loss (Raw)": 1.976893663406372, "Full-pretrain/Step": 9299, "Full-pretrain/Step Time": 17.66745567508042} +{"Full-pretrain/Learning Rate": 8.026344116901507e-08, "Full-pretrain/Loss": 1.9048004150390625, "Full-pretrain/Loss (Raw)": 2.1180994510650635, "Full-pretrain/Step": 9300, "Full-pretrain/Step Time": 17.669096464291215} +{"Full-pretrain/Learning Rate": 7.958504397068966e-08, "Full-pretrain/Loss": 1.9064180850982666, "Full-pretrain/Loss (Raw)": 1.8977022171020508, "Full-pretrain/Step": 9301, "Full-pretrain/Step Time": 17.67489825002849} +{"Full-pretrain/Learning Rate": 7.890952133347007e-08, "Full-pretrain/Loss": 1.9158375263214111, "Full-pretrain/Loss (Raw)": 1.9969526529312134, "Full-pretrain/Step": 9302, "Full-pretrain/Step Time": 17.66730099916458} +{"Full-pretrain/Learning Rate": 7.823687333528008e-08, "Full-pretrain/Loss": 1.916100263595581, "Full-pretrain/Loss (Raw)": 2.0170836448669434, "Full-pretrain/Step": 9303, "Full-pretrain/Step Time": 17.676247034221888} +{"Full-pretrain/Learning Rate": 7.756710005371037e-08, "Full-pretrain/Loss": 1.917814016342163, "Full-pretrain/Loss (Raw)": 1.8291637897491455, "Full-pretrain/Step": 9304, "Full-pretrain/Step Time": 17.671742314472795} +{"Full-pretrain/Learning Rate": 7.690020156601585e-08, "Full-pretrain/Loss": 1.913771152496338, "Full-pretrain/Loss (Raw)": 1.946756362915039, "Full-pretrain/Step": 9305, "Full-pretrain/Step Time": 17.66796070151031} +{"Full-pretrain/Learning Rate": 7.623617794912386e-08, "Full-pretrain/Loss": 1.9115386009216309, "Full-pretrain/Loss (Raw)": 1.967137098312378, "Full-pretrain/Step": 9306, "Full-pretrain/Step Time": 17.67204491607845} +{"Full-pretrain/Learning Rate": 7.557502927963145e-08, "Full-pretrain/Loss": 1.9170703887939453, "Full-pretrain/Loss (Raw)": 2.203254222869873, "Full-pretrain/Step": 9307, "Full-pretrain/Step Time": 17.672943798825145} +{"Full-pretrain/Learning Rate": 7.491675563379985e-08, "Full-pretrain/Loss": 1.9154646396636963, "Full-pretrain/Loss (Raw)": 1.939922571182251, "Full-pretrain/Step": 9308, "Full-pretrain/Step Time": 17.666582258418202} +{"Full-pretrain/Learning Rate": 7.426135708756e-08, "Full-pretrain/Loss": 1.9253199100494385, "Full-pretrain/Loss (Raw)": 2.100564956665039, "Full-pretrain/Step": 9309, "Full-pretrain/Step Time": 17.673254132270813} +{"Full-pretrain/Learning Rate": 7.360883371651528e-08, "Full-pretrain/Loss": 1.910515308380127, "Full-pretrain/Loss (Raw)": 1.4780151844024658, "Full-pretrain/Step": 9310, "Full-pretrain/Step Time": 17.666077811270952} +{"Full-pretrain/Learning Rate": 7.295918559593051e-08, "Full-pretrain/Loss": 1.9166384935379028, "Full-pretrain/Loss (Raw)": 1.9490158557891846, "Full-pretrain/Step": 9311, "Full-pretrain/Step Time": 17.672848090529442} +{"Full-pretrain/Learning Rate": 7.231241280074297e-08, "Full-pretrain/Loss": 1.9191373586654663, "Full-pretrain/Loss (Raw)": 1.9072016477584839, "Full-pretrain/Step": 9312, "Full-pretrain/Step Time": 17.66835612989962} +{"Full-pretrain/Learning Rate": 7.166851540555963e-08, "Full-pretrain/Loss": 1.9190189838409424, "Full-pretrain/Loss (Raw)": 1.9354493618011475, "Full-pretrain/Step": 9313, "Full-pretrain/Step Time": 17.671462427824736} +{"Full-pretrain/Learning Rate": 7.102749348465165e-08, "Full-pretrain/Loss": 1.9197649955749512, "Full-pretrain/Loss (Raw)": 1.8367669582366943, "Full-pretrain/Step": 9314, "Full-pretrain/Step Time": 17.664845693856478} +{"Full-pretrain/Learning Rate": 7.038934711196265e-08, "Full-pretrain/Loss": 1.9249448776245117, "Full-pretrain/Loss (Raw)": 1.9742062091827393, "Full-pretrain/Step": 9315, "Full-pretrain/Step Time": 17.66329074278474} +{"Full-pretrain/Learning Rate": 6.975407636110043e-08, "Full-pretrain/Loss": 1.9343359470367432, "Full-pretrain/Loss (Raw)": 2.2961487770080566, "Full-pretrain/Step": 9316, "Full-pretrain/Step Time": 17.655736483633518} +{"Full-pretrain/Learning Rate": 6.912168130534525e-08, "Full-pretrain/Loss": 1.9226018190383911, "Full-pretrain/Loss (Raw)": 1.830599069595337, "Full-pretrain/Step": 9317, "Full-pretrain/Step Time": 17.664925690740347} +{"Full-pretrain/Learning Rate": 6.84921620176443e-08, "Full-pretrain/Loss": 1.9263205528259277, "Full-pretrain/Loss (Raw)": 1.6424846649169922, "Full-pretrain/Step": 9318, "Full-pretrain/Step Time": 17.659458534792066} +{"Full-pretrain/Learning Rate": 6.786551857060896e-08, "Full-pretrain/Loss": 1.9397281408309937, "Full-pretrain/Loss (Raw)": 1.972153902053833, "Full-pretrain/Step": 9319, "Full-pretrain/Step Time": 17.662999466061592} +{"Full-pretrain/Learning Rate": 6.724175103652308e-08, "Full-pretrain/Loss": 1.9294310808181763, "Full-pretrain/Loss (Raw)": 1.7416672706604004, "Full-pretrain/Step": 9320, "Full-pretrain/Step Time": 17.660306356847286} +{"Full-pretrain/Learning Rate": 6.66208594873402e-08, "Full-pretrain/Loss": 1.9365572929382324, "Full-pretrain/Loss (Raw)": 1.964474081993103, "Full-pretrain/Step": 9321, "Full-pretrain/Step Time": 17.66467992030084} +{"Full-pretrain/Learning Rate": 6.600284399468082e-08, "Full-pretrain/Loss": 1.9244623184204102, "Full-pretrain/Loss (Raw)": 1.8428065776824951, "Full-pretrain/Step": 9322, "Full-pretrain/Step Time": 17.6719623580575} +{"Full-pretrain/Learning Rate": 6.538770462982957e-08, "Full-pretrain/Loss": 1.9316699504852295, "Full-pretrain/Loss (Raw)": 1.9581758975982666, "Full-pretrain/Step": 9323, "Full-pretrain/Step Time": 17.669778436422348} +{"Full-pretrain/Learning Rate": 6.47754414637436e-08, "Full-pretrain/Loss": 1.9279614686965942, "Full-pretrain/Loss (Raw)": 1.9302817583084106, "Full-pretrain/Step": 9324, "Full-pretrain/Step Time": 17.66759686730802} +{"Full-pretrain/Learning Rate": 6.416605456704694e-08, "Full-pretrain/Loss": 1.9272514581680298, "Full-pretrain/Loss (Raw)": 2.020540237426758, "Full-pretrain/Step": 9325, "Full-pretrain/Step Time": 17.67091618105769} +{"Full-pretrain/Learning Rate": 6.355954401003339e-08, "Full-pretrain/Loss": 1.9357388019561768, "Full-pretrain/Loss (Raw)": 1.9288564920425415, "Full-pretrain/Step": 9326, "Full-pretrain/Step Time": 17.671671176329255} +{"Full-pretrain/Learning Rate": 6.295590986266642e-08, "Full-pretrain/Loss": 1.9342548847198486, "Full-pretrain/Loss (Raw)": 1.8033852577209473, "Full-pretrain/Step": 9327, "Full-pretrain/Step Time": 17.671215632930398} +{"Full-pretrain/Learning Rate": 6.235515219456811e-08, "Full-pretrain/Loss": 1.9393973350524902, "Full-pretrain/Loss (Raw)": 1.8999882936477661, "Full-pretrain/Step": 9328, "Full-pretrain/Step Time": 17.666054543107748} +{"Full-pretrain/Learning Rate": 6.175727107504137e-08, "Full-pretrain/Loss": 1.9384726285934448, "Full-pretrain/Loss (Raw)": 1.991178035736084, "Full-pretrain/Step": 9329, "Full-pretrain/Step Time": 17.665344337001443} +{"Full-pretrain/Learning Rate": 6.116226657304769e-08, "Full-pretrain/Loss": 1.9307878017425537, "Full-pretrain/Loss (Raw)": 1.8882858753204346, "Full-pretrain/Step": 9330, "Full-pretrain/Step Time": 17.66916187107563} +{"Full-pretrain/Learning Rate": 6.057013875722107e-08, "Full-pretrain/Loss": 1.9349147081375122, "Full-pretrain/Loss (Raw)": 2.108954906463623, "Full-pretrain/Step": 9331, "Full-pretrain/Step Time": 17.671289952471852} +{"Full-pretrain/Learning Rate": 5.998088769586795e-08, "Full-pretrain/Loss": 1.9284515380859375, "Full-pretrain/Loss (Raw)": 1.91127610206604, "Full-pretrain/Step": 9332, "Full-pretrain/Step Time": 17.669642070308328} +{"Full-pretrain/Learning Rate": 5.939451345695346e-08, "Full-pretrain/Loss": 1.9227921962738037, "Full-pretrain/Loss (Raw)": 1.7166037559509277, "Full-pretrain/Step": 9333, "Full-pretrain/Step Time": 17.66413587331772} +{"Full-pretrain/Learning Rate": 5.88110161081179e-08, "Full-pretrain/Loss": 1.927006721496582, "Full-pretrain/Loss (Raw)": 2.1318202018737793, "Full-pretrain/Step": 9334, "Full-pretrain/Step Time": 17.665194489061832} +{"Full-pretrain/Learning Rate": 5.823039571666578e-08, "Full-pretrain/Loss": 1.9219849109649658, "Full-pretrain/Loss (Raw)": 1.8563793897628784, "Full-pretrain/Step": 9335, "Full-pretrain/Step Time": 17.665606569498777} +{"Full-pretrain/Learning Rate": 5.765265234957129e-08, "Full-pretrain/Loss": 1.9182851314544678, "Full-pretrain/Loss (Raw)": 1.7107744216918945, "Full-pretrain/Step": 9336, "Full-pretrain/Step Time": 17.669723453000188} +{"Full-pretrain/Learning Rate": 5.7077786073478356e-08, "Full-pretrain/Loss": 1.9187291860580444, "Full-pretrain/Loss (Raw)": 1.9609640836715698, "Full-pretrain/Step": 9337, "Full-pretrain/Step Time": 17.66839432530105} +{"Full-pretrain/Learning Rate": 5.650579695469782e-08, "Full-pretrain/Loss": 1.9105197191238403, "Full-pretrain/Loss (Raw)": 1.7044352293014526, "Full-pretrain/Step": 9338, "Full-pretrain/Step Time": 17.669191701337695} +{"Full-pretrain/Learning Rate": 5.593668505921024e-08, "Full-pretrain/Loss": 1.9093499183654785, "Full-pretrain/Loss (Raw)": 2.1658194065093994, "Full-pretrain/Step": 9339, "Full-pretrain/Step Time": 17.668406696990132} +{"Full-pretrain/Learning Rate": 5.537045045265754e-08, "Full-pretrain/Loss": 1.9239721298217773, "Full-pretrain/Loss (Raw)": 2.4078335762023926, "Full-pretrain/Step": 9340, "Full-pretrain/Step Time": 17.67013198696077} +{"Full-pretrain/Learning Rate": 5.480709320035693e-08, "Full-pretrain/Loss": 1.9205520153045654, "Full-pretrain/Loss (Raw)": 1.9911186695098877, "Full-pretrain/Step": 9341, "Full-pretrain/Step Time": 17.65986116603017} +{"Full-pretrain/Learning Rate": 5.424661336729253e-08, "Full-pretrain/Loss": 1.942172646522522, "Full-pretrain/Loss (Raw)": 2.1698763370513916, "Full-pretrain/Step": 9342, "Full-pretrain/Step Time": 17.663545044139028} +{"Full-pretrain/Learning Rate": 5.3689011018115406e-08, "Full-pretrain/Loss": 1.9385648965835571, "Full-pretrain/Loss (Raw)": 1.8335710763931274, "Full-pretrain/Step": 9343, "Full-pretrain/Step Time": 17.66212389804423} +{"Full-pretrain/Learning Rate": 5.3134286217143556e-08, "Full-pretrain/Loss": 1.9378976821899414, "Full-pretrain/Loss (Raw)": 1.8858497142791748, "Full-pretrain/Step": 9344, "Full-pretrain/Step Time": 17.667434364557266} +{"Full-pretrain/Learning Rate": 5.258243902836468e-08, "Full-pretrain/Loss": 1.940680980682373, "Full-pretrain/Loss (Raw)": 2.0245132446289062, "Full-pretrain/Step": 9345, "Full-pretrain/Step Time": 17.665433602407575} +{"Full-pretrain/Learning Rate": 5.203346951543342e-08, "Full-pretrain/Loss": 1.9471607208251953, "Full-pretrain/Loss (Raw)": 2.044119358062744, "Full-pretrain/Step": 9346, "Full-pretrain/Step Time": 17.667380910366774} +{"Full-pretrain/Learning Rate": 5.148737774167411e-08, "Full-pretrain/Loss": 1.9534412622451782, "Full-pretrain/Loss (Raw)": 2.1751866340637207, "Full-pretrain/Step": 9347, "Full-pretrain/Step Time": 17.665714172646403} +{"Full-pretrain/Learning Rate": 5.094416377008082e-08, "Full-pretrain/Loss": 1.9473313093185425, "Full-pretrain/Loss (Raw)": 2.1006274223327637, "Full-pretrain/Step": 9348, "Full-pretrain/Step Time": 17.668643163517118} +{"Full-pretrain/Learning Rate": 5.040382766330898e-08, "Full-pretrain/Loss": 1.9522221088409424, "Full-pretrain/Loss (Raw)": 1.9871039390563965, "Full-pretrain/Step": 9349, "Full-pretrain/Step Time": 17.671070715412498} +{"Full-pretrain/Learning Rate": 4.9866369483686504e-08, "Full-pretrain/Loss": 1.953525185585022, "Full-pretrain/Loss (Raw)": 1.6841821670532227, "Full-pretrain/Step": 9350, "Full-pretrain/Step Time": 17.66935970634222} +{"Full-pretrain/Learning Rate": 4.9331789293211026e-08, "Full-pretrain/Loss": 1.9461698532104492, "Full-pretrain/Loss (Raw)": 1.7367854118347168, "Full-pretrain/Step": 9351, "Full-pretrain/Step Time": 17.6692658290267} +{"Full-pretrain/Learning Rate": 4.880008715354434e-08, "Full-pretrain/Loss": 1.9544951915740967, "Full-pretrain/Loss (Raw)": 2.0080783367156982, "Full-pretrain/Step": 9352, "Full-pretrain/Step Time": 17.667651411145926} +{"Full-pretrain/Learning Rate": 4.8271263126020705e-08, "Full-pretrain/Loss": 1.9516329765319824, "Full-pretrain/Loss (Raw)": 1.8728851079940796, "Full-pretrain/Step": 9353, "Full-pretrain/Step Time": 17.669301725924015} +{"Full-pretrain/Learning Rate": 4.7745317271638556e-08, "Full-pretrain/Loss": 1.955387830734253, "Full-pretrain/Loss (Raw)": 1.962957501411438, "Full-pretrain/Step": 9354, "Full-pretrain/Step Time": 17.66921997256577} +{"Full-pretrain/Learning Rate": 4.722224965106603e-08, "Full-pretrain/Loss": 1.955435872077942, "Full-pretrain/Loss (Raw)": 1.9597127437591553, "Full-pretrain/Step": 9355, "Full-pretrain/Step Time": 17.66622463427484} +{"Full-pretrain/Learning Rate": 4.670206032463542e-08, "Full-pretrain/Loss": 1.9525644779205322, "Full-pretrain/Loss (Raw)": 1.8383996486663818, "Full-pretrain/Step": 9356, "Full-pretrain/Step Time": 17.669503077864647} +{"Full-pretrain/Learning Rate": 4.618474935235429e-08, "Full-pretrain/Loss": 1.9439302682876587, "Full-pretrain/Loss (Raw)": 1.7442442178726196, "Full-pretrain/Step": 9357, "Full-pretrain/Step Time": 17.669547276571393} +{"Full-pretrain/Learning Rate": 4.5670316793891555e-08, "Full-pretrain/Loss": 1.9445024728775024, "Full-pretrain/Loss (Raw)": 1.9471690654754639, "Full-pretrain/Step": 9358, "Full-pretrain/Step Time": 17.670042540878057} +{"Full-pretrain/Learning Rate": 4.515876270859143e-08, "Full-pretrain/Loss": 1.9513260126113892, "Full-pretrain/Loss (Raw)": 2.021735429763794, "Full-pretrain/Step": 9359, "Full-pretrain/Step Time": 17.67053021118045} +{"Full-pretrain/Learning Rate": 4.4650087155453936e-08, "Full-pretrain/Loss": 1.9503685235977173, "Full-pretrain/Loss (Raw)": 1.869349718093872, "Full-pretrain/Step": 9360, "Full-pretrain/Step Time": 17.667511254549026} +{"Full-pretrain/Learning Rate": 4.414429019316268e-08, "Full-pretrain/Loss": 1.9441262483596802, "Full-pretrain/Loss (Raw)": 1.7914260625839233, "Full-pretrain/Step": 9361, "Full-pretrain/Step Time": 17.67024229094386} +{"Full-pretrain/Learning Rate": 4.3641371880057123e-08, "Full-pretrain/Loss": 1.941848635673523, "Full-pretrain/Loss (Raw)": 1.8154029846191406, "Full-pretrain/Step": 9362, "Full-pretrain/Step Time": 17.67426784709096} +{"Full-pretrain/Learning Rate": 4.3141332274146404e-08, "Full-pretrain/Loss": 1.932550311088562, "Full-pretrain/Loss (Raw)": 1.8114087581634521, "Full-pretrain/Step": 9363, "Full-pretrain/Step Time": 17.673699487000704} +{"Full-pretrain/Learning Rate": 4.2644171433114945e-08, "Full-pretrain/Loss": 1.9352469444274902, "Full-pretrain/Loss (Raw)": 1.9975658655166626, "Full-pretrain/Step": 9364, "Full-pretrain/Step Time": 17.670879509299994} +{"Full-pretrain/Learning Rate": 4.2149889414305756e-08, "Full-pretrain/Loss": 1.9397985935211182, "Full-pretrain/Loss (Raw)": 1.8622591495513916, "Full-pretrain/Step": 9365, "Full-pretrain/Step Time": 17.678744718432426} +{"Full-pretrain/Learning Rate": 4.165848627473712e-08, "Full-pretrain/Loss": 1.9313228130340576, "Full-pretrain/Loss (Raw)": 1.860594391822815, "Full-pretrain/Step": 9366, "Full-pretrain/Step Time": 17.68118134327233} +{"Full-pretrain/Learning Rate": 4.1169962071091474e-08, "Full-pretrain/Loss": 1.9394954442977905, "Full-pretrain/Loss (Raw)": 2.117905378341675, "Full-pretrain/Step": 9367, "Full-pretrain/Step Time": 17.679516717791557} +{"Full-pretrain/Learning Rate": 4.068431685971818e-08, "Full-pretrain/Loss": 1.952458143234253, "Full-pretrain/Loss (Raw)": 2.125577688217163, "Full-pretrain/Step": 9368, "Full-pretrain/Step Time": 17.67919670045376} +{"Full-pretrain/Learning Rate": 4.020155069663911e-08, "Full-pretrain/Loss": 1.9566068649291992, "Full-pretrain/Loss (Raw)": 2.09372615814209, "Full-pretrain/Step": 9369, "Full-pretrain/Step Time": 17.68041954562068} +{"Full-pretrain/Learning Rate": 3.9721663637537485e-08, "Full-pretrain/Loss": 1.96450936794281, "Full-pretrain/Loss (Raw)": 1.9573144912719727, "Full-pretrain/Step": 9370, "Full-pretrain/Step Time": 17.684231678023934} +{"Full-pretrain/Learning Rate": 3.924465573777458e-08, "Full-pretrain/Loss": 1.9572532176971436, "Full-pretrain/Loss (Raw)": 1.9336224794387817, "Full-pretrain/Step": 9371, "Full-pretrain/Step Time": 17.68714931793511} +{"Full-pretrain/Learning Rate": 3.877052705236472e-08, "Full-pretrain/Loss": 1.939803957939148, "Full-pretrain/Loss (Raw)": 1.8494575023651123, "Full-pretrain/Step": 9372, "Full-pretrain/Step Time": 17.68248350918293} +{"Full-pretrain/Learning Rate": 3.829927763600305e-08, "Full-pretrain/Loss": 1.9392644166946411, "Full-pretrain/Loss (Raw)": 1.9738547801971436, "Full-pretrain/Step": 9373, "Full-pretrain/Step Time": 17.680682668462396} +{"Full-pretrain/Learning Rate": 3.783090754304885e-08, "Full-pretrain/Loss": 1.9226617813110352, "Full-pretrain/Loss (Raw)": 1.6385899782180786, "Full-pretrain/Step": 9374, "Full-pretrain/Step Time": 17.68075511790812} +{"Full-pretrain/Learning Rate": 3.7365416827528364e-08, "Full-pretrain/Loss": 1.923384189605713, "Full-pretrain/Loss (Raw)": 1.856689691543579, "Full-pretrain/Step": 9375, "Full-pretrain/Step Time": 17.690493686124682} +{"Full-pretrain/Learning Rate": 3.690280554313197e-08, "Full-pretrain/Loss": 1.9305157661437988, "Full-pretrain/Loss (Raw)": 2.114058017730713, "Full-pretrain/Step": 9376, "Full-pretrain/Step Time": 17.681630225852132} +{"Full-pretrain/Learning Rate": 3.644307374322531e-08, "Full-pretrain/Loss": 1.938122272491455, "Full-pretrain/Loss (Raw)": 2.2679214477539062, "Full-pretrain/Step": 9377, "Full-pretrain/Step Time": 17.674518393352628} +{"Full-pretrain/Learning Rate": 3.598622148083819e-08, "Full-pretrain/Loss": 1.9487550258636475, "Full-pretrain/Loss (Raw)": 2.3843650817871094, "Full-pretrain/Step": 9378, "Full-pretrain/Step Time": 17.67630354873836} +{"Full-pretrain/Learning Rate": 3.553224880866735e-08, "Full-pretrain/Loss": 1.9477208852767944, "Full-pretrain/Loss (Raw)": 2.142096996307373, "Full-pretrain/Step": 9379, "Full-pretrain/Step Time": 17.681834993883967} +{"Full-pretrain/Learning Rate": 3.508115577907645e-08, "Full-pretrain/Loss": 1.9385087490081787, "Full-pretrain/Loss (Raw)": 1.8058350086212158, "Full-pretrain/Step": 9380, "Full-pretrain/Step Time": 17.67908113077283} +{"Full-pretrain/Learning Rate": 3.463294244410165e-08, "Full-pretrain/Loss": 1.9389337301254272, "Full-pretrain/Loss (Raw)": 2.000706911087036, "Full-pretrain/Step": 9381, "Full-pretrain/Step Time": 17.67541710473597} +{"Full-pretrain/Learning Rate": 3.418760885544325e-08, "Full-pretrain/Loss": 1.9456417560577393, "Full-pretrain/Loss (Raw)": 1.8988392353057861, "Full-pretrain/Step": 9382, "Full-pretrain/Step Time": 17.673357667401433} +{"Full-pretrain/Learning Rate": 3.374515506447129e-08, "Full-pretrain/Loss": 1.947995901107788, "Full-pretrain/Loss (Raw)": 1.812117099761963, "Full-pretrain/Step": 9383, "Full-pretrain/Step Time": 17.679124092683196} +{"Full-pretrain/Learning Rate": 3.330558112222271e-08, "Full-pretrain/Loss": 1.9421350955963135, "Full-pretrain/Loss (Raw)": 1.8205289840698242, "Full-pretrain/Step": 9384, "Full-pretrain/Step Time": 17.683807572349906} +{"Full-pretrain/Learning Rate": 3.2868887079401386e-08, "Full-pretrain/Loss": 1.949791669845581, "Full-pretrain/Loss (Raw)": 2.1178977489471436, "Full-pretrain/Step": 9385, "Full-pretrain/Step Time": 17.67675332352519} +{"Full-pretrain/Learning Rate": 3.2435072986378154e-08, "Full-pretrain/Loss": 1.9459092617034912, "Full-pretrain/Loss (Raw)": 1.8387179374694824, "Full-pretrain/Step": 9386, "Full-pretrain/Step Time": 17.673822602257133} +{"Full-pretrain/Learning Rate": 3.200413889319631e-08, "Full-pretrain/Loss": 1.9437956809997559, "Full-pretrain/Loss (Raw)": 1.8920836448669434, "Full-pretrain/Step": 9387, "Full-pretrain/Step Time": 17.67943986132741} +{"Full-pretrain/Learning Rate": 3.157608484956332e-08, "Full-pretrain/Loss": 1.9481360912322998, "Full-pretrain/Loss (Raw)": 1.9772905111312866, "Full-pretrain/Step": 9388, "Full-pretrain/Step Time": 17.682847920805216} +{"Full-pretrain/Learning Rate": 3.115091090485356e-08, "Full-pretrain/Loss": 1.9516078233718872, "Full-pretrain/Loss (Raw)": 1.855341911315918, "Full-pretrain/Step": 9389, "Full-pretrain/Step Time": 17.67807531543076} +{"Full-pretrain/Learning Rate": 3.0728617108111147e-08, "Full-pretrain/Loss": 1.9452288150787354, "Full-pretrain/Loss (Raw)": 1.7430384159088135, "Full-pretrain/Step": 9390, "Full-pretrain/Step Time": 17.67893884703517} +{"Full-pretrain/Learning Rate": 3.030920350804711e-08, "Full-pretrain/Loss": 1.93912672996521, "Full-pretrain/Loss (Raw)": 1.8264737129211426, "Full-pretrain/Step": 9391, "Full-pretrain/Step Time": 17.680942563340068} +{"Full-pretrain/Learning Rate": 2.98926701530422e-08, "Full-pretrain/Loss": 1.9428210258483887, "Full-pretrain/Loss (Raw)": 1.987564206123352, "Full-pretrain/Step": 9392, "Full-pretrain/Step Time": 17.685563964769244} +{"Full-pretrain/Learning Rate": 2.947901709114409e-08, "Full-pretrain/Loss": 1.945199966430664, "Full-pretrain/Loss (Raw)": 1.8675509691238403, "Full-pretrain/Step": 9393, "Full-pretrain/Step Time": 17.68060089275241} +{"Full-pretrain/Learning Rate": 2.9068244370064613e-08, "Full-pretrain/Loss": 1.9458450078964233, "Full-pretrain/Loss (Raw)": 1.8360463380813599, "Full-pretrain/Step": 9394, "Full-pretrain/Step Time": 17.68236245959997} +{"Full-pretrain/Learning Rate": 2.8660352037188088e-08, "Full-pretrain/Loss": 1.947047472000122, "Full-pretrain/Loss (Raw)": 1.849888563156128, "Full-pretrain/Step": 9395, "Full-pretrain/Step Time": 17.68291986733675} +{"Full-pretrain/Learning Rate": 2.8255340139565767e-08, "Full-pretrain/Loss": 1.9427953958511353, "Full-pretrain/Loss (Raw)": 1.8614957332611084, "Full-pretrain/Step": 9396, "Full-pretrain/Step Time": 17.67962290532887} +{"Full-pretrain/Learning Rate": 2.785320872391306e-08, "Full-pretrain/Loss": 1.9422004222869873, "Full-pretrain/Loss (Raw)": 1.8432245254516602, "Full-pretrain/Step": 9397, "Full-pretrain/Step Time": 17.68235852383077} +{"Full-pretrain/Learning Rate": 2.745395783661786e-08, "Full-pretrain/Loss": 1.9448977708816528, "Full-pretrain/Loss (Raw)": 1.9469068050384521, "Full-pretrain/Step": 9398, "Full-pretrain/Step Time": 17.680937595665455} +{"Full-pretrain/Learning Rate": 2.7057587523729445e-08, "Full-pretrain/Loss": 1.941698670387268, "Full-pretrain/Loss (Raw)": 2.015533447265625, "Full-pretrain/Step": 9399, "Full-pretrain/Step Time": 17.68290976062417} +{"Full-pretrain/Learning Rate": 2.6664097830975123e-08, "Full-pretrain/Loss": 1.9324504137039185, "Full-pretrain/Loss (Raw)": 1.82963228225708, "Full-pretrain/Step": 9400, "Full-pretrain/Step Time": 17.678990801796317} +{"Full-pretrain/Learning Rate": 2.627348880374081e-08, "Full-pretrain/Loss": 1.9228553771972656, "Full-pretrain/Loss (Raw)": 1.786686658859253, "Full-pretrain/Step": 9401, "Full-pretrain/Step Time": 17.682434590533376} +{"Full-pretrain/Learning Rate": 2.5885760487082135e-08, "Full-pretrain/Loss": 1.9187462329864502, "Full-pretrain/Loss (Raw)": 1.8258235454559326, "Full-pretrain/Step": 9402, "Full-pretrain/Step Time": 17.67725702188909} +{"Full-pretrain/Learning Rate": 2.550091292572443e-08, "Full-pretrain/Loss": 1.9183396100997925, "Full-pretrain/Loss (Raw)": 1.920609951019287, "Full-pretrain/Step": 9403, "Full-pretrain/Step Time": 17.6817620228976} +{"Full-pretrain/Learning Rate": 2.5118946164059963e-08, "Full-pretrain/Loss": 1.92438805103302, "Full-pretrain/Loss (Raw)": 2.04300594329834, "Full-pretrain/Step": 9404, "Full-pretrain/Step Time": 17.67525958828628} +{"Full-pretrain/Learning Rate": 2.4739860246150716e-08, "Full-pretrain/Loss": 1.922997236251831, "Full-pretrain/Loss (Raw)": 1.9293509721755981, "Full-pretrain/Step": 9405, "Full-pretrain/Step Time": 17.679960755631328} +{"Full-pretrain/Learning Rate": 2.4363655215717264e-08, "Full-pretrain/Loss": 1.935838222503662, "Full-pretrain/Loss (Raw)": 2.049501657485962, "Full-pretrain/Step": 9406, "Full-pretrain/Step Time": 17.678434282541275} +{"Full-pretrain/Learning Rate": 2.3990331116161e-08, "Full-pretrain/Loss": 1.9433300495147705, "Full-pretrain/Loss (Raw)": 2.0964274406433105, "Full-pretrain/Step": 9407, "Full-pretrain/Step Time": 17.68359673023224} +{"Full-pretrain/Learning Rate": 2.361988799054471e-08, "Full-pretrain/Loss": 1.9440914392471313, "Full-pretrain/Loss (Raw)": 2.1384224891662598, "Full-pretrain/Step": 9408, "Full-pretrain/Step Time": 17.677774094045162} +{"Full-pretrain/Learning Rate": 2.3252325881595316e-08, "Full-pretrain/Loss": 1.9392268657684326, "Full-pretrain/Loss (Raw)": 2.112255573272705, "Full-pretrain/Step": 9409, "Full-pretrain/Step Time": 17.681401105597615} +{"Full-pretrain/Learning Rate": 2.288764483171224e-08, "Full-pretrain/Loss": 1.9236098527908325, "Full-pretrain/Loss (Raw)": 1.8846204280853271, "Full-pretrain/Step": 9410, "Full-pretrain/Step Time": 17.679786141961813} +{"Full-pretrain/Learning Rate": 2.2525844882964607e-08, "Full-pretrain/Loss": 1.9110050201416016, "Full-pretrain/Loss (Raw)": 1.7387416362762451, "Full-pretrain/Step": 9411, "Full-pretrain/Step Time": 17.675721598789096} +{"Full-pretrain/Learning Rate": 2.2166926077080153e-08, "Full-pretrain/Loss": 1.9152274131774902, "Full-pretrain/Loss (Raw)": 1.9409502744674683, "Full-pretrain/Step": 9412, "Full-pretrain/Step Time": 17.68511389195919} +{"Full-pretrain/Learning Rate": 2.181088845546464e-08, "Full-pretrain/Loss": 1.910600185394287, "Full-pretrain/Loss (Raw)": 1.8526344299316406, "Full-pretrain/Step": 9413, "Full-pretrain/Step Time": 17.68616422638297} +{"Full-pretrain/Learning Rate": 2.1457732059182443e-08, "Full-pretrain/Loss": 1.9169515371322632, "Full-pretrain/Loss (Raw)": 2.1020865440368652, "Full-pretrain/Step": 9414, "Full-pretrain/Step Time": 17.684974478557706} +{"Full-pretrain/Learning Rate": 2.1107456928975978e-08, "Full-pretrain/Loss": 1.9230690002441406, "Full-pretrain/Loss (Raw)": 2.007875442504883, "Full-pretrain/Step": 9415, "Full-pretrain/Step Time": 17.68458983488381} +{"Full-pretrain/Learning Rate": 2.0760063105243475e-08, "Full-pretrain/Loss": 1.9243190288543701, "Full-pretrain/Loss (Raw)": 1.8605259656906128, "Full-pretrain/Step": 9416, "Full-pretrain/Step Time": 17.68222908861935} +{"Full-pretrain/Learning Rate": 2.041555062806122e-08, "Full-pretrain/Loss": 1.9201090335845947, "Full-pretrain/Loss (Raw)": 1.983182430267334, "Full-pretrain/Step": 9417, "Full-pretrain/Step Time": 17.678253723308444} +{"Full-pretrain/Learning Rate": 2.0073919537166864e-08, "Full-pretrain/Loss": 1.9177162647247314, "Full-pretrain/Loss (Raw)": 1.7621498107910156, "Full-pretrain/Step": 9418, "Full-pretrain/Step Time": 17.68587322719395} +{"Full-pretrain/Learning Rate": 1.9735169871964997e-08, "Full-pretrain/Loss": 1.9230868816375732, "Full-pretrain/Loss (Raw)": 2.0639424324035645, "Full-pretrain/Step": 9419, "Full-pretrain/Step Time": 17.681758334860206} +{"Full-pretrain/Learning Rate": 1.9399301671535473e-08, "Full-pretrain/Loss": 1.9170650243759155, "Full-pretrain/Loss (Raw)": 1.7845875024795532, "Full-pretrain/Step": 9420, "Full-pretrain/Step Time": 17.680346401408315} +{"Full-pretrain/Learning Rate": 1.9066314974613974e-08, "Full-pretrain/Loss": 1.9256914854049683, "Full-pretrain/Loss (Raw)": 2.1313905715942383, "Full-pretrain/Step": 9421, "Full-pretrain/Step Time": 17.67448245920241} +{"Full-pretrain/Learning Rate": 1.873620981961699e-08, "Full-pretrain/Loss": 1.932378888130188, "Full-pretrain/Loss (Raw)": 1.9570362567901611, "Full-pretrain/Step": 9422, "Full-pretrain/Step Time": 17.675925489515066} +{"Full-pretrain/Learning Rate": 1.840898624461962e-08, "Full-pretrain/Loss": 1.9358251094818115, "Full-pretrain/Loss (Raw)": 1.9367527961730957, "Full-pretrain/Step": 9423, "Full-pretrain/Step Time": 17.673971865326166} +{"Full-pretrain/Learning Rate": 1.808464428736667e-08, "Full-pretrain/Loss": 1.9410556554794312, "Full-pretrain/Loss (Raw)": 2.154939889907837, "Full-pretrain/Step": 9424, "Full-pretrain/Step Time": 17.67044387757778} +{"Full-pretrain/Learning Rate": 1.7763183985269883e-08, "Full-pretrain/Loss": 1.9429256916046143, "Full-pretrain/Loss (Raw)": 1.9273940324783325, "Full-pretrain/Step": 9425, "Full-pretrain/Step Time": 17.676010984927416} +{"Full-pretrain/Learning Rate": 1.744460537540793e-08, "Full-pretrain/Loss": 1.9446523189544678, "Full-pretrain/Loss (Raw)": 1.8912954330444336, "Full-pretrain/Step": 9426, "Full-pretrain/Step Time": 17.674037439748645} +{"Full-pretrain/Learning Rate": 1.7128908494534745e-08, "Full-pretrain/Loss": 1.9510619640350342, "Full-pretrain/Loss (Raw)": 2.055002212524414, "Full-pretrain/Step": 9427, "Full-pretrain/Step Time": 17.675676530227065} +{"Full-pretrain/Learning Rate": 1.681609337906287e-08, "Full-pretrain/Loss": 1.9593127965927124, "Full-pretrain/Loss (Raw)": 2.125519275665283, "Full-pretrain/Step": 9428, "Full-pretrain/Step Time": 17.671113474294543} +{"Full-pretrain/Learning Rate": 1.6506160065071775e-08, "Full-pretrain/Loss": 1.9470840692520142, "Full-pretrain/Loss (Raw)": 1.4519054889678955, "Full-pretrain/Step": 9429, "Full-pretrain/Step Time": 17.66787524521351} +{"Full-pretrain/Learning Rate": 1.6199108588316193e-08, "Full-pretrain/Loss": 1.941578984260559, "Full-pretrain/Loss (Raw)": 1.7707440853118896, "Full-pretrain/Step": 9430, "Full-pretrain/Step Time": 17.673989618197083} +{"Full-pretrain/Learning Rate": 1.5894938984215013e-08, "Full-pretrain/Loss": 1.9229531288146973, "Full-pretrain/Loss (Raw)": 1.4195092916488647, "Full-pretrain/Step": 9431, "Full-pretrain/Step Time": 17.67224445566535} +{"Full-pretrain/Learning Rate": 1.5593651287851285e-08, "Full-pretrain/Loss": 1.9257123470306396, "Full-pretrain/Loss (Raw)": 1.9179219007492065, "Full-pretrain/Step": 9432, "Full-pretrain/Step Time": 17.67255619727075} +{"Full-pretrain/Learning Rate": 1.529524553398054e-08, "Full-pretrain/Loss": 1.930342197418213, "Full-pretrain/Loss (Raw)": 1.9348483085632324, "Full-pretrain/Step": 9433, "Full-pretrain/Step Time": 17.680604064837098} +{"Full-pretrain/Learning Rate": 1.4999721757022467e-08, "Full-pretrain/Loss": 1.9367119073867798, "Full-pretrain/Loss (Raw)": 2.0296502113342285, "Full-pretrain/Step": 9434, "Full-pretrain/Step Time": 17.672042882069945} +{"Full-pretrain/Learning Rate": 1.4707079991066464e-08, "Full-pretrain/Loss": 1.9348580837249756, "Full-pretrain/Loss (Raw)": 1.8612887859344482, "Full-pretrain/Step": 9435, "Full-pretrain/Step Time": 17.67369118332863} +{"Full-pretrain/Learning Rate": 1.4417320269868861e-08, "Full-pretrain/Loss": 1.935563564300537, "Full-pretrain/Loss (Raw)": 2.0655829906463623, "Full-pretrain/Step": 9436, "Full-pretrain/Step Time": 17.67980958148837} +{"Full-pretrain/Learning Rate": 1.4130442626850149e-08, "Full-pretrain/Loss": 1.9352927207946777, "Full-pretrain/Loss (Raw)": 1.9206823110580444, "Full-pretrain/Step": 9437, "Full-pretrain/Step Time": 17.672952001914382} +{"Full-pretrain/Learning Rate": 1.3846447095106074e-08, "Full-pretrain/Loss": 1.925614833831787, "Full-pretrain/Loss (Raw)": 1.7398097515106201, "Full-pretrain/Step": 9438, "Full-pretrain/Step Time": 17.674311434850097} +{"Full-pretrain/Learning Rate": 1.3565333707393769e-08, "Full-pretrain/Loss": 1.9283044338226318, "Full-pretrain/Loss (Raw)": 2.1824951171875, "Full-pretrain/Step": 9439, "Full-pretrain/Step Time": 17.672123109921813} +{"Full-pretrain/Learning Rate": 1.3287102496140069e-08, "Full-pretrain/Loss": 1.9138600826263428, "Full-pretrain/Loss (Raw)": 1.6762018203735352, "Full-pretrain/Step": 9440, "Full-pretrain/Step Time": 17.675026200711727} +{"Full-pretrain/Learning Rate": 1.3011753493438749e-08, "Full-pretrain/Loss": 1.9066139459609985, "Full-pretrain/Loss (Raw)": 1.8803777694702148, "Full-pretrain/Step": 9441, "Full-pretrain/Step Time": 17.672336857765913} +{"Full-pretrain/Learning Rate": 1.2739286731047739e-08, "Full-pretrain/Loss": 1.910275936126709, "Full-pretrain/Loss (Raw)": 2.0018062591552734, "Full-pretrain/Step": 9442, "Full-pretrain/Step Time": 17.671200750395656} +{"Full-pretrain/Learning Rate": 1.2469702240400227e-08, "Full-pretrain/Loss": 1.9033854007720947, "Full-pretrain/Loss (Raw)": 1.5182428359985352, "Full-pretrain/Step": 9443, "Full-pretrain/Step Time": 17.683498000726104} +{"Full-pretrain/Learning Rate": 1.2203000052590785e-08, "Full-pretrain/Loss": 1.9056105613708496, "Full-pretrain/Loss (Raw)": 2.012155532836914, "Full-pretrain/Step": 9444, "Full-pretrain/Step Time": 17.683167392387986} +{"Full-pretrain/Learning Rate": 1.1939180198386468e-08, "Full-pretrain/Loss": 1.9087355136871338, "Full-pretrain/Loss (Raw)": 1.9526318311691284, "Full-pretrain/Step": 9445, "Full-pretrain/Step Time": 17.67842224612832} +{"Full-pretrain/Learning Rate": 1.1678242708212939e-08, "Full-pretrain/Loss": 1.8922579288482666, "Full-pretrain/Loss (Raw)": 1.57480788230896, "Full-pretrain/Step": 9446, "Full-pretrain/Step Time": 17.681980326771736} +{"Full-pretrain/Learning Rate": 1.1420187612173894e-08, "Full-pretrain/Loss": 1.892068862915039, "Full-pretrain/Loss (Raw)": 2.0018210411071777, "Full-pretrain/Step": 9447, "Full-pretrain/Step Time": 17.682601204141974} +{"Full-pretrain/Learning Rate": 1.1165014940037189e-08, "Full-pretrain/Loss": 1.892820119857788, "Full-pretrain/Loss (Raw)": 1.884568452835083, "Full-pretrain/Step": 9448, "Full-pretrain/Step Time": 17.68153116479516} +{"Full-pretrain/Learning Rate": 1.091272472123206e-08, "Full-pretrain/Loss": 1.8904846906661987, "Full-pretrain/Loss (Raw)": 1.908447027206421, "Full-pretrain/Step": 9449, "Full-pretrain/Step Time": 17.680825458839536} +{"Full-pretrain/Learning Rate": 1.0663316984860228e-08, "Full-pretrain/Loss": 1.8906234502792358, "Full-pretrain/Loss (Raw)": 1.7665915489196777, "Full-pretrain/Step": 9450, "Full-pretrain/Step Time": 17.674499321728945} +{"Full-pretrain/Learning Rate": 1.0416791759695899e-08, "Full-pretrain/Loss": 1.8785004615783691, "Full-pretrain/Loss (Raw)": 1.6760029792785645, "Full-pretrain/Step": 9451, "Full-pretrain/Step Time": 17.67295105755329} +{"Full-pretrain/Learning Rate": 1.0173149074171883e-08, "Full-pretrain/Loss": 1.8757808208465576, "Full-pretrain/Loss (Raw)": 1.697561502456665, "Full-pretrain/Step": 9452, "Full-pretrain/Step Time": 17.6759876254946} +{"Full-pretrain/Learning Rate": 9.932388956393479e-09, "Full-pretrain/Loss": 1.8709486722946167, "Full-pretrain/Loss (Raw)": 1.9767634868621826, "Full-pretrain/Step": 9453, "Full-pretrain/Step Time": 17.67557123117149} +{"Full-pretrain/Learning Rate": 9.694511434130139e-09, "Full-pretrain/Loss": 1.8664439916610718, "Full-pretrain/Loss (Raw)": 1.8128842115402222, "Full-pretrain/Step": 9454, "Full-pretrain/Step Time": 17.671209855005145} +{"Full-pretrain/Learning Rate": 9.459516534823797e-09, "Full-pretrain/Loss": 1.8635213375091553, "Full-pretrain/Loss (Raw)": 1.8432278633117676, "Full-pretrain/Step": 9455, "Full-pretrain/Step Time": 17.669357968494296} +{"Full-pretrain/Learning Rate": 9.227404285580555e-09, "Full-pretrain/Loss": 1.871934175491333, "Full-pretrain/Loss (Raw)": 2.42415189743042, "Full-pretrain/Step": 9456, "Full-pretrain/Step Time": 17.671784419566393} +{"Full-pretrain/Learning Rate": 8.998174713173435e-09, "Full-pretrain/Loss": 1.8718897104263306, "Full-pretrain/Loss (Raw)": 1.9259722232818604, "Full-pretrain/Step": 9457, "Full-pretrain/Step Time": 17.67881915718317} +{"Full-pretrain/Learning Rate": 8.771827844042402e-09, "Full-pretrain/Loss": 1.8833281993865967, "Full-pretrain/Loss (Raw)": 2.2573251724243164, "Full-pretrain/Step": 9458, "Full-pretrain/Step Time": 17.676470819860697} +{"Full-pretrain/Learning Rate": 8.548363704302676e-09, "Full-pretrain/Loss": 1.8842384815216064, "Full-pretrain/Loss (Raw)": 2.0841362476348877, "Full-pretrain/Step": 9459, "Full-pretrain/Step Time": 17.672024751082063} +{"Full-pretrain/Learning Rate": 8.327782319722532e-09, "Full-pretrain/Loss": 1.8753204345703125, "Full-pretrain/Loss (Raw)": 1.8401360511779785, "Full-pretrain/Step": 9460, "Full-pretrain/Step Time": 17.676868204027414} +{"Full-pretrain/Learning Rate": 8.11008371575106e-09, "Full-pretrain/Loss": 1.884278416633606, "Full-pretrain/Loss (Raw)": 1.7385621070861816, "Full-pretrain/Step": 9461, "Full-pretrain/Step Time": 17.678601061925292} +{"Full-pretrain/Learning Rate": 7.895267917501504e-09, "Full-pretrain/Loss": 1.8798757791519165, "Full-pretrain/Loss (Raw)": 1.6298587322235107, "Full-pretrain/Step": 9462, "Full-pretrain/Step Time": 17.67892720364034} +{"Full-pretrain/Learning Rate": 7.683334949745713e-09, "Full-pretrain/Loss": 1.8953207731246948, "Full-pretrain/Loss (Raw)": 1.9137532711029053, "Full-pretrain/Step": 9463, "Full-pretrain/Step Time": 17.679084036499262} +{"Full-pretrain/Learning Rate": 7.474284836936352e-09, "Full-pretrain/Loss": 1.889436960220337, "Full-pretrain/Loss (Raw)": 1.729640245437622, "Full-pretrain/Step": 9464, "Full-pretrain/Step Time": 17.685282226651907} +{"Full-pretrain/Learning Rate": 7.268117603187463e-09, "Full-pretrain/Loss": 1.9037522077560425, "Full-pretrain/Loss (Raw)": 2.392932653427124, "Full-pretrain/Step": 9465, "Full-pretrain/Step Time": 17.68087435886264} +{"Full-pretrain/Learning Rate": 7.064833272274474e-09, "Full-pretrain/Loss": 1.8985036611557007, "Full-pretrain/Loss (Raw)": 1.8616970777511597, "Full-pretrain/Step": 9466, "Full-pretrain/Step Time": 17.679778050631285} +{"Full-pretrain/Learning Rate": 6.864431867650845e-09, "Full-pretrain/Loss": 1.9010931253433228, "Full-pretrain/Loss (Raw)": 1.9441519975662231, "Full-pretrain/Step": 9467, "Full-pretrain/Step Time": 17.6751019153744} +{"Full-pretrain/Learning Rate": 6.666913412434195e-09, "Full-pretrain/Loss": 1.8954167366027832, "Full-pretrain/Loss (Raw)": 1.8839378356933594, "Full-pretrain/Step": 9468, "Full-pretrain/Step Time": 17.67950427532196} +{"Full-pretrain/Learning Rate": 6.4722779294035254e-09, "Full-pretrain/Loss": 1.8996152877807617, "Full-pretrain/Loss (Raw)": 2.055035352706909, "Full-pretrain/Step": 9469, "Full-pretrain/Step Time": 17.684523306787014} +{"Full-pretrain/Learning Rate": 6.280525441010321e-09, "Full-pretrain/Loss": 1.9074770212173462, "Full-pretrain/Loss (Raw)": 1.9913867712020874, "Full-pretrain/Step": 9470, "Full-pretrain/Step Time": 17.681742317974567} +{"Full-pretrain/Learning Rate": 6.091655969378552e-09, "Full-pretrain/Loss": 1.9008879661560059, "Full-pretrain/Loss (Raw)": 1.9716432094573975, "Full-pretrain/Step": 9471, "Full-pretrain/Step Time": 17.682865373790264} +{"Full-pretrain/Learning Rate": 5.905669536290792e-09, "Full-pretrain/Loss": 1.9017642736434937, "Full-pretrain/Loss (Raw)": 1.7042468786239624, "Full-pretrain/Step": 9472, "Full-pretrain/Step Time": 17.686522103846073} +{"Full-pretrain/Learning Rate": 5.722566163199328e-09, "Full-pretrain/Loss": 1.8991479873657227, "Full-pretrain/Loss (Raw)": 1.7966562509536743, "Full-pretrain/Step": 9473, "Full-pretrain/Step Time": 17.689877178519964} +{"Full-pretrain/Learning Rate": 5.542345871226151e-09, "Full-pretrain/Loss": 1.8945096731185913, "Full-pretrain/Loss (Raw)": 1.8533786535263062, "Full-pretrain/Step": 9474, "Full-pretrain/Step Time": 17.684176405891776} +{"Full-pretrain/Learning Rate": 5.365008681157413e-09, "Full-pretrain/Loss": 1.90982186794281, "Full-pretrain/Loss (Raw)": 2.0082333087921143, "Full-pretrain/Step": 9475, "Full-pretrain/Step Time": 17.682948982343078} +{"Full-pretrain/Learning Rate": 5.190554613454524e-09, "Full-pretrain/Loss": 1.8977155685424805, "Full-pretrain/Loss (Raw)": 1.6247535943984985, "Full-pretrain/Step": 9476, "Full-pretrain/Step Time": 17.686988161876798} +{"Full-pretrain/Learning Rate": 5.0189836882375e-09, "Full-pretrain/Loss": 1.9005227088928223, "Full-pretrain/Loss (Raw)": 2.0424630641937256, "Full-pretrain/Step": 9477, "Full-pretrain/Step Time": 17.68536182306707} +{"Full-pretrain/Learning Rate": 4.850295925296067e-09, "Full-pretrain/Loss": 1.9066948890686035, "Full-pretrain/Loss (Raw)": 1.7723150253295898, "Full-pretrain/Step": 9478, "Full-pretrain/Step Time": 17.691782496869564} +{"Full-pretrain/Learning Rate": 4.684491344086883e-09, "Full-pretrain/Loss": 1.9007874727249146, "Full-pretrain/Loss (Raw)": 1.812784194946289, "Full-pretrain/Step": 9479, "Full-pretrain/Step Time": 17.68754311092198} +{"Full-pretrain/Learning Rate": 4.521569963739092e-09, "Full-pretrain/Loss": 1.9058663845062256, "Full-pretrain/Loss (Raw)": 2.047093152999878, "Full-pretrain/Step": 9480, "Full-pretrain/Step Time": 17.692942844703794} +{"Full-pretrain/Learning Rate": 4.361531803045993e-09, "Full-pretrain/Loss": 1.9035513401031494, "Full-pretrain/Loss (Raw)": 1.834367036819458, "Full-pretrain/Step": 9481, "Full-pretrain/Step Time": 17.69045371748507} +{"Full-pretrain/Learning Rate": 4.204376880465044e-09, "Full-pretrain/Loss": 1.912743330001831, "Full-pretrain/Loss (Raw)": 2.060732841491699, "Full-pretrain/Step": 9482, "Full-pretrain/Step Time": 17.688764790073037} +{"Full-pretrain/Learning Rate": 4.050105214123412e-09, "Full-pretrain/Loss": 1.9154139757156372, "Full-pretrain/Loss (Raw)": 1.761465072631836, "Full-pretrain/Step": 9483, "Full-pretrain/Step Time": 17.69196029379964} +{"Full-pretrain/Learning Rate": 3.898716821820747e-09, "Full-pretrain/Loss": 1.9131766557693481, "Full-pretrain/Loss (Raw)": 1.625967025756836, "Full-pretrain/Step": 9484, "Full-pretrain/Step Time": 17.68738680332899} +{"Full-pretrain/Learning Rate": 3.750211721015306e-09, "Full-pretrain/Loss": 1.909230351448059, "Full-pretrain/Loss (Raw)": 1.85048246383667, "Full-pretrain/Step": 9485, "Full-pretrain/Step Time": 17.68389988131821} +{"Full-pretrain/Learning Rate": 3.6045899288378317e-09, "Full-pretrain/Loss": 1.9237446784973145, "Full-pretrain/Loss (Raw)": 2.277339458465576, "Full-pretrain/Step": 9486, "Full-pretrain/Step Time": 17.68638371862471} +{"Full-pretrain/Learning Rate": 3.461851462088772e-09, "Full-pretrain/Loss": 1.9325735569000244, "Full-pretrain/Loss (Raw)": 2.1257543563842773, "Full-pretrain/Step": 9487, "Full-pretrain/Step Time": 17.68694273941219} +{"Full-pretrain/Learning Rate": 3.3219963372271844e-09, "Full-pretrain/Loss": 1.9105725288391113, "Full-pretrain/Loss (Raw)": 1.720117211341858, "Full-pretrain/Step": 9488, "Full-pretrain/Step Time": 17.684461027383804} +{"Full-pretrain/Learning Rate": 3.185024570392936e-09, "Full-pretrain/Loss": 1.919599175453186, "Full-pretrain/Loss (Raw)": 2.214827060699463, "Full-pretrain/Step": 9489, "Full-pretrain/Step Time": 17.68198230676353} +{"Full-pretrain/Learning Rate": 3.050936177378949e-09, "Full-pretrain/Loss": 1.9120514392852783, "Full-pretrain/Loss (Raw)": 2.0157992839813232, "Full-pretrain/Step": 9490, "Full-pretrain/Step Time": 17.68161159195006} +{"Full-pretrain/Learning Rate": 2.9197311736561816e-09, "Full-pretrain/Loss": 1.902243971824646, "Full-pretrain/Loss (Raw)": 1.770294189453125, "Full-pretrain/Step": 9491, "Full-pretrain/Step Time": 17.68134407699108} +{"Full-pretrain/Learning Rate": 2.7914095743569736e-09, "Full-pretrain/Loss": 1.9156955480575562, "Full-pretrain/Loss (Raw)": 2.27058482170105, "Full-pretrain/Step": 9492, "Full-pretrain/Step Time": 17.681955909356475} +{"Full-pretrain/Learning Rate": 2.665971394283373e-09, "Full-pretrain/Loss": 1.9310985803604126, "Full-pretrain/Loss (Raw)": 2.231462240219116, "Full-pretrain/Step": 9493, "Full-pretrain/Step Time": 17.676898585632443} +{"Full-pretrain/Learning Rate": 2.5434166479071376e-09, "Full-pretrain/Loss": 1.940369725227356, "Full-pretrain/Loss (Raw)": 1.9265354871749878, "Full-pretrain/Step": 9494, "Full-pretrain/Step Time": 17.678641840815544} +{"Full-pretrain/Learning Rate": 2.4237453493641816e-09, "Full-pretrain/Loss": 1.942054033279419, "Full-pretrain/Loss (Raw)": 1.9676536321640015, "Full-pretrain/Step": 9495, "Full-pretrain/Step Time": 17.677946599200368} +{"Full-pretrain/Learning Rate": 2.3069575124545773e-09, "Full-pretrain/Loss": 1.9497549533843994, "Full-pretrain/Loss (Raw)": 1.9760653972625732, "Full-pretrain/Step": 9496, "Full-pretrain/Step Time": 17.67030666768551} +{"Full-pretrain/Learning Rate": 2.1930531506536565e-09, "Full-pretrain/Loss": 1.9348163604736328, "Full-pretrain/Loss (Raw)": 1.914900779724121, "Full-pretrain/Step": 9497, "Full-pretrain/Step Time": 17.673858461901546} +{"Full-pretrain/Learning Rate": 2.0820322770981337e-09, "Full-pretrain/Loss": 1.932936191558838, "Full-pretrain/Loss (Raw)": 1.8015313148498535, "Full-pretrain/Step": 9498, "Full-pretrain/Step Time": 17.665880171582103} +{"Full-pretrain/Learning Rate": 1.973894904597207e-09, "Full-pretrain/Loss": 1.923715353012085, "Full-pretrain/Loss (Raw)": 1.6490859985351562, "Full-pretrain/Step": 9499, "Full-pretrain/Step Time": 17.66918422281742} +{"Full-pretrain/Learning Rate": 1.8686410456214553e-09, "Full-pretrain/Loss": 1.925504207611084, "Full-pretrain/Loss (Raw)": 1.9411792755126953, "Full-pretrain/Step": 9500, "Full-pretrain/Step Time": 17.66856854595244} +{"Full-pretrain/Learning Rate": 1.7662707123139443e-09, "Full-pretrain/Loss": 1.9171723127365112, "Full-pretrain/Loss (Raw)": 1.788416862487793, "Full-pretrain/Step": 9501, "Full-pretrain/Step Time": 17.66552373766899} +{"Full-pretrain/Learning Rate": 1.6667839164818954e-09, "Full-pretrain/Loss": 1.9211180210113525, "Full-pretrain/Loss (Raw)": 2.1176488399505615, "Full-pretrain/Step": 9502, "Full-pretrain/Step Time": 17.666799323633313} +{"Full-pretrain/Learning Rate": 1.5701806695994636e-09, "Full-pretrain/Loss": 1.927376627922058, "Full-pretrain/Loss (Raw)": 2.171915292739868, "Full-pretrain/Step": 9503, "Full-pretrain/Step Time": 17.66127870976925} +{"Full-pretrain/Learning Rate": 1.4764609828132881e-09, "Full-pretrain/Loss": 1.9333412647247314, "Full-pretrain/Loss (Raw)": 1.895115613937378, "Full-pretrain/Step": 9504, "Full-pretrain/Step Time": 17.66345740109682} +{"Full-pretrain/Learning Rate": 1.3856248669313899e-09, "Full-pretrain/Loss": 1.9440195560455322, "Full-pretrain/Loss (Raw)": 2.138363838195801, "Full-pretrain/Step": 9505, "Full-pretrain/Step Time": 17.66415948420763} +{"Full-pretrain/Learning Rate": 1.2976723324342744e-09, "Full-pretrain/Loss": 1.9507436752319336, "Full-pretrain/Loss (Raw)": 2.0685501098632812, "Full-pretrain/Step": 9506, "Full-pretrain/Step Time": 17.66939303651452} +{"Full-pretrain/Learning Rate": 1.212603389463829e-09, "Full-pretrain/Loss": 1.9530425071716309, "Full-pretrain/Loss (Raw)": 2.0817923545837402, "Full-pretrain/Step": 9507, "Full-pretrain/Step Time": 17.6661233343184} +{"Full-pretrain/Learning Rate": 1.1304180478344251e-09, "Full-pretrain/Loss": 1.9608538150787354, "Full-pretrain/Loss (Raw)": 1.8747183084487915, "Full-pretrain/Step": 9508, "Full-pretrain/Step Time": 17.666204011067748} +{"Full-pretrain/Learning Rate": 1.0511163170273674e-09, "Full-pretrain/Loss": 1.943540334701538, "Full-pretrain/Loss (Raw)": 1.4884326457977295, "Full-pretrain/Step": 9509, "Full-pretrain/Step Time": 17.663192812353373} +{"Full-pretrain/Learning Rate": 9.746982061881183e-10, "Full-pretrain/Loss": 1.948555827140808, "Full-pretrain/Loss (Raw)": 1.9328101873397827, "Full-pretrain/Step": 9510, "Full-pretrain/Step Time": 17.66494371369481} +{"Full-pretrain/Learning Rate": 9.011637241318483e-10, "Full-pretrain/Loss": 1.947542428970337, "Full-pretrain/Loss (Raw)": 1.7803575992584229, "Full-pretrain/Step": 9511, "Full-pretrain/Step Time": 17.66413478180766} +{"Full-pretrain/Learning Rate": 8.305128793406613e-10, "Full-pretrain/Loss": 1.9385403394699097, "Full-pretrain/Loss (Raw)": 1.7590270042419434, "Full-pretrain/Step": 9512, "Full-pretrain/Step Time": 17.65311532281339} +{"Full-pretrain/Learning Rate": 7.627456799635946e-10, "Full-pretrain/Loss": 1.9445723295211792, "Full-pretrain/Loss (Raw)": 2.027388334274292, "Full-pretrain/Step": 9513, "Full-pretrain/Step Time": 17.656628981232643} +{"Full-pretrain/Learning Rate": 6.978621338193936e-10, "Full-pretrain/Loss": 1.9426801204681396, "Full-pretrain/Loss (Raw)": 2.000180721282959, "Full-pretrain/Step": 9514, "Full-pretrain/Step Time": 17.658526776358485} +{"Full-pretrain/Learning Rate": 6.358622483937371e-10, "Full-pretrain/Loss": 1.9323840141296387, "Full-pretrain/Loss (Raw)": 1.431990385055542, "Full-pretrain/Step": 9515, "Full-pretrain/Step Time": 17.656880039721727} +{"Full-pretrain/Learning Rate": 5.767460308336859e-10, "Full-pretrain/Loss": 1.9482355117797852, "Full-pretrain/Loss (Raw)": 2.133216619491577, "Full-pretrain/Step": 9516, "Full-pretrain/Step Time": 17.651528472080827} +{"Full-pretrain/Learning Rate": 5.205134879615603e-10, "Full-pretrain/Loss": 1.9542909860610962, "Full-pretrain/Loss (Raw)": 2.044257640838623, "Full-pretrain/Step": 9517, "Full-pretrain/Step Time": 17.64881738461554} +{"Full-pretrain/Learning Rate": 4.671646262610629e-10, "Full-pretrain/Loss": 1.9462132453918457, "Full-pretrain/Loss (Raw)": 2.018850326538086, "Full-pretrain/Step": 9518, "Full-pretrain/Step Time": 17.654465701431036} +{"Full-pretrain/Learning Rate": 4.1669945188838044e-10, "Full-pretrain/Loss": 1.941813349723816, "Full-pretrain/Loss (Raw)": 1.9849562644958496, "Full-pretrain/Step": 9519, "Full-pretrain/Step Time": 17.64880364201963} +{"Full-pretrain/Learning Rate": 3.69117970663857e-10, "Full-pretrain/Loss": 1.9543707370758057, "Full-pretrain/Loss (Raw)": 2.1219544410705566, "Full-pretrain/Step": 9520, "Full-pretrain/Step Time": 17.645510613918304} +{"Full-pretrain/Learning Rate": 3.244201880775455e-10, "Full-pretrain/Loss": 1.9500133991241455, "Full-pretrain/Loss (Raw)": 2.075390338897705, "Full-pretrain/Step": 9521, "Full-pretrain/Step Time": 17.647736363112926} +{"Full-pretrain/Learning Rate": 2.826061092836563e-10, "Full-pretrain/Loss": 1.9478117227554321, "Full-pretrain/Loss (Raw)": 1.9453498125076294, "Full-pretrain/Step": 9522, "Full-pretrain/Step Time": 17.647600086405873} +{"Full-pretrain/Learning Rate": 2.4367573910333283e-10, "Full-pretrain/Loss": 1.9494624137878418, "Full-pretrain/Loss (Raw)": 1.8231149911880493, "Full-pretrain/Step": 9523, "Full-pretrain/Step Time": 17.644766541197896} +{"Full-pretrain/Learning Rate": 2.0762908203297849e-10, "Full-pretrain/Loss": 1.9343748092651367, "Full-pretrain/Loss (Raw)": 1.7877800464630127, "Full-pretrain/Step": 9524, "Full-pretrain/Step Time": 17.649016983807087} +{"Full-pretrain/Learning Rate": 1.7446614222482728e-10, "Full-pretrain/Loss": 1.9219715595245361, "Full-pretrain/Loss (Raw)": 1.834560751914978, "Full-pretrain/Step": 9525, "Full-pretrain/Step Time": 17.64959575049579} +{"Full-pretrain/Learning Rate": 1.441869235063731e-10, "Full-pretrain/Loss": 1.926786184310913, "Full-pretrain/Loss (Raw)": 2.080599784851074, "Full-pretrain/Step": 9526, "Full-pretrain/Step Time": 17.654993787407875} +{"Full-pretrain/Learning Rate": 1.1679142936926734e-10, "Full-pretrain/Loss": 1.9347383975982666, "Full-pretrain/Loss (Raw)": 2.2221264839172363, "Full-pretrain/Step": 9527, "Full-pretrain/Step Time": 17.65282374434173} +{"Full-pretrain/Learning Rate": 9.227966297764567e-11, "Full-pretrain/Loss": 1.9323606491088867, "Full-pretrain/Loss (Raw)": 1.8999769687652588, "Full-pretrain/Step": 9528, "Full-pretrain/Step Time": 17.658364752307534} +{"Full-pretrain/Learning Rate": 7.06516271542501e-11, "Full-pretrain/Loss": 1.9318419694900513, "Full-pretrain/Loss (Raw)": 1.8983025550842285, "Full-pretrain/Step": 9529, "Full-pretrain/Step Time": 17.659103024750948} +{"Full-pretrain/Learning Rate": 5.19073243943069e-11, "Full-pretrain/Loss": 1.9311938285827637, "Full-pretrain/Loss (Raw)": 1.7807945013046265, "Full-pretrain/Step": 9530, "Full-pretrain/Step Time": 17.65901919454336} +{"Full-pretrain/Learning Rate": 3.604675686275094e-11, "Full-pretrain/Loss": 1.939307451248169, "Full-pretrain/Loss (Raw)": 1.9087198972702026, "Full-pretrain/Step": 9531, "Full-pretrain/Step Time": 17.663737673312426} +{"Full-pretrain/Learning Rate": 2.3069926388674667e-11, "Full-pretrain/Loss": 1.9426624774932861, "Full-pretrain/Loss (Raw)": 2.048542022705078, "Full-pretrain/Step": 9532, "Full-pretrain/Step Time": 17.667521592229605} +{"Full-pretrain/Learning Rate": 1.2976834468103605e-11, "Full-pretrain/Loss": 1.9500523805618286, "Full-pretrain/Loss (Raw)": 2.024888515472412, "Full-pretrain/Step": 9533, "Full-pretrain/Step Time": 17.660828409716487} +{"Full-pretrain/Learning Rate": 5.767482261220814e-12, "Full-pretrain/Loss": 1.9481666088104248, "Full-pretrain/Loss (Raw)": 2.057307243347168, "Full-pretrain/Step": 9534, "Full-pretrain/Step Time": 17.664770416915417} +{"Full-pretrain/Learning Rate": 1.4418706062446774e-12, "Full-pretrain/Loss": 1.9349696636199951, "Full-pretrain/Loss (Raw)": 1.7496135234832764, "Full-pretrain/Step": 9535, "Full-pretrain/Step Time": 17.66432292945683} +{"Full-pretrain/Learning Rate": 0.0, "Full-pretrain/Loss": 1.9312673807144165, "Full-pretrain/Loss (Raw)": 1.7766423225402832, "Full-pretrain/Step": 9536, "Full-pretrain/Step Time": 17.672137279063463} diff --git a/obelics+phi3-3b-continue-training-hq-claude3+stage-full-pretrain+x7/run-metrics.jsonl b/obelics+phi3-3b-continue-training-hq-claude3+stage-full-pretrain+x7/run-metrics.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..71faaf8912c66bae007ab765f829a3a1bf0f2a1a --- /dev/null +++ b/obelics+phi3-3b-continue-training-hq-claude3+stage-full-pretrain+x7/run-metrics.jsonl @@ -0,0 +1 @@ +{"hparams": {"dataset": {"align_stage_components": ["download/llava-laion-cc-sbu-558k/chat.json", "download/llava-laion-cc-sbu-558k"], "dataset_id": "obelics", "dataset_resampled": true, "dataset_root_dir": "/fsx-Training/shopqa-training-fsx-prod-us-east-1/home/wzwang/data/datacomp/datacomp_hq_single_pkl_pil:/fsx-Training/shopqa-training-fsx-prod-us-east-1/home/wzwang/data/OBELICS/obelics_hq_single_pkl_pil:/fsx-Training/shopqa-training-fsx-prod-us-east-1/home/wzwang/data/synthdog-en/synthdog_single_pkl_pil/", "finetune_stage_components": ["/fsx-training/shopqa-training-fsx-prod-us-east-1/home/wzwang/data/llava/llava_v1_5_mix665k.json", "/fsx-training/shopqa-training-fsx-prod-us-east-1/home/wzwang/data/llava/data"], "max_num_images": 6, "min_num_images": 1, "train_num_samples": 2441407, "type": "obelics", "workers": 4}, "model": {"align_epochs": 1, "align_global_batch_size": 256, "align_learning_rate": 0.001, "align_lr_scheduler_type": "linear-warmup+cosine-decay", "align_max_grad_norm": 1.0, "align_max_steps": null, "align_per_device_batch_size": 16, "align_train_strategy": "fsdp-shard-grad-op", "align_warmup_ratio": 0.03, "align_weight_decay": 0.0, "arch_specifier": "no-align+avgpool", "enable_gradient_checkpointing": true, "enable_mixed_precision_training": true, "finetune_epochs": 1, "finetune_global_batch_size": 128, "finetune_learning_rate": 2e-05, "finetune_lr_scheduler_type": "linear-warmup+cosine-decay", "finetune_max_grad_norm": 1.0, "finetune_max_steps": null, "finetune_per_device_batch_size": 16, "finetune_train_strategy": "fsdp-full-shard", "finetune_warmup_ratio": 0.03, "finetune_weight_decay": 0.1, "image_resize_strategy": "resize-naive", "llm_backbone_id": "phi3-3b", "llm_max_length": 4096, "model_id": "phi3-3b-continue-training-hq", "pretrain_epochs": 1, "pretrain_global_batch_size": 256, "pretrain_learning_rate": 5e-05, "pretrain_lr_scheduler_type": "linear-warmup+cosine-decay", "pretrain_max_grad_norm": 1.0, "pretrain_max_steps": 9536, "pretrain_per_device_batch_size": 2, "pretrain_train_strategy": "fsdp-full-shard", "pretrain_warmup_ratio": 0.03, "pretrain_weight_decay": 0.01, "reduce_in_full_precision": false, "type": "one-stage+7b", "vision_backbone_id": "siglip-vit-so400m-384px"}, "mount_path": "/fsx-Training/shopqa-training-fsx-prod-us-east-1/home/wzwang/models", "pretrained_checkpoint": null, "run_id": "obelics+phi3-3b-continue-training-hq+stage-full-pretrain+x7", "run_root_dir": "/fsx-Training/shopqa-training-fsx-prod-us-east-1/home/wzwang/checkpoints/mllm_pretrain_checkpoints", "seed": 7, "stage": "full-pretrain", "trackers": ["jsonl", "wandb"], "wandb_entity": null, "wandb_project": "mmpretrain"}, "run_id": "obelics+phi3-3b-continue-training-hq+stage-full-pretrain+x7"}