YagiASAFAS committed on Feb 8, 2025

Commit

e04e294

1 Parent(s): 0efbf92

Add tokenizer files

Browse files

This view is limited to 50 files because it contains too many changes. See raw diff

Files changed (50) hide show

checkpoint-1348/config.json +126 -0
checkpoint-1348/model.safetensors +3 -0
checkpoint-1348/optimizer.pt +3 -0
checkpoint-1348/rng_state.pth +3 -0
checkpoint-1348/scheduler.pt +3 -0
checkpoint-1348/trainer_state.json +124 -0
checkpoint-1348/training_args.bin +3 -0
checkpoint-2022/config.json +126 -0
checkpoint-2022/model.safetensors +3 -0
checkpoint-2022/optimizer.pt +3 -0
checkpoint-2022/rng_state.pth +3 -0
checkpoint-2022/scheduler.pt +3 -0
checkpoint-2022/trainer_state.json +172 -0
checkpoint-2022/training_args.bin +3 -0
checkpoint-2696/config.json +126 -0
checkpoint-2696/model.safetensors +3 -0
checkpoint-2696/optimizer.pt +3 -0
checkpoint-2696/rng_state.pth +3 -0
checkpoint-2696/scheduler.pt +3 -0
checkpoint-2696/trainer_state.json +213 -0
checkpoint-2696/training_args.bin +3 -0
checkpoint-3370/config.json +126 -0
checkpoint-3370/model.safetensors +3 -0
checkpoint-3370/optimizer.pt +3 -0
checkpoint-3370/rng_state.pth +3 -0
checkpoint-3370/scheduler.pt +3 -0
checkpoint-3370/trainer_state.json +254 -0
checkpoint-3370/training_args.bin +3 -0
checkpoint-4044/config.json +126 -0
checkpoint-4044/model.safetensors +3 -0
checkpoint-4044/optimizer.pt +3 -0
checkpoint-4044/rng_state.pth +3 -0
checkpoint-4044/scheduler.pt +3 -0
checkpoint-4044/trainer_state.json +302 -0
checkpoint-4044/training_args.bin +3 -0
checkpoint-4718/config.json +126 -0
checkpoint-4718/model.safetensors +3 -0
checkpoint-4718/optimizer.pt +3 -0
checkpoint-4718/rng_state.pth +3 -0
checkpoint-4718/scheduler.pt +3 -0
checkpoint-4718/trainer_state.json +343 -0
checkpoint-4718/training_args.bin +3 -0
checkpoint-674/config.json +126 -0
checkpoint-674/model.safetensors +3 -0
checkpoint-674/optimizer.pt +3 -0
checkpoint-674/rng_state.pth +3 -0
checkpoint-674/scheduler.pt +3 -0
checkpoint-674/trainer_state.json +83 -0
checkpoint-674/training_args.bin +3 -0
special_tokens_map.json +7 -0

checkpoint-1348/config.json ADDED Viewed

	@@ -0,0 +1,126 @@

+{
+  "_name_or_path": "bert-base-uncased",
+  "architectures": [
+    "BertForSequenceClassification"
+  ],
+  "attention_probs_dropout_prob": 0.1,
+  "classifier_dropout": null,
+  "gradient_checkpointing": false,
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.1,
+  "hidden_size": 768,
+  "id2label": {
+    "0": "LABEL_0",
+    "1": "LABEL_1",
+    "2": "LABEL_2",
+    "3": "LABEL_3",
+    "4": "LABEL_4",
+    "5": "LABEL_5",
+    "6": "LABEL_6",
+    "7": "LABEL_7",
+    "8": "LABEL_8",
+    "9": "LABEL_9",
+    "10": "LABEL_10",
+    "11": "LABEL_11",
+    "12": "LABEL_12",
+    "13": "LABEL_13",
+    "14": "LABEL_14",
+    "15": "LABEL_15",
+    "16": "LABEL_16",
+    "17": "LABEL_17",
+    "18": "LABEL_18",
+    "19": "LABEL_19",
+    "20": "LABEL_20",
+    "21": "LABEL_21",
+    "22": "LABEL_22",
+    "23": "LABEL_23",
+    "24": "LABEL_24",
+    "25": "LABEL_25",
+    "26": "LABEL_26",
+    "27": "LABEL_27",
+    "28": "LABEL_28",
+    "29": "LABEL_29",
+    "30": "LABEL_30",
+    "31": "LABEL_31",
+    "32": "LABEL_32",
+    "33": "LABEL_33",
+    "34": "LABEL_34",
+    "35": "LABEL_35",
+    "36": "LABEL_36",
+    "37": "LABEL_37",
+    "38": "LABEL_38",
+    "39": "LABEL_39",
+    "40": "LABEL_40",
+    "41": "LABEL_41",
+    "42": "LABEL_42",
+    "43": "LABEL_43",
+    "44": "LABEL_44",
+    "45": "LABEL_45",
+    "46": "LABEL_46",
+    "47": "LABEL_47"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "label2id": {
+    "LABEL_0": 0,
+    "LABEL_1": 1,
+    "LABEL_10": 10,
+    "LABEL_11": 11,
+    "LABEL_12": 12,
+    "LABEL_13": 13,
+    "LABEL_14": 14,
+    "LABEL_15": 15,
+    "LABEL_16": 16,
+    "LABEL_17": 17,
+    "LABEL_18": 18,
+    "LABEL_19": 19,
+    "LABEL_2": 2,
+    "LABEL_20": 20,
+    "LABEL_21": 21,
+    "LABEL_22": 22,
+    "LABEL_23": 23,
+    "LABEL_24": 24,
+    "LABEL_25": 25,
+    "LABEL_26": 26,
+    "LABEL_27": 27,
+    "LABEL_28": 28,
+    "LABEL_29": 29,
+    "LABEL_3": 3,
+    "LABEL_30": 30,
+    "LABEL_31": 31,
+    "LABEL_32": 32,
+    "LABEL_33": 33,
+    "LABEL_34": 34,
+    "LABEL_35": 35,
+    "LABEL_36": 36,
+    "LABEL_37": 37,
+    "LABEL_38": 38,
+    "LABEL_39": 39,
+    "LABEL_4": 4,
+    "LABEL_40": 40,
+    "LABEL_41": 41,
+    "LABEL_42": 42,
+    "LABEL_43": 43,
+    "LABEL_44": 44,
+    "LABEL_45": 45,
+    "LABEL_46": 46,
+    "LABEL_47": 47,
+    "LABEL_5": 5,
+    "LABEL_6": 6,
+    "LABEL_7": 7,
+    "LABEL_8": 8,
+    "LABEL_9": 9
+  },
+  "layer_norm_eps": 1e-12,
+  "max_position_embeddings": 512,
+  "model_type": "bert",
+  "num_attention_heads": 12,
+  "num_hidden_layers": 12,
+  "pad_token_id": 0,
+  "position_embedding_type": "absolute",
+  "torch_dtype": "float32",
+  "transformers_version": "4.48.2",
+  "type_vocab_size": 2,
+  "use_cache": true,
+  "vocab_size": 30522
+}

checkpoint-1348/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5fce8f95d3cf8aff1a50c809fe98dd604891e8de87b59f6120aa33197dca0a66
+size 438100144

checkpoint-1348/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9187dde97cea8c1cf9cb99c4687e70c49adae5398710ee1afd363eb067ec64e5
+size 876321402

checkpoint-1348/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f15d59ec259156654b7d699d265c49f473bc80117753dbc660df0ce861bf6667
+size 14244

checkpoint-1348/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3b6ecb4f315a32a13883fe1ef1036339d6775c6db67dc4dd1bd600ddb6aece2b
+size 1064

checkpoint-1348/trainer_state.json ADDED Viewed

	@@ -0,0 +1,124 @@

+{
+  "best_metric": 0.9156647148374422,
+  "best_model_checkpoint": "./results/checkpoint-1348",
+  "epoch": 2.0,
+  "eval_steps": 500,
+  "global_step": 1348,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.7423904974016332,
+      "grad_norm": 1.0851198434829712,
+      "learning_rate": 2.8606983655274892e-05,
+      "loss": 0.448,
+      "step": 500
+    },
+    {
+      "epoch": 1.0,
+      "eval_administration_accuracy": 0.8700092850510678,
+      "eval_administration_f1": 0.830681542112301,
+      "eval_corruption_accuracy": 0.9301764159702879,
+      "eval_corruption_f1": 0.9210203978746075,
+      "eval_democracy_accuracy": 0.9201485608170845,
+      "eval_democracy_f1": 0.8972549864645475,
+      "eval_development_accuracy": 0.8672237697307336,
+      "eval_development_f1": 0.8462048329953127,
+      "eval_economy_accuracy": 0.9062209842154132,
+      "eval_economy_f1": 0.8952254345075943,
+      "eval_education_accuracy": 0.9467038068709378,
+      "eval_education_f1": 0.9344408657756663,
+      "eval_environment_accuracy": 0.9619312906220984,
+      "eval_environment_f1": 0.9564784032426319,
+      "eval_instability_accuracy": 0.9084493964716805,
+      "eval_instability_f1": 0.8872576883139862,
+      "eval_leadership_accuracy": 0.833983286908078,
+      "eval_leadership_f1": 0.8199437016930928,
+      "eval_loss": 0.2781185507774353,
+      "eval_overall_accuracy": 0.9090374497059734,
+      "eval_overall_f1": 0.8943279031006514,
+      "eval_race_accuracy": 0.9385329619312907,
+      "eval_race_f1": 0.9345823913548884,
+      "eval_religion_accuracy": 0.9303621169916435,
+      "eval_religion_f1": 0.9219388519537324,
+      "eval_runtime": 6.3896,
+      "eval_safety_accuracy": 0.8947075208913648,
+      "eval_safety_f1": 0.8869057409194557,
+      "eval_samples_per_second": 842.781,
+      "eval_steps_per_second": 52.742,
+      "step": 674
+    },
+    {
+      "epoch": 1.4840386043058649,
+      "grad_norm": 1.3921394348144531,
+      "learning_rate": 2.7213967310549777e-05,
+      "loss": 0.2646,
+      "step": 1000
+    },
+    {
+      "epoch": 2.0,
+      "eval_administration_accuracy": 0.886908077994429,
+      "eval_administration_f1": 0.8723732992505114,
+      "eval_corruption_accuracy": 0.9424326833797586,
+      "eval_corruption_f1": 0.9384898864061544,
+      "eval_democracy_accuracy": 0.933519034354689,
+      "eval_democracy_f1": 0.9231869597067329,
+      "eval_development_accuracy": 0.8739090064995357,
+      "eval_development_f1": 0.8668624356641937,
+      "eval_economy_accuracy": 0.9143918291550603,
+      "eval_economy_f1": 0.9111034488927022,
+      "eval_education_accuracy": 0.9580315691736304,
+      "eval_education_f1": 0.9543147194312244,
+      "eval_environment_accuracy": 0.9734447539461467,
+      "eval_environment_f1": 0.9731508098039792,
+      "eval_instability_accuracy": 0.9277623026926648,
+      "eval_instability_f1": 0.9222378035229967,
+      "eval_leadership_accuracy": 0.840297121634169,
+      "eval_leadership_f1": 0.8406461991345243,
+      "eval_loss": 0.23724055290222168,
+      "eval_overall_accuracy": 0.9205354379449089,
+      "eval_overall_f1": 0.9156647148374422,
+      "eval_race_accuracy": 0.9467038068709378,
+      "eval_race_f1": 0.943797657082642,
+      "eval_religion_accuracy": 0.9409470752089136,
+      "eval_religion_f1": 0.9380295054445577,
+      "eval_runtime": 6.3736,
+      "eval_safety_accuracy": 0.9080779944289693,
+      "eval_safety_f1": 0.9037838537090879,
+      "eval_samples_per_second": 844.886,
+      "eval_steps_per_second": 52.874,
+      "step": 1348
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 10768,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 16,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "EarlyStoppingCallback": {
+      "args": {
+        "early_stopping_patience": 2,
+        "early_stopping_threshold": 0.0
+      },
+      "attributes": {
+        "early_stopping_patience_counter": 0
+      }
+    },
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 1.1338452843429888e+16,
+  "train_batch_size": 16,
+  "trial_name": null,
+  "trial_params": null
+}

checkpoint-1348/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2e04a520e0b54409a3029464cde7d12079be452340929d293e17e45309f482f8
+size 5368

checkpoint-2022/config.json ADDED Viewed

	@@ -0,0 +1,126 @@

+{
+  "_name_or_path": "bert-base-uncased",
+  "architectures": [
+    "BertForSequenceClassification"
+  ],
+  "attention_probs_dropout_prob": 0.1,
+  "classifier_dropout": null,
+  "gradient_checkpointing": false,
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.1,
+  "hidden_size": 768,
+  "id2label": {
+    "0": "LABEL_0",
+    "1": "LABEL_1",
+    "2": "LABEL_2",
+    "3": "LABEL_3",
+    "4": "LABEL_4",
+    "5": "LABEL_5",
+    "6": "LABEL_6",
+    "7": "LABEL_7",
+    "8": "LABEL_8",
+    "9": "LABEL_9",
+    "10": "LABEL_10",
+    "11": "LABEL_11",
+    "12": "LABEL_12",
+    "13": "LABEL_13",
+    "14": "LABEL_14",
+    "15": "LABEL_15",
+    "16": "LABEL_16",
+    "17": "LABEL_17",
+    "18": "LABEL_18",
+    "19": "LABEL_19",
+    "20": "LABEL_20",
+    "21": "LABEL_21",
+    "22": "LABEL_22",
+    "23": "LABEL_23",
+    "24": "LABEL_24",
+    "25": "LABEL_25",
+    "26": "LABEL_26",
+    "27": "LABEL_27",
+    "28": "LABEL_28",
+    "29": "LABEL_29",
+    "30": "LABEL_30",
+    "31": "LABEL_31",
+    "32": "LABEL_32",
+    "33": "LABEL_33",
+    "34": "LABEL_34",
+    "35": "LABEL_35",
+    "36": "LABEL_36",
+    "37": "LABEL_37",
+    "38": "LABEL_38",
+    "39": "LABEL_39",
+    "40": "LABEL_40",
+    "41": "LABEL_41",
+    "42": "LABEL_42",
+    "43": "LABEL_43",
+    "44": "LABEL_44",
+    "45": "LABEL_45",
+    "46": "LABEL_46",
+    "47": "LABEL_47"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "label2id": {
+    "LABEL_0": 0,
+    "LABEL_1": 1,
+    "LABEL_10": 10,
+    "LABEL_11": 11,
+    "LABEL_12": 12,
+    "LABEL_13": 13,
+    "LABEL_14": 14,
+    "LABEL_15": 15,
+    "LABEL_16": 16,
+    "LABEL_17": 17,
+    "LABEL_18": 18,
+    "LABEL_19": 19,
+    "LABEL_2": 2,
+    "LABEL_20": 20,
+    "LABEL_21": 21,
+    "LABEL_22": 22,
+    "LABEL_23": 23,
+    "LABEL_24": 24,
+    "LABEL_25": 25,
+    "LABEL_26": 26,
+    "LABEL_27": 27,
+    "LABEL_28": 28,
+    "LABEL_29": 29,
+    "LABEL_3": 3,
+    "LABEL_30": 30,
+    "LABEL_31": 31,
+    "LABEL_32": 32,
+    "LABEL_33": 33,
+    "LABEL_34": 34,
+    "LABEL_35": 35,
+    "LABEL_36": 36,
+    "LABEL_37": 37,
+    "LABEL_38": 38,
+    "LABEL_39": 39,
+    "LABEL_4": 4,
+    "LABEL_40": 40,
+    "LABEL_41": 41,
+    "LABEL_42": 42,
+    "LABEL_43": 43,
+    "LABEL_44": 44,
+    "LABEL_45": 45,
+    "LABEL_46": 46,
+    "LABEL_47": 47,
+    "LABEL_5": 5,
+    "LABEL_6": 6,
+    "LABEL_7": 7,
+    "LABEL_8": 8,
+    "LABEL_9": 9
+  },
+  "layer_norm_eps": 1e-12,
+  "max_position_embeddings": 512,
+  "model_type": "bert",
+  "num_attention_heads": 12,
+  "num_hidden_layers": 12,
+  "pad_token_id": 0,
+  "position_embedding_type": "absolute",
+  "torch_dtype": "float32",
+  "transformers_version": "4.48.2",
+  "type_vocab_size": 2,
+  "use_cache": true,
+  "vocab_size": 30522
+}

checkpoint-2022/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5da5bcf984a34091cb18e050126d51750543e1ed6c4a773905c484ffd83d8b4b
+size 438100144

checkpoint-2022/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:66dbdd9a56f01c2cecf497957017972c09ca424ef5659d8fe692bfc125ef6f57
+size 876321402

checkpoint-2022/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b73932204efe53704e932ab7c4720df6118415e4984d139269a56ea57da1c48a
+size 14244

checkpoint-2022/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:bc65d5c1626b5099811d02a9fb91c5737fc97e0195b3258c9705ce310425541a
+size 1064

checkpoint-2022/trainer_state.json ADDED Viewed

	@@ -0,0 +1,172 @@

+{
+  "best_metric": 0.9198927823234619,
+  "best_model_checkpoint": "./results/checkpoint-2022",
+  "epoch": 3.0,
+  "eval_steps": 500,
+  "global_step": 2022,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.7423904974016332,
+      "grad_norm": 1.0851198434829712,
+      "learning_rate": 2.8606983655274892e-05,
+      "loss": 0.448,
+      "step": 500
+    },
+    {
+      "epoch": 1.0,
+      "eval_administration_accuracy": 0.8700092850510678,
+      "eval_administration_f1": 0.830681542112301,
+      "eval_corruption_accuracy": 0.9301764159702879,
+      "eval_corruption_f1": 0.9210203978746075,
+      "eval_democracy_accuracy": 0.9201485608170845,
+      "eval_democracy_f1": 0.8972549864645475,
+      "eval_development_accuracy": 0.8672237697307336,
+      "eval_development_f1": 0.8462048329953127,
+      "eval_economy_accuracy": 0.9062209842154132,
+      "eval_economy_f1": 0.8952254345075943,
+      "eval_education_accuracy": 0.9467038068709378,
+      "eval_education_f1": 0.9344408657756663,
+      "eval_environment_accuracy": 0.9619312906220984,
+      "eval_environment_f1": 0.9564784032426319,
+      "eval_instability_accuracy": 0.9084493964716805,
+      "eval_instability_f1": 0.8872576883139862,
+      "eval_leadership_accuracy": 0.833983286908078,
+      "eval_leadership_f1": 0.8199437016930928,
+      "eval_loss": 0.2781185507774353,
+      "eval_overall_accuracy": 0.9090374497059734,
+      "eval_overall_f1": 0.8943279031006514,
+      "eval_race_accuracy": 0.9385329619312907,
+      "eval_race_f1": 0.9345823913548884,
+      "eval_religion_accuracy": 0.9303621169916435,
+      "eval_religion_f1": 0.9219388519537324,
+      "eval_runtime": 6.3896,
+      "eval_safety_accuracy": 0.8947075208913648,
+      "eval_safety_f1": 0.8869057409194557,
+      "eval_samples_per_second": 842.781,
+      "eval_steps_per_second": 52.742,
+      "step": 674
+    },
+    {
+      "epoch": 1.4840386043058649,
+      "grad_norm": 1.3921394348144531,
+      "learning_rate": 2.7213967310549777e-05,
+      "loss": 0.2646,
+      "step": 1000
+    },
+    {
+      "epoch": 2.0,
+      "eval_administration_accuracy": 0.886908077994429,
+      "eval_administration_f1": 0.8723732992505114,
+      "eval_corruption_accuracy": 0.9424326833797586,
+      "eval_corruption_f1": 0.9384898864061544,
+      "eval_democracy_accuracy": 0.933519034354689,
+      "eval_democracy_f1": 0.9231869597067329,
+      "eval_development_accuracy": 0.8739090064995357,
+      "eval_development_f1": 0.8668624356641937,
+      "eval_economy_accuracy": 0.9143918291550603,
+      "eval_economy_f1": 0.9111034488927022,
+      "eval_education_accuracy": 0.9580315691736304,
+      "eval_education_f1": 0.9543147194312244,
+      "eval_environment_accuracy": 0.9734447539461467,
+      "eval_environment_f1": 0.9731508098039792,
+      "eval_instability_accuracy": 0.9277623026926648,
+      "eval_instability_f1": 0.9222378035229967,
+      "eval_leadership_accuracy": 0.840297121634169,
+      "eval_leadership_f1": 0.8406461991345243,
+      "eval_loss": 0.23724055290222168,
+      "eval_overall_accuracy": 0.9205354379449089,
+      "eval_overall_f1": 0.9156647148374422,
+      "eval_race_accuracy": 0.9467038068709378,
+      "eval_race_f1": 0.943797657082642,
+      "eval_religion_accuracy": 0.9409470752089136,
+      "eval_religion_f1": 0.9380295054445577,
+      "eval_runtime": 6.3736,
+      "eval_safety_accuracy": 0.9080779944289693,
+      "eval_safety_f1": 0.9037838537090879,
+      "eval_samples_per_second": 844.886,
+      "eval_steps_per_second": 52.874,
+      "step": 1348
+    },
+    {
+      "epoch": 2.2256867112100966,
+      "grad_norm": 0.9178161025047302,
+      "learning_rate": 2.582095096582467e-05,
+      "loss": 0.2085,
+      "step": 1500
+    },
+    {
+      "epoch": 2.9680772086117297,
+      "grad_norm": 1.1747676134109497,
+      "learning_rate": 2.4427934621099553e-05,
+      "loss": 0.1696,
+      "step": 2000
+    },
+    {
+      "epoch": 3.0,
+      "eval_administration_accuracy": 0.8919220055710306,
+      "eval_administration_f1": 0.8805907698259323,
+      "eval_corruption_accuracy": 0.9454038997214484,
+      "eval_corruption_f1": 0.9422755927443824,
+      "eval_democracy_accuracy": 0.9333333333333333,
+      "eval_democracy_f1": 0.9277380787973176,
+      "eval_development_accuracy": 0.8846796657381616,
+      "eval_development_f1": 0.8767801428288444,
+      "eval_economy_accuracy": 0.9177344475394614,
+      "eval_economy_f1": 0.913190124488594,
+      "eval_education_accuracy": 0.959702878365831,
+      "eval_education_f1": 0.9592018840910198,
+      "eval_environment_accuracy": 0.9766016713091922,
+      "eval_environment_f1": 0.9753052667455842,
+      "eval_instability_accuracy": 0.9255338904363974,
+      "eval_instability_f1": 0.9219441146038561,
+      "eval_leadership_accuracy": 0.8503249767873723,
+      "eval_leadership_f1": 0.8464660955301658,
+      "eval_loss": 0.22912514209747314,
+      "eval_overall_accuracy": 0.923785205818632,
+      "eval_overall_f1": 0.9198927823234619,
+      "eval_race_accuracy": 0.9468895078922934,
+      "eval_race_f1": 0.9441406664359246,
+      "eval_religion_accuracy": 0.9418755803156917,
+      "eval_religion_f1": 0.9406664102976392,
+      "eval_runtime": 6.3983,
+      "eval_safety_accuracy": 0.9114206128133705,
+      "eval_safety_f1": 0.9104142414922826,
+      "eval_samples_per_second": 841.634,
+      "eval_steps_per_second": 52.67,
+      "step": 2022
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 10768,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 16,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "EarlyStoppingCallback": {
+      "args": {
+        "early_stopping_patience": 2,
+        "early_stopping_threshold": 0.0
+      },
+      "attributes": {
+        "early_stopping_patience_counter": 0
+      }
+    },
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 1.7007679265144832e+16,
+  "train_batch_size": 16,
+  "trial_name": null,
+  "trial_params": null
+}

checkpoint-2022/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2e04a520e0b54409a3029464cde7d12079be452340929d293e17e45309f482f8
+size 5368

checkpoint-2696/config.json ADDED Viewed

	@@ -0,0 +1,126 @@

+{
+  "_name_or_path": "bert-base-uncased",
+  "architectures": [
+    "BertForSequenceClassification"
+  ],
+  "attention_probs_dropout_prob": 0.1,
+  "classifier_dropout": null,
+  "gradient_checkpointing": false,
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.1,
+  "hidden_size": 768,
+  "id2label": {
+    "0": "LABEL_0",
+    "1": "LABEL_1",
+    "2": "LABEL_2",
+    "3": "LABEL_3",
+    "4": "LABEL_4",
+    "5": "LABEL_5",
+    "6": "LABEL_6",
+    "7": "LABEL_7",
+    "8": "LABEL_8",
+    "9": "LABEL_9",
+    "10": "LABEL_10",
+    "11": "LABEL_11",
+    "12": "LABEL_12",
+    "13": "LABEL_13",
+    "14": "LABEL_14",
+    "15": "LABEL_15",
+    "16": "LABEL_16",
+    "17": "LABEL_17",
+    "18": "LABEL_18",
+    "19": "LABEL_19",
+    "20": "LABEL_20",
+    "21": "LABEL_21",
+    "22": "LABEL_22",
+    "23": "LABEL_23",
+    "24": "LABEL_24",
+    "25": "LABEL_25",
+    "26": "LABEL_26",
+    "27": "LABEL_27",
+    "28": "LABEL_28",
+    "29": "LABEL_29",
+    "30": "LABEL_30",
+    "31": "LABEL_31",
+    "32": "LABEL_32",
+    "33": "LABEL_33",
+    "34": "LABEL_34",
+    "35": "LABEL_35",
+    "36": "LABEL_36",
+    "37": "LABEL_37",
+    "38": "LABEL_38",
+    "39": "LABEL_39",
+    "40": "LABEL_40",
+    "41": "LABEL_41",
+    "42": "LABEL_42",
+    "43": "LABEL_43",
+    "44": "LABEL_44",
+    "45": "LABEL_45",
+    "46": "LABEL_46",
+    "47": "LABEL_47"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "label2id": {
+    "LABEL_0": 0,
+    "LABEL_1": 1,
+    "LABEL_10": 10,
+    "LABEL_11": 11,
+    "LABEL_12": 12,
+    "LABEL_13": 13,
+    "LABEL_14": 14,
+    "LABEL_15": 15,
+    "LABEL_16": 16,
+    "LABEL_17": 17,
+    "LABEL_18": 18,
+    "LABEL_19": 19,
+    "LABEL_2": 2,
+    "LABEL_20": 20,
+    "LABEL_21": 21,
+    "LABEL_22": 22,
+    "LABEL_23": 23,
+    "LABEL_24": 24,
+    "LABEL_25": 25,
+    "LABEL_26": 26,
+    "LABEL_27": 27,
+    "LABEL_28": 28,
+    "LABEL_29": 29,
+    "LABEL_3": 3,
+    "LABEL_30": 30,
+    "LABEL_31": 31,
+    "LABEL_32": 32,
+    "LABEL_33": 33,
+    "LABEL_34": 34,
+    "LABEL_35": 35,
+    "LABEL_36": 36,
+    "LABEL_37": 37,
+    "LABEL_38": 38,
+    "LABEL_39": 39,
+    "LABEL_4": 4,
+    "LABEL_40": 40,
+    "LABEL_41": 41,
+    "LABEL_42": 42,
+    "LABEL_43": 43,
+    "LABEL_44": 44,
+    "LABEL_45": 45,
+    "LABEL_46": 46,
+    "LABEL_47": 47,
+    "LABEL_5": 5,
+    "LABEL_6": 6,
+    "LABEL_7": 7,
+    "LABEL_8": 8,
+    "LABEL_9": 9
+  },
+  "layer_norm_eps": 1e-12,
+  "max_position_embeddings": 512,
+  "model_type": "bert",
+  "num_attention_heads": 12,
+  "num_hidden_layers": 12,
+  "pad_token_id": 0,
+  "position_embedding_type": "absolute",
+  "torch_dtype": "float32",
+  "transformers_version": "4.48.2",
+  "type_vocab_size": 2,
+  "use_cache": true,
+  "vocab_size": 30522
+}

checkpoint-2696/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:386ff4bc5faac38b06b3db23ca121834b04cf585a5b7e049d1ae21f0791260be
+size 438100144

checkpoint-2696/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9e99fe4775ef593f4ecc30c37478b3a3aba9d37aa2d50779e0c69a2e5f94d9c1
+size 876321402

checkpoint-2696/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:64dc7c8d35ce0619ad041d92905273538a85dfb6cdd09fa753450f6ca183ddd5
+size 14244

checkpoint-2696/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a874b7ba73317e7750ce0ec4ee79350af46c2657c894e4dfbe16f8ec62ccdbaf
+size 1064

checkpoint-2696/trainer_state.json ADDED Viewed

	@@ -0,0 +1,213 @@

+{
+  "best_metric": 0.9198927823234619,
+  "best_model_checkpoint": "./results/checkpoint-2022",
+  "epoch": 4.0,
+  "eval_steps": 500,
+  "global_step": 2696,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.7423904974016332,
+      "grad_norm": 1.0851198434829712,
+      "learning_rate": 2.8606983655274892e-05,
+      "loss": 0.448,
+      "step": 500
+    },
+    {
+      "epoch": 1.0,
+      "eval_administration_accuracy": 0.8700092850510678,
+      "eval_administration_f1": 0.830681542112301,
+      "eval_corruption_accuracy": 0.9301764159702879,
+      "eval_corruption_f1": 0.9210203978746075,
+      "eval_democracy_accuracy": 0.9201485608170845,
+      "eval_democracy_f1": 0.8972549864645475,
+      "eval_development_accuracy": 0.8672237697307336,
+      "eval_development_f1": 0.8462048329953127,
+      "eval_economy_accuracy": 0.9062209842154132,
+      "eval_economy_f1": 0.8952254345075943,
+      "eval_education_accuracy": 0.9467038068709378,
+      "eval_education_f1": 0.9344408657756663,
+      "eval_environment_accuracy": 0.9619312906220984,
+      "eval_environment_f1": 0.9564784032426319,
+      "eval_instability_accuracy": 0.9084493964716805,
+      "eval_instability_f1": 0.8872576883139862,
+      "eval_leadership_accuracy": 0.833983286908078,
+      "eval_leadership_f1": 0.8199437016930928,
+      "eval_loss": 0.2781185507774353,
+      "eval_overall_accuracy": 0.9090374497059734,
+      "eval_overall_f1": 0.8943279031006514,
+      "eval_race_accuracy": 0.9385329619312907,
+      "eval_race_f1": 0.9345823913548884,
+      "eval_religion_accuracy": 0.9303621169916435,
+      "eval_religion_f1": 0.9219388519537324,
+      "eval_runtime": 6.3896,
+      "eval_safety_accuracy": 0.8947075208913648,
+      "eval_safety_f1": 0.8869057409194557,
+      "eval_samples_per_second": 842.781,
+      "eval_steps_per_second": 52.742,
+      "step": 674
+    },
+    {
+      "epoch": 1.4840386043058649,
+      "grad_norm": 1.3921394348144531,
+      "learning_rate": 2.7213967310549777e-05,
+      "loss": 0.2646,
+      "step": 1000
+    },
+    {
+      "epoch": 2.0,
+      "eval_administration_accuracy": 0.886908077994429,
+      "eval_administration_f1": 0.8723732992505114,
+      "eval_corruption_accuracy": 0.9424326833797586,
+      "eval_corruption_f1": 0.9384898864061544,
+      "eval_democracy_accuracy": 0.933519034354689,
+      "eval_democracy_f1": 0.9231869597067329,
+      "eval_development_accuracy": 0.8739090064995357,
+      "eval_development_f1": 0.8668624356641937,
+      "eval_economy_accuracy": 0.9143918291550603,
+      "eval_economy_f1": 0.9111034488927022,
+      "eval_education_accuracy": 0.9580315691736304,
+      "eval_education_f1": 0.9543147194312244,
+      "eval_environment_accuracy": 0.9734447539461467,
+      "eval_environment_f1": 0.9731508098039792,
+      "eval_instability_accuracy": 0.9277623026926648,
+      "eval_instability_f1": 0.9222378035229967,
+      "eval_leadership_accuracy": 0.840297121634169,
+      "eval_leadership_f1": 0.8406461991345243,
+      "eval_loss": 0.23724055290222168,
+      "eval_overall_accuracy": 0.9205354379449089,
+      "eval_overall_f1": 0.9156647148374422,
+      "eval_race_accuracy": 0.9467038068709378,
+      "eval_race_f1": 0.943797657082642,
+      "eval_religion_accuracy": 0.9409470752089136,
+      "eval_religion_f1": 0.9380295054445577,
+      "eval_runtime": 6.3736,
+      "eval_safety_accuracy": 0.9080779944289693,
+      "eval_safety_f1": 0.9037838537090879,
+      "eval_samples_per_second": 844.886,
+      "eval_steps_per_second": 52.874,
+      "step": 1348
+    },
+    {
+      "epoch": 2.2256867112100966,
+      "grad_norm": 0.9178161025047302,
+      "learning_rate": 2.582095096582467e-05,
+      "loss": 0.2085,
+      "step": 1500
+    },
+    {
+      "epoch": 2.9680772086117297,
+      "grad_norm": 1.1747676134109497,
+      "learning_rate": 2.4427934621099553e-05,
+      "loss": 0.1696,
+      "step": 2000
+    },
+    {
+      "epoch": 3.0,
+      "eval_administration_accuracy": 0.8919220055710306,
+      "eval_administration_f1": 0.8805907698259323,
+      "eval_corruption_accuracy": 0.9454038997214484,
+      "eval_corruption_f1": 0.9422755927443824,
+      "eval_democracy_accuracy": 0.9333333333333333,
+      "eval_democracy_f1": 0.9277380787973176,
+      "eval_development_accuracy": 0.8846796657381616,
+      "eval_development_f1": 0.8767801428288444,
+      "eval_economy_accuracy": 0.9177344475394614,
+      "eval_economy_f1": 0.913190124488594,
+      "eval_education_accuracy": 0.959702878365831,
+      "eval_education_f1": 0.9592018840910198,
+      "eval_environment_accuracy": 0.9766016713091922,
+      "eval_environment_f1": 0.9753052667455842,
+      "eval_instability_accuracy": 0.9255338904363974,
+      "eval_instability_f1": 0.9219441146038561,
+      "eval_leadership_accuracy": 0.8503249767873723,
+      "eval_leadership_f1": 0.8464660955301658,
+      "eval_loss": 0.22912514209747314,
+      "eval_overall_accuracy": 0.923785205818632,
+      "eval_overall_f1": 0.9198927823234619,
+      "eval_race_accuracy": 0.9468895078922934,
+      "eval_race_f1": 0.9441406664359246,
+      "eval_religion_accuracy": 0.9418755803156917,
+      "eval_religion_f1": 0.9406664102976392,
+      "eval_runtime": 6.3983,
+      "eval_safety_accuracy": 0.9114206128133705,
+      "eval_safety_f1": 0.9104142414922826,
+      "eval_samples_per_second": 841.634,
+      "eval_steps_per_second": 52.67,
+      "step": 2022
+    },
+    {
+      "epoch": 3.7097253155159615,
+      "grad_norm": 1.7257879972457886,
+      "learning_rate": 2.3034918276374445e-05,
+      "loss": 0.1309,
+      "step": 2500
+    },
+    {
+      "epoch": 4.0,
+      "eval_administration_accuracy": 0.875766016713092,
+      "eval_administration_f1": 0.8761692862915822,
+      "eval_corruption_accuracy": 0.9465181058495822,
+      "eval_corruption_f1": 0.9432932911595113,
+      "eval_democracy_accuracy": 0.9344475394614671,
+      "eval_democracy_f1": 0.9289539940724922,
+      "eval_development_accuracy": 0.8804085422469824,
+      "eval_development_f1": 0.8733152085361343,
+      "eval_economy_accuracy": 0.9175487465181058,
+      "eval_economy_f1": 0.9168308054942083,
+      "eval_education_accuracy": 0.959702878365831,
+      "eval_education_f1": 0.9577025286068839,
+      "eval_environment_accuracy": 0.9740018570102136,
+      "eval_environment_f1": 0.9740155750677182,
+      "eval_instability_accuracy": 0.92330547818013,
+      "eval_instability_f1": 0.9214961270553598,
+      "eval_leadership_accuracy": 0.8469823584029712,
+      "eval_leadership_f1": 0.8454208641557382,
+      "eval_loss": 0.23740428686141968,
+      "eval_overall_accuracy": 0.9211853915196534,
+      "eval_overall_f1": 0.9191929747362485,
+      "eval_race_accuracy": 0.9452181987000928,
+      "eval_race_f1": 0.9441252497587079,
+      "eval_religion_accuracy": 0.940761374187558,
+      "eval_religion_f1": 0.9389083250935241,
+      "eval_runtime": 6.3816,
+      "eval_safety_accuracy": 0.9095636025998143,
+      "eval_safety_f1": 0.9100844415431236,
+      "eval_samples_per_second": 843.83,
+      "eval_steps_per_second": 52.808,
+      "step": 2696
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 10768,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 16,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "EarlyStoppingCallback": {
+      "args": {
+        "early_stopping_patience": 2,
+        "early_stopping_threshold": 0.0
+      },
+      "attributes": {
+        "early_stopping_patience_counter": 1
+      }
+    },
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 2.2676905686859776e+16,
+  "train_batch_size": 16,
+  "trial_name": null,
+  "trial_params": null
+}

checkpoint-2696/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2e04a520e0b54409a3029464cde7d12079be452340929d293e17e45309f482f8
+size 5368

checkpoint-3370/config.json ADDED Viewed

	@@ -0,0 +1,126 @@

+{
+  "_name_or_path": "bert-base-uncased",
+  "architectures": [
+    "BertForSequenceClassification"
+  ],
+  "attention_probs_dropout_prob": 0.1,
+  "classifier_dropout": null,
+  "gradient_checkpointing": false,
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.1,
+  "hidden_size": 768,
+  "id2label": {
+    "0": "LABEL_0",
+    "1": "LABEL_1",
+    "2": "LABEL_2",
+    "3": "LABEL_3",
+    "4": "LABEL_4",
+    "5": "LABEL_5",
+    "6": "LABEL_6",
+    "7": "LABEL_7",
+    "8": "LABEL_8",
+    "9": "LABEL_9",
+    "10": "LABEL_10",
+    "11": "LABEL_11",
+    "12": "LABEL_12",
+    "13": "LABEL_13",
+    "14": "LABEL_14",
+    "15": "LABEL_15",
+    "16": "LABEL_16",
+    "17": "LABEL_17",
+    "18": "LABEL_18",
+    "19": "LABEL_19",
+    "20": "LABEL_20",
+    "21": "LABEL_21",
+    "22": "LABEL_22",
+    "23": "LABEL_23",
+    "24": "LABEL_24",
+    "25": "LABEL_25",
+    "26": "LABEL_26",
+    "27": "LABEL_27",
+    "28": "LABEL_28",
+    "29": "LABEL_29",
+    "30": "LABEL_30",
+    "31": "LABEL_31",
+    "32": "LABEL_32",
+    "33": "LABEL_33",
+    "34": "LABEL_34",
+    "35": "LABEL_35",
+    "36": "LABEL_36",
+    "37": "LABEL_37",
+    "38": "LABEL_38",
+    "39": "LABEL_39",
+    "40": "LABEL_40",
+    "41": "LABEL_41",
+    "42": "LABEL_42",
+    "43": "LABEL_43",
+    "44": "LABEL_44",
+    "45": "LABEL_45",
+    "46": "LABEL_46",
+    "47": "LABEL_47"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "label2id": {
+    "LABEL_0": 0,
+    "LABEL_1": 1,
+    "LABEL_10": 10,
+    "LABEL_11": 11,
+    "LABEL_12": 12,
+    "LABEL_13": 13,
+    "LABEL_14": 14,
+    "LABEL_15": 15,
+    "LABEL_16": 16,
+    "LABEL_17": 17,
+    "LABEL_18": 18,
+    "LABEL_19": 19,
+    "LABEL_2": 2,
+    "LABEL_20": 20,
+    "LABEL_21": 21,
+    "LABEL_22": 22,
+    "LABEL_23": 23,
+    "LABEL_24": 24,
+    "LABEL_25": 25,
+    "LABEL_26": 26,
+    "LABEL_27": 27,
+    "LABEL_28": 28,
+    "LABEL_29": 29,
+    "LABEL_3": 3,
+    "LABEL_30": 30,
+    "LABEL_31": 31,
+    "LABEL_32": 32,
+    "LABEL_33": 33,
+    "LABEL_34": 34,
+    "LABEL_35": 35,
+    "LABEL_36": 36,
+    "LABEL_37": 37,
+    "LABEL_38": 38,
+    "LABEL_39": 39,
+    "LABEL_4": 4,
+    "LABEL_40": 40,
+    "LABEL_41": 41,
+    "LABEL_42": 42,
+    "LABEL_43": 43,
+    "LABEL_44": 44,
+    "LABEL_45": 45,
+    "LABEL_46": 46,
+    "LABEL_47": 47,
+    "LABEL_5": 5,
+    "LABEL_6": 6,
+    "LABEL_7": 7,
+    "LABEL_8": 8,
+    "LABEL_9": 9
+  },
+  "layer_norm_eps": 1e-12,
+  "max_position_embeddings": 512,
+  "model_type": "bert",
+  "num_attention_heads": 12,
+  "num_hidden_layers": 12,
+  "pad_token_id": 0,
+  "position_embedding_type": "absolute",
+  "torch_dtype": "float32",
+  "transformers_version": "4.48.2",
+  "type_vocab_size": 2,
+  "use_cache": true,
+  "vocab_size": 30522
+}

checkpoint-3370/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:fc069e386a6deb789edc1a12057f57b654519f5f9fe6868369fcde2f08a30b74
+size 438100144

checkpoint-3370/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:35e4b3f3f995bb1fae31c38a3b82ef5cd9569281b00de71c26e8c4f58b271614
+size 876321402

checkpoint-3370/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e7a8de39f56cebb77b98b62c5b8379c529ea942c4cf0e172c9d640d6d9f81168
+size 14244

checkpoint-3370/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5908ea72e3438172d9daa4995d49ed342e883ef405edcfc9f86191cf29863ecf
+size 1064

checkpoint-3370/trainer_state.json ADDED Viewed

	@@ -0,0 +1,254 @@

+{
+  "best_metric": 0.9203949718676169,
+  "best_model_checkpoint": "./results/checkpoint-3370",
+  "epoch": 5.0,
+  "eval_steps": 500,
+  "global_step": 3370,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.7423904974016332,
+      "grad_norm": 1.0851198434829712,
+      "learning_rate": 2.8606983655274892e-05,
+      "loss": 0.448,
+      "step": 500
+    },
+    {
+      "epoch": 1.0,
+      "eval_administration_accuracy": 0.8700092850510678,
+      "eval_administration_f1": 0.830681542112301,
+      "eval_corruption_accuracy": 0.9301764159702879,
+      "eval_corruption_f1": 0.9210203978746075,
+      "eval_democracy_accuracy": 0.9201485608170845,
+      "eval_democracy_f1": 0.8972549864645475,
+      "eval_development_accuracy": 0.8672237697307336,
+      "eval_development_f1": 0.8462048329953127,
+      "eval_economy_accuracy": 0.9062209842154132,
+      "eval_economy_f1": 0.8952254345075943,
+      "eval_education_accuracy": 0.9467038068709378,
+      "eval_education_f1": 0.9344408657756663,
+      "eval_environment_accuracy": 0.9619312906220984,
+      "eval_environment_f1": 0.9564784032426319,
+      "eval_instability_accuracy": 0.9084493964716805,
+      "eval_instability_f1": 0.8872576883139862,
+      "eval_leadership_accuracy": 0.833983286908078,
+      "eval_leadership_f1": 0.8199437016930928,
+      "eval_loss": 0.2781185507774353,
+      "eval_overall_accuracy": 0.9090374497059734,
+      "eval_overall_f1": 0.8943279031006514,
+      "eval_race_accuracy": 0.9385329619312907,
+      "eval_race_f1": 0.9345823913548884,
+      "eval_religion_accuracy": 0.9303621169916435,
+      "eval_religion_f1": 0.9219388519537324,
+      "eval_runtime": 6.3896,
+      "eval_safety_accuracy": 0.8947075208913648,
+      "eval_safety_f1": 0.8869057409194557,
+      "eval_samples_per_second": 842.781,
+      "eval_steps_per_second": 52.742,
+      "step": 674
+    },
+    {
+      "epoch": 1.4840386043058649,
+      "grad_norm": 1.3921394348144531,
+      "learning_rate": 2.7213967310549777e-05,
+      "loss": 0.2646,
+      "step": 1000
+    },
+    {
+      "epoch": 2.0,
+      "eval_administration_accuracy": 0.886908077994429,
+      "eval_administration_f1": 0.8723732992505114,
+      "eval_corruption_accuracy": 0.9424326833797586,
+      "eval_corruption_f1": 0.9384898864061544,
+      "eval_democracy_accuracy": 0.933519034354689,
+      "eval_democracy_f1": 0.9231869597067329,
+      "eval_development_accuracy": 0.8739090064995357,
+      "eval_development_f1": 0.8668624356641937,
+      "eval_economy_accuracy": 0.9143918291550603,
+      "eval_economy_f1": 0.9111034488927022,
+      "eval_education_accuracy": 0.9580315691736304,
+      "eval_education_f1": 0.9543147194312244,
+      "eval_environment_accuracy": 0.9734447539461467,
+      "eval_environment_f1": 0.9731508098039792,
+      "eval_instability_accuracy": 0.9277623026926648,
+      "eval_instability_f1": 0.9222378035229967,
+      "eval_leadership_accuracy": 0.840297121634169,
+      "eval_leadership_f1": 0.8406461991345243,
+      "eval_loss": 0.23724055290222168,
+      "eval_overall_accuracy": 0.9205354379449089,
+      "eval_overall_f1": 0.9156647148374422,
+      "eval_race_accuracy": 0.9467038068709378,
+      "eval_race_f1": 0.943797657082642,
+      "eval_religion_accuracy": 0.9409470752089136,
+      "eval_religion_f1": 0.9380295054445577,
+      "eval_runtime": 6.3736,
+      "eval_safety_accuracy": 0.9080779944289693,
+      "eval_safety_f1": 0.9037838537090879,
+      "eval_samples_per_second": 844.886,
+      "eval_steps_per_second": 52.874,
+      "step": 1348
+    },
+    {
+      "epoch": 2.2256867112100966,
+      "grad_norm": 0.9178161025047302,
+      "learning_rate": 2.582095096582467e-05,
+      "loss": 0.2085,
+      "step": 1500
+    },
+    {
+      "epoch": 2.9680772086117297,
+      "grad_norm": 1.1747676134109497,
+      "learning_rate": 2.4427934621099553e-05,
+      "loss": 0.1696,
+      "step": 2000
+    },
+    {
+      "epoch": 3.0,
+      "eval_administration_accuracy": 0.8919220055710306,
+      "eval_administration_f1": 0.8805907698259323,
+      "eval_corruption_accuracy": 0.9454038997214484,
+      "eval_corruption_f1": 0.9422755927443824,
+      "eval_democracy_accuracy": 0.9333333333333333,
+      "eval_democracy_f1": 0.9277380787973176,
+      "eval_development_accuracy": 0.8846796657381616,
+      "eval_development_f1": 0.8767801428288444,
+      "eval_economy_accuracy": 0.9177344475394614,
+      "eval_economy_f1": 0.913190124488594,
+      "eval_education_accuracy": 0.959702878365831,
+      "eval_education_f1": 0.9592018840910198,
+      "eval_environment_accuracy": 0.9766016713091922,
+      "eval_environment_f1": 0.9753052667455842,
+      "eval_instability_accuracy": 0.9255338904363974,
+      "eval_instability_f1": 0.9219441146038561,
+      "eval_leadership_accuracy": 0.8503249767873723,
+      "eval_leadership_f1": 0.8464660955301658,
+      "eval_loss": 0.22912514209747314,
+      "eval_overall_accuracy": 0.923785205818632,
+      "eval_overall_f1": 0.9198927823234619,
+      "eval_race_accuracy": 0.9468895078922934,
+      "eval_race_f1": 0.9441406664359246,
+      "eval_religion_accuracy": 0.9418755803156917,
+      "eval_religion_f1": 0.9406664102976392,
+      "eval_runtime": 6.3983,
+      "eval_safety_accuracy": 0.9114206128133705,
+      "eval_safety_f1": 0.9104142414922826,
+      "eval_samples_per_second": 841.634,
+      "eval_steps_per_second": 52.67,
+      "step": 2022
+    },
+    {
+      "epoch": 3.7097253155159615,
+      "grad_norm": 1.7257879972457886,
+      "learning_rate": 2.3034918276374445e-05,
+      "loss": 0.1309,
+      "step": 2500
+    },
+    {
+      "epoch": 4.0,
+      "eval_administration_accuracy": 0.875766016713092,
+      "eval_administration_f1": 0.8761692862915822,
+      "eval_corruption_accuracy": 0.9465181058495822,
+      "eval_corruption_f1": 0.9432932911595113,
+      "eval_democracy_accuracy": 0.9344475394614671,
+      "eval_democracy_f1": 0.9289539940724922,
+      "eval_development_accuracy": 0.8804085422469824,
+      "eval_development_f1": 0.8733152085361343,
+      "eval_economy_accuracy": 0.9175487465181058,
+      "eval_economy_f1": 0.9168308054942083,
+      "eval_education_accuracy": 0.959702878365831,
+      "eval_education_f1": 0.9577025286068839,
+      "eval_environment_accuracy": 0.9740018570102136,
+      "eval_environment_f1": 0.9740155750677182,
+      "eval_instability_accuracy": 0.92330547818013,
+      "eval_instability_f1": 0.9214961270553598,
+      "eval_leadership_accuracy": 0.8469823584029712,
+      "eval_leadership_f1": 0.8454208641557382,
+      "eval_loss": 0.23740428686141968,
+      "eval_overall_accuracy": 0.9211853915196534,
+      "eval_overall_f1": 0.9191929747362485,
+      "eval_race_accuracy": 0.9452181987000928,
+      "eval_race_f1": 0.9441252497587079,
+      "eval_religion_accuracy": 0.940761374187558,
+      "eval_religion_f1": 0.9389083250935241,
+      "eval_runtime": 6.3816,
+      "eval_safety_accuracy": 0.9095636025998143,
+      "eval_safety_f1": 0.9100844415431236,
+      "eval_samples_per_second": 843.83,
+      "eval_steps_per_second": 52.808,
+      "step": 2696
+    },
+    {
+      "epoch": 4.451373422420193,
+      "grad_norm": 1.5328147411346436,
+      "learning_rate": 2.1641901931649333e-05,
+      "loss": 0.1085,
+      "step": 3000
+    },
+    {
+      "epoch": 5.0,
+      "eval_administration_accuracy": 0.8921077065923863,
+      "eval_administration_f1": 0.8861580465319954,
+      "eval_corruption_accuracy": 0.9463324048282266,
+      "eval_corruption_f1": 0.943458379396768,
+      "eval_democracy_accuracy": 0.9346332404828227,
+      "eval_democracy_f1": 0.9313693520601084,
+      "eval_development_accuracy": 0.8807799442896936,
+      "eval_development_f1": 0.8746742414193872,
+      "eval_economy_accuracy": 0.9175487465181058,
+      "eval_economy_f1": 0.9165794145446547,
+      "eval_education_accuracy": 0.9587743732590529,
+      "eval_education_f1": 0.9574397967431261,
+      "eval_environment_accuracy": 0.9736304549675023,
+      "eval_environment_f1": 0.9731615305259281,
+      "eval_instability_accuracy": 0.9257195914577531,
+      "eval_instability_f1": 0.9217833078621397,
+      "eval_leadership_accuracy": 0.8458681522748375,
+      "eval_leadership_f1": 0.849217017756863,
+      "eval_loss": 0.24142640829086304,
+      "eval_overall_accuracy": 0.9226245744351593,
+      "eval_overall_f1": 0.9203949718676169,
+      "eval_race_accuracy": 0.9452181987000928,
+      "eval_race_f1": 0.9418839421000289,
+      "eval_religion_accuracy": 0.9426183844011142,
+      "eval_religion_f1": 0.9420269885121756,
+      "eval_runtime": 6.3895,
+      "eval_safety_accuracy": 0.9082636954503249,
+      "eval_safety_f1": 0.9069876449582265,
+      "eval_samples_per_second": 842.785,
+      "eval_steps_per_second": 52.743,
+      "step": 3370
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 10768,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 16,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "EarlyStoppingCallback": {
+      "args": {
+        "early_stopping_patience": 2,
+        "early_stopping_threshold": 0.0
+      },
+      "attributes": {
+        "early_stopping_patience_counter": 0
+      }
+    },
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 2.834613210857472e+16,
+  "train_batch_size": 16,
+  "trial_name": null,
+  "trial_params": null
+}

checkpoint-3370/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2e04a520e0b54409a3029464cde7d12079be452340929d293e17e45309f482f8
+size 5368

checkpoint-4044/config.json ADDED Viewed

	@@ -0,0 +1,126 @@

+{
+  "_name_or_path": "bert-base-uncased",
+  "architectures": [
+    "BertForSequenceClassification"
+  ],
+  "attention_probs_dropout_prob": 0.1,
+  "classifier_dropout": null,
+  "gradient_checkpointing": false,
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.1,
+  "hidden_size": 768,
+  "id2label": {
+    "0": "LABEL_0",
+    "1": "LABEL_1",
+    "2": "LABEL_2",
+    "3": "LABEL_3",
+    "4": "LABEL_4",
+    "5": "LABEL_5",
+    "6": "LABEL_6",
+    "7": "LABEL_7",
+    "8": "LABEL_8",
+    "9": "LABEL_9",
+    "10": "LABEL_10",
+    "11": "LABEL_11",
+    "12": "LABEL_12",
+    "13": "LABEL_13",
+    "14": "LABEL_14",
+    "15": "LABEL_15",
+    "16": "LABEL_16",
+    "17": "LABEL_17",
+    "18": "LABEL_18",
+    "19": "LABEL_19",
+    "20": "LABEL_20",
+    "21": "LABEL_21",
+    "22": "LABEL_22",
+    "23": "LABEL_23",
+    "24": "LABEL_24",
+    "25": "LABEL_25",
+    "26": "LABEL_26",
+    "27": "LABEL_27",
+    "28": "LABEL_28",
+    "29": "LABEL_29",
+    "30": "LABEL_30",
+    "31": "LABEL_31",
+    "32": "LABEL_32",
+    "33": "LABEL_33",
+    "34": "LABEL_34",
+    "35": "LABEL_35",
+    "36": "LABEL_36",
+    "37": "LABEL_37",
+    "38": "LABEL_38",
+    "39": "LABEL_39",
+    "40": "LABEL_40",
+    "41": "LABEL_41",
+    "42": "LABEL_42",
+    "43": "LABEL_43",
+    "44": "LABEL_44",
+    "45": "LABEL_45",
+    "46": "LABEL_46",
+    "47": "LABEL_47"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "label2id": {
+    "LABEL_0": 0,
+    "LABEL_1": 1,
+    "LABEL_10": 10,
+    "LABEL_11": 11,
+    "LABEL_12": 12,
+    "LABEL_13": 13,
+    "LABEL_14": 14,
+    "LABEL_15": 15,
+    "LABEL_16": 16,
+    "LABEL_17": 17,
+    "LABEL_18": 18,
+    "LABEL_19": 19,
+    "LABEL_2": 2,
+    "LABEL_20": 20,
+    "LABEL_21": 21,
+    "LABEL_22": 22,
+    "LABEL_23": 23,
+    "LABEL_24": 24,
+    "LABEL_25": 25,
+    "LABEL_26": 26,
+    "LABEL_27": 27,
+    "LABEL_28": 28,
+    "LABEL_29": 29,
+    "LABEL_3": 3,
+    "LABEL_30": 30,
+    "LABEL_31": 31,
+    "LABEL_32": 32,
+    "LABEL_33": 33,
+    "LABEL_34": 34,
+    "LABEL_35": 35,
+    "LABEL_36": 36,
+    "LABEL_37": 37,
+    "LABEL_38": 38,
+    "LABEL_39": 39,
+    "LABEL_4": 4,
+    "LABEL_40": 40,
+    "LABEL_41": 41,
+    "LABEL_42": 42,
+    "LABEL_43": 43,
+    "LABEL_44": 44,
+    "LABEL_45": 45,
+    "LABEL_46": 46,
+    "LABEL_47": 47,
+    "LABEL_5": 5,
+    "LABEL_6": 6,
+    "LABEL_7": 7,
+    "LABEL_8": 8,
+    "LABEL_9": 9
+  },
+  "layer_norm_eps": 1e-12,
+  "max_position_embeddings": 512,
+  "model_type": "bert",
+  "num_attention_heads": 12,
+  "num_hidden_layers": 12,
+  "pad_token_id": 0,
+  "position_embedding_type": "absolute",
+  "torch_dtype": "float32",
+  "transformers_version": "4.48.2",
+  "type_vocab_size": 2,
+  "use_cache": true,
+  "vocab_size": 30522
+}

checkpoint-4044/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:50ae65792f946dd206a56e7171e8841d42a6d25d5695f1e1d083a0e8ad3cee3a
+size 438100144

checkpoint-4044/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3b4f90ccce91d0d7244cb66f2172c62962b5f639102025a0f65a9e9c5c9577a8
+size 876321402

checkpoint-4044/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:bc14f83f1d8bcc8e0cf5de47b08170b2935f5ce887d598ce751ad81394d1f39d
+size 14244

checkpoint-4044/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8d5bbe16a9975d3dcaf6e23f5f25fced7bda78de9f7385dedda983b7eb1e5c42
+size 1064

checkpoint-4044/trainer_state.json ADDED Viewed

	@@ -0,0 +1,302 @@

+{
+  "best_metric": 0.9203949718676169,
+  "best_model_checkpoint": "./results/checkpoint-3370",
+  "epoch": 6.0,
+  "eval_steps": 500,
+  "global_step": 4044,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.7423904974016332,
+      "grad_norm": 1.0851198434829712,
+      "learning_rate": 2.8606983655274892e-05,
+      "loss": 0.448,
+      "step": 500
+    },
+    {
+      "epoch": 1.0,
+      "eval_administration_accuracy": 0.8700092850510678,
+      "eval_administration_f1": 0.830681542112301,
+      "eval_corruption_accuracy": 0.9301764159702879,
+      "eval_corruption_f1": 0.9210203978746075,
+      "eval_democracy_accuracy": 0.9201485608170845,
+      "eval_democracy_f1": 0.8972549864645475,
+      "eval_development_accuracy": 0.8672237697307336,
+      "eval_development_f1": 0.8462048329953127,
+      "eval_economy_accuracy": 0.9062209842154132,
+      "eval_economy_f1": 0.8952254345075943,
+      "eval_education_accuracy": 0.9467038068709378,
+      "eval_education_f1": 0.9344408657756663,
+      "eval_environment_accuracy": 0.9619312906220984,
+      "eval_environment_f1": 0.9564784032426319,
+      "eval_instability_accuracy": 0.9084493964716805,
+      "eval_instability_f1": 0.8872576883139862,
+      "eval_leadership_accuracy": 0.833983286908078,
+      "eval_leadership_f1": 0.8199437016930928,
+      "eval_loss": 0.2781185507774353,
+      "eval_overall_accuracy": 0.9090374497059734,
+      "eval_overall_f1": 0.8943279031006514,
+      "eval_race_accuracy": 0.9385329619312907,
+      "eval_race_f1": 0.9345823913548884,
+      "eval_religion_accuracy": 0.9303621169916435,
+      "eval_religion_f1": 0.9219388519537324,
+      "eval_runtime": 6.3896,
+      "eval_safety_accuracy": 0.8947075208913648,
+      "eval_safety_f1": 0.8869057409194557,
+      "eval_samples_per_second": 842.781,
+      "eval_steps_per_second": 52.742,
+      "step": 674
+    },
+    {
+      "epoch": 1.4840386043058649,
+      "grad_norm": 1.3921394348144531,
+      "learning_rate": 2.7213967310549777e-05,
+      "loss": 0.2646,
+      "step": 1000
+    },
+    {
+      "epoch": 2.0,
+      "eval_administration_accuracy": 0.886908077994429,
+      "eval_administration_f1": 0.8723732992505114,
+      "eval_corruption_accuracy": 0.9424326833797586,
+      "eval_corruption_f1": 0.9384898864061544,
+      "eval_democracy_accuracy": 0.933519034354689,
+      "eval_democracy_f1": 0.9231869597067329,
+      "eval_development_accuracy": 0.8739090064995357,
+      "eval_development_f1": 0.8668624356641937,
+      "eval_economy_accuracy": 0.9143918291550603,
+      "eval_economy_f1": 0.9111034488927022,
+      "eval_education_accuracy": 0.9580315691736304,
+      "eval_education_f1": 0.9543147194312244,
+      "eval_environment_accuracy": 0.9734447539461467,
+      "eval_environment_f1": 0.9731508098039792,
+      "eval_instability_accuracy": 0.9277623026926648,
+      "eval_instability_f1": 0.9222378035229967,
+      "eval_leadership_accuracy": 0.840297121634169,
+      "eval_leadership_f1": 0.8406461991345243,
+      "eval_loss": 0.23724055290222168,
+      "eval_overall_accuracy": 0.9205354379449089,
+      "eval_overall_f1": 0.9156647148374422,
+      "eval_race_accuracy": 0.9467038068709378,
+      "eval_race_f1": 0.943797657082642,
+      "eval_religion_accuracy": 0.9409470752089136,
+      "eval_religion_f1": 0.9380295054445577,
+      "eval_runtime": 6.3736,
+      "eval_safety_accuracy": 0.9080779944289693,
+      "eval_safety_f1": 0.9037838537090879,
+      "eval_samples_per_second": 844.886,
+      "eval_steps_per_second": 52.874,
+      "step": 1348
+    },
+    {
+      "epoch": 2.2256867112100966,
+      "grad_norm": 0.9178161025047302,
+      "learning_rate": 2.582095096582467e-05,
+      "loss": 0.2085,
+      "step": 1500
+    },
+    {
+      "epoch": 2.9680772086117297,
+      "grad_norm": 1.1747676134109497,
+      "learning_rate": 2.4427934621099553e-05,
+      "loss": 0.1696,
+      "step": 2000
+    },
+    {
+      "epoch": 3.0,
+      "eval_administration_accuracy": 0.8919220055710306,
+      "eval_administration_f1": 0.8805907698259323,
+      "eval_corruption_accuracy": 0.9454038997214484,
+      "eval_corruption_f1": 0.9422755927443824,
+      "eval_democracy_accuracy": 0.9333333333333333,
+      "eval_democracy_f1": 0.9277380787973176,
+      "eval_development_accuracy": 0.8846796657381616,
+      "eval_development_f1": 0.8767801428288444,
+      "eval_economy_accuracy": 0.9177344475394614,
+      "eval_economy_f1": 0.913190124488594,
+      "eval_education_accuracy": 0.959702878365831,
+      "eval_education_f1": 0.9592018840910198,
+      "eval_environment_accuracy": 0.9766016713091922,
+      "eval_environment_f1": 0.9753052667455842,
+      "eval_instability_accuracy": 0.9255338904363974,
+      "eval_instability_f1": 0.9219441146038561,
+      "eval_leadership_accuracy": 0.8503249767873723,
+      "eval_leadership_f1": 0.8464660955301658,
+      "eval_loss": 0.22912514209747314,
+      "eval_overall_accuracy": 0.923785205818632,
+      "eval_overall_f1": 0.9198927823234619,
+      "eval_race_accuracy": 0.9468895078922934,
+      "eval_race_f1": 0.9441406664359246,
+      "eval_religion_accuracy": 0.9418755803156917,
+      "eval_religion_f1": 0.9406664102976392,
+      "eval_runtime": 6.3983,
+      "eval_safety_accuracy": 0.9114206128133705,
+      "eval_safety_f1": 0.9104142414922826,
+      "eval_samples_per_second": 841.634,
+      "eval_steps_per_second": 52.67,
+      "step": 2022
+    },
+    {
+      "epoch": 3.7097253155159615,
+      "grad_norm": 1.7257879972457886,
+      "learning_rate": 2.3034918276374445e-05,
+      "loss": 0.1309,
+      "step": 2500
+    },
+    {
+      "epoch": 4.0,
+      "eval_administration_accuracy": 0.875766016713092,
+      "eval_administration_f1": 0.8761692862915822,
+      "eval_corruption_accuracy": 0.9465181058495822,
+      "eval_corruption_f1": 0.9432932911595113,
+      "eval_democracy_accuracy": 0.9344475394614671,
+      "eval_democracy_f1": 0.9289539940724922,
+      "eval_development_accuracy": 0.8804085422469824,
+      "eval_development_f1": 0.8733152085361343,
+      "eval_economy_accuracy": 0.9175487465181058,
+      "eval_economy_f1": 0.9168308054942083,
+      "eval_education_accuracy": 0.959702878365831,
+      "eval_education_f1": 0.9577025286068839,
+      "eval_environment_accuracy": 0.9740018570102136,
+      "eval_environment_f1": 0.9740155750677182,
+      "eval_instability_accuracy": 0.92330547818013,
+      "eval_instability_f1": 0.9214961270553598,
+      "eval_leadership_accuracy": 0.8469823584029712,
+      "eval_leadership_f1": 0.8454208641557382,
+      "eval_loss": 0.23740428686141968,
+      "eval_overall_accuracy": 0.9211853915196534,
+      "eval_overall_f1": 0.9191929747362485,
+      "eval_race_accuracy": 0.9452181987000928,
+      "eval_race_f1": 0.9441252497587079,
+      "eval_religion_accuracy": 0.940761374187558,
+      "eval_religion_f1": 0.9389083250935241,
+      "eval_runtime": 6.3816,
+      "eval_safety_accuracy": 0.9095636025998143,
+      "eval_safety_f1": 0.9100844415431236,
+      "eval_samples_per_second": 843.83,
+      "eval_steps_per_second": 52.808,
+      "step": 2696
+    },
+    {
+      "epoch": 4.451373422420193,
+      "grad_norm": 1.5328147411346436,
+      "learning_rate": 2.1641901931649333e-05,
+      "loss": 0.1085,
+      "step": 3000
+    },
+    {
+      "epoch": 5.0,
+      "eval_administration_accuracy": 0.8921077065923863,
+      "eval_administration_f1": 0.8861580465319954,
+      "eval_corruption_accuracy": 0.9463324048282266,
+      "eval_corruption_f1": 0.943458379396768,
+      "eval_democracy_accuracy": 0.9346332404828227,
+      "eval_democracy_f1": 0.9313693520601084,
+      "eval_development_accuracy": 0.8807799442896936,
+      "eval_development_f1": 0.8746742414193872,
+      "eval_economy_accuracy": 0.9175487465181058,
+      "eval_economy_f1": 0.9165794145446547,
+      "eval_education_accuracy": 0.9587743732590529,
+      "eval_education_f1": 0.9574397967431261,
+      "eval_environment_accuracy": 0.9736304549675023,
+      "eval_environment_f1": 0.9731615305259281,
+      "eval_instability_accuracy": 0.9257195914577531,
+      "eval_instability_f1": 0.9217833078621397,
+      "eval_leadership_accuracy": 0.8458681522748375,
+      "eval_leadership_f1": 0.849217017756863,
+      "eval_loss": 0.24142640829086304,
+      "eval_overall_accuracy": 0.9226245744351593,
+      "eval_overall_f1": 0.9203949718676169,
+      "eval_race_accuracy": 0.9452181987000928,
+      "eval_race_f1": 0.9418839421000289,
+      "eval_religion_accuracy": 0.9426183844011142,
+      "eval_religion_f1": 0.9420269885121756,
+      "eval_runtime": 6.3895,
+      "eval_safety_accuracy": 0.9082636954503249,
+      "eval_safety_f1": 0.9069876449582265,
+      "eval_samples_per_second": 842.785,
+      "eval_steps_per_second": 52.743,
+      "step": 3370
+    },
+    {
+      "epoch": 5.193021529324425,
+      "grad_norm": 1.2458630800247192,
+      "learning_rate": 2.024888558692422e-05,
+      "loss": 0.0925,
+      "step": 3500
+    },
+    {
+      "epoch": 5.935412026726058,
+      "grad_norm": 1.964983582496643,
+      "learning_rate": 1.885586924219911e-05,
+      "loss": 0.0759,
+      "step": 4000
+    },
+    {
+      "epoch": 6.0,
+      "eval_administration_accuracy": 0.8885793871866295,
+      "eval_administration_f1": 0.8796540295327503,
+      "eval_corruption_accuracy": 0.944661095636026,
+      "eval_corruption_f1": 0.9430977714288632,
+      "eval_democracy_accuracy": 0.9312906220984215,
+      "eval_democracy_f1": 0.9311108081348881,
+      "eval_development_accuracy": 0.8809656453110493,
+      "eval_development_f1": 0.8743050043114865,
+      "eval_economy_accuracy": 0.9162488393686166,
+      "eval_economy_f1": 0.9153006920861309,
+      "eval_education_accuracy": 0.9600742804085423,
+      "eval_education_f1": 0.9587642973646463,
+      "eval_environment_accuracy": 0.9756731662024141,
+      "eval_environment_f1": 0.9753440362005743,
+      "eval_instability_accuracy": 0.9205199628597958,
+      "eval_instability_f1": 0.9185046153727873,
+      "eval_leadership_accuracy": 0.8510677808727948,
+      "eval_leadership_f1": 0.8491756854928866,
+      "eval_loss": 0.25557437539100647,
+      "eval_overall_accuracy": 0.9218198700092851,
+      "eval_overall_f1": 0.9198843837682896,
+      "eval_race_accuracy": 0.9472609099350047,
+      "eval_race_f1": 0.9465463984676691,
+      "eval_religion_accuracy": 0.9420612813370474,
+      "eval_religion_f1": 0.941883774169552,
+      "eval_runtime": 6.406,
+      "eval_safety_accuracy": 0.903435468895079,
+      "eval_safety_f1": 0.9049254926572401,
+      "eval_samples_per_second": 840.618,
+      "eval_steps_per_second": 52.607,
+      "step": 4044
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 10768,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 16,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "EarlyStoppingCallback": {
+      "args": {
+        "early_stopping_patience": 2,
+        "early_stopping_threshold": 0.0
+      },
+      "attributes": {
+        "early_stopping_patience_counter": 1
+      }
+    },
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 3.4015358530289664e+16,
+  "train_batch_size": 16,
+  "trial_name": null,
+  "trial_params": null
+}

checkpoint-4044/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2e04a520e0b54409a3029464cde7d12079be452340929d293e17e45309f482f8
+size 5368

checkpoint-4718/config.json ADDED Viewed

	@@ -0,0 +1,126 @@

+{
+  "_name_or_path": "bert-base-uncased",
+  "architectures": [
+    "BertForSequenceClassification"
+  ],
+  "attention_probs_dropout_prob": 0.1,
+  "classifier_dropout": null,
+  "gradient_checkpointing": false,
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.1,
+  "hidden_size": 768,
+  "id2label": {
+    "0": "LABEL_0",
+    "1": "LABEL_1",
+    "2": "LABEL_2",
+    "3": "LABEL_3",
+    "4": "LABEL_4",
+    "5": "LABEL_5",
+    "6": "LABEL_6",
+    "7": "LABEL_7",
+    "8": "LABEL_8",
+    "9": "LABEL_9",
+    "10": "LABEL_10",
+    "11": "LABEL_11",
+    "12": "LABEL_12",
+    "13": "LABEL_13",
+    "14": "LABEL_14",
+    "15": "LABEL_15",
+    "16": "LABEL_16",
+    "17": "LABEL_17",
+    "18": "LABEL_18",
+    "19": "LABEL_19",
+    "20": "LABEL_20",
+    "21": "LABEL_21",
+    "22": "LABEL_22",
+    "23": "LABEL_23",
+    "24": "LABEL_24",
+    "25": "LABEL_25",
+    "26": "LABEL_26",
+    "27": "LABEL_27",
+    "28": "LABEL_28",
+    "29": "LABEL_29",
+    "30": "LABEL_30",
+    "31": "LABEL_31",
+    "32": "LABEL_32",
+    "33": "LABEL_33",
+    "34": "LABEL_34",
+    "35": "LABEL_35",
+    "36": "LABEL_36",
+    "37": "LABEL_37",
+    "38": "LABEL_38",
+    "39": "LABEL_39",
+    "40": "LABEL_40",
+    "41": "LABEL_41",
+    "42": "LABEL_42",
+    "43": "LABEL_43",
+    "44": "LABEL_44",
+    "45": "LABEL_45",
+    "46": "LABEL_46",
+    "47": "LABEL_47"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "label2id": {
+    "LABEL_0": 0,
+    "LABEL_1": 1,
+    "LABEL_10": 10,
+    "LABEL_11": 11,
+    "LABEL_12": 12,
+    "LABEL_13": 13,
+    "LABEL_14": 14,
+    "LABEL_15": 15,
+    "LABEL_16": 16,
+    "LABEL_17": 17,
+    "LABEL_18": 18,
+    "LABEL_19": 19,
+    "LABEL_2": 2,
+    "LABEL_20": 20,
+    "LABEL_21": 21,
+    "LABEL_22": 22,
+    "LABEL_23": 23,
+    "LABEL_24": 24,
+    "LABEL_25": 25,
+    "LABEL_26": 26,
+    "LABEL_27": 27,
+    "LABEL_28": 28,
+    "LABEL_29": 29,
+    "LABEL_3": 3,
+    "LABEL_30": 30,
+    "LABEL_31": 31,
+    "LABEL_32": 32,
+    "LABEL_33": 33,
+    "LABEL_34": 34,
+    "LABEL_35": 35,
+    "LABEL_36": 36,
+    "LABEL_37": 37,
+    "LABEL_38": 38,
+    "LABEL_39": 39,
+    "LABEL_4": 4,
+    "LABEL_40": 40,
+    "LABEL_41": 41,
+    "LABEL_42": 42,
+    "LABEL_43": 43,
+    "LABEL_44": 44,
+    "LABEL_45": 45,
+    "LABEL_46": 46,
+    "LABEL_47": 47,
+    "LABEL_5": 5,
+    "LABEL_6": 6,
+    "LABEL_7": 7,
+    "LABEL_8": 8,
+    "LABEL_9": 9
+  },
+  "layer_norm_eps": 1e-12,
+  "max_position_embeddings": 512,
+  "model_type": "bert",
+  "num_attention_heads": 12,
+  "num_hidden_layers": 12,
+  "pad_token_id": 0,
+  "position_embedding_type": "absolute",
+  "torch_dtype": "float32",
+  "transformers_version": "4.48.2",
+  "type_vocab_size": 2,
+  "use_cache": true,
+  "vocab_size": 30522
+}

checkpoint-4718/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:239459ee5e26bfb60ee18a2ddd2b19f03414d3a5ab527beb9d4cd2508e4f07d2
+size 438100144

checkpoint-4718/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c3ae74aa8ed8d1923695fb3378148bb3e12537f41d5e7b9873d73085e55d4aff
+size 876321402

checkpoint-4718/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:35450a7534388067569db6fc13d4f16c9ae0806647d56ff8ce7dc917bbea9205
+size 14244

checkpoint-4718/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e87bacdf67f2de74e66d886eb3658fb593c867d5deb67c6a9bb916b5d65f2116
+size 1064

checkpoint-4718/trainer_state.json ADDED Viewed

	@@ -0,0 +1,343 @@

+{
+  "best_metric": 0.9203949718676169,
+  "best_model_checkpoint": "./results/checkpoint-3370",
+  "epoch": 7.0,
+  "eval_steps": 500,
+  "global_step": 4718,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.7423904974016332,
+      "grad_norm": 1.0851198434829712,
+      "learning_rate": 2.8606983655274892e-05,
+      "loss": 0.448,
+      "step": 500
+    },
+    {
+      "epoch": 1.0,
+      "eval_administration_accuracy": 0.8700092850510678,
+      "eval_administration_f1": 0.830681542112301,
+      "eval_corruption_accuracy": 0.9301764159702879,
+      "eval_corruption_f1": 0.9210203978746075,
+      "eval_democracy_accuracy": 0.9201485608170845,
+      "eval_democracy_f1": 0.8972549864645475,
+      "eval_development_accuracy": 0.8672237697307336,
+      "eval_development_f1": 0.8462048329953127,
+      "eval_economy_accuracy": 0.9062209842154132,
+      "eval_economy_f1": 0.8952254345075943,
+      "eval_education_accuracy": 0.9467038068709378,
+      "eval_education_f1": 0.9344408657756663,
+      "eval_environment_accuracy": 0.9619312906220984,
+      "eval_environment_f1": 0.9564784032426319,
+      "eval_instability_accuracy": 0.9084493964716805,
+      "eval_instability_f1": 0.8872576883139862,
+      "eval_leadership_accuracy": 0.833983286908078,
+      "eval_leadership_f1": 0.8199437016930928,
+      "eval_loss": 0.2781185507774353,
+      "eval_overall_accuracy": 0.9090374497059734,
+      "eval_overall_f1": 0.8943279031006514,
+      "eval_race_accuracy": 0.9385329619312907,
+      "eval_race_f1": 0.9345823913548884,
+      "eval_religion_accuracy": 0.9303621169916435,
+      "eval_religion_f1": 0.9219388519537324,
+      "eval_runtime": 6.3896,
+      "eval_safety_accuracy": 0.8947075208913648,
+      "eval_safety_f1": 0.8869057409194557,
+      "eval_samples_per_second": 842.781,
+      "eval_steps_per_second": 52.742,
+      "step": 674
+    },
+    {
+      "epoch": 1.4840386043058649,
+      "grad_norm": 1.3921394348144531,
+      "learning_rate": 2.7213967310549777e-05,
+      "loss": 0.2646,
+      "step": 1000
+    },
+    {
+      "epoch": 2.0,
+      "eval_administration_accuracy": 0.886908077994429,
+      "eval_administration_f1": 0.8723732992505114,
+      "eval_corruption_accuracy": 0.9424326833797586,
+      "eval_corruption_f1": 0.9384898864061544,
+      "eval_democracy_accuracy": 0.933519034354689,
+      "eval_democracy_f1": 0.9231869597067329,
+      "eval_development_accuracy": 0.8739090064995357,
+      "eval_development_f1": 0.8668624356641937,
+      "eval_economy_accuracy": 0.9143918291550603,
+      "eval_economy_f1": 0.9111034488927022,
+      "eval_education_accuracy": 0.9580315691736304,
+      "eval_education_f1": 0.9543147194312244,
+      "eval_environment_accuracy": 0.9734447539461467,
+      "eval_environment_f1": 0.9731508098039792,
+      "eval_instability_accuracy": 0.9277623026926648,
+      "eval_instability_f1": 0.9222378035229967,
+      "eval_leadership_accuracy": 0.840297121634169,
+      "eval_leadership_f1": 0.8406461991345243,
+      "eval_loss": 0.23724055290222168,
+      "eval_overall_accuracy": 0.9205354379449089,
+      "eval_overall_f1": 0.9156647148374422,
+      "eval_race_accuracy": 0.9467038068709378,
+      "eval_race_f1": 0.943797657082642,
+      "eval_religion_accuracy": 0.9409470752089136,
+      "eval_religion_f1": 0.9380295054445577,
+      "eval_runtime": 6.3736,
+      "eval_safety_accuracy": 0.9080779944289693,
+      "eval_safety_f1": 0.9037838537090879,
+      "eval_samples_per_second": 844.886,
+      "eval_steps_per_second": 52.874,
+      "step": 1348
+    },
+    {
+      "epoch": 2.2256867112100966,
+      "grad_norm": 0.9178161025047302,
+      "learning_rate": 2.582095096582467e-05,
+      "loss": 0.2085,
+      "step": 1500
+    },
+    {
+      "epoch": 2.9680772086117297,
+      "grad_norm": 1.1747676134109497,
+      "learning_rate": 2.4427934621099553e-05,
+      "loss": 0.1696,
+      "step": 2000
+    },
+    {
+      "epoch": 3.0,
+      "eval_administration_accuracy": 0.8919220055710306,
+      "eval_administration_f1": 0.8805907698259323,
+      "eval_corruption_accuracy": 0.9454038997214484,
+      "eval_corruption_f1": 0.9422755927443824,
+      "eval_democracy_accuracy": 0.9333333333333333,
+      "eval_democracy_f1": 0.9277380787973176,
+      "eval_development_accuracy": 0.8846796657381616,
+      "eval_development_f1": 0.8767801428288444,
+      "eval_economy_accuracy": 0.9177344475394614,
+      "eval_economy_f1": 0.913190124488594,
+      "eval_education_accuracy": 0.959702878365831,
+      "eval_education_f1": 0.9592018840910198,
+      "eval_environment_accuracy": 0.9766016713091922,
+      "eval_environment_f1": 0.9753052667455842,
+      "eval_instability_accuracy": 0.9255338904363974,
+      "eval_instability_f1": 0.9219441146038561,
+      "eval_leadership_accuracy": 0.8503249767873723,
+      "eval_leadership_f1": 0.8464660955301658,
+      "eval_loss": 0.22912514209747314,
+      "eval_overall_accuracy": 0.923785205818632,
+      "eval_overall_f1": 0.9198927823234619,
+      "eval_race_accuracy": 0.9468895078922934,
+      "eval_race_f1": 0.9441406664359246,
+      "eval_religion_accuracy": 0.9418755803156917,
+      "eval_religion_f1": 0.9406664102976392,
+      "eval_runtime": 6.3983,
+      "eval_safety_accuracy": 0.9114206128133705,
+      "eval_safety_f1": 0.9104142414922826,
+      "eval_samples_per_second": 841.634,
+      "eval_steps_per_second": 52.67,
+      "step": 2022
+    },
+    {
+      "epoch": 3.7097253155159615,
+      "grad_norm": 1.7257879972457886,
+      "learning_rate": 2.3034918276374445e-05,
+      "loss": 0.1309,
+      "step": 2500
+    },
+    {
+      "epoch": 4.0,
+      "eval_administration_accuracy": 0.875766016713092,
+      "eval_administration_f1": 0.8761692862915822,
+      "eval_corruption_accuracy": 0.9465181058495822,
+      "eval_corruption_f1": 0.9432932911595113,
+      "eval_democracy_accuracy": 0.9344475394614671,
+      "eval_democracy_f1": 0.9289539940724922,
+      "eval_development_accuracy": 0.8804085422469824,
+      "eval_development_f1": 0.8733152085361343,
+      "eval_economy_accuracy": 0.9175487465181058,
+      "eval_economy_f1": 0.9168308054942083,
+      "eval_education_accuracy": 0.959702878365831,
+      "eval_education_f1": 0.9577025286068839,
+      "eval_environment_accuracy": 0.9740018570102136,
+      "eval_environment_f1": 0.9740155750677182,
+      "eval_instability_accuracy": 0.92330547818013,
+      "eval_instability_f1": 0.9214961270553598,
+      "eval_leadership_accuracy": 0.8469823584029712,
+      "eval_leadership_f1": 0.8454208641557382,
+      "eval_loss": 0.23740428686141968,
+      "eval_overall_accuracy": 0.9211853915196534,
+      "eval_overall_f1": 0.9191929747362485,
+      "eval_race_accuracy": 0.9452181987000928,
+      "eval_race_f1": 0.9441252497587079,
+      "eval_religion_accuracy": 0.940761374187558,
+      "eval_religion_f1": 0.9389083250935241,
+      "eval_runtime": 6.3816,
+      "eval_safety_accuracy": 0.9095636025998143,
+      "eval_safety_f1": 0.9100844415431236,
+      "eval_samples_per_second": 843.83,
+      "eval_steps_per_second": 52.808,
+      "step": 2696
+    },
+    {
+      "epoch": 4.451373422420193,
+      "grad_norm": 1.5328147411346436,
+      "learning_rate": 2.1641901931649333e-05,
+      "loss": 0.1085,
+      "step": 3000
+    },
+    {
+      "epoch": 5.0,
+      "eval_administration_accuracy": 0.8921077065923863,
+      "eval_administration_f1": 0.8861580465319954,
+      "eval_corruption_accuracy": 0.9463324048282266,
+      "eval_corruption_f1": 0.943458379396768,
+      "eval_democracy_accuracy": 0.9346332404828227,
+      "eval_democracy_f1": 0.9313693520601084,
+      "eval_development_accuracy": 0.8807799442896936,
+      "eval_development_f1": 0.8746742414193872,
+      "eval_economy_accuracy": 0.9175487465181058,
+      "eval_economy_f1": 0.9165794145446547,
+      "eval_education_accuracy": 0.9587743732590529,
+      "eval_education_f1": 0.9574397967431261,
+      "eval_environment_accuracy": 0.9736304549675023,
+      "eval_environment_f1": 0.9731615305259281,
+      "eval_instability_accuracy": 0.9257195914577531,
+      "eval_instability_f1": 0.9217833078621397,
+      "eval_leadership_accuracy": 0.8458681522748375,
+      "eval_leadership_f1": 0.849217017756863,
+      "eval_loss": 0.24142640829086304,
+      "eval_overall_accuracy": 0.9226245744351593,
+      "eval_overall_f1": 0.9203949718676169,
+      "eval_race_accuracy": 0.9452181987000928,
+      "eval_race_f1": 0.9418839421000289,
+      "eval_religion_accuracy": 0.9426183844011142,
+      "eval_religion_f1": 0.9420269885121756,
+      "eval_runtime": 6.3895,
+      "eval_safety_accuracy": 0.9082636954503249,
+      "eval_safety_f1": 0.9069876449582265,
+      "eval_samples_per_second": 842.785,
+      "eval_steps_per_second": 52.743,
+      "step": 3370
+    },
+    {
+      "epoch": 5.193021529324425,
+      "grad_norm": 1.2458630800247192,
+      "learning_rate": 2.024888558692422e-05,
+      "loss": 0.0925,
+      "step": 3500
+    },
+    {
+      "epoch": 5.935412026726058,
+      "grad_norm": 1.964983582496643,
+      "learning_rate": 1.885586924219911e-05,
+      "loss": 0.0759,
+      "step": 4000
+    },
+    {
+      "epoch": 6.0,
+      "eval_administration_accuracy": 0.8885793871866295,
+      "eval_administration_f1": 0.8796540295327503,
+      "eval_corruption_accuracy": 0.944661095636026,
+      "eval_corruption_f1": 0.9430977714288632,
+      "eval_democracy_accuracy": 0.9312906220984215,
+      "eval_democracy_f1": 0.9311108081348881,
+      "eval_development_accuracy": 0.8809656453110493,
+      "eval_development_f1": 0.8743050043114865,
+      "eval_economy_accuracy": 0.9162488393686166,
+      "eval_economy_f1": 0.9153006920861309,
+      "eval_education_accuracy": 0.9600742804085423,
+      "eval_education_f1": 0.9587642973646463,
+      "eval_environment_accuracy": 0.9756731662024141,
+      "eval_environment_f1": 0.9753440362005743,
+      "eval_instability_accuracy": 0.9205199628597958,
+      "eval_instability_f1": 0.9185046153727873,
+      "eval_leadership_accuracy": 0.8510677808727948,
+      "eval_leadership_f1": 0.8491756854928866,
+      "eval_loss": 0.25557437539100647,
+      "eval_overall_accuracy": 0.9218198700092851,
+      "eval_overall_f1": 0.9198843837682896,
+      "eval_race_accuracy": 0.9472609099350047,
+      "eval_race_f1": 0.9465463984676691,
+      "eval_religion_accuracy": 0.9420612813370474,
+      "eval_religion_f1": 0.941883774169552,
+      "eval_runtime": 6.406,
+      "eval_safety_accuracy": 0.903435468895079,
+      "eval_safety_f1": 0.9049254926572401,
+      "eval_samples_per_second": 840.618,
+      "eval_steps_per_second": 52.607,
+      "step": 4044
+    },
+    {
+      "epoch": 6.67706013363029,
+      "grad_norm": 1.1733307838439941,
+      "learning_rate": 1.7462852897474e-05,
+      "loss": 0.0618,
+      "step": 4500
+    },
+    {
+      "epoch": 7.0,
+      "eval_administration_accuracy": 0.8891364902506964,
+      "eval_administration_f1": 0.8830637895995853,
+      "eval_corruption_accuracy": 0.9441039925719591,
+      "eval_corruption_f1": 0.9419800967289127,
+      "eval_democracy_accuracy": 0.9318477251624884,
+      "eval_democracy_f1": 0.9312436052041511,
+      "eval_development_accuracy": 0.8748375116063138,
+      "eval_development_f1": 0.8709535653934616,
+      "eval_economy_accuracy": 0.9151346332404828,
+      "eval_economy_f1": 0.9143035893385101,
+      "eval_education_accuracy": 0.9567316620241412,
+      "eval_education_f1": 0.956532871707756,
+      "eval_environment_accuracy": 0.9745589600742804,
+      "eval_environment_f1": 0.9745453763641572,
+      "eval_instability_accuracy": 0.9197771587743733,
+      "eval_instability_f1": 0.9164183053432433,
+      "eval_leadership_accuracy": 0.8493964716805943,
+      "eval_leadership_f1": 0.848764162637075,
+      "eval_loss": 0.2655349373817444,
+      "eval_overall_accuracy": 0.9205663881151346,
+      "eval_overall_f1": 0.9191255338624242,
+      "eval_race_accuracy": 0.9455896007428041,
+      "eval_race_f1": 0.9449102601982086,
+      "eval_religion_accuracy": 0.9424326833797586,
+      "eval_religion_f1": 0.9425971967753438,
+      "eval_runtime": 6.378,
+      "eval_safety_accuracy": 0.9032497678737234,
+      "eval_safety_f1": 0.9041935870586874,
+      "eval_samples_per_second": 844.304,
+      "eval_steps_per_second": 52.838,
+      "step": 4718
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 10768,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 16,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "EarlyStoppingCallback": {
+      "args": {
+        "early_stopping_patience": 2,
+        "early_stopping_threshold": 0.0
+      },
+      "attributes": {
+        "early_stopping_patience_counter": 2
+      }
+    },
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": true
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 3.968458495200461e+16,
+  "train_batch_size": 16,
+  "trial_name": null,
+  "trial_params": null
+}

checkpoint-4718/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2e04a520e0b54409a3029464cde7d12079be452340929d293e17e45309f482f8
+size 5368

checkpoint-674/config.json ADDED Viewed

	@@ -0,0 +1,126 @@

+{
+  "_name_or_path": "bert-base-uncased",
+  "architectures": [
+    "BertForSequenceClassification"
+  ],
+  "attention_probs_dropout_prob": 0.1,
+  "classifier_dropout": null,
+  "gradient_checkpointing": false,
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.1,
+  "hidden_size": 768,
+  "id2label": {
+    "0": "LABEL_0",
+    "1": "LABEL_1",
+    "2": "LABEL_2",
+    "3": "LABEL_3",
+    "4": "LABEL_4",
+    "5": "LABEL_5",
+    "6": "LABEL_6",
+    "7": "LABEL_7",
+    "8": "LABEL_8",
+    "9": "LABEL_9",
+    "10": "LABEL_10",
+    "11": "LABEL_11",
+    "12": "LABEL_12",
+    "13": "LABEL_13",
+    "14": "LABEL_14",
+    "15": "LABEL_15",
+    "16": "LABEL_16",
+    "17": "LABEL_17",
+    "18": "LABEL_18",
+    "19": "LABEL_19",
+    "20": "LABEL_20",
+    "21": "LABEL_21",
+    "22": "LABEL_22",
+    "23": "LABEL_23",
+    "24": "LABEL_24",
+    "25": "LABEL_25",
+    "26": "LABEL_26",
+    "27": "LABEL_27",
+    "28": "LABEL_28",
+    "29": "LABEL_29",
+    "30": "LABEL_30",
+    "31": "LABEL_31",
+    "32": "LABEL_32",
+    "33": "LABEL_33",
+    "34": "LABEL_34",
+    "35": "LABEL_35",
+    "36": "LABEL_36",
+    "37": "LABEL_37",
+    "38": "LABEL_38",
+    "39": "LABEL_39",
+    "40": "LABEL_40",
+    "41": "LABEL_41",
+    "42": "LABEL_42",
+    "43": "LABEL_43",
+    "44": "LABEL_44",
+    "45": "LABEL_45",
+    "46": "LABEL_46",
+    "47": "LABEL_47"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "label2id": {
+    "LABEL_0": 0,
+    "LABEL_1": 1,
+    "LABEL_10": 10,
+    "LABEL_11": 11,
+    "LABEL_12": 12,
+    "LABEL_13": 13,
+    "LABEL_14": 14,
+    "LABEL_15": 15,
+    "LABEL_16": 16,
+    "LABEL_17": 17,
+    "LABEL_18": 18,
+    "LABEL_19": 19,
+    "LABEL_2": 2,
+    "LABEL_20": 20,
+    "LABEL_21": 21,
+    "LABEL_22": 22,
+    "LABEL_23": 23,
+    "LABEL_24": 24,
+    "LABEL_25": 25,
+    "LABEL_26": 26,
+    "LABEL_27": 27,
+    "LABEL_28": 28,
+    "LABEL_29": 29,
+    "LABEL_3": 3,
+    "LABEL_30": 30,
+    "LABEL_31": 31,
+    "LABEL_32": 32,
+    "LABEL_33": 33,
+    "LABEL_34": 34,
+    "LABEL_35": 35,
+    "LABEL_36": 36,
+    "LABEL_37": 37,
+    "LABEL_38": 38,
+    "LABEL_39": 39,
+    "LABEL_4": 4,
+    "LABEL_40": 40,
+    "LABEL_41": 41,
+    "LABEL_42": 42,
+    "LABEL_43": 43,
+    "LABEL_44": 44,
+    "LABEL_45": 45,
+    "LABEL_46": 46,
+    "LABEL_47": 47,
+    "LABEL_5": 5,
+    "LABEL_6": 6,
+    "LABEL_7": 7,
+    "LABEL_8": 8,
+    "LABEL_9": 9
+  },
+  "layer_norm_eps": 1e-12,
+  "max_position_embeddings": 512,
+  "model_type": "bert",
+  "num_attention_heads": 12,
+  "num_hidden_layers": 12,
+  "pad_token_id": 0,
+  "position_embedding_type": "absolute",
+  "torch_dtype": "float32",
+  "transformers_version": "4.48.2",
+  "type_vocab_size": 2,
+  "use_cache": true,
+  "vocab_size": 30522
+}

checkpoint-674/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b3d49ce2f1a0d0092e1c0c0cd7fab055a42d4b88fc148888c40876ab95f86abd
+size 438100144

checkpoint-674/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:87f29edb5809f4669985e698b6315aa7d40836eb8562e5760932f7ed0d42168e
+size 876321402

checkpoint-674/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6d911a0bdc9ef9f737150dae5e889b348d434cf30a1a9f52362f02dc016393dd
+size 14244

checkpoint-674/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:1547eae16c074f20d1a13d5cb87c5bda11f93c49f4196988823c5e3b0a74c12e
+size 1064

checkpoint-674/trainer_state.json ADDED Viewed

	@@ -0,0 +1,83 @@

+{
+  "best_metric": 0.8943279031006514,
+  "best_model_checkpoint": "./results/checkpoint-674",
+  "epoch": 1.0,
+  "eval_steps": 500,
+  "global_step": 674,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.7423904974016332,
+      "grad_norm": 1.0851198434829712,
+      "learning_rate": 2.8606983655274892e-05,
+      "loss": 0.448,
+      "step": 500
+    },
+    {
+      "epoch": 1.0,
+      "eval_administration_accuracy": 0.8700092850510678,
+      "eval_administration_f1": 0.830681542112301,
+      "eval_corruption_accuracy": 0.9301764159702879,
+      "eval_corruption_f1": 0.9210203978746075,
+      "eval_democracy_accuracy": 0.9201485608170845,
+      "eval_democracy_f1": 0.8972549864645475,
+      "eval_development_accuracy": 0.8672237697307336,
+      "eval_development_f1": 0.8462048329953127,
+      "eval_economy_accuracy": 0.9062209842154132,
+      "eval_economy_f1": 0.8952254345075943,
+      "eval_education_accuracy": 0.9467038068709378,
+      "eval_education_f1": 0.9344408657756663,
+      "eval_environment_accuracy": 0.9619312906220984,
+      "eval_environment_f1": 0.9564784032426319,
+      "eval_instability_accuracy": 0.9084493964716805,
+      "eval_instability_f1": 0.8872576883139862,
+      "eval_leadership_accuracy": 0.833983286908078,
+      "eval_leadership_f1": 0.8199437016930928,
+      "eval_loss": 0.2781185507774353,
+      "eval_overall_accuracy": 0.9090374497059734,
+      "eval_overall_f1": 0.8943279031006514,
+      "eval_race_accuracy": 0.9385329619312907,
+      "eval_race_f1": 0.9345823913548884,
+      "eval_religion_accuracy": 0.9303621169916435,
+      "eval_religion_f1": 0.9219388519537324,
+      "eval_runtime": 6.3896,
+      "eval_safety_accuracy": 0.8947075208913648,
+      "eval_safety_f1": 0.8869057409194557,
+      "eval_samples_per_second": 842.781,
+      "eval_steps_per_second": 52.742,
+      "step": 674
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 10768,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 16,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "EarlyStoppingCallback": {
+      "args": {
+        "early_stopping_patience": 2,
+        "early_stopping_threshold": 0.0
+      },
+      "attributes": {
+        "early_stopping_patience_counter": 0
+      }
+    },
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 5669226421714944.0,
+  "train_batch_size": 16,
+  "trial_name": null,
+  "trial_params": null
+}

checkpoint-674/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2e04a520e0b54409a3029464cde7d12079be452340929d293e17e45309f482f8
+size 5368

special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}