HimAJ committed on Dec 16, 2025

Commit

395efd4

verified ·

1 Parent(s): 112d5a7

Upload folder using huggingface_hub

Browse files

Files changed (24) hide show

checkpoint-3400/config.json +45 -0
checkpoint-3400/model.safetensors +3 -0
checkpoint-3400/optimizer.pt +3 -0
checkpoint-3400/rng_state.pth +3 -0
checkpoint-3400/scheduler.pt +3 -0
checkpoint-3400/trainer_state.json +290 -0
checkpoint-3400/training_args.bin +3 -0
checkpoint-3600/config.json +45 -0
checkpoint-3600/model.safetensors +3 -0
checkpoint-3600/optimizer.pt +3 -0
checkpoint-3600/rng_state.pth +3 -0
checkpoint-3600/scheduler.pt +3 -0
checkpoint-3600/trainer_state.json +304 -0
checkpoint-3600/training_args.bin +3 -0
checkpoint-3732/config.json +45 -0
checkpoint-3732/model.safetensors +3 -0
checkpoint-3732/optimizer.pt +3 -0
checkpoint-3732/rng_state.pth +3 -0
checkpoint-3732/scheduler.pt +3 -0
checkpoint-3732/trainer_state.json +311 -0
checkpoint-3732/training_args.bin +3 -0
config.json +45 -0
model.safetensors +3 -0
preprocessor_config.json +24 -0

checkpoint-3400/config.json ADDED Viewed

	@@ -0,0 +1,45 @@

+{
+  "architectures": [
+    "ViTForImageClassification"
+  ],
+  "attention_probs_dropout_prob": 0.0,
+  "dtype": "float32",
+  "encoder_stride": 16,
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.0,
+  "hidden_size": 768,
+  "id2label": {
+    "0": "anger",
+    "1": "contempt",
+    "2": "disgust",
+    "3": "fear",
+    "4": "happy",
+    "5": "neutral",
+    "6": "sad",
+    "7": "surprise"
+  },
+  "image_size": 224,
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "label2id": {
+    "anger": "0",
+    "contempt": "1",
+    "disgust": "2",
+    "fear": "3",
+    "happy": "4",
+    "neutral": "5",
+    "sad": "6",
+    "surprise": "7"
+  },
+  "layer_norm_eps": 1e-12,
+  "model_type": "vit",
+  "num_attention_heads": 12,
+  "num_channels": 3,
+  "num_hidden_layers": 12,
+  "patch_size": 16,
+  "pooler_act": "tanh",
+  "pooler_output_size": 768,
+  "problem_type": "single_label_classification",
+  "qkv_bias": true,
+  "transformers_version": "4.57.3"
+}

checkpoint-3400/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:41f0456248e27f1f0606463d3f5816840ca22ae7f3864137bd1529d62a54df1a
+size 343242432

checkpoint-3400/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2df1d0d882d9d2bcddd02570db69852accefd36809d5f4529d772df9696f5e69
+size 686600587

checkpoint-3400/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:22dbf3c2822bd0e012a008f2f8f6fc37e79fd72d0b78e165acf9c07025f5405f
+size 14455

checkpoint-3400/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c12d23a7bc6ab06788f8ab2a95b69ea92d91493a5ff0dec3f64c332eb5606cce
+size 1465

checkpoint-3400/trainer_state.json ADDED Viewed

	@@ -0,0 +1,290 @@

+{
+  "best_global_step": 2488,
+  "best_metric": 0.7773311897106109,
+  "best_model_checkpoint": null,
+  "epoch": 2.733118971061093,
+  "eval_steps": 500,
+  "global_step": 3400,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.08038585209003216,
+      "grad_norm": 10.019948959350586,
+      "learning_rate": 1.946945337620579e-05,
+      "loss": 1.2824,
+      "step": 100
+    },
+    {
+      "epoch": 0.1607717041800643,
+      "grad_norm": 8.063481330871582,
+      "learning_rate": 1.8933547695605573e-05,
+      "loss": 1.159,
+      "step": 200
+    },
+    {
+      "epoch": 0.24115755627009647,
+      "grad_norm": 13.041501998901367,
+      "learning_rate": 1.839764201500536e-05,
+      "loss": 1.0909,
+      "step": 300
+    },
+    {
+      "epoch": 0.3215434083601286,
+      "grad_norm": 8.986650466918945,
+      "learning_rate": 1.7861736334405145e-05,
+      "loss": 1.0968,
+      "step": 400
+    },
+    {
+      "epoch": 0.40192926045016075,
+      "grad_norm": 7.692521572113037,
+      "learning_rate": 1.732583065380493e-05,
+      "loss": 1.0873,
+      "step": 500
+    },
+    {
+      "epoch": 0.48231511254019294,
+      "grad_norm": 9.055645942687988,
+      "learning_rate": 1.6789924973204718e-05,
+      "loss": 1.0169,
+      "step": 600
+    },
+    {
+      "epoch": 0.5627009646302251,
+      "grad_norm": 7.9042463302612305,
+      "learning_rate": 1.6254019292604505e-05,
+      "loss": 1.0865,
+      "step": 700
+    },
+    {
+      "epoch": 0.6430868167202572,
+      "grad_norm": 7.55495548248291,
+      "learning_rate": 1.571811361200429e-05,
+      "loss": 1.0137,
+      "step": 800
+    },
+    {
+      "epoch": 0.7234726688102894,
+      "grad_norm": 6.291072368621826,
+      "learning_rate": 1.5182207931404074e-05,
+      "loss": 1.0695,
+      "step": 900
+    },
+    {
+      "epoch": 0.8038585209003215,
+      "grad_norm": 9.746781349182129,
+      "learning_rate": 1.4646302250803858e-05,
+      "loss": 1.0335,
+      "step": 1000
+    },
+    {
+      "epoch": 0.8842443729903537,
+      "grad_norm": 6.898703098297119,
+      "learning_rate": 1.4110396570203646e-05,
+      "loss": 0.987,
+      "step": 1100
+    },
+    {
+      "epoch": 0.9646302250803859,
+      "grad_norm": 8.23352336883545,
+      "learning_rate": 1.3574490889603432e-05,
+      "loss": 0.9442,
+      "step": 1200
+    },
+    {
+      "epoch": 1.0,
+      "eval_accuracy": 0.6370578778135049,
+      "eval_loss": 0.9694849848747253,
+      "eval_runtime": 840.7369,
+      "eval_samples_per_second": 2.959,
+      "eval_steps_per_second": 0.37,
+      "step": 1244
+    },
+    {
+      "epoch": 1.045016077170418,
+      "grad_norm": 9.776803016662598,
+      "learning_rate": 1.3038585209003216e-05,
+      "loss": 0.868,
+      "step": 1300
+    },
+    {
+      "epoch": 1.1254019292604502,
+      "grad_norm": 10.52991771697998,
+      "learning_rate": 1.2502679528403e-05,
+      "loss": 0.7531,
+      "step": 1400
+    },
+    {
+      "epoch": 1.2057877813504823,
+      "grad_norm": 11.897740364074707,
+      "learning_rate": 1.1966773847802788e-05,
+      "loss": 0.7265,
+      "step": 1500
+    },
+    {
+      "epoch": 1.2861736334405145,
+      "grad_norm": 7.514660835266113,
+      "learning_rate": 1.1430868167202574e-05,
+      "loss": 0.7793,
+      "step": 1600
+    },
+    {
+      "epoch": 1.3665594855305465,
+      "grad_norm": 10.338397979736328,
+      "learning_rate": 1.0894962486602359e-05,
+      "loss": 0.7701,
+      "step": 1700
+    },
+    {
+      "epoch": 1.4469453376205788,
+      "grad_norm": 13.336085319519043,
+      "learning_rate": 1.0359056806002143e-05,
+      "loss": 0.7251,
+      "step": 1800
+    },
+    {
+      "epoch": 1.527331189710611,
+      "grad_norm": 9.34284496307373,
+      "learning_rate": 9.823151125401929e-06,
+      "loss": 0.7506,
+      "step": 1900
+    },
+    {
+      "epoch": 1.607717041800643,
+      "grad_norm": 10.490428924560547,
+      "learning_rate": 9.287245444801717e-06,
+      "loss": 0.7982,
+      "step": 2000
+    },
+    {
+      "epoch": 1.6881028938906752,
+      "grad_norm": 7.529485702514648,
+      "learning_rate": 8.751339764201501e-06,
+      "loss": 0.6313,
+      "step": 2100
+    },
+    {
+      "epoch": 1.7684887459807075,
+      "grad_norm": 12.055130958557129,
+      "learning_rate": 8.215434083601287e-06,
+      "loss": 0.6671,
+      "step": 2200
+    },
+    {
+      "epoch": 1.8488745980707395,
+      "grad_norm": 8.625040054321289,
+      "learning_rate": 7.679528403001071e-06,
+      "loss": 0.6896,
+      "step": 2300
+    },
+    {
+      "epoch": 1.9292604501607717,
+      "grad_norm": 8.715214729309082,
+      "learning_rate": 7.143622722400858e-06,
+      "loss": 0.672,
+      "step": 2400
+    },
+    {
+      "epoch": 2.0,
+      "eval_accuracy": 0.7773311897106109,
+      "eval_loss": 0.6390692591667175,
+      "eval_runtime": 680.6477,
+      "eval_samples_per_second": 3.655,
+      "eval_steps_per_second": 0.457,
+      "step": 2488
+    },
+    {
+      "epoch": 2.009646302250804,
+      "grad_norm": 15.922383308410645,
+      "learning_rate": 6.607717041800643e-06,
+      "loss": 0.6789,
+      "step": 2500
+    },
+    {
+      "epoch": 2.090032154340836,
+      "grad_norm": 5.49733829498291,
+      "learning_rate": 6.071811361200429e-06,
+      "loss": 0.5946,
+      "step": 2600
+    },
+    {
+      "epoch": 2.170418006430868,
+      "grad_norm": 7.4076714515686035,
+      "learning_rate": 5.535905680600214e-06,
+      "loss": 0.5985,
+      "step": 2700
+    },
+    {
+      "epoch": 2.2508038585209005,
+      "grad_norm": 10.85772705078125,
+      "learning_rate": 5e-06,
+      "loss": 0.6036,
+      "step": 2800
+    },
+    {
+      "epoch": 2.3311897106109325,
+      "grad_norm": 7.137866497039795,
+      "learning_rate": 4.4640943193997856e-06,
+      "loss": 0.5502,
+      "step": 2900
+    },
+    {
+      "epoch": 2.4115755627009645,
+      "grad_norm": 6.020912170410156,
+      "learning_rate": 3.928188638799572e-06,
+      "loss": 0.6147,
+      "step": 3000
+    },
+    {
+      "epoch": 2.491961414790997,
+      "grad_norm": 13.015932083129883,
+      "learning_rate": 3.392282958199357e-06,
+      "loss": 0.5449,
+      "step": 3100
+    },
+    {
+      "epoch": 2.572347266881029,
+      "grad_norm": 9.120644569396973,
+      "learning_rate": 2.8563772775991428e-06,
+      "loss": 0.5881,
+      "step": 3200
+    },
+    {
+      "epoch": 2.652733118971061,
+      "grad_norm": 8.311524391174316,
+      "learning_rate": 2.3204715969989283e-06,
+      "loss": 0.5486,
+      "step": 3300
+    },
+    {
+      "epoch": 2.733118971061093,
+      "grad_norm": 13.35053825378418,
+      "learning_rate": 1.784565916398714e-06,
+      "loss": 0.5958,
+      "step": 3400
+    }
+  ],
+  "logging_steps": 100,
+  "max_steps": 3732,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 3,
+  "save_steps": 200,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 2.1072754965687828e+18,
+  "train_batch_size": 8,
+  "trial_name": null,
+  "trial_params": null
+}

checkpoint-3400/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d0ba41b78fb9f233a65b0c2a6b875ec90644efb6b193c931d1e5c5f69391c7d7
+size 5905

checkpoint-3600/config.json ADDED Viewed

	@@ -0,0 +1,45 @@

+{
+  "architectures": [
+    "ViTForImageClassification"
+  ],
+  "attention_probs_dropout_prob": 0.0,
+  "dtype": "float32",
+  "encoder_stride": 16,
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.0,
+  "hidden_size": 768,
+  "id2label": {
+    "0": "anger",
+    "1": "contempt",
+    "2": "disgust",
+    "3": "fear",
+    "4": "happy",
+    "5": "neutral",
+    "6": "sad",
+    "7": "surprise"
+  },
+  "image_size": 224,
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "label2id": {
+    "anger": "0",
+    "contempt": "1",
+    "disgust": "2",
+    "fear": "3",
+    "happy": "4",
+    "neutral": "5",
+    "sad": "6",
+    "surprise": "7"
+  },
+  "layer_norm_eps": 1e-12,
+  "model_type": "vit",
+  "num_attention_heads": 12,
+  "num_channels": 3,
+  "num_hidden_layers": 12,
+  "patch_size": 16,
+  "pooler_act": "tanh",
+  "pooler_output_size": 768,
+  "problem_type": "single_label_classification",
+  "qkv_bias": true,
+  "transformers_version": "4.57.3"
+}

checkpoint-3600/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2d3141b1d64241c51bb55415ba3e4f7ff173b8479aec154e69e3497ac04489bf
+size 343242432

checkpoint-3600/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a525dc18888b1155712c0e7873959c112cf51e6afd289c03c9f326dffcb13b3f
+size 686600587

checkpoint-3600/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:22dbf3c2822bd0e012a008f2f8f6fc37e79fd72d0b78e165acf9c07025f5405f
+size 14455

checkpoint-3600/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d5fb3a26ee12109820d069cdf6b9f01db3c645d99db15921417a38e8b948cd69
+size 1465

checkpoint-3600/trainer_state.json ADDED Viewed

	@@ -0,0 +1,304 @@

+{
+  "best_global_step": 2488,
+  "best_metric": 0.7773311897106109,
+  "best_model_checkpoint": null,
+  "epoch": 2.8938906752411575,
+  "eval_steps": 500,
+  "global_step": 3600,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.08038585209003216,
+      "grad_norm": 10.019948959350586,
+      "learning_rate": 1.946945337620579e-05,
+      "loss": 1.2824,
+      "step": 100
+    },
+    {
+      "epoch": 0.1607717041800643,
+      "grad_norm": 8.063481330871582,
+      "learning_rate": 1.8933547695605573e-05,
+      "loss": 1.159,
+      "step": 200
+    },
+    {
+      "epoch": 0.24115755627009647,
+      "grad_norm": 13.041501998901367,
+      "learning_rate": 1.839764201500536e-05,
+      "loss": 1.0909,
+      "step": 300
+    },
+    {
+      "epoch": 0.3215434083601286,
+      "grad_norm": 8.986650466918945,
+      "learning_rate": 1.7861736334405145e-05,
+      "loss": 1.0968,
+      "step": 400
+    },
+    {
+      "epoch": 0.40192926045016075,
+      "grad_norm": 7.692521572113037,
+      "learning_rate": 1.732583065380493e-05,
+      "loss": 1.0873,
+      "step": 500
+    },
+    {
+      "epoch": 0.48231511254019294,
+      "grad_norm": 9.055645942687988,
+      "learning_rate": 1.6789924973204718e-05,
+      "loss": 1.0169,
+      "step": 600
+    },
+    {
+      "epoch": 0.5627009646302251,
+      "grad_norm": 7.9042463302612305,
+      "learning_rate": 1.6254019292604505e-05,
+      "loss": 1.0865,
+      "step": 700
+    },
+    {
+      "epoch": 0.6430868167202572,
+      "grad_norm": 7.55495548248291,
+      "learning_rate": 1.571811361200429e-05,
+      "loss": 1.0137,
+      "step": 800
+    },
+    {
+      "epoch": 0.7234726688102894,
+      "grad_norm": 6.291072368621826,
+      "learning_rate": 1.5182207931404074e-05,
+      "loss": 1.0695,
+      "step": 900
+    },
+    {
+      "epoch": 0.8038585209003215,
+      "grad_norm": 9.746781349182129,
+      "learning_rate": 1.4646302250803858e-05,
+      "loss": 1.0335,
+      "step": 1000
+    },
+    {
+      "epoch": 0.8842443729903537,
+      "grad_norm": 6.898703098297119,
+      "learning_rate": 1.4110396570203646e-05,
+      "loss": 0.987,
+      "step": 1100
+    },
+    {
+      "epoch": 0.9646302250803859,
+      "grad_norm": 8.23352336883545,
+      "learning_rate": 1.3574490889603432e-05,
+      "loss": 0.9442,
+      "step": 1200
+    },
+    {
+      "epoch": 1.0,
+      "eval_accuracy": 0.6370578778135049,
+      "eval_loss": 0.9694849848747253,
+      "eval_runtime": 840.7369,
+      "eval_samples_per_second": 2.959,
+      "eval_steps_per_second": 0.37,
+      "step": 1244
+    },
+    {
+      "epoch": 1.045016077170418,
+      "grad_norm": 9.776803016662598,
+      "learning_rate": 1.3038585209003216e-05,
+      "loss": 0.868,
+      "step": 1300
+    },
+    {
+      "epoch": 1.1254019292604502,
+      "grad_norm": 10.52991771697998,
+      "learning_rate": 1.2502679528403e-05,
+      "loss": 0.7531,
+      "step": 1400
+    },
+    {
+      "epoch": 1.2057877813504823,
+      "grad_norm": 11.897740364074707,
+      "learning_rate": 1.1966773847802788e-05,
+      "loss": 0.7265,
+      "step": 1500
+    },
+    {
+      "epoch": 1.2861736334405145,
+      "grad_norm": 7.514660835266113,
+      "learning_rate": 1.1430868167202574e-05,
+      "loss": 0.7793,
+      "step": 1600
+    },
+    {
+      "epoch": 1.3665594855305465,
+      "grad_norm": 10.338397979736328,
+      "learning_rate": 1.0894962486602359e-05,
+      "loss": 0.7701,
+      "step": 1700
+    },
+    {
+      "epoch": 1.4469453376205788,
+      "grad_norm": 13.336085319519043,
+      "learning_rate": 1.0359056806002143e-05,
+      "loss": 0.7251,
+      "step": 1800
+    },
+    {
+      "epoch": 1.527331189710611,
+      "grad_norm": 9.34284496307373,
+      "learning_rate": 9.823151125401929e-06,
+      "loss": 0.7506,
+      "step": 1900
+    },
+    {
+      "epoch": 1.607717041800643,
+      "grad_norm": 10.490428924560547,
+      "learning_rate": 9.287245444801717e-06,
+      "loss": 0.7982,
+      "step": 2000
+    },
+    {
+      "epoch": 1.6881028938906752,
+      "grad_norm": 7.529485702514648,
+      "learning_rate": 8.751339764201501e-06,
+      "loss": 0.6313,
+      "step": 2100
+    },
+    {
+      "epoch": 1.7684887459807075,
+      "grad_norm": 12.055130958557129,
+      "learning_rate": 8.215434083601287e-06,
+      "loss": 0.6671,
+      "step": 2200
+    },
+    {
+      "epoch": 1.8488745980707395,
+      "grad_norm": 8.625040054321289,
+      "learning_rate": 7.679528403001071e-06,
+      "loss": 0.6896,
+      "step": 2300
+    },
+    {
+      "epoch": 1.9292604501607717,
+      "grad_norm": 8.715214729309082,
+      "learning_rate": 7.143622722400858e-06,
+      "loss": 0.672,
+      "step": 2400
+    },
+    {
+      "epoch": 2.0,
+      "eval_accuracy": 0.7773311897106109,
+      "eval_loss": 0.6390692591667175,
+      "eval_runtime": 680.6477,
+      "eval_samples_per_second": 3.655,
+      "eval_steps_per_second": 0.457,
+      "step": 2488
+    },
+    {
+      "epoch": 2.009646302250804,
+      "grad_norm": 15.922383308410645,
+      "learning_rate": 6.607717041800643e-06,
+      "loss": 0.6789,
+      "step": 2500
+    },
+    {
+      "epoch": 2.090032154340836,
+      "grad_norm": 5.49733829498291,
+      "learning_rate": 6.071811361200429e-06,
+      "loss": 0.5946,
+      "step": 2600
+    },
+    {
+      "epoch": 2.170418006430868,
+      "grad_norm": 7.4076714515686035,
+      "learning_rate": 5.535905680600214e-06,
+      "loss": 0.5985,
+      "step": 2700
+    },
+    {
+      "epoch": 2.2508038585209005,
+      "grad_norm": 10.85772705078125,
+      "learning_rate": 5e-06,
+      "loss": 0.6036,
+      "step": 2800
+    },
+    {
+      "epoch": 2.3311897106109325,
+      "grad_norm": 7.137866497039795,
+      "learning_rate": 4.4640943193997856e-06,
+      "loss": 0.5502,
+      "step": 2900
+    },
+    {
+      "epoch": 2.4115755627009645,
+      "grad_norm": 6.020912170410156,
+      "learning_rate": 3.928188638799572e-06,
+      "loss": 0.6147,
+      "step": 3000
+    },
+    {
+      "epoch": 2.491961414790997,
+      "grad_norm": 13.015932083129883,
+      "learning_rate": 3.392282958199357e-06,
+      "loss": 0.5449,
+      "step": 3100
+    },
+    {
+      "epoch": 2.572347266881029,
+      "grad_norm": 9.120644569396973,
+      "learning_rate": 2.8563772775991428e-06,
+      "loss": 0.5881,
+      "step": 3200
+    },
+    {
+      "epoch": 2.652733118971061,
+      "grad_norm": 8.311524391174316,
+      "learning_rate": 2.3204715969989283e-06,
+      "loss": 0.5486,
+      "step": 3300
+    },
+    {
+      "epoch": 2.733118971061093,
+      "grad_norm": 13.35053825378418,
+      "learning_rate": 1.784565916398714e-06,
+      "loss": 0.5958,
+      "step": 3400
+    },
+    {
+      "epoch": 2.8135048231511255,
+      "grad_norm": 16.09385871887207,
+      "learning_rate": 1.2486602357984997e-06,
+      "loss": 0.6082,
+      "step": 3500
+    },
+    {
+      "epoch": 2.8938906752411575,
+      "grad_norm": 9.562971115112305,
+      "learning_rate": 7.127545551982852e-07,
+      "loss": 0.5594,
+      "step": 3600
+    }
+  ],
+  "logging_steps": 100,
+  "max_steps": 3732,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 3,
+  "save_steps": 200,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 2.2312693474995732e+18,
+  "train_batch_size": 8,
+  "trial_name": null,
+  "trial_params": null
+}

checkpoint-3600/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d0ba41b78fb9f233a65b0c2a6b875ec90644efb6b193c931d1e5c5f69391c7d7
+size 5905

checkpoint-3732/config.json ADDED Viewed

	@@ -0,0 +1,45 @@

+{
+  "architectures": [
+    "ViTForImageClassification"
+  ],
+  "attention_probs_dropout_prob": 0.0,
+  "dtype": "float32",
+  "encoder_stride": 16,
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.0,
+  "hidden_size": 768,
+  "id2label": {
+    "0": "anger",
+    "1": "contempt",
+    "2": "disgust",
+    "3": "fear",
+    "4": "happy",
+    "5": "neutral",
+    "6": "sad",
+    "7": "surprise"
+  },
+  "image_size": 224,
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "label2id": {
+    "anger": "0",
+    "contempt": "1",
+    "disgust": "2",
+    "fear": "3",
+    "happy": "4",
+    "neutral": "5",
+    "sad": "6",
+    "surprise": "7"
+  },
+  "layer_norm_eps": 1e-12,
+  "model_type": "vit",
+  "num_attention_heads": 12,
+  "num_channels": 3,
+  "num_hidden_layers": 12,
+  "patch_size": 16,
+  "pooler_act": "tanh",
+  "pooler_output_size": 768,
+  "problem_type": "single_label_classification",
+  "qkv_bias": true,
+  "transformers_version": "4.57.3"
+}

checkpoint-3732/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8042f5d8525c3fcd046818ef47c0a408fb3cf19641062a0ddbe7dcb988074e71
+size 343242432

checkpoint-3732/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:0ea7e9e20efbb8863a34f99f2df1f2c11af75a85807ffa44417a3285aaa7c344
+size 686600587

checkpoint-3732/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:22dbf3c2822bd0e012a008f2f8f6fc37e79fd72d0b78e165acf9c07025f5405f
+size 14455

checkpoint-3732/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e842b18da9a03233c55cb3838b93e2fb950a36a84937fcc6640c9a8d649167a4
+size 1465

checkpoint-3732/trainer_state.json ADDED Viewed

	@@ -0,0 +1,311 @@

+{
+  "best_global_step": 2488,
+  "best_metric": 0.7773311897106109,
+  "best_model_checkpoint": null,
+  "epoch": 3.0,
+  "eval_steps": 500,
+  "global_step": 3732,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.08038585209003216,
+      "grad_norm": 10.019948959350586,
+      "learning_rate": 1.946945337620579e-05,
+      "loss": 1.2824,
+      "step": 100
+    },
+    {
+      "epoch": 0.1607717041800643,
+      "grad_norm": 8.063481330871582,
+      "learning_rate": 1.8933547695605573e-05,
+      "loss": 1.159,
+      "step": 200
+    },
+    {
+      "epoch": 0.24115755627009647,
+      "grad_norm": 13.041501998901367,
+      "learning_rate": 1.839764201500536e-05,
+      "loss": 1.0909,
+      "step": 300
+    },
+    {
+      "epoch": 0.3215434083601286,
+      "grad_norm": 8.986650466918945,
+      "learning_rate": 1.7861736334405145e-05,
+      "loss": 1.0968,
+      "step": 400
+    },
+    {
+      "epoch": 0.40192926045016075,
+      "grad_norm": 7.692521572113037,
+      "learning_rate": 1.732583065380493e-05,
+      "loss": 1.0873,
+      "step": 500
+    },
+    {
+      "epoch": 0.48231511254019294,
+      "grad_norm": 9.055645942687988,
+      "learning_rate": 1.6789924973204718e-05,
+      "loss": 1.0169,
+      "step": 600
+    },
+    {
+      "epoch": 0.5627009646302251,
+      "grad_norm": 7.9042463302612305,
+      "learning_rate": 1.6254019292604505e-05,
+      "loss": 1.0865,
+      "step": 700
+    },
+    {
+      "epoch": 0.6430868167202572,
+      "grad_norm": 7.55495548248291,
+      "learning_rate": 1.571811361200429e-05,
+      "loss": 1.0137,
+      "step": 800
+    },
+    {
+      "epoch": 0.7234726688102894,
+      "grad_norm": 6.291072368621826,
+      "learning_rate": 1.5182207931404074e-05,
+      "loss": 1.0695,
+      "step": 900
+    },
+    {
+      "epoch": 0.8038585209003215,
+      "grad_norm": 9.746781349182129,
+      "learning_rate": 1.4646302250803858e-05,
+      "loss": 1.0335,
+      "step": 1000
+    },
+    {
+      "epoch": 0.8842443729903537,
+      "grad_norm": 6.898703098297119,
+      "learning_rate": 1.4110396570203646e-05,
+      "loss": 0.987,
+      "step": 1100
+    },
+    {
+      "epoch": 0.9646302250803859,
+      "grad_norm": 8.23352336883545,
+      "learning_rate": 1.3574490889603432e-05,
+      "loss": 0.9442,
+      "step": 1200
+    },
+    {
+      "epoch": 1.0,
+      "eval_accuracy": 0.6370578778135049,
+      "eval_loss": 0.9694849848747253,
+      "eval_runtime": 840.7369,
+      "eval_samples_per_second": 2.959,
+      "eval_steps_per_second": 0.37,
+      "step": 1244
+    },
+    {
+      "epoch": 1.045016077170418,
+      "grad_norm": 9.776803016662598,
+      "learning_rate": 1.3038585209003216e-05,
+      "loss": 0.868,
+      "step": 1300
+    },
+    {
+      "epoch": 1.1254019292604502,
+      "grad_norm": 10.52991771697998,
+      "learning_rate": 1.2502679528403e-05,
+      "loss": 0.7531,
+      "step": 1400
+    },
+    {
+      "epoch": 1.2057877813504823,
+      "grad_norm": 11.897740364074707,
+      "learning_rate": 1.1966773847802788e-05,
+      "loss": 0.7265,
+      "step": 1500
+    },
+    {
+      "epoch": 1.2861736334405145,
+      "grad_norm": 7.514660835266113,
+      "learning_rate": 1.1430868167202574e-05,
+      "loss": 0.7793,
+      "step": 1600
+    },
+    {
+      "epoch": 1.3665594855305465,
+      "grad_norm": 10.338397979736328,
+      "learning_rate": 1.0894962486602359e-05,
+      "loss": 0.7701,
+      "step": 1700
+    },
+    {
+      "epoch": 1.4469453376205788,
+      "grad_norm": 13.336085319519043,
+      "learning_rate": 1.0359056806002143e-05,
+      "loss": 0.7251,
+      "step": 1800
+    },
+    {
+      "epoch": 1.527331189710611,
+      "grad_norm": 9.34284496307373,
+      "learning_rate": 9.823151125401929e-06,
+      "loss": 0.7506,
+      "step": 1900
+    },
+    {
+      "epoch": 1.607717041800643,
+      "grad_norm": 10.490428924560547,
+      "learning_rate": 9.287245444801717e-06,
+      "loss": 0.7982,
+      "step": 2000
+    },
+    {
+      "epoch": 1.6881028938906752,
+      "grad_norm": 7.529485702514648,
+      "learning_rate": 8.751339764201501e-06,
+      "loss": 0.6313,
+      "step": 2100
+    },
+    {
+      "epoch": 1.7684887459807075,
+      "grad_norm": 12.055130958557129,
+      "learning_rate": 8.215434083601287e-06,
+      "loss": 0.6671,
+      "step": 2200
+    },
+    {
+      "epoch": 1.8488745980707395,
+      "grad_norm": 8.625040054321289,
+      "learning_rate": 7.679528403001071e-06,
+      "loss": 0.6896,
+      "step": 2300
+    },
+    {
+      "epoch": 1.9292604501607717,
+      "grad_norm": 8.715214729309082,
+      "learning_rate": 7.143622722400858e-06,
+      "loss": 0.672,
+      "step": 2400
+    },
+    {
+      "epoch": 2.0,
+      "eval_accuracy": 0.7773311897106109,
+      "eval_loss": 0.6390692591667175,
+      "eval_runtime": 680.6477,
+      "eval_samples_per_second": 3.655,
+      "eval_steps_per_second": 0.457,
+      "step": 2488
+    },
+    {
+      "epoch": 2.009646302250804,
+      "grad_norm": 15.922383308410645,
+      "learning_rate": 6.607717041800643e-06,
+      "loss": 0.6789,
+      "step": 2500
+    },
+    {
+      "epoch": 2.090032154340836,
+      "grad_norm": 5.49733829498291,
+      "learning_rate": 6.071811361200429e-06,
+      "loss": 0.5946,
+      "step": 2600
+    },
+    {
+      "epoch": 2.170418006430868,
+      "grad_norm": 7.4076714515686035,
+      "learning_rate": 5.535905680600214e-06,
+      "loss": 0.5985,
+      "step": 2700
+    },
+    {
+      "epoch": 2.2508038585209005,
+      "grad_norm": 10.85772705078125,
+      "learning_rate": 5e-06,
+      "loss": 0.6036,
+      "step": 2800
+    },
+    {
+      "epoch": 2.3311897106109325,
+      "grad_norm": 7.137866497039795,
+      "learning_rate": 4.4640943193997856e-06,
+      "loss": 0.5502,
+      "step": 2900
+    },
+    {
+      "epoch": 2.4115755627009645,
+      "grad_norm": 6.020912170410156,
+      "learning_rate": 3.928188638799572e-06,
+      "loss": 0.6147,
+      "step": 3000
+    },
+    {
+      "epoch": 2.491961414790997,
+      "grad_norm": 13.015932083129883,
+      "learning_rate": 3.392282958199357e-06,
+      "loss": 0.5449,
+      "step": 3100
+    },
+    {
+      "epoch": 2.572347266881029,
+      "grad_norm": 9.120644569396973,
+      "learning_rate": 2.8563772775991428e-06,
+      "loss": 0.5881,
+      "step": 3200
+    },
+    {
+      "epoch": 2.652733118971061,
+      "grad_norm": 8.311524391174316,
+      "learning_rate": 2.3204715969989283e-06,
+      "loss": 0.5486,
+      "step": 3300
+    },
+    {
+      "epoch": 2.733118971061093,
+      "grad_norm": 13.35053825378418,
+      "learning_rate": 1.784565916398714e-06,
+      "loss": 0.5958,
+      "step": 3400
+    },
+    {
+      "epoch": 2.8135048231511255,
+      "grad_norm": 16.09385871887207,
+      "learning_rate": 1.2486602357984997e-06,
+      "loss": 0.6082,
+      "step": 3500
+    },
+    {
+      "epoch": 2.8938906752411575,
+      "grad_norm": 9.562971115112305,
+      "learning_rate": 7.127545551982852e-07,
+      "loss": 0.5594,
+      "step": 3600
+    },
+    {
+      "epoch": 2.97427652733119,
+      "grad_norm": 2.4870011806488037,
+      "learning_rate": 1.7684887459807076e-07,
+      "loss": 0.5797,
+      "step": 3700
+    }
+  ],
+  "logging_steps": 100,
+  "max_steps": 3732,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 3,
+  "save_steps": 200,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": true
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 2.312795304486568e+18,
+  "train_batch_size": 8,
+  "trial_name": null,
+  "trial_params": null
+}

checkpoint-3732/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d0ba41b78fb9f233a65b0c2a6b875ec90644efb6b193c931d1e5c5f69391c7d7
+size 5905

config.json ADDED Viewed

	@@ -0,0 +1,45 @@

+{
+  "architectures": [
+    "ViTForImageClassification"
+  ],
+  "attention_probs_dropout_prob": 0.0,
+  "dtype": "float32",
+  "encoder_stride": 16,
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.0,
+  "hidden_size": 768,
+  "id2label": {
+    "0": "anger",
+    "1": "contempt",
+    "2": "disgust",
+    "3": "fear",
+    "4": "happy",
+    "5": "neutral",
+    "6": "sad",
+    "7": "surprise"
+  },
+  "image_size": 224,
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "label2id": {
+    "anger": "0",
+    "contempt": "1",
+    "disgust": "2",
+    "fear": "3",
+    "happy": "4",
+    "neutral": "5",
+    "sad": "6",
+    "surprise": "7"
+  },
+  "layer_norm_eps": 1e-12,
+  "model_type": "vit",
+  "num_attention_heads": 12,
+  "num_channels": 3,
+  "num_hidden_layers": 12,
+  "patch_size": 16,
+  "pooler_act": "tanh",
+  "pooler_output_size": 768,
+  "problem_type": "single_label_classification",
+  "qkv_bias": true,
+  "transformers_version": "4.57.3"
+}

model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8042f5d8525c3fcd046818ef47c0a408fb3cf19641062a0ddbe7dcb988074e71
+size 343242432

preprocessor_config.json ADDED Viewed

	@@ -0,0 +1,24 @@

+{
+  "do_convert_rgb": null,
+  "do_normalize": true,
+  "do_rescale": true,
+  "do_resize": true,
+  "image_mean": [
+    0.5,
+    0.5,
+    0.5
+  ],
+  "image_processor_type": "ViTFeatureExtractor",
+  "image_std": [
+    0.5,
+    0.5,
+    0.5
+  ],
+  "resample": 2,
+  "rescale_factor": 0.00392156862745098,
+  "size": {
+    "height": 224,
+    "width": 224
+  },
+  "trust_remote_code": true
+}