End of training

Browse files

Files changed (6) hide show

README.md +3 -3
all_results.json +13 -0
eval_results.json +8 -0
runs/May13_08-52-11_c641b86eca15/events.out.tfevents.1715593286.c641b86eca15.935.1 +3 -0
train_results.json +8 -0
trainer_state.json +127 -0

README.md CHANGED Viewed

@@ -22,7 +22,7 @@ model-index:
     metrics:
     - name: Accuracy
       type: accuracy
-      value: 0.9288461538461539
 ---
 <!-- This model card has been generated automatically according to the information the Trainer had access to. You
@@ -32,8 +32,8 @@ should probably proofread and complete it, then remove this comment. -->
 This model is a fine-tuned version of [Angy309/swin-tiny-patch4-window7-224-finetuned](https://huggingface.co/Angy309/swin-tiny-patch4-window7-224-finetuned) on the imagefolder dataset.
 It achieves the following results on the evaluation set:
-- Loss: 0.1961
-- Accuracy: 0.9288
 ## Model description

     metrics:
     - name: Accuracy
       type: accuracy
+      value: 0.9365384615384615
 ---
 <!-- This model card has been generated automatically according to the information the Trainer had access to. You
 This model is a fine-tuned version of [Angy309/swin-tiny-patch4-window7-224-finetuned](https://huggingface.co/Angy309/swin-tiny-patch4-window7-224-finetuned) on the imagefolder dataset.
 It achieves the following results on the evaluation set:
+- Loss: 0.1937
+- Accuracy: 0.9365
 ## Model description

all_results.json ADDED Viewed

	@@ -0,0 +1,13 @@

+{
+    "epoch": 2.938775510204082,
+    "eval_accuracy": 0.9365384615384615,
+    "eval_loss": 0.19368061423301697,
+    "eval_runtime": 4.2611,
+    "eval_samples_per_second": 122.033,
+    "eval_steps_per_second": 3.99,
+    "total_flos": 3.424639439220572e+17,
+    "train_loss": 0.6798421343167623,
+    "train_runtime": 2572.3495,
+    "train_samples_per_second": 5.458,
+    "train_steps_per_second": 0.042
+}

eval_results.json ADDED Viewed

	@@ -0,0 +1,8 @@

+{
+    "epoch": 2.938775510204082,
+    "eval_accuracy": 0.9365384615384615,
+    "eval_loss": 0.19368061423301697,
+    "eval_runtime": 4.2611,
+    "eval_samples_per_second": 122.033,
+    "eval_steps_per_second": 3.99
+}

runs/May13_08-52-11_c641b86eca15/events.out.tfevents.1715593286.c641b86eca15.935.1 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4164764261b4e696fc452c25916a8d029f605ce6155064375e960b634b653d7c
+size 405

train_results.json ADDED Viewed

	@@ -0,0 +1,8 @@

+{
+    "epoch": 2.938775510204082,
+    "total_flos": 3.424639439220572e+17,
+    "train_loss": 0.6798421343167623,
+    "train_runtime": 2572.3495,
+    "train_samples_per_second": 5.458,
+    "train_steps_per_second": 0.042
+}

trainer_state.json ADDED Viewed

	@@ -0,0 +1,127 @@

+{
+  "best_metric": 0.9365384615384615,
+  "best_model_checkpoint": "swin-tiny-patch4-window7-224-finetuned-finetuned/checkpoint-73",
+  "epoch": 2.938775510204082,
+  "eval_steps": 500,
+  "global_step": 108,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.272108843537415,
+      "grad_norm": 10.030804634094238,
+      "learning_rate": 4.545454545454546e-05,
+      "loss": 1.801,
+      "step": 10
+    },
+    {
+      "epoch": 0.54421768707483,
+      "grad_norm": 8.141377449035645,
+      "learning_rate": 4.536082474226804e-05,
+      "loss": 0.9671,
+      "step": 20
+    },
+    {
+      "epoch": 0.8163265306122449,
+      "grad_norm": 8.35882568359375,
+      "learning_rate": 4.020618556701031e-05,
+      "loss": 0.7093,
+      "step": 30
+    },
+    {
+      "epoch": 0.9795918367346939,
+      "eval_accuracy": 0.8961538461538462,
+      "eval_loss": 0.31302550435066223,
+      "eval_runtime": 233.5959,
+      "eval_samples_per_second": 2.226,
+      "eval_steps_per_second": 0.073,
+      "step": 36
+    },
+    {
+      "epoch": 1.08843537414966,
+      "grad_norm": 11.375490188598633,
+      "learning_rate": 3.5051546391752576e-05,
+      "loss": 0.6024,
+      "step": 40
+    },
+    {
+      "epoch": 1.3605442176870748,
+      "grad_norm": 8.967066764831543,
+      "learning_rate": 2.9896907216494846e-05,
+      "loss": 0.5441,
+      "step": 50
+    },
+    {
+      "epoch": 1.6326530612244898,
+      "grad_norm": 7.383798599243164,
+      "learning_rate": 2.4742268041237116e-05,
+      "loss": 0.5146,
+      "step": 60
+    },
+    {
+      "epoch": 1.9047619047619047,
+      "grad_norm": 7.814334869384766,
+      "learning_rate": 1.9587628865979382e-05,
+      "loss": 0.4969,
+      "step": 70
+    },
+    {
+      "epoch": 1.9863945578231292,
+      "eval_accuracy": 0.9365384615384615,
+      "eval_loss": 0.19368061423301697,
+      "eval_runtime": 4.2117,
+      "eval_samples_per_second": 123.465,
+      "eval_steps_per_second": 4.036,
+      "step": 73
+    },
+    {
+      "epoch": 2.17687074829932,
+      "grad_norm": 8.89726734161377,
+      "learning_rate": 1.4432989690721649e-05,
+      "loss": 0.4832,
+      "step": 80
+    },
+    {
+      "epoch": 2.4489795918367347,
+      "grad_norm": 5.330117225646973,
+      "learning_rate": 9.278350515463918e-06,
+      "loss": 0.4326,
+      "step": 90
+    },
+    {
+      "epoch": 2.7210884353741496,
+      "grad_norm": 6.239503383636475,
+      "learning_rate": 4.123711340206186e-06,
+      "loss": 0.4523,
+      "step": 100
+    },
+    {
+      "epoch": 2.938775510204082,
+      "eval_accuracy": 0.9288461538461539,
+      "eval_loss": 0.1961224228143692,
+      "eval_runtime": 4.3109,
+      "eval_samples_per_second": 120.624,
+      "eval_steps_per_second": 3.943,
+      "step": 108
+    },
+    {
+      "epoch": 2.938775510204082,
+      "step": 108,
+      "total_flos": 3.424639439220572e+17,
+      "train_loss": 0.6798421343167623,
+      "train_runtime": 2572.3495,
+      "train_samples_per_second": 5.458,
+      "train_steps_per_second": 0.042
+    }
+  ],
+  "logging_steps": 10,
+  "max_steps": 108,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 3,
+  "save_steps": 500,
+  "total_flos": 3.424639439220572e+17,
+  "train_batch_size": 32,
+  "trial_name": null,
+  "trial_params": null
+}