End of training

Browse files

Files changed (9) hide show

README.md +107 -0
all_results.json +18 -0
config.json +58 -0
eval_results.json +13 -0
model.safetensors +3 -0
preprocessor_config.json +22 -0
train_results.json +8 -0
trainer_state.json +376 -0
training_args.bin +3 -0

README.md ADDED Viewed

	@@ -0,0 +1,107 @@

+---
+library_name: transformers
+license: apache-2.0
+base_model: facebook/convnext-tiny-224
+tags:
+- generated_from_trainer
+datasets:
+- imagefolder
+metrics:
+- precision
+- recall
+- f1
+- accuracy
+model-index:
+- name: convnext-tiny-224-finetuned-barkley
+  results:
+  - task:
+      name: Image Classification
+      type: image-classification
+    dataset:
+      name: imagefolder
+      type: imagefolder
+      config: default
+      split: train
+      args: default
+    metrics:
+    - name: Precision
+      type: precision
+      value: 0.9936145510835913
+    - name: Recall
+      type: recall
+      value: 0.993421052631579
+    - name: F1
+      type: f1
+      value: 0.993419541966282
+    - name: Accuracy
+      type: accuracy
+      value: 0.9939393939393939
+---
+<!-- This model card has been generated automatically according to the information the Trainer had access to. You
+should probably proofread and complete it, then remove this comment. -->
+# convnext-tiny-224-finetuned-barkley
+This model is a fine-tuned version of [facebook/convnext-tiny-224](https://huggingface.co/facebook/convnext-tiny-224) on the imagefolder dataset.
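+It achieves the following results on the evaluation set (these are the metrics of the best checkpoint, step 418 / epoch 11, as recorded in `trainer_state.json`, not of the final training epoch):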
+- Loss: 0.0794
+- Precision: 0.9936
+- Recall: 0.9934
+- F1: 0.9934
+- Accuracy: 0.9939
+- Top1 Accuracy: 0.9934
+- Error Rate: 0.0061
+## Model description
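+A ConvNeXt-tiny image classifier (`ConvNextForImageClassification`) fine-tuned from `facebook/convnext-tiny-224` for single-label classification over five classes. The class names are listed under `id2label` in `config.json`, and the image preprocessing settings are in `preprocessor_config.json`. More information needed on the model's purpose and data.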
+## Intended uses & limitations
+More information needed
+## Training and evaluation data
+More information needed
+## Training procedure
+### Training hyperparameters
+The following hyperparameters were used during training:
+- learning_rate: 0.0002
+- train_batch_size: 32
+- eval_batch_size: 32
+- seed: 42
+- optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
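+- lr_scheduler_type: linear
+- lr_scheduler_warmup_ratio: 0.1
+  - Note: the learning rates logged in `trainer_state.json` rise from about 1.2e-06 (step 38) to a peak of about 2.0e-05 (step 456). This does not match a linear schedule with a 0.1 warmup ratio and a peak of 0.0002, so a custom scheduler may have overridden these settings; verify against the training script.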
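+- num_epochs: 30 (configured maximum; training stopped after epoch 13, step 494 of 1140, when `EarlyStoppingCallback` with a patience of 2 triggered)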
+- mixed_precision_training: Native AMP
+### Training results
+| Training Loss | Epoch | Step | Validation Loss | Precision | Recall | F1     | Accuracy | Top1 Accuracy | Error Rate |
+|:-------------:|:-----:|:----:|:---------------:|:---------:|:------:|:------:|:--------:|:-------------:|:----------:|
+| 1.576         | 1.0   | 38   | 1.5660          | 0.3007    | 0.3684 | 0.2952 | 0.3479   | 0.3684        | 0.6521     |
+| 1.5469        | 2.0   | 76   | 1.5353          | 0.3141    | 0.4079 | 0.3215 | 0.3854   | 0.4079        | 0.6146     |
+| 1.5081        | 3.0   | 114  | 1.4782          | 0.5684    | 0.4671 | 0.3961 | 0.4436   | 0.4671        | 0.5564     |
+| 1.4278        | 4.0   | 152  | 1.3718          | 0.7088    | 0.6053 | 0.5840 | 0.5866   | 0.6053        | 0.4134     |
+| 1.2938        | 5.0   | 190  | 1.1909          | 0.8582    | 0.8355 | 0.8378 | 0.8290   | 0.8355        | 0.1710     |
+| 1.0696        | 6.0   | 228  | 0.9353          | 0.9243    | 0.9211 | 0.9215 | 0.9205   | 0.9211        | 0.0795     |
+| 0.789         | 7.0   | 266  | 0.6347          | 0.9680    | 0.9671 | 0.9673 | 0.9691   | 0.9671        | 0.0309     |
+| 0.506         | 8.0   | 304  | 0.3910          | 0.9750    | 0.9737 | 0.9739 | 0.9752   | 0.9737        | 0.0248     |
+| 0.2876        | 9.0   | 342  | 0.2126          | 0.9808    | 0.9803 | 0.9802 | 0.9814   | 0.9803        | 0.0186     |
+| 0.1722        | 10.0  | 380  | 0.1409          | 0.9809    | 0.9803 | 0.9799 | 0.9818   | 0.9803        | 0.0182     |
+| 0.1082        | 11.0  | 418  | 0.0794          | 0.9936    | 0.9934 | 0.9934 | 0.9939   | 0.9934        | 0.0061     |
+| 0.0715        | 12.0  | 456  | 0.0577          | 0.9936    | 0.9934 | 0.9934 | 0.9939   | 0.9934        | 0.0061     |
+| 0.0492        | 13.0  | 494  | 0.0440          | 0.9872    | 0.9868 | 0.9867 | 0.9879   | 0.9868        | 0.0121     |
+### Framework versions
+- Transformers 4.45.2
+- Pytorch 2.3.1+cu121
+- Datasets 3.0.1
+- Tokenizers 0.20.1

all_results.json ADDED Viewed

	@@ -0,0 +1,18 @@

+{
+    "epoch": 13.0,
+    "eval_accuracy": 0.9939393939393939,
+    "eval_error_rate": 0.0060606060606061,
+    "eval_f1": 0.993419541966282,
+    "eval_loss": 0.0794038251042366,
+    "eval_precision": 0.9936145510835913,
+    "eval_recall": 0.993421052631579,
+    "eval_runtime": 51.0106,
+    "eval_samples_per_second": 2.98,
+    "eval_steps_per_second": 0.098,
+    "eval_top1_accuracy": 0.993421052631579,
+    "total_flos": 3.972506461105029e+17,
+    "train_loss": 0.8004542765347099,
+    "train_runtime": 7158.591,
+    "train_samples_per_second": 5.096,
+    "train_steps_per_second": 0.159
+}

config.json ADDED Viewed

	@@ -0,0 +1,58 @@

+{
+  "_name_or_path": "facebook/convnext-tiny-224",
+  "architectures": [
+    "ConvNextForImageClassification"
+  ],
+  "depths": [
+    3,
+    3,
+    9,
+    3
+  ],
+  "drop_path_rate": 0.0,
+  "hidden_act": "gelu",
+  "hidden_sizes": [
+    96,
+    192,
+    384,
+    768
+  ],
+  "id2label": {
+    "0": "Intsia bijuga",
+    "1": "Mangifera indica",
+    "2": "Pterocarpus indicus",
+    "3": "Roystonea regia",
+    "4": "Tabebuia"
+  },
+  "image_size": 224,
+  "initializer_range": 0.02,
+  "label2id": {
+    "Intsia bijuga": 0,
+    "Mangifera indica": 1,
+    "Pterocarpus indicus": 2,
+    "Roystonea regia": 3,
+    "Tabebuia": 4
+  },
+  "layer_norm_eps": 1e-12,
+  "layer_scale_init_value": 1e-06,
+  "model_type": "convnext",
+  "num_channels": 3,
+  "num_stages": 4,
+  "out_features": [
+    "stage4"
+  ],
+  "out_indices": [
+    4
+  ],
+  "patch_size": 4,
+  "problem_type": "single_label_classification",
+  "stage_names": [
+    "stem",
+    "stage1",
+    "stage2",
+    "stage3",
+    "stage4"
+  ],
+  "torch_dtype": "float32",
+  "transformers_version": "4.45.2"
+}

eval_results.json ADDED Viewed

	@@ -0,0 +1,13 @@

+{
+    "epoch": 13.0,
+    "eval_accuracy": 0.9939393939393939,
+    "eval_error_rate": 0.0060606060606061,
+    "eval_f1": 0.993419541966282,
+    "eval_loss": 0.0794038251042366,
+    "eval_precision": 0.9936145510835913,
+    "eval_recall": 0.993421052631579,
+    "eval_runtime": 51.0106,
+    "eval_samples_per_second": 2.98,
+    "eval_steps_per_second": 0.098,
+    "eval_top1_accuracy": 0.993421052631579
+}

model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:0799eed45249c597bd5706cd54239ba58459cb5916a27dddda3eccc89547767d
+size 111317164

preprocessor_config.json ADDED Viewed

	@@ -0,0 +1,22 @@

+{
+  "crop_pct": 0.875,
+  "do_normalize": true,
+  "do_rescale": true,
+  "do_resize": true,
+  "image_mean": [
+    0.485,
+    0.456,
+    0.406
+  ],
+  "image_processor_type": "ConvNextImageProcessor",
+  "image_std": [
+    0.229,
+    0.224,
+    0.225
+  ],
+  "resample": 3,
+  "rescale_factor": 0.00392156862745098,
+  "size": {
+    "shortest_edge": 224
+  }
+}

train_results.json ADDED Viewed

	@@ -0,0 +1,8 @@

+{
+    "epoch": 13.0,
+    "total_flos": 3.972506461105029e+17,
+    "train_loss": 0.8004542765347099,
+    "train_runtime": 7158.591,
+    "train_samples_per_second": 5.096,
+    "train_steps_per_second": 0.159
+}

trainer_state.json ADDED Viewed

	@@ -0,0 +1,376 @@

+{
+  "best_metric": 0.9939393939393939,
+  "best_model_checkpoint": "convnext-tiny-224-finetuned-barkley\\checkpoint-418",
+  "epoch": 13.0,
+  "eval_steps": 500,
+  "global_step": 494,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "train_accuracy": 0.3092105263157895
+    },
+    {
+      "epoch": 1.0,
+      "grad_norm": 2.351605176925659,
+      "learning_rate": 1.1659108139509125e-06,
+      "loss": 1.576,
+      "step": 38
+    },
+    {
+      "epoch": 1.0,
+      "eval_accuracy": 0.34791666666666665,
+      "eval_error_rate": 0.6520833333333333,
+      "eval_f1": 0.2952478867653256,
+      "eval_loss": 1.5659886598587036,
+      "eval_precision": 0.30074270516946977,
+      "eval_recall": 0.3684210526315789,
+      "eval_runtime": 51.2455,
+      "eval_samples_per_second": 2.966,
+      "eval_steps_per_second": 0.098,
+      "eval_top1_accuracy": 0.3684210526315789,
+      "step": 38
+    },
+    {
+      "epoch": 2.0,
+      "train_accuracy": 0.36622807017543857
+    },
+    {
+      "epoch": 2.0,
+      "grad_norm": 2.0893232822418213,
+      "learning_rate": 2.23574935501902e-06,
+      "loss": 1.5469,
+      "step": 76
+    },
+    {
+      "epoch": 2.0,
+      "eval_accuracy": 0.38541666666666663,
+      "eval_error_rate": 0.6145833333333334,
+      "eval_f1": 0.32146190433952665,
+      "eval_loss": 1.5353103876113892,
+      "eval_precision": 0.3140966869404633,
+      "eval_recall": 0.40789473684210525,
+      "eval_runtime": 52.9551,
+      "eval_samples_per_second": 2.87,
+      "eval_steps_per_second": 0.094,
+      "eval_top1_accuracy": 0.40789473684210525,
+      "step": 76
+    },
+    {
+      "epoch": 3.0,
+      "train_accuracy": 0.4137426900584795
+    },
+    {
+      "epoch": 3.0,
+      "grad_norm": 2.353696823120117,
+      "learning_rate": 3.927960312504679e-06,
+      "loss": 1.5081,
+      "step": 114
+    },
+    {
+      "epoch": 3.0,
+      "eval_accuracy": 0.44356060606060604,
+      "eval_error_rate": 0.5564393939393939,
+      "eval_f1": 0.3961300506250762,
+      "eval_loss": 1.4782265424728394,
+      "eval_precision": 0.5683927222362125,
+      "eval_recall": 0.46710526315789475,
+      "eval_runtime": 51.3887,
+      "eval_samples_per_second": 2.958,
+      "eval_steps_per_second": 0.097,
+      "eval_top1_accuracy": 0.46710526315789475,
+      "step": 114
+    },
+    {
+      "epoch": 4.0,
+      "train_accuracy": 0.4861111111111111
+    },
+    {
+      "epoch": 4.0,
+      "grad_norm": 2.854907512664795,
+      "learning_rate": 6.113544042901594e-06,
+      "loss": 1.4278,
+      "step": 152
+    },
+    {
+      "epoch": 4.0,
+      "eval_accuracy": 0.5865530303030304,
+      "eval_error_rate": 0.4134469696969696,
+      "eval_f1": 0.5840194800037495,
+      "eval_loss": 1.3718132972717285,
+      "eval_precision": 0.7087537646637603,
+      "eval_recall": 0.6052631578947368,
+      "eval_runtime": 53.3959,
+      "eval_samples_per_second": 2.847,
+      "eval_steps_per_second": 0.094,
+      "eval_top1_accuracy": 0.6052631578947368,
+      "step": 152
+    },
+    {
+      "epoch": 5.0,
+      "train_accuracy": 0.6827485380116959
+    },
+    {
+      "epoch": 5.0,
+      "grad_norm": 3.946742296218872,
+      "learning_rate": 8.62589039584572e-06,
+      "loss": 1.2938,
+      "step": 190
+    },
+    {
+      "epoch": 5.0,
+      "eval_accuracy": 0.8289772727272728,
+      "eval_error_rate": 0.17102272727272716,
+      "eval_f1": 0.8378200475239326,
+      "eval_loss": 1.1908537149429321,
+      "eval_precision": 0.8581657632453227,
+      "eval_recall": 0.8355263157894737,
+      "eval_runtime": 52.0457,
+      "eval_samples_per_second": 2.921,
+      "eval_steps_per_second": 0.096,
+      "eval_top1_accuracy": 0.8355263157894737,
+      "step": 190
+    },
+    {
+      "epoch": 6.0,
+      "train_accuracy": 0.8713450292397661
+    },
+    {
+      "epoch": 6.0,
+      "grad_norm": 2.741647720336914,
+      "learning_rate": 1.1273479642392808e-05,
+      "loss": 1.0696,
+      "step": 228
+    },
+    {
+      "epoch": 6.0,
+      "eval_accuracy": 0.9204545454545455,
+      "eval_error_rate": 0.07954545454545447,
+      "eval_f1": 0.9214891548724753,
+      "eval_loss": 0.9352867007255554,
+      "eval_precision": 0.9242831541218637,
+      "eval_recall": 0.9210526315789473,
+      "eval_runtime": 53.2027,
+      "eval_samples_per_second": 2.857,
+      "eval_steps_per_second": 0.094,
+      "eval_top1_accuracy": 0.9210526315789473,
+      "step": 228
+    },
+    {
+      "epoch": 7.0,
+      "train_accuracy": 0.9407894736842105
+    },
+    {
+      "epoch": 7.0,
+      "grad_norm": 3.6590983867645264,
+      "learning_rate": 1.3854482295832083e-05,
+      "loss": 0.789,
+      "step": 266
+    },
+    {
+      "epoch": 7.0,
+      "eval_accuracy": 0.9691287878787879,
+      "eval_error_rate": 0.030871212121212133,
+      "eval_f1": 0.9672834045899062,
+      "eval_loss": 0.6346580386161804,
+      "eval_precision": 0.9680208585981083,
+      "eval_recall": 0.9671052631578947,
+      "eval_runtime": 52.1891,
+      "eval_samples_per_second": 2.912,
+      "eval_steps_per_second": 0.096,
+      "eval_top1_accuracy": 0.9671052631578947,
+      "step": 266
+    },
+    {
+      "epoch": 8.0,
+      "train_accuracy": 0.9634502923976608
+    },
+    {
+      "epoch": 8.0,
+      "grad_norm": 3.982485055923462,
+      "learning_rate": 1.6172144859969913e-05,
+      "loss": 0.506,
+      "step": 304
+    },
+    {
+      "epoch": 8.0,
+      "eval_accuracy": 0.975189393939394,
+      "eval_error_rate": 0.024810606060606033,
+      "eval_f1": 0.9738558660758309,
+      "eval_loss": 0.3909807801246643,
+      "eval_precision": 0.9750055285272005,
+      "eval_recall": 0.9736842105263158,
+      "eval_runtime": 50.6533,
+      "eval_samples_per_second": 3.001,
+      "eval_steps_per_second": 0.099,
+      "eval_top1_accuracy": 0.9736842105263158,
+      "step": 304
+    },
+    {
+      "epoch": 9.0,
+      "train_accuracy": 0.9780701754385965
+    },
+    {
+      "epoch": 9.0,
+      "grad_norm": 2.4651834964752197,
+      "learning_rate": 1.8049788627450628e-05,
+      "loss": 0.2876,
+      "step": 342
+    },
+    {
+      "epoch": 9.0,
+      "eval_accuracy": 0.981439393939394,
+      "eval_error_rate": 0.018560606060606055,
+      "eval_f1": 0.9802473202746875,
+      "eval_loss": 0.21257419884204865,
+      "eval_precision": 0.980843653250774,
+      "eval_recall": 0.9802631578947368,
+      "eval_runtime": 50.1498,
+      "eval_samples_per_second": 3.031,
+      "eval_steps_per_second": 0.1,
+      "eval_top1_accuracy": 0.9802631578947368,
+      "step": 342
+    },
+    {
+      "epoch": 10.0,
+      "train_accuracy": 0.9780701754385965
+    },
+    {
+      "epoch": 10.0,
+      "grad_norm": 3.773145914077759,
+      "learning_rate": 1.9318622999689343e-05,
+      "loss": 0.1722,
+      "step": 380
+    },
+    {
+      "epoch": 10.0,
+      "eval_accuracy": 0.9818181818181818,
+      "eval_error_rate": 0.018181818181818188,
+      "eval_f1": 0.979943544279758,
+      "eval_loss": 0.14089564979076385,
+      "eval_precision": 0.9808553804296839,
+      "eval_recall": 0.9802631578947368,
+      "eval_runtime": 50.1171,
+      "eval_samples_per_second": 3.033,
+      "eval_steps_per_second": 0.1,
+      "eval_top1_accuracy": 0.9802631578947368,
+      "step": 380
+    },
+    {
+      "epoch": 11.0,
+      "train_accuracy": 0.9875730994152047
+    },
+    {
+      "epoch": 11.0,
+      "grad_norm": 2.976818561553955,
+      "learning_rate": 1.995005803798479e-05,
+      "loss": 0.1082,
+      "step": 418
+    },
+    {
+      "epoch": 11.0,
+      "eval_accuracy": 0.9939393939393939,
+      "eval_error_rate": 0.0060606060606061,
+      "eval_f1": 0.993419541966282,
+      "eval_loss": 0.0794038251042366,
+      "eval_precision": 0.9936145510835913,
+      "eval_recall": 0.993421052631579,
+      "eval_runtime": 52.5912,
+      "eval_samples_per_second": 2.89,
+      "eval_steps_per_second": 0.095,
+      "eval_top1_accuracy": 0.993421052631579,
+      "step": 418
+    },
+    {
+      "epoch": 12.0,
+      "train_accuracy": 0.9912280701754386
+    },
+    {
+      "epoch": 12.0,
+      "grad_norm": 5.014571189880371,
+      "learning_rate": 1.9972038083659915e-05,
+      "loss": 0.0715,
+      "step": 456
+    },
+    {
+      "epoch": 12.0,
+      "eval_accuracy": 0.9939393939393939,
+      "eval_error_rate": 0.0060606060606061,
+      "eval_f1": 0.993419541966282,
+      "eval_loss": 0.057679127901792526,
+      "eval_precision": 0.9936145510835913,
+      "eval_recall": 0.993421052631579,
+      "eval_runtime": 50.9469,
+      "eval_samples_per_second": 2.984,
+      "eval_steps_per_second": 0.098,
+      "eval_top1_accuracy": 0.993421052631579,
+      "step": 456
+    },
+    {
+      "epoch": 13.0,
+      "train_accuracy": 0.9912280701754386
+    },
+    {
+      "epoch": 13.0,
+      "grad_norm": 1.5518372058868408,
+      "learning_rate": 1.9813886204892037e-05,
+      "loss": 0.0492,
+      "step": 494
+    },
+    {
+      "epoch": 13.0,
+      "eval_accuracy": 0.9878787878787879,
+      "eval_error_rate": 0.012121212121212088,
+      "eval_f1": 0.9867362170674966,
+      "eval_loss": 0.04395502433180809,
+      "eval_precision": 0.9872349657566376,
+      "eval_recall": 0.9868421052631579,
+      "eval_runtime": 54.1085,
+      "eval_samples_per_second": 2.809,
+      "eval_steps_per_second": 0.092,
+      "eval_top1_accuracy": 0.9868421052631579,
+      "step": 494
+    },
+    {
+      "epoch": 13.0,
+      "step": 494,
+      "total_flos": 3.972506461105029e+17,
+      "train_loss": 0.8004542765347099,
+      "train_runtime": 7158.591,
+      "train_samples_per_second": 5.096,
+      "train_steps_per_second": 0.159
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 1140,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 30,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "EarlyStoppingCallback": {
+      "args": {
+        "early_stopping_patience": 2,
+        "early_stopping_threshold": 0.0
+      },
+      "attributes": {
+        "early_stopping_patience_counter": 2
+      }
+    },
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": true
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 3.972506461105029e+17,
+  "train_batch_size": 32,
+  "trial_name": null,
+  "trial_params": null
+}

training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b32c9a024fd0fe5d70f0247b1ad721619779776bf233e0e5351cdb8332e17696
+size 5176