Model save
Browse files- README.md +8 -8
- model.safetensors +1 -1
- runs/May22_06-52-46_Shravani/events.out.tfevents.1716340980.Shravani.27548.0 +2 -2
- tmp-checkpoint-950/config.json +1 -1
- tmp-checkpoint-950/model.safetensors +1 -1
- tmp-checkpoint-950/optimizer.pt +1 -1
- tmp-checkpoint-950/trainer_state.json +59 -59
- tmp-checkpoint-950/training_args.bin +1 -1
README.md
CHANGED
|
@@ -15,14 +15,14 @@ should probably proofread and complete it, then remove this comment. -->
|
|
| 15 |
|
| 16 |
This model is a fine-tuned version of [google/vit-base-patch16-224-in21k](https://huggingface.co/google/vit-base-patch16-224-in21k) on an unknown dataset.
|
| 17 |
It achieves the following results on the evaluation set:
|
| 18 |
-
- eval_loss: 0.
|
| 19 |
-
- eval_precision: 0.
|
| 20 |
-
- eval_recall: 0.
|
| 21 |
-
- eval_accuracy: 0.
|
| 22 |
-
- eval_f1score: 0.
|
| 23 |
-
- eval_runtime:
|
| 24 |
-
- eval_samples_per_second:
|
| 25 |
-
- eval_steps_per_second: 0.
|
| 26 |
- epoch: 5.0
|
| 27 |
- step: 950
|
| 28 |
|
|
|
|
| 15 |
|
| 16 |
This model is a fine-tuned version of [google/vit-base-patch16-224-in21k](https://huggingface.co/google/vit-base-patch16-224-in21k) on an unknown dataset.
|
| 17 |
It achieves the following results on the evaluation set:
|
| 18 |
+
- eval_loss: 0.1685
|
| 19 |
+
- eval_precision: 0.9495
|
| 20 |
+
- eval_recall: 0.9497
|
| 21 |
+
- eval_accuracy: 0.9497
|
| 22 |
+
- eval_f1score: 0.9494
|
| 23 |
+
- eval_runtime: 40.9327
|
| 24 |
+
- eval_samples_per_second: 18.469
|
| 25 |
+
- eval_steps_per_second: 0.586
|
| 26 |
- epoch: 5.0
|
| 27 |
- step: 950
|
| 28 |
|
model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 378042076
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:92acbf1630bb50244bf0a41d2fd0f8be4fb27ec8347033eaa169017970fb6487
|
| 3 |
size 378042076
|
runs/May22_06-52-46_Shravani/events.out.tfevents.1716340980.Shravani.27548.0
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c2876c68e41799c4896cdc50b7d36a04227dc3bacf302d81e57de8331c01f173
|
| 3 |
+
size 9783
|
tmp-checkpoint-950/config.json
CHANGED
|
@@ -23,7 +23,7 @@
|
|
| 23 |
},
|
| 24 |
"layer_norm_eps": 1e-12,
|
| 25 |
"model_type": "vit",
|
| 26 |
-
"num_attention_heads":
|
| 27 |
"num_channels": 3,
|
| 28 |
"num_hidden_layers": 12,
|
| 29 |
"patch_size": 64,
|
|
|
|
| 23 |
},
|
| 24 |
"layer_norm_eps": 1e-12,
|
| 25 |
"model_type": "vit",
|
| 26 |
+
"num_attention_heads": 8,
|
| 27 |
"num_channels": 3,
|
| 28 |
"num_hidden_layers": 12,
|
| 29 |
"patch_size": 64,
|
tmp-checkpoint-950/model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 378042076
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:92acbf1630bb50244bf0a41d2fd0f8be4fb27ec8347033eaa169017970fb6487
|
| 3 |
size 378042076
|
tmp-checkpoint-950/optimizer.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 756199354
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:45ee97705bf337fefea766f9c5c3262075d533aa8853a0aeedb5041afa419129
|
| 3 |
size 756199354
|
tmp-checkpoint-950/trainer_state.json
CHANGED
|
@@ -1,6 +1,6 @@
|
|
| 1 |
{
|
| 2 |
-
"best_metric": 0.
|
| 3 |
-
"best_model_checkpoint": "Shravanig/vit-fire-detection\\checkpoint-
|
| 4 |
"epoch": 5.0,
|
| 5 |
"eval_steps": 500,
|
| 6 |
"global_step": 950,
|
|
@@ -11,175 +11,175 @@
|
|
| 11 |
{
|
| 12 |
"epoch": 0.26,
|
| 13 |
"learning_rate": 0.0001,
|
| 14 |
-
"loss": 0.
|
| 15 |
"step": 50
|
| 16 |
},
|
| 17 |
{
|
| 18 |
"epoch": 0.53,
|
| 19 |
"learning_rate": 0.0002,
|
| 20 |
-
"loss": 0.
|
| 21 |
"step": 100
|
| 22 |
},
|
| 23 |
{
|
| 24 |
"epoch": 0.79,
|
| 25 |
"learning_rate": 0.00019444444444444446,
|
| 26 |
-
"loss": 0.
|
| 27 |
"step": 150
|
| 28 |
},
|
| 29 |
{
|
| 30 |
"epoch": 1.0,
|
| 31 |
"eval_accuracy": 0.9113756613756614,
|
| 32 |
-
"eval_f1score": 0.
|
| 33 |
-
"eval_loss": 0.
|
| 34 |
-
"eval_precision": 0.
|
| 35 |
"eval_recall": 0.9113756613756614,
|
| 36 |
-
"eval_runtime":
|
| 37 |
-
"eval_samples_per_second":
|
| 38 |
-
"eval_steps_per_second": 0.
|
| 39 |
"step": 190
|
| 40 |
},
|
| 41 |
{
|
| 42 |
"epoch": 1.05,
|
| 43 |
"learning_rate": 0.00018888888888888888,
|
| 44 |
-
"loss": 0.
|
| 45 |
"step": 200
|
| 46 |
},
|
| 47 |
{
|
| 48 |
"epoch": 1.32,
|
| 49 |
"learning_rate": 0.00018333333333333334,
|
| 50 |
-
"loss": 0.
|
| 51 |
"step": 250
|
| 52 |
},
|
| 53 |
{
|
| 54 |
"epoch": 1.58,
|
| 55 |
"learning_rate": 0.00017777777777777779,
|
| 56 |
-
"loss": 0.
|
| 57 |
"step": 300
|
| 58 |
},
|
| 59 |
{
|
| 60 |
"epoch": 1.84,
|
| 61 |
"learning_rate": 0.00017222222222222224,
|
| 62 |
-
"loss": 0.
|
| 63 |
"step": 350
|
| 64 |
},
|
| 65 |
{
|
| 66 |
"epoch": 2.0,
|
| 67 |
-
"eval_accuracy": 0.
|
| 68 |
-
"eval_f1score": 0.
|
| 69 |
-
"eval_loss": 0.
|
| 70 |
-
"eval_precision": 0.
|
| 71 |
-
"eval_recall": 0.
|
| 72 |
-
"eval_runtime":
|
| 73 |
-
"eval_samples_per_second":
|
| 74 |
-
"eval_steps_per_second": 0.
|
| 75 |
"step": 380
|
| 76 |
},
|
| 77 |
{
|
| 78 |
"epoch": 2.11,
|
| 79 |
"learning_rate": 0.0001666666666666667,
|
| 80 |
-
"loss": 0.
|
| 81 |
"step": 400
|
| 82 |
},
|
| 83 |
{
|
| 84 |
"epoch": 2.37,
|
| 85 |
"learning_rate": 0.0001611111111111111,
|
| 86 |
-
"loss": 0.
|
| 87 |
"step": 450
|
| 88 |
},
|
| 89 |
{
|
| 90 |
"epoch": 2.63,
|
| 91 |
"learning_rate": 0.00015555555555555556,
|
| 92 |
-
"loss": 0.
|
| 93 |
"step": 500
|
| 94 |
},
|
| 95 |
{
|
| 96 |
"epoch": 2.89,
|
| 97 |
"learning_rate": 0.00015000000000000001,
|
| 98 |
-
"loss": 0.
|
| 99 |
"step": 550
|
| 100 |
},
|
| 101 |
{
|
| 102 |
"epoch": 3.0,
|
| 103 |
-
"eval_accuracy": 0.
|
| 104 |
-
"eval_f1score": 0.
|
| 105 |
-
"eval_loss": 0.
|
| 106 |
-
"eval_precision": 0.
|
| 107 |
-
"eval_recall": 0.
|
| 108 |
-
"eval_runtime":
|
| 109 |
-
"eval_samples_per_second":
|
| 110 |
-
"eval_steps_per_second": 0.
|
| 111 |
"step": 570
|
| 112 |
},
|
| 113 |
{
|
| 114 |
"epoch": 3.16,
|
| 115 |
"learning_rate": 0.00014444444444444444,
|
| 116 |
-
"loss": 0.
|
| 117 |
"step": 600
|
| 118 |
},
|
| 119 |
{
|
| 120 |
"epoch": 3.42,
|
| 121 |
"learning_rate": 0.0001388888888888889,
|
| 122 |
-
"loss": 0.
|
| 123 |
"step": 650
|
| 124 |
},
|
| 125 |
{
|
| 126 |
"epoch": 3.68,
|
| 127 |
"learning_rate": 0.00013333333333333334,
|
| 128 |
-
"loss": 0.
|
| 129 |
"step": 700
|
| 130 |
},
|
| 131 |
{
|
| 132 |
"epoch": 3.95,
|
| 133 |
"learning_rate": 0.00012777777777777776,
|
| 134 |
-
"loss": 0.
|
| 135 |
"step": 750
|
| 136 |
},
|
| 137 |
{
|
| 138 |
"epoch": 4.0,
|
| 139 |
-
"eval_accuracy": 0.
|
| 140 |
-
"eval_f1score": 0.
|
| 141 |
-
"eval_loss": 0.
|
| 142 |
-
"eval_precision": 0.
|
| 143 |
-
"eval_recall": 0.
|
| 144 |
-
"eval_runtime":
|
| 145 |
-
"eval_samples_per_second":
|
| 146 |
-
"eval_steps_per_second": 0.
|
| 147 |
"step": 760
|
| 148 |
},
|
| 149 |
{
|
| 150 |
"epoch": 4.21,
|
| 151 |
"learning_rate": 0.00012222222222222224,
|
| 152 |
-
"loss": 0.
|
| 153 |
"step": 800
|
| 154 |
},
|
| 155 |
{
|
| 156 |
"epoch": 4.47,
|
| 157 |
"learning_rate": 0.00011666666666666668,
|
| 158 |
-
"loss": 0.
|
| 159 |
"step": 850
|
| 160 |
},
|
| 161 |
{
|
| 162 |
"epoch": 4.74,
|
| 163 |
"learning_rate": 0.00011111111111111112,
|
| 164 |
-
"loss": 0.
|
| 165 |
"step": 900
|
| 166 |
},
|
| 167 |
{
|
| 168 |
"epoch": 5.0,
|
| 169 |
"learning_rate": 0.00010555555555555557,
|
| 170 |
-
"loss": 0.
|
| 171 |
"step": 950
|
| 172 |
},
|
| 173 |
{
|
| 174 |
"epoch": 5.0,
|
| 175 |
-
"eval_accuracy": 0.
|
| 176 |
-
"eval_f1score": 0.
|
| 177 |
-
"eval_loss": 0.
|
| 178 |
-
"eval_precision": 0.
|
| 179 |
-
"eval_recall": 0.
|
| 180 |
-
"eval_runtime":
|
| 181 |
-
"eval_samples_per_second":
|
| 182 |
-
"eval_steps_per_second": 0.
|
| 183 |
"step": 950
|
| 184 |
}
|
| 185 |
],
|
|
|
|
| 1 |
{
|
| 2 |
+
"best_metric": 0.14938032627105713,
|
| 3 |
+
"best_model_checkpoint": "Shravanig/vit-fire-detection\\checkpoint-760",
|
| 4 |
"epoch": 5.0,
|
| 5 |
"eval_steps": 500,
|
| 6 |
"global_step": 950,
|
|
|
|
| 11 |
{
|
| 12 |
"epoch": 0.26,
|
| 13 |
"learning_rate": 0.0001,
|
| 14 |
+
"loss": 0.9987,
|
| 15 |
"step": 50
|
| 16 |
},
|
| 17 |
{
|
| 18 |
"epoch": 0.53,
|
| 19 |
"learning_rate": 0.0002,
|
| 20 |
+
"loss": 0.6843,
|
| 21 |
"step": 100
|
| 22 |
},
|
| 23 |
{
|
| 24 |
"epoch": 0.79,
|
| 25 |
"learning_rate": 0.00019444444444444446,
|
| 26 |
+
"loss": 0.5138,
|
| 27 |
"step": 150
|
| 28 |
},
|
| 29 |
{
|
| 30 |
"epoch": 1.0,
|
| 31 |
"eval_accuracy": 0.9113756613756614,
|
| 32 |
+
"eval_f1score": 0.9107285323666766,
|
| 33 |
+
"eval_loss": 0.23306569457054138,
|
| 34 |
+
"eval_precision": 0.9103883996879023,
|
| 35 |
"eval_recall": 0.9113756613756614,
|
| 36 |
+
"eval_runtime": 42.0285,
|
| 37 |
+
"eval_samples_per_second": 17.988,
|
| 38 |
+
"eval_steps_per_second": 0.571,
|
| 39 |
"step": 190
|
| 40 |
},
|
| 41 |
{
|
| 42 |
"epoch": 1.05,
|
| 43 |
"learning_rate": 0.00018888888888888888,
|
| 44 |
+
"loss": 0.4285,
|
| 45 |
"step": 200
|
| 46 |
},
|
| 47 |
{
|
| 48 |
"epoch": 1.32,
|
| 49 |
"learning_rate": 0.00018333333333333334,
|
| 50 |
+
"loss": 0.4068,
|
| 51 |
"step": 250
|
| 52 |
},
|
| 53 |
{
|
| 54 |
"epoch": 1.58,
|
| 55 |
"learning_rate": 0.00017777777777777779,
|
| 56 |
+
"loss": 0.3365,
|
| 57 |
"step": 300
|
| 58 |
},
|
| 59 |
{
|
| 60 |
"epoch": 1.84,
|
| 61 |
"learning_rate": 0.00017222222222222224,
|
| 62 |
+
"loss": 0.3161,
|
| 63 |
"step": 350
|
| 64 |
},
|
| 65 |
{
|
| 66 |
"epoch": 2.0,
|
| 67 |
+
"eval_accuracy": 0.8981481481481481,
|
| 68 |
+
"eval_f1score": 0.8968320885202303,
|
| 69 |
+
"eval_loss": 0.22744037210941315,
|
| 70 |
+
"eval_precision": 0.9110491043143017,
|
| 71 |
+
"eval_recall": 0.8981481481481481,
|
| 72 |
+
"eval_runtime": 41.3214,
|
| 73 |
+
"eval_samples_per_second": 18.296,
|
| 74 |
+
"eval_steps_per_second": 0.581,
|
| 75 |
"step": 380
|
| 76 |
},
|
| 77 |
{
|
| 78 |
"epoch": 2.11,
|
| 79 |
"learning_rate": 0.0001666666666666667,
|
| 80 |
+
"loss": 0.2911,
|
| 81 |
"step": 400
|
| 82 |
},
|
| 83 |
{
|
| 84 |
"epoch": 2.37,
|
| 85 |
"learning_rate": 0.0001611111111111111,
|
| 86 |
+
"loss": 0.3162,
|
| 87 |
"step": 450
|
| 88 |
},
|
| 89 |
{
|
| 90 |
"epoch": 2.63,
|
| 91 |
"learning_rate": 0.00015555555555555556,
|
| 92 |
+
"loss": 0.275,
|
| 93 |
"step": 500
|
| 94 |
},
|
| 95 |
{
|
| 96 |
"epoch": 2.89,
|
| 97 |
"learning_rate": 0.00015000000000000001,
|
| 98 |
+
"loss": 0.2686,
|
| 99 |
"step": 550
|
| 100 |
},
|
| 101 |
{
|
| 102 |
"epoch": 3.0,
|
| 103 |
+
"eval_accuracy": 0.9378306878306878,
|
| 104 |
+
"eval_f1score": 0.937487918832369,
|
| 105 |
+
"eval_loss": 0.16444851458072662,
|
| 106 |
+
"eval_precision": 0.9376014472102792,
|
| 107 |
+
"eval_recall": 0.9378306878306878,
|
| 108 |
+
"eval_runtime": 41.7491,
|
| 109 |
+
"eval_samples_per_second": 18.108,
|
| 110 |
+
"eval_steps_per_second": 0.575,
|
| 111 |
"step": 570
|
| 112 |
},
|
| 113 |
{
|
| 114 |
"epoch": 3.16,
|
| 115 |
"learning_rate": 0.00014444444444444444,
|
| 116 |
+
"loss": 0.2547,
|
| 117 |
"step": 600
|
| 118 |
},
|
| 119 |
{
|
| 120 |
"epoch": 3.42,
|
| 121 |
"learning_rate": 0.0001388888888888889,
|
| 122 |
+
"loss": 0.2721,
|
| 123 |
"step": 650
|
| 124 |
},
|
| 125 |
{
|
| 126 |
"epoch": 3.68,
|
| 127 |
"learning_rate": 0.00013333333333333334,
|
| 128 |
+
"loss": 0.2396,
|
| 129 |
"step": 700
|
| 130 |
},
|
| 131 |
{
|
| 132 |
"epoch": 3.95,
|
| 133 |
"learning_rate": 0.00012777777777777776,
|
| 134 |
+
"loss": 0.2335,
|
| 135 |
"step": 750
|
| 136 |
},
|
| 137 |
{
|
| 138 |
"epoch": 4.0,
|
| 139 |
+
"eval_accuracy": 0.951058201058201,
|
| 140 |
+
"eval_f1score": 0.9510381343653914,
|
| 141 |
+
"eval_loss": 0.14938032627105713,
|
| 142 |
+
"eval_precision": 0.9534914361001318,
|
| 143 |
+
"eval_recall": 0.951058201058201,
|
| 144 |
+
"eval_runtime": 45.6331,
|
| 145 |
+
"eval_samples_per_second": 16.567,
|
| 146 |
+
"eval_steps_per_second": 0.526,
|
| 147 |
"step": 760
|
| 148 |
},
|
| 149 |
{
|
| 150 |
"epoch": 4.21,
|
| 151 |
"learning_rate": 0.00012222222222222224,
|
| 152 |
+
"loss": 0.2412,
|
| 153 |
"step": 800
|
| 154 |
},
|
| 155 |
{
|
| 156 |
"epoch": 4.47,
|
| 157 |
"learning_rate": 0.00011666666666666668,
|
| 158 |
+
"loss": 0.2092,
|
| 159 |
"step": 850
|
| 160 |
},
|
| 161 |
{
|
| 162 |
"epoch": 4.74,
|
| 163 |
"learning_rate": 0.00011111111111111112,
|
| 164 |
+
"loss": 0.2179,
|
| 165 |
"step": 900
|
| 166 |
},
|
| 167 |
{
|
| 168 |
"epoch": 5.0,
|
| 169 |
"learning_rate": 0.00010555555555555557,
|
| 170 |
+
"loss": 0.2058,
|
| 171 |
"step": 950
|
| 172 |
},
|
| 173 |
{
|
| 174 |
"epoch": 5.0,
|
| 175 |
+
"eval_accuracy": 0.9497354497354498,
|
| 176 |
+
"eval_f1score": 0.9494114362396765,
|
| 177 |
+
"eval_loss": 0.1685035079717636,
|
| 178 |
+
"eval_precision": 0.9494850222122949,
|
| 179 |
+
"eval_recall": 0.9497354497354498,
|
| 180 |
+
"eval_runtime": 40.9327,
|
| 181 |
+
"eval_samples_per_second": 18.469,
|
| 182 |
+
"eval_steps_per_second": 0.586,
|
| 183 |
"step": 950
|
| 184 |
}
|
| 185 |
],
|
tmp-checkpoint-950/training_args.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4792
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:270b5928caae40c5bca0e7cca3827e413320f661f75cdabd732e310d4ec2bcd3
|
| 3 |
size 4792
|