Docty committed on
Commit
c650617
·
verified ·
1 Parent(s): 87c36d2

Model save

Browse files
.gitattributes CHANGED
@@ -33,3 +33,7 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ image_0.png filter=lfs diff=lfs merge=lfs -text
37
+ image_1.png filter=lfs diff=lfs merge=lfs -text
38
+ image_2.png filter=lfs diff=lfs merge=lfs -text
39
+ image_3.png filter=lfs diff=lfs merge=lfs -text
README.md CHANGED
@@ -18,8 +18,8 @@ should probably proofread and complete it, then remove this comment. -->
18
 
19
  This model is a fine-tuned version of [google/vit-base-patch16-224-in21k](https://huggingface.co/google/vit-base-patch16-224-in21k) on an unknown dataset.
20
  It achieves the following results on the evaluation set:
21
- - Loss: 1.3390
22
  - Accuracy: 0.925
 
23
 
24
  ## Model description
25
 
@@ -48,9 +48,9 @@ The following hyperparameters were used during training:
48
 
49
  ### Training results
50
 
51
- | Training Loss | Epoch | Step | Validation Loss | Accuracy |
52
- |:-------------:|:-----:|:----:|:---------------:|:--------:|
53
- | 1.3069 | 1.0 | 170 | 1.3390 | 0.925 |
54
 
55
 
56
  ### Framework versions
 
18
 
19
  This model is a fine-tuned version of [google/vit-base-patch16-224-in21k](https://huggingface.co/google/vit-base-patch16-224-in21k) on an unknown dataset.
20
  It achieves the following results on the evaluation set:
 
21
  - Accuracy: 0.925
22
+ - Loss: 1.3390
23
 
24
  ## Model description
25
 
 
48
 
49
  ### Training results
50
 
51
+ | Training Loss | Epoch | Step | Accuracy | Validation Loss |
52
+ |:-------------:|:-----:|:----:|:--------:|:---------------:|
53
+ | 1.3069 | 1.0 | 170 | 0.925 | 1.3390 |
54
 
55
 
56
  ### Framework versions
all_results.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 1.0,
3
+ "eval_accuracy": 0.925,
4
+ "eval_loss": 1.3389760255813599,
5
+ "eval_runtime": 3.7035,
6
+ "eval_samples_per_second": 64.803,
7
+ "eval_steps_per_second": 8.1,
8
+ "total_flos": 1.0539477329117184e+17,
9
+ "train_loss": 1.6158509927637437,
10
+ "train_runtime": 77.4929,
11
+ "train_samples_per_second": 17.55,
12
+ "train_steps_per_second": 2.194
13
+ }
config.json CHANGED
@@ -40,7 +40,6 @@
40
  "patch_size": 16,
41
  "pooler_act": "tanh",
42
  "pooler_output_size": 768,
43
- "problem_type": "single_label_classification",
44
  "qkv_bias": true,
45
  "transformers_version": "4.56.1"
46
  }
 
40
  "patch_size": 16,
41
  "pooler_act": "tanh",
42
  "pooler_output_size": 768,
 
43
  "qkv_bias": true,
44
  "transformers_version": "4.56.1"
45
  }
eval_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 1.0,
3
+ "eval_accuracy": 0.925,
4
+ "eval_loss": 1.3389760255813599,
5
+ "eval_runtime": 3.7035,
6
+ "eval_samples_per_second": 64.803,
7
+ "eval_steps_per_second": 8.1
8
+ }
image_0.png ADDED

Git LFS Details

  • SHA256: 0be8f58b4b6d41413d300543ee67f999305c7b14354f87e6f8231b5ed4f4c4c2
  • Pointer size: 131 Bytes
  • Size of remote file: 244 kB
image_1.png ADDED

Git LFS Details

  • SHA256: cac2905641f3a12b78857dbd6c9911bf4353f43626460809c402e68cdda9da39
  • Pointer size: 131 Bytes
  • Size of remote file: 300 kB
image_2.png ADDED

Git LFS Details

  • SHA256: 8a9e167d0297ccafbd8ad85d623d75766a6bcb0c3887ce9cb06f2c50360e860e
  • Pointer size: 131 Bytes
  • Size of remote file: 324 kB
image_3.png ADDED

Git LFS Details

  • SHA256: 73d259138a0ec2a08db25248423c25f1ad1eae52d68af8d971b70da4a4da5532
  • Pointer size: 131 Bytes
  • Size of remote file: 227 kB
train_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 1.0,
3
+ "total_flos": 1.0539477329117184e+17,
4
+ "train_loss": 1.6158509927637437,
5
+ "train_runtime": 77.4929,
6
+ "train_samples_per_second": 17.55,
7
+ "train_steps_per_second": 2.194
8
+ }
trainer_state.json ADDED
@@ -0,0 +1,171 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_global_step": 170,
3
+ "best_metric": 1.3389760255813599,
4
+ "best_model_checkpoint": "./mangoes/checkpoint-170",
5
+ "epoch": 1.0,
6
+ "eval_steps": 500,
7
+ "global_step": 170,
8
+ "is_hyper_param_search": false,
9
+ "is_local_process_zero": true,
10
+ "is_world_process_zero": true,
11
+ "log_history": [
12
+ {
13
+ "epoch": 0.058823529411764705,
14
+ "grad_norm": 1.954006552696228,
15
+ "learning_rate": 1.8941176470588238e-05,
16
+ "loss": 2.0442,
17
+ "step": 10
18
+ },
19
+ {
20
+ "epoch": 0.11764705882352941,
21
+ "grad_norm": 3.1689231395721436,
22
+ "learning_rate": 1.776470588235294e-05,
23
+ "loss": 2.0181,
24
+ "step": 20
25
+ },
26
+ {
27
+ "epoch": 0.17647058823529413,
28
+ "grad_norm": 3.157071352005005,
29
+ "learning_rate": 1.658823529411765e-05,
30
+ "loss": 1.9073,
31
+ "step": 30
32
+ },
33
+ {
34
+ "epoch": 0.23529411764705882,
35
+ "grad_norm": 2.8379974365234375,
36
+ "learning_rate": 1.5411764705882356e-05,
37
+ "loss": 1.8325,
38
+ "step": 40
39
+ },
40
+ {
41
+ "epoch": 0.29411764705882354,
42
+ "grad_norm": 3.095369815826416,
43
+ "learning_rate": 1.423529411764706e-05,
44
+ "loss": 1.7749,
45
+ "step": 50
46
+ },
47
+ {
48
+ "epoch": 0.35294117647058826,
49
+ "grad_norm": 3.269249677658081,
50
+ "learning_rate": 1.3058823529411766e-05,
51
+ "loss": 1.7894,
52
+ "step": 60
53
+ },
54
+ {
55
+ "epoch": 0.4117647058823529,
56
+ "grad_norm": 2.953714370727539,
57
+ "learning_rate": 1.1882352941176472e-05,
58
+ "loss": 1.6664,
59
+ "step": 70
60
+ },
61
+ {
62
+ "epoch": 0.47058823529411764,
63
+ "grad_norm": 3.622612237930298,
64
+ "learning_rate": 1.0705882352941178e-05,
65
+ "loss": 1.6351,
66
+ "step": 80
67
+ },
68
+ {
69
+ "epoch": 0.5294117647058824,
70
+ "grad_norm": 3.304643154144287,
71
+ "learning_rate": 9.529411764705882e-06,
72
+ "loss": 1.5905,
73
+ "step": 90
74
+ },
75
+ {
76
+ "epoch": 0.5882352941176471,
77
+ "grad_norm": 3.047823667526245,
78
+ "learning_rate": 8.35294117647059e-06,
79
+ "loss": 1.4602,
80
+ "step": 100
81
+ },
82
+ {
83
+ "epoch": 0.6470588235294118,
84
+ "grad_norm": 3.3985748291015625,
85
+ "learning_rate": 7.176470588235295e-06,
86
+ "loss": 1.5058,
87
+ "step": 110
88
+ },
89
+ {
90
+ "epoch": 0.7058823529411765,
91
+ "grad_norm": 3.7313411235809326,
92
+ "learning_rate": 6e-06,
93
+ "loss": 1.4221,
94
+ "step": 120
95
+ },
96
+ {
97
+ "epoch": 0.7647058823529411,
98
+ "grad_norm": 3.2533087730407715,
99
+ "learning_rate": 4.823529411764706e-06,
100
+ "loss": 1.4311,
101
+ "step": 130
102
+ },
103
+ {
104
+ "epoch": 0.8235294117647058,
105
+ "grad_norm": 3.58194637298584,
106
+ "learning_rate": 3.6470588235294117e-06,
107
+ "loss": 1.3677,
108
+ "step": 140
109
+ },
110
+ {
111
+ "epoch": 0.8823529411764706,
112
+ "grad_norm": 2.956484317779541,
113
+ "learning_rate": 2.470588235294118e-06,
114
+ "loss": 1.3706,
115
+ "step": 150
116
+ },
117
+ {
118
+ "epoch": 0.9411764705882353,
119
+ "grad_norm": 3.5362460613250732,
120
+ "learning_rate": 1.2941176470588237e-06,
121
+ "loss": 1.3467,
122
+ "step": 160
123
+ },
124
+ {
125
+ "epoch": 1.0,
126
+ "grad_norm": 3.1102607250213623,
127
+ "learning_rate": 1.1764705882352942e-07,
128
+ "loss": 1.3069,
129
+ "step": 170
130
+ },
131
+ {
132
+ "epoch": 1.0,
133
+ "eval_accuracy": 0.925,
134
+ "eval_loss": 1.3389760255813599,
135
+ "eval_runtime": 3.7037,
136
+ "eval_samples_per_second": 64.8,
137
+ "eval_steps_per_second": 8.1,
138
+ "step": 170
139
+ },
140
+ {
141
+ "epoch": 1.0,
142
+ "step": 170,
143
+ "total_flos": 1.0539477329117184e+17,
144
+ "train_loss": 1.6158509927637437,
145
+ "train_runtime": 77.4929,
146
+ "train_samples_per_second": 17.55,
147
+ "train_steps_per_second": 2.194
148
+ }
149
+ ],
150
+ "logging_steps": 10,
151
+ "max_steps": 170,
152
+ "num_input_tokens_seen": 0,
153
+ "num_train_epochs": 1,
154
+ "save_steps": 500,
155
+ "stateful_callbacks": {
156
+ "TrainerControl": {
157
+ "args": {
158
+ "should_epoch_stop": false,
159
+ "should_evaluate": false,
160
+ "should_log": false,
161
+ "should_save": true,
162
+ "should_training_stop": true
163
+ },
164
+ "attributes": {}
165
+ }
166
+ },
167
+ "total_flos": 1.0539477329117184e+17,
168
+ "train_batch_size": 8,
169
+ "trial_name": null,
170
+ "trial_params": null
171
+ }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:997a6e4fe36bfd648c3fb14e63a3370fd6401883641dbd5f408384d32a4d6c75
3
  size 5777
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5cb67eff64db67cd107ce7365441a071cd571805b0125c9e753dc3e1e7165c04
3
  size 5777