djbp commited on
Commit
88e4d5b
·
verified ·
1 Parent(s): 22d2198

End of training

Browse files
all_results.json CHANGED
@@ -1,13 +1,14 @@
1
  {
2
  "epoch": 6.885245901639344,
3
- "eval_accuracy": 0.8729338842975206,
4
- "eval_loss": 0.34267309308052063,
5
- "eval_runtime": 203.1004,
6
- "eval_samples_per_second": 9.532,
 
7
  "eval_steps_per_second": 0.079,
8
- "total_flos": 4.180411553219629e+18,
9
- "train_loss": 0.4180879854020618,
10
- "train_runtime": 6613.2188,
11
- "train_samples_per_second": 8.194,
12
  "train_steps_per_second": 0.016
13
  }
 
1
  {
2
  "epoch": 6.885245901639344,
3
+ "eval_accuracy": 0.8824443293630243,
4
+ "eval_auc": 0.957557852599524,
5
+ "eval_loss": 0.30561181902885437,
6
+ "eval_runtime": 203.3286,
7
+ "eval_samples_per_second": 9.497,
8
  "eval_steps_per_second": 0.079,
9
+ "total_flos": 4.1785312376666235e+18,
10
+ "train_loss": 0.38780884515671504,
11
+ "train_runtime": 6680.4521,
12
+ "train_samples_per_second": 8.107,
13
  "train_steps_per_second": 0.016
14
  }
eval_results.json CHANGED
@@ -1,8 +1,9 @@
1
  {
2
  "epoch": 6.885245901639344,
3
- "eval_accuracy": 0.8729338842975206,
4
- "eval_loss": 0.34267309308052063,
5
- "eval_runtime": 203.1004,
6
- "eval_samples_per_second": 9.532,
 
7
  "eval_steps_per_second": 0.079
8
  }
 
1
  {
2
  "epoch": 6.885245901639344,
3
+ "eval_accuracy": 0.8824443293630243,
4
+ "eval_auc": 0.957557852599524,
5
+ "eval_loss": 0.30561181902885437,
6
+ "eval_runtime": 203.3286,
7
+ "eval_samples_per_second": 9.497,
8
  "eval_steps_per_second": 0.079
9
  }
runs/Aug28_16-52-19_data-science-wbi/events.out.tfevents.1724870839.data-science-wbi ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2b08144f96c5b4de882fba4b0c1b99cff56e739f68a99dc5afe31dc0e5892055
3
+ size 87
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 6.885245901639344,
3
- "total_flos": 4.180411553219629e+18,
4
- "train_loss": 0.4180879854020618,
5
- "train_runtime": 6613.2188,
6
- "train_samples_per_second": 8.194,
7
  "train_steps_per_second": 0.016
8
  }
 
1
  {
2
  "epoch": 6.885245901639344,
3
+ "total_flos": 4.1785312376666235e+18,
4
+ "train_loss": 0.38780884515671504,
5
+ "train_runtime": 6680.4521,
6
+ "train_samples_per_second": 8.107,
7
  "train_steps_per_second": 0.016
8
  }
trainer_state.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
- "best_metric": 0.8729338842975206,
3
- "best_model_checkpoint": "swin-base-patch4-window7-224-in22k-MM_Classification_base_V10/checkpoint-91",
4
  "epoch": 6.885245901639344,
5
  "eval_steps": 500,
6
  "global_step": 105,
@@ -10,144 +10,151 @@
10
  "log_history": [
11
  {
12
  "epoch": 0.6557377049180327,
13
- "grad_norm": 1.847607135772705,
14
  "learning_rate": 4.545454545454546e-05,
15
- "loss": 0.7948,
16
  "step": 10
17
  },
18
  {
19
  "epoch": 0.9836065573770492,
20
- "eval_accuracy": 0.8352272727272727,
21
- "eval_loss": 0.4498441815376282,
22
- "eval_runtime": 204.2611,
23
- "eval_samples_per_second": 9.478,
 
24
  "eval_steps_per_second": 0.078,
25
  "step": 15
26
  },
27
  {
28
  "epoch": 1.3114754098360657,
29
- "grad_norm": 2.3756892681121826,
30
  "learning_rate": 4.5212765957446815e-05,
31
- "loss": 0.5062,
32
  "step": 20
33
  },
34
  {
35
  "epoch": 1.9672131147540983,
36
- "grad_norm": 1.4792882204055786,
37
  "learning_rate": 3.9893617021276594e-05,
38
- "loss": 0.4439,
39
  "step": 30
40
  },
41
  {
42
  "epoch": 1.9672131147540983,
43
- "eval_accuracy": 0.8589876033057852,
44
- "eval_loss": 0.38362234830856323,
45
- "eval_runtime": 210.2217,
46
- "eval_samples_per_second": 9.209,
47
- "eval_steps_per_second": 0.076,
 
48
  "step": 30
49
  },
50
  {
51
  "epoch": 2.6229508196721314,
52
- "grad_norm": 2.130309581756592,
53
  "learning_rate": 3.4574468085106386e-05,
54
- "loss": 0.4024,
55
  "step": 40
56
  },
57
  {
58
  "epoch": 2.9508196721311473,
59
- "eval_accuracy": 0.8600206611570248,
60
- "eval_loss": 0.36524850130081177,
61
- "eval_runtime": 204.4105,
62
- "eval_samples_per_second": 9.471,
 
63
  "eval_steps_per_second": 0.078,
64
  "step": 45
65
  },
66
  {
67
  "epoch": 3.278688524590164,
68
- "grad_norm": 2.3738443851470947,
69
  "learning_rate": 2.925531914893617e-05,
70
- "loss": 0.3801,
71
  "step": 50
72
  },
73
  {
74
  "epoch": 3.9344262295081966,
75
- "grad_norm": 3.785062074661255,
76
  "learning_rate": 2.393617021276596e-05,
77
- "loss": 0.3562,
78
  "step": 60
79
  },
80
  {
81
  "epoch": 4.0,
82
- "eval_accuracy": 0.8641528925619835,
83
- "eval_loss": 0.34744057059288025,
84
- "eval_runtime": 203.8324,
85
- "eval_samples_per_second": 9.498,
 
86
  "eval_steps_per_second": 0.078,
87
  "step": 61
88
  },
89
  {
90
  "epoch": 4.590163934426229,
91
- "grad_norm": 3.449556827545166,
92
  "learning_rate": 1.8617021276595745e-05,
93
- "loss": 0.345,
94
  "step": 70
95
  },
96
  {
97
  "epoch": 4.983606557377049,
98
- "eval_accuracy": 0.868801652892562,
99
- "eval_loss": 0.34286215901374817,
100
- "eval_runtime": 203.6664,
101
- "eval_samples_per_second": 9.506,
102
- "eval_steps_per_second": 0.079,
 
103
  "step": 76
104
  },
105
  {
106
  "epoch": 5.245901639344262,
107
- "grad_norm": 2.114426851272583,
108
  "learning_rate": 1.3297872340425532e-05,
109
- "loss": 0.3374,
110
  "step": 80
111
  },
112
  {
113
  "epoch": 5.901639344262295,
114
- "grad_norm": 4.8909759521484375,
115
  "learning_rate": 7.97872340425532e-06,
116
- "loss": 0.3379,
117
  "step": 90
118
  },
119
  {
120
  "epoch": 5.967213114754099,
121
- "eval_accuracy": 0.8729338842975206,
122
- "eval_loss": 0.34267309308052063,
123
- "eval_runtime": 204.1334,
124
- "eval_samples_per_second": 9.484,
 
125
  "eval_steps_per_second": 0.078,
126
  "step": 91
127
  },
128
  {
129
  "epoch": 6.557377049180328,
130
- "grad_norm": 3.155640125274658,
131
  "learning_rate": 2.6595744680851065e-06,
132
- "loss": 0.3213,
133
  "step": 100
134
  },
135
  {
136
  "epoch": 6.885245901639344,
137
- "eval_accuracy": 0.8708677685950413,
138
- "eval_loss": 0.3443421423435211,
139
- "eval_runtime": 203.5472,
140
- "eval_samples_per_second": 9.511,
 
141
  "eval_steps_per_second": 0.079,
142
  "step": 105
143
  },
144
  {
145
  "epoch": 6.885245901639344,
146
  "step": 105,
147
- "total_flos": 4.180411553219629e+18,
148
- "train_loss": 0.4180879854020618,
149
- "train_runtime": 6613.2188,
150
- "train_samples_per_second": 8.194,
151
  "train_steps_per_second": 0.016
152
  }
153
  ],
@@ -168,7 +175,7 @@
168
  "attributes": {}
169
  }
170
  },
171
- "total_flos": 4.180411553219629e+18,
172
  "train_batch_size": 128,
173
  "trial_name": null,
174
  "trial_params": null
 
1
  {
2
+ "best_metric": 0.8824443293630243,
3
+ "best_model_checkpoint": "swin-base-patch4-window7-224-in22k-MM_Classification_base_V10/checkpoint-105",
4
  "epoch": 6.885245901639344,
5
  "eval_steps": 500,
6
  "global_step": 105,
 
10
  "log_history": [
11
  {
12
  "epoch": 0.6557377049180327,
13
+ "grad_norm": 5.335843086242676,
14
  "learning_rate": 4.545454545454546e-05,
15
+ "loss": 0.8134,
16
  "step": 10
17
  },
18
  {
19
  "epoch": 0.9836065573770492,
20
+ "eval_accuracy": 0.8430864836872087,
21
+ "eval_auc": 0.9250639596370771,
22
+ "eval_loss": 0.419461190700531,
23
+ "eval_runtime": 205.2459,
24
+ "eval_samples_per_second": 9.408,
25
  "eval_steps_per_second": 0.078,
26
  "step": 15
27
  },
28
  {
29
  "epoch": 1.3114754098360657,
30
+ "grad_norm": 2.8889973163604736,
31
  "learning_rate": 4.5212765957446815e-05,
32
+ "loss": 0.5101,
33
  "step": 20
34
  },
35
  {
36
  "epoch": 1.9672131147540983,
37
+ "grad_norm": 1.6868778467178345,
38
  "learning_rate": 3.9893617021276594e-05,
39
+ "loss": 0.3996,
40
  "step": 30
41
  },
42
  {
43
  "epoch": 1.9672131147540983,
44
+ "eval_accuracy": 0.8570688762299327,
45
+ "eval_auc": 0.9437553079992403,
46
+ "eval_loss": 0.3682312071323395,
47
+ "eval_runtime": 204.3267,
48
+ "eval_samples_per_second": 9.451,
49
+ "eval_steps_per_second": 0.078,
50
  "step": 30
51
  },
52
  {
53
  "epoch": 2.6229508196721314,
54
+ "grad_norm": 1.9163786172866821,
55
  "learning_rate": 3.4574468085106386e-05,
56
+ "loss": 0.3693,
57
  "step": 40
58
  },
59
  {
60
  "epoch": 2.9508196721311473,
61
+ "eval_accuracy": 0.877783531848783,
62
+ "eval_auc": 0.9529726135197429,
63
+ "eval_loss": 0.324381947517395,
64
+ "eval_runtime": 203.8679,
65
+ "eval_samples_per_second": 9.472,
66
  "eval_steps_per_second": 0.078,
67
  "step": 45
68
  },
69
  {
70
  "epoch": 3.278688524590164,
71
+ "grad_norm": 2.268683433532715,
72
  "learning_rate": 2.925531914893617e-05,
73
+ "loss": 0.3326,
74
  "step": 50
75
  },
76
  {
77
  "epoch": 3.9344262295081966,
78
+ "grad_norm": 2.837725877761841,
79
  "learning_rate": 2.393617021276596e-05,
80
+ "loss": 0.3147,
81
  "step": 60
82
  },
83
  {
84
  "epoch": 4.0,
85
+ "eval_accuracy": 0.8793371310201968,
86
+ "eval_auc": 0.9557452970649672,
87
+ "eval_loss": 0.31093424558639526,
88
+ "eval_runtime": 204.9066,
89
+ "eval_samples_per_second": 9.424,
90
  "eval_steps_per_second": 0.078,
91
  "step": 61
92
  },
93
  {
94
  "epoch": 4.590163934426229,
95
+ "grad_norm": 1.7413060665130615,
96
  "learning_rate": 1.8617021276595745e-05,
97
+ "loss": 0.3166,
98
  "step": 70
99
  },
100
  {
101
  "epoch": 4.983606557377049,
102
+ "eval_accuracy": 0.8803728638011393,
103
+ "eval_auc": 0.9561359266346766,
104
+ "eval_loss": 0.3134761154651642,
105
+ "eval_runtime": 204.4948,
106
+ "eval_samples_per_second": 9.443,
107
+ "eval_steps_per_second": 0.078,
108
  "step": 76
109
  },
110
  {
111
  "epoch": 5.245901639344262,
112
+ "grad_norm": 1.7945168018341064,
113
  "learning_rate": 1.3297872340425532e-05,
114
+ "loss": 0.2921,
115
  "step": 80
116
  },
117
  {
118
  "epoch": 5.901639344262295,
119
+ "grad_norm": 1.865674376487732,
120
  "learning_rate": 7.97872340425532e-06,
121
+ "loss": 0.2918,
122
  "step": 90
123
  },
124
  {
125
  "epoch": 5.967213114754099,
126
+ "eval_accuracy": 0.8746763335059554,
127
+ "eval_auc": 0.9568584001596542,
128
+ "eval_loss": 0.3116800785064697,
129
+ "eval_runtime": 205.4646,
130
+ "eval_samples_per_second": 9.398,
131
  "eval_steps_per_second": 0.078,
132
  "step": 91
133
  },
134
  {
135
  "epoch": 6.557377049180328,
136
+ "grad_norm": 4.410208225250244,
137
  "learning_rate": 2.6595744680851065e-06,
138
+ "loss": 0.2849,
139
  "step": 100
140
  },
141
  {
142
  "epoch": 6.885245901639344,
143
+ "eval_accuracy": 0.8824443293630243,
144
+ "eval_auc": 0.957557852599524,
145
+ "eval_loss": 0.30561181902885437,
146
+ "eval_runtime": 203.0816,
147
+ "eval_samples_per_second": 9.508,
148
  "eval_steps_per_second": 0.079,
149
  "step": 105
150
  },
151
  {
152
  "epoch": 6.885245901639344,
153
  "step": 105,
154
+ "total_flos": 4.1785312376666235e+18,
155
+ "train_loss": 0.38780884515671504,
156
+ "train_runtime": 6680.4521,
157
+ "train_samples_per_second": 8.107,
158
  "train_steps_per_second": 0.016
159
  }
160
  ],
 
175
  "attributes": {}
176
  }
177
  },
178
+ "total_flos": 4.1785312376666235e+18,
179
  "train_batch_size": 128,
180
  "trial_name": null,
181
  "trial_params": null