pavitemple committed on
Commit
3e6dcbe
·
1 Parent(s): de08a45

End of training

Browse files
Files changed (4) hide show
  1. README.md +1 -1
  2. all_results.json +5 -5
  3. test_results.json +5 -5
  4. trainer_state.json +142 -52
README.md CHANGED
@@ -17,7 +17,7 @@ should probably proofread and complete it, then remove this comment. -->
17
 
18
  This model is a fine-tuned version of [MCG-NJU/videomae-base](https://huggingface.co/MCG-NJU/videomae-base) on an unknown dataset.
19
  It achieves the following results on the evaluation set:
20
- - Loss: 0.9771
21
  - Accuracy: 0.6176
22
 
23
  ## Model description
 
17
 
18
  This model is a fine-tuned version of [MCG-NJU/videomae-base](https://huggingface.co/MCG-NJU/videomae-base) on an unknown dataset.
19
  It achieves the following results on the evaluation set:
20
+ - Loss: 1.0015
21
  - Accuracy: 0.6176
22
 
23
  ## Model description
all_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 4.2,
3
- "eval_accuracy": 0.47058823529411764,
4
- "eval_loss": 1.3654829263687134,
5
- "eval_runtime": 226.6589,
6
- "eval_samples_per_second": 0.075,
7
  "eval_steps_per_second": 0.009
8
  }
 
1
  {
2
+ "epoch": 12.04,
3
+ "eval_accuracy": 0.6176470588235294,
4
+ "eval_loss": 1.001463770866394,
5
+ "eval_runtime": 216.1108,
6
+ "eval_samples_per_second": 0.079,
7
  "eval_steps_per_second": 0.009
8
  }
test_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 4.2,
3
- "eval_accuracy": 0.47058823529411764,
4
- "eval_loss": 1.3654829263687134,
5
- "eval_runtime": 226.6589,
6
- "eval_samples_per_second": 0.075,
7
  "eval_steps_per_second": 0.009
8
  }
 
1
  {
2
+ "epoch": 12.04,
3
+ "eval_accuracy": 0.6176470588235294,
4
+ "eval_loss": 1.001463770866394,
5
+ "eval_runtime": 216.1108,
6
+ "eval_samples_per_second": 0.079,
7
  "eval_steps_per_second": 0.009
8
  }
trainer_state.json CHANGED
@@ -1,103 +1,193 @@
1
  {
2
- "best_metric": 0.5652173913043478,
3
- "best_model_checkpoint": "finetuned-Accident-SingleLabel-Final/checkpoint-16",
4
- "epoch": 4.2,
5
  "eval_steps": 500,
6
- "global_step": 20,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
- "epoch": 0.2,
13
- "eval_accuracy": 0.391304347826087,
14
- "eval_loss": 1.7558271884918213,
15
- "eval_runtime": 181.0738,
16
  "eval_samples_per_second": 0.066,
17
  "eval_steps_per_second": 0.006,
18
  "step": 4
19
  },
20
  {
21
- "epoch": 1.2,
22
- "eval_accuracy": 0.5217391304347826,
23
- "eval_loss": 1.6333752870559692,
24
- "eval_runtime": 175.4835,
25
  "eval_samples_per_second": 0.068,
26
  "eval_steps_per_second": 0.006,
27
  "step": 8
28
  },
29
  {
30
- "epoch": 2.1,
31
- "learning_rate": 2.777777777777778e-05,
32
- "loss": 1.5371,
33
  "step": 10
34
  },
35
  {
36
- "epoch": 2.2,
37
- "eval_accuracy": 0.5217391304347826,
38
- "eval_loss": 1.4526761770248413,
39
- "eval_runtime": 175.7603,
40
  "eval_samples_per_second": 0.068,
41
  "eval_steps_per_second": 0.006,
42
  "step": 12
43
  },
44
  {
45
- "epoch": 3.2,
46
- "eval_accuracy": 0.5652173913043478,
47
- "eval_loss": 1.291401982307434,
48
- "eval_runtime": 178.1903,
49
- "eval_samples_per_second": 0.067,
50
  "eval_steps_per_second": 0.006,
51
  "step": 16
52
  },
53
  {
54
- "epoch": 4.2,
55
- "learning_rate": 0.0,
56
- "loss": 1.1439,
57
  "step": 20
58
  },
59
  {
60
- "epoch": 4.2,
61
- "eval_accuracy": 0.5652173913043478,
62
- "eval_loss": 1.2895885705947876,
63
- "eval_runtime": 175.7621,
64
  "eval_samples_per_second": 0.068,
65
  "eval_steps_per_second": 0.006,
66
  "step": 20
67
  },
68
  {
69
- "epoch": 4.2,
70
- "step": 20,
71
- "total_flos": 3.115272515753083e+17,
72
- "train_loss": 1.3405299186706543,
73
- "train_runtime": 3828.671,
74
- "train_samples_per_second": 0.084,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
75
  "train_steps_per_second": 0.005
76
  },
77
  {
78
- "epoch": 4.2,
79
- "eval_accuracy": 0.47058823529411764,
80
- "eval_loss": 1.3361997604370117,
81
- "eval_runtime": 250.3731,
82
- "eval_samples_per_second": 0.068,
83
- "eval_steps_per_second": 0.008,
84
- "step": 20
85
  },
86
  {
87
- "epoch": 4.2,
88
- "eval_accuracy": 0.47058823529411764,
89
- "eval_loss": 1.3654829263687134,
90
- "eval_runtime": 226.6589,
91
- "eval_samples_per_second": 0.075,
92
  "eval_steps_per_second": 0.009,
93
- "step": 20
94
  }
95
  ],
96
  "logging_steps": 10,
97
- "max_steps": 20,
98
  "num_train_epochs": 9223372036854775807,
99
  "save_steps": 500,
100
- "total_flos": 3.115272515753083e+17,
101
  "trial_name": null,
102
  "trial_params": null
103
  }
 
1
  {
2
+ "best_metric": 0.6521739130434783,
3
+ "best_model_checkpoint": "finetuned-Accident-SingleLabel-Final/checkpoint-32",
4
+ "epoch": 12.04,
5
  "eval_steps": 500,
6
+ "global_step": 50,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
+ "epoch": 0.08,
13
+ "eval_accuracy": 0.13043478260869565,
14
+ "eval_loss": 1.7643578052520752,
15
+ "eval_runtime": 180.6913,
16
  "eval_samples_per_second": 0.066,
17
  "eval_steps_per_second": 0.006,
18
  "step": 4
19
  },
20
  {
21
+ "epoch": 1.08,
22
+ "eval_accuracy": 0.4782608695652174,
23
+ "eval_loss": 1.644978404045105,
24
+ "eval_runtime": 176.6998,
25
  "eval_samples_per_second": 0.068,
26
  "eval_steps_per_second": 0.006,
27
  "step": 8
28
  },
29
  {
30
+ "epoch": 2.04,
31
+ "learning_rate": 4.4444444444444447e-05,
32
+ "loss": 1.6076,
33
  "step": 10
34
  },
35
  {
36
+ "epoch": 2.08,
37
+ "eval_accuracy": 0.5652173913043478,
38
+ "eval_loss": 1.420976996421814,
39
+ "eval_runtime": 175.9453,
40
  "eval_samples_per_second": 0.068,
41
  "eval_steps_per_second": 0.006,
42
  "step": 12
43
  },
44
  {
45
+ "epoch": 3.08,
46
+ "eval_accuracy": 0.6086956521739131,
47
+ "eval_loss": 1.1925344467163086,
48
+ "eval_runtime": 176.0087,
49
+ "eval_samples_per_second": 0.068,
50
  "eval_steps_per_second": 0.006,
51
  "step": 16
52
  },
53
  {
54
+ "epoch": 4.08,
55
+ "learning_rate": 3.3333333333333335e-05,
56
+ "loss": 1.0244,
57
  "step": 20
58
  },
59
  {
60
+ "epoch": 4.08,
61
+ "eval_accuracy": 0.6086956521739131,
62
+ "eval_loss": 1.1086814403533936,
63
+ "eval_runtime": 175.4334,
64
  "eval_samples_per_second": 0.068,
65
  "eval_steps_per_second": 0.006,
66
  "step": 20
67
  },
68
  {
69
+ "epoch": 5.08,
70
+ "eval_accuracy": 0.5652173913043478,
71
+ "eval_loss": 0.9823909401893616,
72
+ "eval_runtime": 150.4209,
73
+ "eval_samples_per_second": 0.08,
74
+ "eval_steps_per_second": 0.007,
75
+ "step": 24
76
+ },
77
+ {
78
+ "epoch": 6.08,
79
+ "eval_accuracy": 0.5217391304347826,
80
+ "eval_loss": 1.0296951532363892,
81
+ "eval_runtime": 150.2481,
82
+ "eval_samples_per_second": 0.08,
83
+ "eval_steps_per_second": 0.007,
84
+ "step": 28
85
+ },
86
+ {
87
+ "epoch": 7.04,
88
+ "learning_rate": 2.2222222222222223e-05,
89
+ "loss": 0.9684,
90
+ "step": 30
91
+ },
92
+ {
93
+ "epoch": 7.08,
94
+ "eval_accuracy": 0.6521739130434783,
95
+ "eval_loss": 1.0348024368286133,
96
+ "eval_runtime": 149.9139,
97
+ "eval_samples_per_second": 0.08,
98
+ "eval_steps_per_second": 0.007,
99
+ "step": 32
100
+ },
101
+ {
102
+ "epoch": 8.08,
103
+ "eval_accuracy": 0.6521739130434783,
104
+ "eval_loss": 0.9425884485244751,
105
+ "eval_runtime": 149.1356,
106
+ "eval_samples_per_second": 0.08,
107
+ "eval_steps_per_second": 0.007,
108
+ "step": 36
109
+ },
110
+ {
111
+ "epoch": 9.08,
112
+ "learning_rate": 1.1111111111111112e-05,
113
+ "loss": 0.7826,
114
+ "step": 40
115
+ },
116
+ {
117
+ "epoch": 9.08,
118
+ "eval_accuracy": 0.6086956521739131,
119
+ "eval_loss": 1.0070533752441406,
120
+ "eval_runtime": 148.8072,
121
+ "eval_samples_per_second": 0.081,
122
+ "eval_steps_per_second": 0.007,
123
+ "step": 40
124
+ },
125
+ {
126
+ "epoch": 10.08,
127
+ "eval_accuracy": 0.6086956521739131,
128
+ "eval_loss": 0.9810559749603271,
129
+ "eval_runtime": 151.9451,
130
+ "eval_samples_per_second": 0.079,
131
+ "eval_steps_per_second": 0.007,
132
+ "step": 44
133
+ },
134
+ {
135
+ "epoch": 11.08,
136
+ "eval_accuracy": 0.6086956521739131,
137
+ "eval_loss": 0.9039665460586548,
138
+ "eval_runtime": 153.6996,
139
+ "eval_samples_per_second": 0.078,
140
+ "eval_steps_per_second": 0.007,
141
+ "step": 48
142
+ },
143
+ {
144
+ "epoch": 12.04,
145
+ "learning_rate": 0.0,
146
+ "loss": 0.7829,
147
+ "step": 50
148
+ },
149
+ {
150
+ "epoch": 12.04,
151
+ "eval_accuracy": 0.6086956521739131,
152
+ "eval_loss": 0.8987236022949219,
153
+ "eval_runtime": 154.4435,
154
+ "eval_samples_per_second": 0.078,
155
+ "eval_steps_per_second": 0.006,
156
+ "step": 50
157
+ },
158
+ {
159
+ "epoch": 12.04,
160
+ "step": 50,
161
+ "total_flos": 7.875408929100923e+17,
162
+ "train_loss": 1.0331808185577394,
163
+ "train_runtime": 9247.5358,
164
+ "train_samples_per_second": 0.087,
165
  "train_steps_per_second": 0.005
166
  },
167
  {
168
+ "epoch": 12.04,
169
+ "eval_accuracy": 0.6176470588235294,
170
+ "eval_loss": 0.9771482944488525,
171
+ "eval_runtime": 215.9095,
172
+ "eval_samples_per_second": 0.079,
173
+ "eval_steps_per_second": 0.009,
174
+ "step": 50
175
  },
176
  {
177
+ "epoch": 12.04,
178
+ "eval_accuracy": 0.6176470588235294,
179
+ "eval_loss": 1.001463770866394,
180
+ "eval_runtime": 216.1108,
181
+ "eval_samples_per_second": 0.079,
182
  "eval_steps_per_second": 0.009,
183
+ "step": 50
184
  }
185
  ],
186
  "logging_steps": 10,
187
+ "max_steps": 50,
188
  "num_train_epochs": 9223372036854775807,
189
  "save_steps": 500,
190
+ "total_flos": 7.875408929100923e+17,
191
  "trial_name": null,
192
  "trial_params": null
193
  }