example404 committed on
Commit
7e947fa
·
1 Parent(s): 7b145cf

End of training

Browse files
all_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 3.16,
3
- "eval_accuracy": 0.26691838512924776,
4
- "eval_loss": 1.1199040412902832,
5
- "eval_runtime": 8842.1517,
6
- "eval_samples_per_second": 0.389,
7
- "eval_steps_per_second": 0.049
8
  }
 
1
  {
2
+ "epoch": 8.1,
3
+ "eval_accuracy": 0.21347661922741795,
4
+ "eval_loss": 1.1585432291030884,
5
+ "eval_runtime": 9824.635,
6
+ "eval_samples_per_second": 0.35,
7
+ "eval_steps_per_second": 0.044
8
  }
runs/Dec14_16-08-17_phillips-personal-workstation/events.out.tfevents.1702644464.phillips-personal-workstation.87918.1 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c4c32818da00e6d865919b06d6dbb0ec935c54a0ae62c56baa863264ec3681b8
3
- size 357
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7b910f9ae588db72fb384f7c41a12138ab3812576c7a31b5ef14a2bd0b4c0cba
3
+ size 674
test_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 3.16,
3
- "eval_accuracy": 0.26691838512924776,
4
- "eval_loss": 1.1199040412902832,
5
- "eval_runtime": 8842.1517,
6
- "eval_samples_per_second": 0.389,
7
- "eval_steps_per_second": 0.049
8
  }
 
1
  {
2
+ "epoch": 8.1,
3
+ "eval_accuracy": 0.21347661922741795,
4
+ "eval_loss": 1.1585432291030884,
5
+ "eval_runtime": 9824.635,
6
+ "eval_samples_per_second": 0.35,
7
+ "eval_steps_per_second": 0.044
8
  }
trainer_state.json CHANGED
@@ -1,97 +1,172 @@
1
  {
2
- "best_metric": 0.4974337040205304,
3
- "best_model_checkpoint": "videomae-base-finetuned-ucf101-subset/checkpoint-32",
4
- "epoch": 3.15625,
5
- "global_step": 32,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
- "epoch": 0.28,
12
- "eval_accuracy": 0.3678357570573139,
13
- "eval_loss": 1.1095340251922607,
14
- "eval_runtime": 6781.1418,
15
- "eval_samples_per_second": 0.345,
16
- "eval_steps_per_second": 0.043,
17
  "step": 9
18
  },
19
  {
20
- "epoch": 1.03,
21
- "learning_rate": 3.928571428571429e-05,
22
- "loss": 1.1547,
23
  "step": 10
24
  },
25
  {
26
- "epoch": 1.28,
27
- "eval_accuracy": 0.25149700598802394,
28
- "eval_loss": 1.0840415954589844,
29
- "eval_runtime": 6565.429,
30
- "eval_samples_per_second": 0.356,
31
- "eval_steps_per_second": 0.045,
32
  "step": 18
33
  },
34
  {
35
- "epoch": 2.06,
36
- "learning_rate": 2.1428571428571428e-05,
37
- "loss": 1.0917,
38
  "step": 20
39
  },
40
  {
41
- "epoch": 2.28,
42
- "eval_accuracy": 0.48545765611633873,
43
- "eval_loss": 1.037040114402771,
44
- "eval_runtime": 6528.1498,
45
- "eval_samples_per_second": 0.358,
46
  "eval_steps_per_second": 0.045,
47
  "step": 27
48
  },
49
  {
50
- "epoch": 3.09,
51
- "learning_rate": 3.5714285714285714e-06,
52
- "loss": 1.0976,
53
  "step": 30
54
  },
55
  {
56
- "epoch": 3.16,
57
- "eval_accuracy": 0.4974337040205304,
58
- "eval_loss": 1.0295767784118652,
59
- "eval_runtime": 6784.8017,
60
  "eval_samples_per_second": 0.345,
61
  "eval_steps_per_second": 0.043,
62
- "step": 32
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
63
  },
64
  {
65
- "epoch": 3.16,
66
- "step": 32,
67
- "total_flos": 2.9282778998194176e+17,
68
- "train_loss": 1.1151684671640396,
69
- "train_runtime": 29569.9652,
 
 
 
 
 
 
 
 
 
70
  "train_samples_per_second": 0.009,
71
  "train_steps_per_second": 0.001
72
  },
73
  {
74
- "epoch": 3.16,
75
- "eval_accuracy": 0.26691838512924776,
76
- "eval_loss": 1.1199040412902832,
77
- "eval_runtime": 9068.5155,
78
- "eval_samples_per_second": 0.38,
79
- "eval_steps_per_second": 0.048,
80
- "step": 32
81
  },
82
  {
83
- "epoch": 3.16,
84
- "eval_accuracy": 0.26691838512924776,
85
- "eval_loss": 1.1199040412902832,
86
- "eval_runtime": 8842.1517,
87
- "eval_samples_per_second": 0.389,
88
- "eval_steps_per_second": 0.049,
89
- "step": 32
90
  }
91
  ],
92
- "max_steps": 32,
93
  "num_train_epochs": 9223372036854775807,
94
- "total_flos": 2.9282778998194176e+17,
95
  "trial_name": null,
96
  "trial_params": null
97
  }
 
1
  {
2
+ "best_metric": 0.583404619332763,
3
+ "best_model_checkpoint": "videomae-base-finetuned-ucf101-subset/checkpoint-27",
4
+ "epoch": 8.1,
5
+ "global_step": 80,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
+ "epoch": 0.11,
12
+ "eval_accuracy": 0.3738237810094098,
13
+ "eval_loss": 1.1102712154388428,
14
+ "eval_runtime": 6904.9882,
15
+ "eval_samples_per_second": 0.339,
16
+ "eval_steps_per_second": 0.042,
17
  "step": 9
18
  },
19
  {
20
+ "epoch": 1.01,
21
+ "learning_rate": 4.8611111111111115e-05,
22
+ "loss": 1.1692,
23
  "step": 10
24
  },
25
  {
26
+ "epoch": 1.11,
27
+ "eval_accuracy": 0.2352437981180496,
28
+ "eval_loss": 1.1009142398834229,
29
+ "eval_runtime": 6655.1854,
30
+ "eval_samples_per_second": 0.351,
31
+ "eval_steps_per_second": 0.044,
32
  "step": 18
33
  },
34
  {
35
+ "epoch": 2.02,
36
+ "learning_rate": 4.166666666666667e-05,
37
+ "loss": 1.135,
38
  "step": 20
39
  },
40
  {
41
+ "epoch": 2.11,
42
+ "eval_accuracy": 0.583404619332763,
43
+ "eval_loss": 1.0518925189971924,
44
+ "eval_runtime": 6576.2685,
45
+ "eval_samples_per_second": 0.356,
46
  "eval_steps_per_second": 0.045,
47
  "step": 27
48
  },
49
  {
50
+ "epoch": 3.04,
51
+ "learning_rate": 3.472222222222222e-05,
52
+ "loss": 1.0973,
53
  "step": 30
54
  },
55
  {
56
+ "epoch": 3.11,
57
+ "eval_accuracy": 0.583404619332763,
58
+ "eval_loss": 1.0562057495117188,
59
+ "eval_runtime": 6783.3208,
60
  "eval_samples_per_second": 0.345,
61
  "eval_steps_per_second": 0.043,
62
+ "step": 36
63
+ },
64
+ {
65
+ "epoch": 4.05,
66
+ "learning_rate": 2.777777777777778e-05,
67
+ "loss": 1.0728,
68
+ "step": 40
69
+ },
70
+ {
71
+ "epoch": 4.11,
72
+ "eval_accuracy": 0.3857998289136014,
73
+ "eval_loss": 1.1006081104278564,
74
+ "eval_runtime": 6626.9958,
75
+ "eval_samples_per_second": 0.353,
76
+ "eval_steps_per_second": 0.044,
77
+ "step": 45
78
+ },
79
+ {
80
+ "epoch": 5.06,
81
+ "learning_rate": 2.0833333333333336e-05,
82
+ "loss": 1.052,
83
+ "step": 50
84
+ },
85
+ {
86
+ "epoch": 5.11,
87
+ "eval_accuracy": 0.24978614200171087,
88
+ "eval_loss": 1.1561808586120605,
89
+ "eval_runtime": 6687.7083,
90
+ "eval_samples_per_second": 0.35,
91
+ "eval_steps_per_second": 0.044,
92
+ "step": 54
93
+ },
94
+ {
95
+ "epoch": 6.08,
96
+ "learning_rate": 1.388888888888889e-05,
97
+ "loss": 1.0561,
98
+ "step": 60
99
+ },
100
+ {
101
+ "epoch": 6.11,
102
+ "eval_accuracy": 0.2356715141146279,
103
+ "eval_loss": 1.145110845565796,
104
+ "eval_runtime": 6713.3828,
105
+ "eval_samples_per_second": 0.348,
106
+ "eval_steps_per_second": 0.044,
107
+ "step": 63
108
+ },
109
+ {
110
+ "epoch": 7.09,
111
+ "learning_rate": 6.944444444444445e-06,
112
+ "loss": 1.021,
113
+ "step": 70
114
+ },
115
+ {
116
+ "epoch": 7.11,
117
+ "eval_accuracy": 0.2356715141146279,
118
+ "eval_loss": 1.147510051727295,
119
+ "eval_runtime": 6861.296,
120
+ "eval_samples_per_second": 0.341,
121
+ "eval_steps_per_second": 0.043,
122
+ "step": 72
123
+ },
124
+ {
125
+ "epoch": 8.1,
126
+ "learning_rate": 0.0,
127
+ "loss": 0.9696,
128
+ "step": 80
129
  },
130
  {
131
+ "epoch": 8.1,
132
+ "eval_accuracy": 0.25791274593669805,
133
+ "eval_loss": 1.1406161785125732,
134
+ "eval_runtime": 6748.1283,
135
+ "eval_samples_per_second": 0.346,
136
+ "eval_steps_per_second": 0.043,
137
+ "step": 80
138
+ },
139
+ {
140
+ "epoch": 8.1,
141
+ "step": 80,
142
+ "total_flos": 7.277082099976765e+17,
143
+ "train_loss": 1.0716288447380067,
144
+ "train_runtime": 67996.5245,
145
  "train_samples_per_second": 0.009,
146
  "train_steps_per_second": 0.001
147
  },
148
  {
149
+ "epoch": 8.1,
150
+ "eval_accuracy": 0.21347661922741795,
151
+ "eval_loss": 1.158543348312378,
152
+ "eval_runtime": 9929.4112,
153
+ "eval_samples_per_second": 0.347,
154
+ "eval_steps_per_second": 0.043,
155
+ "step": 80
156
  },
157
  {
158
+ "epoch": 8.1,
159
+ "eval_accuracy": 0.21347661922741795,
160
+ "eval_loss": 1.1585432291030884,
161
+ "eval_runtime": 9824.635,
162
+ "eval_samples_per_second": 0.35,
163
+ "eval_steps_per_second": 0.044,
164
+ "step": 80
165
  }
166
  ],
167
+ "max_steps": 80,
168
  "num_train_epochs": 9223372036854775807,
169
+ "total_flos": 7.277082099976765e+17,
170
  "trial_name": null,
171
  "trial_params": null
172
  }