bombshelll committed on
Commit
32e9c5c
·
verified ·
1 Parent(s): dfb7b4e

End of training

Browse files
Files changed (4) hide show
  1. all_results.json +11 -11
  2. eval_results.json +6 -6
  3. train_results.json +6 -6
  4. trainer_state.json +81 -38
all_results.json CHANGED
@@ -1,13 +1,13 @@
1
  {
2
- "epoch": 2.0,
3
- "eval_accuracy": 0.9904761904761905,
4
- "eval_loss": 0.017159689217805862,
5
- "eval_runtime": 1.7705,
6
- "eval_samples_per_second": 118.612,
7
- "eval_steps_per_second": 3.954,
8
- "total_flos": 9.395826371334144e+16,
9
- "train_loss": 0.323590816060702,
10
- "train_runtime": 55.2419,
11
- "train_samples_per_second": 171.066,
12
- "train_steps_per_second": 1.358
13
  }
 
1
  {
2
+ "epoch": 6.0,
3
+ "eval_accuracy": 1.0,
4
+ "eval_loss": 0.03769616782665253,
5
+ "eval_runtime": 0.946,
6
+ "eval_samples_per_second": 112.046,
7
+ "eval_steps_per_second": 4.228,
8
+ "total_flos": 1.4153791066361856e+17,
9
+ "train_loss": 0.4622622158792284,
10
+ "train_runtime": 90.8298,
11
+ "train_samples_per_second": 208.962,
12
+ "train_steps_per_second": 1.541
13
  }
eval_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 2.0,
3
- "eval_accuracy": 0.9904761904761905,
4
- "eval_loss": 0.017159689217805862,
5
- "eval_runtime": 1.7705,
6
- "eval_samples_per_second": 118.612,
7
- "eval_steps_per_second": 3.954
8
  }
 
1
  {
2
+ "epoch": 6.0,
3
+ "eval_accuracy": 1.0,
4
+ "eval_loss": 0.03769616782665253,
5
+ "eval_runtime": 0.946,
6
+ "eval_samples_per_second": 112.046,
7
+ "eval_steps_per_second": 4.228
8
  }
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 2.0,
3
- "total_flos": 9.395826371334144e+16,
4
- "train_loss": 0.323590816060702,
5
- "train_runtime": 55.2419,
6
- "train_samples_per_second": 171.066,
7
- "train_steps_per_second": 1.358
8
  }
 
1
  {
2
+ "epoch": 6.0,
3
+ "total_flos": 1.4153791066361856e+17,
4
+ "train_loss": 0.4622622158792284,
5
+ "train_runtime": 90.8298,
6
+ "train_samples_per_second": 208.962,
7
+ "train_steps_per_second": 1.541
8
  }
trainer_state.json CHANGED
@@ -1,66 +1,109 @@
1
  {
2
- "best_metric": 0.9904761904761905,
3
- "best_model_checkpoint": "/kaggle/working/swin-brain-modality-classification/checkpoint-30",
4
- "epoch": 2.0,
5
  "eval_steps": 500,
6
- "global_step": 30,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
- "epoch": 0.6666666666666666,
13
- "grad_norm": 5.664389610290527,
14
- "learning_rate": 4.850746268656717e-05,
15
- "loss": 0.803,
 
 
 
 
 
 
 
 
 
16
  "step": 10
17
  },
18
  {
19
- "epoch": 1.0,
20
- "eval_accuracy": 0.9619047619047619,
21
- "eval_loss": 0.1342908889055252,
22
- "eval_runtime": 1.7227,
23
- "eval_samples_per_second": 121.902,
24
- "eval_steps_per_second": 4.063,
25
  "step": 15
26
  },
27
  {
28
- "epoch": 1.3333333333333333,
29
- "grad_norm": 3.640326976776123,
30
- "learning_rate": 4.104477611940299e-05,
31
- "loss": 0.1269,
32
  "step": 20
33
  },
34
  {
35
- "epoch": 2.0,
36
- "grad_norm": 1.9675283432006836,
37
- "learning_rate": 3.358208955223881e-05,
38
- "loss": 0.0409,
 
 
 
 
 
 
 
 
 
39
  "step": 30
40
  },
41
  {
42
- "epoch": 2.0,
43
- "eval_accuracy": 0.9904761904761905,
44
- "eval_loss": 0.017159689217805862,
45
- "eval_runtime": 1.722,
46
- "eval_samples_per_second": 121.952,
47
- "eval_steps_per_second": 4.065,
48
  "step": 30
49
  },
50
  {
51
- "epoch": 2.0,
52
- "step": 30,
53
- "total_flos": 9.395826371334144e+16,
54
- "train_loss": 0.323590816060702,
55
- "train_runtime": 55.2419,
56
- "train_samples_per_second": 171.066,
57
- "train_steps_per_second": 1.358
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
58
  }
59
  ],
60
  "logging_steps": 10,
61
- "max_steps": 75,
62
  "num_input_tokens_seen": 0,
63
- "num_train_epochs": 5,
64
  "save_steps": 500,
65
  "stateful_callbacks": {
66
  "CustomEarlyStoppingCallback": {
@@ -83,7 +126,7 @@
83
  "attributes": {}
84
  }
85
  },
86
- "total_flos": 9.395826371334144e+16,
87
  "train_batch_size": 32,
88
  "trial_name": null,
89
  "trial_params": null
 
1
  {
2
+ "best_metric": 1.0,
3
+ "best_model_checkpoint": "/kaggle/working/swin-brain-modality-classification/checkpoint-45",
4
+ "epoch": 6.0,
5
  "eval_steps": 500,
6
+ "global_step": 45,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
+ "epoch": 0.9333333333333333,
13
+ "eval_accuracy": 0.6415094339622641,
14
+ "eval_loss": 1.0901466608047485,
15
+ "eval_runtime": 1.0666,
16
+ "eval_samples_per_second": 99.379,
17
+ "eval_steps_per_second": 3.75,
18
+ "step": 7
19
+ },
20
+ {
21
+ "epoch": 1.3333333333333333,
22
+ "grad_norm": 5.982262134552002,
23
+ "learning_rate": 3.571428571428572e-05,
24
+ "loss": 1.2435,
25
  "step": 10
26
  },
27
  {
28
+ "epoch": 2.0,
29
+ "eval_accuracy": 0.8584905660377359,
30
+ "eval_loss": 0.42658886313438416,
31
+ "eval_runtime": 0.9395,
32
+ "eval_samples_per_second": 112.826,
33
+ "eval_steps_per_second": 4.258,
34
  "step": 15
35
  },
36
  {
37
+ "epoch": 2.6666666666666665,
38
+ "grad_norm": 8.782153129577637,
39
+ "learning_rate": 4.761904761904762e-05,
40
+ "loss": 0.5378,
41
  "step": 20
42
  },
43
  {
44
+ "epoch": 2.9333333333333336,
45
+ "eval_accuracy": 0.9528301886792453,
46
+ "eval_loss": 0.15236791968345642,
47
+ "eval_runtime": 0.9334,
48
+ "eval_samples_per_second": 113.563,
49
+ "eval_steps_per_second": 4.285,
50
+ "step": 22
51
+ },
52
+ {
53
+ "epoch": 4.0,
54
+ "grad_norm": 5.220347881317139,
55
+ "learning_rate": 4.3650793650793655e-05,
56
+ "loss": 0.1747,
57
  "step": 30
58
  },
59
  {
60
+ "epoch": 4.0,
61
+ "eval_accuracy": 0.9716981132075472,
62
+ "eval_loss": 0.07465644180774689,
63
+ "eval_runtime": 0.9385,
64
+ "eval_samples_per_second": 112.947,
65
+ "eval_steps_per_second": 4.262,
66
  "step": 30
67
  },
68
  {
69
+ "epoch": 4.933333333333334,
70
+ "eval_accuracy": 0.9622641509433962,
71
+ "eval_loss": 0.08645126223564148,
72
+ "eval_runtime": 0.9952,
73
+ "eval_samples_per_second": 106.514,
74
+ "eval_steps_per_second": 4.019,
75
+ "step": 37
76
+ },
77
+ {
78
+ "epoch": 5.333333333333333,
79
+ "grad_norm": 5.531038761138916,
80
+ "learning_rate": 3.968253968253968e-05,
81
+ "loss": 0.0905,
82
+ "step": 40
83
+ },
84
+ {
85
+ "epoch": 6.0,
86
+ "eval_accuracy": 1.0,
87
+ "eval_loss": 0.03769616782665253,
88
+ "eval_runtime": 1.0531,
89
+ "eval_samples_per_second": 100.657,
90
+ "eval_steps_per_second": 3.798,
91
+ "step": 45
92
+ },
93
+ {
94
+ "epoch": 6.0,
95
+ "step": 45,
96
+ "total_flos": 1.4153791066361856e+17,
97
+ "train_loss": 0.4622622158792284,
98
+ "train_runtime": 90.8298,
99
+ "train_samples_per_second": 208.962,
100
+ "train_steps_per_second": 1.541
101
  }
102
  ],
103
  "logging_steps": 10,
104
+ "max_steps": 140,
105
  "num_input_tokens_seen": 0,
106
+ "num_train_epochs": 20,
107
  "save_steps": 500,
108
  "stateful_callbacks": {
109
  "CustomEarlyStoppingCallback": {
 
126
  "attributes": {}
127
  }
128
  },
129
+ "total_flos": 1.4153791066361856e+17,
130
  "train_batch_size": 32,
131
  "trial_name": null,
132
  "trial_params": null