bombshelll commited on
Commit
4ff88ba
·
verified ·
1 Parent(s): de9e335

End of training

Browse files
Files changed (4) hide show
  1. all_results.json +11 -11
  2. eval_results.json +6 -6
  3. train_results.json +6 -6
  4. trainer_state.json +37 -28
all_results.json CHANGED
@@ -1,13 +1,13 @@
1
  {
2
- "epoch": 2.888888888888889,
3
- "eval_accuracy": 0.9841269841269841,
4
- "eval_loss": 0.20399044454097748,
5
- "eval_runtime": 0.3813,
6
- "eval_samples_per_second": 165.246,
7
- "eval_steps_per_second": 5.246,
8
- "total_flos": 4.228121867100365e+16,
9
- "train_loss": 0.7618867800785944,
10
- "train_runtime": 21.7408,
11
- "train_samples_per_second": 130.4,
12
- "train_steps_per_second": 0.92
13
  }
 
1
  {
2
+ "epoch": 4.0,
3
+ "eval_accuracy": 1.0,
4
+ "eval_loss": 0.19110850989818573,
5
+ "eval_runtime": 0.3814,
6
+ "eval_samples_per_second": 165.197,
7
+ "eval_steps_per_second": 5.244,
8
+ "total_flos": 5.637495822800486e+16,
9
+ "train_loss": 0.6830070416132609,
10
+ "train_runtime": 28.7573,
11
+ "train_samples_per_second": 98.584,
12
+ "train_steps_per_second": 0.695
13
  }
eval_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 2.888888888888889,
3
- "eval_accuracy": 0.9841269841269841,
4
- "eval_loss": 0.20399044454097748,
5
- "eval_runtime": 0.3813,
6
- "eval_samples_per_second": 165.246,
7
- "eval_steps_per_second": 5.246
8
  }
 
1
  {
2
+ "epoch": 4.0,
3
+ "eval_accuracy": 1.0,
4
+ "eval_loss": 0.19110850989818573,
5
+ "eval_runtime": 0.3814,
6
+ "eval_samples_per_second": 165.197,
7
+ "eval_steps_per_second": 5.244
8
  }
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 2.888888888888889,
3
- "total_flos": 4.228121867100365e+16,
4
- "train_loss": 0.7618867800785944,
5
- "train_runtime": 21.7408,
6
- "train_samples_per_second": 130.4,
7
- "train_steps_per_second": 0.92
8
  }
 
1
  {
2
+ "epoch": 4.0,
3
+ "total_flos": 5.637495822800486e+16,
4
+ "train_loss": 0.6830070416132609,
5
+ "train_runtime": 28.7573,
6
+ "train_samples_per_second": 98.584,
7
+ "train_steps_per_second": 0.695
8
  }
trainer_state.json CHANGED
@@ -1,55 +1,64 @@
1
  {
2
- "best_metric": 0.9841269841269841,
3
- "best_model_checkpoint": "/kaggle/working/swin-brain-plane-classification/checkpoint-13",
4
- "epoch": 2.888888888888889,
5
  "eval_steps": 500,
6
- "global_step": 13,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
  "epoch": 0.8888888888888888,
13
- "eval_accuracy": 0.8095238095238095,
14
- "eval_loss": 0.743109405040741,
15
- "eval_runtime": 0.3713,
16
- "eval_samples_per_second": 169.663,
17
- "eval_steps_per_second": 5.386,
18
  "step": 4
19
  },
20
  {
21
  "epoch": 2.0,
22
  "eval_accuracy": 0.9682539682539683,
23
- "eval_loss": 0.3612231910228729,
24
- "eval_runtime": 0.3697,
25
- "eval_samples_per_second": 170.43,
26
- "eval_steps_per_second": 5.41,
27
  "step": 9
28
  },
29
  {
30
  "epoch": 2.2222222222222223,
31
- "grad_norm": 6.062853813171387,
32
  "learning_rate": 2.777777777777778e-05,
33
- "loss": 0.8237,
34
  "step": 10
35
  },
36
  {
37
  "epoch": 2.888888888888889,
38
- "eval_accuracy": 0.9841269841269841,
39
- "eval_loss": 0.20399044454097748,
40
- "eval_runtime": 0.3636,
41
- "eval_samples_per_second": 173.264,
42
- "eval_steps_per_second": 5.5,
43
  "step": 13
44
  },
45
  {
46
- "epoch": 2.888888888888889,
47
- "step": 13,
48
- "total_flos": 4.228121867100365e+16,
49
- "train_loss": 0.7618867800785944,
50
- "train_runtime": 21.7408,
51
- "train_samples_per_second": 130.4,
52
- "train_steps_per_second": 0.92
 
 
 
 
 
 
 
 
 
53
  }
54
  ],
55
  "logging_steps": 10,
@@ -78,7 +87,7 @@
78
  "attributes": {}
79
  }
80
  },
81
- "total_flos": 4.228121867100365e+16,
82
  "train_batch_size": 32,
83
  "trial_name": null,
84
  "trial_params": null
 
1
  {
2
+ "best_metric": 1.0,
3
+ "best_model_checkpoint": "/kaggle/working/swin-brain-plane-classification/checkpoint-18",
4
+ "epoch": 4.0,
5
  "eval_steps": 500,
6
+ "global_step": 18,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
  "epoch": 0.8888888888888888,
13
+ "eval_accuracy": 0.9047619047619048,
14
+ "eval_loss": 0.8267417550086975,
15
+ "eval_runtime": 0.3659,
16
+ "eval_samples_per_second": 172.198,
17
+ "eval_steps_per_second": 5.467,
18
  "step": 4
19
  },
20
  {
21
  "epoch": 2.0,
22
  "eval_accuracy": 0.9682539682539683,
23
+ "eval_loss": 0.45388203859329224,
24
+ "eval_runtime": 0.3836,
25
+ "eval_samples_per_second": 164.226,
26
+ "eval_steps_per_second": 5.214,
27
  "step": 9
28
  },
29
  {
30
  "epoch": 2.2222222222222223,
31
+ "grad_norm": 19.5561466217041,
32
  "learning_rate": 2.777777777777778e-05,
33
+ "loss": 0.8656,
34
  "step": 10
35
  },
36
  {
37
  "epoch": 2.888888888888889,
38
+ "eval_accuracy": 0.9682539682539683,
39
+ "eval_loss": 0.30353549122810364,
40
+ "eval_runtime": 0.368,
41
+ "eval_samples_per_second": 171.182,
42
+ "eval_steps_per_second": 5.434,
43
  "step": 13
44
  },
45
  {
46
+ "epoch": 4.0,
47
+ "eval_accuracy": 1.0,
48
+ "eval_loss": 0.19110850989818573,
49
+ "eval_runtime": 0.3651,
50
+ "eval_samples_per_second": 172.56,
51
+ "eval_steps_per_second": 5.478,
52
+ "step": 18
53
+ },
54
+ {
55
+ "epoch": 4.0,
56
+ "step": 18,
57
+ "total_flos": 5.637495822800486e+16,
58
+ "train_loss": 0.6830070416132609,
59
+ "train_runtime": 28.7573,
60
+ "train_samples_per_second": 98.584,
61
+ "train_steps_per_second": 0.695
62
  }
63
  ],
64
  "logging_steps": 10,
 
87
  "attributes": {}
88
  }
89
  },
90
+ "total_flos": 5.637495822800486e+16,
91
  "train_batch_size": 32,
92
  "trial_name": null,
93
  "trial_params": null