Robys01 committed on
Commit
cb812f2
·
verified ·
1 Parent(s): f49fff2

Upload folder using huggingface_hub

Browse files
checkpoint-1200/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:880fe2c9c38252240def486ab1893b1f5454a7139a66459fdbd67da86200bf6f
3
  size 343288572
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:773dca78e04e7c2fdd11828420779a1f50397cbc9f2eb98691641a8aa2f27a5b
3
  size 343288572
checkpoint-1200/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ca163c50d41a93fca24af63248a4286c375d15f0e13d88e2125e32fdb61dd333
3
  size 686698042
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6fb9b7ead2df23a4abcdfbb4637b532943589ef1ded161f8234644399f295802
3
  size 686698042
checkpoint-1200/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:95a3f0e754f92a9ba4f39927b560b1936de6e9d302ea80e42362dd4a3873b661
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b98e8f37e9b343024a717f1b1f96812e3aa6a92d57a322e15eb2f0fe34aaa0ad
3
  size 14244
checkpoint-1200/trainer_state.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "best_metric": 1.7509504556655884,
3
  "best_model_checkpoint": "facial_age_estimator/checkpoint-1200",
4
  "epoch": 10.0,
5
  "eval_steps": 500,
@@ -10,106 +10,106 @@
10
  "log_history": [
11
  {
12
  "epoch": 1.0,
13
- "eval_accuracy": 0.3799237611181703,
14
- "eval_loss": 2.010244131088257,
15
- "eval_runtime": 89.3663,
16
- "eval_samples_per_second": 114.484,
17
- "eval_steps_per_second": 1.79,
18
  "step": 120
19
  },
20
  {
21
  "epoch": 2.0,
22
- "eval_accuracy": 0.39390088945362134,
23
- "eval_loss": 1.9449316263198853,
24
- "eval_runtime": 89.1195,
25
- "eval_samples_per_second": 114.801,
26
- "eval_steps_per_second": 1.795,
27
  "step": 240
28
  },
29
  {
30
  "epoch": 3.0,
31
- "eval_accuracy": 0.41237415697390284,
32
- "eval_loss": 1.8914791345596313,
33
- "eval_runtime": 89.0642,
34
- "eval_samples_per_second": 114.872,
35
- "eval_steps_per_second": 1.796,
36
  "step": 360
37
  },
38
  {
39
  "epoch": 4.0,
40
- "eval_accuracy": 0.4054344638842733,
41
- "eval_loss": 1.8564153909683228,
42
- "eval_runtime": 89.6525,
43
- "eval_samples_per_second": 114.118,
44
- "eval_steps_per_second": 1.785,
45
  "step": 480
46
  },
47
  {
48
  "epoch": 4.166666666666667,
49
- "grad_norm": 3.723311424255371,
50
  "learning_rate": 6.086956521739132e-06,
51
- "loss": 1.8165,
52
  "step": 500
53
  },
54
  {
55
  "epoch": 5.0,
56
- "eval_accuracy": 0.41325383637963053,
57
- "eval_loss": 1.8217633962631226,
58
- "eval_runtime": 89.4594,
59
- "eval_samples_per_second": 114.365,
60
- "eval_steps_per_second": 1.789,
61
  "step": 600
62
  },
63
  {
64
  "epoch": 6.0,
65
- "eval_accuracy": 0.4161861010653895,
66
- "eval_loss": 1.7974796295166016,
67
- "eval_runtime": 90.6881,
68
- "eval_samples_per_second": 112.815,
69
- "eval_steps_per_second": 1.764,
70
  "step": 720
71
  },
72
  {
73
  "epoch": 7.0,
74
- "eval_accuracy": 0.41872739712638063,
75
- "eval_loss": 1.7807412147521973,
76
- "eval_runtime": 89.7218,
77
- "eval_samples_per_second": 114.03,
78
- "eval_steps_per_second": 1.783,
79
  "step": 840
80
  },
81
  {
82
  "epoch": 8.0,
83
- "eval_accuracy": 0.4264490274655459,
84
- "eval_loss": 1.764231562614441,
85
- "eval_runtime": 90.0605,
86
- "eval_samples_per_second": 113.601,
87
- "eval_steps_per_second": 1.777,
88
  "step": 960
89
  },
90
  {
91
  "epoch": 8.333333333333334,
92
- "grad_norm": 2.656496286392212,
93
  "learning_rate": 1.7391304347826088e-06,
94
- "loss": 1.624,
95
  "step": 1000
96
  },
97
  {
98
  "epoch": 9.0,
99
- "eval_accuracy": 0.4291858078389209,
100
- "eval_loss": 1.75428307056427,
101
- "eval_runtime": 89.3673,
102
- "eval_samples_per_second": 114.483,
103
- "eval_steps_per_second": 1.79,
104
  "step": 1080
105
  },
106
  {
107
  "epoch": 10.0,
108
- "eval_accuracy": 0.4270354804026977,
109
- "eval_loss": 1.7509504556655884,
110
- "eval_runtime": 88.7685,
111
- "eval_samples_per_second": 115.255,
112
- "eval_steps_per_second": 1.802,
113
  "step": 1200
114
  }
115
  ],
@@ -130,7 +130,7 @@
130
  "attributes": {}
131
  }
132
  },
133
- "total_flos": 1.1893383914511053e+19,
134
  "train_batch_size": 128,
135
  "trial_name": null,
136
  "trial_params": null
 
1
  {
2
+ "best_metric": 1.5165716409683228,
3
  "best_model_checkpoint": "facial_age_estimator/checkpoint-1200",
4
  "epoch": 10.0,
5
  "eval_steps": 500,
 
10
  "log_history": [
11
  {
12
  "epoch": 1.0,
13
+ "eval_accuracy": 0.4476590753592024,
14
+ "eval_loss": 1.694000482559204,
15
+ "eval_runtime": 87.798,
16
+ "eval_samples_per_second": 116.529,
17
+ "eval_steps_per_second": 1.822,
18
  "step": 120
19
  },
20
  {
21
  "epoch": 2.0,
22
+ "eval_accuracy": 0.4534258625745284,
23
+ "eval_loss": 1.654381275177002,
24
+ "eval_runtime": 87.4351,
25
+ "eval_samples_per_second": 117.013,
26
+ "eval_steps_per_second": 1.83,
27
  "step": 240
28
  },
29
  {
30
  "epoch": 3.0,
31
+ "eval_accuracy": 0.4608542664451178,
32
+ "eval_loss": 1.618933081626892,
33
+ "eval_runtime": 87.806,
34
+ "eval_samples_per_second": 116.518,
35
+ "eval_steps_per_second": 1.822,
36
  "step": 360
37
  },
38
  {
39
  "epoch": 4.0,
40
+ "eval_accuracy": 0.4673052487537875,
41
+ "eval_loss": 1.6022893190383911,
42
+ "eval_runtime": 87.7995,
43
+ "eval_samples_per_second": 116.527,
44
+ "eval_steps_per_second": 1.822,
45
  "step": 480
46
  },
47
  {
48
  "epoch": 4.166666666666667,
49
+ "grad_norm": 3.601428747177124,
50
  "learning_rate": 6.086956521739132e-06,
51
+ "loss": 1.5209,
52
  "step": 500
53
  },
54
  {
55
  "epoch": 5.0,
56
+ "eval_accuracy": 0.47023751343954645,
57
+ "eval_loss": 1.572880744934082,
58
+ "eval_runtime": 88.2571,
59
+ "eval_samples_per_second": 115.923,
60
+ "eval_steps_per_second": 1.813,
61
  "step": 600
62
  },
63
  {
64
  "epoch": 6.0,
65
+ "eval_accuracy": 0.4768839800606001,
66
+ "eval_loss": 1.5591648817062378,
67
+ "eval_runtime": 87.4224,
68
+ "eval_samples_per_second": 117.03,
69
+ "eval_steps_per_second": 1.83,
70
  "step": 720
71
  },
72
  {
73
  "epoch": 7.0,
74
+ "eval_accuracy": 0.4815756035578145,
75
+ "eval_loss": 1.5406521558761597,
76
+ "eval_runtime": 87.5838,
77
+ "eval_samples_per_second": 116.814,
78
+ "eval_steps_per_second": 1.827,
79
  "step": 840
80
  },
81
  {
82
  "epoch": 8.0,
83
+ "eval_accuracy": 0.48138011924543056,
84
+ "eval_loss": 1.5303517580032349,
85
+ "eval_runtime": 87.3649,
86
+ "eval_samples_per_second": 117.107,
87
+ "eval_steps_per_second": 1.831,
88
  "step": 960
89
  },
90
  {
91
  "epoch": 8.333333333333334,
92
+ "grad_norm": 4.306453227996826,
93
  "learning_rate": 1.7391304347826088e-06,
94
+ "loss": 1.369,
95
  "step": 1000
96
  },
97
  {
98
  "epoch": 9.0,
99
+ "eval_accuracy": 0.4878311015541003,
100
+ "eval_loss": 1.51864492893219,
101
+ "eval_runtime": 88.2907,
102
+ "eval_samples_per_second": 115.879,
103
+ "eval_steps_per_second": 1.812,
104
  "step": 1080
105
  },
106
  {
107
  "epoch": 10.0,
108
+ "eval_accuracy": 0.49086110839605124,
109
+ "eval_loss": 1.5165716409683228,
110
+ "eval_runtime": 87.8471,
111
+ "eval_samples_per_second": 116.464,
112
+ "eval_steps_per_second": 1.821,
113
  "step": 1200
114
  }
115
  ],
 
130
  "attributes": {}
131
  }
132
  },
133
+ "total_flos": 1.2071959063022186e+19,
134
  "train_batch_size": 128,
135
  "trial_name": null,
136
  "trial_params": null
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:880fe2c9c38252240def486ab1893b1f5454a7139a66459fdbd67da86200bf6f
3
  size 343288572
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:773dca78e04e7c2fdd11828420779a1f50397cbc9f2eb98691641a8aa2f27a5b
3
  size 343288572