arpanl committed on
Commit
d0b4626
·
verified ·
1 Parent(s): 92105f4

Training in progress, step 20

Browse files
all_results.json CHANGED
@@ -1,14 +1,14 @@
1
  {
2
  "epoch": 30.0,
3
- "eval_accuracy": 0.592,
4
- "eval_f1": 0.4602437417654809,
5
- "eval_loss": 0.8401041626930237,
6
- "eval_runtime": 130.3522,
7
- "eval_samples_per_second": 0.959,
8
- "eval_steps_per_second": 0.123,
9
  "total_flos": 2.907095595264e+17,
10
- "train_loss": 1.6994803905487061,
11
- "train_runtime": 10528.1678,
12
- "train_samples_per_second": 0.356,
13
- "train_steps_per_second": 0.011
14
  }
 
1
  {
2
  "epoch": 30.0,
3
+ "eval_accuracy": 0.608,
4
+ "eval_f1": 0.5096170704866357,
5
+ "eval_loss": 0.736162006855011,
6
+ "eval_runtime": 44.8107,
7
+ "eval_samples_per_second": 2.79,
8
+ "eval_steps_per_second": 0.357,
9
  "total_flos": 2.907095595264e+17,
10
+ "train_loss": 1.321283253033956,
11
+ "train_runtime": 2416.2795,
12
+ "train_samples_per_second": 1.552,
13
+ "train_steps_per_second": 0.05
14
  }
eval_results.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "epoch": 30.0,
3
- "eval_accuracy": 0.592,
4
- "eval_f1": 0.4602437417654809,
5
- "eval_loss": 0.8401041626930237,
6
- "eval_runtime": 130.3522,
7
- "eval_samples_per_second": 0.959,
8
- "eval_steps_per_second": 0.123
9
  }
 
1
  {
2
  "epoch": 30.0,
3
+ "eval_accuracy": 0.608,
4
+ "eval_f1": 0.5096170704866357,
5
+ "eval_loss": 0.736162006855011,
6
+ "eval_runtime": 44.8107,
7
+ "eval_samples_per_second": 2.79,
8
+ "eval_steps_per_second": 0.357
9
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e03496b8aa90189bc23efd44b1041370b4122b82f242ce16acd5fdb67f18732c
3
  size 343359328
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:93d51a216f8b7baad87599fc55a5a954339890cf705dbc6e4abbda8ba83f4590
3
  size 343359328
runs/Feb12_04-49-49_e7b40a5a562d/events.out.tfevents.1707715881.e7b40a5a562d.565.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2d6a65b12f329a510afed2e849ef189c8708c5636f48ca03d1bdf8950f3c784f
3
+ size 450
runs/Feb12_10-05-02_8d0c95f0ef0d/events.out.tfevents.1707732306.8d0c95f0ef0d.266.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0fec226b902e6b7c51d60c0fa98c7f81307c112eda25f5ea94e6c3b5162b6511
3
+ size 6710
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 30.0,
3
  "total_flos": 2.907095595264e+17,
4
- "train_loss": 1.6994803905487061,
5
- "train_runtime": 10528.1678,
6
- "train_samples_per_second": 0.356,
7
- "train_steps_per_second": 0.011
8
  }
 
1
  {
2
  "epoch": 30.0,
3
  "total_flos": 2.907095595264e+17,
4
+ "train_loss": 1.321283253033956,
5
+ "train_runtime": 2416.2795,
6
+ "train_samples_per_second": 1.552,
7
+ "train_steps_per_second": 0.05
8
  }
trainer_state.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "best_metric": 0.8401041626930237,
3
  "best_model_checkpoint": "/content/drive/MyDrive/Fine-Tuned_Model3/checkpoint-120",
4
  "epoch": 30.0,
5
  "eval_steps": 20,
@@ -10,108 +10,108 @@
10
  "log_history": [
11
  {
12
  "epoch": 5.0,
13
- "learning_rate": 2.9488887394336025e-05,
14
- "loss": 3.5336,
15
  "step": 20
16
  },
17
  {
18
  "epoch": 5.0,
19
- "eval_accuracy": 0.472,
20
- "eval_f1": 0.2688021058225662,
21
- "eval_loss": 2.5429601669311523,
22
- "eval_runtime": 130.7136,
23
- "eval_samples_per_second": 0.956,
24
- "eval_steps_per_second": 0.122,
25
  "step": 20
26
  },
27
  {
28
  "epoch": 10.0,
29
- "learning_rate": 1.5e-05,
30
- "loss": 1.952,
31
  "step": 40
32
  },
33
  {
34
  "epoch": 10.0,
35
- "eval_accuracy": 0.576,
36
- "eval_f1": 0.369042862070919,
37
- "eval_loss": 1.468719482421875,
38
- "eval_runtime": 131.8983,
39
- "eval_samples_per_second": 0.948,
40
- "eval_steps_per_second": 0.121,
41
  "step": 40
42
  },
43
  {
44
  "epoch": 15.0,
45
- "learning_rate": 5.11112605663977e-07,
46
- "loss": 1.3471,
47
  "step": 60
48
  },
49
  {
50
  "epoch": 15.0,
51
- "eval_accuracy": 0.584,
52
- "eval_f1": 0.38577990574558085,
53
- "eval_loss": 1.274966835975647,
54
- "eval_runtime": 139.0851,
55
- "eval_samples_per_second": 0.899,
56
- "eval_steps_per_second": 0.115,
57
  "step": 60
58
  },
59
  {
60
  "epoch": 20.0,
61
- "learning_rate": 7.499999999999993e-06,
62
- "loss": 1.2688,
63
  "step": 80
64
  },
65
  {
66
  "epoch": 20.0,
67
- "eval_accuracy": 0.576,
68
- "eval_f1": 0.3823282044677926,
69
- "eval_loss": 1.2294681072235107,
70
- "eval_runtime": 131.4905,
71
- "eval_samples_per_second": 0.951,
72
- "eval_steps_per_second": 0.122,
73
  "step": 80
74
  },
75
  {
76
  "epoch": 25.0,
77
- "learning_rate": 2.5606601717798212e-05,
78
- "loss": 1.1444,
79
  "step": 100
80
  },
81
  {
82
  "epoch": 25.0,
83
- "eval_accuracy": 0.592,
84
- "eval_f1": 0.38488272384052435,
85
- "eval_loss": 0.9876356720924377,
86
- "eval_runtime": 130.1608,
87
- "eval_samples_per_second": 0.96,
88
- "eval_steps_per_second": 0.123,
89
  "step": 100
90
  },
91
  {
92
  "epoch": 30.0,
93
- "learning_rate": 2.7990381056766586e-05,
94
- "loss": 0.9511,
95
  "step": 120
96
  },
97
  {
98
  "epoch": 30.0,
99
- "eval_accuracy": 0.592,
100
- "eval_f1": 0.4602437417654809,
101
- "eval_loss": 0.8401041626930237,
102
- "eval_runtime": 130.7723,
103
- "eval_samples_per_second": 0.956,
104
- "eval_steps_per_second": 0.122,
105
  "step": 120
106
  },
107
  {
108
  "epoch": 30.0,
109
  "step": 120,
110
  "total_flos": 2.907095595264e+17,
111
- "train_loss": 1.6994803905487061,
112
- "train_runtime": 10528.1678,
113
- "train_samples_per_second": 0.356,
114
- "train_steps_per_second": 0.011
115
  }
116
  ],
117
  "logging_steps": 20,
 
1
  {
2
+ "best_metric": 0.736162006855011,
3
  "best_model_checkpoint": "/content/drive/MyDrive/Fine-Tuned_Model3/checkpoint-120",
4
  "epoch": 30.0,
5
  "eval_steps": 20,
 
10
  "log_history": [
11
  {
12
  "epoch": 5.0,
13
+ "learning_rate": 6.25e-05,
14
+ "loss": 3.2255,
15
  "step": 20
16
  },
17
  {
18
  "epoch": 5.0,
19
+ "eval_accuracy": 0.512,
20
+ "eval_f1": 0.30833289169267614,
21
+ "eval_loss": 1.9573944807052612,
22
+ "eval_runtime": 43.495,
23
+ "eval_samples_per_second": 2.874,
24
+ "eval_steps_per_second": 0.368,
25
  "step": 20
26
  },
27
  {
28
  "epoch": 10.0,
29
+ "learning_rate": 8.535533905932738e-05,
30
+ "loss": 1.3773,
31
  "step": 40
32
  },
33
  {
34
  "epoch": 10.0,
35
+ "eval_accuracy": 0.584,
36
+ "eval_f1": 0.46169772256728775,
37
+ "eval_loss": 0.8853923678398132,
38
+ "eval_runtime": 43.5002,
39
+ "eval_samples_per_second": 2.874,
40
+ "eval_steps_per_second": 0.368,
41
  "step": 40
42
  },
43
  {
44
  "epoch": 15.0,
45
+ "learning_rate": 3.8060233744356633e-06,
46
+ "loss": 0.869,
47
  "step": 60
48
  },
49
  {
50
  "epoch": 15.0,
51
+ "eval_accuracy": 0.608,
52
+ "eval_f1": 0.4795432331237958,
53
+ "eval_loss": 0.7879514098167419,
54
+ "eval_runtime": 43.7619,
55
+ "eval_samples_per_second": 2.856,
56
+ "eval_steps_per_second": 0.366,
57
  "step": 60
58
  },
59
  {
60
  "epoch": 20.0,
61
+ "learning_rate": 4.999999999999999e-05,
62
+ "loss": 0.7966,
63
  "step": 80
64
  },
65
  {
66
  "epoch": 20.0,
67
+ "eval_accuracy": 0.6,
68
+ "eval_f1": 0.4846140574401444,
69
+ "eval_loss": 0.7732068300247192,
70
+ "eval_runtime": 43.5459,
71
+ "eval_samples_per_second": 2.871,
72
+ "eval_steps_per_second": 0.367,
73
  "step": 80
74
  },
75
  {
76
  "epoch": 25.0,
77
+ "learning_rate": 9.619397662556435e-05,
78
+ "loss": 0.8458,
79
  "step": 100
80
  },
81
  {
82
  "epoch": 25.0,
83
+ "eval_accuracy": 0.576,
84
+ "eval_f1": 0.4111637823594345,
85
+ "eval_loss": 0.7794835567474365,
86
+ "eval_runtime": 43.6082,
87
+ "eval_samples_per_second": 2.866,
88
+ "eval_steps_per_second": 0.367,
89
  "step": 100
90
  },
91
  {
92
  "epoch": 30.0,
93
+ "learning_rate": 1.4644660940672666e-05,
94
+ "loss": 0.8135,
95
  "step": 120
96
  },
97
  {
98
  "epoch": 30.0,
99
+ "eval_accuracy": 0.608,
100
+ "eval_f1": 0.5096170704866357,
101
+ "eval_loss": 0.736162006855011,
102
+ "eval_runtime": 43.4882,
103
+ "eval_samples_per_second": 2.874,
104
+ "eval_steps_per_second": 0.368,
105
  "step": 120
106
  },
107
  {
108
  "epoch": 30.0,
109
  "step": 120,
110
  "total_flos": 2.907095595264e+17,
111
+ "train_loss": 1.321283253033956,
112
+ "train_runtime": 2416.2795,
113
+ "train_samples_per_second": 1.552,
114
+ "train_steps_per_second": 0.05
115
  }
116
  ],
117
  "logging_steps": 20,
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d81a55a26d6ce36bd2cb1c3749ad8b71ae387f415df79ce84248209b54e4b4b4
3
  size 4728
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fc61c928db9a41caeebca7f4059dc89cc650436397dc5bae656b56cbbcd0f2c0
3
  size 4728