arpanl commited on
Commit
d40889c
·
verified ·
1 Parent(s): ec4fc42

Training in progress, step 20

Browse files
all_results.json CHANGED
@@ -1,14 +1,14 @@
1
  {
2
  "epoch": 30.0,
3
  "eval_accuracy": 0.592,
4
- "eval_f1": 0.43854957441913966,
5
- "eval_loss": 0.8978701829910278,
6
- "eval_runtime": 131.0498,
7
- "eval_samples_per_second": 0.954,
8
- "eval_steps_per_second": 0.122,
9
  "total_flos": 2.907095595264e+17,
10
- "train_loss": 1.6024109204610189,
11
- "train_runtime": 10078.4501,
12
- "train_samples_per_second": 0.372,
13
- "train_steps_per_second": 0.012
14
  }
 
1
  {
2
  "epoch": 30.0,
3
  "eval_accuracy": 0.592,
4
+ "eval_f1": 0.4602437417654809,
5
+ "eval_loss": 0.8401041626930237,
6
+ "eval_runtime": 130.3522,
7
+ "eval_samples_per_second": 0.959,
8
+ "eval_steps_per_second": 0.123,
9
  "total_flos": 2.907095595264e+17,
10
+ "train_loss": 1.6994803905487061,
11
+ "train_runtime": 10528.1678,
12
+ "train_samples_per_second": 0.356,
13
+ "train_steps_per_second": 0.011
14
  }
eval_results.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "epoch": 30.0,
3
  "eval_accuracy": 0.592,
4
- "eval_f1": 0.43854957441913966,
5
- "eval_loss": 0.8978701829910278,
6
- "eval_runtime": 131.0498,
7
- "eval_samples_per_second": 0.954,
8
- "eval_steps_per_second": 0.122
9
  }
 
1
  {
2
  "epoch": 30.0,
3
  "eval_accuracy": 0.592,
4
+ "eval_f1": 0.4602437417654809,
5
+ "eval_loss": 0.8401041626930237,
6
+ "eval_runtime": 130.3522,
7
+ "eval_samples_per_second": 0.959,
8
+ "eval_steps_per_second": 0.123
9
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6b5d774cd52b7efdb96d06df5553ae1ce0114e2fbde7330cb2a4b20e7f5a7084
3
  size 343359328
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:62557cd7096a9412d55e317cc264879c2bb612afd6036295645eeeb21cd4c111
3
  size 343359328
runs/Feb09_10-51-58_95d38ead18ce/events.out.tfevents.1707486617.95d38ead18ce.561.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bd16c70d4624dfc58a398be0404965c9e43aa9db34cacb027a98891fe7405271
3
+ size 450
runs/Feb12_04-49-49_e7b40a5a562d/events.out.tfevents.1707713396.e7b40a5a562d.565.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bf6a1f1b1a1974f1c3b8e6cfb2e7329dd038f71ed574a747d4b814f72491b310
3
+ size 6709
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 30.0,
3
  "total_flos": 2.907095595264e+17,
4
- "train_loss": 1.6024109204610189,
5
- "train_runtime": 10078.4501,
6
- "train_samples_per_second": 0.372,
7
- "train_steps_per_second": 0.012
8
  }
 
1
  {
2
  "epoch": 30.0,
3
  "total_flos": 2.907095595264e+17,
4
+ "train_loss": 1.6994803905487061,
5
+ "train_runtime": 10528.1678,
6
+ "train_samples_per_second": 0.356,
7
+ "train_steps_per_second": 0.011
8
  }
trainer_state.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "best_metric": 0.8978701829910278,
3
  "best_model_checkpoint": "/content/drive/MyDrive/Fine-Tuned_Model3/checkpoint-120",
4
  "epoch": 30.0,
5
  "eval_steps": 20,
@@ -10,72 +10,96 @@
10
  "log_history": [
11
  {
12
  "epoch": 5.0,
13
- "eval_accuracy": 0.512,
14
- "eval_f1": 0.2812087537790227,
15
- "eval_loss": 2.0562753677368164,
16
- "eval_runtime": 131.4968,
17
- "eval_samples_per_second": 0.951,
 
 
 
 
 
 
18
  "eval_steps_per_second": 0.122,
19
  "step": 20
20
  },
 
 
 
 
 
 
21
  {
22
  "epoch": 10.0,
23
  "eval_accuracy": 0.576,
24
- "eval_f1": 0.375200783721446,
25
- "eval_loss": 1.4345649480819702,
26
- "eval_runtime": 132.0355,
27
- "eval_samples_per_second": 0.947,
28
  "eval_steps_per_second": 0.121,
29
  "step": 40
30
  },
31
  {
32
- "epoch": 12.5,
33
- "learning_rate": 3.4048431995589453e-06,
34
- "loss": 2.1474,
35
- "step": 50
36
  },
37
  {
38
  "epoch": 15.0,
39
- "eval_accuracy": 0.576,
40
- "eval_f1": 0.3873325405294715,
41
- "eval_loss": 1.3222265243530273,
42
- "eval_runtime": 132.1891,
43
- "eval_samples_per_second": 0.946,
44
- "eval_steps_per_second": 0.121,
45
  "step": 60
46
  },
 
 
 
 
 
 
47
  {
48
  "epoch": 20.0,
49
  "eval_accuracy": 0.576,
50
- "eval_f1": 0.3879913020577983,
51
- "eval_loss": 1.2946172952651978,
52
- "eval_runtime": 131.2242,
53
- "eval_samples_per_second": 0.953,
54
  "eval_steps_per_second": 0.122,
55
  "step": 80
56
  },
57
  {
58
  "epoch": 25.0,
59
- "learning_rate": 1.7926354830241928e-05,
60
- "loss": 1.2873,
61
  "step": 100
62
  },
63
  {
64
  "epoch": 25.0,
65
- "eval_accuracy": 0.6,
66
- "eval_f1": 0.40130894254935173,
67
- "eval_loss": 1.0957316160202026,
68
- "eval_runtime": 130.6383,
69
- "eval_samples_per_second": 0.957,
70
- "eval_steps_per_second": 0.122,
71
  "step": 100
72
  },
 
 
 
 
 
 
73
  {
74
  "epoch": 30.0,
75
  "eval_accuracy": 0.592,
76
- "eval_f1": 0.43854957441913966,
77
- "eval_loss": 0.8978701829910278,
78
- "eval_runtime": 130.7817,
79
  "eval_samples_per_second": 0.956,
80
  "eval_steps_per_second": 0.122,
81
  "step": 120
@@ -84,13 +108,13 @@
84
  "epoch": 30.0,
85
  "step": 120,
86
  "total_flos": 2.907095595264e+17,
87
- "train_loss": 1.6024109204610189,
88
- "train_runtime": 10078.4501,
89
- "train_samples_per_second": 0.372,
90
- "train_steps_per_second": 0.012
91
  }
92
  ],
93
- "logging_steps": 50,
94
  "max_steps": 120,
95
  "num_input_tokens_seen": 0,
96
  "num_train_epochs": 30,
 
1
  {
2
+ "best_metric": 0.8401041626930237,
3
  "best_model_checkpoint": "/content/drive/MyDrive/Fine-Tuned_Model3/checkpoint-120",
4
  "epoch": 30.0,
5
  "eval_steps": 20,
 
10
  "log_history": [
11
  {
12
  "epoch": 5.0,
13
+ "learning_rate": 2.9488887394336025e-05,
14
+ "loss": 3.5336,
15
+ "step": 20
16
+ },
17
+ {
18
+ "epoch": 5.0,
19
+ "eval_accuracy": 0.472,
20
+ "eval_f1": 0.2688021058225662,
21
+ "eval_loss": 2.5429601669311523,
22
+ "eval_runtime": 130.7136,
23
+ "eval_samples_per_second": 0.956,
24
  "eval_steps_per_second": 0.122,
25
  "step": 20
26
  },
27
+ {
28
+ "epoch": 10.0,
29
+ "learning_rate": 1.5e-05,
30
+ "loss": 1.952,
31
+ "step": 40
32
+ },
33
  {
34
  "epoch": 10.0,
35
  "eval_accuracy": 0.576,
36
+ "eval_f1": 0.369042862070919,
37
+ "eval_loss": 1.468719482421875,
38
+ "eval_runtime": 131.8983,
39
+ "eval_samples_per_second": 0.948,
40
  "eval_steps_per_second": 0.121,
41
  "step": 40
42
  },
43
  {
44
+ "epoch": 15.0,
45
+ "learning_rate": 5.11112605663977e-07,
46
+ "loss": 1.3471,
47
+ "step": 60
48
  },
49
  {
50
  "epoch": 15.0,
51
+ "eval_accuracy": 0.584,
52
+ "eval_f1": 0.38577990574558085,
53
+ "eval_loss": 1.274966835975647,
54
+ "eval_runtime": 139.0851,
55
+ "eval_samples_per_second": 0.899,
56
+ "eval_steps_per_second": 0.115,
57
  "step": 60
58
  },
59
+ {
60
+ "epoch": 20.0,
61
+ "learning_rate": 7.499999999999993e-06,
62
+ "loss": 1.2688,
63
+ "step": 80
64
+ },
65
  {
66
  "epoch": 20.0,
67
  "eval_accuracy": 0.576,
68
+ "eval_f1": 0.3823282044677926,
69
+ "eval_loss": 1.2294681072235107,
70
+ "eval_runtime": 131.4905,
71
+ "eval_samples_per_second": 0.951,
72
  "eval_steps_per_second": 0.122,
73
  "step": 80
74
  },
75
  {
76
  "epoch": 25.0,
77
+ "learning_rate": 2.5606601717798212e-05,
78
+ "loss": 1.1444,
79
  "step": 100
80
  },
81
  {
82
  "epoch": 25.0,
83
+ "eval_accuracy": 0.592,
84
+ "eval_f1": 0.38488272384052435,
85
+ "eval_loss": 0.9876356720924377,
86
+ "eval_runtime": 130.1608,
87
+ "eval_samples_per_second": 0.96,
88
+ "eval_steps_per_second": 0.123,
89
  "step": 100
90
  },
91
+ {
92
+ "epoch": 30.0,
93
+ "learning_rate": 2.7990381056766586e-05,
94
+ "loss": 0.9511,
95
+ "step": 120
96
+ },
97
  {
98
  "epoch": 30.0,
99
  "eval_accuracy": 0.592,
100
+ "eval_f1": 0.4602437417654809,
101
+ "eval_loss": 0.8401041626930237,
102
+ "eval_runtime": 130.7723,
103
  "eval_samples_per_second": 0.956,
104
  "eval_steps_per_second": 0.122,
105
  "step": 120
 
108
  "epoch": 30.0,
109
  "step": 120,
110
  "total_flos": 2.907095595264e+17,
111
+ "train_loss": 1.6994803905487061,
112
+ "train_runtime": 10528.1678,
113
+ "train_samples_per_second": 0.356,
114
+ "train_steps_per_second": 0.011
115
  }
116
  ],
117
+ "logging_steps": 20,
118
  "max_steps": 120,
119
  "num_input_tokens_seen": 0,
120
  "num_train_epochs": 30,
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:524ac55fe2d55f48c14744604e89ac38f57b6b1a0be144350a0aa965c80cbf5f
3
  size 4728
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d81a55a26d6ce36bd2cb1c3749ad8b71ae387f415df79ce84248209b54e4b4b4
3
  size 4728