danield12 commited on
Commit
04e7b41
·
verified ·
1 Parent(s): 2c91398

Upload folder using huggingface_hub

Browse files
adapter_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:447a1e485a3f111cf2ef769f24073ec0e50b4a06884a6f49f4dab1d2a562b562
3
  size 160086542
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0052296dbb13857280beac8e7379c6ace74dc1bf153ca9cfe91838b5ffeb957c
3
  size 160086542
all_results.json CHANGED
@@ -1,17 +1,17 @@
1
  {
2
  "epoch": 0.99,
3
- "eval_accuracy": 0.9,
4
- "eval_f1_score": 0.9015245623941276,
5
- "eval_gmean": 0.8701338213935068,
6
- "eval_loss": 0.30312439799308777,
7
- "eval_precision": 0.9039473684210526,
8
- "eval_recall": 0.9,
9
- "eval_runtime": 152.4589,
10
- "eval_samples_per_second": 0.328,
11
- "eval_steps_per_second": 0.046,
12
  "total_flos": 1.1914693337677824e+17,
13
- "train_loss": 0.3471187468497984,
14
- "train_runtime": 19325.8318,
15
- "train_samples_per_second": 0.31,
16
  "train_steps_per_second": 0.005
17
  }
 
1
  {
2
  "epoch": 0.99,
3
+ "eval_accuracy": 0.86,
4
+ "eval_f1_score": 0.8597171717171715,
5
+ "eval_gmean": 0.8574842430349027,
6
+ "eval_loss": 0.3646777272224426,
7
+ "eval_precision": 0.8601298701298701,
8
+ "eval_recall": 0.86,
9
+ "eval_runtime": 150.5191,
10
+ "eval_samples_per_second": 0.332,
11
+ "eval_steps_per_second": 0.047,
12
  "total_flos": 1.1914693337677824e+17,
13
+ "train_loss": 0.34092466292842744,
14
+ "train_runtime": 18751.1569,
15
+ "train_samples_per_second": 0.32,
16
  "train_steps_per_second": 0.005
17
  }
eval_results.json CHANGED
@@ -1,12 +1,12 @@
1
  {
2
  "epoch": 0.99,
3
- "eval_accuracy": 0.9,
4
- "eval_f1_score": 0.9015245623941276,
5
- "eval_gmean": 0.8701338213935068,
6
- "eval_loss": 0.30312439799308777,
7
- "eval_precision": 0.9039473684210526,
8
- "eval_recall": 0.9,
9
- "eval_runtime": 152.4589,
10
- "eval_samples_per_second": 0.328,
11
- "eval_steps_per_second": 0.046
12
  }
 
1
  {
2
  "epoch": 0.99,
3
+ "eval_accuracy": 0.86,
4
+ "eval_f1_score": 0.8597171717171715,
5
+ "eval_gmean": 0.8574842430349027,
6
+ "eval_loss": 0.3646777272224426,
7
+ "eval_precision": 0.8601298701298701,
8
+ "eval_recall": 0.86,
9
+ "eval_runtime": 150.5191,
10
+ "eval_samples_per_second": 0.332,
11
+ "eval_steps_per_second": 0.047
12
  }
runs/Apr01_13-37-34_5dac5133c9b9/events.out.tfevents.1711978656.5dac5133c9b9.34.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4819946a78d86fcd12306830f41c21a53f71520a9af8bb0e93c8d4ef0563cb35
3
+ size 5540
runs/Apr01_15-19-34_d68427716c29/events.out.tfevents.1711984776.d68427716c29.34.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:131fe0a2407e6defb41d9428fddb6acc5e385d8b98ee55a8e9c1fd8c1f67d208
3
+ size 9095
runs/Apr01_15-19-34_d68427716c29/events.out.tfevents.1712003678.d68427716c29.34.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:199dd9f9a3a018f0b7ab635cbf30107bae878d26b7772163a4d85e7c87846345
3
+ size 605
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 0.99,
3
  "total_flos": 1.1914693337677824e+17,
4
- "train_loss": 0.3471187468497984,
5
- "train_runtime": 19325.8318,
6
- "train_samples_per_second": 0.31,
7
  "train_steps_per_second": 0.005
8
  }
 
1
  {
2
  "epoch": 0.99,
3
  "total_flos": 1.1914693337677824e+17,
4
+ "train_loss": 0.34092466292842744,
5
+ "train_runtime": 18751.1569,
6
+ "train_samples_per_second": 0.32,
7
  "train_steps_per_second": 0.005
8
  }
trainer_state.json CHANGED
@@ -10,127 +10,127 @@
10
  "log_history": [
11
  {
12
  "epoch": 0.09,
13
- "grad_norm": 7.34375,
14
  "learning_rate": 1.8681318681318682e-05,
15
- "loss": 0.3872,
16
  "step": 8
17
  },
18
  {
19
  "epoch": 0.17,
20
- "grad_norm": 5.59375,
21
  "learning_rate": 1.6923076923076924e-05,
22
- "loss": 0.3649,
23
  "step": 16
24
  },
25
  {
26
  "epoch": 0.26,
27
- "grad_norm": 5.9375,
28
  "learning_rate": 1.5164835164835166e-05,
29
- "loss": 0.4135,
30
  "step": 24
31
  },
32
  {
33
  "epoch": 0.3,
34
- "eval_accuracy": 0.9,
35
- "eval_f1_score": 0.9015245623941276,
36
- "eval_gmean": 0.8701338213935068,
37
- "eval_loss": 0.3042968809604645,
38
- "eval_precision": 0.9039473684210526,
39
- "eval_recall": 0.9,
40
- "eval_runtime": 150.7919,
41
  "eval_samples_per_second": 0.332,
42
  "eval_steps_per_second": 0.046,
43
  "step": 28
44
  },
45
  {
46
  "epoch": 0.34,
47
- "grad_norm": 9.0,
48
  "learning_rate": 1.3406593406593406e-05,
49
- "loss": 0.3769,
50
  "step": 32
51
  },
52
  {
53
  "epoch": 0.43,
54
- "grad_norm": 5.71875,
55
  "learning_rate": 1.164835164835165e-05,
56
- "loss": 0.3004,
57
  "step": 40
58
  },
59
  {
60
  "epoch": 0.51,
61
- "grad_norm": 6.5625,
62
  "learning_rate": 9.890109890109892e-06,
63
- "loss": 0.3444,
64
  "step": 48
65
  },
66
  {
67
  "epoch": 0.6,
68
- "grad_norm": 7.6875,
69
  "learning_rate": 8.131868131868132e-06,
70
- "loss": 0.3599,
71
  "step": 56
72
  },
73
  {
74
  "epoch": 0.6,
75
- "eval_accuracy": 0.9,
76
- "eval_f1_score": 0.9015245623941276,
77
- "eval_gmean": 0.8701338213935068,
78
- "eval_loss": 0.3040618896484375,
79
- "eval_precision": 0.9039473684210526,
80
- "eval_recall": 0.9,
81
- "eval_runtime": 150.6764,
82
  "eval_samples_per_second": 0.332,
83
  "eval_steps_per_second": 0.046,
84
  "step": 56
85
  },
86
  {
87
  "epoch": 0.68,
88
- "grad_norm": 5.78125,
89
  "learning_rate": 6.373626373626373e-06,
90
- "loss": 0.3341,
91
  "step": 64
92
  },
93
  {
94
  "epoch": 0.77,
95
- "grad_norm": 6.3125,
96
  "learning_rate": 4.615384615384616e-06,
97
- "loss": 0.3116,
98
  "step": 72
99
  },
100
  {
101
  "epoch": 0.85,
102
- "grad_norm": 5.53125,
103
  "learning_rate": 2.8571428571428573e-06,
104
- "loss": 0.3222,
105
  "step": 80
106
  },
107
  {
108
  "epoch": 0.9,
109
- "eval_accuracy": 0.9,
110
- "eval_f1_score": 0.9015245623941276,
111
- "eval_gmean": 0.8701338213935068,
112
- "eval_loss": 0.30312439799308777,
113
- "eval_precision": 0.9039473684210526,
114
- "eval_recall": 0.9,
115
- "eval_runtime": 152.7595,
116
- "eval_samples_per_second": 0.327,
117
  "eval_steps_per_second": 0.046,
118
  "step": 84
119
  },
120
  {
121
  "epoch": 0.94,
122
- "grad_norm": 7.84375,
123
  "learning_rate": 1.098901098901099e-06,
124
- "loss": 0.3446,
125
  "step": 88
126
  },
127
  {
128
  "epoch": 0.99,
129
  "step": 93,
130
  "total_flos": 1.1914693337677824e+17,
131
- "train_loss": 0.3471187468497984,
132
- "train_runtime": 19325.8318,
133
- "train_samples_per_second": 0.31,
134
  "train_steps_per_second": 0.005
135
  }
136
  ],
 
10
  "log_history": [
11
  {
12
  "epoch": 0.09,
13
+ "grad_norm": 6.5,
14
  "learning_rate": 1.8681318681318682e-05,
15
+ "loss": 0.338,
16
  "step": 8
17
  },
18
  {
19
  "epoch": 0.17,
20
+ "grad_norm": 6.59375,
21
  "learning_rate": 1.6923076923076924e-05,
22
+ "loss": 0.2964,
23
  "step": 16
24
  },
25
  {
26
  "epoch": 0.26,
27
+ "grad_norm": 4.5625,
28
  "learning_rate": 1.5164835164835166e-05,
29
+ "loss": 0.3441,
30
  "step": 24
31
  },
32
  {
33
  "epoch": 0.3,
34
+ "eval_accuracy": 0.86,
35
+ "eval_f1_score": 0.8597171717171715,
36
+ "eval_gmean": 0.8574842430349027,
37
+ "eval_loss": 0.36518555879592896,
38
+ "eval_precision": 0.8601298701298701,
39
+ "eval_recall": 0.86,
40
+ "eval_runtime": 150.657,
41
  "eval_samples_per_second": 0.332,
42
  "eval_steps_per_second": 0.046,
43
  "step": 28
44
  },
45
  {
46
  "epoch": 0.34,
47
+ "grad_norm": 5.0625,
48
  "learning_rate": 1.3406593406593406e-05,
49
+ "loss": 0.3407,
50
  "step": 32
51
  },
52
  {
53
  "epoch": 0.43,
54
+ "grad_norm": 7.21875,
55
  "learning_rate": 1.164835164835165e-05,
56
+ "loss": 0.3418,
57
  "step": 40
58
  },
59
  {
60
  "epoch": 0.51,
61
+ "grad_norm": 9.75,
62
  "learning_rate": 9.890109890109892e-06,
63
+ "loss": 0.3868,
64
  "step": 48
65
  },
66
  {
67
  "epoch": 0.6,
68
+ "grad_norm": 6.15625,
69
  "learning_rate": 8.131868131868132e-06,
70
+ "loss": 0.3252,
71
  "step": 56
72
  },
73
  {
74
  "epoch": 0.6,
75
+ "eval_accuracy": 0.86,
76
+ "eval_f1_score": 0.8597171717171715,
77
+ "eval_gmean": 0.8574842430349027,
78
+ "eval_loss": 0.36469727754592896,
79
+ "eval_precision": 0.8601298701298701,
80
+ "eval_recall": 0.86,
81
+ "eval_runtime": 150.6949,
82
  "eval_samples_per_second": 0.332,
83
  "eval_steps_per_second": 0.046,
84
  "step": 56
85
  },
86
  {
87
  "epoch": 0.68,
88
+ "grad_norm": 5.875,
89
  "learning_rate": 6.373626373626373e-06,
90
+ "loss": 0.3562,
91
  "step": 64
92
  },
93
  {
94
  "epoch": 0.77,
95
+ "grad_norm": 7.34375,
96
  "learning_rate": 4.615384615384616e-06,
97
+ "loss": 0.3252,
98
  "step": 72
99
  },
100
  {
101
  "epoch": 0.85,
102
+ "grad_norm": 6.25,
103
  "learning_rate": 2.8571428571428573e-06,
104
+ "loss": 0.3177,
105
  "step": 80
106
  },
107
  {
108
  "epoch": 0.9,
109
+ "eval_accuracy": 0.86,
110
+ "eval_f1_score": 0.8597171717171715,
111
+ "eval_gmean": 0.8574842430349027,
112
+ "eval_loss": 0.3646777272224426,
113
+ "eval_precision": 0.8601298701298701,
114
+ "eval_recall": 0.86,
115
+ "eval_runtime": 150.7321,
116
+ "eval_samples_per_second": 0.332,
117
  "eval_steps_per_second": 0.046,
118
  "step": 84
119
  },
120
  {
121
  "epoch": 0.94,
122
+ "grad_norm": 6.9375,
123
  "learning_rate": 1.098901098901099e-06,
124
+ "loss": 0.3777,
125
  "step": 88
126
  },
127
  {
128
  "epoch": 0.99,
129
  "step": 93,
130
  "total_flos": 1.1914693337677824e+17,
131
+ "train_loss": 0.34092466292842744,
132
+ "train_runtime": 18751.1569,
133
+ "train_samples_per_second": 0.32,
134
  "train_steps_per_second": 0.005
135
  }
136
  ],