danield12 commited on
Commit
1c20820
·
verified ·
1 Parent(s): 88658c9

Upload folder using huggingface_hub

Browse files
adapter_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0e8bc85aa083b75a30b7ba295a754ce02e0c5fadb33d7e0468f13c629931a720
3
  size 160086542
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:447a1e485a3f111cf2ef769f24073ec0e50b4a06884a6f49f4dab1d2a562b562
3
  size 160086542
all_results.json CHANGED
@@ -1,17 +1,17 @@
1
  {
2
  "epoch": 0.99,
3
- "eval_accuracy": 0.82,
4
- "eval_f1_score": 0.8184577723378215,
5
- "eval_gmean": 0.8139876199369547,
6
- "eval_loss": 0.33375000953674316,
7
- "eval_precision": 0.8230000000000001,
8
- "eval_recall": 0.82,
9
- "eval_runtime": 163.2928,
10
- "eval_samples_per_second": 0.306,
11
- "eval_steps_per_second": 0.043,
12
  "total_flos": 1.1914693337677824e+17,
13
- "train_loss": 0.34641749884492606,
14
- "train_runtime": 20162.3344,
15
- "train_samples_per_second": 0.298,
16
  "train_steps_per_second": 0.005
17
  }
 
1
  {
2
  "epoch": 0.99,
3
+ "eval_accuracy": 0.9,
4
+ "eval_f1_score": 0.9015245623941276,
5
+ "eval_gmean": 0.8701338213935068,
6
+ "eval_loss": 0.30312439799308777,
7
+ "eval_precision": 0.9039473684210526,
8
+ "eval_recall": 0.9,
9
+ "eval_runtime": 152.4589,
10
+ "eval_samples_per_second": 0.328,
11
+ "eval_steps_per_second": 0.046,
12
  "total_flos": 1.1914693337677824e+17,
13
+ "train_loss": 0.3471187468497984,
14
+ "train_runtime": 19325.8318,
15
+ "train_samples_per_second": 0.31,
16
  "train_steps_per_second": 0.005
17
  }
eval_results.json CHANGED
@@ -1,12 +1,12 @@
1
  {
2
  "epoch": 0.99,
3
- "eval_accuracy": 0.82,
4
- "eval_f1_score": 0.8184577723378215,
5
- "eval_gmean": 0.8139876199369547,
6
- "eval_loss": 0.33375000953674316,
7
- "eval_precision": 0.8230000000000001,
8
- "eval_recall": 0.82,
9
- "eval_runtime": 163.2928,
10
- "eval_samples_per_second": 0.306,
11
- "eval_steps_per_second": 0.043
12
  }
 
1
  {
2
  "epoch": 0.99,
3
+ "eval_accuracy": 0.9,
4
+ "eval_f1_score": 0.9015245623941276,
5
+ "eval_gmean": 0.8701338213935068,
6
+ "eval_loss": 0.30312439799308777,
7
+ "eval_precision": 0.9039473684210526,
8
+ "eval_recall": 0.9,
9
+ "eval_runtime": 152.4589,
10
+ "eval_samples_per_second": 0.328,
11
+ "eval_steps_per_second": 0.046
12
  }
runs/Apr01_01-51-32_8c1b24df09a3/events.out.tfevents.1711936295.8c1b24df09a3.34.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c572fd7ce27abd06daa26dd3caf7cb2f6eb5656979b4fa7d8c94f6586d3c442c
3
+ size 9095
runs/Apr01_01-51-32_8c1b24df09a3/events.out.tfevents.1711955773.8c1b24df09a3.34.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4860f8be118fc6bcdcbd210a120fed1e42aa6673bbed555f8ffbcb20ca03f23f
3
+ size 605
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 0.99,
3
  "total_flos": 1.1914693337677824e+17,
4
- "train_loss": 0.34641749884492606,
5
- "train_runtime": 20162.3344,
6
- "train_samples_per_second": 0.298,
7
  "train_steps_per_second": 0.005
8
  }
 
1
  {
2
  "epoch": 0.99,
3
  "total_flos": 1.1914693337677824e+17,
4
+ "train_loss": 0.3471187468497984,
5
+ "train_runtime": 19325.8318,
6
+ "train_samples_per_second": 0.31,
7
  "train_steps_per_second": 0.005
8
  }
trainer_state.json CHANGED
@@ -10,127 +10,127 @@
10
  "log_history": [
11
  {
12
  "epoch": 0.09,
13
- "grad_norm": 6.78125,
14
  "learning_rate": 1.8681318681318682e-05,
15
- "loss": 0.3728,
16
  "step": 8
17
  },
18
  {
19
  "epoch": 0.17,
20
- "grad_norm": 5.03125,
21
  "learning_rate": 1.6923076923076924e-05,
22
- "loss": 0.353,
23
  "step": 16
24
  },
25
  {
26
  "epoch": 0.26,
27
- "grad_norm": 6.5,
28
  "learning_rate": 1.5164835164835166e-05,
29
- "loss": 0.3137,
30
  "step": 24
31
  },
32
  {
33
  "epoch": 0.3,
34
- "eval_accuracy": 0.82,
35
- "eval_f1_score": 0.8184577723378215,
36
- "eval_gmean": 0.8139876199369547,
37
- "eval_loss": 0.33320313692092896,
38
- "eval_precision": 0.8230000000000001,
39
- "eval_recall": 0.82,
40
- "eval_runtime": 163.4252,
41
- "eval_samples_per_second": 0.306,
42
- "eval_steps_per_second": 0.043,
43
  "step": 28
44
  },
45
  {
46
  "epoch": 0.34,
47
- "grad_norm": 7.40625,
48
  "learning_rate": 1.3406593406593406e-05,
49
- "loss": 0.3488,
50
  "step": 32
51
  },
52
  {
53
  "epoch": 0.43,
54
- "grad_norm": 4.375,
55
  "learning_rate": 1.164835164835165e-05,
56
- "loss": 0.3013,
57
  "step": 40
58
  },
59
  {
60
  "epoch": 0.51,
61
- "grad_norm": 8.375,
62
  "learning_rate": 9.890109890109892e-06,
63
- "loss": 0.4057,
64
  "step": 48
65
  },
66
  {
67
  "epoch": 0.6,
68
- "grad_norm": 5.90625,
69
  "learning_rate": 8.131868131868132e-06,
70
- "loss": 0.3598,
71
  "step": 56
72
  },
73
  {
74
  "epoch": 0.6,
75
- "eval_accuracy": 0.82,
76
- "eval_f1_score": 0.8184577723378215,
77
- "eval_gmean": 0.8139876199369547,
78
- "eval_loss": 0.3338281214237213,
79
- "eval_precision": 0.8230000000000001,
80
- "eval_recall": 0.82,
81
- "eval_runtime": 163.4717,
82
- "eval_samples_per_second": 0.306,
83
- "eval_steps_per_second": 0.043,
84
  "step": 56
85
  },
86
  {
87
  "epoch": 0.68,
88
- "grad_norm": 7.6875,
89
  "learning_rate": 6.373626373626373e-06,
90
- "loss": 0.295,
91
  "step": 64
92
  },
93
  {
94
  "epoch": 0.77,
95
- "grad_norm": 6.8125,
96
  "learning_rate": 4.615384615384616e-06,
97
- "loss": 0.3881,
98
  "step": 72
99
  },
100
  {
101
  "epoch": 0.85,
102
- "grad_norm": 5.90625,
103
  "learning_rate": 2.8571428571428573e-06,
104
- "loss": 0.3761,
105
  "step": 80
106
  },
107
  {
108
  "epoch": 0.9,
109
- "eval_accuracy": 0.82,
110
- "eval_f1_score": 0.8184577723378215,
111
- "eval_gmean": 0.8139876199369547,
112
- "eval_loss": 0.33375000953674316,
113
- "eval_precision": 0.8230000000000001,
114
- "eval_recall": 0.82,
115
- "eval_runtime": 163.4454,
116
- "eval_samples_per_second": 0.306,
117
- "eval_steps_per_second": 0.043,
118
  "step": 84
119
  },
120
  {
121
  "epoch": 0.94,
122
- "grad_norm": 4.96875,
123
  "learning_rate": 1.098901098901099e-06,
124
- "loss": 0.2953,
125
  "step": 88
126
  },
127
  {
128
  "epoch": 0.99,
129
  "step": 93,
130
  "total_flos": 1.1914693337677824e+17,
131
- "train_loss": 0.34641749884492606,
132
- "train_runtime": 20162.3344,
133
- "train_samples_per_second": 0.298,
134
  "train_steps_per_second": 0.005
135
  }
136
  ],
 
10
  "log_history": [
11
  {
12
  "epoch": 0.09,
13
+ "grad_norm": 7.34375,
14
  "learning_rate": 1.8681318681318682e-05,
15
+ "loss": 0.3872,
16
  "step": 8
17
  },
18
  {
19
  "epoch": 0.17,
20
+ "grad_norm": 5.59375,
21
  "learning_rate": 1.6923076923076924e-05,
22
+ "loss": 0.3649,
23
  "step": 16
24
  },
25
  {
26
  "epoch": 0.26,
27
+ "grad_norm": 5.9375,
28
  "learning_rate": 1.5164835164835166e-05,
29
+ "loss": 0.4135,
30
  "step": 24
31
  },
32
  {
33
  "epoch": 0.3,
34
+ "eval_accuracy": 0.9,
35
+ "eval_f1_score": 0.9015245623941276,
36
+ "eval_gmean": 0.8701338213935068,
37
+ "eval_loss": 0.3042968809604645,
38
+ "eval_precision": 0.9039473684210526,
39
+ "eval_recall": 0.9,
40
+ "eval_runtime": 150.7919,
41
+ "eval_samples_per_second": 0.332,
42
+ "eval_steps_per_second": 0.046,
43
  "step": 28
44
  },
45
  {
46
  "epoch": 0.34,
47
+ "grad_norm": 9.0,
48
  "learning_rate": 1.3406593406593406e-05,
49
+ "loss": 0.3769,
50
  "step": 32
51
  },
52
  {
53
  "epoch": 0.43,
54
+ "grad_norm": 5.71875,
55
  "learning_rate": 1.164835164835165e-05,
56
+ "loss": 0.3004,
57
  "step": 40
58
  },
59
  {
60
  "epoch": 0.51,
61
+ "grad_norm": 6.5625,
62
  "learning_rate": 9.890109890109892e-06,
63
+ "loss": 0.3444,
64
  "step": 48
65
  },
66
  {
67
  "epoch": 0.6,
68
+ "grad_norm": 7.6875,
69
  "learning_rate": 8.131868131868132e-06,
70
+ "loss": 0.3599,
71
  "step": 56
72
  },
73
  {
74
  "epoch": 0.6,
75
+ "eval_accuracy": 0.9,
76
+ "eval_f1_score": 0.9015245623941276,
77
+ "eval_gmean": 0.8701338213935068,
78
+ "eval_loss": 0.3040618896484375,
79
+ "eval_precision": 0.9039473684210526,
80
+ "eval_recall": 0.9,
81
+ "eval_runtime": 150.6764,
82
+ "eval_samples_per_second": 0.332,
83
+ "eval_steps_per_second": 0.046,
84
  "step": 56
85
  },
86
  {
87
  "epoch": 0.68,
88
+ "grad_norm": 5.78125,
89
  "learning_rate": 6.373626373626373e-06,
90
+ "loss": 0.3341,
91
  "step": 64
92
  },
93
  {
94
  "epoch": 0.77,
95
+ "grad_norm": 6.3125,
96
  "learning_rate": 4.615384615384616e-06,
97
+ "loss": 0.3116,
98
  "step": 72
99
  },
100
  {
101
  "epoch": 0.85,
102
+ "grad_norm": 5.53125,
103
  "learning_rate": 2.8571428571428573e-06,
104
+ "loss": 0.3222,
105
  "step": 80
106
  },
107
  {
108
  "epoch": 0.9,
109
+ "eval_accuracy": 0.9,
110
+ "eval_f1_score": 0.9015245623941276,
111
+ "eval_gmean": 0.8701338213935068,
112
+ "eval_loss": 0.30312439799308777,
113
+ "eval_precision": 0.9039473684210526,
114
+ "eval_recall": 0.9,
115
+ "eval_runtime": 152.7595,
116
+ "eval_samples_per_second": 0.327,
117
+ "eval_steps_per_second": 0.046,
118
  "step": 84
119
  },
120
  {
121
  "epoch": 0.94,
122
+ "grad_norm": 7.84375,
123
  "learning_rate": 1.098901098901099e-06,
124
+ "loss": 0.3446,
125
  "step": 88
126
  },
127
  {
128
  "epoch": 0.99,
129
  "step": 93,
130
  "total_flos": 1.1914693337677824e+17,
131
+ "train_loss": 0.3471187468497984,
132
+ "train_runtime": 19325.8318,
133
+ "train_samples_per_second": 0.31,
134
  "train_steps_per_second": 0.005
135
  }
136
  ],