danield12 committed on
Commit
600e178
·
verified ·
1 Parent(s): 8ca1af7

Upload folder using huggingface_hub

Browse files
adapter_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b349cc388254688729bb2bee539e11e35048cffe1a215edda714ab0e5e576f87
3
  size 160086542
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0e8bc85aa083b75a30b7ba295a754ce02e0c5fadb33d7e0468f13c629931a720
3
  size 160086542
all_results.json CHANGED
@@ -1,17 +1,17 @@
1
  {
2
  "epoch": 0.99,
3
- "eval_accuracy": 0.8,
4
- "eval_f1_score": 0.7993558776167471,
5
- "eval_gmean": 0.7980746061134115,
6
- "eval_loss": 0.5084765553474426,
7
- "eval_precision": 0.8012987012987013,
8
- "eval_recall": 0.8,
9
- "eval_runtime": 158.4717,
10
- "eval_samples_per_second": 0.316,
11
- "eval_steps_per_second": 0.044,
12
  "total_flos": 1.1914693337677824e+17,
13
- "train_loss": 0.3557273290490591,
14
- "train_runtime": 19662.2913,
15
- "train_samples_per_second": 0.305,
16
  "train_steps_per_second": 0.005
17
  }
 
1
  {
2
  "epoch": 0.99,
3
+ "eval_accuracy": 0.82,
4
+ "eval_f1_score": 0.8184577723378215,
5
+ "eval_gmean": 0.8139876199369547,
6
+ "eval_loss": 0.33375000953674316,
7
+ "eval_precision": 0.8230000000000001,
8
+ "eval_recall": 0.82,
9
+ "eval_runtime": 163.2928,
10
+ "eval_samples_per_second": 0.306,
11
+ "eval_steps_per_second": 0.043,
12
  "total_flos": 1.1914693337677824e+17,
13
+ "train_loss": 0.34641749884492606,
14
+ "train_runtime": 20162.3344,
15
+ "train_samples_per_second": 0.298,
16
  "train_steps_per_second": 0.005
17
  }
eval_results.json CHANGED
@@ -1,12 +1,12 @@
1
  {
2
  "epoch": 0.99,
3
- "eval_accuracy": 0.8,
4
- "eval_f1_score": 0.7993558776167471,
5
- "eval_gmean": 0.7980746061134115,
6
- "eval_loss": 0.5084765553474426,
7
- "eval_precision": 0.8012987012987013,
8
- "eval_recall": 0.8,
9
- "eval_runtime": 158.4717,
10
- "eval_samples_per_second": 0.316,
11
- "eval_steps_per_second": 0.044
12
  }
 
1
  {
2
  "epoch": 0.99,
3
+ "eval_accuracy": 0.82,
4
+ "eval_f1_score": 0.8184577723378215,
5
+ "eval_gmean": 0.8139876199369547,
6
+ "eval_loss": 0.33375000953674316,
7
+ "eval_precision": 0.8230000000000001,
8
+ "eval_recall": 0.82,
9
+ "eval_runtime": 163.2928,
10
+ "eval_samples_per_second": 0.306,
11
+ "eval_steps_per_second": 0.043
12
  }
runs/Mar31_18-25-38_a22c766383b5/events.out.tfevents.1711909540.a22c766383b5.34.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0b7755fac8c174276415b660caa3a37263a2aff2e2d9d347068aaec3b0457168
3
+ size 9095
runs/Mar31_18-25-38_a22c766383b5/events.out.tfevents.1711929866.a22c766383b5.34.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:62fe50438adbafc6ccd74de88b333c865460e8ed8b927f662013574f5846e9d7
3
+ size 605
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 0.99,
3
  "total_flos": 1.1914693337677824e+17,
4
- "train_loss": 0.3557273290490591,
5
- "train_runtime": 19662.2913,
6
- "train_samples_per_second": 0.305,
7
  "train_steps_per_second": 0.005
8
  }
 
1
  {
2
  "epoch": 0.99,
3
  "total_flos": 1.1914693337677824e+17,
4
+ "train_loss": 0.34641749884492606,
5
+ "train_runtime": 20162.3344,
6
+ "train_samples_per_second": 0.298,
7
  "train_steps_per_second": 0.005
8
  }
trainer_state.json CHANGED
@@ -10,127 +10,127 @@
10
  "log_history": [
11
  {
12
  "epoch": 0.09,
13
- "grad_norm": 6.0,
14
  "learning_rate": 1.8681318681318682e-05,
15
- "loss": 0.266,
16
  "step": 8
17
  },
18
  {
19
  "epoch": 0.17,
20
- "grad_norm": 8.75,
21
  "learning_rate": 1.6923076923076924e-05,
22
- "loss": 0.404,
23
  "step": 16
24
  },
25
  {
26
  "epoch": 0.26,
27
- "grad_norm": 7.90625,
28
  "learning_rate": 1.5164835164835166e-05,
29
- "loss": 0.4084,
30
  "step": 24
31
  },
32
  {
33
  "epoch": 0.3,
34
- "eval_accuracy": 0.8,
35
- "eval_f1_score": 0.7993558776167471,
36
- "eval_gmean": 0.7980746061134115,
37
- "eval_loss": 0.5118359327316284,
38
- "eval_precision": 0.8012987012987013,
39
- "eval_recall": 0.8,
40
- "eval_runtime": 158.1221,
41
- "eval_samples_per_second": 0.316,
42
- "eval_steps_per_second": 0.044,
43
  "step": 28
44
  },
45
  {
46
  "epoch": 0.34,
47
- "grad_norm": 6.84375,
48
  "learning_rate": 1.3406593406593406e-05,
49
- "loss": 0.3697,
50
  "step": 32
51
  },
52
  {
53
  "epoch": 0.43,
54
- "grad_norm": 5.9375,
55
  "learning_rate": 1.164835164835165e-05,
56
- "loss": 0.3647,
57
  "step": 40
58
  },
59
  {
60
  "epoch": 0.51,
61
- "grad_norm": 7.1875,
62
  "learning_rate": 9.890109890109892e-06,
63
- "loss": 0.3738,
64
  "step": 48
65
  },
66
  {
67
  "epoch": 0.6,
68
- "grad_norm": 6.46875,
69
  "learning_rate": 8.131868131868132e-06,
70
- "loss": 0.3298,
71
  "step": 56
72
  },
73
  {
74
  "epoch": 0.6,
75
- "eval_accuracy": 0.8,
76
- "eval_f1_score": 0.7993558776167471,
77
- "eval_gmean": 0.7980746061134115,
78
- "eval_loss": 0.5087890625,
79
- "eval_precision": 0.8012987012987013,
80
- "eval_recall": 0.8,
81
- "eval_runtime": 158.641,
82
- "eval_samples_per_second": 0.315,
83
- "eval_steps_per_second": 0.044,
84
  "step": 56
85
  },
86
  {
87
  "epoch": 0.68,
88
- "grad_norm": 6.75,
89
  "learning_rate": 6.373626373626373e-06,
90
- "loss": 0.333,
91
  "step": 64
92
  },
93
  {
94
  "epoch": 0.77,
95
- "grad_norm": 7.3125,
96
  "learning_rate": 4.615384615384616e-06,
97
- "loss": 0.3813,
98
  "step": 72
99
  },
100
  {
101
  "epoch": 0.85,
102
- "grad_norm": 6.5,
103
  "learning_rate": 2.8571428571428573e-06,
104
- "loss": 0.3403,
105
  "step": 80
106
  },
107
  {
108
  "epoch": 0.9,
109
- "eval_accuracy": 0.8,
110
- "eval_f1_score": 0.7993558776167471,
111
- "eval_gmean": 0.7980746061134115,
112
- "eval_loss": 0.5084765553474426,
113
- "eval_precision": 0.8012987012987013,
114
- "eval_recall": 0.8,
115
- "eval_runtime": 158.2765,
116
- "eval_samples_per_second": 0.316,
117
- "eval_steps_per_second": 0.044,
118
  "step": 84
119
  },
120
  {
121
  "epoch": 0.94,
122
- "grad_norm": 6.84375,
123
  "learning_rate": 1.098901098901099e-06,
124
- "loss": 0.3473,
125
  "step": 88
126
  },
127
  {
128
  "epoch": 0.99,
129
  "step": 93,
130
  "total_flos": 1.1914693337677824e+17,
131
- "train_loss": 0.3557273290490591,
132
- "train_runtime": 19662.2913,
133
- "train_samples_per_second": 0.305,
134
  "train_steps_per_second": 0.005
135
  }
136
  ],
 
10
  "log_history": [
11
  {
12
  "epoch": 0.09,
13
+ "grad_norm": 6.78125,
14
  "learning_rate": 1.8681318681318682e-05,
15
+ "loss": 0.3728,
16
  "step": 8
17
  },
18
  {
19
  "epoch": 0.17,
20
+ "grad_norm": 5.03125,
21
  "learning_rate": 1.6923076923076924e-05,
22
+ "loss": 0.353,
23
  "step": 16
24
  },
25
  {
26
  "epoch": 0.26,
27
+ "grad_norm": 6.5,
28
  "learning_rate": 1.5164835164835166e-05,
29
+ "loss": 0.3137,
30
  "step": 24
31
  },
32
  {
33
  "epoch": 0.3,
34
+ "eval_accuracy": 0.82,
35
+ "eval_f1_score": 0.8184577723378215,
36
+ "eval_gmean": 0.8139876199369547,
37
+ "eval_loss": 0.33320313692092896,
38
+ "eval_precision": 0.8230000000000001,
39
+ "eval_recall": 0.82,
40
+ "eval_runtime": 163.4252,
41
+ "eval_samples_per_second": 0.306,
42
+ "eval_steps_per_second": 0.043,
43
  "step": 28
44
  },
45
  {
46
  "epoch": 0.34,
47
+ "grad_norm": 7.40625,
48
  "learning_rate": 1.3406593406593406e-05,
49
+ "loss": 0.3488,
50
  "step": 32
51
  },
52
  {
53
  "epoch": 0.43,
54
+ "grad_norm": 4.375,
55
  "learning_rate": 1.164835164835165e-05,
56
+ "loss": 0.3013,
57
  "step": 40
58
  },
59
  {
60
  "epoch": 0.51,
61
+ "grad_norm": 8.375,
62
  "learning_rate": 9.890109890109892e-06,
63
+ "loss": 0.4057,
64
  "step": 48
65
  },
66
  {
67
  "epoch": 0.6,
68
+ "grad_norm": 5.90625,
69
  "learning_rate": 8.131868131868132e-06,
70
+ "loss": 0.3598,
71
  "step": 56
72
  },
73
  {
74
  "epoch": 0.6,
75
+ "eval_accuracy": 0.82,
76
+ "eval_f1_score": 0.8184577723378215,
77
+ "eval_gmean": 0.8139876199369547,
78
+ "eval_loss": 0.3338281214237213,
79
+ "eval_precision": 0.8230000000000001,
80
+ "eval_recall": 0.82,
81
+ "eval_runtime": 163.4717,
82
+ "eval_samples_per_second": 0.306,
83
+ "eval_steps_per_second": 0.043,
84
  "step": 56
85
  },
86
  {
87
  "epoch": 0.68,
88
+ "grad_norm": 7.6875,
89
  "learning_rate": 6.373626373626373e-06,
90
+ "loss": 0.295,
91
  "step": 64
92
  },
93
  {
94
  "epoch": 0.77,
95
+ "grad_norm": 6.8125,
96
  "learning_rate": 4.615384615384616e-06,
97
+ "loss": 0.3881,
98
  "step": 72
99
  },
100
  {
101
  "epoch": 0.85,
102
+ "grad_norm": 5.90625,
103
  "learning_rate": 2.8571428571428573e-06,
104
+ "loss": 0.3761,
105
  "step": 80
106
  },
107
  {
108
  "epoch": 0.9,
109
+ "eval_accuracy": 0.82,
110
+ "eval_f1_score": 0.8184577723378215,
111
+ "eval_gmean": 0.8139876199369547,
112
+ "eval_loss": 0.33375000953674316,
113
+ "eval_precision": 0.8230000000000001,
114
+ "eval_recall": 0.82,
115
+ "eval_runtime": 163.4454,
116
+ "eval_samples_per_second": 0.306,
117
+ "eval_steps_per_second": 0.043,
118
  "step": 84
119
  },
120
  {
121
  "epoch": 0.94,
122
+ "grad_norm": 4.96875,
123
  "learning_rate": 1.098901098901099e-06,
124
+ "loss": 0.2953,
125
  "step": 88
126
  },
127
  {
128
  "epoch": 0.99,
129
  "step": 93,
130
  "total_flos": 1.1914693337677824e+17,
131
+ "train_loss": 0.34641749884492606,
132
+ "train_runtime": 20162.3344,
133
+ "train_samples_per_second": 0.298,
134
  "train_steps_per_second": 0.005
135
  }
136
  ],