danield12 committed on
Commit
58bf162
·
verified ·
1 Parent(s): 181a7d9

Upload folder using huggingface_hub

Browse files
adapter_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e20f84166792753507ea6124bdd53360db24770abff12c0c1561863e51e82fd7
3
  size 160086542
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:95e2a19914eaa14513f860a0e901e2e1f0a0a709a4d92ea72ec0c3c855b69fd8
3
  size 160086542
all_results.json CHANGED
@@ -1,17 +1,17 @@
1
  {
2
  "epoch": 1.0,
3
  "eval_accuracy": 0.8166666666666667,
4
- "eval_f1_score": 0.8149425287356322,
5
- "eval_gmean": 0.7636703179128833,
6
- "eval_loss": 0.3408854305744171,
7
- "eval_precision": 0.8137310606060607,
8
  "eval_recall": 0.8166666666666667,
9
- "eval_runtime": 180.7643,
10
- "eval_samples_per_second": 0.332,
11
- "eval_steps_per_second": 0.044,
12
  "total_flos": 8.435821078904832e+16,
13
- "train_loss": 0.43565983558768656,
14
- "train_runtime": 13206.8117,
15
- "train_samples_per_second": 0.324,
16
  "train_steps_per_second": 0.005
17
  }
 
1
  {
2
  "epoch": 1.0,
3
  "eval_accuracy": 0.8166666666666667,
4
+ "eval_f1_score": 0.8080459770114942,
5
+ "eval_gmean": 0.7501820727030913,
6
+ "eval_loss": 0.5850911736488342,
7
+ "eval_precision": 0.8133022774327122,
8
  "eval_recall": 0.8166666666666667,
9
+ "eval_runtime": 175.3378,
10
+ "eval_samples_per_second": 0.342,
11
+ "eval_steps_per_second": 0.046,
12
  "total_flos": 8.435821078904832e+16,
13
+ "train_loss": 0.405215135261194,
14
+ "train_runtime": 12957.5785,
15
+ "train_samples_per_second": 0.33,
16
  "train_steps_per_second": 0.005
17
  }
eval_results.json CHANGED
@@ -1,12 +1,12 @@
1
  {
2
  "epoch": 1.0,
3
  "eval_accuracy": 0.8166666666666667,
4
- "eval_f1_score": 0.8149425287356322,
5
- "eval_gmean": 0.7636703179128833,
6
- "eval_loss": 0.3408854305744171,
7
- "eval_precision": 0.8137310606060607,
8
  "eval_recall": 0.8166666666666667,
9
- "eval_runtime": 180.7643,
10
- "eval_samples_per_second": 0.332,
11
- "eval_steps_per_second": 0.044
12
  }
 
1
  {
2
  "epoch": 1.0,
3
  "eval_accuracy": 0.8166666666666667,
4
+ "eval_f1_score": 0.8080459770114942,
5
+ "eval_gmean": 0.7501820727030913,
6
+ "eval_loss": 0.5850911736488342,
7
+ "eval_precision": 0.8133022774327122,
8
  "eval_recall": 0.8166666666666667,
9
+ "eval_runtime": 175.3378,
10
+ "eval_samples_per_second": 0.342,
11
+ "eval_steps_per_second": 0.046
12
  }
runs/Apr02_23-40-54_3c3e34ad1384/events.out.tfevents.1712101256.3c3e34ad1384.34.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c446384ed4b1fb2dcfb64f086d9f3310938be2eea7eb29248560679c1130b9e0
3
+ size 7924
runs/Apr02_23-40-54_3c3e34ad1384/events.out.tfevents.1712114389.3c3e34ad1384.34.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:52f220ea6075bb904c8e69b55c315d3315a1a2b6e3cdc8fd0dcb223c65572ece
3
+ size 605
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 1.0,
3
  "total_flos": 8.435821078904832e+16,
4
- "train_loss": 0.43565983558768656,
5
- "train_runtime": 13206.8117,
6
- "train_samples_per_second": 0.324,
7
  "train_steps_per_second": 0.005
8
  }
 
1
  {
2
  "epoch": 1.0,
3
  "total_flos": 8.435821078904832e+16,
4
+ "train_loss": 0.405215135261194,
5
+ "train_runtime": 12957.5785,
6
+ "train_samples_per_second": 0.33,
7
  "train_steps_per_second": 0.005
8
  }
trainer_state.json CHANGED
@@ -10,93 +10,93 @@
10
  "log_history": [
11
  {
12
  "epoch": 0.12,
13
- "grad_norm": 13.4375,
14
  "learning_rate": 1.8153846153846155e-05,
15
- "loss": 0.4866,
16
  "step": 8
17
  },
18
  {
19
  "epoch": 0.24,
20
- "grad_norm": 14.5625,
21
  "learning_rate": 1.5692307692307693e-05,
22
- "loss": 0.4687,
23
  "step": 16
24
  },
25
  {
26
  "epoch": 0.36,
27
- "grad_norm": 6.6875,
28
  "learning_rate": 1.3230769230769231e-05,
29
- "loss": 0.4295,
30
  "step": 24
31
  },
32
  {
33
  "epoch": 0.42,
34
  "eval_accuracy": 0.8166666666666667,
35
- "eval_f1_score": 0.8149425287356322,
36
- "eval_gmean": 0.7636703179128833,
37
- "eval_loss": 0.3428385555744171,
38
- "eval_precision": 0.8137310606060607,
39
  "eval_recall": 0.8166666666666667,
40
- "eval_runtime": 180.8759,
41
- "eval_samples_per_second": 0.332,
42
- "eval_steps_per_second": 0.044,
43
  "step": 28
44
  },
45
  {
46
  "epoch": 0.48,
47
- "grad_norm": 6.46875,
48
  "learning_rate": 1.076923076923077e-05,
49
- "loss": 0.4236,
50
  "step": 32
51
  },
52
  {
53
  "epoch": 0.6,
54
- "grad_norm": 9.8125,
55
  "learning_rate": 8.307692307692309e-06,
56
- "loss": 0.3919,
57
  "step": 40
58
  },
59
  {
60
  "epoch": 0.72,
61
- "grad_norm": 13.5,
62
  "learning_rate": 5.846153846153847e-06,
63
- "loss": 0.4099,
64
  "step": 48
65
  },
66
  {
67
  "epoch": 0.84,
68
- "grad_norm": 11.4375,
69
  "learning_rate": 3.384615384615385e-06,
70
- "loss": 0.4242,
71
  "step": 56
72
  },
73
  {
74
  "epoch": 0.84,
75
  "eval_accuracy": 0.8166666666666667,
76
- "eval_f1_score": 0.8149425287356322,
77
- "eval_gmean": 0.7636703179128833,
78
- "eval_loss": 0.34062498807907104,
79
- "eval_precision": 0.8137310606060607,
80
  "eval_recall": 0.8166666666666667,
81
- "eval_runtime": 180.4163,
82
- "eval_samples_per_second": 0.333,
83
- "eval_steps_per_second": 0.044,
84
  "step": 56
85
  },
86
  {
87
  "epoch": 0.96,
88
- "grad_norm": 9.3125,
89
  "learning_rate": 9.230769230769232e-07,
90
- "loss": 0.4092,
91
  "step": 64
92
  },
93
  {
94
  "epoch": 1.0,
95
  "step": 67,
96
  "total_flos": 8.435821078904832e+16,
97
- "train_loss": 0.43565983558768656,
98
- "train_runtime": 13206.8117,
99
- "train_samples_per_second": 0.324,
100
  "train_steps_per_second": 0.005
101
  }
102
  ],
 
10
  "log_history": [
11
  {
12
  "epoch": 0.12,
13
+ "grad_norm": 9.4375,
14
  "learning_rate": 1.8153846153846155e-05,
15
+ "loss": 0.4282,
16
  "step": 8
17
  },
18
  {
19
  "epoch": 0.24,
20
+ "grad_norm": 10.5,
21
  "learning_rate": 1.5692307692307693e-05,
22
+ "loss": 0.4335,
23
  "step": 16
24
  },
25
  {
26
  "epoch": 0.36,
27
+ "grad_norm": 5.03125,
28
  "learning_rate": 1.3230769230769231e-05,
29
+ "loss": 0.3984,
30
  "step": 24
31
  },
32
  {
33
  "epoch": 0.42,
34
  "eval_accuracy": 0.8166666666666667,
35
+ "eval_f1_score": 0.8080459770114942,
36
+ "eval_gmean": 0.7501820727030913,
37
+ "eval_loss": 0.5816406011581421,
38
+ "eval_precision": 0.8133022774327122,
39
  "eval_recall": 0.8166666666666667,
40
+ "eval_runtime": 175.4354,
41
+ "eval_samples_per_second": 0.342,
42
+ "eval_steps_per_second": 0.046,
43
  "step": 28
44
  },
45
  {
46
  "epoch": 0.48,
47
+ "grad_norm": 6.625,
48
  "learning_rate": 1.076923076923077e-05,
49
+ "loss": 0.3979,
50
  "step": 32
51
  },
52
  {
53
  "epoch": 0.6,
54
+ "grad_norm": 7.875,
55
  "learning_rate": 8.307692307692309e-06,
56
+ "loss": 0.3657,
57
  "step": 40
58
  },
59
  {
60
  "epoch": 0.72,
61
+ "grad_norm": 10.0,
62
  "learning_rate": 5.846153846153847e-06,
63
+ "loss": 0.38,
64
  "step": 48
65
  },
66
  {
67
  "epoch": 0.84,
68
+ "grad_norm": 9.6875,
69
  "learning_rate": 3.384615384615385e-06,
70
+ "loss": 0.4054,
71
  "step": 56
72
  },
73
  {
74
  "epoch": 0.84,
75
  "eval_accuracy": 0.8166666666666667,
76
+ "eval_f1_score": 0.8080459770114942,
77
+ "eval_gmean": 0.7501820727030913,
78
+ "eval_loss": 0.5850911736488342,
79
+ "eval_precision": 0.8133022774327122,
80
  "eval_recall": 0.8166666666666667,
81
+ "eval_runtime": 173.49,
82
+ "eval_samples_per_second": 0.346,
83
+ "eval_steps_per_second": 0.046,
84
  "step": 56
85
  },
86
  {
87
  "epoch": 0.96,
88
+ "grad_norm": 8.8125,
89
  "learning_rate": 9.230769230769232e-07,
90
+ "loss": 0.3864,
91
  "step": 64
92
  },
93
  {
94
  "epoch": 1.0,
95
  "step": 67,
96
  "total_flos": 8.435821078904832e+16,
97
+ "train_loss": 0.405215135261194,
98
+ "train_runtime": 12957.5785,
99
+ "train_samples_per_second": 0.33,
100
  "train_steps_per_second": 0.005
101
  }
102
  ],