danield12 committed on
Commit
57f1ae4
·
verified ·
1 Parent(s): f50323f

Upload folder using huggingface_hub

Browse files
adapter_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4411c80e204fa52239f0e767750debd1cf11225e340233f1709705364827150e
3
  size 160086542
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:83e01fc1d25dedc753f4825dabab388ed7180db6815fc7516b723efdbd0fc2c1
3
  size 160086542
all_results.json CHANGED
@@ -1,17 +1,17 @@
1
  {
2
- "epoch": 1.0,
3
- "eval_accuracy": 0.85,
4
- "eval_f1_score": 0.8504053648283457,
5
- "eval_gmean": 0.8587214900086042,
6
- "eval_loss": 0.44022461771965027,
7
- "eval_precision": 0.8646326776395022,
8
- "eval_recall": 0.85,
9
- "eval_runtime": 281.2283,
10
- "eval_samples_per_second": 0.356,
11
- "eval_steps_per_second": 0.046,
12
- "total_flos": 8.435821078904832e+16,
13
- "train_loss": 0.508428317397388,
14
- "train_runtime": 14877.7814,
15
- "train_samples_per_second": 0.288,
16
- "train_steps_per_second": 0.005
17
  }
 
1
  {
2
+ "epoch": 0.99,
3
+ "eval_accuracy": 0.78,
4
+ "eval_f1_score": 0.7760000000000001,
5
+ "eval_gmean": 0.7929678856251685,
6
+ "eval_loss": 0.5592187643051147,
7
+ "eval_precision": 0.82625,
8
+ "eval_recall": 0.78,
9
+ "eval_runtime": 111.3804,
10
+ "eval_samples_per_second": 0.449,
11
+ "eval_steps_per_second": 0.063,
12
+ "total_flos": 8.453461911404544e+16,
13
+ "train_loss": 0.6594164299242424,
14
+ "train_runtime": 12749.8583,
15
+ "train_samples_per_second": 0.336,
16
+ "train_steps_per_second": 0.003
17
  }
eval_results.json CHANGED
@@ -1,12 +1,12 @@
1
  {
2
- "epoch": 1.0,
3
- "eval_accuracy": 0.85,
4
- "eval_f1_score": 0.8504053648283457,
5
- "eval_gmean": 0.8587214900086042,
6
- "eval_loss": 0.44022461771965027,
7
- "eval_precision": 0.8646326776395022,
8
- "eval_recall": 0.85,
9
- "eval_runtime": 281.2283,
10
- "eval_samples_per_second": 0.356,
11
- "eval_steps_per_second": 0.046
12
  }
 
1
  {
2
+ "epoch": 0.99,
3
+ "eval_accuracy": 0.78,
4
+ "eval_f1_score": 0.7760000000000001,
5
+ "eval_gmean": 0.7929678856251685,
6
+ "eval_loss": 0.5592187643051147,
7
+ "eval_precision": 0.82625,
8
+ "eval_recall": 0.78,
9
+ "eval_runtime": 111.3804,
10
+ "eval_samples_per_second": 0.449,
11
+ "eval_steps_per_second": 0.063
12
  }
runs/Mar26_17-17-40_59245c7fbd53/events.out.tfevents.1711473463.59245c7fbd53.35.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:78d3d71e8db1d0d700ef4e012d647e61ee029dbbf36c81703e4e8125a1070707
3
+ size 4964
runs/Mar26_18-20-56_8514445b457f/events.out.tfevents.1711477258.8514445b457f.34.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eecbc248a4c8d4479ac388fa729b32724647f89d0da072f0380e10a93e711d69
3
+ size 4964
runs/Mar26_18-21-19_8514445b457f/events.out.tfevents.1711477279.8514445b457f.34.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dadfc8b19dcc306bcd08d6fd47061d7b755f2d11995ead5d89b58359b4f2d842
3
+ size 6657
runs/Mar26_18-21-19_8514445b457f/events.out.tfevents.1711490140.8514445b457f.34.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3a57f4a061bf5f2b0373447b879ac5ccc98f298a199fde4dc3366e7b4217a2d1
3
+ size 605
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 1.0,
3
- "total_flos": 8.435821078904832e+16,
4
- "train_loss": 0.508428317397388,
5
- "train_runtime": 14877.7814,
6
- "train_samples_per_second": 0.288,
7
- "train_steps_per_second": 0.005
8
  }
 
1
  {
2
+ "epoch": 0.99,
3
+ "total_flos": 8.453461911404544e+16,
4
+ "train_loss": 0.6594164299242424,
5
+ "train_runtime": 12749.8583,
6
+ "train_samples_per_second": 0.336,
7
+ "train_steps_per_second": 0.003
8
  }
trainer_state.json CHANGED
@@ -1,138 +1,71 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 1.0,
5
- "eval_steps": 16,
6
- "global_step": 67,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
- {
12
- "epoch": 0.12,
13
- "grad_norm": 22.625,
14
- "learning_rate": 1.8153846153846155e-05,
15
- "loss": 0.6146,
16
- "step": 8
17
- },
18
- {
19
- "epoch": 0.24,
20
- "grad_norm": 23.375,
21
- "learning_rate": 1.5692307692307693e-05,
22
- "loss": 0.5536,
23
- "step": 16
24
- },
25
  {
26
  "epoch": 0.24,
27
- "eval_accuracy": 0.84,
28
- "eval_f1_score": 0.8403201280512205,
29
- "eval_gmean": 0.849780720378659,
30
- "eval_loss": 0.4766210913658142,
31
- "eval_precision": 0.8575523349436394,
32
- "eval_recall": 0.84,
33
- "eval_runtime": 281.1532,
34
- "eval_samples_per_second": 0.356,
35
- "eval_steps_per_second": 0.046,
36
- "step": 16
37
- },
38
- {
39
- "epoch": 0.36,
40
- "grad_norm": 12.5,
41
- "learning_rate": 1.3230769230769231e-05,
42
- "loss": 0.5034,
43
- "step": 24
44
- },
45
- {
46
- "epoch": 0.48,
47
- "grad_norm": 9.0625,
48
- "learning_rate": 1.076923076923077e-05,
49
- "loss": 0.4886,
50
- "step": 32
51
  },
52
  {
53
  "epoch": 0.48,
54
- "eval_accuracy": 0.85,
55
- "eval_f1_score": 0.8504053648283457,
56
- "eval_gmean": 0.8587214900086042,
57
- "eval_loss": 0.4527539014816284,
58
- "eval_precision": 0.8646326776395022,
59
- "eval_recall": 0.85,
60
- "eval_runtime": 280.8117,
61
- "eval_samples_per_second": 0.356,
62
- "eval_steps_per_second": 0.046,
63
- "step": 32
64
- },
65
- {
66
- "epoch": 0.6,
67
- "grad_norm": 14.0,
68
- "learning_rate": 8.307692307692309e-06,
69
- "loss": 0.4542,
70
- "step": 40
71
- },
72
- {
73
- "epoch": 0.72,
74
- "grad_norm": 21.625,
75
- "learning_rate": 5.846153846153847e-06,
76
- "loss": 0.4781,
77
- "step": 48
78
  },
79
  {
80
  "epoch": 0.72,
81
- "eval_accuracy": 0.85,
82
- "eval_f1_score": 0.8504053648283457,
83
- "eval_gmean": 0.8587214900086042,
84
- "eval_loss": 0.44312500953674316,
85
- "eval_precision": 0.8646326776395022,
86
- "eval_recall": 0.85,
87
- "eval_runtime": 280.8661,
88
- "eval_samples_per_second": 0.356,
89
- "eval_steps_per_second": 0.046,
90
- "step": 48
91
  },
92
  {
93
  "epoch": 0.84,
94
- "grad_norm": 16.5,
95
- "learning_rate": 3.384615384615385e-06,
96
- "loss": 0.4712,
97
- "step": 56
 
 
 
 
 
 
98
  },
99
  {
100
  "epoch": 0.96,
101
- "grad_norm": 11.9375,
102
- "learning_rate": 9.230769230769232e-07,
103
- "loss": 0.4697,
104
- "step": 64
105
- },
106
- {
107
- "epoch": 0.96,
108
- "eval_accuracy": 0.85,
109
- "eval_f1_score": 0.8504053648283457,
110
- "eval_gmean": 0.8587214900086042,
111
- "eval_loss": 0.44022461771965027,
112
- "eval_precision": 0.8646326776395022,
113
- "eval_recall": 0.85,
114
- "eval_runtime": 281.3025,
115
- "eval_samples_per_second": 0.355,
116
- "eval_steps_per_second": 0.046,
117
- "step": 64
118
  },
119
  {
120
- "epoch": 1.0,
121
- "step": 67,
122
- "total_flos": 8.435821078904832e+16,
123
- "train_loss": 0.508428317397388,
124
- "train_runtime": 14877.7814,
125
- "train_samples_per_second": 0.288,
126
- "train_steps_per_second": 0.005
127
  }
128
  ],
129
  "logging_steps": 8,
130
- "max_steps": 67,
131
  "num_input_tokens_seen": 0,
132
  "num_train_epochs": 1,
133
  "save_steps": 500,
134
- "total_flos": 8.435821078904832e+16,
135
- "train_batch_size": 16,
136
  "trial_name": null,
137
  "trial_params": null
138
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.9850746268656716,
5
+ "eval_steps": 28,
6
+ "global_step": 33,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
 
 
 
 
 
 
 
 
 
 
 
 
 
 
11
  {
12
  "epoch": 0.24,
13
+ "grad_norm": 19.75,
14
+ "learning_rate": 1.6129032258064517e-05,
15
+ "loss": 0.7026,
16
+ "step": 8
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
17
  },
18
  {
19
  "epoch": 0.48,
20
+ "grad_norm": 14.875,
21
+ "learning_rate": 1.096774193548387e-05,
22
+ "loss": 0.6661,
23
+ "step": 16
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
24
  },
25
  {
26
  "epoch": 0.72,
27
+ "grad_norm": 18.375,
28
+ "learning_rate": 5.806451612903226e-06,
29
+ "loss": 0.6407,
30
+ "step": 24
 
 
 
 
 
 
31
  },
32
  {
33
  "epoch": 0.84,
34
+ "eval_accuracy": 0.78,
35
+ "eval_f1_score": 0.7760000000000001,
36
+ "eval_gmean": 0.7929678856251685,
37
+ "eval_loss": 0.5600000023841858,
38
+ "eval_precision": 0.82625,
39
+ "eval_recall": 0.78,
40
+ "eval_runtime": 108.8057,
41
+ "eval_samples_per_second": 0.46,
42
+ "eval_steps_per_second": 0.064,
43
+ "step": 28
44
  },
45
  {
46
  "epoch": 0.96,
47
+ "grad_norm": 16.25,
48
+ "learning_rate": 6.451612903225807e-07,
49
+ "loss": 0.6313,
50
+ "step": 32
 
 
 
 
 
 
 
 
 
 
 
 
 
51
  },
52
  {
53
+ "epoch": 0.99,
54
+ "step": 33,
55
+ "total_flos": 8.453461911404544e+16,
56
+ "train_loss": 0.6594164299242424,
57
+ "train_runtime": 12749.8583,
58
+ "train_samples_per_second": 0.336,
59
+ "train_steps_per_second": 0.003
60
  }
61
  ],
62
  "logging_steps": 8,
63
+ "max_steps": 33,
64
  "num_input_tokens_seen": 0,
65
  "num_train_epochs": 1,
66
  "save_steps": 500,
67
+ "total_flos": 8.453461911404544e+16,
68
+ "train_batch_size": 32,
69
  "trial_name": null,
70
  "trial_params": null
71
  }