danield12 commited on
Commit
c272b10
·
verified ·
1 Parent(s): 32027ee

Upload folder using huggingface_hub

Browse files
adapter_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d661b5d8e28c6286c4f688153e59f25326218295967aead1da1fcca840dd8cde
3
  size 160086542
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e1f061d4fe605304382b94e7f5a8f2230c7c7ba50f77add04cea55be514ab750
3
  size 160086542
all_results.json CHANGED
@@ -1,17 +1,17 @@
1
  {
2
  "epoch": 1.0,
3
- "eval_accuracy": 0.72,
4
- "eval_f1_score": 0.7154911433172302,
5
- "eval_gmean": 0.7399824497743348,
6
- "eval_loss": 0.6498633027076721,
7
- "eval_precision": 0.7727777777777777,
8
- "eval_recall": 0.72,
9
- "eval_runtime": 137.6618,
10
- "eval_samples_per_second": 0.363,
11
- "eval_steps_per_second": 0.051,
12
  "total_flos": 8.468389371174912e+16,
13
- "train_loss": 0.9084581972947762,
14
- "train_runtime": 14096.0939,
15
- "train_samples_per_second": 0.304,
16
  "train_steps_per_second": 0.005
17
  }
 
1
  {
2
  "epoch": 1.0,
3
+ "eval_accuracy": 0.7666666666666667,
4
+ "eval_f1_score": 0.7677224736048267,
5
+ "eval_gmean": 0.765713693437345,
6
+ "eval_loss": 0.5444498658180237,
7
+ "eval_precision": 0.7704826038159371,
8
+ "eval_recall": 0.7666666666666667,
9
+ "eval_runtime": 188.2947,
10
+ "eval_samples_per_second": 0.319,
11
+ "eval_steps_per_second": 0.042,
12
  "total_flos": 8.468389371174912e+16,
13
+ "train_loss": 0.6622405550373134,
14
+ "train_runtime": 13770.5671,
15
+ "train_samples_per_second": 0.311,
16
  "train_steps_per_second": 0.005
17
  }
eval_results.json CHANGED
@@ -1,12 +1,12 @@
1
  {
2
  "epoch": 1.0,
3
- "eval_accuracy": 0.72,
4
- "eval_f1_score": 0.7154911433172302,
5
- "eval_gmean": 0.7399824497743348,
6
- "eval_loss": 0.6498633027076721,
7
- "eval_precision": 0.7727777777777777,
8
- "eval_recall": 0.72,
9
- "eval_runtime": 137.6618,
10
- "eval_samples_per_second": 0.363,
11
- "eval_steps_per_second": 0.051
12
  }
 
1
  {
2
  "epoch": 1.0,
3
+ "eval_accuracy": 0.7666666666666667,
4
+ "eval_f1_score": 0.7677224736048267,
5
+ "eval_gmean": 0.765713693437345,
6
+ "eval_loss": 0.5444498658180237,
7
+ "eval_precision": 0.7704826038159371,
8
+ "eval_recall": 0.7666666666666667,
9
+ "eval_runtime": 188.2947,
10
+ "eval_samples_per_second": 0.319,
11
+ "eval_steps_per_second": 0.042
12
  }
runs/Apr02_02-36-30_f5b09d025ffe/events.out.tfevents.1712025392.f5b09d025ffe.34.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2e95d7c987cf1c6cb9f8e9fbe5806720a6e344b8f47d6a1b136006d1eeee2427
3
+ size 7948
runs/Apr02_02-36-30_f5b09d025ffe/events.out.tfevents.1712039351.f5b09d025ffe.34.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f7d0cbf5246eea7aa31fe78df556d504877c2f52b3ebfb061b5ca5bf0c05f9c7
3
+ size 605
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 1.0,
3
  "total_flos": 8.468389371174912e+16,
4
- "train_loss": 0.9084581972947762,
5
- "train_runtime": 14096.0939,
6
- "train_samples_per_second": 0.304,
7
  "train_steps_per_second": 0.005
8
  }
 
1
  {
2
  "epoch": 1.0,
3
  "total_flos": 8.468389371174912e+16,
4
+ "train_loss": 0.6622405550373134,
5
+ "train_runtime": 13770.5671,
6
+ "train_samples_per_second": 0.311,
7
  "train_steps_per_second": 0.005
8
  }
trainer_state.json CHANGED
@@ -10,93 +10,93 @@
10
  "log_history": [
11
  {
12
  "epoch": 0.12,
13
- "grad_norm": 47.25,
14
  "learning_rate": 1.8153846153846155e-05,
15
- "loss": 1.1395,
16
  "step": 8
17
  },
18
  {
19
  "epoch": 0.24,
20
- "grad_norm": 39.75,
21
  "learning_rate": 1.5692307692307693e-05,
22
- "loss": 1.0434,
23
  "step": 16
24
  },
25
  {
26
  "epoch": 0.36,
27
- "grad_norm": 42.0,
28
  "learning_rate": 1.3230769230769231e-05,
29
- "loss": 0.8923,
30
  "step": 24
31
  },
32
  {
33
  "epoch": 0.42,
34
- "eval_accuracy": 0.66,
35
- "eval_f1_score": 0.6473765809873521,
36
- "eval_gmean": 0.6861694917646597,
37
- "eval_loss": 0.692578136920929,
38
- "eval_precision": 0.7367619047619047,
39
- "eval_recall": 0.66,
40
- "eval_runtime": 137.4001,
41
- "eval_samples_per_second": 0.364,
42
- "eval_steps_per_second": 0.051,
43
  "step": 28
44
  },
45
  {
46
  "epoch": 0.48,
47
- "grad_norm": 41.5,
48
  "learning_rate": 1.076923076923077e-05,
49
- "loss": 0.8968,
50
  "step": 32
51
  },
52
  {
53
  "epoch": 0.6,
54
- "grad_norm": 40.75,
55
  "learning_rate": 8.307692307692309e-06,
56
- "loss": 0.8597,
57
  "step": 40
58
  },
59
  {
60
  "epoch": 0.72,
61
- "grad_norm": 29.0,
62
  "learning_rate": 5.846153846153847e-06,
63
- "loss": 0.8077,
64
  "step": 48
65
  },
66
  {
67
  "epoch": 0.84,
68
- "grad_norm": 37.75,
69
  "learning_rate": 3.384615384615385e-06,
70
- "loss": 0.8601,
71
  "step": 56
72
  },
73
  {
74
  "epoch": 0.84,
75
- "eval_accuracy": 0.72,
76
- "eval_f1_score": 0.7154911433172302,
77
- "eval_gmean": 0.7399824497743348,
78
- "eval_loss": 0.6498633027076721,
79
- "eval_precision": 0.7727777777777777,
80
- "eval_recall": 0.72,
81
- "eval_runtime": 137.4306,
82
- "eval_samples_per_second": 0.364,
83
- "eval_steps_per_second": 0.051,
84
  "step": 56
85
  },
86
  {
87
  "epoch": 0.96,
88
- "grad_norm": 39.25,
89
  "learning_rate": 9.230769230769232e-07,
90
- "loss": 0.8283,
91
  "step": 64
92
  },
93
  {
94
  "epoch": 1.0,
95
  "step": 67,
96
  "total_flos": 8.468389371174912e+16,
97
- "train_loss": 0.9084581972947762,
98
- "train_runtime": 14096.0939,
99
- "train_samples_per_second": 0.304,
100
  "train_steps_per_second": 0.005
101
  }
102
  ],
 
10
  "log_history": [
11
  {
12
  "epoch": 0.12,
13
+ "grad_norm": 34.75,
14
  "learning_rate": 1.8153846153846155e-05,
15
+ "loss": 0.7945,
16
  "step": 8
17
  },
18
  {
19
  "epoch": 0.24,
20
+ "grad_norm": 28.25,
21
  "learning_rate": 1.5692307692307693e-05,
22
+ "loss": 0.7456,
23
  "step": 16
24
  },
25
  {
26
  "epoch": 0.36,
27
+ "grad_norm": 27.5,
28
  "learning_rate": 1.3230769230769231e-05,
29
+ "loss": 0.6596,
30
  "step": 24
31
  },
32
  {
33
  "epoch": 0.42,
34
+ "eval_accuracy": 0.7333333333333333,
35
+ "eval_f1_score": 0.7351290684624019,
36
+ "eval_gmean": 0.7371330133463562,
37
+ "eval_loss": 0.548876941204071,
38
+ "eval_precision": 0.743418613274008,
39
+ "eval_recall": 0.7333333333333333,
40
+ "eval_runtime": 187.8728,
41
+ "eval_samples_per_second": 0.319,
42
+ "eval_steps_per_second": 0.043,
43
  "step": 28
44
  },
45
  {
46
  "epoch": 0.48,
47
+ "grad_norm": 29.125,
48
  "learning_rate": 1.076923076923077e-05,
49
+ "loss": 0.6566,
50
  "step": 32
51
  },
52
  {
53
  "epoch": 0.6,
54
+ "grad_norm": 28.875,
55
  "learning_rate": 8.307692307692309e-06,
56
+ "loss": 0.6498,
57
  "step": 40
58
  },
59
  {
60
  "epoch": 0.72,
61
+ "grad_norm": 18.25,
62
  "learning_rate": 5.846153846153847e-06,
63
+ "loss": 0.5961,
64
  "step": 48
65
  },
66
  {
67
  "epoch": 0.84,
68
+ "grad_norm": 26.0,
69
  "learning_rate": 3.384615384615385e-06,
70
+ "loss": 0.6411,
71
  "step": 56
72
  },
73
  {
74
  "epoch": 0.84,
75
+ "eval_accuracy": 0.7666666666666667,
76
+ "eval_f1_score": 0.7677224736048267,
77
+ "eval_gmean": 0.765713693437345,
78
+ "eval_loss": 0.544189453125,
79
+ "eval_precision": 0.7704826038159371,
80
+ "eval_recall": 0.7666666666666667,
81
+ "eval_runtime": 188.0296,
82
+ "eval_samples_per_second": 0.319,
83
+ "eval_steps_per_second": 0.043,
84
  "step": 56
85
  },
86
  {
87
  "epoch": 0.96,
88
+ "grad_norm": 25.625,
89
  "learning_rate": 9.230769230769232e-07,
90
+ "loss": 0.6016,
91
  "step": 64
92
  },
93
  {
94
  "epoch": 1.0,
95
  "step": 67,
96
  "total_flos": 8.468389371174912e+16,
97
+ "train_loss": 0.6622405550373134,
98
+ "train_runtime": 13770.5671,
99
+ "train_samples_per_second": 0.311,
100
  "train_steps_per_second": 0.005
101
  }
102
  ],