danield12 commited on
Commit
16934cd
·
verified ·
1 Parent(s): 0f92b28

Upload folder using huggingface_hub

Browse files
adapter_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6108dc25ba5aa452a9c8d2e2e7d6ef2951bcb6110a3c096753940fa8b361588b
3
  size 160086542
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ea8d277e715e2a736fbe18142a6cebf1b073418e531abda67df373f2f7a44731
3
  size 160086542
all_results.json CHANGED
@@ -1,17 +1,17 @@
1
  {
2
- "epoch": 0.98,
3
- "eval_accuracy": 0.45,
4
- "eval_f1_score": 0.413184584178499,
5
- "eval_gmean": 0.43716017951820696,
6
- "eval_loss": 1.7248046398162842,
7
- "eval_precision": 0.42000000000000004,
8
- "eval_recall": 0.45,
9
- "eval_runtime": 249.5755,
10
- "eval_samples_per_second": 0.321,
11
- "eval_steps_per_second": 0.04,
12
- "total_flos": 1.28114982125568e+16,
13
- "train_loss": 1.59609375,
14
- "train_runtime": 2284.6483,
15
- "train_samples_per_second": 0.281,
16
- "train_steps_per_second": 0.004
17
  }
 
1
  {
2
+ "epoch": 0.87,
3
+ "eval_accuracy": 0.5824175824175825,
4
+ "eval_f1_score": 0.5868882275132276,
5
+ "eval_gmean": 0.49316056422674454,
6
+ "eval_loss": 0.8609203100204468,
7
+ "eval_precision": 0.5918367346938775,
8
+ "eval_recall": 0.5824175824175825,
9
+ "eval_runtime": 40.3783,
10
+ "eval_samples_per_second": 2.254,
11
+ "eval_steps_per_second": 0.297,
12
+ "total_flos": 1701527106355200.0,
13
+ "train_loss": 0.9130859375,
14
+ "train_runtime": 390.6328,
15
+ "train_samples_per_second": 1.856,
16
+ "train_steps_per_second": 0.013
17
  }
eval_results.json CHANGED
@@ -1,12 +1,12 @@
1
  {
2
- "epoch": 0.98,
3
- "eval_accuracy": 0.45,
4
- "eval_f1_score": 0.413184584178499,
5
- "eval_gmean": 0.43716017951820696,
6
- "eval_loss": 1.7248046398162842,
7
- "eval_precision": 0.42000000000000004,
8
- "eval_recall": 0.45,
9
- "eval_runtime": 249.5755,
10
- "eval_samples_per_second": 0.321,
11
- "eval_steps_per_second": 0.04
12
  }
 
1
  {
2
+ "epoch": 0.87,
3
+ "eval_accuracy": 0.5824175824175825,
4
+ "eval_f1_score": 0.5868882275132276,
5
+ "eval_gmean": 0.49316056422674454,
6
+ "eval_loss": 0.8609203100204468,
7
+ "eval_precision": 0.5918367346938775,
8
+ "eval_recall": 0.5824175824175825,
9
+ "eval_runtime": 40.3783,
10
+ "eval_samples_per_second": 2.254,
11
+ "eval_steps_per_second": 0.297
12
  }
runs/Mar25_17-36-23_7eee068d60ee/events.out.tfevents.1711388186.7eee068d60ee.34.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:02850e21d1a25753baac20c56014e6034a3a85532da4d6bc2328b77019830cd5
3
+ size 5269
runs/Mar25_17-36-23_7eee068d60ee/events.out.tfevents.1711388617.7eee068d60ee.34.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a6700ebad37c22a41e4b8f035a5742ae7b1142a07b17390f4d7cb275e734baf4
3
+ size 605
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 0.98,
3
- "total_flos": 1.28114982125568e+16,
4
- "train_loss": 1.59609375,
5
- "train_runtime": 2284.6483,
6
- "train_samples_per_second": 0.281,
7
- "train_steps_per_second": 0.004
8
  }
 
1
  {
2
+ "epoch": 0.87,
3
+ "total_flos": 1701527106355200.0,
4
+ "train_loss": 0.9130859375,
5
+ "train_runtime": 390.6328,
6
+ "train_samples_per_second": 1.856,
7
+ "train_steps_per_second": 0.013
8
  }
trainer_state.json CHANGED
@@ -1,50 +1,30 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.975609756097561,
5
  "eval_steps": 8,
6
- "global_step": 10,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
- "epoch": 0.78,
13
- "grad_norm": 34.5,
14
- "learning_rate": 5e-06,
15
- "loss": 1.6561,
16
- "step": 8
17
- },
18
- {
19
- "epoch": 0.78,
20
- "eval_accuracy": 0.45,
21
- "eval_f1_score": 0.413184584178499,
22
- "eval_gmean": 0.43716017951820696,
23
- "eval_loss": 1.7263672351837158,
24
- "eval_precision": 0.42000000000000004,
25
- "eval_recall": 0.45,
26
- "eval_runtime": 249.5589,
27
- "eval_samples_per_second": 0.321,
28
- "eval_steps_per_second": 0.04,
29
- "step": 8
30
- },
31
- {
32
- "epoch": 0.98,
33
- "step": 10,
34
- "total_flos": 1.28114982125568e+16,
35
- "train_loss": 1.59609375,
36
- "train_runtime": 2284.6483,
37
- "train_samples_per_second": 0.281,
38
- "train_steps_per_second": 0.004
39
  }
40
  ],
41
  "logging_steps": 8,
42
- "max_steps": 10,
43
  "num_input_tokens_seen": 0,
44
  "num_train_epochs": 1,
45
  "save_steps": 500,
46
- "total_flos": 1.28114982125568e+16,
47
- "train_batch_size": 16,
48
  "trial_name": null,
49
  "trial_params": null
50
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.8695652173913043,
5
  "eval_steps": 8,
6
+ "global_step": 5,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
+ "epoch": 0.87,
13
+ "step": 5,
14
+ "total_flos": 1701527106355200.0,
15
+ "train_loss": 0.9130859375,
16
+ "train_runtime": 390.6328,
17
+ "train_samples_per_second": 1.856,
18
+ "train_steps_per_second": 0.013
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
19
  }
20
  ],
21
  "logging_steps": 8,
22
+ "max_steps": 5,
23
  "num_input_tokens_seen": 0,
24
  "num_train_epochs": 1,
25
  "save_steps": 500,
26
+ "total_flos": 1701527106355200.0,
27
+ "train_batch_size": 32,
28
  "trial_name": null,
29
  "trial_params": null
30
  }