Ethan615 committed on
Commit
e46601f
·
1 Parent(s): 937e940

Training in progress, epoch 1

Browse files
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ff45c0b93d503c4ab2cceae124b29584f7fbda2cef9dcc16084a848f895df539
3
  size 267832560
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3856f5d52b139f68324c7fde3f7b30f487ee6e7fee6adeb65d95f8f88928dc48
3
  size 267832560
run-3/checkpoint-2138/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:80f2c334ed4f1f294a2f916451cea250a4cfa86cd9c6ec539ac77b6e87747ee5
3
  size 267832560
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3856f5d52b139f68324c7fde3f7b30f487ee6e7fee6adeb65d95f8f88928dc48
3
  size 267832560
run-3/checkpoint-2138/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9c5e39aab0ba5776938cf76f475fbe95fc4816348d471338d1eda66c42a7f697
3
  size 535727290
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4e472fbf5f8cc5c472eae2173d310316c60a1b566a27c98944f6e61017eab16f
3
  size 535727290
run-3/checkpoint-2138/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d076be17692cfa345b0f1981db591dc8bcdd0b29c1b64b0637d37bb7f8ea4265
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:21acd9373ba2636a96a037599a124a8848e64458d7ed9a26ffc24cbd4056b661
3
  size 14244
run-3/checkpoint-2138/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f78ca8dc6a7929f80c42b973d6b726c0c10724f3fabc46b62fb266e16c4fb748
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f4249bf660aed0d3def9d8b0f79d921f7a157b3f4104064206caa1eaa6c6ede4
3
  size 1064
run-3/checkpoint-2138/trainer_state.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "best_metric": 0.3194134442722084,
3
  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-3/checkpoint-2138",
4
  "epoch": 1.0,
5
  "eval_steps": 500,
@@ -10,35 +10,35 @@
10
  "log_history": [
11
  {
12
  "epoch": 0.23,
13
- "learning_rate": 2.109376138070761e-06,
14
- "loss": 0.5971,
15
  "step": 500
16
  },
17
  {
18
  "epoch": 0.47,
19
- "learning_rate": 1.8300625604660523e-06,
20
- "loss": 0.575,
21
  "step": 1000
22
  },
23
  {
24
  "epoch": 0.7,
25
- "learning_rate": 1.5507489828613434e-06,
26
- "loss": 0.5345,
27
  "step": 1500
28
  },
29
  {
30
  "epoch": 0.94,
31
- "learning_rate": 1.2714354052566345e-06,
32
- "loss": 0.5352,
33
  "step": 2000
34
  },
35
  {
36
  "epoch": 1.0,
37
- "eval_loss": 0.5899004936218262,
38
- "eval_matthews_correlation": 0.3194134442722084,
39
- "eval_runtime": 0.7491,
40
- "eval_samples_per_second": 1392.35,
41
- "eval_steps_per_second": 88.107,
42
  "step": 2138
43
  }
44
  ],
@@ -47,13 +47,13 @@
47
  "num_input_tokens_seen": 0,
48
  "num_train_epochs": 2,
49
  "save_steps": 500,
50
- "total_flos": 32608713001968.0,
51
  "train_batch_size": 4,
52
  "trial_name": null,
53
  "trial_params": {
54
- "learning_rate": 2.38868971567547e-06,
55
  "num_train_epochs": 2,
56
  "per_device_train_batch_size": 4,
57
- "seed": 28
58
  }
59
  }
 
1
  {
2
+ "best_metric": 0.0463559874942472,
3
  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-3/checkpoint-2138",
4
  "epoch": 1.0,
5
  "eval_steps": 500,
 
10
  "log_history": [
11
  {
12
  "epoch": 0.23,
13
+ "learning_rate": 1.3504098486610872e-06,
14
+ "loss": 0.6235,
15
  "step": 500
16
  },
17
  {
18
  "epoch": 0.47,
19
+ "learning_rate": 1.1715949852260916e-06,
20
+ "loss": 0.6084,
21
  "step": 1000
22
  },
23
  {
24
  "epoch": 0.7,
25
+ "learning_rate": 9.92780121791096e-07,
26
+ "loss": 0.5687,
27
  "step": 1500
28
  },
29
  {
30
  "epoch": 0.94,
31
+ "learning_rate": 8.139652583561002e-07,
32
+ "loss": 0.5599,
33
  "step": 2000
34
  },
35
  {
36
  "epoch": 1.0,
37
+ "eval_loss": 0.5971149802207947,
38
+ "eval_matthews_correlation": 0.0463559874942472,
39
+ "eval_runtime": 0.7351,
40
+ "eval_samples_per_second": 1418.884,
41
+ "eval_steps_per_second": 89.786,
42
  "step": 2138
43
  }
44
  ],
 
47
  "num_input_tokens_seen": 0,
48
  "num_train_epochs": 2,
49
  "save_steps": 500,
50
+ "total_flos": 32410011903984.0,
51
  "train_batch_size": 4,
52
  "trial_name": null,
53
  "trial_params": {
54
+ "learning_rate": 1.529224712096083e-06,
55
  "num_train_epochs": 2,
56
  "per_device_train_batch_size": 4,
57
+ "seed": 5
58
  }
59
  }
run-3/checkpoint-2138/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:58fae703abd28cb0ab5528ac939f06e8a9578110f6c6558da0b2c2f9c2704502
3
  size 4792
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ff0b8762417b71e573ee14cf5d6c55e801af11f299848bcf4bde51f1e4499d53
3
  size 4792
runs/Dec23_01-09-39_cab176ec49ea/events.out.tfevents.1703294598.cab176ec49ea.681.5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0aec5cbcca727aa7079f2bff88b7723e3256d02957fd46f8f12881568ec6a043
3
+ size 5459
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:57f7a911be8af835fd7cdb5ddc7dfd5e78fd1882a2c8b09cc2ae78dc7aabb4f0
3
  size 4792
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ff0b8762417b71e573ee14cf5d6c55e801af11f299848bcf4bde51f1e4499d53
3
  size 4792