Amr-h committed on
Commit
eee1782
·
verified ·
1 Parent(s): 5bf7954

Training in progress, epoch 3, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -93,7 +93,7 @@ model-index:
93
  type: validation_eval
94
  metrics:
95
  - type: cosine_accuracy
96
- value: 0.9627359509468079
97
  name: Cosine Accuracy
98
  ---
99
 
@@ -198,7 +198,7 @@ You can finetune this model on your own dataset.
198
 
199
  | Metric | Value |
200
  |:--------------------|:-----------|
201
- | **cosine_accuracy** | **0.9627** |
202
 
203
  <!--
204
  ## Bias, Risks and Limitations
@@ -433,6 +433,7 @@ You can finetune this model on your own dataset.
433
  | None | 0 | - | 0.9213 |
434
  | 1.0 | 835 | 26.455 | 0.9581 |
435
  | 2.0 | 1670 | 12.0476 | 0.9627 |
 
436
 
437
 
438
  ### Framework Versions
 
93
  type: validation_eval
94
  metrics:
95
  - type: cosine_accuracy
96
+ value: 0.9635822772979736
97
  name: Cosine Accuracy
98
  ---
99
 
 
198
 
199
  | Metric | Value |
200
  |:--------------------|:-----------|
201
+ | **cosine_accuracy** | **0.9636** |
202
 
203
  <!--
204
  ## Bias, Risks and Limitations
 
433
  | None | 0 | - | 0.9213 |
434
  | 1.0 | 835 | 26.455 | 0.9581 |
435
  | 2.0 | 1670 | 12.0476 | 0.9627 |
436
+ | 3.0 | 2505 | 7.3661 | 0.9636 |
437
 
438
 
439
  ### Framework Versions
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8d08e25a63b01b202f572d87ae4aeea67252e02e34a3469fcdc5c131dcbc88b1
3
  size 1112197096
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fea8b27fc08c6cd4a81a04c6c85caa5c5b9ceb8806192e42d3abf17bc88ef907
3
  size 1112197096
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:176ab230b15d6519afab3210be0460d7980f81666c095aac796177b564d7c1e9
3
  size 1712830650
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d685da34be96e414f20c69a2228a75a254ed83336c1c978188c57288cf53f8ed
3
  size 1712830650
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e608683bf0a0df17239b942462c855799007b17c46c86ac75de346d7f8c13f07
3
  size 14180
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4f423783f8bcf859aff29ed45246cdfe4d5c18ef35d5279c118ba2ed968fd10b
3
  size 14180
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b72542e73ffe194c38cfae2e78e12be45749d8876a8ac01e53f8ee3ee8ccc453
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:db3b99e61d88d736baa6fd0e3a94f01e1acd99229821cfd2422e29d6875b89ef
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cf6e95f099c43357b5edfafb88b378a3076c67a8db5b80d9451dfee7962b8f61
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:26865453805f3926bdbe81c531a088d85786e5a73d544511eef68b50ddb4e9da
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,10 +1,10 @@
1
  {
2
- "best_global_step": 1670,
3
- "best_metric": 0.9627359509468079,
4
- "best_model_checkpoint": "/kaggle/working/checkpoint-1670",
5
- "epoch": 2.0,
6
  "eval_steps": 500,
7
- "global_step": 1670,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -40,6 +40,22 @@
40
  "eval_steps_per_second": 0.0,
41
  "eval_validation_eval_cosine_accuracy": 0.9627359509468079,
42
  "step": 1670
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
43
  }
44
  ],
45
  "logging_steps": 500,
 
1
  {
2
+ "best_global_step": 2505,
3
+ "best_metric": 0.9635822772979736,
4
+ "best_model_checkpoint": "/kaggle/working/checkpoint-2505",
5
+ "epoch": 3.0,
6
  "eval_steps": 500,
7
+ "global_step": 2505,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
40
  "eval_steps_per_second": 0.0,
41
  "eval_validation_eval_cosine_accuracy": 0.9627359509468079,
42
  "step": 1670
43
+ },
44
+ {
45
+ "epoch": 3.0,
46
+ "grad_norm": 86.45789337158203,
47
+ "learning_rate": 1.666253638382422e-05,
48
+ "loss": 7.3661,
49
+ "step": 2505
50
+ },
51
+ {
52
+ "epoch": 3.0,
53
+ "eval_model_preparation_time": 0.0028,
54
+ "eval_runtime": 147.6683,
55
+ "eval_samples_per_second": 0.0,
56
+ "eval_steps_per_second": 0.0,
57
+ "eval_validation_eval_cosine_accuracy": 0.9635822772979736,
58
+ "step": 2505
59
  }
60
  ],
61
  "logging_steps": 500,