LamaDiab committed on
Commit
5aa80db
·
verified ·
1 Parent(s): e1a149d

Training in progress, epoch 3, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -51,7 +51,7 @@ model-index:
51
  type: unknown
52
  metrics:
53
  - type: cosine_accuracy
54
- value: 0.9241451621055603
55
  name: Cosine Accuracy
56
  ---
57
 
@@ -116,9 +116,9 @@ print(embeddings.shape)
116
  # Get the similarity scores for the embeddings
117
  similarities = model.similarity(embeddings, embeddings)
118
  print(similarities)
119
- # tensor([[1.0000, 0.7980, 0.5008],
120
- # [0.7980, 1.0000, 0.4856],
121
- # [0.5008, 0.4856, 1.0000]])
122
  ```
123
 
124
  <!--
@@ -155,7 +155,7 @@ You can finetune this model on your own dataset.
155
 
156
  | Metric | Value |
157
  |:--------------------|:-----------|
158
- | **cosine_accuracy** | **0.9241** |
159
 
160
  <!--
161
  ## Bias, Risks and Limitations
@@ -370,6 +370,7 @@ You can finetune this model on your own dataset.
370
  | 0.0009 | 1 | 5.8495 | - | - |
371
  | 1.0 | 1139 | 3.0136 | 0.8482 | 0.9113 |
372
  | 2.0 | 2278 | 2.2096 | 0.7465 | 0.9241 |
 
373
 
374
 
375
  ### Framework Versions
 
51
  type: unknown
52
  metrics:
53
  - type: cosine_accuracy
54
+ value: 0.9337190985679626
55
  name: Cosine Accuracy
56
  ---
57
 
 
116
  # Get the similarity scores for the embeddings
117
  similarities = model.similarity(embeddings, embeddings)
118
  print(similarities)
119
+ # tensor([[1.0000, 0.7955, 0.3891],
120
+ # [0.7955, 1.0000, 0.4118],
121
+ # [0.3891, 0.4118, 1.0000]])
122
  ```
123
 
124
  <!--
 
155
 
156
  | Metric | Value |
157
  |:--------------------|:-----------|
158
+ | **cosine_accuracy** | **0.9337** |
159
 
160
  <!--
161
  ## Bias, Risks and Limitations
 
370
  | 0.0009 | 1 | 5.8495 | - | - |
371
  | 1.0 | 1139 | 3.0136 | 0.8482 | 0.9113 |
372
  | 2.0 | 2278 | 2.2096 | 0.7465 | 0.9241 |
373
+ | 3.0 | 3417 | 1.966 | 0.6980 | 0.9337 |
374
 
375
 
376
  ### Framework Versions
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e2e39231c7d8067da68842fefd4abad2ff8b91970af67955ad9c5f19ccf161a8
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5e94dfce1c7a8097a517cdc7e18867845b8cf07b8debbb4c7f86dacfe33f0ad0
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:25fc21c2982d17aa3f6fc707f27442f5d1e5edf6276f4ebcbbe1fc1d17a98a9d
3
  size 180607738
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b6e5d3026902eda477b64ceaeccd2e204dd15555061fe0a6a4f2baabb9021e9a
3
  size 180607738
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e2bf362531f74a3fe6ba5f06065875963cf9872e2a6a7835093b5dc7a57b8290
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0bd7c67a9db13a1d1d92181014a6e67813669ee1bbe4529e719f8b5106877aef
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3c4c7b163f9ecd5aa5916a8a707d0281dceeb0bb3b46ace886ee05988e38d2f2
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:67a6b234e82620ea3da8e2a9835166f15a378f21f79ddb4af11eb7a0b287008f
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6a0cbb301e0d0f2e8f6962d0b550760545cc3333a5fead2dc22aebe3963c95d2
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ecbc50cd28f5eb9a427ea169ea55add1d74447c6784544c0cff4a17d832f4ec4
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 2.0,
6
  "eval_steps": 500,
7
- "global_step": 2278,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -47,6 +47,22 @@
47
  "eval_samples_per_second": 277.551,
48
  "eval_steps_per_second": 1.11,
49
  "step": 2278
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
50
  }
51
  ],
52
  "logging_steps": 500,
@@ -61,7 +77,7 @@
61
  "should_evaluate": false,
62
  "should_log": false,
63
  "should_save": true,
64
- "should_training_stop": false
65
  },
66
  "attributes": {}
67
  }
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 3.0,
6
  "eval_steps": 500,
7
+ "global_step": 3417,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
47
  "eval_samples_per_second": 277.551,
48
  "eval_steps_per_second": 1.11,
49
  "step": 2278
50
+ },
51
+ {
52
+ "epoch": 3.0,
53
+ "grad_norm": 10.734906196594238,
54
+ "learning_rate": 2.1939447125932427e-08,
55
+ "loss": 1.966,
56
+ "step": 3417
57
+ },
58
+ {
59
+ "epoch": 3.0,
60
+ "eval_cosine_accuracy": 0.9337190985679626,
61
+ "eval_loss": 0.6979679465293884,
62
+ "eval_runtime": 34.569,
63
+ "eval_samples_per_second": 274.957,
64
+ "eval_steps_per_second": 1.099,
65
+ "step": 3417
66
  }
67
  ],
68
  "logging_steps": 500,
 
77
  "should_evaluate": false,
78
  "should_log": false,
79
  "should_save": true,
80
+ "should_training_stop": true
81
  },
82
  "attributes": {}
83
  }