guyhadad01 committed on
Commit
ec4c2fd
·
verified ·
1 Parent(s): 5e5cad2

Training in progress, step 6200, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -286,9 +286,9 @@ print(embeddings.shape)
286
  # Get the similarity scores for the embeddings
287
  similarities = model.similarity(embeddings, embeddings)
288
  print(similarities)
289
- # tensor([[1.0000, 0.6825, 0.0849],
290
- # [0.6825, 1.0000, 0.1574],
291
- # [0.0849, 0.1574, 1.0000]])
292
  ```
293
 
294
  <!--
@@ -1236,6 +1236,10 @@ You can finetune this model on your own dataset.
1236
  | 0.1043 | 5900 | 0.5589 |
1237
  | 0.1051 | 5950 | 0.4507 |
1238
  | 0.1060 | 6000 | 0.5429 |
 
 
 
 
1239
 
1240
 
1241
  ### Framework Versions
 
286
  # Get the similarity scores for the embeddings
287
  similarities = model.similarity(embeddings, embeddings)
288
  print(similarities)
289
+ # tensor([[1.0000, 0.6439, 0.1032],
290
+ # [0.6439, 1.0000, 0.1639],
291
+ # [0.1032, 0.1639, 1.0000]])
292
  ```
293
 
294
  <!--
 
1236
  | 0.1043 | 5900 | 0.5589 |
1237
  | 0.1051 | 5950 | 0.4507 |
1238
  | 0.1060 | 6000 | 0.5429 |
1239
+ | 0.1069 | 6050 | 0.3789 |
1240
+ | 0.1078 | 6100 | 0.3949 |
1241
+ | 0.1087 | 6150 | 0.4491 |
1242
+ | 0.1096 | 6200 | 0.435 |
1243
 
1244
 
1245
  ### Framework Versions
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7789fd8be583c6cd52a2b3c49d3926b4c97ae306770f1629fc1b7121d168f986
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4a5270b151b39c586df44055763986b001c438f14893a5a40f6c947ee59b4dc8
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d02388678163538169399bda8fffa8df551692b3bfa9b7ca53bde07a66c2a6e0
3
  size 180609611
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:427a25cee731ef25ec82aa31f31d5a9a97bf0eeea4714138f8d9bf9fc951230f
3
  size 180609611
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f72d2db1e1a80b4db59e84d70863f853ea4793c1b3630fdd9ffed5098f03c668
3
  size 14645
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9bbae8b7e39c2440f246453cba4933379e4e2419770e59220962ebd5772f6447
3
  size 14645
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7bb2b51b22f222dc6df63edb791d76de5de25b8bb724e885f8753e34cfb8ae10
3
  size 1383
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aced43cc9ad9f7501c29ad5e5ca57ee953f249e122ae417e48492911cc37f15d
3
  size 1383
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:df255e26e463b4fc70f27b3a2f6c9b68f20dc79363ed0890520e03d68a77d6b1
3
  size 1465
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0476ebd1df369b140089da74c2363c20e1328e3a729f4bbbf994d19625550ab9
3
  size 1465
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.10602392606598222,
6
  "eval_steps": 500,
7
- "global_step": 6000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -848,6 +848,34 @@
848
  "learning_rate": 4.966719679566473e-05,
849
  "loss": 0.5429,
850
  "step": 6000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
851
  }
852
  ],
853
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.1095580569348483,
6
  "eval_steps": 500,
7
+ "global_step": 6200,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
848
  "learning_rate": 4.966719679566473e-05,
849
  "loss": 0.5429,
850
  "step": 6000
851
+ },
852
+ {
853
+ "epoch": 0.10690745878319874,
854
+ "grad_norm": 1.6127039194107056,
855
+ "learning_rate": 4.961811077732619e-05,
856
+ "loss": 0.3789,
857
+ "step": 6050
858
+ },
859
+ {
860
+ "epoch": 0.10779099150041525,
861
+ "grad_norm": 2.230015993118286,
862
+ "learning_rate": 4.956902475898765e-05,
863
+ "loss": 0.3949,
864
+ "step": 6100
865
+ },
866
+ {
867
+ "epoch": 0.10867452421763178,
868
+ "grad_norm": 1.9963310956954956,
869
+ "learning_rate": 4.9519938740649116e-05,
870
+ "loss": 0.4491,
871
+ "step": 6150
872
+ },
873
+ {
874
+ "epoch": 0.1095580569348483,
875
+ "grad_norm": 2.2731542587280273,
876
+ "learning_rate": 4.947085272231058e-05,
877
+ "loss": 0.435,
878
+ "step": 6200
879
  }
880
  ],
881
  "logging_steps": 50,