Training in progress, step 240, checkpoint

Files changed (6) hide show

last-checkpoint/README.md CHANGED Viewed

@@ -433,9 +433,9 @@ print(embeddings.shape)
 # Get the similarity scores for the embeddings
 similarities = model.similarity(embeddings, embeddings)
 print(similarities)
-# tensor([[ 1.0000,  0.5316, -0.0116],
-#         [ 0.5316,  1.0000,  0.0884],
-#         [-0.0116,  0.0884,  1.0000]])
 ```
 <!--

 # Get the similarity scores for the embeddings
 similarities = model.similarity(embeddings, embeddings)
 print(similarities)
+# tensor([[ 1.0000,  0.5313, -0.0115],
+#         [ 0.5313,  1.0000,  0.0888],
+#         [-0.0115,  0.0888,  1.0000]])
 ```
 <!--

last-checkpoint/model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:fe8aa3a1a1fb9867e7ebcb2575f994045f392075d8e27d85f0725089e178d958
 size 45437864

 version https://git-lfs.github.com/spec/v1
+oid sha256:bed665989bcda1599c1ffcbe160bee40204a08c27acc6013cef770ea9fb4f8c8
 size 45437864

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:46b7d40b2fc8fc1d615cf6d14f4591edcb49cf5723c25f2421e4f1170d3494af
 size 90346763

 version https://git-lfs.github.com/spec/v1
+oid sha256:f08c973a087f6c196760a6b1171af59c0ba0c6106b22f68c7e66de1d8f133a3a
 size 90346763

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:acd6682c2d8fc2044ee522f102fcd2876d77278a945d452b98005081e2da9986
 size 14645

 version https://git-lfs.github.com/spec/v1
+oid sha256:918d235c6f11d479081d5b857150fbecca43736fe409e3d9b3dd1d7cc4c95e10
 size 14645

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:198961584cd0530252f9019204a7eacfefb2ec28aecae73b687db7cd3b9da2f0
 size 1465

 version https://git-lfs.github.com/spec/v1
+oid sha256:52f70fd310ae73fa5fc47cd78a0e3378368b9861f0cfb82675065c3231fde1e6
 size 1465

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -2,9 +2,9 @@
   "best_global_step": null,
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 0.8333333333333334,
   "eval_steps": 500,
-  "global_step": 200,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -50,7 +50,7 @@
         "should_evaluate": false,
         "should_log": false,
         "should_save": true,
-        "should_training_stop": false
       },
       "attributes": {}
     }

   "best_global_step": null,
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 1.0,
   "eval_steps": 500,
+  "global_step": 240,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
         "should_evaluate": false,
         "should_log": false,
         "should_save": true,
+        "should_training_stop": true
       },
       "attributes": {}
     }