Training in progress, step 50

Files changed (6) hide show

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:1da099a0d87099a0b0c9bbf7ea0ae5a6eabcb8d3810f4e9df2b957493c6c6cd5
 size 441154988

 version https://git-lfs.github.com/spec/v1
+oid sha256:b28070514a109f4c6d0cc6bd89ef87ea76348c26aa37d820b2eae9f6195c9738
 size 441154988

runs/Jun15_00-36-15_92b2e0e6fb20/events.out.tfevents.1749947776.92b2e0e6fb20.2194.3 CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:68675bc2ed356d6254de5ab1384465e36b4be95c84b4e8a3d42ed7285f48064e
-size 4184

 version https://git-lfs.github.com/spec/v1
+oid sha256:079f4dbb466565a0431e8d93f99f888ff9e82d727edf190150726236219a2b76
+size 5717

runs/Jun15_00-36-38_92b2e0e6fb20/events.out.tfevents.1749947875.92b2e0e6fb20.2194.5 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:c04ffe1a33d90bbbfe16f83cd44b5ae14ccb0afef611397e6a0dc4dbbdcdaa40
+size 1576

runs/Jun15_00-38-20_92b2e0e6fb20/events.out.tfevents.1749947901.92b2e0e6fb20.2194.6 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:80235aca5bb0dd08f3e6284a80b3b9bd4ea63ff47c20ab63860a05bdf5217df3
+size 7232

trainer_state.json CHANGED Viewed

@@ -12,40 +12,40 @@
     {
       "epoch": 0,
       "step": 0,
-      "train/classification_loss": 0.6716318130493164,
-      "train/contrastive_loss": 6.973960876464844,
-      "train/negative_loss": 6.973352909088135,
       "train/num_negatives": 190,
       "train/num_positives": 50,
-      "train/positive_loss": 0.0006079699960537255,
-      "train/total_loss": 2.0664238929748535
     },
     {
       "epoch": 0,
       "step": 0,
-      "train/classification_loss": 0.6844258904457092,
-      "train/contrastive_loss": 6.779294490814209,
-      "train/negative_loss": 6.7774882316589355,
       "train/num_negatives": 192,
       "train/num_positives": 48,
-      "train/positive_loss": 0.0018063625320792198,
-      "train/total_loss": 2.0402848720550537
     },
     {
       "epoch": 5.0,
-      "grad_norm": 5.838413238525391,
       "learning_rate": 9.800000000000001e-06,
-      "loss": 1.4132,
       "step": 50
     },
     {
       "epoch": 5.0,
       "step": 50,
       "total_flos": 0.0,
-      "train_loss": 1.413243408203125,
-      "train_runtime": 29.4518,
-      "train_samples_per_second": 53.647,
-      "train_steps_per_second": 1.698
     }
   ],
   "logging_steps": 50,

     {
       "epoch": 0,
       "step": 0,
+      "train/classification_loss": 0.6832770109176636,
+      "train/contrastive_loss": 7.157876014709473,
+      "train/negative_loss": 7.157375812530518,
       "train/num_negatives": 190,
       "train/num_positives": 50,
+      "train/positive_loss": 0.0005001117824576795,
+      "train/total_loss": 2.1148521900177
     },
     {
       "epoch": 0,
       "step": 0,
+      "train/classification_loss": 0.691846489906311,
+      "train/contrastive_loss": 6.978695392608643,
+      "train/negative_loss": 6.977847576141357,
       "train/num_negatives": 192,
       "train/num_positives": 48,
+      "train/positive_loss": 0.0008476818911731243,
+      "train/total_loss": 2.08758544921875
     },
     {
       "epoch": 5.0,
+      "grad_norm": 9.853194236755371,
       "learning_rate": 9.800000000000001e-06,
+      "loss": 2.9901,
       "step": 50
     },
     {
       "epoch": 5.0,
       "step": 50,
       "total_flos": 0.0,
+      "train_loss": 2.9900537109375,
+      "train_runtime": 27.9302,
+      "train_samples_per_second": 56.57,
+      "train_steps_per_second": 1.79
     }
   ],
   "logging_steps": 50,

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6ca0afef15a0edecfaa88b54e14baf2e856c7793f28bd79fd10178152b6b37f8
 size 5368

 version https://git-lfs.github.com/spec/v1
+oid sha256:c02a3dbfbd9db3f1e4a919c78948efb8eb944344dc26585f19fc5dded995095b
 size 5368