Training in progress, step 50
Browse files- model.safetensors +1 -1
- runs/Jun15_00-36-15_92b2e0e6fb20/events.out.tfevents.1749947776.92b2e0e6fb20.2194.3 +2 -2
- runs/Jun15_00-36-38_92b2e0e6fb20/events.out.tfevents.1749947875.92b2e0e6fb20.2194.5 +3 -0
- runs/Jun15_00-38-20_92b2e0e6fb20/events.out.tfevents.1749947901.92b2e0e6fb20.2194.6 +3 -0
- trainer_state.json +16 -16
- training_args.bin +1 -1
model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 441154988
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b28070514a109f4c6d0cc6bd89ef87ea76348c26aa37d820b2eae9f6195c9738
|
| 3 |
size 441154988
|
runs/Jun15_00-36-15_92b2e0e6fb20/events.out.tfevents.1749947776.92b2e0e6fb20.2194.3
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:079f4dbb466565a0431e8d93f99f888ff9e82d727edf190150726236219a2b76
|
| 3 |
+
size 5717
|
runs/Jun15_00-36-38_92b2e0e6fb20/events.out.tfevents.1749947875.92b2e0e6fb20.2194.5
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c04ffe1a33d90bbbfe16f83cd44b5ae14ccb0afef611397e6a0dc4dbbdcdaa40
|
| 3 |
+
size 1576
|
runs/Jun15_00-38-20_92b2e0e6fb20/events.out.tfevents.1749947901.92b2e0e6fb20.2194.6
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:80235aca5bb0dd08f3e6284a80b3b9bd4ea63ff47c20ab63860a05bdf5217df3
|
| 3 |
+
size 7232
|
trainer_state.json
CHANGED
|
@@ -12,40 +12,40 @@
|
|
| 12 |
{
|
| 13 |
"epoch": 0,
|
| 14 |
"step": 0,
|
| 15 |
-
"train/classification_loss": 0.
|
| 16 |
-
"train/contrastive_loss":
|
| 17 |
-
"train/negative_loss":
|
| 18 |
"train/num_negatives": 190,
|
| 19 |
"train/num_positives": 50,
|
| 20 |
-
"train/positive_loss": 0.
|
| 21 |
-
"train/total_loss": 2.
|
| 22 |
},
|
| 23 |
{
|
| 24 |
"epoch": 0,
|
| 25 |
"step": 0,
|
| 26 |
-
"train/classification_loss": 0.
|
| 27 |
-
"train/contrastive_loss": 6.
|
| 28 |
-
"train/negative_loss": 6.
|
| 29 |
"train/num_negatives": 192,
|
| 30 |
"train/num_positives": 48,
|
| 31 |
-
"train/positive_loss": 0.
|
| 32 |
-
"train/total_loss": 2.
|
| 33 |
},
|
| 34 |
{
|
| 35 |
"epoch": 5.0,
|
| 36 |
-
"grad_norm":
|
| 37 |
"learning_rate": 9.800000000000001e-06,
|
| 38 |
-
"loss":
|
| 39 |
"step": 50
|
| 40 |
},
|
| 41 |
{
|
| 42 |
"epoch": 5.0,
|
| 43 |
"step": 50,
|
| 44 |
"total_flos": 0.0,
|
| 45 |
-
"train_loss":
|
| 46 |
-
"train_runtime":
|
| 47 |
-
"train_samples_per_second":
|
| 48 |
-
"train_steps_per_second": 1.
|
| 49 |
}
|
| 50 |
],
|
| 51 |
"logging_steps": 50,
|
|
|
|
| 12 |
{
|
| 13 |
"epoch": 0,
|
| 14 |
"step": 0,
|
| 15 |
+
"train/classification_loss": 0.6832770109176636,
|
| 16 |
+
"train/contrastive_loss": 7.157876014709473,
|
| 17 |
+
"train/negative_loss": 7.157375812530518,
|
| 18 |
"train/num_negatives": 190,
|
| 19 |
"train/num_positives": 50,
|
| 20 |
+
"train/positive_loss": 0.0005001117824576795,
|
| 21 |
+
"train/total_loss": 2.1148521900177
|
| 22 |
},
|
| 23 |
{
|
| 24 |
"epoch": 0,
|
| 25 |
"step": 0,
|
| 26 |
+
"train/classification_loss": 0.691846489906311,
|
| 27 |
+
"train/contrastive_loss": 6.978695392608643,
|
| 28 |
+
"train/negative_loss": 6.977847576141357,
|
| 29 |
"train/num_negatives": 192,
|
| 30 |
"train/num_positives": 48,
|
| 31 |
+
"train/positive_loss": 0.0008476818911731243,
|
| 32 |
+
"train/total_loss": 2.08758544921875
|
| 33 |
},
|
| 34 |
{
|
| 35 |
"epoch": 5.0,
|
| 36 |
+
"grad_norm": 9.853194236755371,
|
| 37 |
"learning_rate": 9.800000000000001e-06,
|
| 38 |
+
"loss": 2.9901,
|
| 39 |
"step": 50
|
| 40 |
},
|
| 41 |
{
|
| 42 |
"epoch": 5.0,
|
| 43 |
"step": 50,
|
| 44 |
"total_flos": 0.0,
|
| 45 |
+
"train_loss": 2.9900537109375,
|
| 46 |
+
"train_runtime": 27.9302,
|
| 47 |
+
"train_samples_per_second": 56.57,
|
| 48 |
+
"train_steps_per_second": 1.79
|
| 49 |
}
|
| 50 |
],
|
| 51 |
"logging_steps": 50,
|
training_args.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 5368
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c02a3dbfbd9db3f1e4a919c78948efb8eb944344dc26585f19fc5dded995095b
|
| 3 |
size 5368
|