guyhadad01 committed on
Commit
def62cb
·
verified ·
1 Parent(s): e5e95d9

Training in progress, step 600, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -418,9 +418,9 @@ print(embeddings.shape)
418
  # Get the similarity scores for the embeddings
419
  similarities = model.similarity(embeddings, embeddings)
420
  print(similarities)
421
- # tensor([[1.0000, 0.8039, 0.0072],
422
- # [0.8039, 1.0000, 0.0365],
423
- # [0.0072, 0.0365, 1.0000]])
424
  ```
425
 
426
  <!--
@@ -633,6 +633,10 @@ You can finetune this model on your own dataset.
633
  | 0.2778 | 300 | 0.2587 |
634
  | 0.3241 | 350 | 0.2629 |
635
  | 0.3704 | 400 | 0.2518 |
 
 
 
 
636
 
637
 
638
  ### Framework Versions
 
418
  # Get the similarity scores for the embeddings
419
  similarities = model.similarity(embeddings, embeddings)
420
  print(similarities)
421
+ # tensor([[1.0000, 0.8255, 0.0183],
422
+ # [0.8255, 1.0000, 0.0580],
423
+ # [0.0183, 0.0580, 1.0000]])
424
  ```
425
 
426
  <!--
 
633
  | 0.2778 | 300 | 0.2587 |
634
  | 0.3241 | 350 | 0.2629 |
635
  | 0.3704 | 400 | 0.2518 |
636
+ | 0.4167 | 450 | 0.2492 |
637
+ | 0.4630 | 500 | 0.228 |
638
+ | 0.5093 | 550 | 0.2267 |
639
+ | 0.5556 | 600 | 0.2222 |
640
 
641
 
642
  ### Framework Versions
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:48ef8ec0a1171721c804c180346ec3c917c952ed0da36455a504c5863c6c9788
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:980f0d4b38375feadd3e6c8d2e4ff0c0c1701d415db84cbfeab147a2b4b273b3
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9d9aea5acedf0733c92a9daea99cb257662f8f5ae5961ec2df047b6e0c75cc91
3
  size 180608203
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c1e63d9b09c1f721f29df757b14a75b61662a1ffe89fccf48e193f7627afbabf
3
  size 180608203
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c19b67f89acc145936e1b518bb5813ff7a56d806e790b9924b0c10aabb6eba24
3
  size 14645
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:916c146daa973d7fe7286d497c85a56ed924f1e756ec82fccdaa57c8c5694c8b
3
  size 14645
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:30858f23bcb22d0baef45bd4add9d6fa474141308c12653c706077b87d932e49
3
  size 1383
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cb7fde5111803012042c93a73aa191336bb6e10b3ad44f6bd1d94fc7008a22b6
3
  size 1383
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bf50a8da9b77d1d667aa2be5f7411c48d830b5ed090e0ff1a8209df626c404c4
3
  size 1465
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e5ef9347676d52185ae368f376cf1fe5dd55cbd5ed84547d819fe30ad5c5892f
3
  size 1465
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.37037037037037035,
6
  "eval_steps": 500,
7
- "global_step": 400,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -64,6 +64,34 @@
64
  "learning_rate": 3.503086419753087e-05,
65
  "loss": 0.2518,
66
  "step": 400
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
67
  }
68
  ],
69
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.5555555555555556,
6
  "eval_steps": 500,
7
+ "global_step": 600,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
64
  "learning_rate": 3.503086419753087e-05,
65
  "loss": 0.2518,
66
  "step": 400
67
+ },
68
+ {
69
+ "epoch": 0.4166666666666667,
70
+ "grad_norm": 1.3996431827545166,
71
+ "learning_rate": 3.245884773662551e-05,
72
+ "loss": 0.2492,
73
+ "step": 450
74
+ },
75
+ {
76
+ "epoch": 0.46296296296296297,
77
+ "grad_norm": 1.3424209356307983,
78
+ "learning_rate": 2.9886831275720166e-05,
79
+ "loss": 0.228,
80
+ "step": 500
81
+ },
82
+ {
83
+ "epoch": 0.5092592592592593,
84
+ "grad_norm": 1.3468494415283203,
85
+ "learning_rate": 2.7314814814814816e-05,
86
+ "loss": 0.2267,
87
+ "step": 550
88
+ },
89
+ {
90
+ "epoch": 0.5555555555555556,
91
+ "grad_norm": 1.1546319723129272,
92
+ "learning_rate": 2.4742798353909465e-05,
93
+ "loss": 0.2222,
94
+ "step": 600
95
  }
96
  ],
97
  "logging_steps": 50,