guyhadad01 committed on
Commit
3f07acc
·
verified ·
1 Parent(s): 53d3caf

Training in progress, step 600, checkpoint

Browse files
last-checkpoint/2_Dense/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3c355932b1631d5cc039fe88a412c00c3f3d18cb613c3652c8741e9192cc4806
3
  size 4718680
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4dd0cd5325744cbadf85834360afa08f075907c48439302dd9bd1990dcba7c09
3
  size 4718680
last-checkpoint/3_Dense/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fb2dd401d0d4ffa6433f83d4ac597ff641928d6ea494ae387a1a6f1a6d310553
3
  size 4718680
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:618d79044611c03845fd3d5cfff9c6517211438370c9270043bd8df5fd157566
3
  size 4718680
last-checkpoint/README.md CHANGED
@@ -511,7 +511,7 @@ print(query_embeddings.shape, document_embeddings.shape)
511
  # Get the similarity scores for the embeddings
512
  similarities = model.similarity(query_embeddings, document_embeddings)
513
  print(similarities)
514
- # tensor([[ 0.6620, -0.0063, -0.0333]])
515
  ```
516
 
517
  <!--
@@ -728,6 +728,10 @@ You can finetune this model on your own dataset.
728
  | 0.2879 | 300 | 0.2219 |
729
  | 0.3359 | 350 | 0.2227 |
730
  | 0.3839 | 400 | 0.207 |
 
 
 
 
731
 
732
 
733
  ### Framework Versions
 
511
  # Get the similarity scores for the embeddings
512
  similarities = model.similarity(query_embeddings, document_embeddings)
513
  print(similarities)
514
+ # tensor([[ 0.6990, -0.1064, 0.0055]])
515
  ```
516
 
517
  <!--
 
728
  | 0.2879 | 300 | 0.2219 |
729
  | 0.3359 | 350 | 0.2227 |
730
  | 0.3839 | 400 | 0.207 |
731
+ | 0.4319 | 450 | 0.1853 |
732
+ | 0.4798 | 500 | 0.177 |
733
+ | 0.5278 | 550 | 0.1739 |
734
+ | 0.5758 | 600 | 0.1743 |
735
 
736
 
737
  ### Framework Versions
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b1b5b40b7da70f2a14fdcffdfb517052cafd4a92b303a999515bd5c70bc3b56e
3
  size 605759848
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:688b779211f9d7729cdb8b7a1f33de65e70bf757e770157591258607c47b7f93
3
  size 605759848
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6ef66f6c3146c65c716246a9b9b1a314970b310fa5bce4e1a4c785a225e5e5d8
3
  size 1230592267
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e4cb7e1ce7f84c978a72dad631b014ca653d4764aa7b2675e53c47546614601d
3
  size 1230592267
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:df0af633a4f9f804af5866a99325014522ad3b38b189715886b1cb20a1e95ac1
3
  size 1465
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:edab5dd7827df6c860a06cbc8d688873b247f37062ba5008ca6bb63249a0eb13
3
  size 1465
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.3838771593090211,
6
  "eval_steps": 500,
7
- "global_step": 400,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -64,6 +64,34 @@
64
  "learning_rate": 3.431163287086446e-05,
65
  "loss": 0.207,
66
  "step": 400
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
67
  }
68
  ],
69
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.5758157389635317,
6
  "eval_steps": 500,
7
+ "global_step": 600,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
64
  "learning_rate": 3.431163287086446e-05,
65
  "loss": 0.207,
66
  "step": 400
67
+ },
68
+ {
69
+ "epoch": 0.43186180422264875,
70
+ "grad_norm": 3.703125,
71
+ "learning_rate": 3.16435432230523e-05,
72
+ "loss": 0.1853,
73
+ "step": 450
74
+ },
75
+ {
76
+ "epoch": 0.4798464491362764,
77
+ "grad_norm": 4.125,
78
+ "learning_rate": 2.897545357524013e-05,
79
+ "loss": 0.177,
80
+ "step": 500
81
+ },
82
+ {
83
+ "epoch": 0.527831094049904,
84
+ "grad_norm": 4.09375,
85
+ "learning_rate": 2.6307363927427965e-05,
86
+ "loss": 0.1739,
87
+ "step": 550
88
+ },
89
+ {
90
+ "epoch": 0.5758157389635317,
91
+ "grad_norm": 4.0,
92
+ "learning_rate": 2.3639274279615796e-05,
93
+ "loss": 0.1743,
94
+ "step": 600
95
  }
96
  ],
97
  "logging_steps": 50,