guyhadad01 committed on
Commit
f8c296a
·
verified ·
1 Parent(s): eb1b75f

Training in progress, step 800, checkpoint

Browse files
last-checkpoint/2_Dense/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4dd0cd5325744cbadf85834360afa08f075907c48439302dd9bd1990dcba7c09
3
  size 4718680
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:56b28b74545c8174d80d1900fffbe59b2a7435a9e928a3f943266d2d96667067
3
  size 4718680
last-checkpoint/3_Dense/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:618d79044611c03845fd3d5cfff9c6517211438370c9270043bd8df5fd157566
3
  size 4718680
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:40f17852afeb04a7d81bc4e27fdae244ba00112c63322abe9f6c299a666b57b5
3
  size 4718680
last-checkpoint/README.md CHANGED
@@ -511,7 +511,7 @@ print(query_embeddings.shape, document_embeddings.shape)
511
  # Get the similarity scores for the embeddings
512
  similarities = model.similarity(query_embeddings, document_embeddings)
513
  print(similarities)
514
- # tensor([[ 0.6990, -0.1064, 0.0055]])
515
  ```
516
 
517
  <!--
@@ -732,6 +732,10 @@ You can finetune this model on your own dataset.
732
  | 0.4798 | 500 | 0.177 |
733
  | 0.5278 | 550 | 0.1739 |
734
  | 0.5758 | 600 | 0.1743 |
 
 
 
 
735
 
736
 
737
  ### Framework Versions
 
511
  # Get the similarity scores for the embeddings
512
  similarities = model.similarity(query_embeddings, document_embeddings)
513
  print(similarities)
514
+ # tensor([[ 0.7210, -0.0779, -0.0314]])
515
  ```
516
 
517
  <!--
 
732
  | 0.4798 | 500 | 0.177 |
733
  | 0.5278 | 550 | 0.1739 |
734
  | 0.5758 | 600 | 0.1743 |
735
+ | 0.6238 | 650 | 0.1574 |
736
+ | 0.6718 | 700 | 0.1586 |
737
+ | 0.7198 | 750 | 0.1473 |
738
+ | 0.7678 | 800 | 0.1547 |
739
 
740
 
741
  ### Framework Versions
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:688b779211f9d7729cdb8b7a1f33de65e70bf757e770157591258607c47b7f93
3
  size 605759848
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fe81efee97c0f5f6e85eab9e97762a9d281501c3388cc280a9df8ee7217683d3
3
  size 605759848
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e4cb7e1ce7f84c978a72dad631b014ca653d4764aa7b2675e53c47546614601d
3
  size 1230592267
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5dbba28742d6013f6fc692c0d332059d2e00fb3286712afea40fb65838ac9adc
3
  size 1230592267
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:edab5dd7827df6c860a06cbc8d688873b247f37062ba5008ca6bb63249a0eb13
3
  size 1465
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d57a1899b276deaf9bc6c347b576a36bf470824199b1d1731a5698c732cc5649
3
  size 1465
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.5758157389635317,
6
  "eval_steps": 500,
7
- "global_step": 600,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -92,6 +92,34 @@
92
  "learning_rate": 2.3639274279615796e-05,
93
  "loss": 0.1743,
94
  "step": 600
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
95
  }
96
  ],
97
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.7677543186180422,
6
  "eval_steps": 500,
7
+ "global_step": 800,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
92
  "learning_rate": 2.3639274279615796e-05,
93
  "loss": 0.1743,
94
  "step": 600
95
+ },
96
+ {
97
+ "epoch": 0.6238003838771593,
98
+ "grad_norm": 3.28125,
99
+ "learning_rate": 2.097118463180363e-05,
100
+ "loss": 0.1574,
101
+ "step": 650
102
+ },
103
+ {
104
+ "epoch": 0.6717850287907869,
105
+ "grad_norm": 4.125,
106
+ "learning_rate": 1.830309498399146e-05,
107
+ "loss": 0.1586,
108
+ "step": 700
109
+ },
110
+ {
111
+ "epoch": 0.7197696737044146,
112
+ "grad_norm": 3.875,
113
+ "learning_rate": 1.5635005336179295e-05,
114
+ "loss": 0.1473,
115
+ "step": 750
116
+ },
117
+ {
118
+ "epoch": 0.7677543186180422,
119
+ "grad_norm": 3.671875,
120
+ "learning_rate": 1.2966915688367129e-05,
121
+ "loss": 0.1547,
122
+ "step": 800
123
  }
124
  ],
125
  "logging_steps": 50,