rabaevn committed on
Commit
2c73a16
·
verified ·
1 Parent(s): 4f09d0b

Training in progress, step 1000, checkpoint

Browse files
last-checkpoint/2_Dense/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b1a852d6fcae1f2179d5763df7a46fddad1877e145fff513af3347be674ce52b
3
  size 9437272
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:00693ca726c3aa172fe54b2bbf0f5a2ac7ef3e0f15e6ef10272ea4e790f1a7ea
3
  size 9437272
last-checkpoint/3_Dense/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3394c00a0b8299e323b6e83e64ef00be5d726f3c420aa6b111200a304b59f62c
3
  size 9437272
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1ec4b258539975d8b345245718777e000a517241aa23cc10eb37dd6ffc792aab
3
  size 9437272
last-checkpoint/README.md CHANGED
@@ -450,7 +450,7 @@ print(query_embeddings.shape, document_embeddings.shape)
450
  # Get the similarity scores for the embeddings
451
  similarities = model.similarity(query_embeddings, document_embeddings)
452
  print(similarities)
453
- # tensor([[ 0.5962, -0.0191, 0.2550]])
454
  ```
455
 
456
  <!--
@@ -703,6 +703,10 @@ You can finetune this model on your own dataset.
703
  | 0.2316 | 700 | 0.1013 |
704
  | 0.2482 | 750 | 0.1019 |
705
  | 0.2647 | 800 | 0.0964 |
 
 
 
 
706
 
707
 
708
  ### Framework Versions
 
450
  # Get the similarity scores for the embeddings
451
  similarities = model.similarity(query_embeddings, document_embeddings)
452
  print(similarities)
453
+ # tensor([[ 0.4709, -0.1225, 0.1580]])
454
  ```
455
 
456
  <!--
 
703
  | 0.2316 | 700 | 0.1013 |
704
  | 0.2482 | 750 | 0.1019 |
705
  | 0.2647 | 800 | 0.0964 |
706
+ | 0.2813 | 850 | 0.0961 |
707
+ | 0.2978 | 900 | 0.0927 |
708
+ | 0.3144 | 950 | 0.0946 |
709
+ | 0.3309 | 1000 | 0.0988 |
710
 
711
 
712
  ### Framework Versions
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a6ff1bb561b9706f1f8512c3b49593b3ccfe975a3a766ab30ffe85567e0af9d8
3
  size 1211486072
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:13ac8f3e49e96856b9bc03370f38b3741180dcb037151388805051f7ea3ffe8f
3
  size 1211486072
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:308069358a54642120bbc71415a487f71aebf1cfafc7c73bebd447e79b921486
3
  size 2460923467
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:45310978fd3a8f93b72bef2a6c703555d44d1cb9ff7e494d4ad2616538a9ff9b
3
  size 2460923467
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:39a64593b8ffcc45b5d5cd6de2eb5cadb176a065ce63970660c524f174fa6360
3
  size 1383
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fc83c3e7cbaa37ce1778897d2e62cb7b8c41ece6f6ed0596eecff4f3f73fcd86
3
  size 1383
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7baf2879871f108cbdcd4157b9794e8d6049aec3cf60c7a2c1c3c5259ba4fe4d
3
  size 1465
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:220ab6d106cef455c6160d9f0f26a124a8032f6a0351c6a17f6905e5df60789d
3
  size 1465
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.26472534745201853,
6
  "eval_steps": 500,
7
- "global_step": 800,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -120,6 +120,34 @@
120
  "learning_rate": 1.6351599852887092e-05,
121
  "loss": 0.0964,
122
  "step": 800
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
123
  }
124
  ],
125
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.3309066843150232,
6
  "eval_steps": 500,
7
+ "global_step": 1000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
120
  "learning_rate": 1.6351599852887092e-05,
121
  "loss": 0.0964,
122
  "step": 800
123
+ },
124
+ {
125
+ "epoch": 0.2812706816677697,
126
+ "grad_norm": 6.790607929229736,
127
+ "learning_rate": 1.5983817579992645e-05,
128
+ "loss": 0.0961,
129
+ "step": 850
130
+ },
131
+ {
132
+ "epoch": 0.29781601588352086,
133
+ "grad_norm": 6.981550693511963,
134
+ "learning_rate": 1.56160353070982e-05,
135
+ "loss": 0.0927,
136
+ "step": 900
137
+ },
138
+ {
139
+ "epoch": 0.314361350099272,
140
+ "grad_norm": 4.593362808227539,
141
+ "learning_rate": 1.5248253034203752e-05,
142
+ "loss": 0.0946,
143
+ "step": 950
144
+ },
145
+ {
146
+ "epoch": 0.3309066843150232,
147
+ "grad_norm": 4.783601760864258,
148
+ "learning_rate": 1.4880470761309307e-05,
149
+ "loss": 0.0988,
150
+ "step": 1000
151
  }
152
  ],
153
  "logging_steps": 50,