guyhadad01 committed on
Commit
6ee614e
·
verified ·
1 Parent(s): 2e243f9

Training in progress, step 400, checkpoint

Browse files
last-checkpoint/2_Dense/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:80ba4c20eaffda01a7578f0684f2336ed09ec07c7aab125579261832916efe9d
3
  size 4718680
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3c355932b1631d5cc039fe88a412c00c3f3d18cb613c3652c8741e9192cc4806
3
  size 4718680
last-checkpoint/3_Dense/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d97089f7924b8ca62eb91f3741ef27a57ff82b97b5f62f3a66bfd0ab18234833
3
  size 4718680
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fb2dd401d0d4ffa6433f83d4ac597ff641928d6ea494ae387a1a6f1a6d310553
3
  size 4718680
last-checkpoint/README.md CHANGED
@@ -511,7 +511,7 @@ print(query_embeddings.shape, document_embeddings.shape)
511
  # Get the similarity scores for the embeddings
512
  similarities = model.similarity(query_embeddings, document_embeddings)
513
  print(similarities)
514
- # tensor([[ 0.6871, -0.1118, -0.0955]])
515
  ```
516
 
517
  <!--
@@ -724,6 +724,10 @@ You can finetune this model on your own dataset.
724
  | 0.0960 | 100 | 0.2763 |
725
  | 0.1440 | 150 | 0.2883 |
726
  | 0.1919 | 200 | 0.2636 |
 
 
 
 
727
 
728
 
729
  ### Framework Versions
 
511
  # Get the similarity scores for the embeddings
512
  similarities = model.similarity(query_embeddings, document_embeddings)
513
  print(similarities)
514
+ # tensor([[ 0.6620, -0.0063, -0.0333]])
515
  ```
516
 
517
  <!--
 
724
  | 0.0960 | 100 | 0.2763 |
725
  | 0.1440 | 150 | 0.2883 |
726
  | 0.1919 | 200 | 0.2636 |
727
+ | 0.2399 | 250 | 0.2626 |
728
+ | 0.2879 | 300 | 0.2219 |
729
+ | 0.3359 | 350 | 0.2227 |
730
+ | 0.3839 | 400 | 0.207 |
731
 
732
 
733
  ### Framework Versions
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:00293b8b4761f0d06286339bd7a4cc183edee2c660dc984093785075d782b637
3
  size 605759848
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b1b5b40b7da70f2a14fdcffdfb517052cafd4a92b303a999515bd5c70bc3b56e
3
  size 605759848
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:98e772b8cb66794b0681c305d4a6ee5eb7b613bcff465dc3fe7029c205d3e580
3
  size 1230592267
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6ef66f6c3146c65c716246a9b9b1a314970b310fa5bce4e1a4c785a225e5e5d8
3
  size 1230592267
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4d88407aff68ef8509234fd2211bb50888896b55849641ad9180c09511a40fab
3
  size 1465
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:df0af633a4f9f804af5866a99325014522ad3b38b189715886b1cb20a1e95ac1
3
  size 1465
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.19193857965451055,
6
  "eval_steps": 500,
7
- "global_step": 200,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -36,6 +36,34 @@
36
  "learning_rate": 4.4983991462113126e-05,
37
  "loss": 0.2636,
38
  "step": 200
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
39
  }
40
  ],
41
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.3838771593090211,
6
  "eval_steps": 500,
7
+ "global_step": 400,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
36
  "learning_rate": 4.4983991462113126e-05,
37
  "loss": 0.2636,
38
  "step": 200
39
+ },
40
+ {
41
+ "epoch": 0.2399232245681382,
42
+ "grad_norm": 5.875,
43
+ "learning_rate": 4.231590181430096e-05,
44
+ "loss": 0.2626,
45
+ "step": 250
46
+ },
47
+ {
48
+ "epoch": 0.28790786948176583,
49
+ "grad_norm": 5.9375,
50
+ "learning_rate": 3.9647812166488794e-05,
51
+ "loss": 0.2219,
52
+ "step": 300
53
+ },
54
+ {
55
+ "epoch": 0.33589251439539347,
56
+ "grad_norm": 5.125,
57
+ "learning_rate": 3.697972251867663e-05,
58
+ "loss": 0.2227,
59
+ "step": 350
60
+ },
61
+ {
62
+ "epoch": 0.3838771593090211,
63
+ "grad_norm": 5.15625,
64
+ "learning_rate": 3.431163287086446e-05,
65
+ "loss": 0.207,
66
+ "step": 400
67
  }
68
  ],
69
  "logging_steps": 50,