guyhadad01 committed on
Commit
516580c
·
verified ·
1 Parent(s): 8bf0a26

Training in progress, step 400, checkpoint

Browse files
last-checkpoint/2_Dense/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:245987c37984397149e2b7782bea1deeb6b41895e4c73137a0745ae1034fae74
3
  size 4718680
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8385504144ad50228e1459ea5b1da17bd7f4d3aac19f5476c1c8296b68f4f05b
3
  size 4718680
last-checkpoint/3_Dense/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c06029654776794583e6462e88fb48f86fae257f300ef5195e19451cdd07501d
3
  size 4718680
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ac472c212bf6ebd5d336507924eb651104467de24dfbfaa520db97b7708d09b9
3
  size 4718680
last-checkpoint/README.md CHANGED
@@ -472,7 +472,7 @@ print(query_embeddings.shape, document_embeddings.shape)
472
  # Get the similarity scores for the embeddings
473
  similarities = model.similarity(query_embeddings, document_embeddings)
474
  print(similarities)
475
- # tensor([[ 0.7186, -0.1245, -0.0664]])
476
  ```
477
 
478
  <!--
@@ -685,6 +685,10 @@ You can finetune this model on your own dataset.
685
  | 0.0508 | 100 | 0.2331 |
686
  | 0.0762 | 150 | 0.2031 |
687
  | 0.1016 | 200 | 0.2042 |
 
 
 
 
688
 
689
 
690
  ### Framework Versions
 
472
  # Get the similarity scores for the embeddings
473
  similarities = model.similarity(query_embeddings, document_embeddings)
474
  print(similarities)
475
+ # tensor([[ 0.5851, -0.1180, -0.1336]])
476
  ```
477
 
478
  <!--
 
685
  | 0.0508 | 100 | 0.2331 |
686
  | 0.0762 | 150 | 0.2031 |
687
  | 0.1016 | 200 | 0.2042 |
688
+ | 0.1270 | 250 | 0.2048 |
689
+ | 0.1524 | 300 | 0.2123 |
690
+ | 0.1778 | 350 | 0.186 |
691
+ | 0.2033 | 400 | 0.1693 |
692
 
693
 
694
  ### Framework Versions
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9dcff2bc35d4b89f9920dbfc24c9784230f133e60b7efd8421b728caa3129765
3
  size 605759848
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5538ec5f6c8499fe8ef0de1e93c420e403b0b4f926f25aa62e05b6f0e23991b0
3
  size 605759848
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:89649a22f3916e197be45a082597d611800c3e9d7c9d75aba96246deab4411d1
3
  size 1230592267
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fd9addc9d33db5aa5f32bbfd79d0f8ab2168d1aa307bb30b7aa8355f331a85fd
3
  size 1230592267
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1d4e739551319e957e6c472fd8c9bacf3bae41231a764211a8f19abc4bae6961
3
  size 1465
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8fc56140e5c37825482a26f377f07f74eaa4028a1b2f8b46eaa880f0215c9abf
3
  size 1465
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.1016260162601626,
6
  "eval_steps": 500,
7
- "global_step": 200,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -36,6 +36,34 @@
36
  "learning_rate": 4.994353472614343e-05,
37
  "loss": 0.2042,
38
  "step": 200
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
39
  }
40
  ],
41
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.2032520325203252,
6
  "eval_steps": 500,
7
+ "global_step": 400,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
36
  "learning_rate": 4.994353472614343e-05,
37
  "loss": 0.2042,
38
  "step": 200
39
+ },
40
+ {
41
+ "epoch": 0.12703252032520326,
42
+ "grad_norm": 5.4375,
43
+ "learning_rate": 4.853190287972897e-05,
44
+ "loss": 0.2048,
45
+ "step": 250
46
+ },
47
+ {
48
+ "epoch": 0.1524390243902439,
49
+ "grad_norm": 5.09375,
50
+ "learning_rate": 4.7120271033314515e-05,
51
+ "loss": 0.2123,
52
+ "step": 300
53
+ },
54
+ {
55
+ "epoch": 0.17784552845528456,
56
+ "grad_norm": 4.5,
57
+ "learning_rate": 4.570863918690006e-05,
58
+ "loss": 0.186,
59
+ "step": 350
60
+ },
61
+ {
62
+ "epoch": 0.2032520325203252,
63
+ "grad_norm": 5.6875,
64
+ "learning_rate": 4.42970073404856e-05,
65
+ "loss": 0.1693,
66
+ "step": 400
67
  }
68
  ],
69
  "logging_steps": 50,