rabaevn committed on
Commit
cb3f01b
·
verified ·
1 Parent(s): bce0d93

Training in progress, step 730, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -416,9 +416,9 @@ print(embeddings.shape)
416
  # Get the similarity scores for the embeddings
417
  similarities = model.similarity(embeddings, embeddings)
418
  print(similarities)
419
- # tensor([[ 1.0000, 0.4984, -0.0999],
420
- # [ 0.4984, 1.0000, -0.0665],
421
- # [-0.0999, -0.0665, 1.0000]])
422
  ```
423
 
424
  <!--
@@ -664,6 +664,8 @@ You can finetune this model on your own dataset.
664
  | 0.6849 | 500 | 0.4035 |
665
  | 0.7534 | 550 | 0.4031 |
666
  | 0.8219 | 600 | 0.3928 |
 
 
667
 
668
 
669
  ### Framework Versions
 
416
  # Get the similarity scores for the embeddings
417
  similarities = model.similarity(embeddings, embeddings)
418
  print(similarities)
419
+ # tensor([[ 1.0000, 0.4872, -0.1172],
420
+ # [ 0.4872, 1.0000, -0.0891],
421
+ # [-0.1172, -0.0891, 1.0000]])
422
  ```
423
 
424
  <!--
 
664
  | 0.6849 | 500 | 0.4035 |
665
  | 0.7534 | 550 | 0.4031 |
666
  | 0.8219 | 600 | 0.3928 |
667
+ | 0.8904 | 650 | 0.3978 |
668
+ | 0.9589 | 700 | 0.3825 |
669
 
670
 
671
  ### Framework Versions
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d42737ca487f64b2ba0a490df3c1016ede96f9e04bc367ce6fcb5349782d57fd
3
  size 437951328
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2e76a4b2fb3c0733c12ae07cd3e0f4d875be188fd8938ce2014837b99779ee54
3
  size 437951328
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6bdd1b459b57b607629063b2fa6365026d82857ad958e3cc875f260b4feb3ed3
3
  size 871301195
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f2f881cdd4fbadbeed0ef1305747cfe1c55dfdce013684e2a5df5cb7ba0558b5
3
  size 871301195
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:76943be04f8b05d95c854799f3634427a1630c4299e02fd4a7cffa5a2077ccd9
3
  size 14645
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:504f8ee025f27793137df10695026a0da0e5051f8bccc8c4973299bed48fc121
3
  size 14645
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c03d30d642b0c4e8e2abbdc65933da67b7407e7d449bd380792a2bf635ff9333
3
  size 1465
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d33660fd2d77daa0cdfa768b8e1bfd3ff165bc08a039957c7b15665ed77b87cd
3
  size 1465
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.821917808219178,
6
  "eval_steps": 500,
7
- "global_step": 600,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -92,6 +92,20 @@
92
  "learning_rate": 9.969558599695586e-06,
93
  "loss": 0.3928,
94
  "step": 600
 
 
 
 
 
 
 
 
 
 
 
 
 
 
95
  }
96
  ],
97
  "logging_steps": 50,
@@ -106,7 +120,7 @@
106
  "should_evaluate": false,
107
  "should_log": false,
108
  "should_save": true,
109
- "should_training_stop": false
110
  },
111
  "attributes": {}
112
  }
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 1.0,
6
  "eval_steps": 500,
7
+ "global_step": 730,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
92
  "learning_rate": 9.969558599695586e-06,
93
  "loss": 0.3928,
94
  "step": 600
95
+ },
96
+ {
97
+ "epoch": 0.8904109589041096,
98
+ "grad_norm": 2.14909029006958,
99
+ "learning_rate": 6.1643835616438354e-06,
100
+ "loss": 0.3978,
101
+ "step": 650
102
+ },
103
+ {
104
+ "epoch": 0.958904109589041,
105
+ "grad_norm": 1.899760365486145,
106
+ "learning_rate": 2.3592085235920852e-06,
107
+ "loss": 0.3825,
108
+ "step": 700
109
  }
110
  ],
111
  "logging_steps": 50,
 
120
  "should_evaluate": false,
121
  "should_log": false,
122
  "should_save": true,
123
+ "should_training_stop": true
124
  },
125
  "attributes": {}
126
  }