LamaDiab committed on
Commit
83163f1
·
verified ·
1 Parent(s): e68565b

Training in progress, epoch 1, checkpoint

Browse files
checkpoint-22/README.md CHANGED
@@ -98,9 +98,9 @@ print(embeddings.shape)
98
  # Get the similarity scores for the embeddings
99
  similarities = model.similarity(embeddings, embeddings)
100
  print(similarities)
101
- # tensor([[1.0000, 0.9016, 0.4455],
102
- # [0.9016, 1.0000, 0.4424],
103
- # [0.4455, 0.4424, 1.0000]])
104
  ```
105
 
106
  <!--
@@ -174,6 +174,7 @@ You can finetune this model on your own dataset.
174
  - `per_device_eval_batch_size`: 16
175
  - `learning_rate`: 2e-05
176
  - `weight_decay`: 0.001
 
177
  - `warmup_ratio`: 0.2
178
  - `fp16`: True
179
  - `dataloader_num_workers`: 2
@@ -204,7 +205,7 @@ You can finetune this model on your own dataset.
204
  - `adam_beta2`: 0.999
205
  - `adam_epsilon`: 1e-08
206
  - `max_grad_norm`: 1.0
207
- - `num_train_epochs`: 3
208
  - `max_steps`: -1
209
  - `lr_scheduler_type`: linear
210
  - `lr_scheduler_kwargs`: {}
@@ -311,7 +312,7 @@ You can finetune this model on your own dataset.
311
  | Epoch | Step | Training Loss |
312
  |:------:|:----:|:-------------:|
313
  | 0.0455 | 1 | 3.3947 |
314
- | 1.0 | 22 | 2.7614 |
315
 
316
 
317
  ### Framework Versions
 
98
  # Get the similarity scores for the embeddings
99
  similarities = model.similarity(embeddings, embeddings)
100
  print(similarities)
101
+ # tensor([[1.0000, 0.9027, 0.4485],
102
+ # [0.9027, 1.0000, 0.4446],
103
+ # [0.4485, 0.4446, 1.0000]])
104
  ```
105
 
106
  <!--
 
174
  - `per_device_eval_batch_size`: 16
175
  - `learning_rate`: 2e-05
176
  - `weight_decay`: 0.001
177
+ - `num_train_epochs`: 2
178
  - `warmup_ratio`: 0.2
179
  - `fp16`: True
180
  - `dataloader_num_workers`: 2
 
205
  - `adam_beta2`: 0.999
206
  - `adam_epsilon`: 1e-08
207
  - `max_grad_norm`: 1.0
208
+ - `num_train_epochs`: 2
209
  - `max_steps`: -1
210
  - `lr_scheduler_type`: linear
211
  - `lr_scheduler_kwargs`: {}
 
312
  | Epoch | Step | Training Loss |
313
  |:------:|:----:|:-------------:|
314
  | 0.0455 | 1 | 3.3947 |
315
+ | 1.0 | 22 | 2.7163 |
316
 
317
 
318
  ### Framework Versions
checkpoint-22/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ae36f0d49cb7c6e043c6ef223cacbfbe254b437fe8f8231ff156569d9b3720a7
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:44dc75dc88eaa963e3e29998f9ff2c4b342c2b9cc828ed5cc8f06f722ac95d5d
3
  size 90864192
checkpoint-22/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d20014754335e14c3273e770a9a97cae030182098365de37df0f2fbbdde6740a
3
  size 85254842
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3715e5cad0bd7354d05fea88cf40f306a6bc22d5b34fd5f23d539ccc5cb287d
3
  size 85254842
checkpoint-22/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:184a54e4b0325e58e2b676f5bf81fb2212c224be32f3e0d06e2236fd564a2464
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ee0889d2e1f8f81ca0859895fa3b9cec01c8ba200e1012155e6d6bf09d3f55f1
3
  size 1064
checkpoint-22/trainer_state.json CHANGED
@@ -18,16 +18,16 @@
18
  },
19
  {
20
  "epoch": 1.0,
21
- "grad_norm": 25.755640029907227,
22
- "learning_rate": 1.730769230769231e-05,
23
- "loss": 2.7614,
24
  "step": 22
25
  }
26
  ],
27
  "logging_steps": 500,
28
- "max_steps": 66,
29
  "num_input_tokens_seen": 0,
30
- "num_train_epochs": 3,
31
  "save_steps": 500,
32
  "stateful_callbacks": {
33
  "TrainerControl": {
 
18
  },
19
  {
20
  "epoch": 1.0,
21
+ "grad_norm": 25.27043342590332,
22
+ "learning_rate": 1.3142857142857145e-05,
23
+ "loss": 2.7163,
24
  "step": 22
25
  }
26
  ],
27
  "logging_steps": 500,
28
+ "max_steps": 44,
29
  "num_input_tokens_seen": 0,
30
+ "num_train_epochs": 2,
31
  "save_steps": 500,
32
  "stateful_callbacks": {
33
  "TrainerControl": {
checkpoint-22/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3c47de56b6ffbf75451cd50cf54a7faa7e4410fc0c9cb2ddb837b9ec87e9577b
3
  size 5752
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9e91a92ff4d4228b61d5b3b1e6c465ed3cfe5a67113276860cdd9a2015549963
3
  size 5752