fguryel commited on
Commit
5db0525
·
verified ·
1 Parent(s): f0e17d6

Upload folder using huggingface_hub

Browse files
model-00001-of-00002.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:80bcd64f8b28ea0522b23c90d589da4c846b431b7b881449da4660951df57823
3
  size 4991037968
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:563ad1a53ff9968c23e661fbde0971b00547c40f4d286b6a81f100ad3a953090
3
  size 4991037968
model-00002-of-00002.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0d00c654b8158f6603c7785b2e8d5f47d9cb6a25204280ed8587a48e85f66172
3
  size 1610725592
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cae00f32d5364a2e287e59819cabad01b83cc639d9fa338d8f4a929c62f6b094
3
  size 1610725592
optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:076eba10f086da4576d3906878882df2c7186b2daa7ce0f6a7f0437b019a6acc
3
  size 13203690391
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8c768a039ece165c81adc7ffc56067dfc1c0ba40916bd4dd23a66b7db5284ff5
3
  size 13203690391
rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:20ea3a198ff666cb4ace1c684b598fe43fc7c3c276b83efc553a1b787e12a304
3
  size 14645
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9445552595536daf5bd8731be4eabb308bd26e76a3f4f0c20c4aa55fcf9ea202
3
  size 14645
scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:355a4437a5f06b625275e18af63d950b8d65ee72e9119d148de55df74a553f3b
3
  size 1465
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5db160d0d863329e76a33fba4aeedbc2d728eee05bd8deed47128275fa20fabd
3
  size 1465
trainer_state.json CHANGED
@@ -1,10 +1,10 @@
1
  {
2
- "best_global_step": 2000,
3
- "best_metric": 1.2739386558532715,
4
- "best_model_checkpoint": "./orpheus-turkish-emotion-finetune/checkpoint-2000",
5
- "epoch": 9.95202492211838,
6
  "eval_steps": 500,
7
- "global_step": 2000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -320,6 +320,84 @@
320
  "eval_samples_per_second": 11.528,
321
  "eval_steps_per_second": 1.481,
322
  "step": 2000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
323
  }
324
  ],
325
  "logging_steps": 50,
@@ -339,7 +417,7 @@
339
  "attributes": {}
340
  }
341
  },
342
- "total_flos": 5.532530945116078e+17,
343
  "train_batch_size": 1,
344
  "trial_name": null,
345
  "trial_params": null
 
1
  {
2
+ "best_global_step": 2500,
3
+ "best_metric": 1.2259057760238647,
4
+ "best_model_checkpoint": "./orpheus-turkish-emotion-finetune/checkpoint-2500",
5
+ "epoch": 12.44361370716511,
6
  "eval_steps": 500,
7
+ "global_step": 2500,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
320
  "eval_samples_per_second": 11.528,
321
  "eval_steps_per_second": 1.481,
322
  "step": 2000
323
+ },
324
+ {
325
+ "epoch": 10.20436137071651,
326
+ "grad_norm": 0.87109375,
327
+ "learning_rate": 5.701024361409431e-06,
328
+ "loss": 1.2265,
329
+ "step": 2050
330
+ },
331
+ {
332
+ "epoch": 10.453582554517133,
333
+ "grad_norm": 0.95703125,
334
+ "learning_rate": 5.485494740420431e-06,
335
+ "loss": 1.198,
336
+ "step": 2100
337
+ },
338
+ {
339
+ "epoch": 10.702803738317757,
340
+ "grad_norm": 1.7421875,
341
+ "learning_rate": 5.26905012397343e-06,
342
+ "loss": 1.2148,
343
+ "step": 2150
344
+ },
345
+ {
346
+ "epoch": 10.95202492211838,
347
+ "grad_norm": 1.5234375,
348
+ "learning_rate": 5.052098437890215e-06,
349
+ "loss": 1.1983,
350
+ "step": 2200
351
+ },
352
+ {
353
+ "epoch": 11.199376947040498,
354
+ "grad_norm": 1.15625,
355
+ "learning_rate": 4.835048563649499e-06,
356
+ "loss": 1.2025,
357
+ "step": 2250
358
+ },
359
+ {
360
+ "epoch": 11.448598130841122,
361
+ "grad_norm": 1.0078125,
362
+ "learning_rate": 4.6183095677818825e-06,
363
+ "loss": 1.1926,
364
+ "step": 2300
365
+ },
366
+ {
367
+ "epoch": 11.697819314641745,
368
+ "grad_norm": 1.4453125,
369
+ "learning_rate": 4.402289930916053e-06,
370
+ "loss": 1.2022,
371
+ "step": 2350
372
+ },
373
+ {
374
+ "epoch": 11.947040498442368,
375
+ "grad_norm": 1.1328125,
376
+ "learning_rate": 4.187396777929205e-06,
377
+ "loss": 1.2099,
378
+ "step": 2400
379
+ },
380
+ {
381
+ "epoch": 12.194392523364487,
382
+ "grad_norm": 1.625,
383
+ "learning_rate": 3.974035110652596e-06,
384
+ "loss": 1.2093,
385
+ "step": 2450
386
+ },
387
+ {
388
+ "epoch": 12.44361370716511,
389
+ "grad_norm": 1.0625,
390
+ "learning_rate": 3.762607044578357e-06,
391
+ "loss": 1.1972,
392
+ "step": 2500
393
+ },
394
+ {
395
+ "epoch": 12.44361370716511,
396
+ "eval_loss": 1.2259057760238647,
397
+ "eval_runtime": 15.4359,
398
+ "eval_samples_per_second": 11.596,
399
+ "eval_steps_per_second": 1.49,
400
+ "step": 2500
401
  }
402
  ],
403
  "logging_steps": 50,
 
417
  "attributes": {}
418
  }
419
  },
420
+ "total_flos": 6.917655295552389e+17,
421
  "train_batch_size": 1,
422
  "trial_name": null,
423
  "trial_params": null
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e91f58a9a988419f219f097fff3f0e1762f623e4b2b1a8cf942cacee3271dc13
3
  size 5777
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:21019e40285276caa4e865ddd780079cee489dc246be6fcfee79f590b8e47b52
3
  size 5777