Commit
·
ffa4692
1
Parent(s):
ba9b273
Training in progress, step 6800
Browse files
- adapter_model.bin +1 -1
- {checkpoint-6400 → checkpoint-6700/adapter_model}/README.md +0 -0
- {checkpoint-6400 → checkpoint-6700/adapter_model}/adapter_config.json +0 -0
- {checkpoint-6400 → checkpoint-6700/adapter_model}/adapter_model.bin +1 -1
- {checkpoint-6400/adapter_model → checkpoint-6800}/README.md +0 -0
- {checkpoint-6400/adapter_model → checkpoint-6800}/adapter_config.json +0 -0
- {checkpoint-6400/adapter_model → checkpoint-6800}/adapter_model.bin +1 -1
- {checkpoint-6400 → checkpoint-6800}/optimizer.pt +1 -1
- {checkpoint-6400 → checkpoint-6800}/rng_state_0.pth +1 -1
- {checkpoint-6400 → checkpoint-6800}/rng_state_1.pth +1 -1
- {checkpoint-6400 → checkpoint-6800}/rng_state_10.pth +1 -1
- {checkpoint-6400 → checkpoint-6800}/rng_state_11.pth +1 -1
- {checkpoint-6400 → checkpoint-6800}/rng_state_12.pth +1 -1
- {checkpoint-6400 → checkpoint-6800}/rng_state_13.pth +1 -1
- {checkpoint-6400 → checkpoint-6800}/rng_state_2.pth +1 -1
- {checkpoint-6400 → checkpoint-6800}/rng_state_3.pth +1 -1
- {checkpoint-6400 → checkpoint-6800}/rng_state_4.pth +1 -1
- {checkpoint-6400 → checkpoint-6800}/rng_state_5.pth +1 -1
- {checkpoint-6400 → checkpoint-6800}/rng_state_6.pth +1 -1
- {checkpoint-6400 → checkpoint-6800}/rng_state_7.pth +1 -1
- {checkpoint-6400 → checkpoint-6800}/rng_state_8.pth +1 -1
- {checkpoint-6400 → checkpoint-6800}/rng_state_9.pth +1 -1
- {checkpoint-6400 → checkpoint-6800}/scheduler.pt +1 -1
- {checkpoint-6400 → checkpoint-6800}/trainer_state.json +99 -3
- {checkpoint-6400 → checkpoint-6800}/training_args.bin +0 -0
adapter_model.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 500897101
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:caee01e1da9f7e92223499414f8bb25b28ea34daf6fb927c9bd869dcba2559fd
|
| 3 |
size 500897101
|
{checkpoint-6400 → checkpoint-6700/adapter_model}/README.md
RENAMED
|
File without changes
|
{checkpoint-6400 → checkpoint-6700/adapter_model}/adapter_config.json
RENAMED
|
File without changes
|
{checkpoint-6400 → checkpoint-6700/adapter_model}/adapter_model.bin
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 500897101
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bcb96297919ffccc23a8f48a581a3185b03d83d73a72799941d2f235cad389d3
|
| 3 |
size 500897101
|
{checkpoint-6400/adapter_model → checkpoint-6800}/README.md
RENAMED
|
File without changes
|
{checkpoint-6400/adapter_model → checkpoint-6800}/adapter_config.json
RENAMED
|
File without changes
|
{checkpoint-6400/adapter_model → checkpoint-6800}/adapter_model.bin
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 500897101
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:caee01e1da9f7e92223499414f8bb25b28ea34daf6fb927c9bd869dcba2559fd
|
| 3 |
size 500897101
|
{checkpoint-6400 → checkpoint-6800}/optimizer.pt
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1001752701
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4a8797c2a2a21d3c99399832b3c5e9972ada7dec6e83cff5de4273cfa1c8c9f7
|
| 3 |
size 1001752701
|
{checkpoint-6400 → checkpoint-6800}/rng_state_0.pth
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 27772
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:76a69b101b534038a0d1cd30c8b1e9841f687d0b3b07df6d02b3916e19b719c2
|
| 3 |
size 27772
|
{checkpoint-6400 → checkpoint-6800}/rng_state_1.pth
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 27772
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f5e8706d00c08c82d30b24671bce72e1fd88ccda2d435bfc8570ef4280b40d47
|
| 3 |
size 27772
|
{checkpoint-6400 → checkpoint-6800}/rng_state_10.pth
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 27789
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8f82da6b92d2dd42eda022db14fa263f4d03e28910c03bf4e97c967f1d893d8f
|
| 3 |
size 27789
|
{checkpoint-6400 → checkpoint-6800}/rng_state_11.pth
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 27789
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:864477484049b3efdc98311c8185fa709645f956dfcbc5f22f55344bde84d440
|
| 3 |
size 27789
|
{checkpoint-6400 → checkpoint-6800}/rng_state_12.pth
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 27789
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4b26c1496ef4023f2612561635f505e587abbdb9e2a946f7d90f08aaa3337aa4
|
| 3 |
size 27789
|
{checkpoint-6400 → checkpoint-6800}/rng_state_13.pth
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 27789
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f3c96078789fb495fd632c506d1671752f888d28d828331ac9ab1506089b50ed
|
| 3 |
size 27789
|
{checkpoint-6400 → checkpoint-6800}/rng_state_2.pth
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 27772
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:61e915fcf4dd8f755df46cb9e5050aaae8b843699fa9edd019950564b2fda05c
|
| 3 |
size 27772
|
{checkpoint-6400 → checkpoint-6800}/rng_state_3.pth
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 27772
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1e81ee1af73dd375865e86e8bf7e0efc15b3d4e65d58ca9f4d3ed4d33561879b
|
| 3 |
size 27772
|
{checkpoint-6400 → checkpoint-6800}/rng_state_4.pth
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 27772
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f9150b049fc2e88708149ace562a8a4c9fef4ae5ea0bb2b8a584401d2abf84b2
|
| 3 |
size 27772
|
{checkpoint-6400 → checkpoint-6800}/rng_state_5.pth
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 27772
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b9632ffce62364279230205690bdfad30fc16e17ef6a0f7efacfbeb73e2b1496
|
| 3 |
size 27772
|
{checkpoint-6400 → checkpoint-6800}/rng_state_6.pth
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 27772
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f0510fe79de24ae1d1cce464b86e9ee2bc9d2fa77099fb7dc30a7866117bd6e7
|
| 3 |
size 27772
|
{checkpoint-6400 → checkpoint-6800}/rng_state_7.pth
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 27772
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3c084b8f84126bddadb7fcd64d22191438d565af4562b1fa9ef192f15ed39f43
|
| 3 |
size 27772
|
{checkpoint-6400 → checkpoint-6800}/rng_state_8.pth
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 27772
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7a3c330abb87810692a9b735e5edfdf7a74760562ee2e69753f40e14ef0d2404
|
| 3 |
size 27772
|
{checkpoint-6400 → checkpoint-6800}/rng_state_9.pth
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 27772
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:002d98d8a4fb73f32df6d2c88a43fb21668bf0821b126886c8586170e99c43d9
|
| 3 |
size 27772
|
{checkpoint-6400 → checkpoint-6800}/scheduler.pt
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 627
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:89396b89609adca20f26c9861c9dcc008dc9de0fbc3e7816552f07bbb0b807a7
|
| 3 |
size 627
|
{checkpoint-6400 → checkpoint-6800}/trainer_state.json
RENAMED
|
@@ -1,8 +1,8 @@
|
|
| 1 |
{
|
| 2 |
"best_metric": null,
|
| 3 |
"best_model_checkpoint": null,
|
| 4 |
-
"epoch": 2.
|
| 5 |
-
"global_step":
|
| 6 |
"is_hyper_param_search": false,
|
| 7 |
"is_local_process_zero": true,
|
| 8 |
"is_world_process_zero": true,
|
|
@@ -1566,11 +1566,107 @@
|
|
| 1566 |
"learning_rate": 1.4414188367884907e-05,
|
| 1567 |
"loss": 0.7668,
|
| 1568 |
"step": 6400
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1569 |
}
|
| 1570 |
],
|
| 1571 |
"max_steps": 7737,
|
| 1572 |
"num_train_epochs": 3,
|
| 1573 |
-
"total_flos": 2.
|
| 1574 |
"trial_name": null,
|
| 1575 |
"trial_params": null
|
| 1576 |
}
|
|
|
|
| 1 |
{
|
| 2 |
"best_metric": null,
|
| 3 |
"best_model_checkpoint": null,
|
| 4 |
+
"epoch": 2.6366808840635905,
|
| 5 |
+
"global_step": 6800,
|
| 6 |
"is_hyper_param_search": false,
|
| 7 |
"is_local_process_zero": true,
|
| 8 |
"is_world_process_zero": true,
|
|
|
|
| 1566 |
"learning_rate": 1.4414188367884907e-05,
|
| 1567 |
"loss": 0.7668,
|
| 1568 |
"step": 6400
|
| 1569 |
+
},
|
| 1570 |
+
{
|
| 1571 |
+
"epoch": 2.49,
|
| 1572 |
+
"learning_rate": 1.3892908218015654e-05,
|
| 1573 |
+
"loss": 0.7662,
|
| 1574 |
+
"step": 6425
|
| 1575 |
+
},
|
| 1576 |
+
{
|
| 1577 |
+
"epoch": 2.5,
|
| 1578 |
+
"learning_rate": 1.3380524034274122e-05,
|
| 1579 |
+
"loss": 0.7689,
|
| 1580 |
+
"step": 6450
|
| 1581 |
+
},
|
| 1582 |
+
{
|
| 1583 |
+
"epoch": 2.51,
|
| 1584 |
+
"learning_rate": 1.2877088752513189e-05,
|
| 1585 |
+
"loss": 0.7694,
|
| 1586 |
+
"step": 6475
|
| 1587 |
+
},
|
| 1588 |
+
{
|
| 1589 |
+
"epoch": 2.52,
|
| 1590 |
+
"learning_rate": 1.2382654384049475e-05,
|
| 1591 |
+
"loss": 0.7714,
|
| 1592 |
+
"step": 6500
|
| 1593 |
+
},
|
| 1594 |
+
{
|
| 1595 |
+
"epoch": 2.53,
|
| 1596 |
+
"learning_rate": 1.1897272010289884e-05,
|
| 1597 |
+
"loss": 0.7701,
|
| 1598 |
+
"step": 6525
|
| 1599 |
+
},
|
| 1600 |
+
{
|
| 1601 |
+
"epoch": 2.54,
|
| 1602 |
+
"learning_rate": 1.1420991777454315e-05,
|
| 1603 |
+
"loss": 0.7628,
|
| 1604 |
+
"step": 6550
|
| 1605 |
+
},
|
| 1606 |
+
{
|
| 1607 |
+
"epoch": 2.55,
|
| 1608 |
+
"learning_rate": 1.0953862891394795e-05,
|
| 1609 |
+
"loss": 0.7661,
|
| 1610 |
+
"step": 6575
|
| 1611 |
+
},
|
| 1612 |
+
{
|
| 1613 |
+
"epoch": 2.56,
|
| 1614 |
+
"learning_rate": 1.0495933612511976e-05,
|
| 1615 |
+
"loss": 0.7729,
|
| 1616 |
+
"step": 6600
|
| 1617 |
+
},
|
| 1618 |
+
{
|
| 1619 |
+
"epoch": 2.57,
|
| 1620 |
+
"learning_rate": 1.0047251250769175e-05,
|
| 1621 |
+
"loss": 0.772,
|
| 1622 |
+
"step": 6625
|
| 1623 |
+
},
|
| 1624 |
+
{
|
| 1625 |
+
"epoch": 2.58,
|
| 1626 |
+
"learning_rate": 9.60786216080466e-06,
|
| 1627 |
+
"loss": 0.7702,
|
| 1628 |
+
"step": 6650
|
| 1629 |
+
},
|
| 1630 |
+
{
|
| 1631 |
+
"epoch": 2.59,
|
| 1632 |
+
"learning_rate": 9.177811737142627e-06,
|
| 1633 |
+
"loss": 0.7711,
|
| 1634 |
+
"step": 6675
|
| 1635 |
+
},
|
| 1636 |
+
{
|
| 1637 |
+
"epoch": 2.6,
|
| 1638 |
+
"learning_rate": 8.757144409503359e-06,
|
| 1639 |
+
"loss": 0.765,
|
| 1640 |
+
"step": 6700
|
| 1641 |
+
},
|
| 1642 |
+
{
|
| 1643 |
+
"epoch": 2.61,
|
| 1644 |
+
"learning_rate": 8.34590363821306e-06,
|
| 1645 |
+
"loss": 0.7713,
|
| 1646 |
+
"step": 6725
|
| 1647 |
+
},
|
| 1648 |
+
{
|
| 1649 |
+
"epoch": 2.62,
|
| 1650 |
+
"learning_rate": 7.944131909713859e-06,
|
| 1651 |
+
"loss": 0.7631,
|
| 1652 |
+
"step": 6750
|
| 1653 |
+
},
|
| 1654 |
+
{
|
| 1655 |
+
"epoch": 2.63,
|
| 1656 |
+
"learning_rate": 7.551870732174416e-06,
|
| 1657 |
+
"loss": 0.767,
|
| 1658 |
+
"step": 6775
|
| 1659 |
+
},
|
| 1660 |
+
{
|
| 1661 |
+
"epoch": 2.64,
|
| 1662 |
+
"learning_rate": 7.169160631201566e-06,
|
| 1663 |
+
"loss": 0.7692,
|
| 1664 |
+
"step": 6800
|
| 1665 |
}
|
| 1666 |
],
|
| 1667 |
"max_steps": 7737,
|
| 1668 |
"num_train_epochs": 3,
|
| 1669 |
+
"total_flos": 2.928513074136613e+19,
|
| 1670 |
"trial_name": null,
|
| 1671 |
"trial_params": null
|
| 1672 |
}
|
{checkpoint-6400 → checkpoint-6800}/training_args.bin
RENAMED
|
File without changes
|