Commit
Β·
7b2562e
1
Parent(s):
aa0242f
Training in progress, step 7500
Browse files- adapter_model.bin +1 -1
- {checkpoint-7100 β checkpoint-7400/adapter_model}/README.md +0 -0
- {checkpoint-7100 β checkpoint-7400/adapter_model}/adapter_config.json +0 -0
- {checkpoint-7100 β checkpoint-7400/adapter_model}/adapter_model.bin +1 -1
- {checkpoint-7100/adapter_model β checkpoint-7500}/README.md +0 -0
- {checkpoint-7100/adapter_model β checkpoint-7500}/adapter_config.json +0 -0
- {checkpoint-7100/adapter_model β checkpoint-7500}/adapter_model.bin +1 -1
- {checkpoint-7100 β checkpoint-7500}/optimizer.pt +1 -1
- {checkpoint-7100 β checkpoint-7500}/rng_state_0.pth +1 -1
- {checkpoint-7100 β checkpoint-7500}/rng_state_1.pth +1 -1
- {checkpoint-7100 β checkpoint-7500}/rng_state_10.pth +1 -1
- {checkpoint-7100 β checkpoint-7500}/rng_state_11.pth +1 -1
- {checkpoint-7100 β checkpoint-7500}/rng_state_12.pth +1 -1
- {checkpoint-7100 β checkpoint-7500}/rng_state_13.pth +1 -1
- {checkpoint-7100 β checkpoint-7500}/rng_state_2.pth +1 -1
- {checkpoint-7100 β checkpoint-7500}/rng_state_3.pth +1 -1
- {checkpoint-7100 β checkpoint-7500}/rng_state_4.pth +1 -1
- {checkpoint-7100 β checkpoint-7500}/rng_state_5.pth +1 -1
- {checkpoint-7100 β checkpoint-7500}/rng_state_6.pth +1 -1
- {checkpoint-7100 β checkpoint-7500}/rng_state_7.pth +1 -1
- {checkpoint-7100 β checkpoint-7500}/rng_state_8.pth +1 -1
- {checkpoint-7100 β checkpoint-7500}/rng_state_9.pth +1 -1
- {checkpoint-7100 β checkpoint-7500}/scheduler.pt +1 -1
- {checkpoint-7100 β checkpoint-7500}/trainer_state.json +99 -3
- {checkpoint-7100 β checkpoint-7500}/training_args.bin +0 -0
adapter_model.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 500897101
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:599a7200aa4c479d11103aabf574f030fbcfd8ec950c813b2ed33cb39a745288
|
| 3 |
size 500897101
|
{checkpoint-7100 β checkpoint-7400/adapter_model}/README.md
RENAMED
|
File without changes
|
{checkpoint-7100 β checkpoint-7400/adapter_model}/adapter_config.json
RENAMED
|
File without changes
|
{checkpoint-7100 β checkpoint-7400/adapter_model}/adapter_model.bin
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 500897101
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:993d2c02240ed3801ddacece59d263018042d38b315c16b83c4dac141857f97b
|
| 3 |
size 500897101
|
{checkpoint-7100/adapter_model β checkpoint-7500}/README.md
RENAMED
|
File without changes
|
{checkpoint-7100/adapter_model β checkpoint-7500}/adapter_config.json
RENAMED
|
File without changes
|
{checkpoint-7100/adapter_model β checkpoint-7500}/adapter_model.bin
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 500897101
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:599a7200aa4c479d11103aabf574f030fbcfd8ec950c813b2ed33cb39a745288
|
| 3 |
size 500897101
|
{checkpoint-7100 β checkpoint-7500}/optimizer.pt
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1001752701
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0fbb0b5a10201f46c10a18c381ad9781e7f0c8efb247be7229f7b7a1d0f59669
|
| 3 |
size 1001752701
|
{checkpoint-7100 β checkpoint-7500}/rng_state_0.pth
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 27772
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cbda122ed6aeb142e9806e2c60595c0fb0345e050a46424ae7e6121a274bdf8f
|
| 3 |
size 27772
|
{checkpoint-7100 β checkpoint-7500}/rng_state_1.pth
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 27772
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:edfe82be00b7fdfa29bc639a42272a413c2f745e99a7dd4e7c019268bffb3c1c
|
| 3 |
size 27772
|
{checkpoint-7100 β checkpoint-7500}/rng_state_10.pth
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 27789
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bfbeff8b08e4ff89601ec54eda1fbaada8fa06897aded9396ba9e47eb6a98ac9
|
| 3 |
size 27789
|
{checkpoint-7100 β checkpoint-7500}/rng_state_11.pth
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 27789
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e488c693c827c1c1bc8761677e2e18ebf62ff097e6a8845c75725b08ee364123
|
| 3 |
size 27789
|
{checkpoint-7100 β checkpoint-7500}/rng_state_12.pth
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 27789
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:70e177e7485bfc4621fd67465543e8b8af515ce3eb17dbc796a813aa9189ca2f
|
| 3 |
size 27789
|
{checkpoint-7100 β checkpoint-7500}/rng_state_13.pth
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 27789
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9d25a7d7bcfccc3ae06e04a8dd31e3a14472b8b1c02eeae89ff0b880b6032932
|
| 3 |
size 27789
|
{checkpoint-7100 β checkpoint-7500}/rng_state_2.pth
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 27772
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:eae779e6cba58f785b1d5fb960336448e1e9e5fc24e9a8e12bca601df697886f
|
| 3 |
size 27772
|
{checkpoint-7100 β checkpoint-7500}/rng_state_3.pth
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 27772
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1608635b1c766955f0811a53d4bd5951addb57bb03975fa838eda4e0ae41f71d
|
| 3 |
size 27772
|
{checkpoint-7100 β checkpoint-7500}/rng_state_4.pth
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 27772
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c7941a1be97c26b733e1df942d0fd78e6aadc9a0e9eb0828e07b31662264008a
|
| 3 |
size 27772
|
{checkpoint-7100 β checkpoint-7500}/rng_state_5.pth
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 27772
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e298e6676cd57f41db105eaecc5bd07d4c75370e7d33e163ca2de445996b0d5e
|
| 3 |
size 27772
|
{checkpoint-7100 β checkpoint-7500}/rng_state_6.pth
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 27772
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:149cb26a6e8eca2a8f06334ca36fc633cc4ddf79e4509a782ff5cbe8d8e3dc8d
|
| 3 |
size 27772
|
{checkpoint-7100 β checkpoint-7500}/rng_state_7.pth
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 27772
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d0fdf62330e049e160395841276b2da25c8f736f4fabca874aa5b00ac0bdedf4
|
| 3 |
size 27772
|
{checkpoint-7100 β checkpoint-7500}/rng_state_8.pth
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 27772
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6a4f0e9da27258f0f79f9d608144e718b994434a9d87531d3afba0531bb1e29f
|
| 3 |
size 27772
|
{checkpoint-7100 β checkpoint-7500}/rng_state_9.pth
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 27772
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a8a8b6af1d78ab083fc6250edfc937e9898abf345d67eb89a8a91af6cbca15e4
|
| 3 |
size 27772
|
{checkpoint-7100 β checkpoint-7500}/scheduler.pt
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 627
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:70dbbed2d23faf20ab6dcce74542b56e86868c5259dd618df042286187825260
|
| 3 |
size 627
|
{checkpoint-7100 β checkpoint-7500}/trainer_state.json
RENAMED
|
@@ -1,8 +1,8 @@
|
|
| 1 |
{
|
| 2 |
"best_metric": null,
|
| 3 |
"best_model_checkpoint": null,
|
| 4 |
-
"epoch": 2.
|
| 5 |
-
"global_step":
|
| 6 |
"is_hyper_param_search": false,
|
| 7 |
"is_local_process_zero": true,
|
| 8 |
"is_world_process_zero": true,
|
|
@@ -1742,11 +1742,107 @@
|
|
| 1742 |
"learning_rate": 3.335016048808437e-06,
|
| 1743 |
"loss": 0.7733,
|
| 1744 |
"step": 7100
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1745 |
}
|
| 1746 |
],
|
| 1747 |
"max_steps": 7737,
|
| 1748 |
"num_train_epochs": 3,
|
| 1749 |
-
"total_flos": 3.
|
| 1750 |
"trial_name": null,
|
| 1751 |
"trial_params": null
|
| 1752 |
}
|
|
|
|
| 1 |
{
|
| 2 |
"best_metric": null,
|
| 3 |
"best_model_checkpoint": null,
|
| 4 |
+
"epoch": 2.908103916246607,
|
| 5 |
+
"global_step": 7500,
|
| 6 |
"is_hyper_param_search": false,
|
| 7 |
"is_local_process_zero": true,
|
| 8 |
"is_world_process_zero": true,
|
|
|
|
| 1742 |
"learning_rate": 3.335016048808437e-06,
|
| 1743 |
"loss": 0.7733,
|
| 1744 |
"step": 7100
|
| 1745 |
+
},
|
| 1746 |
+
{
|
| 1747 |
+
"epoch": 2.76,
|
| 1748 |
+
"learning_rate": 3.0797035363512193e-06,
|
| 1749 |
+
"loss": 0.7685,
|
| 1750 |
+
"step": 7125
|
| 1751 |
+
},
|
| 1752 |
+
{
|
| 1753 |
+
"epoch": 2.77,
|
| 1754 |
+
"learning_rate": 2.834404132647128e-06,
|
| 1755 |
+
"loss": 0.769,
|
| 1756 |
+
"step": 7150
|
| 1757 |
+
},
|
| 1758 |
+
{
|
| 1759 |
+
"epoch": 2.78,
|
| 1760 |
+
"learning_rate": 2.5991431802683262e-06,
|
| 1761 |
+
"loss": 0.7647,
|
| 1762 |
+
"step": 7175
|
| 1763 |
+
},
|
| 1764 |
+
{
|
| 1765 |
+
"epoch": 2.79,
|
| 1766 |
+
"learning_rate": 2.3739449846862826e-06,
|
| 1767 |
+
"loss": 0.7634,
|
| 1768 |
+
"step": 7200
|
| 1769 |
+
},
|
| 1770 |
+
{
|
| 1771 |
+
"epoch": 2.8,
|
| 1772 |
+
"learning_rate": 2.158832811760736e-06,
|
| 1773 |
+
"loss": 0.7617,
|
| 1774 |
+
"step": 7225
|
| 1775 |
+
},
|
| 1776 |
+
{
|
| 1777 |
+
"epoch": 2.81,
|
| 1778 |
+
"learning_rate": 1.95382888533604e-06,
|
| 1779 |
+
"loss": 0.768,
|
| 1780 |
+
"step": 7250
|
| 1781 |
+
},
|
| 1782 |
+
{
|
| 1783 |
+
"epoch": 2.82,
|
| 1784 |
+
"learning_rate": 1.7589543849450996e-06,
|
| 1785 |
+
"loss": 0.7712,
|
| 1786 |
+
"step": 7275
|
| 1787 |
+
},
|
| 1788 |
+
{
|
| 1789 |
+
"epoch": 2.83,
|
| 1790 |
+
"learning_rate": 1.5742294436213223e-06,
|
| 1791 |
+
"loss": 0.7703,
|
| 1792 |
+
"step": 7300
|
| 1793 |
+
},
|
| 1794 |
+
{
|
| 1795 |
+
"epoch": 2.84,
|
| 1796 |
+
"learning_rate": 1.3996731458185697e-06,
|
| 1797 |
+
"loss": 0.7618,
|
| 1798 |
+
"step": 7325
|
| 1799 |
+
},
|
| 1800 |
+
{
|
| 1801 |
+
"epoch": 2.85,
|
| 1802 |
+
"learning_rate": 1.2353035254395352e-06,
|
| 1803 |
+
"loss": 0.7767,
|
| 1804 |
+
"step": 7350
|
| 1805 |
+
},
|
| 1806 |
+
{
|
| 1807 |
+
"epoch": 2.86,
|
| 1808 |
+
"learning_rate": 1.0811375639725341e-06,
|
| 1809 |
+
"loss": 0.7659,
|
| 1810 |
+
"step": 7375
|
| 1811 |
+
},
|
| 1812 |
+
{
|
| 1813 |
+
"epoch": 2.87,
|
| 1814 |
+
"learning_rate": 9.371911887371965e-07,
|
| 1815 |
+
"loss": 0.774,
|
| 1816 |
+
"step": 7400
|
| 1817 |
+
},
|
| 1818 |
+
{
|
| 1819 |
+
"epoch": 2.88,
|
| 1820 |
+
"learning_rate": 8.034792712388828e-07,
|
| 1821 |
+
"loss": 0.7658,
|
| 1822 |
+
"step": 7425
|
| 1823 |
+
},
|
| 1824 |
+
{
|
| 1825 |
+
"epoch": 2.89,
|
| 1826 |
+
"learning_rate": 6.800156256323243e-07,
|
| 1827 |
+
"loss": 0.7626,
|
| 1828 |
+
"step": 7450
|
| 1829 |
+
},
|
| 1830 |
+
{
|
| 1831 |
+
"epoch": 2.9,
|
| 1832 |
+
"learning_rate": 5.6681300729442e-07,
|
| 1833 |
+
"loss": 0.7744,
|
| 1834 |
+
"step": 7475
|
| 1835 |
+
},
|
| 1836 |
+
{
|
| 1837 |
+
"epoch": 2.91,
|
| 1838 |
+
"learning_rate": 4.6388311150644683e-07,
|
| 1839 |
+
"loss": 0.7768,
|
| 1840 |
+
"step": 7500
|
| 1841 |
}
|
| 1842 |
],
|
| 1843 |
"max_steps": 7737,
|
| 1844 |
"num_train_epochs": 3,
|
| 1845 |
+
"total_flos": 3.2299438278321373e+19,
|
| 1846 |
"trial_name": null,
|
| 1847 |
"trial_params": null
|
| 1848 |
}
|
{checkpoint-7100 β checkpoint-7500}/training_args.bin
RENAMED
|
File without changes
|