Commit
·
44b1d94
1
Parent(s):
7b2562e
Training in progress, step 7600
Browse files
- adapter_model.bin +1 -1
- {checkpoint-7200 → checkpoint-7500/adapter_model}/README.md +0 -0
- {checkpoint-7200 → checkpoint-7500/adapter_model}/adapter_config.json +0 -0
- {checkpoint-7200 → checkpoint-7500/adapter_model}/adapter_model.bin +1 -1
- {checkpoint-7200/adapter_model → checkpoint-7600}/README.md +0 -0
- {checkpoint-7200/adapter_model → checkpoint-7600}/adapter_config.json +0 -0
- {checkpoint-7200/adapter_model → checkpoint-7600}/adapter_model.bin +1 -1
- {checkpoint-7200 → checkpoint-7600}/optimizer.pt +1 -1
- {checkpoint-7200 → checkpoint-7600}/rng_state_0.pth +1 -1
- {checkpoint-7200 → checkpoint-7600}/rng_state_1.pth +1 -1
- {checkpoint-7200 → checkpoint-7600}/rng_state_10.pth +1 -1
- {checkpoint-7200 → checkpoint-7600}/rng_state_11.pth +1 -1
- {checkpoint-7200 → checkpoint-7600}/rng_state_12.pth +1 -1
- {checkpoint-7200 → checkpoint-7600}/rng_state_13.pth +1 -1
- {checkpoint-7200 → checkpoint-7600}/rng_state_2.pth +1 -1
- {checkpoint-7200 → checkpoint-7600}/rng_state_3.pth +1 -1
- {checkpoint-7200 → checkpoint-7600}/rng_state_4.pth +1 -1
- {checkpoint-7200 → checkpoint-7600}/rng_state_5.pth +1 -1
- {checkpoint-7200 → checkpoint-7600}/rng_state_6.pth +1 -1
- {checkpoint-7200 → checkpoint-7600}/rng_state_7.pth +1 -1
- {checkpoint-7200 → checkpoint-7600}/rng_state_8.pth +1 -1
- {checkpoint-7200 → checkpoint-7600}/rng_state_9.pth +1 -1
- {checkpoint-7200 → checkpoint-7600}/scheduler.pt +1 -1
- {checkpoint-7200 → checkpoint-7600}/trainer_state.json +99 -3
- {checkpoint-7200 → checkpoint-7600}/training_args.bin +0 -0
adapter_model.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 500897101
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a5ab034d117a0225da8be2f42841fdd56781cdd412727c42b29659f8fe5e1326
|
| 3 |
size 500897101
|
{checkpoint-7200 → checkpoint-7500/adapter_model}/README.md
RENAMED
|
File without changes
|
{checkpoint-7200 → checkpoint-7500/adapter_model}/adapter_config.json
RENAMED
|
File without changes
|
{checkpoint-7200 → checkpoint-7500/adapter_model}/adapter_model.bin
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 500897101
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:599a7200aa4c479d11103aabf574f030fbcfd8ec950c813b2ed33cb39a745288
|
| 3 |
size 500897101
|
{checkpoint-7200/adapter_model → checkpoint-7600}/README.md
RENAMED
|
File without changes
|
{checkpoint-7200/adapter_model → checkpoint-7600}/adapter_config.json
RENAMED
|
File without changes
|
{checkpoint-7200/adapter_model → checkpoint-7600}/adapter_model.bin
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 500897101
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a5ab034d117a0225da8be2f42841fdd56781cdd412727c42b29659f8fe5e1326
|
| 3 |
size 500897101
|
{checkpoint-7200 → checkpoint-7600}/optimizer.pt
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1001752701
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9fb53c8a12296e035ec70bf89911c9255494b238ffbb8f9c7a06d814a5410c87
|
| 3 |
size 1001752701
|
{checkpoint-7200 → checkpoint-7600}/rng_state_0.pth
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 27772
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d92f7eabe45011214c515bfd61da30217ce7b19e595578b578aa64ad13935f7b
|
| 3 |
size 27772
|
{checkpoint-7200 → checkpoint-7600}/rng_state_1.pth
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 27772
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8faed179788c5f007e70cd65b68283fb43b650dd4050572bbd5baf4bdcfbd924
|
| 3 |
size 27772
|
{checkpoint-7200 → checkpoint-7600}/rng_state_10.pth
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 27789
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:61d79bf1140d29880b77d5b59d675f6cde7b6f8b23df1963240456b4cab72a92
|
| 3 |
size 27789
|
{checkpoint-7200 → checkpoint-7600}/rng_state_11.pth
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 27789
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:02ce5e6c819958cba78082c54dc07c058f44ad7e3529ad00f10d119ef3398e40
|
| 3 |
size 27789
|
{checkpoint-7200 → checkpoint-7600}/rng_state_12.pth
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 27789
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:707e4aefa7d3ce06c156b57c6d9066244c741a492606832c0bb2a2ec62ce93f7
|
| 3 |
size 27789
|
{checkpoint-7200 → checkpoint-7600}/rng_state_13.pth
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 27789
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c580d943a9c6477c835e2ef1177fc05e74400a0ecb8d1179ca11160dbf4f9e3f
|
| 3 |
size 27789
|
{checkpoint-7200 → checkpoint-7600}/rng_state_2.pth
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 27772
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3851048fcf00e460a46c0d0afa742a3479d7e22eff758002fb06f5fc4aff5360
|
| 3 |
size 27772
|
{checkpoint-7200 → checkpoint-7600}/rng_state_3.pth
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 27772
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1ad8fccbd226cbad25059f183dbac39878c755c6293504a7508201420371a326
|
| 3 |
size 27772
|
{checkpoint-7200 → checkpoint-7600}/rng_state_4.pth
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 27772
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d169e4e502924fcdcd3c9029b7721729912abdfee723bf2f5b143e0c52278a80
|
| 3 |
size 27772
|
{checkpoint-7200 → checkpoint-7600}/rng_state_5.pth
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 27772
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f2e8219f1f38af388ccb00570e48d852630fd0033dc8f43c45d502afdc72c9cc
|
| 3 |
size 27772
|
{checkpoint-7200 → checkpoint-7600}/rng_state_6.pth
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 27772
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4dbf4092b04aa8341ff54a7b4956a047bbc2f54e34818e66a07cba1653e5e641
|
| 3 |
size 27772
|
{checkpoint-7200 → checkpoint-7600}/rng_state_7.pth
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 27772
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3cee8814ccaee8c0d5e7262c51637788ae0940c5d3a963ac9add18e67c5a5167
|
| 3 |
size 27772
|
{checkpoint-7200 → checkpoint-7600}/rng_state_8.pth
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 27772
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2b2a094ab4a22bd185f1e49e29bfa15330df8c156a20b2a312cfefc754be4779
|
| 3 |
size 27772
|
{checkpoint-7200 → checkpoint-7600}/rng_state_9.pth
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 27772
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1954ff78ec289ceaa33bdc7771b54e14618e8faecc5fba2fdda2fdc84a132170
|
| 3 |
size 27772
|
{checkpoint-7200 → checkpoint-7600}/scheduler.pt
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 627
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a7eb86c35d079e8a2b93e9e3d96c274a24bb1cdec7682fa038d76297f663d7cf
|
| 3 |
size 627
|
{checkpoint-7200 → checkpoint-7600}/trainer_state.json
RENAMED
|
@@ -1,8 +1,8 @@
|
|
| 1 |
{
|
| 2 |
"best_metric": null,
|
| 3 |
"best_model_checkpoint": null,
|
| 4 |
-
"epoch": 2.
|
| 5 |
-
"global_step":
|
| 6 |
"is_hyper_param_search": false,
|
| 7 |
"is_local_process_zero": true,
|
| 8 |
"is_world_process_zero": true,
|
|
@@ -1766,11 +1766,107 @@
|
|
| 1766 |
"learning_rate": 2.3739449846862826e-06,
|
| 1767 |
"loss": 0.7634,
|
| 1768 |
"step": 7200
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1769 |
}
|
| 1770 |
],
|
| 1771 |
"max_steps": 7737,
|
| 1772 |
"num_train_epochs": 3,
|
| 1773 |
-
"total_flos": 3.
|
| 1774 |
"trial_name": null,
|
| 1775 |
"trial_params": null
|
| 1776 |
}
|
|
|
|
| 1 |
{
|
| 2 |
"best_metric": null,
|
| 3 |
"best_model_checkpoint": null,
|
| 4 |
+
"epoch": 2.9468786351298952,
|
| 5 |
+
"global_step": 7600,
|
| 6 |
"is_hyper_param_search": false,
|
| 7 |
"is_local_process_zero": true,
|
| 8 |
"is_world_process_zero": true,
|
|
|
|
| 1766 |
"learning_rate": 2.3739449846862826e-06,
|
| 1767 |
"loss": 0.7634,
|
| 1768 |
"step": 7200
|
| 1769 |
+
},
|
| 1770 |
+
{
|
| 1771 |
+
"epoch": 2.8,
|
| 1772 |
+
"learning_rate": 2.158832811760736e-06,
|
| 1773 |
+
"loss": 0.7617,
|
| 1774 |
+
"step": 7225
|
| 1775 |
+
},
|
| 1776 |
+
{
|
| 1777 |
+
"epoch": 2.81,
|
| 1778 |
+
"learning_rate": 1.95382888533604e-06,
|
| 1779 |
+
"loss": 0.768,
|
| 1780 |
+
"step": 7250
|
| 1781 |
+
},
|
| 1782 |
+
{
|
| 1783 |
+
"epoch": 2.82,
|
| 1784 |
+
"learning_rate": 1.7589543849450996e-06,
|
| 1785 |
+
"loss": 0.7712,
|
| 1786 |
+
"step": 7275
|
| 1787 |
+
},
|
| 1788 |
+
{
|
| 1789 |
+
"epoch": 2.83,
|
| 1790 |
+
"learning_rate": 1.5742294436213223e-06,
|
| 1791 |
+
"loss": 0.7703,
|
| 1792 |
+
"step": 7300
|
| 1793 |
+
},
|
| 1794 |
+
{
|
| 1795 |
+
"epoch": 2.84,
|
| 1796 |
+
"learning_rate": 1.3996731458185697e-06,
|
| 1797 |
+
"loss": 0.7618,
|
| 1798 |
+
"step": 7325
|
| 1799 |
+
},
|
| 1800 |
+
{
|
| 1801 |
+
"epoch": 2.85,
|
| 1802 |
+
"learning_rate": 1.2353035254395352e-06,
|
| 1803 |
+
"loss": 0.7767,
|
| 1804 |
+
"step": 7350
|
| 1805 |
+
},
|
| 1806 |
+
{
|
| 1807 |
+
"epoch": 2.86,
|
| 1808 |
+
"learning_rate": 1.0811375639725341e-06,
|
| 1809 |
+
"loss": 0.7659,
|
| 1810 |
+
"step": 7375
|
| 1811 |
+
},
|
| 1812 |
+
{
|
| 1813 |
+
"epoch": 2.87,
|
| 1814 |
+
"learning_rate": 9.371911887371965e-07,
|
| 1815 |
+
"loss": 0.774,
|
| 1816 |
+
"step": 7400
|
| 1817 |
+
},
|
| 1818 |
+
{
|
| 1819 |
+
"epoch": 2.88,
|
| 1820 |
+
"learning_rate": 8.034792712388828e-07,
|
| 1821 |
+
"loss": 0.7658,
|
| 1822 |
+
"step": 7425
|
| 1823 |
+
},
|
| 1824 |
+
{
|
| 1825 |
+
"epoch": 2.89,
|
| 1826 |
+
"learning_rate": 6.800156256323243e-07,
|
| 1827 |
+
"loss": 0.7626,
|
| 1828 |
+
"step": 7450
|
| 1829 |
+
},
|
| 1830 |
+
{
|
| 1831 |
+
"epoch": 2.9,
|
| 1832 |
+
"learning_rate": 5.6681300729442e-07,
|
| 1833 |
+
"loss": 0.7744,
|
| 1834 |
+
"step": 7475
|
| 1835 |
+
},
|
| 1836 |
+
{
|
| 1837 |
+
"epoch": 2.91,
|
| 1838 |
+
"learning_rate": 4.6388311150644683e-07,
|
| 1839 |
+
"loss": 0.7768,
|
| 1840 |
+
"step": 7500
|
| 1841 |
+
},
|
| 1842 |
+
{
|
| 1843 |
+
"epoch": 2.92,
|
| 1844 |
+
"learning_rate": 3.712365722457922e-07,
|
| 1845 |
+
"loss": 0.7653,
|
| 1846 |
+
"step": 7525
|
| 1847 |
+
},
|
| 1848 |
+
{
|
| 1849 |
+
"epoch": 2.93,
|
| 1850 |
+
"learning_rate": 2.888829610873112e-07,
|
| 1851 |
+
"loss": 0.7675,
|
| 1852 |
+
"step": 7550
|
| 1853 |
+
},
|
| 1854 |
+
{
|
| 1855 |
+
"epoch": 2.94,
|
| 1856 |
+
"learning_rate": 2.168307862144725e-07,
|
| 1857 |
+
"loss": 0.7727,
|
| 1858 |
+
"step": 7575
|
| 1859 |
+
},
|
| 1860 |
+
{
|
| 1861 |
+
"epoch": 2.95,
|
| 1862 |
+
"learning_rate": 1.5508749154037327e-07,
|
| 1863 |
+
"loss": 0.7712,
|
| 1864 |
+
"step": 7600
|
| 1865 |
}
|
| 1866 |
],
|
| 1867 |
"max_steps": 7737,
|
| 1868 |
"num_train_epochs": 3,
|
| 1869 |
+
"total_flos": 3.2730387222263497e+19,
|
| 1870 |
"trial_name": null,
|
| 1871 |
"trial_params": null
|
| 1872 |
}
|
{checkpoint-7200 → checkpoint-7600}/training_args.bin
RENAMED
|
File without changes
|