File size: 222,029 Bytes
33b63f6 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259 260 261 262 263 264 265 266 267 268 269 270 271 272 273 274 275 276 277 278 279 280 281 282 283 284 285 286 287 288 289 290 291 292 293 294 295 296 297 298 299 300 301 302 303 304 305 306 307 308 309 310 311 312 313 314 315 316 317 318 319 320 321 322 323 324 325 326 327 328 329 330 331 332 333 334 335 336 337 338 339 340 341 342 343 344 345 346 347 348 349 350 351 352 353 354 355 356 357 358 359 360 361 362 363 364 365 366 367 368 369 370 371 372 373 374 375 376 377 378 379 380 381 382 383 384 385 386 387 388 389 390 391 392 393 394 395 396 397 398 399 400 401 402 403 404 405 406 407 408 409 410 411 412 413 414 415 416 417 418 419 420 421 422 423 424 425 426 427 428 429 430 431 432 433 434 435 436 437 438 439 440 441 442 443 444 445 446 447 448 449 450 451 452 453 454 455 456 457 458 459 460 461 462 463 464 465 466 467 468 469 470 471 472 473 474 475 476 477 478 479 480 481 482 483 484 485 486 487 488 489 490 491 492 493 494 495 496 497 498 499 500 501 502 503 504 505 506 507 508 509 510 511 512 513 514 515 516 517 518 519 520 521 522 523 524 525 526 527 528 529 530 531 532 533 534 535 536 537 538 539 540 541 542 543 544 545 546 547 548 549 550 551 552 553 554 555 556 557 558 559 560 561 562 563 564 565 566 567 568 569 570 571 572 573 574 575 576 577 578 579 580 581 582 583 584 585 586 587 588 589 590 591 592 593 594 595 596 597 598 599 600 601 602 603 604 605 606 607 608 609 610 611 612 613 614 615 616 617 618 619 620 621 622 623 624 625 626 627 628 629 630 631 632 633 634 635 636 637 638 639 640 641 642 643 644 645 646 647 648 649 650 651 652 653 654 655 656 657 658 659 660 661 662 663 664 665 666 667 668 669 670 671 672 673 674 675 676 677 678 679 680 681 682 683 684 685 686 687 688 689 690 691 692 693 694 695 696 697 698 699 700 701 702 703 704 705 706 707 708 709 710 711 712 713 714 715 716 717 718 719 720 721 722 723 724 725 726 727 728 729 730 731 732 733 734 735 736 737 738 739 740 741 742 743 744 745 746 747 748 749 750 751 752 753 754 755 756 757 758 759 760 761 762 763 764 765 766 767 768 769 770 771 772 773 774 775 776 777 778 779 780 781 782 783 784 785 786 787 788 789 790 791 792 793 794 795 796 797 798 799 800 801 802 803 804 805 806 807 808 809 810 811 812 813 814 815 816 817 818 819 820 821 822 823 824 825 826 827 828 829 830 831 832 833 834 835 836 837 838 839 840 841 842 843 844 845 846 847 848 849 850 851 852 853 854 855 856 857 858 859 860 861 862 863 864 865 866 867 868 869 870 871 872 873 874 875 876 877 878 879 880 881 882 883 884 885 886 887 888 889 890 891 892 893 894 895 896 897 898 899 900 901 902 903 904 905 906 907 908 909 910 911 912 913 914 915 916 917 918 919 920 921 922 923 924 925 926 927 928 929 930 931 932 933 934 935 936 937 938 939 940 941 942 943 944 945 946 947 948 949 950 951 952 953 954 955 956 957 958 959 960 961 962 963 964 965 966 967 968 969 970 971 972 973 974 975 976 977 978 979 980 981 982 983 984 985 986 987 988 989 990 991 992 993 994 995 996 997 998 999 1000 1001 1002 1003 1004 1005 1006 1007 1008 1009 1010 1011 1012 1013 1014 1015 1016 1017 1018 1019 1020 1021 1022 1023 1024 1025 1026 1027 1028 1029 1030 1031 1032 1033 1034 1035 1036 1037 1038 1039 1040 1041 1042 1043 1044 1045 1046 1047 1048 1049 1050 1051 1052 1053 1054 1055 1056 1057 1058 1059 1060 1061 1062 1063 1064 1065 1066 1067 1068 1069 1070 1071 1072 1073 1074 1075 1076 1077 1078 1079 1080 1081 1082 1083 1084 1085 1086 1087 1088 1089 1090 1091 1092 1093 1094 1095 1096 1097 1098 1099 1100 1101 1102 1103 1104 1105 1106 1107 1108 1109 1110 1111 1112 1113 1114 1115 1116 1117 1118 1119 1120 1121 1122 1123 1124 1125 1126 1127 1128 1129 1130 1131 1132 1133 1134 1135 1136 1137 1138 1139 1140 1141 1142 1143 1144 1145 1146 1147 1148 1149 1150 1151 1152 1153 1154 1155 1156 1157 1158 1159 1160 1161 1162 1163 1164 1165 1166 1167 1168 1169 1170 1171 1172 1173 1174 1175 1176 1177 1178 1179 1180 1181 1182 1183 1184 1185 1186 1187 1188 1189 1190 1191 1192 1193 1194 1195 1196 1197 1198 1199 1200 1201 1202 1203 1204 1205 1206 1207 1208 1209 1210 1211 1212 1213 1214 1215 1216 1217 1218 1219 1220 1221 1222 1223 1224 1225 1226 1227 1228 1229 1230 1231 1232 1233 1234 1235 1236 1237 1238 1239 1240 1241 1242 1243 1244 1245 1246 1247 1248 1249 1250 1251 1252 1253 1254 1255 1256 1257 1258 1259 1260 1261 1262 1263 1264 1265 1266 1267 1268 1269 1270 1271 1272 1273 1274 1275 1276 1277 1278 1279 1280 1281 1282 1283 1284 1285 1286 1287 1288 1289 1290 1291 1292 1293 1294 1295 1296 1297 1298 1299 1300 1301 1302 1303 1304 1305 1306 1307 1308 1309 1310 1311 1312 1313 1314 1315 1316 1317 1318 1319 1320 1321 1322 1323 1324 1325 1326 1327 1328 1329 1330 1331 1332 1333 1334 1335 1336 1337 1338 1339 1340 1341 1342 1343 1344 1345 1346 1347 1348 1349 1350 1351 1352 1353 1354 1355 1356 1357 1358 1359 1360 1361 1362 1363 1364 1365 1366 1367 1368 1369 1370 1371 1372 1373 1374 1375 1376 1377 1378 1379 1380 1381 1382 1383 1384 1385 1386 1387 1388 1389 1390 1391 1392 1393 1394 1395 1396 1397 1398 1399 1400 1401 1402 1403 1404 1405 1406 1407 1408 1409 1410 1411 1412 1413 1414 1415 1416 1417 1418 1419 1420 1421 1422 1423 1424 1425 1426 1427 1428 1429 1430 1431 1432 1433 1434 1435 1436 1437 1438 1439 1440 1441 1442 1443 1444 1445 1446 1447 1448 1449 1450 1451 1452 1453 1454 1455 1456 1457 1458 1459 1460 1461 1462 1463 1464 1465 1466 1467 1468 1469 1470 1471 1472 1473 1474 1475 1476 1477 1478 1479 1480 1481 1482 1483 1484 1485 1486 1487 1488 1489 1490 1491 1492 1493 1494 1495 1496 1497 1498 1499 1500 1501 1502 1503 1504 1505 1506 1507 1508 1509 1510 1511 1512 1513 1514 1515 1516 1517 1518 1519 1520 1521 1522 1523 1524 1525 1526 1527 1528 1529 1530 1531 1532 1533 1534 1535 1536 1537 1538 1539 1540 1541 1542 1543 1544 1545 1546 1547 1548 1549 1550 1551 1552 1553 1554 1555 1556 1557 1558 1559 1560 1561 1562 1563 1564 1565 1566 1567 1568 1569 1570 1571 1572 1573 1574 1575 1576 1577 1578 1579 1580 1581 1582 1583 1584 1585 1586 1587 1588 1589 1590 1591 1592 1593 1594 1595 1596 1597 1598 1599 1600 1601 1602 1603 1604 1605 1606 1607 1608 1609 1610 1611 1612 1613 1614 1615 1616 1617 1618 1619 1620 1621 1622 1623 1624 1625 1626 1627 1628 1629 1630 1631 1632 1633 1634 1635 1636 1637 1638 1639 1640 1641 1642 1643 1644 1645 1646 1647 1648 1649 1650 1651 1652 1653 1654 1655 1656 1657 1658 1659 1660 1661 1662 1663 1664 1665 1666 1667 1668 1669 1670 1671 1672 1673 1674 1675 1676 1677 1678 1679 1680 1681 1682 1683 1684 1685 1686 1687 1688 1689 1690 1691 1692 1693 1694 1695 1696 1697 1698 1699 1700 1701 1702 1703 1704 1705 1706 1707 1708 1709 1710 1711 1712 1713 1714 1715 1716 1717 1718 1719 1720 1721 1722 1723 1724 1725 1726 1727 1728 1729 1730 1731 1732 1733 1734 1735 1736 1737 1738 1739 1740 1741 1742 1743 1744 1745 1746 1747 1748 1749 1750 1751 1752 1753 1754 1755 1756 1757 1758 1759 1760 1761 1762 1763 1764 1765 1766 1767 1768 1769 1770 1771 1772 1773 1774 1775 1776 1777 1778 1779 1780 1781 1782 1783 1784 1785 1786 1787 1788 1789 1790 1791 1792 1793 1794 1795 1796 1797 1798 1799 1800 1801 1802 1803 1804 1805 1806 1807 1808 1809 1810 1811 1812 1813 1814 1815 1816 1817 1818 1819 1820 1821 1822 1823 1824 1825 1826 1827 1828 1829 1830 1831 1832 1833 1834 1835 1836 1837 1838 1839 1840 1841 1842 1843 1844 1845 1846 1847 1848 1849 1850 1851 1852 1853 1854 1855 1856 1857 1858 1859 1860 1861 1862 1863 1864 1865 1866 1867 1868 1869 1870 1871 1872 1873 1874 1875 1876 1877 1878 1879 1880 1881 1882 1883 1884 1885 1886 1887 1888 1889 1890 1891 1892 1893 1894 1895 1896 1897 1898 1899 1900 1901 1902 1903 1904 1905 1906 1907 1908 1909 1910 1911 1912 1913 1914 1915 1916 1917 1918 1919 1920 1921 1922 1923 1924 1925 1926 1927 1928 1929 1930 1931 1932 1933 1934 1935 1936 1937 1938 1939 1940 1941 1942 1943 1944 1945 1946 1947 1948 1949 1950 1951 1952 1953 1954 1955 1956 1957 1958 1959 1960 1961 1962 1963 1964 1965 1966 1967 1968 1969 1970 1971 1972 1973 1974 1975 1976 1977 1978 1979 1980 1981 1982 1983 1984 1985 1986 1987 1988 1989 1990 1991 1992 1993 1994 1995 1996 1997 1998 1999 2000 2001 2002 2003 2004 2005 2006 2007 2008 2009 2010 2011 2012 2013 2014 2015 2016 2017 2018 2019 2020 2021 2022 2023 2024 2025 2026 2027 2028 2029 2030 2031 2032 2033 2034 2035 2036 2037 2038 2039 2040 2041 2042 2043 2044 2045 2046 2047 2048 2049 2050 2051 2052 2053 2054 2055 2056 2057 2058 2059 2060 2061 2062 2063 2064 2065 2066 2067 2068 2069 2070 2071 2072 2073 2074 2075 2076 2077 2078 2079 2080 2081 2082 2083 2084 2085 2086 2087 2088 2089 2090 2091 2092 2093 2094 2095 2096 2097 2098 2099 2100 2101 2102 2103 2104 2105 2106 2107 2108 2109 2110 2111 2112 2113 2114 2115 2116 2117 2118 2119 2120 2121 2122 2123 2124 2125 2126 2127 2128 2129 2130 2131 2132 2133 2134 2135 2136 2137 2138 2139 2140 2141 2142 2143 2144 2145 2146 2147 2148 2149 2150 2151 2152 2153 2154 2155 2156 2157 2158 2159 2160 2161 2162 2163 2164 2165 2166 2167 2168 2169 2170 2171 2172 2173 2174 2175 2176 2177 2178 2179 2180 2181 2182 2183 2184 2185 2186 2187 2188 2189 2190 2191 2192 2193 2194 2195 2196 2197 2198 2199 2200 2201 2202 2203 2204 2205 2206 2207 2208 2209 2210 2211 2212 2213 2214 2215 2216 2217 2218 2219 2220 2221 2222 2223 2224 2225 2226 2227 2228 2229 2230 2231 2232 2233 2234 2235 2236 2237 2238 2239 2240 2241 2242 2243 2244 2245 2246 2247 2248 2249 2250 2251 2252 2253 2254 2255 2256 2257 2258 2259 2260 2261 2262 2263 2264 2265 2266 2267 2268 2269 2270 2271 2272 2273 2274 2275 2276 2277 2278 2279 2280 2281 2282 2283 2284 2285 2286 2287 2288 2289 2290 2291 2292 2293 2294 2295 2296 2297 2298 2299 2300 2301 2302 2303 2304 2305 2306 2307 2308 2309 2310 2311 2312 2313 2314 2315 2316 2317 2318 2319 2320 2321 2322 2323 2324 2325 2326 2327 2328 2329 2330 2331 2332 2333 2334 2335 2336 2337 2338 2339 2340 2341 2342 2343 2344 2345 2346 2347 2348 2349 2350 2351 2352 2353 2354 2355 2356 2357 2358 2359 2360 2361 2362 2363 2364 2365 2366 2367 2368 2369 2370 2371 2372 2373 2374 2375 2376 2377 2378 2379 2380 2381 2382 2383 2384 2385 2386 2387 2388 2389 2390 2391 2392 2393 2394 2395 2396 2397 2398 2399 2400 2401 2402 2403 2404 2405 2406 2407 2408 2409 2410 2411 2412 2413 2414 2415 2416 2417 2418 2419 2420 2421 2422 2423 2424 2425 2426 2427 2428 2429 2430 2431 2432 2433 2434 2435 2436 2437 2438 2439 2440 2441 2442 2443 2444 2445 2446 2447 2448 2449 2450 2451 2452 2453 2454 2455 2456 2457 2458 2459 2460 2461 2462 2463 2464 2465 2466 2467 2468 2469 2470 2471 2472 2473 2474 2475 2476 2477 2478 2479 2480 2481 2482 2483 2484 2485 2486 2487 2488 2489 2490 2491 2492 2493 2494 2495 2496 2497 2498 2499 2500 2501 2502 2503 2504 2505 2506 2507 2508 2509 |
{"num_parameters": 124439808, "trainable_parameters": 124439808, "step": 0}
{"train_info/time_between_train_steps": 3.651843309402466, "step": 0}
{"info/global_step": 1, "train_info/time_within_train_step": 14.495634317398071, "step": 1}
{"train_info": {"train_info/memory_allocated": 1920.9462890625, "train_info/memory_max_allocated": 19760.3271484375, "train_info/memory_reserved": 22624.0, "train_info/memory_max_reserved": 22624.0, "_timestamp": 1737097147, "_runtime": 46}, "step": 1}
{"logs": {"train/loss": 10.9507, "train/learning_rate": 4.9999999999999996e-06, "train/epoch": 0.0, "_timestamp": 1737097147, "_runtime": 46}, "step": 1}
{"train_info/time_between_train_steps": 0.07622003555297852, "step": 1}
{"info/global_step": 2, "train_info/time_within_train_step": 13.958839416503906, "step": 2}
{"train_info/time_between_train_steps": 0.005166292190551758, "step": 2}
{"info/global_step": 3, "train_info/time_within_train_step": 13.829073190689087, "step": 3}
{"train_info/time_between_train_steps": 0.005765199661254883, "step": 3}
{"info/global_step": 4, "train_info/time_within_train_step": 13.982460260391235, "step": 4}
{"train_info/time_between_train_steps": 0.00634312629699707, "step": 4}
{"info/global_step": 5, "train_info/time_within_train_step": 13.828723669052124, "step": 5}
{"train_info/time_between_train_steps": 0.0059163570404052734, "step": 5}
{"info/global_step": 6, "train_info/time_within_train_step": 13.86355185508728, "step": 6}
{"train_info/time_between_train_steps": 0.005631446838378906, "step": 6}
{"info/global_step": 7, "train_info/time_within_train_step": 13.828385353088379, "step": 7}
{"train_info/time_between_train_steps": 0.005902290344238281, "step": 7}
{"info/global_step": 8, "train_info/time_within_train_step": 13.817607164382935, "step": 8}
{"train_info/time_between_train_steps": 0.005295753479003906, "step": 8}
{"info/global_step": 9, "train_info/time_within_train_step": 13.805377006530762, "step": 9}
{"train_info/time_between_train_steps": 0.005673408508300781, "step": 9}
{"info/global_step": 10, "train_info/time_within_train_step": 13.815861701965332, "step": 10}
{"train_info/time_between_train_steps": 0.00545191764831543, "step": 10}
{"info/global_step": 11, "train_info/time_within_train_step": 13.813509464263916, "step": 11}
{"train_info/time_between_train_steps": 0.005859851837158203, "step": 11}
{"info/global_step": 12, "train_info/time_within_train_step": 13.812410116195679, "step": 12}
{"train_info/time_between_train_steps": 0.005579471588134766, "step": 12}
{"info/global_step": 13, "train_info/time_within_train_step": 13.806305170059204, "step": 13}
{"train_info/time_between_train_steps": 0.005228281021118164, "step": 13}
{"info/global_step": 14, "train_info/time_within_train_step": 13.807024955749512, "step": 14}
{"train_info/time_between_train_steps": 0.005578041076660156, "step": 14}
{"info/global_step": 15, "train_info/time_within_train_step": 13.821202754974365, "step": 15}
{"train_info/time_between_train_steps": 0.005373477935791016, "step": 15}
{"info/global_step": 16, "train_info/time_within_train_step": 13.939035415649414, "step": 16}
{"train_info/time_between_train_steps": 0.0055468082427978516, "step": 16}
{"info/global_step": 17, "train_info/time_within_train_step": 13.84096646308899, "step": 17}
{"train_info/time_between_train_steps": 0.0055103302001953125, "step": 17}
{"info/global_step": 18, "train_info/time_within_train_step": 13.82323670387268, "step": 18}
{"train_info/time_between_train_steps": 0.005661725997924805, "step": 18}
{"info/global_step": 19, "train_info/time_within_train_step": 13.816317319869995, "step": 19}
{"train_info/time_between_train_steps": 0.005712985992431641, "step": 19}
{"info/global_step": 20, "train_info/time_within_train_step": 13.82659387588501, "step": 20}
{"train_info/time_between_train_steps": 0.005329608917236328, "step": 20}
{"info/global_step": 21, "train_info/time_within_train_step": 13.827137231826782, "step": 21}
{"train_info/time_between_train_steps": 0.005379915237426758, "step": 21}
{"info/global_step": 22, "train_info/time_within_train_step": 13.819592714309692, "step": 22}
{"train_info/time_between_train_steps": 0.00593256950378418, "step": 22}
{"info/global_step": 23, "train_info/time_within_train_step": 13.8185293674469, "step": 23}
{"train_info/time_between_train_steps": 0.005565643310546875, "step": 23}
{"info/global_step": 24, "train_info/time_within_train_step": 13.833707571029663, "step": 24}
{"train_info/time_between_train_steps": 0.0059168338775634766, "step": 24}
{"info/global_step": 25, "train_info/time_within_train_step": 13.867460012435913, "step": 25}
{"train_info/time_between_train_steps": 0.0071947574615478516, "step": 25}
{"train_info/time_between_train_steps": 7.512251615524292, "step": 25}
{"info/global_step": 26, "train_info/time_within_train_step": 13.816228866577148, "step": 26}
{"train_info/time_between_train_steps": 0.0051593780517578125, "step": 26}
{"info/global_step": 27, "train_info/time_within_train_step": 13.917293787002563, "step": 27}
{"train_info/time_between_train_steps": 0.005263090133666992, "step": 27}
{"info/global_step": 28, "train_info/time_within_train_step": 13.830246210098267, "step": 28}
{"train_info/time_between_train_steps": 0.0054340362548828125, "step": 28}
{"info/global_step": 29, "train_info/time_within_train_step": 13.935914039611816, "step": 29}
{"train_info/time_between_train_steps": 0.005009889602661133, "step": 29}
{"info/global_step": 30, "train_info/time_within_train_step": 13.841666221618652, "step": 30}
{"train_info/time_between_train_steps": 0.005575895309448242, "step": 30}
{"info/global_step": 31, "train_info/time_within_train_step": 13.941828966140747, "step": 31}
{"train_info/time_between_train_steps": 0.005406379699707031, "step": 31}
{"info/global_step": 32, "train_info/time_within_train_step": 13.82960295677185, "step": 32}
{"train_info/time_between_train_steps": 0.005877017974853516, "step": 32}
{"info/global_step": 33, "train_info/time_within_train_step": 13.865059614181519, "step": 33}
{"train_info/time_between_train_steps": 0.005705833435058594, "step": 33}
{"info/global_step": 34, "train_info/time_within_train_step": 13.832172393798828, "step": 34}
{"train_info/time_between_train_steps": 0.0053865909576416016, "step": 34}
{"info/global_step": 35, "train_info/time_within_train_step": 13.832462787628174, "step": 35}
{"train_info/time_between_train_steps": 0.005509138107299805, "step": 35}
{"info/global_step": 36, "train_info/time_within_train_step": 13.841892004013062, "step": 36}
{"train_info/time_between_train_steps": 0.0057108402252197266, "step": 36}
{"info/global_step": 37, "train_info/time_within_train_step": 13.844874858856201, "step": 37}
{"train_info/time_between_train_steps": 0.005314350128173828, "step": 37}
{"info/global_step": 38, "train_info/time_within_train_step": 13.844947099685669, "step": 38}
{"train_info/time_between_train_steps": 0.005612373352050781, "step": 38}
{"info/global_step": 39, "train_info/time_within_train_step": 13.834400177001953, "step": 39}
{"train_info/time_between_train_steps": 0.005843162536621094, "step": 39}
{"info/global_step": 40, "train_info/time_within_train_step": 13.841911315917969, "step": 40}
{"train_info/time_between_train_steps": 0.005139589309692383, "step": 40}
{"info/global_step": 41, "train_info/time_within_train_step": 13.8458833694458, "step": 41}
{"train_info/time_between_train_steps": 0.005734682083129883, "step": 41}
{"info/global_step": 42, "train_info/time_within_train_step": 13.83195447921753, "step": 42}
{"train_info/time_between_train_steps": 0.00589752197265625, "step": 42}
{"info/global_step": 43, "train_info/time_within_train_step": 13.83602786064148, "step": 43}
{"train_info/time_between_train_steps": 0.005743265151977539, "step": 43}
{"info/global_step": 44, "train_info/time_within_train_step": 13.830932855606079, "step": 44}
{"train_info/time_between_train_steps": 0.005700588226318359, "step": 44}
{"info/global_step": 45, "train_info/time_within_train_step": 13.858396768569946, "step": 45}
{"train_info/time_between_train_steps": 0.0057294368743896484, "step": 45}
{"info/global_step": 46, "train_info/time_within_train_step": 13.863159894943237, "step": 46}
{"train_info/time_between_train_steps": 0.005889892578125, "step": 46}
{"info/global_step": 47, "train_info/time_within_train_step": 13.93877625465393, "step": 47}
{"train_info/time_between_train_steps": 0.005537271499633789, "step": 47}
{"info/global_step": 48, "train_info/time_within_train_step": 13.842863082885742, "step": 48}
{"train_info/time_between_train_steps": 0.005950450897216797, "step": 48}
{"info/global_step": 49, "train_info/time_within_train_step": 13.848151206970215, "step": 49}
{"train_info/time_between_train_steps": 0.00667881965637207, "step": 49}
{"info/global_step": 50, "train_info/time_within_train_step": 13.871625423431396, "step": 50}
{"train_info": {"train_info/memory_allocated": 1920.9462890625, "train_info/memory_max_allocated": 20711.3779296875, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1737097835, "_runtime": 734}, "step": 50}
{"logs": {"train/loss": 8.5124, "train/learning_rate": 0.00025, "train/epoch": 1.02, "_timestamp": 1737097835, "_runtime": 734}, "step": 50}
{"train_info/time_between_train_steps": 0.03543567657470703, "step": 50}
{"train_info/time_between_train_steps": 7.5914506912231445, "step": 50}
{"info/global_step": 51, "train_info/time_within_train_step": 13.812689542770386, "step": 51}
{"train_info/time_between_train_steps": 0.004988431930541992, "step": 51}
{"info/global_step": 52, "train_info/time_within_train_step": 13.908324480056763, "step": 52}
{"train_info/time_between_train_steps": 0.0053293704986572266, "step": 52}
{"info/global_step": 53, "train_info/time_within_train_step": 13.816579103469849, "step": 53}
{"train_info/time_between_train_steps": 0.00535130500793457, "step": 53}
{"info/global_step": 54, "train_info/time_within_train_step": 13.979037761688232, "step": 54}
{"train_info/time_between_train_steps": 0.0051229000091552734, "step": 54}
{"info/global_step": 55, "train_info/time_within_train_step": 13.836976051330566, "step": 55}
{"train_info/time_between_train_steps": 0.006157875061035156, "step": 55}
{"info/global_step": 56, "train_info/time_within_train_step": 13.87308645248413, "step": 56}
{"train_info/time_between_train_steps": 0.006233930587768555, "step": 56}
{"info/global_step": 57, "train_info/time_within_train_step": 13.853703498840332, "step": 57}
{"train_info/time_between_train_steps": 0.005199909210205078, "step": 57}
{"info/global_step": 58, "train_info/time_within_train_step": 13.845409393310547, "step": 58}
{"train_info/time_between_train_steps": 0.00507807731628418, "step": 58}
{"info/global_step": 59, "train_info/time_within_train_step": 13.835512161254883, "step": 59}
{"train_info/time_between_train_steps": 0.005392789840698242, "step": 59}
{"info/global_step": 60, "train_info/time_within_train_step": 13.832730531692505, "step": 60}
{"train_info/time_between_train_steps": 0.005220890045166016, "step": 60}
{"info/global_step": 61, "train_info/time_within_train_step": 13.842274904251099, "step": 61}
{"train_info/time_between_train_steps": 0.005712747573852539, "step": 61}
{"info/global_step": 62, "train_info/time_within_train_step": 13.942237138748169, "step": 62}
{"train_info/time_between_train_steps": 0.005675554275512695, "step": 62}
{"info/global_step": 63, "train_info/time_within_train_step": 13.83247709274292, "step": 63}
{"train_info/time_between_train_steps": 0.005379676818847656, "step": 63}
{"info/global_step": 64, "train_info/time_within_train_step": 13.833400249481201, "step": 64}
{"train_info/time_between_train_steps": 0.005734920501708984, "step": 64}
{"info/global_step": 65, "train_info/time_within_train_step": 13.834809064865112, "step": 65}
{"train_info/time_between_train_steps": 0.005745887756347656, "step": 65}
{"info/global_step": 66, "train_info/time_within_train_step": 13.842426538467407, "step": 66}
{"train_info/time_between_train_steps": 0.0053958892822265625, "step": 66}
{"info/global_step": 67, "train_info/time_within_train_step": 13.838959217071533, "step": 67}
{"train_info/time_between_train_steps": 0.005594015121459961, "step": 67}
{"info/global_step": 68, "train_info/time_within_train_step": 13.832815885543823, "step": 68}
{"train_info/time_between_train_steps": 0.00530695915222168, "step": 68}
{"info/global_step": 69, "train_info/time_within_train_step": 13.839927673339844, "step": 69}
{"train_info/time_between_train_steps": 0.005855560302734375, "step": 69}
{"info/global_step": 70, "train_info/time_within_train_step": 13.84283185005188, "step": 70}
{"train_info/time_between_train_steps": 0.005950212478637695, "step": 70}
{"info/global_step": 71, "train_info/time_within_train_step": 13.844999313354492, "step": 71}
{"train_info/time_between_train_steps": 0.005645751953125, "step": 71}
{"info/global_step": 72, "train_info/time_within_train_step": 13.880637168884277, "step": 72}
{"train_info/time_between_train_steps": 0.0060100555419921875, "step": 72}
{"info/global_step": 73, "train_info/time_within_train_step": 13.849247932434082, "step": 73}
{"train_info/time_between_train_steps": 0.005659341812133789, "step": 73}
{"info/global_step": 74, "train_info/time_within_train_step": 13.857091903686523, "step": 74}
{"train_info/time_between_train_steps": 0.006218433380126953, "step": 74}
{"info/global_step": 75, "train_info/time_within_train_step": 13.89611554145813, "step": 75}
{"train_info/time_between_train_steps": 0.006189584732055664, "step": 75}
{"train_info/time_between_train_steps": 7.536259174346924, "step": 75}
{"info/global_step": 76, "train_info/time_within_train_step": 13.807922601699829, "step": 76}
{"train_info/time_between_train_steps": 0.0057430267333984375, "step": 76}
{"info/global_step": 77, "train_info/time_within_train_step": 14.044120073318481, "step": 77}
{"train_info/time_between_train_steps": 0.0057489871978759766, "step": 77}
{"info/global_step": 78, "train_info/time_within_train_step": 13.829282760620117, "step": 78}
{"train_info/time_between_train_steps": 0.005922555923461914, "step": 78}
{"info/global_step": 79, "train_info/time_within_train_step": 13.934227228164673, "step": 79}
{"train_info/time_between_train_steps": 0.005868434906005859, "step": 79}
{"info/global_step": 80, "train_info/time_within_train_step": 13.8536696434021, "step": 80}
{"train_info/time_between_train_steps": 0.005242824554443359, "step": 80}
{"info/global_step": 81, "train_info/time_within_train_step": 13.868852376937866, "step": 81}
{"train_info/time_between_train_steps": 0.005728721618652344, "step": 81}
{"info/global_step": 82, "train_info/time_within_train_step": 13.841040134429932, "step": 82}
{"train_info/time_between_train_steps": 0.0059130191802978516, "step": 82}
{"info/global_step": 83, "train_info/time_within_train_step": 13.844797611236572, "step": 83}
{"train_info/time_between_train_steps": 0.00559544563293457, "step": 83}
{"info/global_step": 84, "train_info/time_within_train_step": 13.844639539718628, "step": 84}
{"train_info/time_between_train_steps": 0.0054531097412109375, "step": 84}
{"info/global_step": 85, "train_info/time_within_train_step": 13.837765455245972, "step": 85}
{"train_info/time_between_train_steps": 0.005219221115112305, "step": 85}
{"info/global_step": 86, "train_info/time_within_train_step": 13.842440366744995, "step": 86}
{"train_info/time_between_train_steps": 0.005440235137939453, "step": 86}
{"info/global_step": 87, "train_info/time_within_train_step": 13.870681762695312, "step": 87}
{"train_info/time_between_train_steps": 0.005411863327026367, "step": 87}
{"info/global_step": 88, "train_info/time_within_train_step": 13.850825309753418, "step": 88}
{"train_info/time_between_train_steps": 0.005508899688720703, "step": 88}
{"info/global_step": 89, "train_info/time_within_train_step": 13.839478492736816, "step": 89}
{"train_info/time_between_train_steps": 0.005335569381713867, "step": 89}
{"info/global_step": 90, "train_info/time_within_train_step": 13.851691246032715, "step": 90}
{"train_info/time_between_train_steps": 0.005591154098510742, "step": 90}
{"info/global_step": 91, "train_info/time_within_train_step": 13.848241329193115, "step": 91}
{"train_info/time_between_train_steps": 0.005427360534667969, "step": 91}
{"info/global_step": 92, "train_info/time_within_train_step": 13.84625768661499, "step": 92}
{"train_info/time_between_train_steps": 0.005717277526855469, "step": 92}
{"info/global_step": 93, "train_info/time_within_train_step": 13.935770750045776, "step": 93}
{"train_info/time_between_train_steps": 0.0058002471923828125, "step": 93}
{"info/global_step": 94, "train_info/time_within_train_step": 13.852592706680298, "step": 94}
{"train_info/time_between_train_steps": 0.005707979202270508, "step": 94}
{"info/global_step": 95, "train_info/time_within_train_step": 13.860313177108765, "step": 95}
{"train_info/time_between_train_steps": 0.005658864974975586, "step": 95}
{"info/global_step": 96, "train_info/time_within_train_step": 13.880605220794678, "step": 96}
{"train_info/time_between_train_steps": 0.005869626998901367, "step": 96}
{"info/global_step": 97, "train_info/time_within_train_step": 13.877039909362793, "step": 97}
{"train_info/time_between_train_steps": 0.00604557991027832, "step": 97}
{"info/global_step": 98, "train_info/time_within_train_step": 13.866673707962036, "step": 98}
{"train_info/time_between_train_steps": 0.005671501159667969, "step": 98}
{"info/global_step": 99, "train_info/time_within_train_step": 13.87063193321228, "step": 99}
{"train_info/time_between_train_steps": 0.0058956146240234375, "step": 99}
{"info/global_step": 100, "train_info/time_within_train_step": 14.280521631240845, "step": 100}
{"train_info": {"train_info/memory_allocated": 1920.9462890625, "train_info/memory_max_allocated": 20711.3779296875, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1737098546, "_runtime": 1445}, "step": 100}
{"logs": {"train/loss": 7.4735, "train/learning_rate": 0.0005, "train/epoch": 3.02, "_timestamp": 1737098546, "_runtime": 1445}, "step": 100}
{"train_info/time_between_train_steps": 109.582270860672, "step": 100}
{"train_info/time_between_train_steps": 117.15802836418152, "step": 100}
{"info/global_step": 101, "train_info/time_within_train_step": 13.76877212524414, "step": 101}
{"train_info/time_between_train_steps": 0.005624055862426758, "step": 101}
{"info/global_step": 102, "train_info/time_within_train_step": 13.899270057678223, "step": 102}
{"train_info/time_between_train_steps": 0.005658626556396484, "step": 102}
{"info/global_step": 103, "train_info/time_within_train_step": 13.84934377670288, "step": 103}
{"train_info/time_between_train_steps": 0.005307435989379883, "step": 103}
{"info/global_step": 104, "train_info/time_within_train_step": 13.927623271942139, "step": 104}
{"train_info/time_between_train_steps": 0.005502462387084961, "step": 104}
{"info/global_step": 105, "train_info/time_within_train_step": 13.821584939956665, "step": 105}
{"train_info/time_between_train_steps": 0.005231618881225586, "step": 105}
{"info/global_step": 106, "train_info/time_within_train_step": 13.832173824310303, "step": 106}
{"train_info/time_between_train_steps": 0.00555872917175293, "step": 106}
{"info/global_step": 107, "train_info/time_within_train_step": 13.813844680786133, "step": 107}
{"train_info/time_between_train_steps": 0.005377292633056641, "step": 107}
{"info/global_step": 108, "train_info/time_within_train_step": 13.923242330551147, "step": 108}
{"train_info/time_between_train_steps": 0.005576133728027344, "step": 108}
{"info/global_step": 109, "train_info/time_within_train_step": 13.830071926116943, "step": 109}
{"train_info/time_between_train_steps": 0.0059051513671875, "step": 109}
{"info/global_step": 110, "train_info/time_within_train_step": 13.83593463897705, "step": 110}
{"train_info/time_between_train_steps": 0.005677700042724609, "step": 110}
{"info/global_step": 111, "train_info/time_within_train_step": 13.830904960632324, "step": 111}
{"train_info/time_between_train_steps": 0.005722999572753906, "step": 111}
{"info/global_step": 112, "train_info/time_within_train_step": 13.928680658340454, "step": 112}
{"train_info/time_between_train_steps": 0.0051763057708740234, "step": 112}
{"info/global_step": 113, "train_info/time_within_train_step": 13.830489158630371, "step": 113}
{"train_info/time_between_train_steps": 0.005099058151245117, "step": 113}
{"info/global_step": 114, "train_info/time_within_train_step": 13.844315767288208, "step": 114}
{"train_info/time_between_train_steps": 0.005494117736816406, "step": 114}
{"info/global_step": 115, "train_info/time_within_train_step": 13.847568273544312, "step": 115}
{"train_info/time_between_train_steps": 0.0057795047760009766, "step": 115}
{"info/global_step": 116, "train_info/time_within_train_step": 13.846116781234741, "step": 116}
{"train_info/time_between_train_steps": 0.005774736404418945, "step": 116}
{"info/global_step": 117, "train_info/time_within_train_step": 13.842009782791138, "step": 117}
{"train_info/time_between_train_steps": 0.0053327083587646484, "step": 117}
{"info/global_step": 118, "train_info/time_within_train_step": 13.853203535079956, "step": 118}
{"train_info/time_between_train_steps": 0.005584716796875, "step": 118}
{"info/global_step": 119, "train_info/time_within_train_step": 13.829362869262695, "step": 119}
{"train_info/time_between_train_steps": 0.00487208366394043, "step": 119}
{"info/global_step": 120, "train_info/time_within_train_step": 13.822247505187988, "step": 120}
{"train_info/time_between_train_steps": 0.005978822708129883, "step": 120}
{"info/global_step": 121, "train_info/time_within_train_step": 13.861863374710083, "step": 121}
{"train_info/time_between_train_steps": 0.005539894104003906, "step": 121}
{"info/global_step": 122, "train_info/time_within_train_step": 13.836488723754883, "step": 122}
{"train_info/time_between_train_steps": 0.005528688430786133, "step": 122}
{"info/global_step": 123, "train_info/time_within_train_step": 13.846813201904297, "step": 123}
{"train_info/time_between_train_steps": 0.005690813064575195, "step": 123}
{"info/global_step": 124, "train_info/time_within_train_step": 13.936060905456543, "step": 124}
{"train_info/time_between_train_steps": 0.0057010650634765625, "step": 124}
{"info/global_step": 125, "train_info/time_within_train_step": 13.95935583114624, "step": 125}
{"train_info/time_between_train_steps": 0.006719827651977539, "step": 125}
{"train_info/time_between_train_steps": 7.693514823913574, "step": 125}
{"info/global_step": 126, "train_info/time_within_train_step": 13.804117918014526, "step": 126}
{"train_info/time_between_train_steps": 0.0053217411041259766, "step": 126}
{"info/global_step": 127, "train_info/time_within_train_step": 13.902634859085083, "step": 127}
{"train_info/time_between_train_steps": 0.0060269832611083984, "step": 127}
{"info/global_step": 128, "train_info/time_within_train_step": 13.813904047012329, "step": 128}
{"train_info/time_between_train_steps": 0.005480527877807617, "step": 128}
{"info/global_step": 129, "train_info/time_within_train_step": 13.983883142471313, "step": 129}
{"train_info/time_between_train_steps": 0.005998373031616211, "step": 129}
{"info/global_step": 130, "train_info/time_within_train_step": 13.840449571609497, "step": 130}
{"train_info/time_between_train_steps": 0.005888700485229492, "step": 130}
{"info/global_step": 131, "train_info/time_within_train_step": 13.848274230957031, "step": 131}
{"train_info/time_between_train_steps": 0.005639553070068359, "step": 131}
{"info/global_step": 132, "train_info/time_within_train_step": 13.823298454284668, "step": 132}
{"train_info/time_between_train_steps": 0.005388021469116211, "step": 132}
{"info/global_step": 133, "train_info/time_within_train_step": 13.909822463989258, "step": 133}
{"train_info/time_between_train_steps": 0.0057337284088134766, "step": 133}
{"info/global_step": 134, "train_info/time_within_train_step": 13.81893253326416, "step": 134}
{"train_info/time_between_train_steps": 0.0052607059478759766, "step": 134}
{"info/global_step": 135, "train_info/time_within_train_step": 13.829563617706299, "step": 135}
{"train_info/time_between_train_steps": 0.005789995193481445, "step": 135}
{"info/global_step": 136, "train_info/time_within_train_step": 13.841821432113647, "step": 136}
{"train_info/time_between_train_steps": 0.005441904067993164, "step": 136}
{"info/global_step": 137, "train_info/time_within_train_step": 13.853350162506104, "step": 137}
{"train_info/time_between_train_steps": 0.00543522834777832, "step": 137}
{"info/global_step": 138, "train_info/time_within_train_step": 13.8328378200531, "step": 138}
{"train_info/time_between_train_steps": 0.005598783493041992, "step": 138}
{"info/global_step": 139, "train_info/time_within_train_step": 13.929934024810791, "step": 139}
{"train_info/time_between_train_steps": 0.005712032318115234, "step": 139}
{"info/global_step": 140, "train_info/time_within_train_step": 13.83250641822815, "step": 140}
{"train_info/time_between_train_steps": 0.00551295280456543, "step": 140}
{"info/global_step": 141, "train_info/time_within_train_step": 13.825500011444092, "step": 141}
{"train_info/time_between_train_steps": 0.0056896209716796875, "step": 141}
{"info/global_step": 142, "train_info/time_within_train_step": 13.854364395141602, "step": 142}
{"train_info/time_between_train_steps": 0.005481243133544922, "step": 142}
{"info/global_step": 143, "train_info/time_within_train_step": 13.83500337600708, "step": 143}
{"train_info/time_between_train_steps": 0.0057489871978759766, "step": 143}
{"info/global_step": 144, "train_info/time_within_train_step": 13.827605962753296, "step": 144}
{"train_info/time_between_train_steps": 0.005588531494140625, "step": 144}
{"info/global_step": 145, "train_info/time_within_train_step": 13.84089207649231, "step": 145}
{"train_info/time_between_train_steps": 0.005625009536743164, "step": 145}
{"info/global_step": 146, "train_info/time_within_train_step": 13.867924451828003, "step": 146}
{"train_info/time_between_train_steps": 0.0061299800872802734, "step": 146}
{"info/global_step": 147, "train_info/time_within_train_step": 13.866628885269165, "step": 147}
{"train_info/time_between_train_steps": 0.006115913391113281, "step": 147}
{"info/global_step": 148, "train_info/time_within_train_step": 13.846845626831055, "step": 148}
{"train_info/time_between_train_steps": 0.005875110626220703, "step": 148}
{"info/global_step": 149, "train_info/time_within_train_step": 13.843868494033813, "step": 149}
{"train_info/time_between_train_steps": 0.00597691535949707, "step": 149}
{"info/global_step": 150, "train_info/time_within_train_step": 13.968989372253418, "step": 150}
{"train_info": {"train_info/memory_allocated": 1920.9462890625, "train_info/memory_max_allocated": 20711.3779296875, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1737099365, "_runtime": 2264}, "step": 150}
{"logs": {"train/loss": 7.3737, "train/learning_rate": 0.0005833333333333333, "train/epoch": 5.02, "_timestamp": 1737099365, "_runtime": 2264}, "step": 150}
{"train_info/time_between_train_steps": 0.06899213790893555, "step": 150}
{"train_info/time_between_train_steps": 7.599406003952026, "step": 150}
{"info/global_step": 151, "train_info/time_within_train_step": 13.827031135559082, "step": 151}
{"train_info/time_between_train_steps": 0.004981279373168945, "step": 151}
{"info/global_step": 152, "train_info/time_within_train_step": 13.918840169906616, "step": 152}
{"train_info/time_between_train_steps": 0.005354166030883789, "step": 152}
{"info/global_step": 153, "train_info/time_within_train_step": 13.8481125831604, "step": 153}
{"train_info/time_between_train_steps": 0.004574298858642578, "step": 153}
{"info/global_step": 154, "train_info/time_within_train_step": 14.113589525222778, "step": 154}
{"train_info/time_between_train_steps": 0.005168437957763672, "step": 154}
{"info/global_step": 155, "train_info/time_within_train_step": 13.851067781448364, "step": 155}
{"train_info/time_between_train_steps": 0.005224704742431641, "step": 155}
{"info/global_step": 156, "train_info/time_within_train_step": 13.890329360961914, "step": 156}
{"train_info/time_between_train_steps": 0.0057299137115478516, "step": 156}
{"info/global_step": 157, "train_info/time_within_train_step": 13.852158784866333, "step": 157}
{"train_info/time_between_train_steps": 0.005201816558837891, "step": 157}
{"info/global_step": 158, "train_info/time_within_train_step": 13.84146785736084, "step": 158}
{"train_info/time_between_train_steps": 0.005689859390258789, "step": 158}
{"info/global_step": 159, "train_info/time_within_train_step": 13.847963571548462, "step": 159}
{"train_info/time_between_train_steps": 0.00526881217956543, "step": 159}
{"info/global_step": 160, "train_info/time_within_train_step": 13.843003749847412, "step": 160}
{"train_info/time_between_train_steps": 0.0054094791412353516, "step": 160}
{"info/global_step": 161, "train_info/time_within_train_step": 13.84562873840332, "step": 161}
{"train_info/time_between_train_steps": 0.0049152374267578125, "step": 161}
{"info/global_step": 162, "train_info/time_within_train_step": 13.845022916793823, "step": 162}
{"train_info/time_between_train_steps": 0.0057981014251708984, "step": 162}
{"info/global_step": 163, "train_info/time_within_train_step": 13.918141841888428, "step": 163}
{"train_info/time_between_train_steps": 0.005298614501953125, "step": 163}
{"info/global_step": 164, "train_info/time_within_train_step": 13.861958742141724, "step": 164}
{"train_info/time_between_train_steps": 0.005187034606933594, "step": 164}
{"info/global_step": 165, "train_info/time_within_train_step": 13.852068185806274, "step": 165}
{"train_info/time_between_train_steps": 0.005230426788330078, "step": 165}
{"info/global_step": 166, "train_info/time_within_train_step": 13.85152268409729, "step": 166}
{"train_info/time_between_train_steps": 0.006046772003173828, "step": 166}
{"info/global_step": 167, "train_info/time_within_train_step": 13.851981401443481, "step": 167}
{"train_info/time_between_train_steps": 0.005777597427368164, "step": 167}
{"info/global_step": 168, "train_info/time_within_train_step": 13.841321229934692, "step": 168}
{"train_info/time_between_train_steps": 0.0048828125, "step": 168}
{"info/global_step": 169, "train_info/time_within_train_step": 13.848992824554443, "step": 169}
{"train_info/time_between_train_steps": 0.004811525344848633, "step": 169}
{"info/global_step": 170, "train_info/time_within_train_step": 13.941188097000122, "step": 170}
{"train_info/time_between_train_steps": 0.005818843841552734, "step": 170}
{"info/global_step": 171, "train_info/time_within_train_step": 14.011463642120361, "step": 171}
{"train_info/time_between_train_steps": 0.005174398422241211, "step": 171}
{"info/global_step": 172, "train_info/time_within_train_step": 13.85854983329773, "step": 172}
{"train_info/time_between_train_steps": 0.005579471588134766, "step": 172}
{"info/global_step": 173, "train_info/time_within_train_step": 13.85366702079773, "step": 173}
{"train_info/time_between_train_steps": 0.005179882049560547, "step": 173}
{"info/global_step": 174, "train_info/time_within_train_step": 13.865458726882935, "step": 174}
{"train_info/time_between_train_steps": 0.0061986446380615234, "step": 174}
{"info/global_step": 175, "train_info/time_within_train_step": 13.884835481643677, "step": 175}
{"train_info/time_between_train_steps": 0.006198883056640625, "step": 175}
{"train_info/time_between_train_steps": 7.66816520690918, "step": 175}
{"info/global_step": 176, "train_info/time_within_train_step": 13.843709945678711, "step": 176}
{"train_info/time_between_train_steps": 0.0055391788482666016, "step": 176}
{"info/global_step": 177, "train_info/time_within_train_step": 13.969459533691406, "step": 177}
{"train_info/time_between_train_steps": 0.0058553218841552734, "step": 177}
{"info/global_step": 178, "train_info/time_within_train_step": 13.843518257141113, "step": 178}
{"train_info/time_between_train_steps": 0.005095958709716797, "step": 178}
{"info/global_step": 179, "train_info/time_within_train_step": 13.959421634674072, "step": 179}
{"train_info/time_between_train_steps": 0.00535130500793457, "step": 179}
{"info/global_step": 180, "train_info/time_within_train_step": 13.848195552825928, "step": 180}
{"train_info/time_between_train_steps": 0.005289316177368164, "step": 180}
{"info/global_step": 181, "train_info/time_within_train_step": 13.871253490447998, "step": 181}
{"train_info/time_between_train_steps": 0.00536036491394043, "step": 181}
{"info/global_step": 182, "train_info/time_within_train_step": 13.85477876663208, "step": 182}
{"train_info/time_between_train_steps": 0.004901409149169922, "step": 182}
{"info/global_step": 183, "train_info/time_within_train_step": 13.839570045471191, "step": 183}
{"train_info/time_between_train_steps": 0.004925727844238281, "step": 183}
{"info/global_step": 184, "train_info/time_within_train_step": 13.8748197555542, "step": 184}
{"train_info/time_between_train_steps": 0.0054509639739990234, "step": 184}
{"info/global_step": 185, "train_info/time_within_train_step": 13.937409162521362, "step": 185}
{"train_info/time_between_train_steps": 0.005052089691162109, "step": 185}
{"info/global_step": 186, "train_info/time_within_train_step": 13.834811687469482, "step": 186}
{"train_info/time_between_train_steps": 0.005377292633056641, "step": 186}
{"info/global_step": 187, "train_info/time_within_train_step": 13.845189571380615, "step": 187}
{"train_info/time_between_train_steps": 0.004921913146972656, "step": 187}
{"info/global_step": 188, "train_info/time_within_train_step": 13.848725318908691, "step": 188}
{"train_info/time_between_train_steps": 0.005146503448486328, "step": 188}
{"info/global_step": 189, "train_info/time_within_train_step": 13.848942518234253, "step": 189}
{"train_info/time_between_train_steps": 0.005303621292114258, "step": 189}
{"info/global_step": 190, "train_info/time_within_train_step": 13.845007181167603, "step": 190}
{"train_info/time_between_train_steps": 0.005659580230712891, "step": 190}
{"info/global_step": 191, "train_info/time_within_train_step": 13.853827476501465, "step": 191}
{"train_info/time_between_train_steps": 0.004806995391845703, "step": 191}
{"info/global_step": 192, "train_info/time_within_train_step": 13.908633947372437, "step": 192}
{"train_info/time_between_train_steps": 0.005376338958740234, "step": 192}
{"info/global_step": 193, "train_info/time_within_train_step": 13.851009607315063, "step": 193}
{"train_info/time_between_train_steps": 0.005663156509399414, "step": 193}
{"info/global_step": 194, "train_info/time_within_train_step": 13.867965698242188, "step": 194}
{"train_info/time_between_train_steps": 0.0056154727935791016, "step": 194}
{"info/global_step": 195, "train_info/time_within_train_step": 13.857120752334595, "step": 195}
{"train_info/time_between_train_steps": 0.004864931106567383, "step": 195}
{"info/global_step": 196, "train_info/time_within_train_step": 13.851499319076538, "step": 196}
{"train_info/time_between_train_steps": 0.005980014801025391, "step": 196}
{"info/global_step": 197, "train_info/time_within_train_step": 13.915952205657959, "step": 197}
{"train_info/time_between_train_steps": 0.005449533462524414, "step": 197}
{"info/global_step": 198, "train_info/time_within_train_step": 13.873817205429077, "step": 198}
{"train_info/time_between_train_steps": 0.00615239143371582, "step": 198}
{"info/global_step": 199, "train_info/time_within_train_step": 13.895475625991821, "step": 199}
{"train_info/time_between_train_steps": 0.005223274230957031, "step": 199}
{"info/global_step": 200, "train_info/time_within_train_step": 13.894224643707275, "step": 200}
{"train_info": {"train_info/memory_allocated": 1920.9462890625, "train_info/memory_max_allocated": 20711.3779296875, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1737100077, "_runtime": 2976}, "step": 200}
{"logs": {"train/loss": 7.1503, "train/learning_rate": 0.0005555555555555556, "train/epoch": 7.02, "_timestamp": 1737100077, "_runtime": 2976}, "step": 200}
{"train_info/time_between_train_steps": 123.3403730392456, "step": 200}
{"train_info/time_between_train_steps": 131.15398454666138, "step": 200}
{"info/global_step": 201, "train_info/time_within_train_step": 13.844910860061646, "step": 201}
{"train_info/time_between_train_steps": 0.0051996707916259766, "step": 201}
{"info/global_step": 202, "train_info/time_within_train_step": 13.928102970123291, "step": 202}
{"train_info/time_between_train_steps": 0.005951642990112305, "step": 202}
{"info/global_step": 203, "train_info/time_within_train_step": 13.823896884918213, "step": 203}
{"train_info/time_between_train_steps": 0.005899667739868164, "step": 203}
{"info/global_step": 204, "train_info/time_within_train_step": 13.9230797290802, "step": 204}
{"train_info/time_between_train_steps": 0.005818605422973633, "step": 204}
{"info/global_step": 205, "train_info/time_within_train_step": 13.856201410293579, "step": 205}
{"train_info/time_between_train_steps": 0.00570988655090332, "step": 205}
{"info/global_step": 206, "train_info/time_within_train_step": 13.858061075210571, "step": 206}
{"train_info/time_between_train_steps": 0.0052220821380615234, "step": 206}
{"info/global_step": 207, "train_info/time_within_train_step": 13.827415227890015, "step": 207}
{"train_info/time_between_train_steps": 0.005220174789428711, "step": 207}
{"info/global_step": 208, "train_info/time_within_train_step": 13.838062524795532, "step": 208}
{"train_info/time_between_train_steps": 0.0054168701171875, "step": 208}
{"info/global_step": 209, "train_info/time_within_train_step": 13.840125322341919, "step": 209}
{"train_info/time_between_train_steps": 0.005962848663330078, "step": 209}
{"info/global_step": 210, "train_info/time_within_train_step": 13.839817762374878, "step": 210}
{"train_info/time_between_train_steps": 0.005898475646972656, "step": 210}
{"info/global_step": 211, "train_info/time_within_train_step": 13.840616464614868, "step": 211}
{"train_info/time_between_train_steps": 0.005324602127075195, "step": 211}
{"info/global_step": 212, "train_info/time_within_train_step": 13.840801000595093, "step": 212}
{"train_info/time_between_train_steps": 0.0058956146240234375, "step": 212}
{"info/global_step": 213, "train_info/time_within_train_step": 13.84581971168518, "step": 213}
{"train_info/time_between_train_steps": 0.005695343017578125, "step": 213}
{"info/global_step": 214, "train_info/time_within_train_step": 13.870865106582642, "step": 214}
{"train_info/time_between_train_steps": 0.004947662353515625, "step": 214}
{"info/global_step": 215, "train_info/time_within_train_step": 13.857375383377075, "step": 215}
{"train_info/time_between_train_steps": 0.005426645278930664, "step": 215}
{"info/global_step": 216, "train_info/time_within_train_step": 13.923038721084595, "step": 216}
{"train_info/time_between_train_steps": 0.005160808563232422, "step": 216}
{"info/global_step": 217, "train_info/time_within_train_step": 13.853574275970459, "step": 217}
{"train_info/time_between_train_steps": 0.005397319793701172, "step": 217}
{"info/global_step": 218, "train_info/time_within_train_step": 13.866563558578491, "step": 218}
{"train_info/time_between_train_steps": 0.004797697067260742, "step": 218}
{"info/global_step": 219, "train_info/time_within_train_step": 13.86110258102417, "step": 219}
{"train_info/time_between_train_steps": 0.005174160003662109, "step": 219}
{"info/global_step": 220, "train_info/time_within_train_step": 13.84832501411438, "step": 220}
{"train_info/time_between_train_steps": 0.005754232406616211, "step": 220}
{"info/global_step": 221, "train_info/time_within_train_step": 13.855749368667603, "step": 221}
{"train_info/time_between_train_steps": 0.005529165267944336, "step": 221}
{"info/global_step": 222, "train_info/time_within_train_step": 13.855052471160889, "step": 222}
{"train_info/time_between_train_steps": 0.005679607391357422, "step": 222}
{"info/global_step": 223, "train_info/time_within_train_step": 13.861755132675171, "step": 223}
{"train_info/time_between_train_steps": 0.005373954772949219, "step": 223}
{"info/global_step": 224, "train_info/time_within_train_step": 13.877269268035889, "step": 224}
{"train_info/time_between_train_steps": 0.005413055419921875, "step": 224}
{"info/global_step": 225, "train_info/time_within_train_step": 13.899997472763062, "step": 225}
{"train_info/time_between_train_steps": 0.006675243377685547, "step": 225}
{"train_info/time_between_train_steps": 7.546824932098389, "step": 225}
{"info/global_step": 226, "train_info/time_within_train_step": 13.853760004043579, "step": 226}
{"train_info/time_between_train_steps": 0.005321025848388672, "step": 226}
{"info/global_step": 227, "train_info/time_within_train_step": 13.92681622505188, "step": 227}
{"train_info/time_between_train_steps": 0.0057675838470458984, "step": 227}
{"info/global_step": 228, "train_info/time_within_train_step": 13.84403920173645, "step": 228}
{"train_info/time_between_train_steps": 0.005923271179199219, "step": 228}
{"info/global_step": 229, "train_info/time_within_train_step": 13.983515977859497, "step": 229}
{"train_info/time_between_train_steps": 0.0053806304931640625, "step": 229}
{"info/global_step": 230, "train_info/time_within_train_step": 13.86969256401062, "step": 230}
{"train_info/time_between_train_steps": 0.005244255065917969, "step": 230}
{"info/global_step": 231, "train_info/time_within_train_step": 14.02599835395813, "step": 231}
{"train_info/time_between_train_steps": 0.005663633346557617, "step": 231}
{"info/global_step": 232, "train_info/time_within_train_step": 13.837062358856201, "step": 232}
{"train_info/time_between_train_steps": 0.005517482757568359, "step": 232}
{"info/global_step": 233, "train_info/time_within_train_step": 16.26858615875244, "step": 233}
{"train_info/time_between_train_steps": 0.005538225173950195, "step": 233}
{"info/global_step": 234, "train_info/time_within_train_step": 13.826904296875, "step": 234}
{"train_info/time_between_train_steps": 0.0054552555084228516, "step": 234}
{"info/global_step": 235, "train_info/time_within_train_step": 13.868290662765503, "step": 235}
{"train_info/time_between_train_steps": 0.0059244632720947266, "step": 235}
{"info/global_step": 236, "train_info/time_within_train_step": 13.839818954467773, "step": 236}
{"train_info/time_between_train_steps": 0.005728006362915039, "step": 236}
{"info/global_step": 237, "train_info/time_within_train_step": 13.841100215911865, "step": 237}
{"train_info/time_between_train_steps": 0.0057256221771240234, "step": 237}
{"info/global_step": 238, "train_info/time_within_train_step": 13.835238695144653, "step": 238}
{"train_info/time_between_train_steps": 0.0053920745849609375, "step": 238}
{"info/global_step": 239, "train_info/time_within_train_step": 13.862003326416016, "step": 239}
{"train_info/time_between_train_steps": 0.005678653717041016, "step": 239}
{"info/global_step": 240, "train_info/time_within_train_step": 13.847690105438232, "step": 240}
{"train_info/time_between_train_steps": 0.005242109298706055, "step": 240}
{"info/global_step": 241, "train_info/time_within_train_step": 13.832106590270996, "step": 241}
{"train_info/time_between_train_steps": 0.005941152572631836, "step": 241}
{"info/global_step": 242, "train_info/time_within_train_step": 13.841158151626587, "step": 242}
{"train_info/time_between_train_steps": 0.004747629165649414, "step": 242}
{"info/global_step": 243, "train_info/time_within_train_step": 13.836922645568848, "step": 243}
{"train_info/time_between_train_steps": 0.005671262741088867, "step": 243}
{"info/global_step": 244, "train_info/time_within_train_step": 13.856124639511108, "step": 244}
{"train_info/time_between_train_steps": 0.0060083866119384766, "step": 244}
{"info/global_step": 245, "train_info/time_within_train_step": 13.836740016937256, "step": 245}
{"train_info/time_between_train_steps": 0.006052732467651367, "step": 245}
{"info/global_step": 246, "train_info/time_within_train_step": 13.84801959991455, "step": 246}
{"train_info/time_between_train_steps": 0.005335569381713867, "step": 246}
{"info/global_step": 247, "train_info/time_within_train_step": 13.930846214294434, "step": 247}
{"train_info/time_between_train_steps": 0.005994081497192383, "step": 247}
{"info/global_step": 248, "train_info/time_within_train_step": 13.893747329711914, "step": 248}
{"train_info/time_between_train_steps": 0.004980325698852539, "step": 248}
{"info/global_step": 249, "train_info/time_within_train_step": 13.861598253250122, "step": 249}
{"train_info/time_between_train_steps": 0.00613856315612793, "step": 249}
{"info/global_step": 250, "train_info/time_within_train_step": 13.89588713645935, "step": 250}
{"train_info": {"train_info/memory_allocated": 1920.9462890625, "train_info/memory_max_allocated": 20711.3779296875, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1737100913, "_runtime": 3812}, "step": 250}
{"logs": {"train/loss": 6.9697, "train/learning_rate": 0.0005277777777777777, "train/epoch": 9.02, "_timestamp": 1737100913, "_runtime": 3812}, "step": 250}
{"train_info/time_between_train_steps": 0.04178905487060547, "step": 250}
{"train_info/time_between_train_steps": 7.632592678070068, "step": 250}
{"info/global_step": 251, "train_info/time_within_train_step": 13.851006984710693, "step": 251}
{"train_info/time_between_train_steps": 0.004910945892333984, "step": 251}
{"info/global_step": 252, "train_info/time_within_train_step": 13.919140815734863, "step": 252}
{"train_info/time_between_train_steps": 0.005580425262451172, "step": 252}
{"info/global_step": 253, "train_info/time_within_train_step": 13.8501455783844, "step": 253}
{"train_info/time_between_train_steps": 0.00495147705078125, "step": 253}
{"info/global_step": 254, "train_info/time_within_train_step": 13.933330774307251, "step": 254}
{"train_info/time_between_train_steps": 0.0050656795501708984, "step": 254}
{"info/global_step": 255, "train_info/time_within_train_step": 13.861980199813843, "step": 255}
{"train_info/time_between_train_steps": 0.00572514533996582, "step": 255}
{"info/global_step": 256, "train_info/time_within_train_step": 13.917855501174927, "step": 256}
{"train_info/time_between_train_steps": 0.0050106048583984375, "step": 256}
{"info/global_step": 257, "train_info/time_within_train_step": 13.841702222824097, "step": 257}
{"train_info/time_between_train_steps": 0.0057125091552734375, "step": 257}
{"info/global_step": 258, "train_info/time_within_train_step": 13.842782497406006, "step": 258}
{"train_info/time_between_train_steps": 0.0047152042388916016, "step": 258}
{"info/global_step": 259, "train_info/time_within_train_step": 13.843727111816406, "step": 259}
{"train_info/time_between_train_steps": 0.005443096160888672, "step": 259}
{"info/global_step": 260, "train_info/time_within_train_step": 13.886867046356201, "step": 260}
{"train_info/time_between_train_steps": 0.005061149597167969, "step": 260}
{"info/global_step": 261, "train_info/time_within_train_step": 13.850101232528687, "step": 261}
{"train_info/time_between_train_steps": 0.005582332611083984, "step": 261}
{"info/global_step": 262, "train_info/time_within_train_step": 13.931325197219849, "step": 262}
{"train_info/time_between_train_steps": 0.005506992340087891, "step": 262}
{"info/global_step": 263, "train_info/time_within_train_step": 13.853442668914795, "step": 263}
{"train_info/time_between_train_steps": 0.004976034164428711, "step": 263}
{"info/global_step": 264, "train_info/time_within_train_step": 13.853179216384888, "step": 264}
{"train_info/time_between_train_steps": 0.004825592041015625, "step": 264}
{"info/global_step": 265, "train_info/time_within_train_step": 13.857842922210693, "step": 265}
{"train_info/time_between_train_steps": 0.005198001861572266, "step": 265}
{"info/global_step": 266, "train_info/time_within_train_step": 13.844700574874878, "step": 266}
{"train_info/time_between_train_steps": 0.005087375640869141, "step": 266}
{"info/global_step": 267, "train_info/time_within_train_step": 13.85396146774292, "step": 267}
{"train_info/time_between_train_steps": 0.004843473434448242, "step": 267}
{"info/global_step": 268, "train_info/time_within_train_step": 13.84492540359497, "step": 268}
{"train_info/time_between_train_steps": 0.0057108402252197266, "step": 268}
{"info/global_step": 269, "train_info/time_within_train_step": 13.869247198104858, "step": 269}
{"train_info/time_between_train_steps": 0.005995273590087891, "step": 269}
{"info/global_step": 270, "train_info/time_within_train_step": 13.853532314300537, "step": 270}
{"train_info/time_between_train_steps": 0.005444526672363281, "step": 270}
{"info/global_step": 271, "train_info/time_within_train_step": 13.863229274749756, "step": 271}
{"train_info/time_between_train_steps": 0.0052678585052490234, "step": 271}
{"info/global_step": 272, "train_info/time_within_train_step": 13.857730388641357, "step": 272}
{"train_info/time_between_train_steps": 0.005618572235107422, "step": 272}
{"info/global_step": 273, "train_info/time_within_train_step": 13.874265670776367, "step": 273}
{"train_info/time_between_train_steps": 0.006003618240356445, "step": 273}
{"info/global_step": 274, "train_info/time_within_train_step": 13.880226135253906, "step": 274}
{"train_info/time_between_train_steps": 0.005838155746459961, "step": 274}
{"info/global_step": 275, "train_info/time_within_train_step": 13.906951904296875, "step": 275}
{"train_info/time_between_train_steps": 0.006352901458740234, "step": 275}
{"train_info/time_between_train_steps": 7.708509206771851, "step": 275}
{"info/global_step": 276, "train_info/time_within_train_step": 13.843410015106201, "step": 276}
{"train_info/time_between_train_steps": 0.005064725875854492, "step": 276}
{"info/global_step": 277, "train_info/time_within_train_step": 13.930879354476929, "step": 277}
{"train_info/time_between_train_steps": 0.005396366119384766, "step": 277}
{"info/global_step": 278, "train_info/time_within_train_step": 13.922987699508667, "step": 278}
{"train_info/time_between_train_steps": 0.005503654479980469, "step": 278}
{"info/global_step": 279, "train_info/time_within_train_step": 13.93901777267456, "step": 279}
{"train_info/time_between_train_steps": 0.005214691162109375, "step": 279}
{"info/global_step": 280, "train_info/time_within_train_step": 13.838765621185303, "step": 280}
{"train_info/time_between_train_steps": 0.0045206546783447266, "step": 280}
{"info/global_step": 281, "train_info/time_within_train_step": 13.98762822151184, "step": 281}
{"train_info/time_between_train_steps": 0.00542902946472168, "step": 281}
{"info/global_step": 282, "train_info/time_within_train_step": 13.864253520965576, "step": 282}
{"train_info/time_between_train_steps": 0.005820274353027344, "step": 282}
{"info/global_step": 283, "train_info/time_within_train_step": 13.840346336364746, "step": 283}
{"train_info/time_between_train_steps": 0.005669593811035156, "step": 283}
{"info/global_step": 284, "train_info/time_within_train_step": 13.85489559173584, "step": 284}
{"train_info/time_between_train_steps": 0.005505800247192383, "step": 284}
{"info/global_step": 285, "train_info/time_within_train_step": 13.952876567840576, "step": 285}
{"train_info/time_between_train_steps": 0.005422115325927734, "step": 285}
{"info/global_step": 286, "train_info/time_within_train_step": 13.8501136302948, "step": 286}
{"train_info/time_between_train_steps": 0.0054857730865478516, "step": 286}
{"info/global_step": 287, "train_info/time_within_train_step": 13.85221815109253, "step": 287}
{"train_info/time_between_train_steps": 0.0057888031005859375, "step": 287}
{"info/global_step": 288, "train_info/time_within_train_step": 13.846032619476318, "step": 288}
{"train_info/time_between_train_steps": 0.005938053131103516, "step": 288}
{"info/global_step": 289, "train_info/time_within_train_step": 13.847818851470947, "step": 289}
{"train_info/time_between_train_steps": 0.005548715591430664, "step": 289}
{"info/global_step": 290, "train_info/time_within_train_step": 13.896734237670898, "step": 290}
{"train_info/time_between_train_steps": 0.0049588680267333984, "step": 290}
{"info/global_step": 291, "train_info/time_within_train_step": 13.859398126602173, "step": 291}
{"train_info/time_between_train_steps": 0.005139589309692383, "step": 291}
{"info/global_step": 292, "train_info/time_within_train_step": 13.860307216644287, "step": 292}
{"train_info/time_between_train_steps": 0.005774497985839844, "step": 292}
{"info/global_step": 293, "train_info/time_within_train_step": 13.926509141921997, "step": 293}
{"train_info/time_between_train_steps": 0.0057010650634765625, "step": 293}
{"info/global_step": 294, "train_info/time_within_train_step": 13.91270112991333, "step": 294}
{"train_info/time_between_train_steps": 0.005456447601318359, "step": 294}
{"info/global_step": 295, "train_info/time_within_train_step": 13.857170104980469, "step": 295}
{"train_info/time_between_train_steps": 0.00513911247253418, "step": 295}
{"info/global_step": 296, "train_info/time_within_train_step": 13.888000726699829, "step": 296}
{"train_info/time_between_train_steps": 0.004892110824584961, "step": 296}
{"info/global_step": 297, "train_info/time_within_train_step": 13.8607816696167, "step": 297}
{"train_info/time_between_train_steps": 0.005800724029541016, "step": 297}
{"info/global_step": 298, "train_info/time_within_train_step": 13.859748601913452, "step": 298}
{"train_info/time_between_train_steps": 0.005737781524658203, "step": 298}
{"info/global_step": 299, "train_info/time_within_train_step": 13.877382516860962, "step": 299}
{"train_info/time_between_train_steps": 0.006515979766845703, "step": 299}
{"info/global_step": 300, "train_info/time_within_train_step": 13.965081691741943, "step": 300}
{"train_info": {"train_info/memory_allocated": 1920.9462890625, "train_info/memory_max_allocated": 20711.3779296875, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1737101624, "_runtime": 4523}, "step": 300}
{"logs": {"train/loss": 6.6856, "train/learning_rate": 0.0005, "train/epoch": 11.02, "_timestamp": 1737101624, "_runtime": 4523}, "step": 300}
{"train_info/time_between_train_steps": 84.84920120239258, "step": 300}
{"train_info/time_between_train_steps": 92.43188691139221, "step": 300}
{"info/global_step": 301, "train_info/time_within_train_step": 13.837779521942139, "step": 301}
{"train_info/time_between_train_steps": 0.006226778030395508, "step": 301}
{"info/global_step": 302, "train_info/time_within_train_step": 14.028193712234497, "step": 302}
{"train_info/time_between_train_steps": 0.0062084197998046875, "step": 302}
{"info/global_step": 303, "train_info/time_within_train_step": 13.897878646850586, "step": 303}
{"train_info/time_between_train_steps": 0.006287813186645508, "step": 303}
{"info/global_step": 304, "train_info/time_within_train_step": 14.05164384841919, "step": 304}
{"train_info/time_between_train_steps": 0.005852937698364258, "step": 304}
{"info/global_step": 305, "train_info/time_within_train_step": 13.892940759658813, "step": 305}
{"train_info/time_between_train_steps": 0.005880117416381836, "step": 305}
{"info/global_step": 306, "train_info/time_within_train_step": 13.929262161254883, "step": 306}
{"train_info/time_between_train_steps": 0.006098270416259766, "step": 306}
{"info/global_step": 307, "train_info/time_within_train_step": 13.873077630996704, "step": 307}
{"train_info/time_between_train_steps": 0.005205392837524414, "step": 307}
{"info/global_step": 308, "train_info/time_within_train_step": 13.97831916809082, "step": 308}
{"train_info/time_between_train_steps": 0.0051746368408203125, "step": 308}
{"info/global_step": 309, "train_info/time_within_train_step": 13.88906192779541, "step": 309}
{"train_info/time_between_train_steps": 0.004983425140380859, "step": 309}
{"info/global_step": 310, "train_info/time_within_train_step": 13.892932415008545, "step": 310}
{"train_info/time_between_train_steps": 0.00482630729675293, "step": 310}
{"info/global_step": 311, "train_info/time_within_train_step": 13.882330656051636, "step": 311}
{"train_info/time_between_train_steps": 0.005608081817626953, "step": 311}
{"info/global_step": 312, "train_info/time_within_train_step": 13.888511180877686, "step": 312}
{"train_info/time_between_train_steps": 0.005127906799316406, "step": 312}
{"info/global_step": 313, "train_info/time_within_train_step": 13.914083003997803, "step": 313}
{"train_info/time_between_train_steps": 0.005832195281982422, "step": 313}
{"info/global_step": 314, "train_info/time_within_train_step": 13.901989221572876, "step": 314}
{"train_info/time_between_train_steps": 0.004836320877075195, "step": 314}
{"info/global_step": 315, "train_info/time_within_train_step": 13.87896728515625, "step": 315}
{"train_info/time_between_train_steps": 0.005070209503173828, "step": 315}
{"info/global_step": 316, "train_info/time_within_train_step": 13.902350425720215, "step": 316}
{"train_info/time_between_train_steps": 0.00581049919128418, "step": 316}
{"info/global_step": 317, "train_info/time_within_train_step": 13.889736413955688, "step": 317}
{"train_info/time_between_train_steps": 0.00523829460144043, "step": 317}
{"info/global_step": 318, "train_info/time_within_train_step": 13.901793003082275, "step": 318}
{"train_info/time_between_train_steps": 0.005326271057128906, "step": 318}
{"info/global_step": 319, "train_info/time_within_train_step": 13.885191202163696, "step": 319}
{"train_info/time_between_train_steps": 0.005837440490722656, "step": 319}
{"info/global_step": 320, "train_info/time_within_train_step": 13.896314144134521, "step": 320}
{"train_info/time_between_train_steps": 0.005356311798095703, "step": 320}
{"info/global_step": 321, "train_info/time_within_train_step": 13.891067743301392, "step": 321}
{"train_info/time_between_train_steps": 0.005756855010986328, "step": 321}
{"info/global_step": 322, "train_info/time_within_train_step": 13.905555486679077, "step": 322}
{"train_info/time_between_train_steps": 0.005703449249267578, "step": 322}
{"info/global_step": 323, "train_info/time_within_train_step": 13.910127401351929, "step": 323}
{"train_info/time_between_train_steps": 0.005505561828613281, "step": 323}
{"info/global_step": 324, "train_info/time_within_train_step": 13.99704623222351, "step": 324}
{"train_info/time_between_train_steps": 0.006764888763427734, "step": 324}
{"info/global_step": 325, "train_info/time_within_train_step": 13.929206848144531, "step": 325}
{"train_info/time_between_train_steps": 0.0065996646881103516, "step": 325}
{"train_info/time_between_train_steps": 7.630707025527954, "step": 325}
{"info/global_step": 326, "train_info/time_within_train_step": 13.870162010192871, "step": 326}
{"train_info/time_between_train_steps": 0.0051457881927490234, "step": 326}
{"info/global_step": 327, "train_info/time_within_train_step": 13.95318078994751, "step": 327}
{"train_info/time_between_train_steps": 0.004573345184326172, "step": 327}
{"info/global_step": 328, "train_info/time_within_train_step": 13.87515377998352, "step": 328}
{"train_info/time_between_train_steps": 0.005997180938720703, "step": 328}
{"info/global_step": 329, "train_info/time_within_train_step": 14.022568702697754, "step": 329}
{"train_info/time_between_train_steps": 0.005704641342163086, "step": 329}
{"info/global_step": 330, "train_info/time_within_train_step": 13.965798377990723, "step": 330}
{"train_info/time_between_train_steps": 0.006046772003173828, "step": 330}
{"info/global_step": 331, "train_info/time_within_train_step": 13.906731367111206, "step": 331}
{"train_info/time_between_train_steps": 0.005353689193725586, "step": 331}
{"info/global_step": 332, "train_info/time_within_train_step": 13.870989561080933, "step": 332}
{"train_info/time_between_train_steps": 0.004870176315307617, "step": 332}
{"info/global_step": 333, "train_info/time_within_train_step": 13.88606071472168, "step": 333}
{"train_info/time_between_train_steps": 0.005176067352294922, "step": 333}
{"info/global_step": 334, "train_info/time_within_train_step": 13.897565126419067, "step": 334}
{"train_info/time_between_train_steps": 0.005611896514892578, "step": 334}
{"info/global_step": 335, "train_info/time_within_train_step": 13.880041360855103, "step": 335}
{"train_info/time_between_train_steps": 0.005594730377197266, "step": 335}
{"info/global_step": 336, "train_info/time_within_train_step": 13.884727954864502, "step": 336}
{"train_info/time_between_train_steps": 0.0059773921966552734, "step": 336}
{"info/global_step": 337, "train_info/time_within_train_step": 13.894686222076416, "step": 337}
{"train_info/time_between_train_steps": 0.005455970764160156, "step": 337}
{"info/global_step": 338, "train_info/time_within_train_step": 13.886110305786133, "step": 338}
{"train_info/time_between_train_steps": 0.004880428314208984, "step": 338}
{"info/global_step": 339, "train_info/time_within_train_step": 13.977893114089966, "step": 339}
{"train_info/time_between_train_steps": 0.005191326141357422, "step": 339}
{"info/global_step": 340, "train_info/time_within_train_step": 13.882318258285522, "step": 340}
{"train_info/time_between_train_steps": 0.005326747894287109, "step": 340}
{"info/global_step": 341, "train_info/time_within_train_step": 13.884009599685669, "step": 341}
{"train_info/time_between_train_steps": 0.005104541778564453, "step": 341}
{"info/global_step": 342, "train_info/time_within_train_step": 13.8913094997406, "step": 342}
{"train_info/time_between_train_steps": 0.004808187484741211, "step": 342}
{"info/global_step": 343, "train_info/time_within_train_step": 13.980445861816406, "step": 343}
{"train_info/time_between_train_steps": 0.005230903625488281, "step": 343}
{"info/global_step": 344, "train_info/time_within_train_step": 13.886952638626099, "step": 344}
{"train_info/time_between_train_steps": 0.004950761795043945, "step": 344}
{"info/global_step": 345, "train_info/time_within_train_step": 13.894341468811035, "step": 345}
{"train_info/time_between_train_steps": 0.0048770904541015625, "step": 345}
{"info/global_step": 346, "train_info/time_within_train_step": 13.891647577285767, "step": 346}
{"train_info/time_between_train_steps": 0.0061359405517578125, "step": 346}
{"info/global_step": 347, "train_info/time_within_train_step": 13.898278713226318, "step": 347}
{"train_info/time_between_train_steps": 0.005576610565185547, "step": 347}
{"info/global_step": 348, "train_info/time_within_train_step": 13.901435375213623, "step": 348}
{"train_info/time_between_train_steps": 0.005296468734741211, "step": 348}
{"info/global_step": 349, "train_info/time_within_train_step": 13.901663780212402, "step": 349}
{"train_info/time_between_train_steps": 0.005533695220947266, "step": 349}
{"info/global_step": 350, "train_info/time_within_train_step": 13.915796041488647, "step": 350}
{"train_info": {"train_info/memory_allocated": 1920.9462890625, "train_info/memory_max_allocated": 20711.3779296875, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1737102422, "_runtime": 5321}, "step": 350}
{"logs": {"train/loss": 6.3809, "train/learning_rate": 0.00047222222222222224, "train/epoch": 13.02, "_timestamp": 1737102422, "_runtime": 5321}, "step": 350}
{"train_info/time_between_train_steps": 0.04905343055725098, "step": 350}
{"train_info/time_between_train_steps": 7.749100923538208, "step": 350}
{"info/global_step": 351, "train_info/time_within_train_step": 13.901404619216919, "step": 351}
{"train_info/time_between_train_steps": 0.00574803352355957, "step": 351}
{"info/global_step": 352, "train_info/time_within_train_step": 14.00970458984375, "step": 352}
{"train_info/time_between_train_steps": 0.00481414794921875, "step": 352}
{"info/global_step": 353, "train_info/time_within_train_step": 13.88382863998413, "step": 353}
{"train_info/time_between_train_steps": 0.005830287933349609, "step": 353}
{"info/global_step": 354, "train_info/time_within_train_step": 14.000942707061768, "step": 354}
{"train_info/time_between_train_steps": 0.005769014358520508, "step": 354}
{"info/global_step": 355, "train_info/time_within_train_step": 14.061188220977783, "step": 355}
{"train_info/time_between_train_steps": 0.005600929260253906, "step": 355}
{"info/global_step": 356, "train_info/time_within_train_step": 13.899223566055298, "step": 356}
{"train_info/time_between_train_steps": 0.004760026931762695, "step": 356}
{"info/global_step": 357, "train_info/time_within_train_step": 13.872217655181885, "step": 357}
{"train_info/time_between_train_steps": 0.004697322845458984, "step": 357}
{"info/global_step": 358, "train_info/time_within_train_step": 13.890825748443604, "step": 358}
{"train_info/time_between_train_steps": 0.005933046340942383, "step": 358}
{"info/global_step": 359, "train_info/time_within_train_step": 13.98103380203247, "step": 359}
{"train_info/time_between_train_steps": 0.005153656005859375, "step": 359}
{"info/global_step": 360, "train_info/time_within_train_step": 13.899991750717163, "step": 360}
{"train_info/time_between_train_steps": 0.00494384765625, "step": 360}
{"info/global_step": 361, "train_info/time_within_train_step": 13.897956371307373, "step": 361}
{"train_info/time_between_train_steps": 0.005281925201416016, "step": 361}
{"info/global_step": 362, "train_info/time_within_train_step": 13.896658420562744, "step": 362}
{"train_info/time_between_train_steps": 0.004731893539428711, "step": 362}
{"info/global_step": 363, "train_info/time_within_train_step": 13.902443647384644, "step": 363}
{"train_info/time_between_train_steps": 0.004716634750366211, "step": 363}
{"info/global_step": 364, "train_info/time_within_train_step": 13.984894752502441, "step": 364}
{"train_info/time_between_train_steps": 0.005791664123535156, "step": 364}
{"info/global_step": 365, "train_info/time_within_train_step": 13.916340827941895, "step": 365}
{"train_info/time_between_train_steps": 0.004717350006103516, "step": 365}
{"info/global_step": 366, "train_info/time_within_train_step": 13.902068138122559, "step": 366}
{"train_info/time_between_train_steps": 0.004759073257446289, "step": 366}
{"info/global_step": 367, "train_info/time_within_train_step": 13.908647060394287, "step": 367}
{"train_info/time_between_train_steps": 0.005468845367431641, "step": 367}
{"info/global_step": 368, "train_info/time_within_train_step": 14.001652717590332, "step": 368}
{"train_info/time_between_train_steps": 0.0050809383392333984, "step": 368}
{"info/global_step": 369, "train_info/time_within_train_step": 13.901955604553223, "step": 369}
{"train_info/time_between_train_steps": 0.0050165653228759766, "step": 369}
{"info/global_step": 370, "train_info/time_within_train_step": 13.986228466033936, "step": 370}
{"train_info/time_between_train_steps": 0.005223512649536133, "step": 370}
{"info/global_step": 371, "train_info/time_within_train_step": 13.906971216201782, "step": 371}
{"train_info/time_between_train_steps": 0.005251407623291016, "step": 371}
{"info/global_step": 372, "train_info/time_within_train_step": 13.974918365478516, "step": 372}
{"train_info/time_between_train_steps": 0.005736351013183594, "step": 372}
{"info/global_step": 373, "train_info/time_within_train_step": 13.913446426391602, "step": 373}
{"train_info/time_between_train_steps": 0.005297422409057617, "step": 373}
{"info/global_step": 374, "train_info/time_within_train_step": 13.925419092178345, "step": 374}
{"train_info/time_between_train_steps": 0.005251884460449219, "step": 374}
{"info/global_step": 375, "train_info/time_within_train_step": 13.948100805282593, "step": 375}
{"train_info/time_between_train_steps": 0.006786346435546875, "step": 375}
{"train_info/time_between_train_steps": 7.541026592254639, "step": 375}
{"info/global_step": 376, "train_info/time_within_train_step": 13.886360883712769, "step": 376}
{"train_info/time_between_train_steps": 0.0049746036529541016, "step": 376}
{"info/global_step": 377, "train_info/time_within_train_step": 13.994891881942749, "step": 377}
{"train_info/time_between_train_steps": 0.004783153533935547, "step": 377}
{"info/global_step": 378, "train_info/time_within_train_step": 13.89060664176941, "step": 378}
{"train_info/time_between_train_steps": 0.005031585693359375, "step": 378}
{"info/global_step": 379, "train_info/time_within_train_step": 13.999671697616577, "step": 379}
{"train_info/time_between_train_steps": 0.004882335662841797, "step": 379}
{"info/global_step": 380, "train_info/time_within_train_step": 14.044009447097778, "step": 380}
{"train_info/time_between_train_steps": 0.005803585052490234, "step": 380}
{"info/global_step": 381, "train_info/time_within_train_step": 13.922486782073975, "step": 381}
{"train_info/time_between_train_steps": 0.0051195621490478516, "step": 381}
{"info/global_step": 382, "train_info/time_within_train_step": 13.890524625778198, "step": 382}
{"train_info/time_between_train_steps": 0.005320072174072266, "step": 382}
{"info/global_step": 383, "train_info/time_within_train_step": 13.899926662445068, "step": 383}
{"train_info/time_between_train_steps": 0.004607677459716797, "step": 383}
{"info/global_step": 384, "train_info/time_within_train_step": 13.892159938812256, "step": 384}
{"train_info/time_between_train_steps": 0.00492405891418457, "step": 384}
{"info/global_step": 385, "train_info/time_within_train_step": 14.073086977005005, "step": 385}
{"train_info/time_between_train_steps": 0.0060193538665771484, "step": 385}
{"info/global_step": 386, "train_info/time_within_train_step": 13.895947217941284, "step": 386}
{"train_info/time_between_train_steps": 0.005182504653930664, "step": 386}
{"info/global_step": 387, "train_info/time_within_train_step": 13.902692556381226, "step": 387}
{"train_info/time_between_train_steps": 0.004857063293457031, "step": 387}
{"info/global_step": 388, "train_info/time_within_train_step": 13.906095266342163, "step": 388}
{"train_info/time_between_train_steps": 0.005218982696533203, "step": 388}
{"info/global_step": 389, "train_info/time_within_train_step": 14.005001544952393, "step": 389}
{"train_info/time_between_train_steps": 0.0052373409271240234, "step": 389}
{"info/global_step": 390, "train_info/time_within_train_step": 14.25413990020752, "step": 390}
{"train_info/time_between_train_steps": 0.0056149959564208984, "step": 390}
{"info/global_step": 391, "train_info/time_within_train_step": 13.907521724700928, "step": 391}
{"train_info/time_between_train_steps": 0.00551915168762207, "step": 391}
{"info/global_step": 392, "train_info/time_within_train_step": 13.887401819229126, "step": 392}
{"train_info/time_between_train_steps": 0.005337715148925781, "step": 392}
{"info/global_step": 393, "train_info/time_within_train_step": 13.884505271911621, "step": 393}
{"train_info/time_between_train_steps": 0.005217790603637695, "step": 393}
{"info/global_step": 394, "train_info/time_within_train_step": 13.896223068237305, "step": 394}
{"train_info/time_between_train_steps": 0.0048007965087890625, "step": 394}
{"info/global_step": 395, "train_info/time_within_train_step": 13.88582181930542, "step": 395}
{"train_info/time_between_train_steps": 0.005156517028808594, "step": 395}
{"info/global_step": 396, "train_info/time_within_train_step": 13.914715051651001, "step": 396}
{"train_info/time_between_train_steps": 0.005606174468994141, "step": 396}
{"info/global_step": 397, "train_info/time_within_train_step": 20.354971885681152, "step": 397}
{"train_info/time_between_train_steps": 0.0062406063079833984, "step": 397}
{"info/global_step": 398, "train_info/time_within_train_step": 14.423112154006958, "step": 398}
{"train_info/time_between_train_steps": 0.005972146987915039, "step": 398}
{"info/global_step": 399, "train_info/time_within_train_step": 13.97182822227478, "step": 399}
{"train_info/time_between_train_steps": 0.006382942199707031, "step": 399}
{"info/global_step": 400, "train_info/time_within_train_step": 13.947659254074097, "step": 400}
{"train_info": {"train_info/memory_allocated": 1920.9462890625, "train_info/memory_max_allocated": 20711.3779296875, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1737103146, "_runtime": 6045}, "step": 400}
{"logs": {"train/loss": 6.0381, "train/learning_rate": 0.00044444444444444436, "train/epoch": 15.02, "_timestamp": 1737103146, "_runtime": 6045}, "step": 400}
{"train_info/time_between_train_steps": 61.29465079307556, "step": 400}
{"train_info/time_between_train_steps": 68.735595703125, "step": 400}
{"info/global_step": 401, "train_info/time_within_train_step": 13.954614639282227, "step": 401}
{"train_info/time_between_train_steps": 0.005413532257080078, "step": 401}
{"info/global_step": 402, "train_info/time_within_train_step": 13.930355310440063, "step": 402}
{"train_info/time_between_train_steps": 0.004791736602783203, "step": 402}
{"info/global_step": 403, "train_info/time_within_train_step": 13.854052543640137, "step": 403}
{"train_info/time_between_train_steps": 0.005051612854003906, "step": 403}
{"info/global_step": 404, "train_info/time_within_train_step": 13.96478271484375, "step": 404}
{"train_info/time_between_train_steps": 0.00517582893371582, "step": 404}
{"info/global_step": 405, "train_info/time_within_train_step": 13.90286135673523, "step": 405}
{"train_info/time_between_train_steps": 0.005291938781738281, "step": 405}
{"info/global_step": 406, "train_info/time_within_train_step": 13.910593032836914, "step": 406}
{"train_info/time_between_train_steps": 0.0052831172943115234, "step": 406}
{"info/global_step": 407, "train_info/time_within_train_step": 13.892119407653809, "step": 407}
{"train_info/time_between_train_steps": 0.004896402359008789, "step": 407}
{"info/global_step": 408, "train_info/time_within_train_step": 13.89266324043274, "step": 408}
{"train_info/time_between_train_steps": 0.005051374435424805, "step": 408}
{"info/global_step": 409, "train_info/time_within_train_step": 13.894505023956299, "step": 409}
{"train_info/time_between_train_steps": 0.005784511566162109, "step": 409}
{"info/global_step": 410, "train_info/time_within_train_step": 13.905038833618164, "step": 410}
{"train_info/time_between_train_steps": 0.00555109977722168, "step": 410}
{"info/global_step": 411, "train_info/time_within_train_step": 13.89327883720398, "step": 411}
{"train_info/time_between_train_steps": 0.004926204681396484, "step": 411}
{"info/global_step": 412, "train_info/time_within_train_step": 13.89393162727356, "step": 412}
{"train_info/time_between_train_steps": 0.005555391311645508, "step": 412}
{"info/global_step": 413, "train_info/time_within_train_step": 13.911381006240845, "step": 413}
{"train_info/time_between_train_steps": 0.00545048713684082, "step": 413}
{"info/global_step": 414, "train_info/time_within_train_step": 13.93831467628479, "step": 414}
{"train_info/time_between_train_steps": 0.0052030086517333984, "step": 414}
{"info/global_step": 415, "train_info/time_within_train_step": 13.897059202194214, "step": 415}
{"train_info/time_between_train_steps": 0.005717754364013672, "step": 415}
{"info/global_step": 416, "train_info/time_within_train_step": 13.989732265472412, "step": 416}
{"train_info/time_between_train_steps": 0.0056726932525634766, "step": 416}
{"info/global_step": 417, "train_info/time_within_train_step": 13.899292707443237, "step": 417}
{"train_info/time_between_train_steps": 0.005243062973022461, "step": 417}
{"info/global_step": 418, "train_info/time_within_train_step": 13.958972454071045, "step": 418}
{"train_info/time_between_train_steps": 0.005257606506347656, "step": 418}
{"info/global_step": 419, "train_info/time_within_train_step": 13.90005874633789, "step": 419}
{"train_info/time_between_train_steps": 0.0060498714447021484, "step": 419}
{"info/global_step": 420, "train_info/time_within_train_step": 13.895954608917236, "step": 420}
{"train_info/time_between_train_steps": 0.005362749099731445, "step": 420}
{"info/global_step": 421, "train_info/time_within_train_step": 13.901273012161255, "step": 421}
{"train_info/time_between_train_steps": 0.005953311920166016, "step": 421}
{"info/global_step": 422, "train_info/time_within_train_step": 13.906675577163696, "step": 422}
{"train_info/time_between_train_steps": 0.005532264709472656, "step": 422}
{"info/global_step": 423, "train_info/time_within_train_step": 13.943002700805664, "step": 423}
{"train_info/time_between_train_steps": 0.005499839782714844, "step": 423}
{"info/global_step": 424, "train_info/time_within_train_step": 13.923184633255005, "step": 424}
{"train_info/time_between_train_steps": 0.0064585208892822266, "step": 424}
{"info/global_step": 425, "train_info/time_within_train_step": 13.933173656463623, "step": 425}
{"train_info/time_between_train_steps": 0.006081104278564453, "step": 425}
{"train_info/time_between_train_steps": 7.731450796127319, "step": 425}
{"info/global_step": 426, "train_info/time_within_train_step": 13.898006439208984, "step": 426}
{"train_info/time_between_train_steps": 0.005869626998901367, "step": 426}
{"info/global_step": 427, "train_info/time_within_train_step": 13.97268533706665, "step": 427}
{"train_info/time_between_train_steps": 0.005411624908447266, "step": 427}
{"info/global_step": 428, "train_info/time_within_train_step": 13.885135889053345, "step": 428}
{"train_info/time_between_train_steps": 0.005227804183959961, "step": 428}
{"info/global_step": 429, "train_info/time_within_train_step": 13.978061437606812, "step": 429}
{"train_info/time_between_train_steps": 0.0055789947509765625, "step": 429}
{"info/global_step": 430, "train_info/time_within_train_step": 13.908413171768188, "step": 430}
{"train_info/time_between_train_steps": 0.0050013065338134766, "step": 430}
{"info/global_step": 431, "train_info/time_within_train_step": 13.909652709960938, "step": 431}
{"train_info/time_between_train_steps": 0.004909515380859375, "step": 431}
{"info/global_step": 432, "train_info/time_within_train_step": 13.970158100128174, "step": 432}
{"train_info/time_between_train_steps": 0.00488591194152832, "step": 432}
{"info/global_step": 433, "train_info/time_within_train_step": 13.878721714019775, "step": 433}
{"train_info/time_between_train_steps": 0.004918575286865234, "step": 433}
{"info/global_step": 434, "train_info/time_within_train_step": 13.906367301940918, "step": 434}
{"train_info/time_between_train_steps": 0.00482487678527832, "step": 434}
{"info/global_step": 435, "train_info/time_within_train_step": 13.928795337677002, "step": 435}
{"train_info/time_between_train_steps": 0.005489826202392578, "step": 435}
{"info/global_step": 436, "train_info/time_within_train_step": 13.903228282928467, "step": 436}
{"train_info/time_between_train_steps": 0.005107879638671875, "step": 436}
{"info/global_step": 437, "train_info/time_within_train_step": 13.906013011932373, "step": 437}
{"train_info/time_between_train_steps": 0.005497455596923828, "step": 437}
{"info/global_step": 438, "train_info/time_within_train_step": 13.911247968673706, "step": 438}
{"train_info/time_between_train_steps": 0.005694150924682617, "step": 438}
{"info/global_step": 439, "train_info/time_within_train_step": 13.968631029129028, "step": 439}
{"train_info/time_between_train_steps": 0.004986286163330078, "step": 439}
{"info/global_step": 440, "train_info/time_within_train_step": 13.91779088973999, "step": 440}
{"train_info/time_between_train_steps": 0.005087614059448242, "step": 440}
{"info/global_step": 441, "train_info/time_within_train_step": 13.894705772399902, "step": 441}
{"train_info/time_between_train_steps": 0.005123615264892578, "step": 441}
{"info/global_step": 442, "train_info/time_within_train_step": 13.901801824569702, "step": 442}
{"train_info/time_between_train_steps": 0.005434513092041016, "step": 442}
{"info/global_step": 443, "train_info/time_within_train_step": 13.904805183410645, "step": 443}
{"train_info/time_between_train_steps": 0.0052874088287353516, "step": 443}
{"info/global_step": 444, "train_info/time_within_train_step": 13.906456232070923, "step": 444}
{"train_info/time_between_train_steps": 0.0057070255279541016, "step": 444}
{"info/global_step": 445, "train_info/time_within_train_step": 13.910661935806274, "step": 445}
{"train_info/time_between_train_steps": 0.0052928924560546875, "step": 445}
{"info/global_step": 446, "train_info/time_within_train_step": 13.900843620300293, "step": 446}
{"train_info/time_between_train_steps": 0.005342721939086914, "step": 446}
{"info/global_step": 447, "train_info/time_within_train_step": 14.005244255065918, "step": 447}
{"train_info/time_between_train_steps": 0.0058746337890625, "step": 447}
{"info/global_step": 448, "train_info/time_within_train_step": 13.926060676574707, "step": 448}
{"train_info/time_between_train_steps": 0.0050563812255859375, "step": 448}
{"info/global_step": 449, "train_info/time_within_train_step": 13.912230968475342, "step": 449}
{"train_info/time_between_train_steps": 0.0057375431060791016, "step": 449}
{"info/global_step": 450, "train_info/time_within_train_step": 13.930314540863037, "step": 450}
{"train_info": {"train_info/memory_allocated": 1920.9462890625, "train_info/memory_max_allocated": 20711.3779296875, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1737103920, "_runtime": 6819}, "step": 450}
{"logs": {"train/loss": 5.6691, "train/learning_rate": 0.00041666666666666664, "train/epoch": 17.02, "_timestamp": 1737103920, "_runtime": 6819}, "step": 450}
{"train_info/time_between_train_steps": 0.05888056755065918, "step": 450}
{"train_info/time_between_train_steps": 7.826249837875366, "step": 450}
{"info/global_step": 451, "train_info/time_within_train_step": 13.863206624984741, "step": 451}
{"train_info/time_between_train_steps": 0.005750894546508789, "step": 451}
{"info/global_step": 452, "train_info/time_within_train_step": 13.994729995727539, "step": 452}
{"train_info/time_between_train_steps": 0.004998922348022461, "step": 452}
{"info/global_step": 453, "train_info/time_within_train_step": 13.880155324935913, "step": 453}
{"train_info/time_between_train_steps": 0.005587100982666016, "step": 453}
{"info/global_step": 454, "train_info/time_within_train_step": 13.989559412002563, "step": 454}
{"train_info/time_between_train_steps": 0.005980491638183594, "step": 454}
{"info/global_step": 455, "train_info/time_within_train_step": 13.893774509429932, "step": 455}
{"train_info/time_between_train_steps": 0.005419492721557617, "step": 455}
{"info/global_step": 456, "train_info/time_within_train_step": 13.891121864318848, "step": 456}
{"train_info/time_between_train_steps": 0.0046579837799072266, "step": 456}
{"info/global_step": 457, "train_info/time_within_train_step": 13.869708776473999, "step": 457}
{"train_info/time_between_train_steps": 0.005117177963256836, "step": 457}
{"info/global_step": 458, "train_info/time_within_train_step": 13.872582912445068, "step": 458}
{"train_info/time_between_train_steps": 0.0053250789642333984, "step": 458}
{"info/global_step": 459, "train_info/time_within_train_step": 13.87766718864441, "step": 459}
{"train_info/time_between_train_steps": 0.004981517791748047, "step": 459}
{"info/global_step": 460, "train_info/time_within_train_step": 13.875786781311035, "step": 460}
{"train_info/time_between_train_steps": 0.005621910095214844, "step": 460}
{"info/global_step": 461, "train_info/time_within_train_step": 13.8734130859375, "step": 461}
{"train_info/time_between_train_steps": 0.0046422481536865234, "step": 461}
{"info/global_step": 462, "train_info/time_within_train_step": 13.977884292602539, "step": 462}
{"train_info/time_between_train_steps": 0.0047109127044677734, "step": 462}
{"info/global_step": 463, "train_info/time_within_train_step": 13.884376287460327, "step": 463}
{"train_info/time_between_train_steps": 0.005446672439575195, "step": 463}
{"info/global_step": 464, "train_info/time_within_train_step": 13.923748970031738, "step": 464}
{"train_info/time_between_train_steps": 0.0058324337005615234, "step": 464}
{"info/global_step": 465, "train_info/time_within_train_step": 13.889582633972168, "step": 465}
{"train_info/time_between_train_steps": 0.0052721500396728516, "step": 465}
{"info/global_step": 466, "train_info/time_within_train_step": 13.881311416625977, "step": 466}
{"train_info/time_between_train_steps": 0.005349874496459961, "step": 466}
{"info/global_step": 467, "train_info/time_within_train_step": 13.879293441772461, "step": 467}
{"train_info/time_between_train_steps": 0.00500941276550293, "step": 467}
{"info/global_step": 468, "train_info/time_within_train_step": 13.88320517539978, "step": 468}
{"train_info/time_between_train_steps": 0.005250215530395508, "step": 468}
{"info/global_step": 469, "train_info/time_within_train_step": 13.885696649551392, "step": 469}
{"train_info/time_between_train_steps": 0.005777835845947266, "step": 469}
{"info/global_step": 470, "train_info/time_within_train_step": 13.884489297866821, "step": 470}
{"train_info/time_between_train_steps": 0.005093574523925781, "step": 470}
{"info/global_step": 471, "train_info/time_within_train_step": 13.894331455230713, "step": 471}
{"train_info/time_between_train_steps": 0.005963802337646484, "step": 471}
{"info/global_step": 472, "train_info/time_within_train_step": 13.89078664779663, "step": 472}
{"train_info/time_between_train_steps": 0.005368232727050781, "step": 472}
{"info/global_step": 473, "train_info/time_within_train_step": 13.920456886291504, "step": 473}
{"train_info/time_between_train_steps": 0.005128622055053711, "step": 473}
{"info/global_step": 474, "train_info/time_within_train_step": 13.910249948501587, "step": 474}
{"train_info/time_between_train_steps": 0.005621194839477539, "step": 474}
{"info/global_step": 475, "train_info/time_within_train_step": 13.9189772605896, "step": 475}
{"train_info/time_between_train_steps": 0.006959199905395508, "step": 475}
{"train_info/time_between_train_steps": 7.559364080429077, "step": 475}
{"info/global_step": 476, "train_info/time_within_train_step": 13.884634494781494, "step": 476}
{"train_info/time_between_train_steps": 0.004921674728393555, "step": 476}
{"info/global_step": 477, "train_info/time_within_train_step": 13.978466510772705, "step": 477}
{"train_info/time_between_train_steps": 0.00520777702331543, "step": 477}
{"info/global_step": 478, "train_info/time_within_train_step": 13.975866317749023, "step": 478}
{"train_info/time_between_train_steps": 0.005562782287597656, "step": 478}
{"info/global_step": 479, "train_info/time_within_train_step": 13.989914178848267, "step": 479}
{"train_info/time_between_train_steps": 0.00555729866027832, "step": 479}
{"info/global_step": 480, "train_info/time_within_train_step": 13.896990776062012, "step": 480}
{"train_info/time_between_train_steps": 0.005925893783569336, "step": 480}
{"info/global_step": 481, "train_info/time_within_train_step": 13.914825916290283, "step": 481}
{"train_info/time_between_train_steps": 0.004493236541748047, "step": 481}
{"info/global_step": 482, "train_info/time_within_train_step": 13.897196531295776, "step": 482}
{"train_info/time_between_train_steps": 0.0050220489501953125, "step": 482}
{"info/global_step": 483, "train_info/time_within_train_step": 13.906136989593506, "step": 483}
{"train_info/time_between_train_steps": 0.00493931770324707, "step": 483}
{"info/global_step": 484, "train_info/time_within_train_step": 13.909817934036255, "step": 484}
{"train_info/time_between_train_steps": 0.0057604312896728516, "step": 484}
{"info/global_step": 485, "train_info/time_within_train_step": 13.915971517562866, "step": 485}
{"train_info/time_between_train_steps": 0.005025148391723633, "step": 485}
{"info/global_step": 486, "train_info/time_within_train_step": 13.904758214950562, "step": 486}
{"train_info/time_between_train_steps": 0.00547480583190918, "step": 486}
{"info/global_step": 487, "train_info/time_within_train_step": 13.909534931182861, "step": 487}
{"train_info/time_between_train_steps": 0.005999565124511719, "step": 487}
{"info/global_step": 488, "train_info/time_within_train_step": 13.924289226531982, "step": 488}
{"train_info/time_between_train_steps": 0.00543975830078125, "step": 488}
{"info/global_step": 489, "train_info/time_within_train_step": 13.922906637191772, "step": 489}
{"train_info/time_between_train_steps": 0.005193948745727539, "step": 489}
{"info/global_step": 490, "train_info/time_within_train_step": 13.9044029712677, "step": 490}
{"train_info/time_between_train_steps": 0.00549626350402832, "step": 490}
{"info/global_step": 491, "train_info/time_within_train_step": 13.899667501449585, "step": 491}
{"train_info/time_between_train_steps": 0.006102800369262695, "step": 491}
{"info/global_step": 492, "train_info/time_within_train_step": 13.902477502822876, "step": 492}
{"train_info/time_between_train_steps": 0.005664825439453125, "step": 492}
{"info/global_step": 493, "train_info/time_within_train_step": 14.12291669845581, "step": 493}
{"train_info/time_between_train_steps": 0.00515294075012207, "step": 493}
{"info/global_step": 494, "train_info/time_within_train_step": 14.375902652740479, "step": 494}
{"train_info/time_between_train_steps": 0.005589723587036133, "step": 494}
{"info/global_step": 495, "train_info/time_within_train_step": 13.897714853286743, "step": 495}
{"train_info/time_between_train_steps": 0.005828857421875, "step": 495}
{"info/global_step": 496, "train_info/time_within_train_step": 13.970577239990234, "step": 496}
{"train_info/time_between_train_steps": 0.00567936897277832, "step": 496}
{"info/global_step": 497, "train_info/time_within_train_step": 13.926551103591919, "step": 497}
{"train_info/time_between_train_steps": 0.006577968597412109, "step": 497}
{"info/global_step": 498, "train_info/time_within_train_step": 14.240797996520996, "step": 498}
{"train_info/time_between_train_steps": 0.005131959915161133, "step": 498}
{"info/global_step": 499, "train_info/time_within_train_step": 13.986199140548706, "step": 499}
{"train_info/time_between_train_steps": 0.007014036178588867, "step": 499}
{"info/global_step": 500, "train_info/time_within_train_step": 14.002816200256348, "step": 500}
{"train_info": {"train_info/memory_allocated": 1920.9462890625, "train_info/memory_max_allocated": 20711.3779296875, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1737104635, "_runtime": 7534}, "step": 500}
{"logs": {"train/loss": 5.3832, "train/learning_rate": 0.00038888888888888887, "train/epoch": 19.02, "_timestamp": 1737104635, "_runtime": 7534}, "step": 500}
{"train_info/time_between_train_steps": 44.48552417755127, "step": 500}
{"train_info/time_between_train_steps": 52.22989296913147, "step": 500}
{"info/global_step": 501, "train_info/time_within_train_step": 13.850624084472656, "step": 501}
{"train_info/time_between_train_steps": 0.005180835723876953, "step": 501}
{"info/global_step": 502, "train_info/time_within_train_step": 14.01528549194336, "step": 502}
{"train_info/time_between_train_steps": 0.006057262420654297, "step": 502}
{"info/global_step": 503, "train_info/time_within_train_step": 13.937813520431519, "step": 503}
{"train_info/time_between_train_steps": 0.0060160160064697266, "step": 503}
{"info/global_step": 504, "train_info/time_within_train_step": 14.063852310180664, "step": 504}
{"train_info/time_between_train_steps": 0.005970954895019531, "step": 504}
{"info/global_step": 505, "train_info/time_within_train_step": 13.930076837539673, "step": 505}
{"train_info/time_between_train_steps": 0.005645751953125, "step": 505}
{"info/global_step": 506, "train_info/time_within_train_step": 13.958016157150269, "step": 506}
{"train_info/time_between_train_steps": 0.005822181701660156, "step": 506}
{"info/global_step": 507, "train_info/time_within_train_step": 13.90330457687378, "step": 507}
{"train_info/time_between_train_steps": 0.005746603012084961, "step": 507}
{"info/global_step": 508, "train_info/time_within_train_step": 13.907206296920776, "step": 508}
{"train_info/time_between_train_steps": 0.004909515380859375, "step": 508}
{"info/global_step": 509, "train_info/time_within_train_step": 13.995513200759888, "step": 509}
{"train_info/time_between_train_steps": 0.005228757858276367, "step": 509}
{"info/global_step": 510, "train_info/time_within_train_step": 13.902875423431396, "step": 510}
{"train_info/time_between_train_steps": 0.004983663558959961, "step": 510}
{"info/global_step": 511, "train_info/time_within_train_step": 13.92106032371521, "step": 511}
{"train_info/time_between_train_steps": 0.004925966262817383, "step": 511}
{"info/global_step": 512, "train_info/time_within_train_step": 13.900414228439331, "step": 512}
{"train_info/time_between_train_steps": 0.005639314651489258, "step": 512}
{"info/global_step": 513, "train_info/time_within_train_step": 13.905802726745605, "step": 513}
{"train_info/time_between_train_steps": 0.004878520965576172, "step": 513}
{"info/global_step": 514, "train_info/time_within_train_step": 13.894618034362793, "step": 514}
{"train_info/time_between_train_steps": 0.0052492618560791016, "step": 514}
{"info/global_step": 515, "train_info/time_within_train_step": 13.9159836769104, "step": 515}
{"train_info/time_between_train_steps": 0.0049021244049072266, "step": 515}
{"info/global_step": 516, "train_info/time_within_train_step": 13.951436996459961, "step": 516}
{"train_info/time_between_train_steps": 0.005038261413574219, "step": 516}
{"info/global_step": 517, "train_info/time_within_train_step": 13.912094831466675, "step": 517}
{"train_info/time_between_train_steps": 0.0055179595947265625, "step": 517}
{"info/global_step": 518, "train_info/time_within_train_step": 13.911371946334839, "step": 518}
{"train_info/time_between_train_steps": 0.005030632019042969, "step": 518}
{"info/global_step": 519, "train_info/time_within_train_step": 13.910475254058838, "step": 519}
{"train_info/time_between_train_steps": 0.004904985427856445, "step": 519}
{"info/global_step": 520, "train_info/time_within_train_step": 13.927100896835327, "step": 520}
{"train_info/time_between_train_steps": 0.005804300308227539, "step": 520}
{"info/global_step": 521, "train_info/time_within_train_step": 13.914317846298218, "step": 521}
{"train_info/time_between_train_steps": 0.005249500274658203, "step": 521}
{"info/global_step": 522, "train_info/time_within_train_step": 13.924223899841309, "step": 522}
{"train_info/time_between_train_steps": 0.005379676818847656, "step": 522}
{"info/global_step": 523, "train_info/time_within_train_step": 13.938178062438965, "step": 523}
{"train_info/time_between_train_steps": 0.005277156829833984, "step": 523}
{"info/global_step": 524, "train_info/time_within_train_step": 14.079203844070435, "step": 524}
{"train_info/time_between_train_steps": 0.006316661834716797, "step": 524}
{"info/global_step": 525, "train_info/time_within_train_step": 13.936328887939453, "step": 525}
{"train_info/time_between_train_steps": 0.005788087844848633, "step": 525}
{"train_info/time_between_train_steps": 7.807049036026001, "step": 525}
{"info/global_step": 526, "train_info/time_within_train_step": 13.875181436538696, "step": 526}
{"train_info/time_between_train_steps": 0.005273103713989258, "step": 526}
{"info/global_step": 527, "train_info/time_within_train_step": 14.034756898880005, "step": 527}
{"train_info/time_between_train_steps": 0.005610227584838867, "step": 527}
{"info/global_step": 528, "train_info/time_within_train_step": 13.904778003692627, "step": 528}
{"train_info/time_between_train_steps": 0.005736827850341797, "step": 528}
{"info/global_step": 529, "train_info/time_within_train_step": 14.052775144577026, "step": 529}
{"train_info/time_between_train_steps": 0.005599260330200195, "step": 529}
{"info/global_step": 530, "train_info/time_within_train_step": 13.900041103363037, "step": 530}
{"train_info/time_between_train_steps": 0.00494837760925293, "step": 530}
{"info/global_step": 531, "train_info/time_within_train_step": 13.933428764343262, "step": 531}
{"train_info/time_between_train_steps": 0.00564885139465332, "step": 531}
{"info/global_step": 532, "train_info/time_within_train_step": 13.895809173583984, "step": 532}
{"train_info/time_between_train_steps": 0.004815101623535156, "step": 532}
{"info/global_step": 533, "train_info/time_within_train_step": 13.882745504379272, "step": 533}
{"train_info/time_between_train_steps": 0.00479435920715332, "step": 533}
{"info/global_step": 534, "train_info/time_within_train_step": 13.882806777954102, "step": 534}
{"train_info/time_between_train_steps": 0.005197048187255859, "step": 534}
{"info/global_step": 535, "train_info/time_within_train_step": 13.89010500907898, "step": 535}
{"train_info/time_between_train_steps": 0.005800008773803711, "step": 535}
{"info/global_step": 536, "train_info/time_within_train_step": 13.919119596481323, "step": 536}
{"train_info/time_between_train_steps": 0.005087852478027344, "step": 536}
{"info/global_step": 537, "train_info/time_within_train_step": 13.893339157104492, "step": 537}
{"train_info/time_between_train_steps": 0.005700349807739258, "step": 537}
{"info/global_step": 538, "train_info/time_within_train_step": 13.895235776901245, "step": 538}
{"train_info/time_between_train_steps": 0.0049669742584228516, "step": 538}
{"info/global_step": 539, "train_info/time_within_train_step": 13.982244491577148, "step": 539}
{"train_info/time_between_train_steps": 0.004721641540527344, "step": 539}
{"info/global_step": 540, "train_info/time_within_train_step": 13.88461422920227, "step": 540}
{"train_info/time_between_train_steps": 0.004688739776611328, "step": 540}
{"info/global_step": 541, "train_info/time_within_train_step": 13.937399625778198, "step": 541}
{"train_info/time_between_train_steps": 0.005401611328125, "step": 541}
{"info/global_step": 542, "train_info/time_within_train_step": 13.87894344329834, "step": 542}
{"train_info/time_between_train_steps": 0.005150794982910156, "step": 542}
{"info/global_step": 543, "train_info/time_within_train_step": 13.896674394607544, "step": 543}
{"train_info/time_between_train_steps": 0.00584864616394043, "step": 543}
{"info/global_step": 544, "train_info/time_within_train_step": 13.904250621795654, "step": 544}
{"train_info/time_between_train_steps": 0.0051991939544677734, "step": 544}
{"info/global_step": 545, "train_info/time_within_train_step": 13.909474849700928, "step": 545}
{"train_info/time_between_train_steps": 0.005729198455810547, "step": 545}
{"info/global_step": 546, "train_info/time_within_train_step": 13.92007064819336, "step": 546}
{"train_info/time_between_train_steps": 0.0056133270263671875, "step": 546}
{"info/global_step": 547, "train_info/time_within_train_step": 13.913097620010376, "step": 547}
{"train_info/time_between_train_steps": 0.005551576614379883, "step": 547}
{"info/global_step": 548, "train_info/time_within_train_step": 13.906996011734009, "step": 548}
{"train_info/time_between_train_steps": 0.00561833381652832, "step": 548}
{"info/global_step": 549, "train_info/time_within_train_step": 13.945354461669922, "step": 549}
{"train_info/time_between_train_steps": 0.005820035934448242, "step": 549}
{"info/global_step": 550, "train_info/time_within_train_step": 13.940419435501099, "step": 550}
{"train_info": {"train_info/memory_allocated": 1920.9462890625, "train_info/memory_max_allocated": 20711.3779296875, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1737105394, "_runtime": 8293}, "step": 550}
{"logs": {"train/loss": 5.1423, "train/learning_rate": 0.0003611111111111111, "train/epoch": 21.02, "_timestamp": 1737105394, "_runtime": 8293}, "step": 550}
{"train_info/time_between_train_steps": 0.05938529968261719, "step": 550}
{"train_info/time_between_train_steps": 7.592665910720825, "step": 550}
{"info/global_step": 551, "train_info/time_within_train_step": 13.86886191368103, "step": 551}
{"train_info/time_between_train_steps": 0.0056345462799072266, "step": 551}
{"info/global_step": 552, "train_info/time_within_train_step": 14.013139247894287, "step": 552}
{"train_info/time_between_train_steps": 0.0049746036529541016, "step": 552}
{"info/global_step": 553, "train_info/time_within_train_step": 13.96943974494934, "step": 553}
{"train_info/time_between_train_steps": 0.0049152374267578125, "step": 553}
{"info/global_step": 554, "train_info/time_within_train_step": 14.082811832427979, "step": 554}
{"train_info/time_between_train_steps": 0.00488734245300293, "step": 554}
{"info/global_step": 555, "train_info/time_within_train_step": 13.988322019577026, "step": 555}
{"train_info/time_between_train_steps": 0.00517582893371582, "step": 555}
{"info/global_step": 556, "train_info/time_within_train_step": 13.913059711456299, "step": 556}
{"train_info/time_between_train_steps": 0.0055561065673828125, "step": 556}
{"info/global_step": 557, "train_info/time_within_train_step": 13.904933452606201, "step": 557}
{"train_info/time_between_train_steps": 0.005693197250366211, "step": 557}
{"info/global_step": 558, "train_info/time_within_train_step": 13.88853406906128, "step": 558}
{"train_info/time_between_train_steps": 0.005296230316162109, "step": 558}
{"info/global_step": 559, "train_info/time_within_train_step": 13.884921073913574, "step": 559}
{"train_info/time_between_train_steps": 0.005419492721557617, "step": 559}
{"info/global_step": 560, "train_info/time_within_train_step": 13.892133474349976, "step": 560}
{"train_info/time_between_train_steps": 0.005251646041870117, "step": 560}
{"info/global_step": 561, "train_info/time_within_train_step": 13.887730598449707, "step": 561}
{"train_info/time_between_train_steps": 0.0052945613861083984, "step": 561}
{"info/global_step": 562, "train_info/time_within_train_step": 13.915281534194946, "step": 562}
{"train_info/time_between_train_steps": 0.00513005256652832, "step": 562}
{"info/global_step": 563, "train_info/time_within_train_step": 13.892777919769287, "step": 563}
{"train_info/time_between_train_steps": 0.005391120910644531, "step": 563}
{"info/global_step": 564, "train_info/time_within_train_step": 13.902848720550537, "step": 564}
{"train_info/time_between_train_steps": 0.005780220031738281, "step": 564}
{"info/global_step": 565, "train_info/time_within_train_step": 13.896689176559448, "step": 565}
{"train_info/time_between_train_steps": 0.004870176315307617, "step": 565}
{"info/global_step": 566, "train_info/time_within_train_step": 13.91998839378357, "step": 566}
{"train_info/time_between_train_steps": 0.005423307418823242, "step": 566}
{"info/global_step": 567, "train_info/time_within_train_step": 13.895260572433472, "step": 567}
{"train_info/time_between_train_steps": 0.0054111480712890625, "step": 567}
{"info/global_step": 568, "train_info/time_within_train_step": 13.907825231552124, "step": 568}
{"train_info/time_between_train_steps": 0.004898548126220703, "step": 568}
{"info/global_step": 569, "train_info/time_within_train_step": 13.890384912490845, "step": 569}
{"train_info/time_between_train_steps": 0.005217552185058594, "step": 569}
{"info/global_step": 570, "train_info/time_within_train_step": 14.015764236450195, "step": 570}
{"train_info/time_between_train_steps": 0.0052416324615478516, "step": 570}
{"info/global_step": 571, "train_info/time_within_train_step": 13.923197984695435, "step": 571}
{"train_info/time_between_train_steps": 0.004934787750244141, "step": 571}
{"info/global_step": 572, "train_info/time_within_train_step": 13.90155839920044, "step": 572}
{"train_info/time_between_train_steps": 0.005704402923583984, "step": 572}
{"info/global_step": 573, "train_info/time_within_train_step": 13.907982587814331, "step": 573}
{"train_info/time_between_train_steps": 0.005283832550048828, "step": 573}
{"info/global_step": 574, "train_info/time_within_train_step": 13.908139944076538, "step": 574}
{"train_info/time_between_train_steps": 0.005557060241699219, "step": 574}
{"info/global_step": 575, "train_info/time_within_train_step": 13.945736408233643, "step": 575}
{"train_info/time_between_train_steps": 0.007570028305053711, "step": 575}
{"train_info/time_between_train_steps": 7.701272010803223, "step": 575}
{"info/global_step": 576, "train_info/time_within_train_step": 13.869638681411743, "step": 576}
{"train_info/time_between_train_steps": 0.005269527435302734, "step": 576}
{"info/global_step": 577, "train_info/time_within_train_step": 13.95889949798584, "step": 577}
{"train_info/time_between_train_steps": 0.004990100860595703, "step": 577}
{"info/global_step": 578, "train_info/time_within_train_step": 13.887614250183105, "step": 578}
{"train_info/time_between_train_steps": 0.005423307418823242, "step": 578}
{"info/global_step": 579, "train_info/time_within_train_step": 14.014126300811768, "step": 579}
{"train_info/time_between_train_steps": 0.0052983760833740234, "step": 579}
{"info/global_step": 580, "train_info/time_within_train_step": 13.903236627578735, "step": 580}
{"train_info/time_between_train_steps": 0.0052149295806884766, "step": 580}
{"info/global_step": 581, "train_info/time_within_train_step": 13.899317026138306, "step": 581}
{"train_info/time_between_train_steps": 0.005337715148925781, "step": 581}
{"info/global_step": 582, "train_info/time_within_train_step": 13.876274347305298, "step": 582}
{"train_info/time_between_train_steps": 0.0055620670318603516, "step": 582}
{"info/global_step": 583, "train_info/time_within_train_step": 13.899271488189697, "step": 583}
{"train_info/time_between_train_steps": 0.005600929260253906, "step": 583}
{"info/global_step": 584, "train_info/time_within_train_step": 13.917774200439453, "step": 584}
{"train_info/time_between_train_steps": 0.006036043167114258, "step": 584}
{"info/global_step": 585, "train_info/time_within_train_step": 13.941867589950562, "step": 585}
{"train_info/time_between_train_steps": 0.005660057067871094, "step": 585}
{"info/global_step": 586, "train_info/time_within_train_step": 14.022199392318726, "step": 586}
{"train_info/time_between_train_steps": 0.005127906799316406, "step": 586}
{"info/global_step": 587, "train_info/time_within_train_step": 13.910897493362427, "step": 587}
{"train_info/time_between_train_steps": 0.0057260990142822266, "step": 587}
{"info/global_step": 588, "train_info/time_within_train_step": 13.911990404129028, "step": 588}
{"train_info/time_between_train_steps": 0.004874467849731445, "step": 588}
{"info/global_step": 589, "train_info/time_within_train_step": 13.8893461227417, "step": 589}
{"train_info/time_between_train_steps": 0.005331754684448242, "step": 589}
{"info/global_step": 590, "train_info/time_within_train_step": 13.913100719451904, "step": 590}
{"train_info/time_between_train_steps": 0.005823612213134766, "step": 590}
{"info/global_step": 591, "train_info/time_within_train_step": 14.749968767166138, "step": 591}
{"train_info/time_between_train_steps": 0.0061283111572265625, "step": 591}
{"info/global_step": 592, "train_info/time_within_train_step": 15.323452234268188, "step": 592}
{"train_info/time_between_train_steps": 0.005119800567626953, "step": 592}
{"info/global_step": 593, "train_info/time_within_train_step": 13.917704105377197, "step": 593}
{"train_info/time_between_train_steps": 0.005845308303833008, "step": 593}
{"info/global_step": 594, "train_info/time_within_train_step": 13.949334859848022, "step": 594}
{"train_info/time_between_train_steps": 0.0060272216796875, "step": 594}
{"info/global_step": 595, "train_info/time_within_train_step": 14.163418054580688, "step": 595}
{"train_info/time_between_train_steps": 0.0062732696533203125, "step": 595}
{"info/global_step": 596, "train_info/time_within_train_step": 13.965266466140747, "step": 596}
{"train_info/time_between_train_steps": 0.006583690643310547, "step": 596}
{"info/global_step": 597, "train_info/time_within_train_step": 13.910356998443604, "step": 597}
{"train_info/time_between_train_steps": 0.005544424057006836, "step": 597}
{"info/global_step": 598, "train_info/time_within_train_step": 13.923301458358765, "step": 598}
{"train_info/time_between_train_steps": 0.005884408950805664, "step": 598}
{"info/global_step": 599, "train_info/time_within_train_step": 14.288087368011475, "step": 599}
{"train_info/time_between_train_steps": 0.005857706069946289, "step": 599}
{"info/global_step": 600, "train_info/time_within_train_step": 13.961082696914673, "step": 600}
{"train_info": {"train_info/memory_allocated": 1920.9462890625, "train_info/memory_max_allocated": 20711.3779296875, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1737106120, "_runtime": 9019}, "step": 600}
{"logs": {"train/loss": 4.9255, "train/learning_rate": 0.0003333333333333333, "train/epoch": 23.02, "_timestamp": 1737106120, "_runtime": 9019}, "step": 600}
{"train_info/time_between_train_steps": 39.15830993652344, "step": 600}
{"train_info/time_between_train_steps": 46.88274931907654, "step": 600}
{"info/global_step": 601, "train_info/time_within_train_step": 13.942270994186401, "step": 601}
{"train_info/time_between_train_steps": 0.005852222442626953, "step": 601}
{"info/global_step": 602, "train_info/time_within_train_step": 14.002406358718872, "step": 602}
{"train_info/time_between_train_steps": 0.005987644195556641, "step": 602}
{"info/global_step": 603, "train_info/time_within_train_step": 13.897650003433228, "step": 603}
{"train_info/time_between_train_steps": 0.006470203399658203, "step": 603}
{"info/global_step": 604, "train_info/time_within_train_step": 14.058175325393677, "step": 604}
{"train_info/time_between_train_steps": 0.006151676177978516, "step": 604}
{"info/global_step": 605, "train_info/time_within_train_step": 14.004021167755127, "step": 605}
{"train_info/time_between_train_steps": 0.005768775939941406, "step": 605}
{"info/global_step": 606, "train_info/time_within_train_step": 13.903567552566528, "step": 606}
{"train_info/time_between_train_steps": 0.005441427230834961, "step": 606}
{"info/global_step": 607, "train_info/time_within_train_step": 13.879324197769165, "step": 607}
{"train_info/time_between_train_steps": 0.006018877029418945, "step": 607}
{"info/global_step": 608, "train_info/time_within_train_step": 13.889935493469238, "step": 608}
{"train_info/time_between_train_steps": 0.0054624080657958984, "step": 608}
{"info/global_step": 609, "train_info/time_within_train_step": 13.894254922866821, "step": 609}
{"train_info/time_between_train_steps": 0.005362749099731445, "step": 609}
{"info/global_step": 610, "train_info/time_within_train_step": 13.879925966262817, "step": 610}
{"train_info/time_between_train_steps": 0.005761861801147461, "step": 610}
{"info/global_step": 611, "train_info/time_within_train_step": 13.889865159988403, "step": 611}
{"train_info/time_between_train_steps": 0.005430459976196289, "step": 611}
{"info/global_step": 612, "train_info/time_within_train_step": 13.88357663154602, "step": 612}
{"train_info/time_between_train_steps": 0.0056035518646240234, "step": 612}
{"info/global_step": 613, "train_info/time_within_train_step": 13.895215034484863, "step": 613}
{"train_info/time_between_train_steps": 0.005944490432739258, "step": 613}
{"info/global_step": 614, "train_info/time_within_train_step": 13.890885829925537, "step": 614}
{"train_info/time_between_train_steps": 0.0061571598052978516, "step": 614}
{"info/global_step": 615, "train_info/time_within_train_step": 13.892013788223267, "step": 615}
{"train_info/time_between_train_steps": 0.005270719528198242, "step": 615}
{"info/global_step": 616, "train_info/time_within_train_step": 13.98657751083374, "step": 616}
{"train_info/time_between_train_steps": 0.0062749385833740234, "step": 616}
{"info/global_step": 617, "train_info/time_within_train_step": 13.929054737091064, "step": 617}
{"train_info/time_between_train_steps": 0.005347490310668945, "step": 617}
{"info/global_step": 618, "train_info/time_within_train_step": 13.899430274963379, "step": 618}
{"train_info/time_between_train_steps": 0.005185127258300781, "step": 618}
{"info/global_step": 619, "train_info/time_within_train_step": 13.9028000831604, "step": 619}
{"train_info/time_between_train_steps": 0.005963563919067383, "step": 619}
{"info/global_step": 620, "train_info/time_within_train_step": 13.891112327575684, "step": 620}
{"train_info/time_between_train_steps": 0.004960775375366211, "step": 620}
{"info/global_step": 621, "train_info/time_within_train_step": 13.895996332168579, "step": 621}
{"train_info/time_between_train_steps": 0.005872249603271484, "step": 621}
{"info/global_step": 622, "train_info/time_within_train_step": 13.908474922180176, "step": 622}
{"train_info/time_between_train_steps": 0.005441188812255859, "step": 622}
{"info/global_step": 623, "train_info/time_within_train_step": 13.901727199554443, "step": 623}
{"train_info/time_between_train_steps": 0.005422115325927734, "step": 623}
{"info/global_step": 624, "train_info/time_within_train_step": 13.906137466430664, "step": 624}
{"train_info/time_between_train_steps": 0.005505800247192383, "step": 624}
{"info/global_step": 625, "train_info/time_within_train_step": 13.916173458099365, "step": 625}
{"train_info/time_between_train_steps": 0.00647735595703125, "step": 625}
{"train_info/time_between_train_steps": 7.542259216308594, "step": 625}
{"info/global_step": 626, "train_info/time_within_train_step": 13.893011331558228, "step": 626}
{"train_info/time_between_train_steps": 0.004692792892456055, "step": 626}
{"info/global_step": 627, "train_info/time_within_train_step": 14.01478362083435, "step": 627}
{"train_info/time_between_train_steps": 0.00513148307800293, "step": 627}
{"info/global_step": 628, "train_info/time_within_train_step": 13.9151291847229, "step": 628}
{"train_info/time_between_train_steps": 0.005657672882080078, "step": 628}
{"info/global_step": 629, "train_info/time_within_train_step": 14.034381628036499, "step": 629}
{"train_info/time_between_train_steps": 0.005198240280151367, "step": 629}
{"info/global_step": 630, "train_info/time_within_train_step": 13.88772177696228, "step": 630}
{"train_info/time_between_train_steps": 0.005800724029541016, "step": 630}
{"info/global_step": 631, "train_info/time_within_train_step": 13.917105913162231, "step": 631}
{"train_info/time_between_train_steps": 0.00488734245300293, "step": 631}
{"info/global_step": 632, "train_info/time_within_train_step": 13.982540845870972, "step": 632}
{"train_info/time_between_train_steps": 0.005433320999145508, "step": 632}
{"info/global_step": 633, "train_info/time_within_train_step": 13.895740747451782, "step": 633}
{"train_info/time_between_train_steps": 0.005505800247192383, "step": 633}
{"info/global_step": 634, "train_info/time_within_train_step": 13.982438325881958, "step": 634}
{"train_info/time_between_train_steps": 0.00572657585144043, "step": 634}
{"info/global_step": 635, "train_info/time_within_train_step": 13.889589071273804, "step": 635}
{"train_info/time_between_train_steps": 0.0058135986328125, "step": 635}
{"info/global_step": 636, "train_info/time_within_train_step": 13.885374546051025, "step": 636}
{"train_info/time_between_train_steps": 0.005366325378417969, "step": 636}
{"info/global_step": 637, "train_info/time_within_train_step": 13.897703409194946, "step": 637}
{"train_info/time_between_train_steps": 0.0052525997161865234, "step": 637}
{"info/global_step": 638, "train_info/time_within_train_step": 13.885703563690186, "step": 638}
{"train_info/time_between_train_steps": 0.00533604621887207, "step": 638}
{"info/global_step": 639, "train_info/time_within_train_step": 13.892957925796509, "step": 639}
{"train_info/time_between_train_steps": 0.0058629512786865234, "step": 639}
{"info/global_step": 640, "train_info/time_within_train_step": 13.897367238998413, "step": 640}
{"train_info/time_between_train_steps": 0.005596160888671875, "step": 640}
{"info/global_step": 641, "train_info/time_within_train_step": 13.898487567901611, "step": 641}
{"train_info/time_between_train_steps": 0.006184816360473633, "step": 641}
{"info/global_step": 642, "train_info/time_within_train_step": 13.9255051612854, "step": 642}
{"train_info/time_between_train_steps": 0.004906892776489258, "step": 642}
{"info/global_step": 643, "train_info/time_within_train_step": 13.893428087234497, "step": 643}
{"train_info/time_between_train_steps": 0.005377054214477539, "step": 643}
{"info/global_step": 644, "train_info/time_within_train_step": 13.889334201812744, "step": 644}
{"train_info/time_between_train_steps": 0.005190610885620117, "step": 644}
{"info/global_step": 645, "train_info/time_within_train_step": 13.894336700439453, "step": 645}
{"train_info/time_between_train_steps": 0.005842924118041992, "step": 645}
{"info/global_step": 646, "train_info/time_within_train_step": 13.909313917160034, "step": 646}
{"train_info/time_between_train_steps": 0.0061647891998291016, "step": 646}
{"info/global_step": 647, "train_info/time_within_train_step": 14.026946306228638, "step": 647}
{"train_info/time_between_train_steps": 0.00551152229309082, "step": 647}
{"info/global_step": 648, "train_info/time_within_train_step": 13.89749789237976, "step": 648}
{"train_info/time_between_train_steps": 0.005329132080078125, "step": 648}
{"info/global_step": 649, "train_info/time_within_train_step": 13.918104887008667, "step": 649}
{"train_info/time_between_train_steps": 0.005475282669067383, "step": 649}
{"info/global_step": 650, "train_info/time_within_train_step": 13.927855730056763, "step": 650}
{"train_info": {"train_info/memory_allocated": 1920.9462890625, "train_info/memory_max_allocated": 20711.3779296875, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1737106872, "_runtime": 9771}, "step": 650}
{"logs": {"train/loss": 4.7399, "train/learning_rate": 0.00030555555555555555, "train/epoch": 25.02, "_timestamp": 1737106872, "_runtime": 9771}, "step": 650}
{"train_info/time_between_train_steps": 0.057784318923950195, "step": 650}
{"train_info/time_between_train_steps": 7.781280279159546, "step": 650}
{"info/global_step": 651, "train_info/time_within_train_step": 13.865384101867676, "step": 651}
{"train_info/time_between_train_steps": 0.00519108772277832, "step": 651}
{"info/global_step": 652, "train_info/time_within_train_step": 13.97385287284851, "step": 652}
{"train_info/time_between_train_steps": 0.004923582077026367, "step": 652}
{"info/global_step": 653, "train_info/time_within_train_step": 13.868202924728394, "step": 653}
{"train_info/time_between_train_steps": 0.005647182464599609, "step": 653}
{"info/global_step": 654, "train_info/time_within_train_step": 13.974514484405518, "step": 654}
{"train_info/time_between_train_steps": 0.005465269088745117, "step": 654}
{"info/global_step": 655, "train_info/time_within_train_step": 13.894323825836182, "step": 655}
{"train_info/time_between_train_steps": 0.005565166473388672, "step": 655}
{"info/global_step": 656, "train_info/time_within_train_step": 13.934410572052002, "step": 656}
{"train_info/time_between_train_steps": 0.005706310272216797, "step": 656}
{"info/global_step": 657, "train_info/time_within_train_step": 13.893686056137085, "step": 657}
{"train_info/time_between_train_steps": 0.005362510681152344, "step": 657}
{"info/global_step": 658, "train_info/time_within_train_step": 13.896485328674316, "step": 658}
{"train_info/time_between_train_steps": 0.0060427188873291016, "step": 658}
{"info/global_step": 659, "train_info/time_within_train_step": 13.89784574508667, "step": 659}
{"train_info/time_between_train_steps": 0.006075143814086914, "step": 659}
{"info/global_step": 660, "train_info/time_within_train_step": 13.893388748168945, "step": 660}
{"train_info/time_between_train_steps": 0.005207538604736328, "step": 660}
{"info/global_step": 661, "train_info/time_within_train_step": 13.889667510986328, "step": 661}
{"train_info/time_between_train_steps": 0.0053904056549072266, "step": 661}
{"info/global_step": 662, "train_info/time_within_train_step": 13.890607595443726, "step": 662}
{"train_info/time_between_train_steps": 0.005143880844116211, "step": 662}
{"info/global_step": 663, "train_info/time_within_train_step": 14.033785343170166, "step": 663}
{"train_info/time_between_train_steps": 0.0052835941314697266, "step": 663}
{"info/global_step": 664, "train_info/time_within_train_step": 13.892825365066528, "step": 664}
{"train_info/time_between_train_steps": 0.005214214324951172, "step": 664}
{"info/global_step": 665, "train_info/time_within_train_step": 13.901156663894653, "step": 665}
{"train_info/time_between_train_steps": 0.005454540252685547, "step": 665}
{"info/global_step": 666, "train_info/time_within_train_step": 13.884443998336792, "step": 666}
{"train_info/time_between_train_steps": 0.005084514617919922, "step": 666}
{"info/global_step": 667, "train_info/time_within_train_step": 13.908895254135132, "step": 667}
{"train_info/time_between_train_steps": 0.0059549808502197266, "step": 667}
{"info/global_step": 668, "train_info/time_within_train_step": 13.922348976135254, "step": 668}
{"train_info/time_between_train_steps": 0.005949497222900391, "step": 668}
{"info/global_step": 669, "train_info/time_within_train_step": 13.88812780380249, "step": 669}
{"train_info/time_between_train_steps": 0.005269527435302734, "step": 669}
{"info/global_step": 670, "train_info/time_within_train_step": 13.886515378952026, "step": 670}
{"train_info/time_between_train_steps": 0.0050466060638427734, "step": 670}
{"info/global_step": 671, "train_info/time_within_train_step": 13.902166366577148, "step": 671}
{"train_info/time_between_train_steps": 0.005329608917236328, "step": 671}
{"info/global_step": 672, "train_info/time_within_train_step": 13.898857831954956, "step": 672}
{"train_info/time_between_train_steps": 0.005464792251586914, "step": 672}
{"info/global_step": 673, "train_info/time_within_train_step": 13.918173789978027, "step": 673}
{"train_info/time_between_train_steps": 0.005515098571777344, "step": 673}
{"info/global_step": 674, "train_info/time_within_train_step": 13.909534454345703, "step": 674}
{"train_info/time_between_train_steps": 0.005704641342163086, "step": 674}
{"info/global_step": 675, "train_info/time_within_train_step": 13.921090126037598, "step": 675}
{"train_info/time_between_train_steps": 0.00673675537109375, "step": 675}
{"train_info/time_between_train_steps": 7.854084730148315, "step": 675}
{"info/global_step": 676, "train_info/time_within_train_step": 13.921148300170898, "step": 676}
{"train_info/time_between_train_steps": 0.0051958560943603516, "step": 676}
{"info/global_step": 677, "train_info/time_within_train_step": 14.031049489974976, "step": 677}
{"train_info/time_between_train_steps": 0.005702495574951172, "step": 677}
{"info/global_step": 678, "train_info/time_within_train_step": 13.99370527267456, "step": 678}
{"train_info/time_between_train_steps": 0.005074501037597656, "step": 678}
{"info/global_step": 679, "train_info/time_within_train_step": 14.044378280639648, "step": 679}
{"train_info/time_between_train_steps": 0.0058441162109375, "step": 679}
{"info/global_step": 680, "train_info/time_within_train_step": 13.929939031600952, "step": 680}
{"train_info/time_between_train_steps": 0.005708456039428711, "step": 680}
{"info/global_step": 681, "train_info/time_within_train_step": 13.96187162399292, "step": 681}
{"train_info/time_between_train_steps": 0.004750490188598633, "step": 681}
{"info/global_step": 682, "train_info/time_within_train_step": 13.909506559371948, "step": 682}
{"train_info/time_between_train_steps": 0.004927396774291992, "step": 682}
{"info/global_step": 683, "train_info/time_within_train_step": 13.895551919937134, "step": 683}
{"train_info/time_between_train_steps": 0.005477190017700195, "step": 683}
{"info/global_step": 684, "train_info/time_within_train_step": 14.95650601387024, "step": 684}
{"train_info/time_between_train_steps": 0.005780220031738281, "step": 684}
{"info/global_step": 685, "train_info/time_within_train_step": 13.861536026000977, "step": 685}
{"train_info/time_between_train_steps": 0.005339622497558594, "step": 685}
{"info/global_step": 686, "train_info/time_within_train_step": 13.888795614242554, "step": 686}
{"train_info/time_between_train_steps": 0.005462646484375, "step": 686}
{"info/global_step": 687, "train_info/time_within_train_step": 13.89171838760376, "step": 687}
{"train_info/time_between_train_steps": 0.00513768196105957, "step": 687}
{"info/global_step": 688, "train_info/time_within_train_step": 13.894103288650513, "step": 688}
{"train_info/time_between_train_steps": 0.004930734634399414, "step": 688}
{"info/global_step": 689, "train_info/time_within_train_step": 13.893255949020386, "step": 689}
{"train_info/time_between_train_steps": 0.00523066520690918, "step": 689}
{"info/global_step": 690, "train_info/time_within_train_step": 13.897058486938477, "step": 690}
{"train_info/time_between_train_steps": 0.005360126495361328, "step": 690}
{"info/global_step": 691, "train_info/time_within_train_step": 13.890530586242676, "step": 691}
{"train_info/time_between_train_steps": 0.005786895751953125, "step": 691}
{"info/global_step": 692, "train_info/time_within_train_step": 14.441035985946655, "step": 692}
{"train_info/time_between_train_steps": 0.0054035186767578125, "step": 692}
{"info/global_step": 693, "train_info/time_within_train_step": 14.16831374168396, "step": 693}
{"train_info/time_between_train_steps": 0.005530357360839844, "step": 693}
{"info/global_step": 694, "train_info/time_within_train_step": 13.922133684158325, "step": 694}
{"train_info/time_between_train_steps": 0.0051267147064208984, "step": 694}
{"info/global_step": 695, "train_info/time_within_train_step": 13.928043842315674, "step": 695}
{"train_info/time_between_train_steps": 0.005903482437133789, "step": 695}
{"info/global_step": 696, "train_info/time_within_train_step": 15.004563570022583, "step": 696}
{"train_info/time_between_train_steps": 0.005451202392578125, "step": 696}
{"info/global_step": 697, "train_info/time_within_train_step": 14.214375734329224, "step": 697}
{"train_info/time_between_train_steps": 0.006143093109130859, "step": 697}
{"info/global_step": 698, "train_info/time_within_train_step": 13.960829734802246, "step": 698}
{"train_info/time_between_train_steps": 0.005730152130126953, "step": 698}
{"info/global_step": 699, "train_info/time_within_train_step": 13.93996000289917, "step": 699}
{"train_info/time_between_train_steps": 0.0064013004302978516, "step": 699}
{"info/global_step": 700, "train_info/time_within_train_step": 14.519638776779175, "step": 700}
{"train_info": {"train_info/memory_allocated": 1920.9462890625, "train_info/memory_max_allocated": 20711.3779296875, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1737107599, "_runtime": 10498}, "step": 700}
{"logs": {"train/loss": 4.582, "train/learning_rate": 0.0002777777777777778, "train/epoch": 27.02, "_timestamp": 1737107599, "_runtime": 10498}, "step": 700}
{"train_info/time_between_train_steps": 92.14519572257996, "step": 700}
{"train_info/time_between_train_steps": 99.99717593193054, "step": 700}
{"info/global_step": 701, "train_info/time_within_train_step": 13.724963665008545, "step": 701}
{"train_info/time_between_train_steps": 0.0050580501556396484, "step": 701}
{"info/global_step": 702, "train_info/time_within_train_step": 13.929886817932129, "step": 702}
{"train_info/time_between_train_steps": 0.0054018497467041016, "step": 702}
{"info/global_step": 703, "train_info/time_within_train_step": 13.827324867248535, "step": 703}
{"train_info/time_between_train_steps": 0.00505828857421875, "step": 703}
{"info/global_step": 704, "train_info/time_within_train_step": 13.946990489959717, "step": 704}
{"train_info/time_between_train_steps": 0.005171775817871094, "step": 704}
{"info/global_step": 705, "train_info/time_within_train_step": 13.826690673828125, "step": 705}
{"train_info/time_between_train_steps": 0.0049593448638916016, "step": 705}
{"info/global_step": 706, "train_info/time_within_train_step": 13.869992733001709, "step": 706}
{"train_info/time_between_train_steps": 0.005063295364379883, "step": 706}
{"info/global_step": 707, "train_info/time_within_train_step": 13.84573221206665, "step": 707}
{"train_info/time_between_train_steps": 0.0049631595611572266, "step": 707}
{"info/global_step": 708, "train_info/time_within_train_step": 13.823062181472778, "step": 708}
{"train_info/time_between_train_steps": 0.004952192306518555, "step": 708}
{"info/global_step": 709, "train_info/time_within_train_step": 13.913888216018677, "step": 709}
{"train_info/time_between_train_steps": 0.005448102951049805, "step": 709}
{"info/global_step": 710, "train_info/time_within_train_step": 13.824995517730713, "step": 710}
{"train_info/time_between_train_steps": 0.004848480224609375, "step": 710}
{"info/global_step": 711, "train_info/time_within_train_step": 13.847466468811035, "step": 711}
{"train_info/time_between_train_steps": 0.005191802978515625, "step": 711}
{"info/global_step": 712, "train_info/time_within_train_step": 13.840517282485962, "step": 712}
{"train_info/time_between_train_steps": 0.005794525146484375, "step": 712}
{"info/global_step": 713, "train_info/time_within_train_step": 13.835032939910889, "step": 713}
{"train_info/time_between_train_steps": 0.0047795772552490234, "step": 713}
{"info/global_step": 714, "train_info/time_within_train_step": 13.838617086410522, "step": 714}
{"train_info/time_between_train_steps": 0.004827022552490234, "step": 714}
{"info/global_step": 715, "train_info/time_within_train_step": 13.851216316223145, "step": 715}
{"train_info/time_between_train_steps": 0.005258798599243164, "step": 715}
{"info/global_step": 716, "train_info/time_within_train_step": 13.845516681671143, "step": 716}
{"train_info/time_between_train_steps": 0.005560636520385742, "step": 716}
{"info/global_step": 717, "train_info/time_within_train_step": 13.844404935836792, "step": 717}
{"train_info/time_between_train_steps": 0.0048825740814208984, "step": 717}
{"info/global_step": 718, "train_info/time_within_train_step": 13.842437744140625, "step": 718}
{"train_info/time_between_train_steps": 0.0047910213470458984, "step": 718}
{"info/global_step": 719, "train_info/time_within_train_step": 13.882903814315796, "step": 719}
{"train_info/time_between_train_steps": 0.005532264709472656, "step": 719}
{"info/global_step": 720, "train_info/time_within_train_step": 13.84477162361145, "step": 720}
{"train_info/time_between_train_steps": 0.005138874053955078, "step": 720}
{"info/global_step": 721, "train_info/time_within_train_step": 13.855881214141846, "step": 721}
{"train_info/time_between_train_steps": 0.004869937896728516, "step": 721}
{"info/global_step": 722, "train_info/time_within_train_step": 13.8455069065094, "step": 722}
{"train_info/time_between_train_steps": 0.005560874938964844, "step": 722}
{"info/global_step": 723, "train_info/time_within_train_step": 13.861129999160767, "step": 723}
{"train_info/time_between_train_steps": 0.005704164505004883, "step": 723}
{"info/global_step": 724, "train_info/time_within_train_step": 13.950928688049316, "step": 724}
{"train_info/time_between_train_steps": 0.005431413650512695, "step": 724}
{"info/global_step": 725, "train_info/time_within_train_step": 13.876701831817627, "step": 725}
{"train_info/time_between_train_steps": 0.0066149234771728516, "step": 725}
{"train_info/time_between_train_steps": 7.731144666671753, "step": 725}
{"info/global_step": 726, "train_info/time_within_train_step": 13.821927309036255, "step": 726}
{"train_info/time_between_train_steps": 0.0044689178466796875, "step": 726}
{"info/global_step": 727, "train_info/time_within_train_step": 13.920387506484985, "step": 727}
{"train_info/time_between_train_steps": 0.005366325378417969, "step": 727}
{"info/global_step": 728, "train_info/time_within_train_step": 13.868731021881104, "step": 728}
{"train_info/time_between_train_steps": 0.00579380989074707, "step": 728}
{"info/global_step": 729, "train_info/time_within_train_step": 14.03325366973877, "step": 729}
{"train_info/time_between_train_steps": 0.005281209945678711, "step": 729}
{"info/global_step": 730, "train_info/time_within_train_step": 13.83600401878357, "step": 730}
{"train_info/time_between_train_steps": 0.004633903503417969, "step": 730}
{"info/global_step": 731, "train_info/time_within_train_step": 13.853904485702515, "step": 731}
{"train_info/time_between_train_steps": 0.005200624465942383, "step": 731}
{"info/global_step": 732, "train_info/time_within_train_step": 13.8517906665802, "step": 732}
{"train_info/time_between_train_steps": 0.005087852478027344, "step": 732}
{"info/global_step": 733, "train_info/time_within_train_step": 13.840356826782227, "step": 733}
{"train_info/time_between_train_steps": 0.004941701889038086, "step": 733}
{"info/global_step": 734, "train_info/time_within_train_step": 13.83841609954834, "step": 734}
{"train_info/time_between_train_steps": 0.00493621826171875, "step": 734}
{"info/global_step": 735, "train_info/time_within_train_step": 13.837181329727173, "step": 735}
{"train_info/time_between_train_steps": 0.005274295806884766, "step": 735}
{"info/global_step": 736, "train_info/time_within_train_step": 13.850053310394287, "step": 736}
{"train_info/time_between_train_steps": 0.0052073001861572266, "step": 736}
{"info/global_step": 737, "train_info/time_within_train_step": 13.835676670074463, "step": 737}
{"train_info/time_between_train_steps": 0.004934549331665039, "step": 737}
{"info/global_step": 738, "train_info/time_within_train_step": 13.851463556289673, "step": 738}
{"train_info/time_between_train_steps": 0.00490570068359375, "step": 738}
{"info/global_step": 739, "train_info/time_within_train_step": 13.850688457489014, "step": 739}
{"train_info/time_between_train_steps": 0.0046808719635009766, "step": 739}
{"info/global_step": 740, "train_info/time_within_train_step": 13.918048620223999, "step": 740}
{"train_info/time_between_train_steps": 0.005359172821044922, "step": 740}
{"info/global_step": 741, "train_info/time_within_train_step": 13.838457107543945, "step": 741}
{"train_info/time_between_train_steps": 0.004708766937255859, "step": 741}
{"info/global_step": 742, "train_info/time_within_train_step": 13.83852219581604, "step": 742}
{"train_info/time_between_train_steps": 0.0057718753814697266, "step": 742}
{"info/global_step": 743, "train_info/time_within_train_step": 13.846403121948242, "step": 743}
{"train_info/time_between_train_steps": 0.004897594451904297, "step": 743}
{"info/global_step": 744, "train_info/time_within_train_step": 13.851297378540039, "step": 744}
{"train_info/time_between_train_steps": 0.0048372745513916016, "step": 744}
{"info/global_step": 745, "train_info/time_within_train_step": 13.845650672912598, "step": 745}
{"train_info/time_between_train_steps": 0.004621028900146484, "step": 745}
{"info/global_step": 746, "train_info/time_within_train_step": 13.842936515808105, "step": 746}
{"train_info/time_between_train_steps": 0.005422830581665039, "step": 746}
{"info/global_step": 747, "train_info/time_within_train_step": 13.855017185211182, "step": 747}
{"train_info/time_between_train_steps": 0.005924224853515625, "step": 747}
{"info/global_step": 748, "train_info/time_within_train_step": 13.856411457061768, "step": 748}
{"train_info/time_between_train_steps": 0.005553722381591797, "step": 748}
{"info/global_step": 749, "train_info/time_within_train_step": 13.898656368255615, "step": 749}
{"train_info/time_between_train_steps": 0.006323575973510742, "step": 749}
{"info/global_step": 750, "train_info/time_within_train_step": 13.845384359359741, "step": 750}
{"train_info": {"train_info/memory_allocated": 1920.9462890625, "train_info/memory_max_allocated": 20711.3779296875, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1737108402, "_runtime": 11301}, "step": 750}
{"logs": {"train/loss": 4.4476, "train/learning_rate": 0.00025, "train/epoch": 29.02, "_timestamp": 1737108402, "_runtime": 11301}, "step": 750}
{"train_info/time_between_train_steps": 0.056037187576293945, "step": 750}
{"train_info/time_between_train_steps": 7.852966070175171, "step": 750}
{"info/global_step": 751, "train_info/time_within_train_step": 13.796462059020996, "step": 751}
{"train_info/time_between_train_steps": 0.004748344421386719, "step": 751}
{"info/global_step": 752, "train_info/time_within_train_step": 13.884139776229858, "step": 752}
{"train_info/time_between_train_steps": 0.004875898361206055, "step": 752}
{"info/global_step": 753, "train_info/time_within_train_step": 13.810871601104736, "step": 753}
{"train_info/time_between_train_steps": 0.005191802978515625, "step": 753}
{"info/global_step": 754, "train_info/time_within_train_step": 13.943788766860962, "step": 754}
{"train_info/time_between_train_steps": 0.00557255744934082, "step": 754}
{"info/global_step": 755, "train_info/time_within_train_step": 13.908937931060791, "step": 755}
{"train_info/time_between_train_steps": 0.00597691535949707, "step": 755}
{"info/global_step": 756, "train_info/time_within_train_step": 13.825703620910645, "step": 756}
{"train_info/time_between_train_steps": 0.005088090896606445, "step": 756}
{"info/global_step": 757, "train_info/time_within_train_step": 13.817321062088013, "step": 757}
{"train_info/time_between_train_steps": 0.005612850189208984, "step": 757}
{"info/global_step": 758, "train_info/time_within_train_step": 13.80827522277832, "step": 758}
{"train_info/time_between_train_steps": 0.0047075748443603516, "step": 758}
{"info/global_step": 759, "train_info/time_within_train_step": 13.812429428100586, "step": 759}
{"train_info/time_between_train_steps": 0.005190372467041016, "step": 759}
{"info/global_step": 760, "train_info/time_within_train_step": 13.808499097824097, "step": 760}
{"train_info/time_between_train_steps": 0.0048389434814453125, "step": 760}
{"info/global_step": 761, "train_info/time_within_train_step": 13.813191413879395, "step": 761}
{"train_info/time_between_train_steps": 0.005591869354248047, "step": 761}
{"info/global_step": 762, "train_info/time_within_train_step": 13.82986068725586, "step": 762}
{"train_info/time_between_train_steps": 0.005040884017944336, "step": 762}
{"info/global_step": 763, "train_info/time_within_train_step": 13.809061288833618, "step": 763}
{"train_info/time_between_train_steps": 0.005023479461669922, "step": 763}
{"info/global_step": 764, "train_info/time_within_train_step": 13.8069486618042, "step": 764}
{"train_info/time_between_train_steps": 0.005835533142089844, "step": 764}
{"info/global_step": 765, "train_info/time_within_train_step": 13.815659046173096, "step": 765}
{"train_info/time_between_train_steps": 0.004948616027832031, "step": 765}
{"info/global_step": 766, "train_info/time_within_train_step": 13.829785346984863, "step": 766}
{"train_info/time_between_train_steps": 0.0048711299896240234, "step": 766}
{"info/global_step": 767, "train_info/time_within_train_step": 13.81508731842041, "step": 767}
{"train_info/time_between_train_steps": 0.005148410797119141, "step": 767}
{"info/global_step": 768, "train_info/time_within_train_step": 13.815776348114014, "step": 768}
{"train_info/time_between_train_steps": 0.005131244659423828, "step": 768}
{"info/global_step": 769, "train_info/time_within_train_step": 13.806539297103882, "step": 769}
{"train_info/time_between_train_steps": 0.004826068878173828, "step": 769}
{"info/global_step": 770, "train_info/time_within_train_step": 13.899110794067383, "step": 770}
{"train_info/time_between_train_steps": 0.005542755126953125, "step": 770}
{"info/global_step": 771, "train_info/time_within_train_step": 13.810085773468018, "step": 771}
{"train_info/time_between_train_steps": 0.0049059391021728516, "step": 771}
{"info/global_step": 772, "train_info/time_within_train_step": 13.814120054244995, "step": 772}
{"train_info/time_between_train_steps": 0.0052547454833984375, "step": 772}
{"info/global_step": 773, "train_info/time_within_train_step": 13.817427635192871, "step": 773}
{"train_info/time_between_train_steps": 0.0051844120025634766, "step": 773}
{"info/global_step": 774, "train_info/time_within_train_step": 13.825582504272461, "step": 774}
{"train_info/time_between_train_steps": 0.00579833984375, "step": 774}
{"info/global_step": 775, "train_info/time_within_train_step": 13.880196332931519, "step": 775}
{"train_info/time_between_train_steps": 0.0066149234771728516, "step": 775}
{"train_info/time_between_train_steps": 7.505356073379517, "step": 775}
{"info/global_step": 776, "train_info/time_within_train_step": 13.842851400375366, "step": 776}
{"train_info/time_between_train_steps": 0.0050394535064697266, "step": 776}
{"info/global_step": 777, "train_info/time_within_train_step": 13.927303314208984, "step": 777}
{"train_info/time_between_train_steps": 0.005627155303955078, "step": 777}
{"info/global_step": 778, "train_info/time_within_train_step": 18.171040058135986, "step": 778}
{"train_info/time_between_train_steps": 0.004757881164550781, "step": 778}
{"info/global_step": 779, "train_info/time_within_train_step": 13.98942494392395, "step": 779}
{"train_info/time_between_train_steps": 0.005193233489990234, "step": 779}
{"info/global_step": 780, "train_info/time_within_train_step": 13.846668481826782, "step": 780}
{"train_info/time_between_train_steps": 0.005682945251464844, "step": 780}
{"info/global_step": 781, "train_info/time_within_train_step": 13.86051607131958, "step": 781}
{"train_info/time_between_train_steps": 0.0048868656158447266, "step": 781}
{"info/global_step": 782, "train_info/time_within_train_step": 13.858397960662842, "step": 782}
{"train_info/time_between_train_steps": 0.004747629165649414, "step": 782}
{"info/global_step": 783, "train_info/time_within_train_step": 13.837940692901611, "step": 783}
{"train_info/time_between_train_steps": 0.005049467086791992, "step": 783}
{"info/global_step": 784, "train_info/time_within_train_step": 13.844384908676147, "step": 784}
{"train_info/time_between_train_steps": 0.005629301071166992, "step": 784}
{"info/global_step": 785, "train_info/time_within_train_step": 13.838348865509033, "step": 785}
{"train_info/time_between_train_steps": 0.004929304122924805, "step": 785}
{"info/global_step": 786, "train_info/time_within_train_step": 13.92782711982727, "step": 786}
{"train_info/time_between_train_steps": 0.0055696964263916016, "step": 786}
{"info/global_step": 787, "train_info/time_within_train_step": 13.86952519416809, "step": 787}
{"train_info/time_between_train_steps": 0.005801200866699219, "step": 787}
{"info/global_step": 788, "train_info/time_within_train_step": 13.834582567214966, "step": 788}
{"train_info/time_between_train_steps": 0.005298614501953125, "step": 788}
{"info/global_step": 789, "train_info/time_within_train_step": 13.846516370773315, "step": 789}
{"train_info/time_between_train_steps": 0.005189657211303711, "step": 789}
{"info/global_step": 790, "train_info/time_within_train_step": 13.84748101234436, "step": 790}
{"train_info/time_between_train_steps": 0.005606412887573242, "step": 790}
{"info/global_step": 791, "train_info/time_within_train_step": 14.249205589294434, "step": 791}
{"train_info/time_between_train_steps": 0.005123138427734375, "step": 791}
{"info/global_step": 792, "train_info/time_within_train_step": 13.872243165969849, "step": 792}
{"train_info/time_between_train_steps": 0.005558013916015625, "step": 792}
{"info/global_step": 793, "train_info/time_within_train_step": 13.876627445220947, "step": 793}
{"train_info/time_between_train_steps": 0.004749774932861328, "step": 793}
{"info/global_step": 794, "train_info/time_within_train_step": 13.848454713821411, "step": 794}
{"train_info/time_between_train_steps": 0.005301237106323242, "step": 794}
{"info/global_step": 795, "train_info/time_within_train_step": 13.857109308242798, "step": 795}
{"train_info/time_between_train_steps": 0.0048885345458984375, "step": 795}
{"info/global_step": 796, "train_info/time_within_train_step": 13.85547137260437, "step": 796}
{"train_info/time_between_train_steps": 0.005281686782836914, "step": 796}
{"info/global_step": 797, "train_info/time_within_train_step": 13.859542608261108, "step": 797}
{"train_info/time_between_train_steps": 0.005314826965332031, "step": 797}
{"info/global_step": 798, "train_info/time_within_train_step": 13.880496263504028, "step": 798}
{"train_info/time_between_train_steps": 0.0061740875244140625, "step": 798}
{"info/global_step": 799, "train_info/time_within_train_step": 13.89579725265503, "step": 799}
{"train_info/time_between_train_steps": 0.006278276443481445, "step": 799}
{"info/global_step": 800, "train_info/time_within_train_step": 13.904222011566162, "step": 800}
{"train_info": {"train_info/memory_allocated": 1920.9462890625, "train_info/memory_max_allocated": 20711.3779296875, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1737109117, "_runtime": 12016}, "step": 800}
{"logs": {"train/loss": 4.334, "train/learning_rate": 0.00022222222222222218, "train/epoch": 31.02, "_timestamp": 1737109117, "_runtime": 12016}, "step": 800}
{"train_info/time_between_train_steps": 30.34269690513611, "step": 800}
{"train_info/time_between_train_steps": 37.979684591293335, "step": 800}
{"info/global_step": 801, "train_info/time_within_train_step": 13.888470649719238, "step": 801}
{"train_info/time_between_train_steps": 0.004972219467163086, "step": 801}
{"info/global_step": 802, "train_info/time_within_train_step": 13.901676893234253, "step": 802}
{"train_info/time_between_train_steps": 0.0056591033935546875, "step": 802}
{"info/global_step": 803, "train_info/time_within_train_step": 13.825133323669434, "step": 803}
{"train_info/time_between_train_steps": 0.005578756332397461, "step": 803}
{"info/global_step": 804, "train_info/time_within_train_step": 13.939727544784546, "step": 804}
{"train_info/time_between_train_steps": 0.004922389984130859, "step": 804}
{"info/global_step": 805, "train_info/time_within_train_step": 13.85987138748169, "step": 805}
{"train_info/time_between_train_steps": 0.005448818206787109, "step": 805}
{"info/global_step": 806, "train_info/time_within_train_step": 13.884599208831787, "step": 806}
{"train_info/time_between_train_steps": 0.0059015750885009766, "step": 806}
{"info/global_step": 807, "train_info/time_within_train_step": 13.848915815353394, "step": 807}
{"train_info/time_between_train_steps": 0.004834413528442383, "step": 807}
{"info/global_step": 808, "train_info/time_within_train_step": 13.846395254135132, "step": 808}
{"train_info/time_between_train_steps": 0.005112409591674805, "step": 808}
{"info/global_step": 809, "train_info/time_within_train_step": 13.845700025558472, "step": 809}
{"train_info/time_between_train_steps": 0.0057184696197509766, "step": 809}
{"info/global_step": 810, "train_info/time_within_train_step": 13.843734979629517, "step": 810}
{"train_info/time_between_train_steps": 0.005218505859375, "step": 810}
{"info/global_step": 811, "train_info/time_within_train_step": 13.856698036193848, "step": 811}
{"train_info/time_between_train_steps": 0.00579524040222168, "step": 811}
{"info/global_step": 812, "train_info/time_within_train_step": 13.86931324005127, "step": 812}
{"train_info/time_between_train_steps": 0.0062291622161865234, "step": 812}
{"info/global_step": 813, "train_info/time_within_train_step": 13.853545665740967, "step": 813}
{"train_info/time_between_train_steps": 0.005313396453857422, "step": 813}
{"info/global_step": 814, "train_info/time_within_train_step": 13.91489291191101, "step": 814}
{"train_info/time_between_train_steps": 0.005849361419677734, "step": 814}
{"info/global_step": 815, "train_info/time_within_train_step": 13.86755895614624, "step": 815}
{"train_info/time_between_train_steps": 0.005231618881225586, "step": 815}
{"info/global_step": 816, "train_info/time_within_train_step": 13.86520266532898, "step": 816}
{"train_info/time_between_train_steps": 0.005215883255004883, "step": 816}
{"info/global_step": 817, "train_info/time_within_train_step": 13.94736385345459, "step": 817}
{"train_info/time_between_train_steps": 0.006167173385620117, "step": 817}
{"info/global_step": 818, "train_info/time_within_train_step": 13.891764402389526, "step": 818}
{"train_info/time_between_train_steps": 0.0055582523345947266, "step": 818}
{"info/global_step": 819, "train_info/time_within_train_step": 13.861551284790039, "step": 819}
{"train_info/time_between_train_steps": 0.0058557987213134766, "step": 819}
{"info/global_step": 820, "train_info/time_within_train_step": 13.865716934204102, "step": 820}
{"train_info/time_between_train_steps": 0.004737138748168945, "step": 820}
{"info/global_step": 821, "train_info/time_within_train_step": 13.861412286758423, "step": 821}
{"train_info/time_between_train_steps": 0.005887269973754883, "step": 821}
{"info/global_step": 822, "train_info/time_within_train_step": 13.869692087173462, "step": 822}
{"train_info/time_between_train_steps": 0.005462646484375, "step": 822}
{"info/global_step": 823, "train_info/time_within_train_step": 13.887012004852295, "step": 823}
{"train_info/time_between_train_steps": 0.005971193313598633, "step": 823}
{"info/global_step": 824, "train_info/time_within_train_step": 13.84656834602356, "step": 824}
{"train_info/time_between_train_steps": 0.00538945198059082, "step": 824}
{"info/global_step": 825, "train_info/time_within_train_step": 13.860881328582764, "step": 825}
{"train_info/time_between_train_steps": 0.0063631534576416016, "step": 825}
{"train_info/time_between_train_steps": 7.746461391448975, "step": 825}
{"info/global_step": 826, "train_info/time_within_train_step": 13.863133430480957, "step": 826}
{"train_info/time_between_train_steps": 0.005014657974243164, "step": 826}
{"info/global_step": 827, "train_info/time_within_train_step": 13.953234672546387, "step": 827}
{"train_info/time_between_train_steps": 0.005781412124633789, "step": 827}
{"info/global_step": 828, "train_info/time_within_train_step": 13.840514183044434, "step": 828}
{"train_info/time_between_train_steps": 0.005462169647216797, "step": 828}
{"info/global_step": 829, "train_info/time_within_train_step": 13.938392162322998, "step": 829}
{"train_info/time_between_train_steps": 0.005077838897705078, "step": 829}
{"info/global_step": 830, "train_info/time_within_train_step": 13.838955640792847, "step": 830}
{"train_info/time_between_train_steps": 0.005227327346801758, "step": 830}
{"info/global_step": 831, "train_info/time_within_train_step": 13.847896814346313, "step": 831}
{"train_info/time_between_train_steps": 0.005059480667114258, "step": 831}
{"info/global_step": 832, "train_info/time_within_train_step": 13.897728443145752, "step": 832}
{"train_info/time_between_train_steps": 0.004863262176513672, "step": 832}
{"info/global_step": 833, "train_info/time_within_train_step": 13.83070158958435, "step": 833}
{"train_info/time_between_train_steps": 0.005545854568481445, "step": 833}
{"info/global_step": 834, "train_info/time_within_train_step": 13.82063364982605, "step": 834}
{"train_info/time_between_train_steps": 0.005353450775146484, "step": 834}
{"info/global_step": 835, "train_info/time_within_train_step": 13.825616121292114, "step": 835}
{"train_info/time_between_train_steps": 0.004736661911010742, "step": 835}
{"info/global_step": 836, "train_info/time_within_train_step": 13.82618498802185, "step": 836}
{"train_info/time_between_train_steps": 0.005213737487792969, "step": 836}
{"info/global_step": 837, "train_info/time_within_train_step": 13.835739135742188, "step": 837}
{"train_info/time_between_train_steps": 0.004808187484741211, "step": 837}
{"info/global_step": 838, "train_info/time_within_train_step": 13.823648929595947, "step": 838}
{"train_info/time_between_train_steps": 0.005661964416503906, "step": 838}
{"info/global_step": 839, "train_info/time_within_train_step": 13.827075719833374, "step": 839}
{"train_info/time_between_train_steps": 0.005635976791381836, "step": 839}
{"info/global_step": 840, "train_info/time_within_train_step": 13.826093435287476, "step": 840}
{"train_info/time_between_train_steps": 0.0049991607666015625, "step": 840}
{"info/global_step": 841, "train_info/time_within_train_step": 13.83756422996521, "step": 841}
{"train_info/time_between_train_steps": 0.005070924758911133, "step": 841}
{"info/global_step": 842, "train_info/time_within_train_step": 13.829780578613281, "step": 842}
{"train_info/time_between_train_steps": 0.0053064823150634766, "step": 842}
{"info/global_step": 843, "train_info/time_within_train_step": 13.836997747421265, "step": 843}
{"train_info/time_between_train_steps": 0.005039215087890625, "step": 843}
{"info/global_step": 844, "train_info/time_within_train_step": 13.86885404586792, "step": 844}
{"train_info/time_between_train_steps": 0.005214691162109375, "step": 844}
{"info/global_step": 845, "train_info/time_within_train_step": 13.860023260116577, "step": 845}
{"train_info/time_between_train_steps": 0.005334377288818359, "step": 845}
{"info/global_step": 846, "train_info/time_within_train_step": 13.858373880386353, "step": 846}
{"train_info/time_between_train_steps": 0.005422115325927734, "step": 846}
{"info/global_step": 847, "train_info/time_within_train_step": 13.941861629486084, "step": 847}
{"train_info/time_between_train_steps": 0.006005525588989258, "step": 847}
{"info/global_step": 848, "train_info/time_within_train_step": 13.91273808479309, "step": 848}
{"train_info/time_between_train_steps": 0.005427122116088867, "step": 848}
{"info/global_step": 849, "train_info/time_within_train_step": 13.879227876663208, "step": 849}
{"train_info/time_between_train_steps": 0.0056362152099609375, "step": 849}
{"info/global_step": 850, "train_info/time_within_train_step": 13.881348133087158, "step": 850}
{"train_info": {"train_info/memory_allocated": 1920.9462890625, "train_info/memory_max_allocated": 20711.3779296875, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1737109858, "_runtime": 12757}, "step": 850}
{"logs": {"train/loss": 4.2328, "train/learning_rate": 0.00019444444444444443, "train/epoch": 33.02, "_timestamp": 1737109858, "_runtime": 12757}, "step": 850}
{"train_info/time_between_train_steps": 0.03741192817687988, "step": 850}
{"train_info/time_between_train_steps": 7.543395280838013, "step": 850}
{"info/global_step": 851, "train_info/time_within_train_step": 13.834896564483643, "step": 851}
{"train_info/time_between_train_steps": 0.004757404327392578, "step": 851}
{"info/global_step": 852, "train_info/time_within_train_step": 13.952773809432983, "step": 852}
{"train_info/time_between_train_steps": 0.005392789840698242, "step": 852}
{"info/global_step": 853, "train_info/time_within_train_step": 13.85461139678955, "step": 853}
{"train_info/time_between_train_steps": 0.0058596134185791016, "step": 853}
{"info/global_step": 854, "train_info/time_within_train_step": 13.979982852935791, "step": 854}
{"train_info/time_between_train_steps": 0.005873203277587891, "step": 854}
{"info/global_step": 855, "train_info/time_within_train_step": 13.858054399490356, "step": 855}
{"train_info/time_between_train_steps": 0.005484580993652344, "step": 855}
{"info/global_step": 856, "train_info/time_within_train_step": 13.896885633468628, "step": 856}
{"train_info/time_between_train_steps": 0.005024909973144531, "step": 856}
{"info/global_step": 857, "train_info/time_within_train_step": 13.859127759933472, "step": 857}
{"train_info/time_between_train_steps": 0.005246877670288086, "step": 857}
{"info/global_step": 858, "train_info/time_within_train_step": 13.854490280151367, "step": 858}
{"train_info/time_between_train_steps": 0.005370378494262695, "step": 858}
{"info/global_step": 859, "train_info/time_within_train_step": 13.868630647659302, "step": 859}
{"train_info/time_between_train_steps": 0.00585627555847168, "step": 859}
{"info/global_step": 860, "train_info/time_within_train_step": 13.857062101364136, "step": 860}
{"train_info/time_between_train_steps": 0.00594639778137207, "step": 860}
{"info/global_step": 861, "train_info/time_within_train_step": 13.860147476196289, "step": 861}
{"train_info/time_between_train_steps": 0.004858970642089844, "step": 861}
{"info/global_step": 862, "train_info/time_within_train_step": 13.857688903808594, "step": 862}
{"train_info/time_between_train_steps": 0.00487518310546875, "step": 862}
{"info/global_step": 863, "train_info/time_within_train_step": 13.951165437698364, "step": 863}
{"train_info/time_between_train_steps": 0.006073474884033203, "step": 863}
{"info/global_step": 864, "train_info/time_within_train_step": 13.854550123214722, "step": 864}
{"train_info/time_between_train_steps": 0.0055620670318603516, "step": 864}
{"info/global_step": 865, "train_info/time_within_train_step": 13.87207841873169, "step": 865}
{"train_info/time_between_train_steps": 0.005644798278808594, "step": 865}
{"info/global_step": 866, "train_info/time_within_train_step": 13.863553047180176, "step": 866}
{"train_info/time_between_train_steps": 0.004889249801635742, "step": 866}
{"info/global_step": 867, "train_info/time_within_train_step": 13.867594480514526, "step": 867}
{"train_info/time_between_train_steps": 0.005133867263793945, "step": 867}
{"info/global_step": 868, "train_info/time_within_train_step": 13.86658525466919, "step": 868}
{"train_info/time_between_train_steps": 0.005049705505371094, "step": 868}
{"info/global_step": 869, "train_info/time_within_train_step": 13.863531112670898, "step": 869}
{"train_info/time_between_train_steps": 0.00543212890625, "step": 869}
{"info/global_step": 870, "train_info/time_within_train_step": 13.874708652496338, "step": 870}
{"train_info/time_between_train_steps": 0.0060956478118896484, "step": 870}
{"info/global_step": 871, "train_info/time_within_train_step": 13.872233152389526, "step": 871}
{"train_info/time_between_train_steps": 0.005196094512939453, "step": 871}
{"info/global_step": 872, "train_info/time_within_train_step": 13.862391948699951, "step": 872}
{"train_info/time_between_train_steps": 0.005228281021118164, "step": 872}
{"info/global_step": 873, "train_info/time_within_train_step": 13.901863098144531, "step": 873}
{"train_info/time_between_train_steps": 0.005963563919067383, "step": 873}
{"info/global_step": 874, "train_info/time_within_train_step": 13.878726959228516, "step": 874}
{"train_info/time_between_train_steps": 0.006671428680419922, "step": 874}
{"info/global_step": 875, "train_info/time_within_train_step": 13.855653047561646, "step": 875}
{"train_info/time_between_train_steps": 0.006565093994140625, "step": 875}
{"train_info/time_between_train_steps": 7.649878025054932, "step": 875}
{"info/global_step": 876, "train_info/time_within_train_step": 13.797175168991089, "step": 876}
{"train_info/time_between_train_steps": 0.004824638366699219, "step": 876}
{"info/global_step": 877, "train_info/time_within_train_step": 14.223211765289307, "step": 877}
{"train_info/time_between_train_steps": 0.005077838897705078, "step": 877}
{"info/global_step": 878, "train_info/time_within_train_step": 13.981128215789795, "step": 878}
{"train_info/time_between_train_steps": 0.005494356155395508, "step": 878}
{"info/global_step": 879, "train_info/time_within_train_step": 13.915945529937744, "step": 879}
{"train_info/time_between_train_steps": 0.005011558532714844, "step": 879}
{"info/global_step": 880, "train_info/time_within_train_step": 13.840072631835938, "step": 880}
{"train_info/time_between_train_steps": 0.0057604312896728516, "step": 880}
{"info/global_step": 881, "train_info/time_within_train_step": 13.864104747772217, "step": 881}
{"train_info/time_between_train_steps": 0.005109071731567383, "step": 881}
{"info/global_step": 882, "train_info/time_within_train_step": 13.824729204177856, "step": 882}
{"train_info/time_between_train_steps": 0.005004405975341797, "step": 882}
{"info/global_step": 883, "train_info/time_within_train_step": 13.81810998916626, "step": 883}
{"train_info/time_between_train_steps": 0.0051882266998291016, "step": 883}
{"info/global_step": 884, "train_info/time_within_train_step": 13.82600998878479, "step": 884}
{"train_info/time_between_train_steps": 0.005784749984741211, "step": 884}
{"info/global_step": 885, "train_info/time_within_train_step": 13.836527347564697, "step": 885}
{"train_info/time_between_train_steps": 0.005280017852783203, "step": 885}
{"info/global_step": 886, "train_info/time_within_train_step": 13.843680143356323, "step": 886}
{"train_info/time_between_train_steps": 0.005610227584838867, "step": 886}
{"info/global_step": 887, "train_info/time_within_train_step": 13.84045696258545, "step": 887}
{"train_info/time_between_train_steps": 0.004840373992919922, "step": 887}
{"info/global_step": 888, "train_info/time_within_train_step": 13.824218273162842, "step": 888}
{"train_info/time_between_train_steps": 0.005199432373046875, "step": 888}
{"info/global_step": 889, "train_info/time_within_train_step": 13.808791399002075, "step": 889}
{"train_info/time_between_train_steps": 0.004787921905517578, "step": 889}
{"info/global_step": 890, "train_info/time_within_train_step": 14.32033634185791, "step": 890}
{"train_info/time_between_train_steps": 0.0050694942474365234, "step": 890}
{"info/global_step": 891, "train_info/time_within_train_step": 13.835784196853638, "step": 891}
{"train_info/time_between_train_steps": 0.0051996707916259766, "step": 891}
{"info/global_step": 892, "train_info/time_within_train_step": 13.8437340259552, "step": 892}
{"train_info/time_between_train_steps": 0.0047533512115478516, "step": 892}
{"info/global_step": 893, "train_info/time_within_train_step": 13.83639121055603, "step": 893}
{"train_info/time_between_train_steps": 0.005484342575073242, "step": 893}
{"info/global_step": 894, "train_info/time_within_train_step": 13.918128252029419, "step": 894}
{"train_info/time_between_train_steps": 0.005584239959716797, "step": 894}
{"info/global_step": 895, "train_info/time_within_train_step": 13.829130172729492, "step": 895}
{"train_info/time_between_train_steps": 0.005602359771728516, "step": 895}
{"info/global_step": 896, "train_info/time_within_train_step": 13.847212314605713, "step": 896}
{"train_info/time_between_train_steps": 0.005254507064819336, "step": 896}
{"info/global_step": 897, "train_info/time_within_train_step": 13.852009773254395, "step": 897}
{"train_info/time_between_train_steps": 0.006094932556152344, "step": 897}
{"info/global_step": 898, "train_info/time_within_train_step": 13.868996143341064, "step": 898}
{"train_info/time_between_train_steps": 0.005800724029541016, "step": 898}
{"info/global_step": 899, "train_info/time_within_train_step": 13.842581748962402, "step": 899}
{"train_info/time_between_train_steps": 0.005717277526855469, "step": 899}
{"info/global_step": 900, "train_info/time_within_train_step": 13.865249872207642, "step": 900}
{"train_info": {"train_info/memory_allocated": 1920.9462890625, "train_info/memory_max_allocated": 20711.3779296875, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1737110571, "_runtime": 13470}, "step": 900}
{"logs": {"train/loss": 4.1455, "train/learning_rate": 0.00016666666666666666, "train/epoch": 35.02, "_timestamp": 1737110571, "_runtime": 13470}, "step": 900}
{"train_info/time_between_train_steps": 41.99302268028259, "step": 900}
{"train_info/time_between_train_steps": 49.706995487213135, "step": 900}
{"info/global_step": 901, "train_info/time_within_train_step": 13.76110553741455, "step": 901}
{"train_info/time_between_train_steps": 0.005234718322753906, "step": 901}
{"info/global_step": 902, "train_info/time_within_train_step": 13.858489513397217, "step": 902}
{"train_info/time_between_train_steps": 0.00558924674987793, "step": 902}
{"info/global_step": 903, "train_info/time_within_train_step": 13.792221069335938, "step": 903}
{"train_info/time_between_train_steps": 0.0049855709075927734, "step": 903}
{"info/global_step": 904, "train_info/time_within_train_step": 13.911148309707642, "step": 904}
{"train_info/time_between_train_steps": 0.005481719970703125, "step": 904}
{"info/global_step": 905, "train_info/time_within_train_step": 13.808584213256836, "step": 905}
{"train_info/time_between_train_steps": 0.005221128463745117, "step": 905}
{"info/global_step": 906, "train_info/time_within_train_step": 13.840685367584229, "step": 906}
{"train_info/time_between_train_steps": 0.004719257354736328, "step": 906}
{"info/global_step": 907, "train_info/time_within_train_step": 13.808541059494019, "step": 907}
{"train_info/time_between_train_steps": 0.004819393157958984, "step": 907}
{"info/global_step": 908, "train_info/time_within_train_step": 13.819933414459229, "step": 908}
{"train_info/time_between_train_steps": 0.005009889602661133, "step": 908}
{"info/global_step": 909, "train_info/time_within_train_step": 13.903777837753296, "step": 909}
{"train_info/time_between_train_steps": 0.005141496658325195, "step": 909}
{"info/global_step": 910, "train_info/time_within_train_step": 13.825398683547974, "step": 910}
{"train_info/time_between_train_steps": 0.005709648132324219, "step": 910}
{"info/global_step": 911, "train_info/time_within_train_step": 13.824877262115479, "step": 911}
{"train_info/time_between_train_steps": 0.005155801773071289, "step": 911}
{"info/global_step": 912, "train_info/time_within_train_step": 13.832808256149292, "step": 912}
{"train_info/time_between_train_steps": 0.0056264400482177734, "step": 912}
{"info/global_step": 913, "train_info/time_within_train_step": 13.837530136108398, "step": 913}
{"train_info/time_between_train_steps": 0.0050809383392333984, "step": 913}
{"info/global_step": 914, "train_info/time_within_train_step": 13.832710981369019, "step": 914}
{"train_info/time_between_train_steps": 0.0055620670318603516, "step": 914}
{"info/global_step": 915, "train_info/time_within_train_step": 13.83101511001587, "step": 915}
{"train_info/time_between_train_steps": 0.005215644836425781, "step": 915}
{"info/global_step": 916, "train_info/time_within_train_step": 13.831076622009277, "step": 916}
{"train_info/time_between_train_steps": 0.004987001419067383, "step": 916}
{"info/global_step": 917, "train_info/time_within_train_step": 13.832977056503296, "step": 917}
{"train_info/time_between_train_steps": 0.005133152008056641, "step": 917}
{"info/global_step": 918, "train_info/time_within_train_step": 13.838436126708984, "step": 918}
{"train_info/time_between_train_steps": 0.005161762237548828, "step": 918}
{"info/global_step": 919, "train_info/time_within_train_step": 13.82762885093689, "step": 919}
{"train_info/time_between_train_steps": 0.004818916320800781, "step": 919}
{"info/global_step": 920, "train_info/time_within_train_step": 13.83781886100769, "step": 920}
{"train_info/time_between_train_steps": 0.004988431930541992, "step": 920}
{"info/global_step": 921, "train_info/time_within_train_step": 13.843563556671143, "step": 921}
{"train_info/time_between_train_steps": 0.00540614128112793, "step": 921}
{"info/global_step": 922, "train_info/time_within_train_step": 13.841615915298462, "step": 922}
{"train_info/time_between_train_steps": 0.00637364387512207, "step": 922}
{"info/global_step": 923, "train_info/time_within_train_step": 13.855623483657837, "step": 923}
{"train_info/time_between_train_steps": 0.0061800479888916016, "step": 923}
{"info/global_step": 924, "train_info/time_within_train_step": 13.927285194396973, "step": 924}
{"train_info/time_between_train_steps": 0.005795478820800781, "step": 924}
{"info/global_step": 925, "train_info/time_within_train_step": 13.866519212722778, "step": 925}
{"train_info/time_between_train_steps": 0.006752967834472656, "step": 925}
{"train_info/time_between_train_steps": 7.520948886871338, "step": 925}
{"info/global_step": 926, "train_info/time_within_train_step": 13.794725894927979, "step": 926}
{"train_info/time_between_train_steps": 0.005576133728027344, "step": 926}
{"info/global_step": 927, "train_info/time_within_train_step": 13.935219287872314, "step": 927}
{"train_info/time_between_train_steps": 0.004989147186279297, "step": 927}
{"info/global_step": 928, "train_info/time_within_train_step": 13.812637567520142, "step": 928}
{"train_info/time_between_train_steps": 0.005419731140136719, "step": 928}
{"info/global_step": 929, "train_info/time_within_train_step": 13.948626041412354, "step": 929}
{"train_info/time_between_train_steps": 0.005681514739990234, "step": 929}
{"info/global_step": 930, "train_info/time_within_train_step": 13.815678596496582, "step": 930}
{"train_info/time_between_train_steps": 0.0051000118255615234, "step": 930}
{"info/global_step": 931, "train_info/time_within_train_step": 13.838816165924072, "step": 931}
{"train_info/time_between_train_steps": 0.004653453826904297, "step": 931}
{"info/global_step": 932, "train_info/time_within_train_step": 13.805360555648804, "step": 932}
{"train_info/time_between_train_steps": 0.004715442657470703, "step": 932}
{"info/global_step": 933, "train_info/time_within_train_step": 13.87004566192627, "step": 933}
{"train_info/time_between_train_steps": 0.005362272262573242, "step": 933}
{"info/global_step": 934, "train_info/time_within_train_step": 13.821995496749878, "step": 934}
{"train_info/time_between_train_steps": 0.005644083023071289, "step": 934}
{"info/global_step": 935, "train_info/time_within_train_step": 13.830028772354126, "step": 935}
{"train_info/time_between_train_steps": 0.0047681331634521484, "step": 935}
{"info/global_step": 936, "train_info/time_within_train_step": 13.812171220779419, "step": 936}
{"train_info/time_between_train_steps": 0.004838705062866211, "step": 936}
{"info/global_step": 937, "train_info/time_within_train_step": 13.81339979171753, "step": 937}
{"train_info/time_between_train_steps": 0.005020618438720703, "step": 937}
{"info/global_step": 938, "train_info/time_within_train_step": 13.867305517196655, "step": 938}
{"train_info/time_between_train_steps": 0.00592803955078125, "step": 938}
{"info/global_step": 939, "train_info/time_within_train_step": 13.81628942489624, "step": 939}
{"train_info/time_between_train_steps": 0.005171775817871094, "step": 939}
{"info/global_step": 940, "train_info/time_within_train_step": 13.907061338424683, "step": 940}
{"train_info/time_between_train_steps": 0.005655765533447266, "step": 940}
{"info/global_step": 941, "train_info/time_within_train_step": 13.818006753921509, "step": 941}
{"train_info/time_between_train_steps": 0.005105257034301758, "step": 941}
{"info/global_step": 942, "train_info/time_within_train_step": 13.810301542282104, "step": 942}
{"train_info/time_between_train_steps": 0.004998207092285156, "step": 942}
{"info/global_step": 943, "train_info/time_within_train_step": 13.818198680877686, "step": 943}
{"train_info/time_between_train_steps": 0.005654096603393555, "step": 943}
{"info/global_step": 944, "train_info/time_within_train_step": 13.81851077079773, "step": 944}
{"train_info/time_between_train_steps": 0.0050776004791259766, "step": 944}
{"info/global_step": 945, "train_info/time_within_train_step": 13.837036609649658, "step": 945}
{"train_info/time_between_train_steps": 0.0055201053619384766, "step": 945}
{"info/global_step": 946, "train_info/time_within_train_step": 13.898442268371582, "step": 946}
{"train_info/time_between_train_steps": 0.005628108978271484, "step": 946}
{"info/global_step": 947, "train_info/time_within_train_step": 13.8394935131073, "step": 947}
{"train_info/time_between_train_steps": 0.0060846805572509766, "step": 947}
{"info/global_step": 948, "train_info/time_within_train_step": 13.83030366897583, "step": 948}
{"train_info/time_between_train_steps": 0.0052337646484375, "step": 948}
{"info/global_step": 949, "train_info/time_within_train_step": 13.832980155944824, "step": 949}
{"train_info/time_between_train_steps": 0.0061147212982177734, "step": 949}
{"info/global_step": 950, "train_info/time_within_train_step": 13.871710538864136, "step": 950}
{"train_info": {"train_info/memory_allocated": 1920.9462890625, "train_info/memory_max_allocated": 20711.3779296875, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1737111322, "_runtime": 14221}, "step": 950}
{"logs": {"train/loss": 4.0675, "train/learning_rate": 0.0001388888888888889, "train/epoch": 37.02, "_timestamp": 1737111322, "_runtime": 14221}, "step": 950}
{"train_info/time_between_train_steps": 0.05666327476501465, "step": 950}
{"train_info/time_between_train_steps": 7.65772819519043, "step": 950}
{"info/global_step": 951, "train_info/time_within_train_step": 13.796342372894287, "step": 951}
{"train_info/time_between_train_steps": 0.005588531494140625, "step": 951}
{"info/global_step": 952, "train_info/time_within_train_step": 13.885960817337036, "step": 952}
{"train_info/time_between_train_steps": 0.005322694778442383, "step": 952}
{"info/global_step": 953, "train_info/time_within_train_step": 13.826222896575928, "step": 953}
{"train_info/time_between_train_steps": 0.004983425140380859, "step": 953}
{"info/global_step": 954, "train_info/time_within_train_step": 13.997619867324829, "step": 954}
{"train_info/time_between_train_steps": 0.00513911247253418, "step": 954}
{"info/global_step": 955, "train_info/time_within_train_step": 13.938053131103516, "step": 955}
{"train_info/time_between_train_steps": 0.006089925765991211, "step": 955}
{"info/global_step": 956, "train_info/time_within_train_step": 13.85707688331604, "step": 956}
{"train_info/time_between_train_steps": 0.004980564117431641, "step": 956}
{"info/global_step": 957, "train_info/time_within_train_step": 13.838844299316406, "step": 957}
{"train_info/time_between_train_steps": 0.00487518310546875, "step": 957}
{"info/global_step": 958, "train_info/time_within_train_step": 13.8427152633667, "step": 958}
{"train_info/time_between_train_steps": 0.004938602447509766, "step": 958}
{"info/global_step": 959, "train_info/time_within_train_step": 13.868784189224243, "step": 959}
{"train_info/time_between_train_steps": 0.0052106380462646484, "step": 959}
{"info/global_step": 960, "train_info/time_within_train_step": 13.844900369644165, "step": 960}
{"train_info/time_between_train_steps": 0.005064487457275391, "step": 960}
{"info/global_step": 961, "train_info/time_within_train_step": 13.838993310928345, "step": 961}
{"train_info/time_between_train_steps": 0.0056304931640625, "step": 961}
{"info/global_step": 962, "train_info/time_within_train_step": 13.847862482070923, "step": 962}
{"train_info/time_between_train_steps": 0.005046367645263672, "step": 962}
{"info/global_step": 963, "train_info/time_within_train_step": 13.850334167480469, "step": 963}
{"train_info/time_between_train_steps": 0.005170583724975586, "step": 963}
{"info/global_step": 964, "train_info/time_within_train_step": 13.851819276809692, "step": 964}
{"train_info/time_between_train_steps": 0.00553441047668457, "step": 964}
{"info/global_step": 965, "train_info/time_within_train_step": 13.865749835968018, "step": 965}
{"train_info/time_between_train_steps": 0.00567936897277832, "step": 965}
{"info/global_step": 966, "train_info/time_within_train_step": 13.845290660858154, "step": 966}
{"train_info/time_between_train_steps": 0.005216121673583984, "step": 966}
{"info/global_step": 967, "train_info/time_within_train_step": 13.878547668457031, "step": 967}
{"train_info/time_between_train_steps": 0.005259990692138672, "step": 967}
{"info/global_step": 968, "train_info/time_within_train_step": 13.847199201583862, "step": 968}
{"train_info/time_between_train_steps": 0.005551338195800781, "step": 968}
{"info/global_step": 969, "train_info/time_within_train_step": 13.852099657058716, "step": 969}
{"train_info/time_between_train_steps": 0.005321025848388672, "step": 969}
{"info/global_step": 970, "train_info/time_within_train_step": 13.847168207168579, "step": 970}
{"train_info/time_between_train_steps": 0.005846500396728516, "step": 970}
{"info/global_step": 971, "train_info/time_within_train_step": 13.95880913734436, "step": 971}
{"train_info/time_between_train_steps": 0.00572967529296875, "step": 971}
{"info/global_step": 972, "train_info/time_within_train_step": 13.888063669204712, "step": 972}
{"train_info/time_between_train_steps": 0.005865573883056641, "step": 972}
{"info/global_step": 973, "train_info/time_within_train_step": 13.857033729553223, "step": 973}
{"train_info/time_between_train_steps": 0.005278825759887695, "step": 973}
{"info/global_step": 974, "train_info/time_within_train_step": 13.866209506988525, "step": 974}
{"train_info/time_between_train_steps": 0.00599980354309082, "step": 974}
{"info/global_step": 975, "train_info/time_within_train_step": 13.902409315109253, "step": 975}
{"train_info/time_between_train_steps": 0.006567716598510742, "step": 975}
{"train_info/time_between_train_steps": 8.67470097541809, "step": 975}
{"info/global_step": 976, "train_info/time_within_train_step": 13.822529554367065, "step": 976}
{"train_info/time_between_train_steps": 0.0046694278717041016, "step": 976}
{"info/global_step": 977, "train_info/time_within_train_step": 13.91978645324707, "step": 977}
{"train_info/time_between_train_steps": 0.0049571990966796875, "step": 977}
{"info/global_step": 978, "train_info/time_within_train_step": 13.829339742660522, "step": 978}
{"train_info/time_between_train_steps": 0.00545954704284668, "step": 978}
{"info/global_step": 979, "train_info/time_within_train_step": 13.928364992141724, "step": 979}
{"train_info/time_between_train_steps": 0.004748344421386719, "step": 979}
{"info/global_step": 980, "train_info/time_within_train_step": 13.846518278121948, "step": 980}
{"train_info/time_between_train_steps": 0.005564212799072266, "step": 980}
{"info/global_step": 981, "train_info/time_within_train_step": 13.878079891204834, "step": 981}
{"train_info/time_between_train_steps": 0.0050487518310546875, "step": 981}
{"info/global_step": 982, "train_info/time_within_train_step": 13.838788747787476, "step": 982}
{"train_info/time_between_train_steps": 0.005661725997924805, "step": 982}
{"info/global_step": 983, "train_info/time_within_train_step": 13.842808485031128, "step": 983}
{"train_info/time_between_train_steps": 0.005166769027709961, "step": 983}
{"info/global_step": 984, "train_info/time_within_train_step": 13.850384712219238, "step": 984}
{"train_info/time_between_train_steps": 0.004837751388549805, "step": 984}
{"info/global_step": 985, "train_info/time_within_train_step": 13.84498119354248, "step": 985}
{"train_info/time_between_train_steps": 0.004723310470581055, "step": 985}
{"info/global_step": 986, "train_info/time_within_train_step": 13.93109130859375, "step": 986}
{"train_info/time_between_train_steps": 0.005807638168334961, "step": 986}
{"info/global_step": 987, "train_info/time_within_train_step": 13.839256286621094, "step": 987}
{"train_info/time_between_train_steps": 0.004976034164428711, "step": 987}
{"info/global_step": 988, "train_info/time_within_train_step": 13.842406034469604, "step": 988}
{"train_info/time_between_train_steps": 0.004743814468383789, "step": 988}
{"info/global_step": 989, "train_info/time_within_train_step": 13.850510597229004, "step": 989}
{"train_info/time_between_train_steps": 0.004991292953491211, "step": 989}
{"info/global_step": 990, "train_info/time_within_train_step": 13.853273868560791, "step": 990}
{"train_info/time_between_train_steps": 0.004831790924072266, "step": 990}
{"info/global_step": 991, "train_info/time_within_train_step": 13.861617088317871, "step": 991}
{"train_info/time_between_train_steps": 0.005183696746826172, "step": 991}
{"info/global_step": 992, "train_info/time_within_train_step": 14.652884006500244, "step": 992}
{"train_info/time_between_train_steps": 0.005835294723510742, "step": 992}
{"info/global_step": 993, "train_info/time_within_train_step": 13.856033086776733, "step": 993}
{"train_info/time_between_train_steps": 0.00537562370300293, "step": 993}
{"info/global_step": 994, "train_info/time_within_train_step": 13.86200761795044, "step": 994}
{"train_info/time_between_train_steps": 0.00508880615234375, "step": 994}
{"info/global_step": 995, "train_info/time_within_train_step": 13.869421005249023, "step": 995}
{"train_info/time_between_train_steps": 0.005252361297607422, "step": 995}
{"info/global_step": 996, "train_info/time_within_train_step": 13.908177852630615, "step": 996}
{"train_info/time_between_train_steps": 0.00563502311706543, "step": 996}
{"info/global_step": 997, "train_info/time_within_train_step": 13.870596885681152, "step": 997}
{"train_info/time_between_train_steps": 0.00605463981628418, "step": 997}
{"info/global_step": 998, "train_info/time_within_train_step": 13.862440586090088, "step": 998}
{"train_info/time_between_train_steps": 0.005280256271362305, "step": 998}
{"info/global_step": 999, "train_info/time_within_train_step": 13.876117944717407, "step": 999}
{"train_info/time_between_train_steps": 0.005400180816650391, "step": 999}
{"info/global_step": 1000, "train_info/time_within_train_step": 13.919430494308472, "step": 1000}
{"train_info": {"train_info/memory_allocated": 1920.9462890625, "train_info/memory_max_allocated": 20711.3779296875, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1737112045, "_runtime": 14944}, "step": 1000}
{"logs": {"train/loss": 3.9999, "train/learning_rate": 0.00011111111111111109, "train/epoch": 39.02, "_timestamp": 1737112045, "_runtime": 14944}, "step": 1000}
{"train_info": {"train_info/memory_allocated": 1920.9462890625, "train_info/memory_max_allocated": 20711.3779296875, "train_info/memory_reserved": 27336.0, "train_info/memory_max_reserved": 27336.0, "_timestamp": 1737112046, "_runtime": 14945}, "step": 1000}
{"logs": {"eval/loss": 5.124108791351318, "eval/runtime": 1.1643, "eval/samples_per_second": 81.596, "eval/steps_per_second": 5.153, "train/epoch": 39.02, "_timestamp": 1737112046, "_runtime": 14945}, "step": 1000}
{"train_info": {"train_info/memory_allocated": 1920.9462890625, "train_info/memory_max_allocated": 20711.3779296875, "train_info/memory_reserved": 27336.0, "train_info/memory_max_reserved": 27336.0, "_timestamp": 1737112046, "_runtime": 14945}, "step": 1000}
{"logs": {"eval//scratch/ykyao/projects/multilingual-LM/training/multilingual_dataset.py_loss": 5.124108791351318, "eval//scratch/ykyao/projects/multilingual-LM/training/multilingual_dataset.py_ppl": 168.02433016888105, "eval//scratch/ykyao/projects/multilingual-LM/training/multilingual_dataset.py_runtime": 1.1643, "eval//scratch/ykyao/projects/multilingual-LM/training/multilingual_dataset.py_samples_per_second": 81.596, "train/epoch": 39.02, "_timestamp": 1737112046, "_runtime": 14945}, "step": 1000}
{"train_info/time_between_train_steps": 37.44820046424866, "step": 1000}
{"train_info/time_between_train_steps": 44.83979249000549, "step": 1000}
{"info/global_step": 1001, "train_info/time_within_train_step": 13.90357232093811, "step": 1001}
{"train_info/time_between_train_steps": 0.006176948547363281, "step": 1001}
{"info/global_step": 1002, "train_info/time_within_train_step": 13.959335088729858, "step": 1002}
{"train_info/time_between_train_steps": 0.005911827087402344, "step": 1002}
{"info/global_step": 1003, "train_info/time_within_train_step": 13.843264102935791, "step": 1003}
{"train_info/time_between_train_steps": 0.0057468414306640625, "step": 1003}
{"info/global_step": 1004, "train_info/time_within_train_step": 13.941983938217163, "step": 1004}
{"train_info/time_between_train_steps": 0.00607752799987793, "step": 1004}
{"info/global_step": 1005, "train_info/time_within_train_step": 13.848253965377808, "step": 1005}
{"train_info/time_between_train_steps": 0.00589299201965332, "step": 1005}
{"info/global_step": 1006, "train_info/time_within_train_step": 13.869240045547485, "step": 1006}
{"train_info/time_between_train_steps": 0.005708932876586914, "step": 1006}
{"info/global_step": 1007, "train_info/time_within_train_step": 13.851687669754028, "step": 1007}
{"train_info/time_between_train_steps": 0.005162954330444336, "step": 1007}
{"info/global_step": 1008, "train_info/time_within_train_step": 13.855657815933228, "step": 1008}
{"train_info/time_between_train_steps": 0.005906105041503906, "step": 1008}
{"info/global_step": 1009, "train_info/time_within_train_step": 13.858686923980713, "step": 1009}
{"train_info/time_between_train_steps": 0.0054280757904052734, "step": 1009}
{"info/global_step": 1010, "train_info/time_within_train_step": 13.856935739517212, "step": 1010}
{"train_info/time_between_train_steps": 0.004788875579833984, "step": 1010}
{"info/global_step": 1011, "train_info/time_within_train_step": 13.852896451950073, "step": 1011}
{"train_info/time_between_train_steps": 0.0055389404296875, "step": 1011}
{"info/global_step": 1012, "train_info/time_within_train_step": 13.860505819320679, "step": 1012}
{"train_info/time_between_train_steps": 0.005821943283081055, "step": 1012}
{"info/global_step": 1013, "train_info/time_within_train_step": 13.860134840011597, "step": 1013}
{"train_info/time_between_train_steps": 0.005985260009765625, "step": 1013}
{"info/global_step": 1014, "train_info/time_within_train_step": 13.872499465942383, "step": 1014}
{"train_info/time_between_train_steps": 0.005792140960693359, "step": 1014}
{"info/global_step": 1015, "train_info/time_within_train_step": 13.865755319595337, "step": 1015}
{"train_info/time_between_train_steps": 0.005295276641845703, "step": 1015}
{"info/global_step": 1016, "train_info/time_within_train_step": 13.838064193725586, "step": 1016}
{"train_info/time_between_train_steps": 0.004609346389770508, "step": 1016}
{"info/global_step": 1017, "train_info/time_within_train_step": 13.908819675445557, "step": 1017}
{"train_info/time_between_train_steps": 0.005877256393432617, "step": 1017}
{"info/global_step": 1018, "train_info/time_within_train_step": 13.851243019104004, "step": 1018}
{"train_info/time_between_train_steps": 0.005875825881958008, "step": 1018}
{"info/global_step": 1019, "train_info/time_within_train_step": 13.83786654472351, "step": 1019}
{"train_info/time_between_train_steps": 0.005650758743286133, "step": 1019}
{"info/global_step": 1020, "train_info/time_within_train_step": 13.838970184326172, "step": 1020}
{"train_info/time_between_train_steps": 0.005626201629638672, "step": 1020}
{"info/global_step": 1021, "train_info/time_within_train_step": 13.834532976150513, "step": 1021}
{"train_info/time_between_train_steps": 0.005146980285644531, "step": 1021}
{"info/global_step": 1022, "train_info/time_within_train_step": 13.836454153060913, "step": 1022}
{"train_info/time_between_train_steps": 0.0054168701171875, "step": 1022}
{"info/global_step": 1023, "train_info/time_within_train_step": 13.877905130386353, "step": 1023}
{"train_info/time_between_train_steps": 0.0061855316162109375, "step": 1023}
{"info/global_step": 1024, "train_info/time_within_train_step": 13.845466375350952, "step": 1024}
{"train_info/time_between_train_steps": 0.005514621734619141, "step": 1024}
{"info/global_step": 1025, "train_info/time_within_train_step": 13.867826461791992, "step": 1025}
{"train_info/time_between_train_steps": 0.006124258041381836, "step": 1025}
{"train_info/time_between_train_steps": 7.608850717544556, "step": 1025}
{"info/global_step": 1026, "train_info/time_within_train_step": 13.786092758178711, "step": 1026}
{"train_info/time_between_train_steps": 0.00575709342956543, "step": 1026}
{"info/global_step": 1027, "train_info/time_within_train_step": 13.921666383743286, "step": 1027}
{"train_info/time_between_train_steps": 0.005137920379638672, "step": 1027}
{"info/global_step": 1028, "train_info/time_within_train_step": 13.810948133468628, "step": 1028}
{"train_info/time_between_train_steps": 0.005196571350097656, "step": 1028}
{"info/global_step": 1029, "train_info/time_within_train_step": 13.9183931350708, "step": 1029}
{"train_info/time_between_train_steps": 0.006231069564819336, "step": 1029}
{"info/global_step": 1030, "train_info/time_within_train_step": 13.817835330963135, "step": 1030}
{"train_info/time_between_train_steps": 0.0051937103271484375, "step": 1030}
{"info/global_step": 1031, "train_info/time_within_train_step": 13.825935363769531, "step": 1031}
{"train_info/time_between_train_steps": 0.005046844482421875, "step": 1031}
{"info/global_step": 1032, "train_info/time_within_train_step": 13.887964248657227, "step": 1032}
{"train_info/time_between_train_steps": 0.005249738693237305, "step": 1032}
{"info/global_step": 1033, "train_info/time_within_train_step": 13.807616949081421, "step": 1033}
{"train_info/time_between_train_steps": 0.0048465728759765625, "step": 1033}
{"info/global_step": 1034, "train_info/time_within_train_step": 13.811566352844238, "step": 1034}
{"train_info/time_between_train_steps": 0.005925178527832031, "step": 1034}
{"info/global_step": 1035, "train_info/time_within_train_step": 13.814383268356323, "step": 1035}
{"train_info/time_between_train_steps": 0.0053789615631103516, "step": 1035}
{"info/global_step": 1036, "train_info/time_within_train_step": 13.859607458114624, "step": 1036}
{"train_info/time_between_train_steps": 0.005380153656005859, "step": 1036}
{"info/global_step": 1037, "train_info/time_within_train_step": 13.81949496269226, "step": 1037}
{"train_info/time_between_train_steps": 0.005239725112915039, "step": 1037}
{"info/global_step": 1038, "train_info/time_within_train_step": 13.813456773757935, "step": 1038}
{"train_info/time_between_train_steps": 0.00529026985168457, "step": 1038}
{"info/global_step": 1039, "train_info/time_within_train_step": 13.814117431640625, "step": 1039}
{"train_info/time_between_train_steps": 0.0052089691162109375, "step": 1039}
{"info/global_step": 1040, "train_info/time_within_train_step": 13.83229112625122, "step": 1040}
{"train_info/time_between_train_steps": 0.005303382873535156, "step": 1040}
{"info/global_step": 1041, "train_info/time_within_train_step": 13.817203044891357, "step": 1041}
{"train_info/time_between_train_steps": 0.005346059799194336, "step": 1041}
{"info/global_step": 1042, "train_info/time_within_train_step": 13.816210269927979, "step": 1042}
{"train_info/time_between_train_steps": 0.0056362152099609375, "step": 1042}
{"info/global_step": 1043, "train_info/time_within_train_step": 13.814774990081787, "step": 1043}
{"train_info/time_between_train_steps": 0.005406618118286133, "step": 1043}
{"info/global_step": 1044, "train_info/time_within_train_step": 13.843745946884155, "step": 1044}
{"train_info/time_between_train_steps": 0.004991054534912109, "step": 1044}
{"info/global_step": 1045, "train_info/time_within_train_step": 13.823052644729614, "step": 1045}
{"train_info/time_between_train_steps": 0.0058743953704833984, "step": 1045}
{"info/global_step": 1046, "train_info/time_within_train_step": 13.812730550765991, "step": 1046}
{"train_info/time_between_train_steps": 0.0057370662689208984, "step": 1046}
{"info/global_step": 1047, "train_info/time_within_train_step": 13.816386222839355, "step": 1047}
{"train_info/time_between_train_steps": 0.0055544376373291016, "step": 1047}
{"info/global_step": 1048, "train_info/time_within_train_step": 13.900246858596802, "step": 1048}
{"train_info/time_between_train_steps": 0.005279541015625, "step": 1048}
{"info/global_step": 1049, "train_info/time_within_train_step": 13.83388614654541, "step": 1049}
{"train_info/time_between_train_steps": 0.005547046661376953, "step": 1049}
{"info/global_step": 1050, "train_info/time_within_train_step": 13.864168643951416, "step": 1050}
{"train_info": {"train_info/memory_allocated": 1920.9462890625, "train_info/memory_max_allocated": 20711.3779296875, "train_info/memory_reserved": 27336.0, "train_info/memory_max_reserved": 27336.0, "_timestamp": 1737112792, "_runtime": 15691}, "step": 1050}
{"logs": {"train/loss": 3.9418, "train/learning_rate": 8.333333333333333e-05, "train/epoch": 41.02, "_timestamp": 1737112792, "_runtime": 15691}, "step": 1050}
{"train_info/time_between_train_steps": 0.06021404266357422, "step": 1050}
{"train_info/time_between_train_steps": 7.757790803909302, "step": 1050}
{"info/global_step": 1051, "train_info/time_within_train_step": 13.8094642162323, "step": 1051}
{"train_info/time_between_train_steps": 0.00463414192199707, "step": 1051}
{"info/global_step": 1052, "train_info/time_within_train_step": 13.951482772827148, "step": 1052}
{"train_info/time_between_train_steps": 0.004868507385253906, "step": 1052}
{"info/global_step": 1053, "train_info/time_within_train_step": 13.818205118179321, "step": 1053}
{"train_info/time_between_train_steps": 0.005027294158935547, "step": 1053}
{"info/global_step": 1054, "train_info/time_within_train_step": 13.928635358810425, "step": 1054}
{"train_info/time_between_train_steps": 0.00524139404296875, "step": 1054}
{"info/global_step": 1055, "train_info/time_within_train_step": 13.83581018447876, "step": 1055}
{"train_info/time_between_train_steps": 0.005282878875732422, "step": 1055}
{"info/global_step": 1056, "train_info/time_within_train_step": 13.880407094955444, "step": 1056}
{"train_info/time_between_train_steps": 0.005826711654663086, "step": 1056}
{"info/global_step": 1057, "train_info/time_within_train_step": 13.840954303741455, "step": 1057}
{"train_info/time_between_train_steps": 0.005385398864746094, "step": 1057}
{"info/global_step": 1058, "train_info/time_within_train_step": 13.828596830368042, "step": 1058}
{"train_info/time_between_train_steps": 0.004941463470458984, "step": 1058}
{"info/global_step": 1059, "train_info/time_within_train_step": 13.827876567840576, "step": 1059}
{"train_info/time_between_train_steps": 0.004793643951416016, "step": 1059}
{"info/global_step": 1060, "train_info/time_within_train_step": 13.828123807907104, "step": 1060}
{"train_info/time_between_train_steps": 0.0052340030670166016, "step": 1060}
{"info/global_step": 1061, "train_info/time_within_train_step": 13.850249528884888, "step": 1061}
{"train_info/time_between_train_steps": 0.005526304244995117, "step": 1061}
{"info/global_step": 1062, "train_info/time_within_train_step": 13.833320140838623, "step": 1062}
{"train_info/time_between_train_steps": 0.0054781436920166016, "step": 1062}
{"info/global_step": 1063, "train_info/time_within_train_step": 13.901684284210205, "step": 1063}
{"train_info/time_between_train_steps": 0.005078554153442383, "step": 1063}
{"info/global_step": 1064, "train_info/time_within_train_step": 13.824178218841553, "step": 1064}
{"train_info/time_between_train_steps": 0.005624532699584961, "step": 1064}
{"info/global_step": 1065, "train_info/time_within_train_step": 13.83182978630066, "step": 1065}
{"train_info/time_between_train_steps": 0.00550079345703125, "step": 1065}
{"info/global_step": 1066, "train_info/time_within_train_step": 13.835984706878662, "step": 1066}
{"train_info/time_between_train_steps": 0.005510091781616211, "step": 1066}
{"info/global_step": 1067, "train_info/time_within_train_step": 13.832470417022705, "step": 1067}
{"train_info/time_between_train_steps": 0.005548238754272461, "step": 1067}
{"info/global_step": 1068, "train_info/time_within_train_step": 13.83320927619934, "step": 1068}
{"train_info/time_between_train_steps": 0.005282878875732422, "step": 1068}
{"info/global_step": 1069, "train_info/time_within_train_step": 13.84837532043457, "step": 1069}
{"train_info/time_between_train_steps": 0.005334615707397461, "step": 1069}
{"info/global_step": 1070, "train_info/time_within_train_step": 13.831306219100952, "step": 1070}
{"train_info/time_between_train_steps": 0.00556182861328125, "step": 1070}
{"info/global_step": 1071, "train_info/time_within_train_step": 13.833512544631958, "step": 1071}
{"train_info/time_between_train_steps": 0.005964756011962891, "step": 1071}
{"info/global_step": 1072, "train_info/time_within_train_step": 13.846773386001587, "step": 1072}
{"train_info/time_between_train_steps": 0.0054590702056884766, "step": 1072}
{"info/global_step": 1073, "train_info/time_within_train_step": 13.844206809997559, "step": 1073}
{"train_info/time_between_train_steps": 0.0060482025146484375, "step": 1073}
{"info/global_step": 1074, "train_info/time_within_train_step": 14.229830503463745, "step": 1074}
{"train_info/time_between_train_steps": 0.005886554718017578, "step": 1074}
{"info/global_step": 1075, "train_info/time_within_train_step": 13.862586736679077, "step": 1075}
{"train_info/time_between_train_steps": 0.006541728973388672, "step": 1075}
{"train_info/time_between_train_steps": 7.549163103103638, "step": 1075}
{"info/global_step": 1076, "train_info/time_within_train_step": 13.82235860824585, "step": 1076}
{"train_info/time_between_train_steps": 0.004816293716430664, "step": 1076}
{"info/global_step": 1077, "train_info/time_within_train_step": 13.908960580825806, "step": 1077}
{"train_info/time_between_train_steps": 0.005079984664916992, "step": 1077}
{"info/global_step": 1078, "train_info/time_within_train_step": 13.907752990722656, "step": 1078}
{"train_info/time_between_train_steps": 0.0045452117919921875, "step": 1078}
{"info/global_step": 1079, "train_info/time_within_train_step": 13.907451629638672, "step": 1079}
{"train_info/time_between_train_steps": 0.005364894866943359, "step": 1079}
{"info/global_step": 1080, "train_info/time_within_train_step": 13.857920408248901, "step": 1080}
{"train_info/time_between_train_steps": 0.0053310394287109375, "step": 1080}
{"info/global_step": 1081, "train_info/time_within_train_step": 13.84820556640625, "step": 1081}
{"train_info/time_between_train_steps": 0.0050890445709228516, "step": 1081}
{"info/global_step": 1082, "train_info/time_within_train_step": 13.887179136276245, "step": 1082}
{"train_info/time_between_train_steps": 0.005257606506347656, "step": 1082}
{"info/global_step": 1083, "train_info/time_within_train_step": 13.917775869369507, "step": 1083}
{"train_info/time_between_train_steps": 0.005220651626586914, "step": 1083}
{"info/global_step": 1084, "train_info/time_within_train_step": 13.814690113067627, "step": 1084}
{"train_info/time_between_train_steps": 0.004847049713134766, "step": 1084}
{"info/global_step": 1085, "train_info/time_within_train_step": 13.810789108276367, "step": 1085}
{"train_info/time_between_train_steps": 0.005059003829956055, "step": 1085}
{"info/global_step": 1086, "train_info/time_within_train_step": 13.841569423675537, "step": 1086}
{"train_info/time_between_train_steps": 0.0049626827239990234, "step": 1086}
{"info/global_step": 1087, "train_info/time_within_train_step": 14.384073972702026, "step": 1087}
{"train_info/time_between_train_steps": 0.005193471908569336, "step": 1087}
{"info/global_step": 1088, "train_info/time_within_train_step": 13.847089767456055, "step": 1088}
{"train_info/time_between_train_steps": 0.004755973815917969, "step": 1088}
{"info/global_step": 1089, "train_info/time_within_train_step": 13.8438401222229, "step": 1089}
{"train_info/time_between_train_steps": 0.0050203800201416016, "step": 1089}
{"info/global_step": 1090, "train_info/time_within_train_step": 14.370115518569946, "step": 1090}
{"train_info/time_between_train_steps": 0.004783153533935547, "step": 1090}
{"info/global_step": 1091, "train_info/time_within_train_step": 13.819963693618774, "step": 1091}
{"train_info/time_between_train_steps": 0.005378007888793945, "step": 1091}
{"info/global_step": 1092, "train_info/time_within_train_step": 13.845883131027222, "step": 1092}
{"train_info/time_between_train_steps": 0.0053539276123046875, "step": 1092}
{"info/global_step": 1093, "train_info/time_within_train_step": 13.842448472976685, "step": 1093}
{"train_info/time_between_train_steps": 0.004941701889038086, "step": 1093}
{"info/global_step": 1094, "train_info/time_within_train_step": 14.041597366333008, "step": 1094}
{"train_info/time_between_train_steps": 0.005379438400268555, "step": 1094}
{"info/global_step": 1095, "train_info/time_within_train_step": 14.816989183425903, "step": 1095}
{"train_info/time_between_train_steps": 0.004911184310913086, "step": 1095}
{"info/global_step": 1096, "train_info/time_within_train_step": 13.817445278167725, "step": 1096}
{"train_info/time_between_train_steps": 0.0060312747955322266, "step": 1096}
{"info/global_step": 1097, "train_info/time_within_train_step": 13.82118821144104, "step": 1097}
{"train_info/time_between_train_steps": 0.006753444671630859, "step": 1097}
{"info/global_step": 1098, "train_info/time_within_train_step": 13.830193042755127, "step": 1098}
{"train_info/time_between_train_steps": 0.005677223205566406, "step": 1098}
{"info/global_step": 1099, "train_info/time_within_train_step": 13.837961673736572, "step": 1099}
{"train_info/time_between_train_steps": 0.005811929702758789, "step": 1099}
{"info/global_step": 1100, "train_info/time_within_train_step": 13.845885753631592, "step": 1100}
{"train_info": {"train_info/memory_allocated": 1920.9462890625, "train_info/memory_max_allocated": 20711.3779296875, "train_info/memory_reserved": 27336.0, "train_info/memory_max_reserved": 27336.0, "_timestamp": 1737113507, "_runtime": 16406}, "step": 1100}
{"logs": {"train/loss": 3.8928, "train/learning_rate": 5.5555555555555545e-05, "train/epoch": 43.02, "_timestamp": 1737113507, "_runtime": 16406}, "step": 1100}
{"train_info/time_between_train_steps": 33.82193946838379, "step": 1100}
{"train_info/time_between_train_steps": 41.77558088302612, "step": 1100}
{"info/global_step": 1101, "train_info/time_within_train_step": 13.783228397369385, "step": 1101}
{"train_info/time_between_train_steps": 0.005613565444946289, "step": 1101}
{"info/global_step": 1102, "train_info/time_within_train_step": 13.913312196731567, "step": 1102}
{"train_info/time_between_train_steps": 0.005276679992675781, "step": 1102}
{"info/global_step": 1103, "train_info/time_within_train_step": 13.803561925888062, "step": 1103}
{"train_info/time_between_train_steps": 0.005756855010986328, "step": 1103}
{"info/global_step": 1104, "train_info/time_within_train_step": 13.912985563278198, "step": 1104}
{"train_info/time_between_train_steps": 0.0051043033599853516, "step": 1104}
{"info/global_step": 1105, "train_info/time_within_train_step": 13.817326545715332, "step": 1105}
{"train_info/time_between_train_steps": 0.005570173263549805, "step": 1105}
{"info/global_step": 1106, "train_info/time_within_train_step": 13.832926034927368, "step": 1106}
{"train_info/time_between_train_steps": 0.005352497100830078, "step": 1106}
{"info/global_step": 1107, "train_info/time_within_train_step": 13.814767360687256, "step": 1107}
{"train_info/time_between_train_steps": 0.005398988723754883, "step": 1107}
{"info/global_step": 1108, "train_info/time_within_train_step": 13.821690797805786, "step": 1108}
{"train_info/time_between_train_steps": 0.005574703216552734, "step": 1108}
{"info/global_step": 1109, "train_info/time_within_train_step": 13.953375577926636, "step": 1109}
{"train_info/time_between_train_steps": 0.0054798126220703125, "step": 1109}
{"info/global_step": 1110, "train_info/time_within_train_step": 13.827275514602661, "step": 1110}
{"train_info/time_between_train_steps": 0.006020784378051758, "step": 1110}
{"info/global_step": 1111, "train_info/time_within_train_step": 13.825150966644287, "step": 1111}
{"train_info/time_between_train_steps": 0.00571131706237793, "step": 1111}
{"info/global_step": 1112, "train_info/time_within_train_step": 13.828856706619263, "step": 1112}
{"train_info/time_between_train_steps": 0.004801511764526367, "step": 1112}
{"info/global_step": 1113, "train_info/time_within_train_step": 13.833378076553345, "step": 1113}
{"train_info/time_between_train_steps": 0.005347490310668945, "step": 1113}
{"info/global_step": 1114, "train_info/time_within_train_step": 13.831608533859253, "step": 1114}
{"train_info/time_between_train_steps": 0.005885601043701172, "step": 1114}
{"info/global_step": 1115, "train_info/time_within_train_step": 13.842086553573608, "step": 1115}
{"train_info/time_between_train_steps": 0.005278348922729492, "step": 1115}
{"info/global_step": 1116, "train_info/time_within_train_step": 13.825384378433228, "step": 1116}
{"train_info/time_between_train_steps": 0.005400419235229492, "step": 1116}
{"info/global_step": 1117, "train_info/time_within_train_step": 13.828956127166748, "step": 1117}
{"train_info/time_between_train_steps": 0.005217313766479492, "step": 1117}
{"info/global_step": 1118, "train_info/time_within_train_step": 13.859229803085327, "step": 1118}
{"train_info/time_between_train_steps": 0.006024599075317383, "step": 1118}
{"info/global_step": 1119, "train_info/time_within_train_step": 13.837886810302734, "step": 1119}
{"train_info/time_between_train_steps": 0.00554966926574707, "step": 1119}
{"info/global_step": 1120, "train_info/time_within_train_step": 13.834799528121948, "step": 1120}
{"train_info/time_between_train_steps": 0.00511932373046875, "step": 1120}
{"info/global_step": 1121, "train_info/time_within_train_step": 13.83415961265564, "step": 1121}
{"train_info/time_between_train_steps": 0.004881858825683594, "step": 1121}
{"info/global_step": 1122, "train_info/time_within_train_step": 13.883354187011719, "step": 1122}
{"train_info/time_between_train_steps": 0.005342960357666016, "step": 1122}
{"info/global_step": 1123, "train_info/time_within_train_step": 13.8502836227417, "step": 1123}
{"train_info/time_between_train_steps": 0.005577802658081055, "step": 1123}
{"info/global_step": 1124, "train_info/time_within_train_step": 13.849387407302856, "step": 1124}
{"train_info/time_between_train_steps": 0.005295753479003906, "step": 1124}
{"info/global_step": 1125, "train_info/time_within_train_step": 13.929635047912598, "step": 1125}
{"train_info/time_between_train_steps": 0.006330251693725586, "step": 1125}
{"train_info/time_between_train_steps": 7.700105667114258, "step": 1125}
{"info/global_step": 1126, "train_info/time_within_train_step": 13.819939851760864, "step": 1126}
{"train_info/time_between_train_steps": 0.00541234016418457, "step": 1126}
{"info/global_step": 1127, "train_info/time_within_train_step": 13.8859224319458, "step": 1127}
{"train_info/time_between_train_steps": 0.005476474761962891, "step": 1127}
{"info/global_step": 1128, "train_info/time_within_train_step": 13.825026273727417, "step": 1128}
{"train_info/time_between_train_steps": 0.005673885345458984, "step": 1128}
{"info/global_step": 1129, "train_info/time_within_train_step": 13.930504083633423, "step": 1129}
{"train_info/time_between_train_steps": 0.00593113899230957, "step": 1129}
{"info/global_step": 1130, "train_info/time_within_train_step": 13.819244146347046, "step": 1130}
{"train_info/time_between_train_steps": 0.005957603454589844, "step": 1130}
{"info/global_step": 1131, "train_info/time_within_train_step": 13.82380723953247, "step": 1131}
{"train_info/time_between_train_steps": 0.005106925964355469, "step": 1131}
{"info/global_step": 1132, "train_info/time_within_train_step": 13.804621696472168, "step": 1132}
{"train_info/time_between_train_steps": 0.0054168701171875, "step": 1132}
{"info/global_step": 1133, "train_info/time_within_train_step": 13.801166772842407, "step": 1133}
{"train_info/time_between_train_steps": 0.005030632019042969, "step": 1133}
{"info/global_step": 1134, "train_info/time_within_train_step": 13.849976301193237, "step": 1134}
{"train_info/time_between_train_steps": 0.00516057014465332, "step": 1134}
{"info/global_step": 1135, "train_info/time_within_train_step": 13.810960054397583, "step": 1135}
{"train_info/time_between_train_steps": 0.005014181137084961, "step": 1135}
{"info/global_step": 1136, "train_info/time_within_train_step": 13.812029123306274, "step": 1136}
{"train_info/time_between_train_steps": 0.0052721500396728516, "step": 1136}
{"info/global_step": 1137, "train_info/time_within_train_step": 13.811476230621338, "step": 1137}
{"train_info/time_between_train_steps": 0.004858255386352539, "step": 1137}
{"info/global_step": 1138, "train_info/time_within_train_step": 13.806917428970337, "step": 1138}
{"train_info/time_between_train_steps": 0.005627632141113281, "step": 1138}
{"info/global_step": 1139, "train_info/time_within_train_step": 13.814176321029663, "step": 1139}
{"train_info/time_between_train_steps": 0.00520777702331543, "step": 1139}
{"info/global_step": 1140, "train_info/time_within_train_step": 13.897301435470581, "step": 1140}
{"train_info/time_between_train_steps": 0.0054705142974853516, "step": 1140}
{"info/global_step": 1141, "train_info/time_within_train_step": 13.81807565689087, "step": 1141}
{"train_info/time_between_train_steps": 0.0048639774322509766, "step": 1141}
{"info/global_step": 1142, "train_info/time_within_train_step": 13.81335163116455, "step": 1142}
{"train_info/time_between_train_steps": 0.0054473876953125, "step": 1142}
{"info/global_step": 1143, "train_info/time_within_train_step": 13.84999942779541, "step": 1143}
{"train_info/time_between_train_steps": 0.005458354949951172, "step": 1143}
{"info/global_step": 1144, "train_info/time_within_train_step": 13.81586742401123, "step": 1144}
{"train_info/time_between_train_steps": 0.004981040954589844, "step": 1144}
{"info/global_step": 1145, "train_info/time_within_train_step": 13.818000555038452, "step": 1145}
{"train_info/time_between_train_steps": 0.005105733871459961, "step": 1145}
{"info/global_step": 1146, "train_info/time_within_train_step": 13.815128564834595, "step": 1146}
{"train_info/time_between_train_steps": 0.005491971969604492, "step": 1146}
{"info/global_step": 1147, "train_info/time_within_train_step": 13.90090274810791, "step": 1147}
{"train_info/time_between_train_steps": 0.00581669807434082, "step": 1147}
{"info/global_step": 1148, "train_info/time_within_train_step": 13.82390809059143, "step": 1148}
{"train_info/time_between_train_steps": 0.005493640899658203, "step": 1148}
{"info/global_step": 1149, "train_info/time_within_train_step": 13.8305344581604, "step": 1149}
{"train_info/time_between_train_steps": 0.005678892135620117, "step": 1149}
{"info/global_step": 1150, "train_info/time_within_train_step": 13.843819618225098, "step": 1150}
{"train_info": {"train_info/memory_allocated": 1920.9462890625, "train_info/memory_max_allocated": 20711.3779296875, "train_info/memory_reserved": 27336.0, "train_info/memory_max_reserved": 27336.0, "_timestamp": 1737114251, "_runtime": 17150}, "step": 1150}
{"logs": {"train/loss": 3.8551, "train/learning_rate": 2.7777777777777772e-05, "train/epoch": 45.02, "_timestamp": 1737114251, "_runtime": 17150}, "step": 1150}
{"train_info/time_between_train_steps": 0.0730736255645752, "step": 1150}
{"train_info/time_between_train_steps": 7.6021177768707275, "step": 1150}
{"info/global_step": 1151, "train_info/time_within_train_step": 13.830232381820679, "step": 1151}
{"train_info/time_between_train_steps": 0.005125522613525391, "step": 1151}
{"info/global_step": 1152, "train_info/time_within_train_step": 13.907338857650757, "step": 1152}
{"train_info/time_between_train_steps": 0.005150794982910156, "step": 1152}
{"info/global_step": 1153, "train_info/time_within_train_step": 13.816601514816284, "step": 1153}
{"train_info/time_between_train_steps": 0.004884243011474609, "step": 1153}
{"info/global_step": 1154, "train_info/time_within_train_step": 13.923804759979248, "step": 1154}
{"train_info/time_between_train_steps": 0.005033969879150391, "step": 1154}
{"info/global_step": 1155, "train_info/time_within_train_step": 13.9238440990448, "step": 1155}
{"train_info/time_between_train_steps": 0.005919456481933594, "step": 1155}
{"info/global_step": 1156, "train_info/time_within_train_step": 13.860073566436768, "step": 1156}
{"train_info/time_between_train_steps": 0.0058171749114990234, "step": 1156}
{"info/global_step": 1157, "train_info/time_within_train_step": 13.825851202011108, "step": 1157}
{"train_info/time_between_train_steps": 0.0056955814361572266, "step": 1157}
{"info/global_step": 1158, "train_info/time_within_train_step": 13.827823877334595, "step": 1158}
{"train_info/time_between_train_steps": 0.005667686462402344, "step": 1158}
{"info/global_step": 1159, "train_info/time_within_train_step": 13.832298040390015, "step": 1159}
{"train_info/time_between_train_steps": 0.005493879318237305, "step": 1159}
{"info/global_step": 1160, "train_info/time_within_train_step": 13.838470697402954, "step": 1160}
{"train_info/time_between_train_steps": 0.005660295486450195, "step": 1160}
{"info/global_step": 1161, "train_info/time_within_train_step": 13.840030431747437, "step": 1161}
{"train_info/time_between_train_steps": 0.005457162857055664, "step": 1161}
{"info/global_step": 1162, "train_info/time_within_train_step": 13.82918119430542, "step": 1162}
{"train_info/time_between_train_steps": 0.005177497863769531, "step": 1162}
{"info/global_step": 1163, "train_info/time_within_train_step": 13.828558444976807, "step": 1163}
{"train_info/time_between_train_steps": 0.004640340805053711, "step": 1163}
{"info/global_step": 1164, "train_info/time_within_train_step": 13.87245512008667, "step": 1164}
{"train_info/time_between_train_steps": 0.004838228225708008, "step": 1164}
{"info/global_step": 1165, "train_info/time_within_train_step": 13.85854983329773, "step": 1165}
{"train_info/time_between_train_steps": 0.005531787872314453, "step": 1165}
{"info/global_step": 1166, "train_info/time_within_train_step": 13.833770751953125, "step": 1166}
{"train_info/time_between_train_steps": 0.005684375762939453, "step": 1166}
{"info/global_step": 1167, "train_info/time_within_train_step": 13.831758260726929, "step": 1167}
{"train_info/time_between_train_steps": 0.005357980728149414, "step": 1167}
{"info/global_step": 1168, "train_info/time_within_train_step": 13.839640378952026, "step": 1168}
{"train_info/time_between_train_steps": 0.00543212890625, "step": 1168}
{"info/global_step": 1169, "train_info/time_within_train_step": 13.85015082359314, "step": 1169}
{"train_info/time_between_train_steps": 0.005766391754150391, "step": 1169}
{"info/global_step": 1170, "train_info/time_within_train_step": 13.839061975479126, "step": 1170}
{"train_info/time_between_train_steps": 0.0054187774658203125, "step": 1170}
{"info/global_step": 1171, "train_info/time_within_train_step": 13.91782808303833, "step": 1171}
{"train_info/time_between_train_steps": 0.0056209564208984375, "step": 1171}
{"info/global_step": 1172, "train_info/time_within_train_step": 16.448075771331787, "step": 1172}
{"train_info/time_between_train_steps": 0.005246877670288086, "step": 1172}
{"info/global_step": 1173, "train_info/time_within_train_step": 14.155355453491211, "step": 1173}
{"train_info/time_between_train_steps": 0.005220651626586914, "step": 1173}
{"info/global_step": 1174, "train_info/time_within_train_step": 13.81600570678711, "step": 1174}
{"train_info/time_between_train_steps": 0.0054280757904052734, "step": 1174}
{"info/global_step": 1175, "train_info/time_within_train_step": 13.82858943939209, "step": 1175}
{"train_info/time_between_train_steps": 0.0059583187103271484, "step": 1175}
{"train_info/time_between_train_steps": 9.934931993484497, "step": 1175}
{"info/global_step": 1176, "train_info/time_within_train_step": 14.043248414993286, "step": 1176}
{"train_info/time_between_train_steps": 0.0054225921630859375, "step": 1176}
{"info/global_step": 1177, "train_info/time_within_train_step": 13.893285036087036, "step": 1177}
{"train_info/time_between_train_steps": 0.005223274230957031, "step": 1177}
{"info/global_step": 1178, "train_info/time_within_train_step": 13.812951803207397, "step": 1178}
{"train_info/time_between_train_steps": 0.0048792362213134766, "step": 1178}
{"info/global_step": 1179, "train_info/time_within_train_step": 13.901018381118774, "step": 1179}
{"train_info/time_between_train_steps": 0.0055124759674072266, "step": 1179}
{"info/global_step": 1180, "train_info/time_within_train_step": 13.88951063156128, "step": 1180}
{"train_info/time_between_train_steps": 0.00501251220703125, "step": 1180}
{"info/global_step": 1181, "train_info/time_within_train_step": 13.864917755126953, "step": 1181}
{"train_info/time_between_train_steps": 0.005598783493041992, "step": 1181}
{"info/global_step": 1182, "train_info/time_within_train_step": 13.980719804763794, "step": 1182}
{"train_info/time_between_train_steps": 0.005082130432128906, "step": 1182}
{"info/global_step": 1183, "train_info/time_within_train_step": 13.806304454803467, "step": 1183}
{"train_info/time_between_train_steps": 0.004849910736083984, "step": 1183}
{"info/global_step": 1184, "train_info/time_within_train_step": 15.173990249633789, "step": 1184}
{"train_info/time_between_train_steps": 0.005100727081298828, "step": 1184}
{"info/global_step": 1185, "train_info/time_within_train_step": 13.826179027557373, "step": 1185}
{"train_info/time_between_train_steps": 0.005168914794921875, "step": 1185}
{"info/global_step": 1186, "train_info/time_within_train_step": 13.905714750289917, "step": 1186}
{"train_info/time_between_train_steps": 0.005507230758666992, "step": 1186}
{"info/global_step": 1187, "train_info/time_within_train_step": 13.81288743019104, "step": 1187}
{"train_info/time_between_train_steps": 0.004968166351318359, "step": 1187}
{"info/global_step": 1188, "train_info/time_within_train_step": 14.992391347885132, "step": 1188}
{"train_info/time_between_train_steps": 0.005231618881225586, "step": 1188}
{"info/global_step": 1189, "train_info/time_within_train_step": 13.939847707748413, "step": 1189}
{"train_info/time_between_train_steps": 0.014187335968017578, "step": 1189}
{"info/global_step": 1190, "train_info/time_within_train_step": 13.962283849716187, "step": 1190}
{"train_info/time_between_train_steps": 0.004809856414794922, "step": 1190}
{"info/global_step": 1191, "train_info/time_within_train_step": 13.795217037200928, "step": 1191}
{"train_info/time_between_train_steps": 0.004782676696777344, "step": 1191}
{"info/global_step": 1192, "train_info/time_within_train_step": 15.520581483840942, "step": 1192}
{"train_info/time_between_train_steps": 0.005270481109619141, "step": 1192}
{"info/global_step": 1193, "train_info/time_within_train_step": 13.815114259719849, "step": 1193}
{"train_info/time_between_train_steps": 0.005158662796020508, "step": 1193}
{"info/global_step": 1194, "train_info/time_within_train_step": 13.797888278961182, "step": 1194}
{"train_info/time_between_train_steps": 0.005029439926147461, "step": 1194}
{"info/global_step": 1195, "train_info/time_within_train_step": 13.821568250656128, "step": 1195}
{"train_info/time_between_train_steps": 0.004618167877197266, "step": 1195}
{"info/global_step": 1196, "train_info/time_within_train_step": 17.320624828338623, "step": 1196}
{"train_info/time_between_train_steps": 0.005149364471435547, "step": 1196}
{"info/global_step": 1197, "train_info/time_within_train_step": 13.818354368209839, "step": 1197}
{"train_info/time_between_train_steps": 0.0055425167083740234, "step": 1197}
{"info/global_step": 1198, "train_info/time_within_train_step": 13.83053183555603, "step": 1198}
{"train_info/time_between_train_steps": 0.004832267761230469, "step": 1198}
{"info/global_step": 1199, "train_info/time_within_train_step": 13.825464248657227, "step": 1199}
{"train_info/time_between_train_steps": 0.00597071647644043, "step": 1199}
{"info/global_step": 1200, "train_info/time_within_train_step": 17.705181121826172, "step": 1200}
{"train_info": {"train_info/memory_allocated": 1920.9462890625, "train_info/memory_max_allocated": 20711.3779296875, "train_info/memory_reserved": 27336.0, "train_info/memory_max_reserved": 27336.0, "_timestamp": 1737114997, "_runtime": 17896}, "step": 1200}
{"logs": {"train/loss": 3.8293, "train/learning_rate": 0.0, "train/epoch": 47.02, "_timestamp": 1737114997, "_runtime": 17896}, "step": 1200}
{"train_info": {"train_info/memory_allocated": 1920.9462890625, "train_info/memory_max_allocated": 20711.3779296875, "train_info/memory_reserved": 27336.0, "train_info/memory_max_reserved": 27336.0, "_timestamp": 1737115102, "_runtime": 18001}, "step": 1200}
{"logs": {"train/train_runtime": 18003.2426, "train/train_samples_per_second": 34.127, "train/train_steps_per_second": 0.067, "train/total_flos": 3.2574232461312e+17, "train/train_loss": 5.325879340966543, "train/epoch": 47.02, "_timestamp": 1737115102, "_runtime": 18001}, "step": 1200}
{"train_info": {"train_info/memory_allocated": 1920.9453125, "train_info/memory_max_allocated": 20711.3779296875, "train_info/memory_reserved": 27336.0, "train_info/memory_max_reserved": 27336.0, "_timestamp": 1737115132, "_runtime": 18031}, "step": 1200}
{"logs": {"eval/loss": 5.152990341186523, "eval/runtime": 1.0967, "eval/samples_per_second": 86.623, "eval/steps_per_second": 5.471, "train/epoch": 47.02, "_timestamp": 1737115132, "_runtime": 18031}, "step": 1200}
{"train_info": {"train_info/memory_allocated": 1920.9453125, "train_info/memory_max_allocated": 20711.3779296875, "train_info/memory_reserved": 27336.0, "train_info/memory_max_reserved": 27336.0, "_timestamp": 1737115132, "_runtime": 18031}, "step": 1200}
{"logs": {"eval//scratch/ykyao/projects/multilingual-LM/training/multilingual_dataset.py_loss": 5.152990341186523, "eval//scratch/ykyao/projects/multilingual-LM/training/multilingual_dataset.py_ppl": 172.9478910265473, "eval//scratch/ykyao/projects/multilingual-LM/training/multilingual_dataset.py_runtime": 1.0967, "eval//scratch/ykyao/projects/multilingual-LM/training/multilingual_dataset.py_samples_per_second": 86.623, "train/epoch": 47.02, "_timestamp": 1737115132, "_runtime": 18031}, "step": 1200}
|