07:03:45 args: {'variant': 'baseline', 'epochs': 30, 'bs': 512, 'lr': 0.001, 'lamb': 0.02, 'proj_dim': 128, 'num_workers': 12, 'grad_clip': 1.0, 'ckpt_every': 5, 'data_dir': '/vast/adi/tclejepa/v1', 'wandb': 1, 'push_hf': 1} 07:03:47 train=50000 val=10000 07:04:38 ep 0 | loss=5.3822 inv=0.2120 sig=29.3711 lejepa=0.7952 probe=4.5866 probe_acc=0.1468 gnorm=2.69 lr=5.05e-04 dt=46.4s 07:05:20 ep 1 | loss=4.8869 inv=0.2245 sig=17.0290 lejepa=0.5605 probe=4.3264 probe_acc=0.1488 gnorm=2.56 lr=1.00e-03 dt=42.4s 07:05:58 ep 2 | loss=4.7877 inv=0.2165 sig=15.8164 lejepa=0.5285 probe=4.2592 probe_acc=0.1592 gnorm=1.77 lr=9.97e-04 dt=38.4s 07:06:33 ep 3 | loss=4.6899 inv=0.2050 sig=13.3241 lejepa=0.4673 probe=4.2226 probe_acc=0.1664 gnorm=1.16 lr=9.88e-04 dt=34.3s 07:07:08 ep 4 | loss=4.6102 inv=0.2020 sig=11.4923 lejepa=0.4278 probe=4.1825 probe_acc=0.1676 gnorm=0.93 lr=9.72e-04 dt=35.3s 07:07:08 saved /vast/adi/tclejepa/v1/checkpoints/baseline/epoch_004.pt 07:07:47 ep 5 | loss=4.4992 inv=0.1931 sig=10.1894 lejepa=0.3930 probe=4.1062 probe_acc=0.1768 gnorm=0.78 lr=9.51e-04 dt=33.8s 07:08:22 ep 6 | loss=4.4170 inv=0.1820 sig=9.2039 lejepa=0.3624 probe=4.0545 probe_acc=0.1900 gnorm=0.72 lr=9.24e-04 dt=35.4s 07:08:57 ep 7 | loss=4.3600 inv=0.1777 sig=8.6211 lejepa=0.3465 probe=4.0135 probe_acc=0.1876 gnorm=0.63 lr=8.92e-04 dt=34.3s 07:09:32 ep 8 | loss=4.2948 inv=0.1725 sig=8.3151 lejepa=0.3354 probe=3.9594 probe_acc=0.1984 gnorm=0.55 lr=8.55e-04 dt=34.8s 07:10:07 ep 9 | loss=4.2467 inv=0.1678 sig=7.9800 lejepa=0.3241 probe=3.9227 probe_acc=0.1988 gnorm=0.59 lr=8.14e-04 dt=35.5s 07:10:07 saved /vast/adi/tclejepa/v1/checkpoints/baseline/epoch_009.pt 07:10:46 ep 10 | loss=4.1990 inv=0.1648 sig=7.4810 lejepa=0.3111 probe=3.8878 probe_acc=0.1972 gnorm=0.53 lr=7.68e-04 dt=34.6s 07:11:20 ep 11 | loss=4.1601 inv=0.1625 sig=7.2126 lejepa=0.3035 probe=3.8567 probe_acc=0.2084 gnorm=0.60 lr=7.20e-04 dt=34.3s 07:11:55 ep 12 | loss=4.1352 inv=0.1594 sig=6.9878 lejepa=0.2960 probe=3.8392 probe_acc=0.2084 gnorm=0.51 lr=6.68e-04 dt=34.7s 07:12:31 ep 13 | loss=4.0976 inv=0.1591 sig=6.6840 lejepa=0.2896 probe=3.8081 probe_acc=0.2148 gnorm=0.54 lr=6.15e-04 dt=36.0s 07:13:06 ep 14 | loss=4.0602 inv=0.1570 sig=6.3773 lejepa=0.2814 probe=3.7788 probe_acc=0.2080 gnorm=0.49 lr=5.60e-04 dt=34.8s 07:13:06 saved /vast/adi/tclejepa/v1/checkpoints/baseline/epoch_014.pt 07:13:45 ep 15 | loss=4.0179 inv=0.1546 sig=6.2220 lejepa=0.2759 probe=3.7419 probe_acc=0.2264 gnorm=0.48 lr=5.05e-04 dt=34.5s 07:14:20 ep 16 | loss=3.9854 inv=0.1529 sig=6.0035 lejepa=0.2699 probe=3.7155 probe_acc=0.2260 gnorm=0.46 lr=4.50e-04 dt=34.6s 07:14:54 ep 17 | loss=3.9509 inv=0.1505 sig=5.7584 lejepa=0.2626 probe=3.6882 probe_acc=0.2300 gnorm=0.44 lr=3.95e-04 dt=33.6s 07:15:28 ep 18 | loss=3.9267 inv=0.1498 sig=5.5451 lejepa=0.2577 probe=3.6690 probe_acc=0.2296 gnorm=0.42 lr=3.42e-04 dt=33.9s 07:16:02 ep 19 | loss=3.9203 inv=0.1492 sig=5.4894 lejepa=0.2560 probe=3.6643 probe_acc=0.2376 gnorm=0.44 lr=2.90e-04 dt=34.3s 07:16:02 saved /vast/adi/tclejepa/v1/checkpoints/baseline/epoch_019.pt 07:16:44 ep 20 | loss=3.8860 inv=0.1467 sig=5.3003 lejepa=0.2497 probe=3.6362 probe_acc=0.2396 gnorm=0.38 lr=2.42e-04 dt=34.3s 07:17:18 ep 21 | loss=3.8422 inv=0.1446 sig=5.1936 lejepa=0.2456 probe=3.5966 probe_acc=0.2440 gnorm=0.37 lr=1.96e-04 dt=34.6s 07:17:53 ep 22 | loss=3.8240 inv=0.1423 sig=4.9745 lejepa=0.2389 probe=3.5851 probe_acc=0.2440 gnorm=0.33 lr=1.55e-04 dt=35.2s 07:18:30 ep 23 | loss=3.8025 inv=0.1421 sig=4.9546 lejepa=0.2383 probe=3.5642 probe_acc=0.2476 gnorm=0.33 lr=1.18e-04 dt=36.1s 07:19:04 ep 24 | loss=3.7864 inv=0.1401 sig=4.8328 lejepa=0.2340 probe=3.5525 probe_acc=0.2440 gnorm=0.31 lr=8.59e-05 dt=35.0s 07:19:05 saved /vast/adi/tclejepa/v1/checkpoints/baseline/epoch_024.pt 07:19:45 ep 25 | loss=3.7627 inv=0.1386 sig=4.7178 lejepa=0.2302 probe=3.5324 probe_acc=0.2492 gnorm=0.31 lr=5.90e-05 dt=34.2s 07:20:20 ep 26 | loss=3.7557 inv=0.1396 sig=4.6609 lejepa=0.2300 probe=3.5257 probe_acc=0.2476 gnorm=0.32 lr=3.78e-05 dt=34.3s 07:20:55 ep 27 | loss=3.7405 inv=0.1379 sig=4.5767 lejepa=0.2267 probe=3.5138 probe_acc=0.2500 gnorm=0.32 lr=2.24e-05 dt=35.1s 07:21:29 ep 28 | loss=3.7354 inv=0.1369 sig=4.6161 lejepa=0.2265 probe=3.5089 probe_acc=0.2524 gnorm=0.30 lr=1.31e-05 dt=33.7s 07:22:02 ep 29 | loss=3.7340 inv=0.1380 sig=4.6505 lejepa=0.2282 probe=3.5058 probe_acc=0.2496 gnorm=0.30 lr=1.00e-05 dt=33.9s 07:22:03 saved /vast/adi/tclejepa/v1/checkpoints/baseline/epoch_029.pt 07:22:08 DONE in 1097s