AbstractPhil commited on
Commit
c7f467d
·
verified ·
1 Parent(s): 4cfc8be

Upload weights and configs - Run 20251012_041353

Browse files
weights/best_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:294bbd186f6036cf8599e3d257dae1b99f2b797e69dd10829c778672fbcc83e0
3
  size 64195804
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7a0a048b57c5b3bcc5b18aff4e5c5865e4f3c267375450d8467b0d7a313e7dfb
3
  size 64195804
weights/best_model_metadata.json CHANGED
@@ -4,28 +4,28 @@
4
  "state": {
5
  "0": {
6
  "step": "tensor(1252.)",
7
- "exp_avg": "tensor([[ 1.9713e-10, 1.3792e-10, 3.3957e-11, ..., 1.0996e-10,\n 4.6853e-11, -1.1526e-10],\n [-1.0289e-17, -9.5931e-18, 3.2373e-17, ..., 2.7494e-17,\n 4.2224e-18, 8.3908e-18],\n [-1.4832e-05, -9.2881e-06, 3.5940e-06, ..., 1.1999e-05,\n -1.1828e-05, -1.2137e-05],\n ...,\n [ 1.7920e-05, 2.1531e-05, -1.8022e-05, ..., 5.4808e-05,\n 2.7031e-05, 1.3808e-05],\n [-5.7287e-06, 1.6181e-06, 2.7875e-05, ..., -2.6199e-05,\n -2.8657e-05, 1.9206e-05],\n [-8.8155e-05, 4.1780e-06, 4.0802e-05, ..., -3.5290e-05,\n -2.8545e-05, -3.8054e-05]], device='cuda:0')",
8
- "exp_avg_sq": "tensor([[2.2200e-10, 2.7750e-09, 7.1553e-11, ..., 3.0168e-10, 1.8045e-10,\n 4.1697e-11],\n [3.3938e-12, 2.3164e-10, 8.9042e-10, ..., 3.8144e-10, 1.4700e-09,\n 2.5750e-10],\n [1.3881e-08, 1.7306e-08, 7.7339e-09, ..., 1.0447e-08, 7.8801e-09,\n 6.3375e-09],\n ...,\n [1.4389e-08, 1.3066e-08, 1.8699e-08, ..., 8.2831e-09, 8.2600e-09,\n 7.8658e-09],\n [1.4811e-08, 1.5370e-08, 1.0239e-08, ..., 1.4269e-08, 1.1555e-08,\n 8.2375e-09],\n [2.9973e-08, 2.3111e-08, 1.7009e-08, ..., 1.9652e-08, 1.6060e-08,\n 1.0703e-08]], device='cuda:0')"
9
  },
10
  "1": {
11
  "step": "tensor(1252.)",
12
- "exp_avg": "tensor([ 4.1663e-09, -7.4026e-16, 2.5350e-05, ..., -1.7010e-03,\n -1.1158e-04, -2.4774e-03], device='cuda:0')",
13
- "exp_avg_sq": "tensor([4.3436e-07, 2.1974e-06, 1.9867e-05, ..., 2.5302e-05, 2.4478e-05,\n 4.2005e-05], device='cuda:0')"
14
  },
15
  "2": {
16
  "step": "tensor(1252.)",
17
- "exp_avg": "tensor([[-5.6052e-45, -5.6052e-45, 9.8878e-07, ..., -5.9512e-06,\n 5.3793e-07, -2.0074e-06],\n [ 5.6052e-45, 5.6052e-45, 9.0100e-40, ..., 5.6052e-45,\n 5.6052e-45, 1.2612e-44],\n [-5.6052e-45, -5.6052e-45, 7.3746e-07, ..., -7.5448e-06,\n 8.4204e-06, 1.2397e-05],\n ...,\n [-5.6052e-45, 5.6052e-45, 5.6052e-45, ..., 5.6052e-45,\n 1.1651e-15, 5.6052e-45],\n [ 5.6052e-45, 5.6052e-45, 1.8246e-06, ..., 3.8607e-05,\n -1.7986e-06, 6.0209e-06],\n [ 0.0000e+00, 0.0000e+00, 5.6052e-45, ..., 5.6052e-45,\n 5.6052e-45, 0.0000e+00]], device='cuda:0')",
18
- "exp_avg_sq": "tensor([[3.2380e-12, 1.0859e-09, 1.9138e-09, ..., 3.6760e-08, 1.8076e-09,\n 1.2535e-07],\n [1.9280e-08, 5.3790e-09, 3.0021e-11, ..., 1.2888e-08, 9.0937e-12,\n 3.2040e-13],\n [5.7489e-11, 5.6419e-11, 1.3337e-09, ..., 2.0002e-08, 1.0145e-09,\n 5.7969e-09],\n ...,\n [4.5681e-12, 9.6655e-13, 4.2077e-11, ..., 8.3678e-11, 1.7605e-11,\n 1.4295e-13],\n [8.6178e-11, 4.5901e-12, 1.6466e-09, ..., 1.1019e-08, 1.1423e-08,\n 5.1227e-09],\n [0.0000e+00, 0.0000e+00, 2.5350e-18, ..., 1.1969e-21, 1.0028e-18,\n 0.0000e+00]], device='cuda:0')"
19
  },
20
  "3": {
21
  "step": "tensor(1252.)",
22
- "exp_avg": "tensor([-8.1264e-05, 7.5798e-39, 3.6408e-04, -4.2561e-09, 9.9253e-39,\n 1.2599e-04, 4.0824e-06, -4.8343e-04, 5.6052e-45, -1.2024e-04,\n 2.6566e-05, -1.3261e-03, -2.2182e-04, -1.1798e-03, -2.0031e-04,\n 7.9805e-04, -1.9029e-04, 1.5340e-04, 7.3383e-35, 3.1054e-04,\n 8.0232e-31, 3.8927e-04, 5.6052e-45, 2.0327e-07, 2.0346e-04,\n 5.6052e-45, 6.7252e-04, -5.9374e-04, 1.6031e-39, -4.4268e-04,\n 5.6052e-45, -4.2256e-04, 1.1913e-03, 5.2904e-29, 2.6332e-04,\n -1.0844e-04, 1.0241e-03, -3.9324e-04, -6.0203e-04, -6.1506e-04,\n 3.6272e-07, -6.4959e-05, 5.6052e-45, 7.9036e-04, -1.0706e-06,\n 7.5057e-39, 5.1459e-04, 4.2719e-16, -3.0999e-04, 2.9554e-04,\n 5.6052e-45, 7.2826e-04, 2.2880e-04, 7.5234e-07, 1.0432e-03,\n 8.9009e-04, 9.0002e-05, 3.4033e-04, 9.7775e-30, 4.7616e-04,\n -1.7329e-04, -8.2933e-04, -2.5101e-09, -6.6174e-04, -1.9297e-04,\n 2.8065e-05, 3.2792e-21, 5.8694e-05, 7.1903e-09, 5.6052e-45,\n -1.3637e-03, 5.6052e-45, 5.6052e-45, 5.6052e-45, -1.1402e-05,\n 2.1386e-04, 5.5230e-04, -6.4809e-05, 1.5097e-11, 2.1238e-28,\n -6.2058e-04, -6.2416e-04, -1.7541e-04, 5.6052e-45, -2.0223e-04,\n -2.2527e-04, 2.1822e-04, -2.7340e-04, 6.7822e-04, 5.6052e-45,\n 2.0326e-04, -9.1710e-05, 6.6284e-04, -7.8587e-05, 3.1331e-04,\n 2.0703e-08, -1.2218e-04, 5.8165e-04, 5.6052e-45, 1.5165e-04,\n 3.2127e-04, -2.4017e-04, -6.1863e-04, -5.4546e-09, 1.7603e-04,\n 3.7081e-07, -3.6395e-05, 1.9446e-40, 2.5548e-04, 1.1922e-04,\n 1.6387e-06, 5.6052e-45, -1.1167e-04, -5.8101e-04, 3.1455e-04,\n -1.0834e-03, 2.6438e-07, -8.6750e-05, -6.8422e-05, 2.6370e-30,\n -1.7728e-04, 5.6052e-45, 2.6906e-41, -1.4437e-04, -3.4734e-04,\n -2.4244e-04, 8.2188e-05, -2.5536e-04, 4.3580e-43, -9.3818e-06,\n 1.4432e-04, 5.9221e-04, -4.6491e-04, 1.6708e-10, 5.6052e-45,\n 3.3209e-04, -6.4235e-04, 5.6052e-45, 5.6052e-45, 4.5894e-08,\n -3.5661e-04, 5.6052e-45, -2.7353e-04, 1.0630e-12, -1.3663e-04,\n -5.2250e-04, -2.0110e-05, 7.9620e-05, 3.1210e-05, -5.4349e-05,\n 5.6052e-45, -4.3609e-05, 3.5749e-04, -6.0046e-04, 4.4374e-26,\n -1.0729e-05, 1.8651e-04, 3.8081e-05, -1.6347e-04, 3.4891e-04,\n 5.6052e-45, -1.7144e-05, -5.1653e-04, 4.9997e-05, 5.1436e-05,\n -2.6328e-04, 3.8237e-38, 5.6052e-45, 3.9904e-05, -2.8539e-03,\n -3.4180e-05, 5.6052e-45, -2.3077e-04, -1.4283e-03, 1.9029e-07,\n 5.6052e-45, 7.1281e-05, -1.2257e-05, -2.1968e-05, -8.1979e-05,\n 5.9738e-34, 1.0946e-04, -8.8604e-04, 2.6354e-25, 5.6052e-45,\n 4.9875e-07, -5.8565e-04, 3.2329e-04, 1.1123e-03, -1.1433e-05,\n 4.4116e-04, 5.6052e-45, 6.3678e-05, 3.8433e-05, -7.8500e-04,\n -4.2352e-04, 9.7195e-04, 1.2407e-04, 4.6405e-04, -8.7156e-08,\n 3.4464e-04, -5.1656e-04, -9.2867e-06, 5.1762e-05, 3.3112e-04,\n 1.2128e-05, 2.3491e-05, -7.6806e-06, 2.2013e-04, 5.6052e-45,\n -2.9912e-07, -2.5416e-04, 3.7098e-41, 1.2517e-03, 2.4143e-13,\n 7.8699e-07, -7.4514e-04, 4.3245e-07, -3.4058e-04, -3.1511e-04,\n 6.6770e-05, 2.7490e-04, 1.5292e-04, -4.9577e-04, -2.6413e-04,\n -3.3966e-05, 5.6052e-45, -1.1224e-04, -7.2274e-05, 6.1503e-04,\n 7.8753e-42, 1.1536e-12, 2.0789e-32, -3.1003e-04, -4.7707e-04,\n 5.6052e-45, -1.7004e-04, 5.6052e-45, -4.3259e-05, 5.6052e-45,\n 3.6874e-04, 1.0085e-05, 3.7596e-04, -1.9971e-04, 1.6032e-04,\n -1.2170e-06, 7.0850e-04, 5.6052e-45, 1.9194e-04, 2.2501e-06,\n 1.5158e-04, 1.9068e-04, 5.6052e-45, 1.7582e-10, -4.4623e-08,\n 3.5192e-04, 3.2316e-05, -2.5336e-04, -5.6359e-04, 5.6052e-45,\n 3.5653e-04, 4.1357e-05, -2.0718e-04, 2.5250e-06, 3.5969e-05,\n 3.9884e-26, 7.0131e-39, 3.1408e-07, -2.5653e-04, 4.1386e-04,\n 3.7927e-04, 8.7384e-05, -1.6352e-04, 5.6052e-45, -1.1449e-04,\n -2.7980e-04, -5.5338e-09, 5.6052e-45, -2.5174e-04, 5.6052e-45,\n 3.1733e-04, 1.8434e-07, 6.1010e-22, -2.7877e-05, 7.1413e-35,\n -2.4953e-04, 5.6052e-45, -2.5949e-05, 3.3504e-04, -5.0448e-05,\n 3.6315e-05, 5.6052e-45, -5.8939e-04, -9.6755e-05, 8.2634e-04,\n 7.6564e-06, 5.3710e-06, -1.2029e-04, -1.7423e-05, -1.5841e-08,\n -4.1153e-04, 2.7990e-04, 4.6507e-04, 5.6052e-45, 1.3785e-04,\n 9.3304e-04, -1.5396e-04, -1.0375e-04, -6.1837e-08, 5.6052e-45,\n -2.4184e-05, -1.9747e-04, 2.3489e-04, 5.6052e-45, -5.5726e-05,\n 2.7576e-05, 2.3926e-05, 6.7314e-05, 4.7844e-05, -1.0436e-04,\n 1.1386e-10, -3.2232e-04, 5.6052e-45, 3.9104e-07, 7.0597e-04,\n 5.6052e-45, 1.8552e-04, -1.2850e-06, -2.1309e-04, -3.2804e-04,\n 3.8535e-04, 1.9042e-11, 9.8615e-22, 2.0844e-05, 1.7425e-04,\n -4.1536e-05, 5.0983e-06, -5.9622e-04, 3.0312e-04, -8.8849e-06,\n 5.6052e-45, 1.5622e-04, 5.6052e-45, 2.5748e-08, 7.4989e-04,\n 2.0811e-14, 1.0637e-21, 5.6052e-45, -1.6330e-04, 2.1874e-42,\n -3.1103e-04, -7.1300e-04, -4.8133e-05, -4.7158e-08, 1.2379e-04,\n 1.3710e-05, 1.9674e-42, -1.6922e-04, 1.1199e-04, 1.8838e-04,\n 1.1957e-05, -9.3143e-07, 5.6052e-45, 1.2102e-21, 4.1149e-04,\n -1.3290e-03, -2.4555e-04, 7.4706e-04, -1.9759e-04, -5.1621e-04,\n 6.5269e-35, 2.5814e-04, 5.6052e-45, 1.7694e-04, -1.7651e-03,\n 2.9528e-04, 9.0772e-27, -3.9514e-05, -6.2321e-14, 5.2326e-05,\n -1.7559e-04, 3.6145e-05, 4.1458e-34, 5.6052e-45, 1.5670e-04,\n -1.0744e-04, -2.8093e-04, -2.3748e-04, 2.6463e-04, 5.8540e-05,\n 1.8535e-07, -2.9949e-04, 7.6396e-05, 5.9589e-05, 8.2617e-04,\n 5.6052e-45, 1.0766e-03, 1.2193e-35, 5.6052e-45, 6.9457e-04,\n 9.1567e-13, 5.6052e-45, -1.1279e-04, 9.8371e-06, -2.3481e-04,\n -4.2023e-05, -1.7353e-04, 1.8519e-04, 2.8085e-04, 4.1098e-22,\n 4.5900e-04, 5.6052e-45, 5.6052e-45, -4.8305e-05, 1.1504e-03,\n 1.0284e-04, 2.6488e-04, 6.6194e-05, 7.9345e-04, 3.2412e-04,\n 5.6052e-45, 2.6438e-04, 1.2683e-03, 9.8305e-05, -2.7174e-04,\n -4.7245e-04, 1.0225e-04, -1.3631e-04, 3.3892e-35, 1.4776e-04,\n -3.1982e-04, 1.8618e-04, 4.2763e-04, -2.7158e-04, -1.5984e-04,\n 3.0278e-04, 6.1912e-04, 2.0484e-04, 2.6571e-08, 6.3978e-04,\n 3.8475e-04, 4.2492e-04, 8.4660e-26, 3.2762e-04, 5.5910e-04,\n 1.3316e-07, -2.7856e-05, 7.9215e-10, -3.0108e-04, -3.2833e-04,\n -4.4216e-04, -5.6435e-05, -4.1902e-04, 2.6037e-04, -1.1174e-04,\n -1.4238e-05, 5.1957e-04, -4.3069e-04, -1.2269e-04, 5.5970e-04,\n 5.6052e-45, 1.5761e-05, 2.0862e-04, 1.9052e-05, 3.3937e-04,\n 1.0553e-07, -9.6583e-05, 1.2294e-06, -2.3831e-04, -1.5985e-04,\n 5.1069e-04, 1.9570e-07, -3.0616e-04, 2.6753e-04, -4.3465e-05,\n -1.9713e-04, -1.1068e-04, -6.9833e-04, -1.8459e-04, -4.8540e-05,\n 5.6052e-45, 3.9097e-05, -1.1075e-03, 5.6052e-45, 4.1887e-04,\n -8.4801e-05, -1.9641e-04, 5.6052e-45, 1.2488e-22, 2.3699e-07,\n 5.9985e-05, 2.5143e-04, 2.5703e-04, -1.6749e-04, 1.7819e-04,\n -1.9615e-21, 5.6052e-45, 5.0861e-04, -2.7762e-04, 5.6524e-31,\n 1.1466e-04, -3.0801e-04, 3.8789e-05, -1.7303e-04, 1.5610e-27,\n -1.1859e-04, -7.6397e-06, 2.3618e-04, 1.3263e-04, 1.0769e-17,\n -3.2863e-04, 8.3187e-05, 5.6052e-45, 6.4671e-06, 1.1686e-05,\n -2.5893e-04, 5.6052e-45, 1.4613e-05, -1.8140e-04, 1.9618e-42,\n -2.7110e-04, 3.3940e-15, 4.9949e-04, 1.0043e-04, -8.5296e-05,\n 5.6052e-45, 2.9566e-04, 8.6320e-43, -4.8263e-06, 3.0104e-04,\n 2.5275e-18, -8.8767e-05, 3.0834e-04, 8.8117e-29, 5.6052e-45,\n 5.6052e-45, 4.3284e-37, 5.6052e-45, 3.1122e-37, -1.3090e-04,\n -9.2880e-04, 6.7252e-05, -1.2725e-04, -6.0987e-05, 4.2595e-04,\n 5.6052e-45, 7.2849e-05, -1.8850e-04, -1.4746e-04, -1.4861e-04,\n -4.8619e-05, 1.5747e-05, 7.4227e-07, -3.3240e-06, 2.8659e-04,\n 5.6052e-45, -3.3913e-04, 7.4403e-05, 3.5775e-04, 6.7038e-04,\n -9.2686e-05, 3.2418e-11, -1.9911e-04, 2.5734e-04, -1.6413e-04,\n -3.8621e-05, -4.0990e-04, 8.8431e-05, -1.0730e-05, 1.8265e-07,\n 5.6052e-45, 5.6052e-45, 1.7692e-04, 3.2113e-04, -2.0924e-04,\n 7.2445e-04, 4.2848e-04, -6.9459e-04, 5.6052e-45, -2.6960e-04,\n 3.0032e-08, -1.0461e-07, -1.0324e-03, -4.9936e-05, 5.8789e-04,\n 1.8930e-05, -3.9123e-06, 6.2153e-05, 7.5662e-40, -1.3433e-07,\n 2.9666e-04, 1.3513e-05, -2.6712e-05, -1.8029e-05, 9.6275e-05,\n -4.8399e-04, 5.6052e-45, 7.6657e-09, -1.9402e-03, 4.3242e-04,\n 7.4915e-06, 4.4386e-04, 2.7446e-07, 5.6052e-45, -2.3517e-04,\n 5.6052e-45, -1.7880e-04, 5.6052e-45, 4.9186e-27, 3.0135e-04,\n 5.8542e-05, 1.0646e-06, -5.4039e-04, 1.7541e-16, 5.6895e-04,\n 3.2011e-04, 3.0544e-04, 5.6052e-45, 5.6052e-45, 1.1752e-04,\n 2.7228e-04, 6.8890e-37, 2.5974e-07, -4.3170e-05, -3.6247e-04,\n 5.6052e-45, 5.6052e-45, 1.4788e-04, 1.8833e-04, 1.7535e-04,\n 1.4693e-04, 3.7588e-17, 6.4629e-04, -6.6416e-05, -2.9147e-04,\n 5.6052e-45, -6.4610e-04, 1.6550e-04, -1.2144e-04, 2.3050e-04,\n -1.2833e-04, -2.7904e-04, -1.9479e-04, 2.5716e-27, 1.0468e-04,\n -2.0327e-04, 8.6941e-33, 1.9888e-04, 5.5041e-09, -1.6058e-04,\n 8.5532e-04, -8.3713e-05, -8.4738e-05, -1.2076e-04, 4.6266e-20,\n 5.5753e-07, 3.2753e-06, 1.6157e-04, 4.7866e-05, 5.5889e-04,\n 2.6746e-36, 2.9061e-04, -1.0881e-04, -2.1097e-05, -4.8695e-04,\n 3.2925e-04, -4.8553e-05, 3.3439e-41, 1.0943e-04, 5.9802e-04,\n -1.0327e-04, -2.6962e-04, 3.1022e-05, 3.9226e-04, -6.9205e-05,\n -4.3627e-04, 3.1059e-04, -1.4419e-04, 8.9291e-05, 6.3517e-30,\n -9.1758e-04, -4.6729e-04, 7.7562e-13, 4.5750e-05, 5.4830e-38,\n -1.8727e-04, 2.8139e-05, -1.0231e-03, 1.8932e-20, 1.1199e-03,\n -1.4275e-04, 5.6052e-45, 5.4334e-04, 3.5230e-08, -4.6426e-04,\n 5.6052e-45, -2.8555e-04, 5.6052e-45, 7.4944e-09, -4.9895e-04,\n 3.3658e-10, 1.1722e-08, -3.8484e-04, -1.4074e-04, -2.5970e-04,\n 6.5027e-19, -4.2515e-04, -1.8295e-04, 1.4178e-05, 7.6085e-06,\n 5.2322e-04, -1.5440e-04, -6.8521e-05, -1.9164e-04, -1.6505e-04,\n -3.8157e-04, 5.6052e-45, 9.5609e-05, 3.2674e-12, 5.6052e-45,\n -5.4841e-07, 3.2532e-05, 1.0319e-10, 5.6052e-45, 4.9991e-04,\n 5.4790e-04, 3.0915e-10, 1.7830e-04, -3.6514e-04, -2.6623e-04,\n -1.4962e-05, 4.1905e-28, 3.2258e-04, 8.8132e-08, -6.4462e-04,\n 5.6052e-45, 4.6858e-04, 5.8869e-06, 9.5817e-05, -5.2355e-04,\n -8.0031e-05, 8.1327e-30, 1.9230e-05, -4.6101e-04, -5.7366e-13,\n 9.8916e-25, 3.7994e-13, 3.1462e-05, -1.8218e-04, 5.0399e-04,\n 1.4011e-30, 6.0425e-05, 5.6052e-45, 5.6052e-45, -3.0413e-04,\n 5.3550e-09, -6.1937e-05, 2.4589e-10, 5.6052e-45, 5.6052e-45,\n -3.5811e-04, 3.0902e-04, -2.8563e-04, 2.1389e-04, 2.5223e-04,\n 6.7046e-15, 3.4430e-04, 5.6052e-45], device='cuda:0')",
23
- "exp_avg_sq": "tensor([3.3693e-06, 2.4410e-05, 8.9575e-07, 1.1231e-05, 6.2019e-06, 4.9490e-06,\n 4.5566e-07, 5.7694e-06, 1.1967e-09, 5.1687e-06, 4.6993e-06, 7.4326e-06,\n 4.2618e-06, 6.9185e-06, 5.1314e-06, 1.4186e-06, 7.8493e-06, 6.4303e-06,\n 2.2068e-05, 4.5573e-06, 4.1858e-07, 1.9032e-06, 2.9108e-09, 2.4298e-05,\n 9.2279e-06, 5.2920e-06, 3.6979e-06, 2.7045e-06, 6.8514e-07, 7.3013e-06,\n 5.4680e-08, 2.9139e-06, 6.4900e-06, 1.5336e-08, 1.4735e-05, 4.2086e-07,\n 1.7540e-06, 4.5798e-06, 3.8331e-06, 1.7108e-05, 1.2593e-05, 1.5988e-06,\n 1.4059e-05, 2.2733e-06, 1.3956e-06, 3.1771e-08, 6.7631e-06, 7.8367e-06,\n 7.4455e-06, 3.6206e-06, 1.4442e-06, 7.8171e-06, 9.6952e-07, 2.5454e-07,\n 2.0429e-05, 4.9588e-06, 1.7894e-06, 6.1193e-06, 3.5241e-07, 5.7870e-06,\n 5.0422e-07, 2.5689e-06, 7.6001e-07, 2.3287e-06, 4.7610e-06, 6.8214e-06,\n 2.7934e-06, 5.7856e-07, 1.2541e-07, 2.1391e-05, 4.5586e-06, 3.8044e-07,\n 1.0139e-07, 5.0466e-05, 9.2853e-06, 1.0080e-05, 7.1167e-06, 3.3880e-06,\n 7.4313e-06, 2.1592e-05, 3.2378e-06, 8.2832e-06, 2.6593e-06, 1.8354e-08,\n 2.0593e-06, 9.7601e-06, 2.0677e-07, 6.6697e-06, 1.2691e-05, 2.7408e-16,\n 4.8086e-06, 2.5989e-06, 3.8664e-07, 3.1938e-06, 3.5740e-06, 2.0398e-06,\n 1.0473e-05, 1.6150e-05, 4.5368e-06, 5.0644e-07, 1.6493e-05, 9.5020e-07,\n 5.7118e-06, 6.8295e-08, 3.3438e-06, 7.5491e-07, 7.2297e-06, 2.0499e-08,\n 8.8315e-06, 8.8582e-07, 1.9254e-05, 8.1561e-06, 4.2689e-07, 1.8190e-05,\n 7.2604e-07, 1.0932e-05, 7.4600e-06, 1.4252e-06, 2.6599e-06, 1.2821e-07,\n 3.3043e-06, 2.2632e-09, 3.7446e-07, 3.2996e-06, 2.0189e-06, 1.1756e-05,\n 4.5110e-06, 6.8147e-06, 7.6686e-06, 1.6396e-05, 2.4774e-06, 6.4399e-06,\n 1.5132e-05, 1.9939e-06, 1.9646e-07, 8.6791e-07, 3.7148e-05, 1.3106e-07,\n 1.5055e-05, 5.9321e-07, 2.1396e-05, 2.0616e-06, 3.1613e-05, 4.9411e-08,\n 4.4038e-06, 3.2082e-06, 8.8962e-06, 1.2544e-06, 2.0764e-06, 1.4117e-06,\n 1.7709e-05, 3.1737e-06, 1.3063e-06, 1.4324e-06, 9.2868e-07, 2.2081e-06,\n 5.7214e-08, 1.6185e-06, 1.5348e-06, 6.2244e-06, 9.4854e-07, 6.7281e-06,\n 1.3210e-06, 2.5563e-07, 8.7678e-06, 7.1245e-07, 2.8445e-06, 1.8839e-06,\n 1.5569e-06, 5.3353e-06, 1.7520e-06, 3.2884e-09, 1.0783e-05, 8.1873e-06,\n 6.8559e-05, 1.5123e-06, 2.0890e-07, 5.4987e-06, 2.1404e-06, 3.0977e-06,\n 5.5348e-06, 7.7396e-06, 1.7445e-07, 4.5536e-09, 1.7669e-07, 4.6162e-06,\n 7.7856e-06, 9.0437e-06, 1.8811e-06, 4.0502e-06, 3.6209e-06, 1.0294e-05,\n 1.9044e-05, 3.0561e-06, 3.3748e-06, 1.9965e-05, 6.8493e-06, 2.5217e-06,\n 2.4885e-06, 1.1633e-06, 4.5274e-06, 3.4137e-06, 2.6378e-06, 3.3471e-06,\n 2.1692e-05, 5.8255e-06, 2.4218e-06, 8.6630e-06, 3.8317e-06, 8.7063e-06,\n 3.4823e-06, 7.4554e-08, 6.4560e-07, 1.2154e-06, 5.9539e-06, 4.4567e-07,\n 2.2113e-06, 1.7861e-05, 1.3831e-06, 5.2571e-06, 4.3274e-06, 6.9857e-07,\n 1.9159e-06, 6.6942e-07, 4.3637e-06, 2.4472e-06, 3.6669e-12, 2.0182e-06,\n 5.6492e-06, 2.5355e-06, 2.4622e-06, 1.8956e-07, 1.2370e-05, 6.4376e-06,\n 1.1244e-05, 5.5215e-09, 5.1558e-06, 6.8355e-09, 7.8053e-06, 2.3653e-09,\n 2.8897e-06, 1.7738e-06, 3.3102e-06, 6.3382e-07, 1.6061e-06, 3.4454e-05,\n 1.0155e-05, 9.9832e-16, 6.3578e-05, 1.2768e-05, 7.9200e-07, 2.3123e-06,\n 1.3503e-06, 1.2308e-08, 5.1714e-07, 5.1811e-06, 5.9057e-06, 3.3349e-06,\n 1.0878e-05, 1.0051e-07, 1.0626e-06, 5.0624e-06, 1.2407e-05, 1.6917e-05,\n 1.1727e-06, 4.6355e-09, 5.3633e-06, 6.2005e-06, 2.6731e-06, 7.3875e-06,\n 4.5632e-06, 4.4475e-06, 1.8239e-05, 9.8957e-07, 3.2249e-06, 5.0458e-06,\n 2.2688e-05, 6.9551e-06, 6.8217e-06, 1.1738e-10, 1.6302e-05, 4.1912e-06,\n 8.5339e-08, 1.2285e-05, 8.6727e-06, 1.4659e-06, 2.5946e-06, 2.6636e-06,\n 3.8717e-06, 2.8450e-06, 5.4497e-06, 1.1539e-06, 4.4956e-06, 6.1807e-06,\n 6.5998e-06, 1.5836e-05, 7.0212e-07, 1.4822e-06, 1.3207e-05, 1.1564e-06,\n 2.2965e-06, 2.0187e-06, 1.0480e-05, 4.7167e-07, 5.2347e-06, 4.8601e-06,\n 5.6593e-06, 1.1369e-06, 5.5059e-06, 3.9796e-08, 7.7935e-06, 9.5096e-07,\n 2.1128e-06, 7.1229e-06, 1.2517e-05, 3.0143e-08, 1.7837e-06, 1.8615e-05,\n 6.7370e-07, 1.2780e-07, 1.8260e-05, 1.8836e-05, 2.7510e-12, 4.3468e-09,\n 5.8866e-06, 3.5754e-06, 1.0533e-06, 1.9996e-06, 2.1044e-05, 1.0091e-05,\n 8.2017e-06, 1.5049e-08, 7.8433e-07, 5.0551e-07, 4.7566e-06, 2.6181e-07,\n 3.0355e-06, 2.1853e-06, 1.6365e-06, 7.1078e-07, 2.7933e-05, 9.4889e-07,\n 7.2585e-10, 1.8789e-09, 2.6458e-06, 6.4898e-06, 1.6380e-07, 1.1762e-08,\n 6.1760e-06, 1.9065e-06, 3.1144e-06, 1.6804e-05, 9.7195e-06, 3.4094e-08,\n 1.9902e-06, 1.4157e-05, 1.3322e-05, 4.2700e-06, 7.0517e-06, 1.0999e-06,\n 1.4735e-07, 4.5406e-08, 1.1311e-06, 1.8050e-09, 1.7040e-06, 4.7493e-06,\n 1.8805e-06, 4.3105e-06, 3.0279e-06, 6.6367e-06, 3.7447e-06, 2.5139e-06,\n 6.8704e-15, 7.6032e-06, 6.9122e-06, 6.9131e-07, 4.7528e-05, 5.7191e-06,\n 1.7187e-08, 1.5245e-06, 1.3911e-06, 4.6972e-06, 1.2284e-05, 2.4333e-05,\n 1.1751e-06, 3.7495e-06, 1.0096e-06, 1.6648e-05, 1.7527e-06, 1.6993e-07,\n 2.0131e-06, 7.7643e-06, 4.4183e-06, 3.7435e-06, 8.1354e-06, 8.1317e-06,\n 1.0773e-05, 6.5235e-06, 2.2403e-06, 2.8637e-06, 1.0907e-05, 1.6727e-09,\n 2.9217e-08, 1.3397e-05, 9.9356e-06, 1.1695e-05, 1.6826e-05, 4.6957e-06,\n 3.5887e-05, 1.0815e-06, 4.0590e-06, 2.6816e-07, 9.1692e-07, 4.8500e-07,\n 2.2639e-05, 3.7577e-06, 9.4447e-07, 2.6807e-07, 5.8754e-06, 4.9834e-06,\n 1.8924e-06, 7.0958e-06, 5.0751e-06, 2.5766e-07, 1.6951e-06, 3.3770e-06,\n 7.8760e-06, 4.1990e-06, 2.1676e-08, 1.1226e-05, 1.0999e-06, 3.4279e-06,\n 9.6933e-06, 4.9122e-06, 1.4666e-07, 8.9252e-06, 4.5064e-06, 7.1595e-06,\n 1.1603e-08, 2.4819e-06, 5.8658e-06, 2.1225e-06, 4.1565e-05, 1.3885e-06,\n 2.2436e-06, 2.8361e-08, 7.1726e-06, 8.5637e-09, 2.5720e-06, 3.7462e-06,\n 3.4960e-06, 6.7820e-06, 1.1515e-06, 1.3679e-06, 4.9748e-06, 2.0245e-05,\n 9.1198e-06, 3.5416e-06, 1.8741e-06, 1.9910e-06, 1.5754e-05, 1.1233e-06,\n 2.2612e-06, 2.6649e-08, 9.0686e-06, 1.2949e-05, 1.6705e-06, 4.1054e-05,\n 1.6241e-06, 2.0028e-06, 3.4621e-06, 1.4528e-07, 1.3291e-07, 2.4980e-05,\n 8.5697e-07, 3.6278e-06, 1.8603e-06, 1.2999e-05, 1.2606e-06, 2.7245e-06,\n 3.6697e-10, 5.3910e-08, 8.0575e-06, 3.1466e-05, 2.2134e-06, 7.2762e-06,\n 2.7171e-06, 2.5004e-07, 9.6974e-08, 4.7756e-06, 5.3983e-06, 1.9046e-06,\n 2.9134e-06, 1.8686e-06, 2.0608e-06, 5.1195e-07, 4.7890e-10, 7.1490e-06,\n 3.3984e-06, 3.4456e-06, 1.8777e-06, 2.6746e-05, 4.2836e-06, 7.2854e-06,\n 1.4814e-06, 6.4303e-06, 3.4519e-06, 1.1490e-06, 5.0320e-07, 3.5298e-09,\n 1.1648e-05, 5.0200e-06, 2.8040e-07, 3.0941e-05, 1.1119e-06, 7.3155e-06,\n 9.5795e-08, 3.1949e-06, 3.9493e-06, 4.0432e-05, 3.0909e-06, 6.2836e-07,\n 3.5134e-06, 4.6867e-06, 4.4169e-06, 8.6829e-06, 1.0924e-07, 1.0040e-06,\n 9.7807e-07, 8.8766e-06, 1.8046e-07, 3.5222e-06, 1.4853e-05, 4.4637e-06,\n 2.1686e-06, 2.4515e-07, 4.8200e-08, 6.2169e-05, 5.0371e-10, 1.2525e-05,\n 3.5620e-06, 3.2728e-05, 3.4235e-05, 7.9581e-07, 4.5748e-06, 3.3867e-05,\n 1.4252e-05, 3.6429e-07, 1.4411e-06, 5.4747e-06, 5.1058e-06, 7.5437e-06,\n 3.7024e-06, 6.7335e-07, 9.1437e-06, 6.6628e-08, 2.3364e-05, 1.5279e-06,\n 2.6628e-06, 1.0145e-05, 1.4809e-06, 2.6937e-06, 9.9388e-06, 5.3542e-06,\n 7.2049e-06, 3.1689e-06, 1.6303e-06, 6.1651e-06, 1.6020e-06, 1.0233e-07,\n 1.7902e-05, 1.9106e-07, 9.2660e-07, 1.4074e-06, 1.8916e-06, 7.1971e-06,\n 5.8780e-05, 2.3267e-05, 1.7304e-06, 4.2744e-06, 4.0710e-06, 7.3329e-08,\n 4.6507e-06, 3.2389e-06, 3.6059e-06, 1.6733e-06, 3.8105e-06, 3.2092e-05,\n 2.5952e-05, 6.7724e-07, 1.2954e-06, 2.7841e-06, 6.3976e-06, 1.6183e-07,\n 1.2807e-05, 1.1780e-06, 2.2827e-06, 1.3140e-05, 1.7030e-05, 1.2125e-06,\n 3.4199e-06, 3.9883e-06, 3.1252e-06, 2.7216e-09, 9.1962e-06, 9.7500e-07,\n 1.0411e-06, 6.3169e-06, 1.7635e-07, 3.4237e-07, 1.1492e-06, 2.7977e-06,\n 9.5920e-06, 5.7352e-07, 2.9897e-06, 8.8170e-06, 6.9273e-06, 2.3744e-06,\n 1.0508e-05, 5.1282e-06, 4.6150e-06, 1.6428e-05, 5.3555e-05, 7.4789e-06,\n 1.5190e-06, 6.9186e-07, 4.6280e-09, 1.7534e-05, 2.7921e-06, 4.2805e-05,\n 5.8490e-06, 2.1551e-09, 3.2127e-06, 4.0567e-07, 7.0518e-06, 7.3131e-06,\n 5.2941e-06, 1.9729e-06, 4.7879e-06, 1.6201e-06, 1.4118e-06, 3.5397e-06,\n 1.4090e-06, 4.1118e-06, 1.0943e-07, 4.7859e-07, 1.1029e-06, 2.7658e-06,\n 3.2909e-06, 4.1412e-07, 1.5403e-05, 9.1910e-06, 8.1625e-06, 1.0662e-06,\n 1.8042e-09, 4.7395e-06, 1.2501e-06, 5.4024e-07, 1.8113e-07, 4.7083e-06,\n 2.5615e-06, 5.3423e-05, 1.6159e-05, 1.9292e-06, 2.2935e-06, 2.1682e-06,\n 7.1856e-08, 1.8946e-05, 8.0018e-06, 3.4229e-06, 8.4947e-06, 6.2085e-06,\n 4.7878e-06, 3.3672e-06, 1.2898e-06, 3.9991e-06, 7.8990e-06, 1.9971e-06,\n 1.5234e-05, 9.8609e-10, 2.6940e-06, 1.5203e-06, 6.4713e-06, 9.9104e-07,\n 8.5900e-06, 2.2823e-06, 6.8063e-06, 4.5486e-06, 8.2973e-07, 8.1065e-06,\n 3.8346e-07, 6.5471e-18, 3.7177e-06, 7.7388e-07, 4.2688e-06, 3.3238e-08,\n 1.2169e-06, 1.2871e-05, 1.0205e-05, 6.0908e-06, 3.7562e-08, 8.6344e-06,\n 5.8068e-06, 5.6396e-06, 2.0693e-06, 1.9309e-06, 8.8574e-06, 2.0175e-06,\n 2.0972e-07, 2.0442e-06, 4.9912e-06, 7.0220e-06, 3.6238e-06, 1.6966e-06,\n 3.6249e-06, 3.9343e-06, 8.1132e-13, 2.1420e-07, 2.6506e-06, 1.1776e-11,\n 2.8554e-06, 3.3908e-05, 6.7573e-06, 9.8483e-10, 1.9724e-06, 3.1046e-06,\n 4.3230e-07, 6.7797e-06, 4.6747e-06, 1.8974e-06, 3.6497e-06, 5.9390e-06,\n 4.6872e-06, 1.9245e-06, 7.1672e-06, 6.3692e-05, 4.4564e-06, 6.0133e-06,\n 3.6987e-06, 4.9418e-06, 3.8102e-06, 5.0585e-08, 1.2168e-05, 1.3071e-06,\n 1.6564e-07, 1.6742e-10, 5.2557e-06, 9.7073e-06, 9.5956e-06, 2.3412e-06,\n 1.8318e-06, 5.1803e-06, 4.8746e-05, 2.8585e-06, 5.3646e-06, 3.4900e-06,\n 3.2306e-07, 2.8074e-07, 1.0148e-06, 4.6156e-07, 1.0313e-05, 1.5338e-05,\n 1.8243e-06, 2.1760e-06, 4.3299e-06, 2.3921e-07, 1.2060e-06, 3.2017e-17],\n device='cuda:0')"
24
  },
25
  "4": {
26
  "step": "tensor(1252.)",
27
- "exp_avg": "tensor([[-2.6488e-05, -3.0670e-41, 7.2287e-06, ..., -5.1648e-16,\n -3.5191e-06, 5.6052e-45],\n [ 4.9832e-06, 4.3369e-40, 1.2981e-05, ..., -1.7986e-16,\n 1.2125e-05, 5.6052e-45],\n [-1.4689e-04, -2.7840e-40, -3.2052e-05, ..., -3.6451e-16,\n -2.8482e-05, 5.6052e-45],\n ...,\n [ 3.2523e-05, -5.4717e-40, 1.7757e-05, ..., -1.0408e-16,\n -2.6931e-05, -5.6052e-45],\n [ 3.6407e-05, 1.3309e-40, -6.4877e-05, ..., -6.4068e-16,\n 3.8929e-05, -5.6052e-45],\n [ 1.1389e-04, -1.0316e-39, -4.6095e-05, ..., 1.2785e-16,\n 5.6176e-06, -5.6052e-45]], device='cuda:0')",
28
- "exp_avg_sq": "tensor([[2.9468e-08, 5.6937e-09, 5.2163e-09, ..., 1.4844e-10, 2.7376e-09,\n 5.1928e-23],\n [1.1546e-07, 2.4961e-09, 1.1412e-08, ..., 6.9710e-13, 4.4339e-09,\n 2.3162e-20],\n [1.4265e-07, 4.6236e-08, 1.6179e-08, ..., 7.9306e-12, 7.2551e-09,\n 3.2764e-22],\n ...,\n [1.0996e-07, 1.6454e-10, 1.4801e-08, ..., 1.9046e-11, 7.8488e-09,\n 5.9771e-21],\n [1.0020e-07, 2.5611e-10, 1.4037e-08, ..., 5.6161e-10, 6.1721e-09,\n 2.9927e-21],\n [1.2666e-07, 9.4758e-09, 1.3140e-08, ..., 5.6897e-12, 4.7143e-09,\n 3.5015e-21]], device='cuda:0')"
29
  }
30
  },
31
  "param_groups": [
@@ -223,15 +223,15 @@
223
  ]
224
  },
225
  "metrics": {
226
- "best_val_acc": 79.488,
227
  "best_epoch": 0,
228
  "scale_accuracies": {
229
- "384": 79.488
230
  }
231
  },
232
  "train_config": {
233
  "name": "david_training",
234
- "run_id": "20251012_040642",
235
  "dataset_name": "AbstractPhil/imagenet-clip-features-orderly",
236
  "model_variant": "clip_vit_l14",
237
  "num_classes": 1000,
 
4
  "state": {
5
  "0": {
6
  "step": "tensor(1252.)",
7
+ "exp_avg": "tensor([[-5.1115e-05, 2.0107e-05, 3.4546e-05, ..., -3.3245e-05,\n 9.1718e-06, 8.0877e-06],\n [-3.6630e-05, -1.6314e-05, -5.6690e-06, ..., -3.2203e-05,\n 2.1494e-05, -9.5532e-06],\n [-5.6052e-45, -5.6052e-45, -5.6052e-45, ..., -5.6052e-45,\n 5.6052e-45, -5.6052e-45],\n ...,\n [-5.7992e-07, 1.7772e-05, -2.0679e-05, ..., 5.6017e-06,\n 3.1833e-05, 2.3251e-05],\n [-1.5739e-05, -2.9994e-05, -6.0391e-06, ..., 1.8479e-05,\n -2.8892e-05, 4.3773e-06],\n [-5.3456e-06, 4.4878e-05, -2.1462e-05, ..., 2.3223e-05,\n 6.6821e-06, 2.3600e-05]], device='cuda:0')",
8
+ "exp_avg_sq": "tensor([[1.2885e-08, 1.3700e-08, 6.3741e-09, ..., 8.7725e-09, 7.6021e-09,\n 4.8925e-09],\n [7.9402e-09, 9.3185e-09, 6.0706e-09, ..., 5.7460e-09, 5.5121e-09,\n 3.8883e-09],\n [8.2648e-18, 9.9391e-18, 1.1785e-17, ..., 6.7162e-18, 3.4203e-18,\n 8.1850e-18],\n ...,\n [1.4760e-08, 1.4014e-08, 9.2830e-09, ..., 1.0177e-08, 7.3684e-09,\n 6.2340e-09],\n [1.8348e-08, 1.5192e-08, 1.2791e-08, ..., 1.1322e-08, 9.8771e-09,\n 8.2061e-09],\n [1.9906e-09, 3.1307e-09, 2.1364e-09, ..., 3.3339e-09, 1.6830e-09,\n 1.6688e-09]], device='cuda:0')"
9
  },
10
  "1": {
11
  "step": "tensor(1252.)",
12
+ "exp_avg": "tensor([-1.4937e-03, -1.0415e-03, 5.6052e-45, ..., -6.1226e-04,\n 1.0764e-03, 9.4429e-04], device='cuda:0')",
13
+ "exp_avg_sq": "tensor([1.6521e-05, 1.2791e-05, 3.4756e-14, ..., 2.0229e-05, 2.3449e-05,\n 3.8690e-06], device='cuda:0')"
14
  },
15
  "2": {
16
  "step": "tensor(1252.)",
17
+ "exp_avg": "tensor([[ 3.8469e-06, 4.4727e-06, 5.6052e-45, ..., 6.8052e-05,\n -1.6977e-08, -1.1068e-06],\n [ 5.6052e-45, 3.4778e-23, 0.0000e+00, ..., 5.6052e-45,\n 5.6052e-45, 5.6052e-45],\n [ 5.6052e-45, 5.6052e-45, 0.0000e+00, ..., 5.6052e-45,\n 5.6052e-45, 5.6052e-45],\n ...,\n [ 0.0000e+00, 5.6052e-45, 0.0000e+00, ..., 5.6052e-45,\n 5.6052e-45, 0.0000e+00],\n [ 2.6602e-12, 6.5419e-14, 0.0000e+00, ..., -5.6052e-45,\n 5.6052e-45, -5.6052e-45],\n [ 1.7557e-06, -4.9403e-07, 0.0000e+00, ..., 1.2390e-06,\n 1.6308e-05, -2.5592e-06]], device='cuda:0')",
18
+ "exp_avg_sq": "tensor([[9.7774e-09, 6.2782e-09, 5.4596e-17, ..., 9.7538e-09, 6.3006e-08,\n 1.4746e-09],\n [3.5497e-11, 6.6977e-10, 0.0000e+00, ..., 1.2565e-10, 4.6488e-14,\n 4.6279e-10],\n [9.2665e-10, 3.2794e-09, 0.0000e+00, ..., 1.8004e-09, 1.5863e-14,\n 3.6890e-09],\n ...,\n [0.0000e+00, 1.5680e-16, 0.0000e+00, ..., 4.5935e-18, 5.4860e-18,\n 0.0000e+00],\n [1.6481e-09, 1.6852e-08, 0.0000e+00, ..., 3.6060e-09, 2.4500e-10,\n 2.2296e-08],\n [2.6776e-10, 3.7610e-10, 0.0000e+00, ..., 2.7872e-10, 4.5433e-09,\n 8.8203e-11]], device='cuda:0')"
19
  },
20
  "3": {
21
  "step": "tensor(1252.)",
22
+ "exp_avg": "tensor([ 3.8218e-04, 8.0004e-22, 5.6052e-45, -1.2478e-04, 7.0635e-05,\n 2.0413e-20, 1.1707e-04, 1.9848e-04, 3.1622e-05, 4.7034e-04,\n 1.0529e-04, 4.7842e-19, 4.8117e-04, 6.6726e-07, -2.6610e-04,\n 6.0888e-20, -9.4428e-05, 5.6052e-45, 5.6052e-45, -3.7158e-04,\n 5.6052e-45, -9.8299e-05, 5.6052e-45, 2.5381e-04, 6.2474e-04,\n -1.8862e-06, 2.7348e-08, 5.6052e-45, 2.7322e-04, 1.9617e-04,\n -2.3872e-04, 2.4501e-06, -1.8965e-05, 4.9968e-04, -1.3027e-04,\n 8.1243e-05, 1.5436e-28, 2.1093e-04, 3.3742e-04, 5.0860e-05,\n 5.2040e-04, 9.5792e-05, 5.7385e-04, 6.3446e-04, 2.6995e-04,\n 1.0579e-10, -4.3391e-05, 3.0988e-04, 5.5316e-04, 4.2428e-04,\n 4.5718e-31, 2.1099e-06, 1.0349e-04, 3.7559e-04, -1.1469e-07,\n 1.7873e-23, 1.4911e-27, -6.1441e-05, 5.6052e-45, 3.0057e-04,\n -1.1182e-07, -2.2101e-05, -4.2033e-04, 5.4079e-04, 7.5203e-15,\n 5.5865e-18, 2.6620e-04, -4.5977e-06, 5.6052e-45, 5.6052e-45,\n -6.1323e-04, 1.2223e-39, -2.3448e-05, -2.2909e-04, -3.9513e-04,\n 4.2284e-04, 5.6052e-45, 3.7224e-05, -3.5990e-05, 1.3120e-04,\n 5.6052e-45, 6.2860e-05, 9.5806e-04, 5.6052e-45, 7.9613e-05,\n 3.2063e-04, 7.8807e-05, -1.4610e-04, -7.5393e-05, 5.7598e-04,\n 2.8434e-04, -2.9455e-21, 9.5098e-08, 4.7277e-04, 5.6382e-05,\n 5.8133e-04, 3.8539e-04, -3.8778e-07, -5.0567e-05, 2.9547e-04,\n -7.1920e-04, 1.5677e-04, -1.3764e-04, -1.0793e-03, 2.9480e-04,\n -5.5674e-04, -8.5346e-05, -1.5459e-04, -9.3293e-05, 5.6052e-45,\n -1.1488e-04, 3.4394e-04, 6.1917e-04, 1.1114e-38, 1.7663e-04,\n -4.3614e-04, 1.2581e-04, 4.0967e-05, 3.7442e-07, 2.4266e-34,\n -3.3006e-04, -5.9274e-04, 5.4158e-06, 5.6052e-45, -2.8571e-04,\n 4.2498e-05, 2.4431e-06, 1.7019e-41, 5.1506e-05, 5.6052e-45,\n 2.1816e-04, 1.8041e-04, 5.6052e-45, 7.9613e-05, 1.0230e-20,\n -2.3387e-04, 2.6979e-21, 2.7262e-04, 1.9061e-04, 5.7635e-31,\n 5.5506e-23, 2.5028e-18, 5.2738e-05, 1.2882e-10, 5.6052e-45,\n 3.0278e-19, -1.9402e-04, -3.5185e-04, 3.0248e-18, -4.9454e-10,\n 5.6052e-45, -2.1463e-04, 5.6052e-45, 8.2809e-04, 3.2103e-16,\n 7.3538e-05, 5.6052e-45, 2.0477e-06, 5.1427e-27, 1.3080e-04,\n -1.1485e-06, 1.5549e-16, -3.6691e-04, 1.7712e-04, -1.2041e-04,\n -3.3719e-04, -4.9399e-22, 5.6052e-45, 3.4673e-04, 4.4995e-04,\n -7.1545e-05, 1.5384e-04, 1.7358e-04, -1.2248e-04, 4.7999e-05,\n 4.1299e-05, 7.5115e-07, -1.7030e-04, -9.2796e-05, 6.8892e-05,\n -1.1835e-03, -2.8181e-04, 1.1863e-04, 1.4258e-33, 1.2956e-32,\n 5.6052e-45, -8.1853e-04, -2.0531e-04, -3.9707e-10, 7.2812e-10,\n -1.9252e-04, -4.5288e-04, 2.9232e-04, -4.5380e-04, -1.8649e-04,\n -1.7415e-04, -3.9736e-04, 8.5544e-04, 1.5977e-04, 5.6052e-45,\n 1.0916e-09, 2.0393e-04, -2.6196e-04, -1.6734e-04, -6.9888e-04,\n -1.5094e-07, -1.4927e-04, -4.3640e-04, 7.9703e-16, 3.7150e-11,\n 3.1619e-05, 9.1752e-36, 9.4894e-05, -7.7122e-05, -7.4456e-05,\n -4.7453e-04, 2.1760e-04, -6.6162e-17, 4.2643e-04, 1.6761e-04,\n 3.2113e-07, -9.2353e-04, -2.2324e-04, -4.9814e-05, -1.2032e-06,\n 5.1401e-11, 5.6052e-45, 3.1504e-04, 3.6809e-04, 5.6052e-45,\n -9.6823e-05, -1.7097e-04, -2.7672e-05, 2.0413e-04, 5.6052e-45,\n -6.7278e-04, 8.5375e-04, 5.6052e-45, -2.5825e-04, -7.9492e-04,\n 2.8845e-15, 6.3364e-31, 1.1674e-04, -2.8837e-04, 6.1486e-05,\n 3.6381e-04, 9.9847e-05, 1.2208e-04, 2.2044e-21, 5.6052e-45,\n 8.9531e-05, 1.2577e-04, -1.1164e-04, -5.1391e-04, 5.1978e-05,\n 7.7511e-04, 5.6052e-45, 4.0989e-05, 5.6052e-45, 2.4154e-04,\n 5.6052e-45, 2.6517e-04, 2.6230e-04, -1.6418e-04, 4.0567e-04,\n 1.0574e-14, -5.9253e-05, 1.0241e-04, -7.9978e-05, 8.9149e-27,\n -2.4600e-04, -4.8269e-06, -3.3168e-04, -1.6313e-04, 1.2319e-03,\n -8.4572e-05, 1.8478e-04, 2.0782e-09, -2.8268e-06, -7.9179e-05,\n 5.0319e-10, -1.1923e-04, 3.9236e-44, 4.0023e-05, 3.0151e-04,\n -1.2087e-04, 2.6693e-05, -1.1285e-04, 5.6052e-45, 2.9637e-04,\n 2.1271e-04, 2.8520e-04, 2.4720e-41, 5.1247e-14, 3.3199e-04,\n -1.7947e-06, 5.2672e-04, -4.8191e-04, -1.7399e-04, -6.5861e-43,\n -1.9457e-04, -6.4591e-04, 3.3081e-09, 5.6052e-45, 4.1406e-20,\n 8.5171e-10, 5.6052e-45, 1.5754e-04, -4.1803e-06, -4.1639e-04,\n -8.5921e-05, 5.6052e-45, 5.1273e-04, -1.0320e-05, -1.7667e-04,\n 5.6052e-45, 5.6052e-45, -7.7146e-04, 4.0002e-38, -2.0809e-04,\n -1.3197e-04, 8.0053e-05, 3.8074e-20, -4.5425e-04, 2.1859e-04,\n 8.1467e-32, 2.7410e-04, -6.8712e-05, 6.9257e-05, 6.5898e-04,\n 3.3839e-04, -2.5711e-04, 1.1826e-03, 2.3023e-04, 7.7894e-40,\n -1.4262e-04, -6.9575e-05, 1.1507e-07, 5.6052e-45, 5.6052e-45,\n 4.4987e-05, -4.5090e-05, -3.4941e-05, 2.7201e-05, -6.0723e-05,\n 1.0621e-04, 3.0405e-05, 5.6052e-45, -6.2574e-04, 3.9199e-06,\n 1.2306e-05, -2.7718e-04, 2.3346e-17, 5.6905e-39, 4.9593e-34,\n -7.6822e-04, 8.4728e-14, 1.6328e-08, 2.9529e-04, -7.6453e-07,\n 3.7565e-04, 2.0243e-04, 1.8215e-34, 1.6978e-04, -1.9418e-05,\n 3.1847e-20, 1.0820e-04, 4.8579e-04, 7.1742e-08, 5.6052e-45,\n 2.5511e-04, 5.7119e-20, 6.4309e-05, -1.5516e-04, -2.0177e-05,\n 7.1613e-09, 5.6052e-45, 2.5350e-13, 5.8009e-29, 2.4599e-04,\n 2.4395e-04, -3.7157e-04, -1.9739e-04, -1.3765e-04, 5.6052e-45,\n 2.7911e-04, 5.6052e-45, 2.4672e-04, -4.9174e-04, -6.8502e-05,\n -8.3649e-05, 1.5599e-05, 5.6052e-45, -1.6585e-05, 4.0139e-05,\n 2.9731e-04, 8.4497e-08, 2.5546e-07, 2.8841e-35, 5.6052e-45,\n 8.6095e-05, 3.6328e-04, 2.5533e-04, 1.3146e-03, 1.7070e-04,\n 3.8743e-04, 5.6052e-45, -4.7014e-04, 4.5412e-05, -3.2610e-04,\n -3.0897e-04, 5.6052e-45, -4.7544e-05, 2.2350e-04, 1.6483e-08,\n 1.3765e-04, 5.6052e-45, 3.6315e-05, 4.5507e-05, -1.0489e-03,\n 3.7407e-04, -5.4334e-04, -2.2857e-03, 1.0393e-33, 5.6052e-45,\n 7.3345e-33, 1.5414e-04, 5.6052e-45, 5.6052e-45, 5.6052e-45,\n -6.5093e-04, -1.4926e-04, -3.1952e-04, 1.7657e-07, 7.7445e-04,\n 5.6052e-45, -4.8834e-04, -9.2296e-07, -6.0505e-04, 5.6052e-45,\n 5.6052e-45, -3.2284e-04, 5.6052e-45, 5.6052e-45, 4.2095e-42,\n -3.9422e-04, -1.3901e-04, 1.1123e-04, 8.2342e-15, 5.6052e-45,\n 5.9790e-04, 1.1872e-04, -5.3718e-04, 3.5846e-04, 7.2883e-04,\n -1.4106e-04, 2.9866e-08, 4.4480e-04, 5.5912e-43, 1.8141e-07,\n 4.0878e-10, -2.1845e-04, 5.6052e-45, -4.4449e-04, 5.6052e-45,\n -2.7358e-04, 5.6782e-05, 5.2037e-05, -7.2313e-05, -6.5192e-05,\n 2.0171e-04, 5.6052e-45, 5.6052e-45, 4.2101e-04, 5.6052e-45,\n 2.6803e-37, -2.0666e-07, -1.4383e-04, 3.7621e-18, 4.3796e-04,\n 4.4754e-04, 3.2286e-04, -1.9190e-04, -4.2962e-04, -1.3110e-05,\n 3.3386e-04, -4.6300e-04, -5.3814e-04, 7.3730e-05, -7.4109e-04,\n -8.2087e-05, 5.6052e-45, -6.3055e-04, 2.7288e-04, 8.9807e-05,\n 5.6052e-45, -1.4269e-04, 5.5829e-05, -1.4574e-04, -1.1367e-04,\n 2.8679e-14, -1.1732e-03, 1.3771e-04, 5.4366e-07, -2.0518e-04,\n 1.0191e-06, -3.7106e-04, -1.7129e-04, 5.6052e-45, 2.0274e-04,\n -1.7718e-04, -5.9050e-05, -1.4819e-04, -3.4906e-04, 1.1461e-40,\n 1.6469e-08, -8.1696e-05, 1.2102e-04, 2.7143e-21, -9.1091e-07,\n 6.4320e-04, -6.5085e-05, -3.0696e-04, -6.2679e-06, 1.4956e-05,\n 1.4310e-04, 1.1640e-09, 1.1597e-03, -5.7752e-04, 2.4327e-05,\n -4.4174e-04, -2.4569e-04, 5.3230e-04, -3.9954e-05, 5.6052e-45,\n 8.2504e-20, -1.0823e-04, 6.2652e-12, -2.6155e-05, -6.7134e-04,\n 7.0425e-04, -5.0158e-04, 5.9339e-04, -2.0269e-04, 7.5749e-04,\n 5.6052e-45, -3.2619e-06, -1.5872e-03, 8.0820e-04, 1.2370e-06,\n 3.6122e-04, 3.1083e-04, 2.7292e-04, 4.5809e-04, -8.2813e-05,\n 5.6052e-45, 3.0311e-05, -7.7129e-05, 5.6052e-45, 2.3292e-04,\n 5.6052e-45, -3.7187e-05, 2.1344e-26, -1.0217e-04, -9.4743e-07,\n 4.2678e-04, 4.1857e-05, 5.6052e-45, -2.1576e-04, 5.6052e-45,\n 2.1321e-05, -7.5512e-06, -7.2515e-04, 5.6052e-45, -2.2833e-04,\n -3.6974e-04, 1.6655e-04, 8.4603e-08, -2.6396e-05, 7.9812e-05,\n 1.2428e-04, 3.3136e-09, 5.1999e-09, -6.2667e-05, 5.6052e-45,\n -1.8404e-04, 4.1423e-04, 6.9310e-04, -2.5808e-04, -8.0821e-06,\n -3.8919e-06, 5.6052e-45, 8.7584e-05, -4.2317e-04, 1.2604e-05,\n 2.9426e-04, 2.5232e-05, -1.3666e-04, 1.4815e-04, -7.9855e-07,\n 4.9999e-05, 8.5039e-05, 2.2255e-04, -1.1264e-09, 2.5471e-04,\n 3.6019e-04, -3.6965e-04, 1.1358e-13, -2.3170e-04, 3.6616e-04,\n -1.5764e-04, 5.9709e-05, 1.8939e-07, 5.6052e-45, 7.6144e-05,\n 5.6052e-45, 5.0188e-10, 1.9223e-32, -4.5194e-04, -3.0563e-04,\n 1.1113e-04, -2.1723e-04, -1.3396e-04, -1.2334e-03, 6.4252e-06,\n -9.6372e-04, 5.6052e-45, 4.8890e-05, -1.7205e-04, 5.6052e-45,\n 5.6052e-45, 3.5136e-35, 5.6052e-45, 5.6052e-45, 1.1885e-04,\n 2.4666e-07, 5.6052e-45, -8.8639e-05, 5.9116e-04, -9.4945e-05,\n 3.9502e-05, 5.6052e-45, -4.1640e-04, 5.7558e-41, 5.6052e-45,\n -1.5666e-04, 5.6052e-45, -2.7820e-04, -4.2402e-04, 2.9701e-04,\n 3.1877e-04, -4.6690e-06, 6.6976e-04, 3.4616e-04, 6.1442e-05,\n -3.5794e-04, -2.8278e-04, -1.7150e-04, 4.4884e-06, 4.4483e-12,\n -4.4531e-04, 2.3326e-24, -2.4075e-04, 5.6052e-45, 5.1110e-05,\n 7.1042e-04, 7.8490e-05, 5.6052e-45, -5.8747e-06, 1.2398e-08,\n -4.9089e-04, 5.6052e-45, -2.5268e-04, -4.3913e-04, -1.7341e-04,\n 5.1760e-04, -7.4397e-04, 5.6052e-45, 5.6052e-45, 5.6052e-45,\n 2.3848e-04, 1.5510e-04, 2.1766e-04, 5.6052e-45, 3.8660e-04,\n 5.6052e-45, 2.2806e-05, -9.8839e-07, -5.6887e-05, 2.4856e-04,\n 2.9393e-12, 5.0904e-22, 5.6052e-45, 5.4609e-07, 4.5710e-42,\n -1.9395e-04, 8.4836e-05, 4.8425e-04, 1.8691e-11, 6.2520e-07,\n 9.4244e-04, 1.1704e-04, -2.5014e-04, -1.5512e-04, 2.8406e-04,\n -4.1554e-04, 5.6052e-45, -8.8677e-05, -1.2047e-04, 5.6052e-45,\n -4.8120e-05, -2.2179e-05, 2.0070e-32, -2.5375e-04, -2.8027e-04,\n 5.6052e-45, -3.6313e-04, 2.3223e-04, -7.2957e-05, 1.8224e-04,\n 5.6052e-45, -2.6673e-05, -1.8215e-04, 2.1180e-04, 9.9072e-14,\n 1.6484e-11, -2.4268e-04, -3.0438e-04, -3.6011e-04, 4.3778e-04,\n 2.8486e-12, 2.1854e-04, 5.6052e-45, -2.3703e-05, 4.5993e-34,\n -1.3364e-06, -2.7262e-04, 1.8741e-04, -2.1678e-04, 4.0780e-07,\n -2.8199e-04, 4.9196e-05, 3.1032e-06, 1.8501e-04, 5.6052e-45,\n 1.4732e-05, 1.3301e-04, 5.6052e-45, -2.0621e-04, 2.1345e-41,\n -2.1755e-06, 3.1857e-28, 8.7392e-10, -1.9154e-04, -2.5642e-04,\n 2.8721e-04, 2.8977e-30, 8.9714e-05, 6.4323e-04, -4.2397e-05,\n 2.6927e-06, 9.8263e-05, 2.4579e-04, 5.6052e-45, 5.6052e-45,\n 5.6052e-45, 7.2791e-07, 1.1419e-04], device='cuda:0')",
23
+ "exp_avg_sq": "tensor([2.7635e-06, 8.2423e-07, 2.6001e-06, 4.4758e-07, 7.6642e-06, 7.6808e-06,\n 1.1055e-05, 2.5434e-05, 6.7623e-06, 7.3278e-06, 4.8224e-06, 4.2421e-06,\n 1.0958e-06, 9.1319e-06, 2.0342e-06, 2.3354e-06, 1.6900e-05, 4.6893e-06,\n 5.8218e-07, 1.4690e-05, 9.6257e-08, 1.3343e-06, 7.5355e-06, 2.7443e-06,\n 6.3642e-06, 1.4530e-06, 2.0400e-06, 1.7442e-08, 6.0682e-06, 6.2240e-06,\n 5.3140e-07, 2.0466e-06, 3.6801e-06, 1.6826e-05, 2.3466e-06, 6.1230e-09,\n 9.3673e-06, 8.8893e-06, 2.5041e-06, 5.5933e-06, 2.0168e-05, 9.0763e-07,\n 4.4732e-06, 2.6477e-06, 7.5364e-06, 7.7119e-06, 1.1337e-06, 1.1949e-06,\n 3.2596e-05, 2.2453e-06, 1.4961e-05, 9.7974e-05, 3.9626e-06, 2.9001e-06,\n 1.2551e-05, 8.7083e-06, 2.0797e-05, 1.1476e-07, 4.6326e-06, 3.2638e-06,\n 2.9113e-08, 3.0116e-06, 8.1881e-06, 4.6217e-06, 1.2633e-10, 3.1499e-06,\n 4.4544e-06, 1.5556e-05, 8.1254e-06, 1.9342e-06, 2.4515e-06, 6.8063e-06,\n 3.9216e-07, 2.4367e-06, 1.5499e-06, 1.0611e-06, 4.7240e-08, 2.1201e-06,\n 1.9380e-07, 2.6816e-07, 1.9720e-05, 1.0707e-06, 9.3989e-06, 1.3042e-07,\n 3.8750e-05, 9.6063e-07, 4.5605e-06, 8.8143e-06, 8.8979e-07, 1.1859e-05,\n 2.0681e-06, 3.8866e-06, 3.3987e-08, 3.3756e-06, 2.6734e-08, 1.1815e-05,\n 1.4255e-05, 5.6772e-05, 9.0597e-06, 4.9357e-06, 8.6550e-06, 5.7778e-06,\n 2.9124e-05, 3.7177e-05, 3.3967e-06, 5.5560e-06, 1.2809e-06, 2.3054e-06,\n 2.5995e-06, 3.2284e-08, 1.7538e-06, 1.8689e-05, 4.4649e-06, 6.5428e-06,\n 1.0186e-05, 9.1332e-06, 1.8178e-06, 1.1373e-07, 6.3444e-06, 3.5708e-06,\n 7.9360e-06, 1.2610e-05, 5.6133e-06, 8.9479e-06, 2.5459e-06, 3.2453e-06,\n 1.4225e-05, 2.8527e-07, 4.3806e-06, 3.9827e-05, 4.9039e-06, 6.4620e-06,\n 3.9087e-07, 2.3398e-06, 4.1882e-06, 5.1322e-07, 1.5762e-09, 1.0374e-05,\n 1.2307e-06, 6.4191e-06, 3.9408e-06, 2.1664e-06, 7.1447e-07, 6.1204e-10,\n 8.3959e-09, 1.1168e-05, 4.2433e-06, 4.9932e-06, 3.0005e-05, 2.6369e-07,\n 5.3896e-08, 9.8654e-07, 6.6309e-07, 4.6892e-07, 2.5723e-08, 4.9584e-06,\n 9.6611e-06, 9.1801e-06, 1.2126e-05, 1.4420e-05, 3.4475e-09, 4.4199e-06,\n 2.1153e-06, 1.9039e-06, 5.8109e-06, 3.1363e-06, 4.7447e-06, 1.5787e-11,\n 1.8691e-06, 5.0461e-07, 1.2875e-05, 1.1117e-05, 1.6662e-06, 2.0908e-06,\n 4.5878e-06, 1.3043e-06, 1.5576e-09, 2.4455e-06, 8.6583e-06, 2.6111e-05,\n 9.1380e-06, 9.5527e-06, 3.1162e-06, 3.6288e-10, 6.6277e-10, 3.8118e-16,\n 5.4426e-06, 1.1652e-06, 2.3855e-07, 1.5424e-08, 3.1613e-06, 3.1236e-07,\n 4.6236e-06, 1.3960e-05, 7.5890e-06, 2.5207e-06, 1.9452e-06, 6.8358e-06,\n 3.8253e-07, 1.0103e-16, 1.1990e-05, 2.1094e-06, 4.7269e-06, 6.8602e-06,\n 3.3418e-06, 8.4926e-07, 7.9136e-06, 6.4455e-06, 4.1708e-06, 7.5726e-08,\n 4.6451e-06, 1.0624e-07, 2.3946e-06, 8.1357e-06, 4.7993e-06, 1.0426e-06,\n 3.2290e-06, 1.5974e-06, 5.7175e-06, 1.7559e-06, 3.6356e-06, 5.8189e-06,\n 2.4541e-06, 9.9111e-07, 1.7420e-05, 1.4958e-05, 3.3310e-05, 3.7194e-06,\n 4.2554e-06, 2.9765e-07, 3.0352e-06, 4.2935e-06, 3.9751e-06, 1.3449e-06,\n 9.4652e-06, 9.3510e-07, 1.3593e-05, 1.7949e-09, 2.0589e-06, 2.9155e-06,\n 6.1750e-06, 4.9236e-06, 5.0906e-06, 2.3622e-06, 9.3690e-07, 1.6861e-06,\n 6.7642e-07, 9.8416e-06, 8.2588e-07, 6.2805e-06, 2.7127e-05, 3.5601e-06,\n 1.0432e-05, 1.1015e-05, 1.6681e-06, 5.2195e-06, 1.9196e-09, 3.0939e-06,\n 1.4243e-14, 2.2847e-05, 1.1307e-14, 4.9401e-06, 2.7682e-06, 5.1914e-06,\n 2.4829e-05, 1.2108e-05, 5.0223e-07, 3.2724e-06, 1.5393e-05, 2.2256e-05,\n 7.1956e-06, 7.9809e-07, 2.3644e-06, 8.9256e-06, 5.7172e-06, 1.7009e-06,\n 7.3657e-06, 9.7895e-09, 1.7859e-08, 1.5188e-05, 2.7915e-05, 1.2584e-05,\n 1.6261e-05, 5.1083e-06, 7.5614e-06, 2.6763e-07, 3.9161e-06, 2.2760e-06,\n 5.7604e-09, 3.3778e-05, 3.5035e-07, 1.2192e-05, 3.5018e-05, 1.5584e-07,\n 2.4436e-06, 3.4135e-05, 8.5208e-06, 2.6426e-05, 2.6068e-06, 5.2863e-08,\n 5.6054e-07, 3.0880e-05, 7.8967e-08, 3.8191e-17, 1.0476e-06, 2.2543e-08,\n 2.6412e-07, 6.6212e-07, 5.0764e-06, 1.1731e-05, 1.3041e-05, 1.4668e-09,\n 3.4768e-06, 2.4514e-07, 1.8413e-06, 3.2195e-09, 1.2458e-08, 5.0837e-05,\n 6.3851e-06, 9.5732e-07, 6.1195e-06, 1.4582e-07, 1.1189e-09, 3.9474e-06,\n 7.4354e-07, 1.1680e-05, 2.1765e-05, 2.3609e-06, 2.9188e-06, 1.8701e-06,\n 3.4824e-06, 6.6610e-07, 5.8816e-06, 6.9383e-07, 1.1291e-07, 2.3145e-05,\n 8.8313e-07, 1.8833e-06, 8.7727e-15, 1.4838e-08, 1.4422e-05, 5.7285e-06,\n 3.7528e-05, 1.8159e-06, 1.0544e-05, 2.5835e-06, 3.9738e-06, 8.8034e-05,\n 1.2251e-06, 9.4887e-06, 6.0755e-06, 4.8507e-06, 5.3185e-07, 2.3883e-06,\n 2.6655e-06, 4.2074e-06, 2.0790e-08, 2.5173e-06, 6.3141e-07, 5.0400e-05,\n 4.6013e-06, 3.0301e-06, 9.9046e-06, 1.2544e-05, 2.0839e-06, 3.2442e-06,\n 3.4710e-07, 6.3130e-06, 3.2889e-08, 1.5440e-08, 3.2169e-06, 5.0759e-06,\n 3.4324e-07, 1.3033e-06, 1.6576e-06, 2.2029e-05, 1.7243e-06, 1.0396e-10,\n 4.7026e-06, 8.7802e-07, 3.5323e-06, 5.2635e-06, 1.5909e-06, 2.8940e-06,\n 9.8276e-06, 5.8029e-07, 2.5229e-08, 1.5997e-06, 1.1792e-05, 1.7611e-06,\n 1.0263e-05, 3.0424e-06, 6.7804e-09, 6.1549e-08, 4.7294e-06, 8.4267e-06,\n 1.8893e-07, 4.1132e-06, 3.3799e-05, 4.3778e-06, 1.8254e-05, 6.7081e-07,\n 4.1423e-06, 8.4735e-06, 3.6044e-06, 1.6995e-06, 2.8538e-05, 8.8125e-06,\n 6.0234e-06, 5.7969e-06, 1.1630e-05, 6.0837e-11, 1.0943e-05, 3.3285e-06,\n 3.7586e-07, 1.3991e-06, 5.7702e-09, 4.1101e-06, 2.6616e-07, 1.0576e-06,\n 1.0275e-05, 5.5071e-06, 3.7250e-06, 4.0906e-09, 2.6992e-16, 3.0799e-09,\n 8.3534e-06, 2.2700e-06, 6.2404e-09, 1.3051e-08, 3.3644e-06, 1.7666e-06,\n 1.2167e-05, 4.3525e-06, 9.1940e-06, 1.4465e-06, 2.3755e-06, 7.0184e-10,\n 3.9014e-06, 3.4029e-08, 5.1870e-06, 2.7011e-06, 5.4022e-09, 4.1265e-08,\n 1.9683e-06, 3.4872e-06, 2.1086e-06, 1.7690e-06, 3.3838e-09, 7.2447e-07,\n 8.4324e-07, 3.2213e-06, 5.0629e-06, 2.9049e-06, 3.3831e-06, 1.1949e-05,\n 2.2543e-06, 5.6718e-06, 1.2789e-06, 8.2205e-07, 2.9680e-09, 1.5477e-05,\n 3.1158e-10, 2.3947e-06, 2.6832e-06, 2.4993e-06, 6.5105e-08, 1.0203e-06,\n 1.0962e-05, 7.7665e-08, 2.7368e-06, 1.2613e-07, 7.8532e-08, 2.0080e-06,\n 1.1522e-07, 5.6014e-09, 8.0050e-07, 1.1106e-07, 2.8275e-05, 5.3317e-06,\n 5.7615e-06, 6.8117e-06, 2.9477e-06, 9.4296e-06, 1.1397e-06, 4.0063e-06,\n 7.8655e-06, 1.0989e-05, 1.9478e-06, 2.6493e-06, 7.9995e-06, 8.3976e-09,\n 7.2869e-06, 1.0398e-05, 1.3317e-06, 1.3967e-05, 3.6518e-06, 1.1920e-05,\n 2.6141e-06, 5.3034e-06, 6.7520e-05, 4.4231e-06, 2.4173e-06, 1.0679e-08,\n 6.1482e-06, 7.5624e-06, 1.3259e-06, 3.4549e-06, 3.4735e-07, 8.2579e-06,\n 8.2085e-06, 2.9985e-06, 1.1818e-06, 1.1183e-05, 4.1715e-07, 3.6036e-06,\n 1.3245e-06, 8.5177e-07, 9.3521e-06, 4.5151e-06, 5.3930e-06, 8.7343e-08,\n 4.0790e-06, 2.6213e-06, 9.7652e-07, 4.8756e-07, 2.6712e-10, 4.2550e-06,\n 1.8962e-06, 1.0766e-06, 6.6679e-06, 1.0320e-05, 4.3428e-06, 8.1872e-06,\n 1.5235e-06, 1.0617e-06, 1.0776e-05, 3.1228e-05, 9.0577e-06, 1.7002e-06,\n 4.6403e-06, 1.2928e-06, 7.4892e-06, 6.5739e-06, 3.5542e-05, 1.1237e-07,\n 4.4597e-06, 2.1408e-06, 2.8802e-06, 4.9050e-05, 1.5864e-05, 1.5140e-06,\n 8.1816e-06, 5.7483e-06, 9.7043e-08, 7.0867e-05, 7.0706e-07, 5.8030e-06,\n 7.7502e-07, 6.7973e-06, 1.8975e-09, 2.1978e-05, 9.3858e-07, 2.3881e-06,\n 9.1155e-06, 9.9408e-07, 7.4750e-07, 4.4526e-08, 1.4871e-05, 2.1717e-06,\n 6.4667e-07, 1.7443e-09, 2.2929e-06, 1.8590e-06, 8.9147e-06, 2.0009e-05,\n 3.1006e-06, 8.8249e-09, 5.3805e-06, 3.0253e-06, 6.6780e-06, 5.6370e-09,\n 6.8988e-09, 5.4272e-06, 5.5881e-13, 6.4459e-06, 2.3978e-06, 5.0918e-06,\n 1.1587e-06, 9.8417e-06, 4.2385e-07, 8.7130e-10, 7.4782e-06, 9.0731e-06,\n 5.5543e-06, 2.4838e-06, 2.9560e-06, 5.5438e-07, 2.3324e-06, 1.0982e-05,\n 1.6531e-07, 8.5394e-06, 5.4014e-06, 1.2213e-06, 2.9334e-07, 8.3539e-06,\n 8.8837e-07, 2.1152e-08, 5.0797e-06, 1.0892e-06, 4.8637e-06, 1.3747e-07,\n 5.6260e-06, 1.5568e-05, 8.6679e-06, 3.9408e-09, 5.3034e-06, 4.5725e-06,\n 8.9083e-07, 5.9902e-06, 4.1320e-06, 3.1970e-06, 1.1695e-05, 6.4857e-06,\n 1.6124e-05, 3.9665e-06, 3.9097e-10, 5.8513e-06, 1.1892e-06, 1.3367e-06,\n 3.4750e-06, 1.4724e-06, 1.0265e-07, 3.1993e-09, 9.2003e-07, 2.5418e-05,\n 1.2111e-11, 4.3551e-06, 2.3199e-06, 1.7161e-06, 1.1696e-05, 1.2982e-09,\n 6.2876e-06, 3.3889e-05, 7.6548e-10, 3.4753e-06, 7.3415e-06, 8.5450e-07,\n 1.4555e-05, 1.2171e-06, 4.1200e-06, 7.9647e-06, 1.7999e-06, 3.8644e-06,\n 1.7869e-06, 1.4648e-06, 7.8012e-06, 1.1652e-06, 2.0371e-05, 2.9475e-07,\n 1.0262e-05, 2.9415e-05, 6.5699e-06, 3.5011e-05, 2.5001e-06, 2.0804e-05,\n 7.1644e-06, 1.4837e-09, 1.6807e-05, 4.6603e-07, 3.1761e-06, 1.1410e-10,\n 1.0977e-06, 7.3931e-07, 3.4925e-06, 4.4718e-07, 5.3529e-06, 5.7546e-07,\n 5.1306e-06, 1.2285e-08, 4.3652e-06, 6.3057e-06, 5.8609e-06, 2.9062e-05,\n 2.5618e-06, 5.3666e-06, 5.8160e-06, 5.1699e-08, 2.8844e-06, 1.5069e-05,\n 4.6277e-08, 1.6703e-09, 4.4050e-05, 3.2656e-08, 2.6022e-07, 2.2618e-06,\n 9.3212e-06, 5.5249e-06, 3.4869e-09, 1.1305e-05, 3.4726e-06, 1.2189e-06,\n 4.2793e-06, 5.6784e-06, 6.4796e-06, 4.4786e-06, 2.7759e-08, 4.1061e-06,\n 3.9746e-07, 2.1879e-10, 3.0849e-06, 9.8819e-07, 3.0723e-06, 1.1628e-05,\n 6.6023e-06, 3.6294e-07, 2.1752e-06, 9.0967e-07, 2.4828e-07, 8.9622e-06,\n 1.9525e-05, 1.0774e-05, 3.4450e-06, 2.9301e-06, 2.9697e-05, 1.0362e-08,\n 3.0917e-06, 8.2352e-06, 2.4926e-06, 1.2623e-05, 2.6111e-06, 2.9703e-05,\n 2.2415e-10, 1.3668e-06, 2.6213e-05, 1.1685e-06, 9.2140e-06, 4.2463e-07,\n 1.0327e-06, 8.9171e-08, 3.5471e-06, 1.3164e-05, 5.4360e-05, 4.7926e-06,\n 1.0364e-06, 2.0245e-07, 2.1811e-05, 1.7465e-05, 6.4295e-06, 5.2477e-05,\n 2.7913e-06, 2.3232e-08, 2.1540e-06, 1.8578e-06, 6.2524e-07, 5.7028e-06,\n 4.1694e-07, 3.4700e-06, 1.4467e-06, 2.0266e-06, 4.4553e-06, 3.1180e-07,\n 8.8490e-06, 2.3461e-05, 2.7787e-08, 4.2001e-15, 1.8561e-05, 1.4299e-07],\n device='cuda:0')"
24
  },
25
  "4": {
26
  "step": "tensor(1252.)",
27
+ "exp_avg": "tensor([[ 6.2476e-06, 1.5620e-24, 5.6052e-45, ..., 5.6052e-45,\n -1.0678e-08, 3.5135e-07],\n [ 2.0481e-05, 2.4674e-23, -5.6052e-45, ..., -5.6052e-45,\n 1.1884e-09, -1.4128e-06],\n [ 9.2974e-06, 4.8254e-24, -5.6052e-45, ..., -5.6052e-45,\n -2.5342e-08, 8.8364e-07],\n ...,\n [ 3.9494e-05, 1.0036e-23, -5.6052e-45, ..., -5.6052e-45,\n 7.4303e-09, 1.3260e-05],\n [-3.1277e-05, -1.7812e-23, 5.6052e-45, ..., -5.6052e-45,\n 1.6134e-08, 3.6615e-06],\n [-3.0890e-05, -6.1184e-24, 5.6052e-45, ..., -5.6052e-45,\n -1.5985e-08, -2.5147e-06]], device='cuda:0')",
28
+ "exp_avg_sq": "tensor([[1.9864e-08, 1.0276e-11, 2.3055e-09, ..., 1.1772e-17, 1.8261e-08,\n 2.0070e-10],\n [2.7359e-08, 1.8948e-10, 5.7807e-10, ..., 6.0166e-16, 2.3274e-09,\n 3.5971e-10],\n [4.3654e-08, 1.1519e-12, 1.5706e-10, ..., 2.6240e-16, 6.9820e-11,\n 3.4333e-10],\n ...,\n [3.9805e-08, 1.8755e-10, 4.6976e-11, ..., 2.2957e-16, 1.6913e-09,\n 3.4654e-10],\n [5.4508e-08, 1.5719e-11, 2.1832e-09, ..., 3.4213e-18, 4.7717e-09,\n 1.0817e-09],\n [3.9547e-08, 2.4142e-11, 1.7476e-09, ..., 2.1926e-16, 1.0526e-08,\n 8.0925e-10]], device='cuda:0')"
29
  }
30
  },
31
  "param_groups": [
 
223
  ]
224
  },
225
  "metrics": {
226
+ "best_val_acc": 79.318,
227
  "best_epoch": 0,
228
  "scale_accuracies": {
229
+ "384": 79.318
230
  }
231
  },
232
  "train_config": {
233
  "name": "david_training",
234
+ "run_id": "20251012_041353",
235
  "dataset_name": "AbstractPhil/imagenet-clip-features-orderly",
236
  "model_variant": "clip_vit_l14",
237
  "num_classes": 1000,
weights/train_config.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
  "name": "david_training",
3
- "run_id": "20251012_040642",
4
  "dataset_name": "AbstractPhil/imagenet-clip-features-orderly",
5
  "model_variant": "clip_vit_l14",
6
  "num_classes": 1000,
 
1
  {
2
  "name": "david_training",
3
+ "run_id": "20251012_041353",
4
  "dataset_name": "AbstractPhil/imagenet-clip-features-orderly",
5
  "model_variant": "clip_vit_l14",
6
  "num_classes": 1000,