AbstractPhil commited on
Commit
9d650e1
·
verified ·
1 Parent(s): ef806e7

Upload weights and configs - Run 20251012_032356

Browse files
weights/best_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6ecf5e86fd5b2ddb68e090d5f70544f98d7a52e2e21a58950633ab7170563619
3
  size 59515088
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:44284136131c7abd3beeed57400f92b000b3208e86947fc46472887cea412e75
3
  size 59515088
weights/best_model_metadata.json CHANGED
@@ -4,18 +4,18 @@
4
  "state": {
5
  "0": {
6
  "step": "tensor(1252.)",
7
- "exp_avg": "tensor([[ 9.9808e-05, -2.3590e-04, 4.8703e-05, ..., -6.7867e-06,\n 1.5045e-04, -6.9639e-06],\n [-3.2055e-05, -2.8797e-04, 6.0306e-05, ..., 9.5280e-06,\n 2.2100e-06, 3.8027e-06],\n [ 5.6052e-45, -5.6052e-45, -5.6052e-45, ..., 5.6052e-45,\n 5.6052e-45, 5.6052e-45],\n ...,\n [ 1.2700e-04, -2.9514e-05, 2.9405e-05, ..., 3.5731e-05,\n 2.1884e-06, -6.4312e-05],\n [ 2.5446e-04, -2.6147e-04, 2.8969e-05, ..., 8.7159e-05,\n 5.2191e-05, 1.4825e-04],\n [ 2.1196e-05, 7.8471e-06, -4.5547e-05, ..., 5.2981e-06,\n -1.3684e-04, -7.5568e-05]], device='cuda:0')",
8
- "exp_avg_sq": "tensor([[5.4091e-07, 5.4144e-07, 4.9248e-08, ..., 4.1057e-08, 7.7326e-08,\n 5.4548e-08],\n [2.1701e-07, 3.3507e-07, 5.9846e-08, ..., 6.8188e-08, 6.9439e-08,\n 7.7029e-08],\n [2.3653e-09, 4.7337e-10, 1.4479e-10, ..., 2.1699e-10, 5.2052e-10,\n 4.1789e-10],\n ...,\n [4.9622e-07, 6.7429e-07, 5.9319e-08, ..., 7.7861e-08, 6.7676e-08,\n 4.2370e-08],\n [1.8010e-07, 3.5606e-07, 3.6999e-08, ..., 5.1092e-08, 7.0665e-08,\n 4.0146e-08],\n [1.0317e-07, 2.4285e-07, 4.6463e-08, ..., 5.2589e-08, 4.8899e-08,\n 4.3048e-08]], device='cuda:0')"
9
  },
10
  "1": {
11
  "step": "tensor(1252.)",
12
- "exp_avg": "tensor([ 2.9097e-03, 1.3327e-03, 5.6052e-45, -6.0815e-04, -4.8489e-07,\n 5.6052e-45, 4.5090e-04, -3.5691e-03, 1.6202e-03, -8.7439e-15,\n 4.4855e-04, 1.3435e-04, 2.7017e-03, 2.9764e-04, -2.6219e-03,\n 5.6216e-05, 1.3226e-03, -3.9642e-03, 8.1591e-04, -8.6576e-04,\n 2.2454e-04, 1.0421e-04, -2.1005e-03, 6.4988e-24, 5.7679e-04,\n 2.7692e-04, -9.5206e-04, -5.5439e-03, -5.3738e-03, 2.8346e-04,\n 1.7878e-03, 5.6052e-45, 1.0163e-03, -2.8758e-04, -1.0929e-03,\n 6.1516e-36, -6.6696e-03, 1.2855e-03, 1.6802e-03, -2.5499e-04,\n 8.3145e-04, -7.6461e-04, 1.0018e-03, -8.2878e-04, -6.3370e-04,\n 6.4852e-03, -1.1970e-03, 4.4301e-23, -1.5002e-03, -1.3855e-03,\n -4.5024e-03, 7.1654e-04, -4.9084e-04, 1.6491e-03, 5.6052e-45,\n -3.0916e-03, 5.2380e-03, -4.4587e-04, 3.4016e-04, -2.3714e-03,\n 2.0890e-16, -3.2571e-03, 1.5128e-03, -4.8482e-04, 8.1386e-05,\n 1.5725e-03, 2.3494e-03, 5.0308e-04, 3.6531e-03, 3.8240e-21,\n 4.7257e-03, -5.3711e-04, 1.8309e-04, 1.5676e-12, 3.5145e-03,\n 9.8415e-03, 1.0916e-02, -6.8465e-04, 4.2006e-03, -6.7891e-03,\n -1.2097e-03, 5.6052e-45, 1.1576e-16, -2.7480e-04, -5.5370e-03,\n -7.5772e-04, -2.9113e-18, 4.3444e-03, 3.1825e-03, -3.6059e-04,\n -3.6649e-04, 3.3190e-03, -1.9954e-03, -8.0797e-03, 3.6348e-03,\n 4.6834e-03, 2.3070e-03, -2.8616e-03, -7.9862e-04, -5.0693e-03,\n 2.4830e-04, 3.3737e-03, 4.2926e-03, 3.6573e-03, -3.5065e-04,\n -5.6572e-04, 1.8134e-03, -6.3776e-04, 4.6051e-03, -2.8824e-03,\n -3.6993e-04, -9.8880e-04, 1.0007e-40, -9.8369e-04, -2.8130e-03,\n 1.4090e-03, -1.7435e-06, 7.0776e-04, 5.7418e-03, -2.8657e-05,\n 2.4314e-03, -2.0983e-03, 5.1883e-03, -2.1431e-38, 7.4072e-07,\n -1.2746e-03, -3.4858e-04, -4.6374e-04, -1.6977e-03, 5.6052e-45,\n 3.7000e-03, 1.5831e-03, -2.0776e-03, -3.7744e-11, -4.3330e-04,\n 1.4578e-03, 7.6183e-03, -3.3606e-03, -1.0650e-03, 4.3183e-03,\n 3.1241e-08, 1.4853e-03, 2.1910e-07, 1.8818e-03, -3.2697e-03,\n 5.9948e-04, -2.3068e-03, 4.1328e-03, 2.3744e-07, 1.1056e-03,\n -1.6506e-04, 5.6052e-45, 5.6052e-45, 5.9209e-04, -2.7072e-03,\n -5.1818e-03, 3.9953e-04, 2.1181e-03, 5.6052e-45, 7.1065e-04,\n 2.8993e-03, 1.0938e-04, 4.5471e-04, -3.0714e-03, -1.6887e-03,\n 4.9794e-04, 3.8360e-04, -2.8068e-06, -3.4753e-04, 6.1017e-03,\n 9.3058e-04, 1.6621e-23, 5.6052e-45, 1.0997e-03, 1.6329e-03,\n 5.6052e-45, -2.2469e-14, 1.2329e-04, 6.3936e-03, -1.4311e-03,\n 2.5462e-03, -6.5818e-04, 1.6421e-03, -4.6383e-03, 1.1713e-03,\n 4.1140e-04, -7.0093e-04, -2.9552e-03, -9.6662e-03, 2.7718e-03,\n -7.6885e-03, -1.9008e-03, 4.6894e-04, 1.5270e-03, -1.1454e-02,\n 3.9764e-03, 3.5573e-03, 3.9063e-04, -1.4086e-03, -9.4108e-05,\n -1.9810e-03, 9.3351e-04, -2.7475e-03, -2.0864e-03, 6.9651e-04,\n 3.6452e-03, -2.2449e-03, -5.8442e-04, 2.1306e-03, 5.8208e-03,\n 1.6991e-04, -2.1017e-03, 3.0419e-03, 1.8699e-03, -1.8809e-03,\n -1.2653e-03, -5.3299e-03, -1.6545e-03, -1.0058e-03, 1.5983e-03,\n -2.4800e-03, -8.4721e-03, 1.9065e-26, 4.7373e-04, 2.0919e-03,\n -2.9753e-03, -4.0522e-04, 2.5252e-03, -2.8403e-03, -1.4599e-03,\n 1.3485e-03, -1.0358e-03, 3.9361e-41, 1.5485e-39, -5.7891e-03,\n -5.8865e-04, 8.3625e-04, 6.9007e-05, 3.3757e-03, 2.4274e-04,\n -6.1542e-05, 3.0383e-03, 2.3547e-03, 4.9550e-03, -2.0679e-03,\n 2.9972e-14, -2.8711e-03, -3.2705e-03, -3.5964e-03, 1.7757e-03,\n 6.0012e-03, 4.5402e-27, 2.1096e-03, 7.6903e-04, -4.8270e-04,\n -6.9613e-04, 1.0011e-03, 9.6959e-05, -3.0302e-03, 4.3707e-03,\n -2.7226e-03, -4.3493e-04, -1.7738e-03, 2.8508e-04, 2.4977e-04,\n -3.0230e-03, -2.4574e-03, 2.2031e-03, -2.3219e-03, 1.1483e-04,\n 4.2586e-03, 3.5752e-03, 5.6052e-45, 5.5265e-03, -5.1519e-03,\n 1.0887e-03, 7.3665e-04, 2.1852e-03, -1.6445e-03, -7.3967e-05,\n -7.4355e-04, 7.6051e-04, 3.4523e-03, 1.0644e-03, -1.1934e-03,\n -1.8700e-04, 3.7302e-14, -2.1369e-03, 5.6052e-45, -1.7855e-03,\n -5.3899e-03, 5.6500e-03, -6.1412e-05, -2.9054e-03, -3.7659e-04,\n -1.8160e-04, 1.9969e-31, -5.3695e-04, -4.6615e-04, 2.3254e-38,\n 5.6052e-45, 5.4223e-03, 4.4807e-03, -1.3030e-03, -1.2695e-03,\n -1.2296e-03, -9.0901e-04, 2.3960e-03, 1.6224e-04, -1.0780e-03,\n 2.8688e-03, 2.3945e-03, 2.9703e-03, 3.5277e-03, -2.4392e-03,\n -1.7388e-03, 1.9980e-03, 2.0871e-03, 5.6052e-45, 3.7856e-04,\n 2.2651e-03, 1.7563e-03, 5.6052e-45, 2.0318e-03, 1.3920e-03,\n 6.9956e-03, 1.8756e-03, -5.5313e-04, 2.4667e-03, 8.8846e-04,\n 1.1469e-03, 2.3866e-03, -1.7824e-03, 7.7836e-04, -5.0318e-04,\n -9.9463e-04, 9.0413e-04, 5.4385e-07, 6.3684e-04, 1.0693e-03,\n -1.9220e-03, 3.1149e-03, -5.8925e-04, -2.1141e-03, 1.9296e-03,\n 5.6052e-45, -3.9401e-03, 1.2427e-03, 5.6052e-45, -6.7204e-04,\n -1.1268e-05, 5.9482e-04, 1.4091e-03, -3.0139e-03, 4.3913e-04,\n -2.7723e-03, -2.4720e-03, -4.9926e-04, -2.7104e-03, -5.6586e-04,\n 7.8348e-04, 5.6052e-45, 1.3427e-03, -4.7691e-03, 5.6052e-45,\n -2.0714e-03, -5.4685e-04, -1.1198e-07, -7.7871e-05, -4.1724e-03,\n -2.1828e-03, -6.9466e-04, -2.3864e-04, 2.6827e-03, -2.0941e-03,\n 1.8311e-03, 2.7079e-03, -4.4246e-03, 3.3094e-03, 1.8410e-03,\n -6.3030e-03, 3.4858e-03, -1.9636e-03, 5.6052e-45, 1.9304e-05,\n -4.1517e-21, 2.4526e-03, 4.8325e-03, -6.6209e-04, 9.4050e-04,\n 3.5215e-42, 4.5619e-03, -6.1602e-03, -2.5304e-03, -9.4652e-04,\n 7.0431e-04, -7.8636e-24, 3.5365e-03, 5.6052e-45, 5.6052e-45,\n 9.4229e-04, 2.1341e-03, -6.8848e-03, 2.8542e-03, -2.0011e-04,\n 6.2322e-04, 5.4069e-04, 2.1369e-03, -2.7031e-03, 6.2608e-04,\n -7.1263e-04, -5.2130e-03, -7.6677e-04, 5.3319e-03, -7.3731e-41,\n -8.2319e-04, -8.3675e-04, 9.1410e-04, 5.6052e-45, 5.3688e-03,\n 4.4872e-03, -3.9738e-03, 5.5525e-04, -2.6904e-03, -6.7565e-04,\n 1.5406e-03, -2.9458e-03, 3.1132e-03, 5.6203e-04, -1.3210e-03,\n -2.1013e-03, -8.1524e-04, -3.7536e-03, -2.9657e-03, -2.6874e-03,\n 1.5260e-03, -3.0026e-03, 1.4654e-08, -1.1917e-03, 1.6394e-03,\n 5.6052e-45, -1.9517e-10, -3.2261e-03, 1.5158e-04, 2.0841e-03,\n -1.8274e-16, 1.8457e-29, -1.1565e-03, 4.7800e-04, 3.4919e-08,\n 4.5683e-18, -3.7613e-27, 5.6052e-45, -1.4436e-03, -2.0606e-03,\n -5.2525e-04, -2.9899e-03, 3.4768e-04, 1.1600e-03, 2.7800e-03,\n 2.1888e-03, -4.4828e-07, -7.0891e-04, -9.2954e-05, 1.1944e-03,\n 1.1122e-04, -5.0771e-03, 1.2030e-03, -5.6601e-04, 2.6567e-03,\n -2.5926e-03, 2.5320e-03, -4.3434e-04, -9.2896e-04, 6.3431e-03,\n 8.5656e-04, 5.1081e-03, -2.3216e-03, -5.3759e-03, 3.3953e-03,\n 4.0417e-03, -3.0275e-03, -6.7968e-05, -2.8031e-03, -2.8511e-04,\n 3.4441e-03, 2.6827e-03, -2.8124e-03, -4.7469e-14, 5.0620e-03,\n -1.5232e-03, -1.7148e-03, -5.0032e-03, 3.2487e-03, -1.8802e-03,\n 6.7241e-04, 1.3107e-03, -8.0724e-03, 2.5132e-03, 5.6052e-45,\n -9.5002e-04, 2.7097e-03, 2.6700e-03, 2.4434e-03, -1.6090e-21,\n 6.0059e-03, -1.0610e-03, -4.8448e-03, 7.5928e-04, 5.6052e-45,\n 5.9775e-25, 2.2420e-05, 3.3517e-04, 3.1995e-03, 2.1595e-04,\n 2.6273e-04, 4.7507e-03, 2.2225e-03, -2.0668e-08, 3.3253e-04,\n 1.1676e-03, -1.4700e-03, -3.4555e-03, -5.6052e-45, -3.1489e-03,\n -3.4126e-03, 4.0212e-03, 4.2094e-03, -1.0276e-02, 3.6612e-03,\n 1.8664e-03, 1.1503e-03, 4.9484e-03, 8.5730e-04, -3.0980e-06,\n 4.3121e-03, 1.4095e-03, -8.8099e-11, -1.1596e-03, -2.9243e-03,\n -4.0902e-03, -2.4074e-03, -3.5444e-03, 1.1548e-18, -4.3250e-08,\n 1.1259e-03, 7.5497e-04, 1.6669e-03, -4.1334e-03, -8.5967e-04,\n 6.6669e-04, -6.8106e-08, 1.7873e-03, 6.9239e-04, -3.4414e-03,\n 3.3455e-03, -6.4815e-04, -4.4830e-04, 6.2729e-04, 3.1767e-03,\n -1.1806e-03, 5.6052e-45, -6.1646e-05, -1.5390e-08, -3.8129e-03,\n -5.5182e-04, 4.8020e-03, 3.0543e-03, 2.6255e-04, -7.5502e-03,\n -3.9313e-03, -7.1502e-03, 4.7074e-03, 3.0065e-03, -1.9671e-03,\n -7.0393e-04, 1.2949e-21, 5.6052e-45, -5.1700e-03, -2.5810e-03,\n 2.2440e-14, 5.9939e-03, 4.5024e-04, -3.9611e-04, -6.0625e-04,\n 2.5357e-03, 4.8548e-03, 5.6052e-45, 1.3375e-05, 8.7432e-04,\n -4.6417e-04, -4.8118e-03, -1.0334e-05, -1.0974e-03, 7.7801e-04,\n 5.6052e-45, -1.3710e-03, -4.1969e-03, -8.9786e-04, 3.7286e-04,\n 2.2078e-03, 5.6052e-45, 4.4025e-04, 3.5078e-17, -2.3542e-04,\n -8.6203e-04, -2.0364e-03, -1.9391e-03, -1.9571e-03, -3.8523e-03,\n 8.1275e-44, 3.8030e-03, -2.9845e-03, 1.1340e-03, -3.8654e-03,\n -3.1780e-03, 3.0170e-03, -3.5518e-06, 1.2191e-03, 1.9990e-03,\n 1.3138e-03, -4.8024e-03, -5.5048e-03, 2.6232e-03, 2.9120e-03,\n 6.1065e-03, 1.9772e-14, -1.4609e-03, -1.3955e-03, -1.1309e-03,\n 4.4795e-03, 5.6052e-45, 1.8031e-03, 6.4633e-07, 2.0465e-03,\n 3.7773e-03, 1.9373e-03, 3.8224e-04, 4.0307e-03, -1.3818e-03],\n device='cuda:0')",
13
- "exp_avg_sq": "tensor([1.0657e-04, 1.2498e-04, 5.4747e-07, 1.5065e-04, 1.6597e-06, 9.6464e-08,\n 5.7696e-05, 1.5453e-04, 8.2285e-05, 4.0288e-06, 8.5279e-05, 8.9790e-05,\n 1.7742e-04, 1.9223e-04, 9.8694e-05, 5.8505e-05, 1.1162e-04, 1.5988e-04,\n 7.5000e-05, 4.3486e-05, 4.3413e-05, 1.6213e-04, 1.3302e-04, 6.6957e-07,\n 3.2834e-05, 2.1819e-06, 2.3604e-04, 1.9225e-04, 1.1807e-04, 2.0260e-04,\n 2.3734e-05, 4.9176e-08, 9.9726e-05, 6.7809e-05, 6.4116e-05, 2.2739e-06,\n 1.6892e-04, 1.6830e-04, 1.0314e-04, 9.3657e-05, 2.0912e-04, 2.0061e-04,\n 1.3971e-04, 1.0896e-04, 5.0730e-05, 1.3257e-04, 3.1017e-05, 1.6003e-06,\n 1.0016e-04, 3.9827e-05, 1.0853e-04, 1.0274e-04, 6.8523e-05, 1.6013e-04,\n 1.1100e-05, 9.5912e-05, 1.9205e-04, 1.3528e-04, 6.9431e-05, 1.2905e-04,\n 5.8560e-06, 2.2769e-04, 7.7184e-05, 1.8214e-04, 7.5148e-06, 1.6535e-04,\n 8.7372e-05, 1.5874e-05, 1.4836e-04, 7.8219e-07, 1.4206e-04, 1.4345e-04,\n 1.3214e-04, 5.8393e-06, 1.1338e-04, 1.5193e-04, 1.2176e-04, 1.5996e-04,\n 1.0422e-04, 1.4050e-04, 1.3875e-04, 5.0348e-07, 4.1452e-06, 1.0420e-04,\n 1.2363e-04, 1.2190e-04, 2.5825e-06, 1.7398e-04, 8.3418e-05, 1.2805e-04,\n 1.5007e-04, 4.6880e-05, 5.2009e-05, 6.3075e-05, 1.1318e-04, 1.5523e-04,\n 1.2102e-04, 1.2687e-04, 9.0525e-05, 2.5028e-04, 2.9265e-04, 1.4653e-04,\n 1.1980e-04, 1.4750e-04, 1.6089e-05, 6.2279e-06, 2.0253e-04, 2.0641e-04,\n 1.4600e-04, 1.1342e-04, 6.9079e-05, 5.9040e-05, 3.0364e-08, 1.1472e-04,\n 1.2216e-04, 1.5451e-05, 6.0434e-06, 1.7606e-04, 8.8550e-05, 3.0746e-05,\n 1.1317e-04, 9.6538e-05, 1.8607e-04, 1.4595e-05, 1.1918e-04, 1.4209e-05,\n 9.3113e-05, 1.3750e-04, 5.7601e-05, 9.6174e-08, 2.1956e-04, 1.4674e-04,\n 8.0491e-05, 1.4195e-05, 9.8237e-05, 6.8813e-05, 1.6731e-04, 1.4326e-04,\n 4.1997e-05, 5.4175e-05, 1.2158e-06, 1.6454e-04, 4.0711e-06, 1.8878e-04,\n 1.2410e-04, 1.6002e-04, 1.0956e-04, 1.0676e-04, 4.3374e-06, 1.8985e-04,\n 1.1697e-04, 4.6518e-06, 2.0894e-06, 9.9115e-05, 1.6756e-04, 1.4277e-04,\n 4.4317e-06, 1.0657e-04, 1.2864e-06, 2.2122e-04, 9.5258e-05, 1.4995e-04,\n 1.2619e-04, 2.7058e-05, 1.1466e-04, 2.2609e-05, 1.9238e-06, 1.0774e-05,\n 1.0919e-04, 1.0577e-04, 6.1629e-05, 6.2394e-07, 2.7799e-09, 1.5646e-04,\n 1.5640e-04, 1.5983e-06, 2.5999e-06, 1.3227e-04, 3.0020e-04, 4.0478e-05,\n 5.8057e-05, 9.0989e-05, 1.3166e-04, 2.9814e-04, 6.8373e-05, 1.1930e-04,\n 3.9874e-05, 8.8335e-05, 7.1290e-05, 1.3050e-04, 1.5606e-04, 1.6142e-04,\n 9.1281e-05, 1.5517e-04, 8.5782e-05, 1.6078e-04, 9.9462e-05, 1.5166e-04,\n 1.0937e-04, 1.1834e-04, 9.8588e-05, 1.5297e-04, 1.3750e-04, 1.3850e-04,\n 1.0609e-04, 5.9584e-05, 9.6978e-05, 1.8988e-04, 1.3983e-04, 1.6517e-04,\n 2.0238e-04, 6.1500e-05, 1.2606e-04, 1.0112e-04, 5.8389e-05, 8.5489e-05,\n 1.2577e-04, 1.7108e-04, 1.3891e-04, 1.1265e-04, 1.1794e-04, 1.8124e-04,\n 5.4795e-07, 1.1601e-04, 7.7962e-05, 1.0644e-04, 4.2547e-05, 7.7368e-05,\n 1.8829e-04, 1.4142e-04, 2.5550e-04, 1.1878e-04, 6.3489e-06, 4.3365e-06,\n 1.6430e-04, 4.9562e-05, 1.3993e-04, 8.1268e-05, 1.2643e-04, 2.2004e-05,\n 1.9739e-04, 4.1638e-05, 1.5866e-04, 1.4759e-04, 1.3158e-04, 1.8179e-05,\n 1.6027e-04, 1.2549e-04, 1.9569e-04, 8.4398e-05, 1.4535e-04, 5.4644e-05,\n 1.6169e-04, 1.2208e-04, 1.7599e-04, 9.4468e-05, 6.0572e-05, 7.8003e-04,\n 2.2577e-04, 9.8741e-05, 1.0735e-04, 9.2178e-05, 1.5435e-04, 3.3711e-05,\n 1.4859e-04, 7.5763e-05, 1.4214e-04, 8.2884e-05, 1.2263e-04, 9.7052e-05,\n 1.5557e-04, 1.3137e-04, 8.1252e-07, 1.2670e-04, 1.5327e-04, 6.3749e-05,\n 1.5327e-04, 1.5620e-04, 1.3979e-04, 1.8585e-04, 1.3567e-04, 1.0034e-04,\n 1.1085e-04, 1.5390e-04, 1.5355e-04, 1.2933e-04, 5.3038e-07, 1.1110e-04,\n 1.1968e-06, 1.2746e-04, 1.4634e-04, 1.6784e-04, 1.0154e-04, 8.7271e-05,\n 3.6511e-05, 1.4328e-04, 2.6839e-06, 8.2360e-05, 1.6174e-04, 2.6423e-07,\n 8.0022e-06, 1.5647e-04, 1.4390e-05, 2.0712e-04, 1.1966e-04, 1.2116e-04,\n 8.2312e-05, 1.4790e-04, 1.3410e-04, 1.3199e-04, 1.5459e-04, 1.4375e-04,\n 1.0500e-04, 9.5798e-05, 2.0366e-04, 1.3458e-04, 9.5124e-05, 2.5052e-04,\n 6.5783e-06, 1.2063e-04, 1.5319e-04, 1.8916e-04, 9.1263e-07, 2.1179e-04,\n 2.5095e-06, 1.4195e-04, 1.1650e-04, 1.0627e-04, 9.2918e-05, 8.5886e-05,\n 1.5846e-04, 1.3672e-04, 1.3835e-05, 1.5123e-04, 1.0138e-04, 1.0761e-04,\n 1.5179e-04, 7.8470e-06, 9.2061e-05, 1.4345e-04, 1.5339e-04, 1.7330e-04,\n 1.6678e-04, 6.9284e-05, 1.3848e-04, 2.1464e-07, 1.3049e-04, 6.7242e-05,\n 1.7938e-06, 1.6084e-04, 8.2247e-06, 5.9421e-05, 1.0957e-04, 1.4101e-04,\n 1.6227e-05, 2.1253e-04, 9.9932e-05, 1.9896e-04, 1.6496e-04, 1.6180e-04,\n 7.5642e-05, 5.5413e-06, 1.3033e-04, 1.1072e-04, 3.9993e-07, 2.8074e-05,\n 5.0329e-05, 4.8088e-06, 1.1054e-04, 5.9186e-05, 1.1593e-04, 1.0599e-04,\n 7.6909e-05, 8.4948e-05, 1.6006e-04, 7.4657e-05, 1.6763e-04, 1.5340e-04,\n 1.9831e-04, 9.3780e-05, 1.2386e-04, 1.0620e-04, 1.1448e-04, 6.1126e-06,\n 1.0337e-04, 1.7338e-05, 1.0805e-04, 2.1856e-04, 6.0433e-05, 1.0851e-04,\n 3.6828e-07, 1.6744e-04, 1.1827e-04, 3.1246e-05, 1.0913e-04, 1.0361e-04,\n 2.3393e-06, 2.0273e-05, 5.3356e-06, 6.7816e-06, 9.0499e-05, 2.4462e-04,\n 1.3379e-04, 1.6504e-04, 6.7356e-06, 8.5502e-05, 1.3591e-04, 1.6342e-04,\n 5.8167e-05, 6.7462e-05, 1.0389e-04, 1.6985e-04, 7.0559e-05, 1.4013e-04,\n 1.8478e-06, 7.2669e-05, 1.5968e-05, 1.0009e-04, 1.3229e-05, 1.2551e-04,\n 9.0110e-05, 1.3758e-04, 2.1852e-05, 1.2398e-04, 6.1984e-05, 2.1324e-04,\n 1.3438e-04, 1.3156e-04, 1.7449e-04, 1.1232e-04, 1.1211e-04, 1.0872e-04,\n 8.0641e-05, 1.4451e-04, 1.3943e-04, 9.0162e-05, 1.2867e-04, 1.2411e-06,\n 1.3691e-04, 3.0526e-05, 2.6990e-07, 1.5792e-06, 1.3751e-04, 1.6311e-04,\n 1.4706e-04, 2.3367e-06, 1.0337e-05, 1.2572e-04, 1.2500e-04, 5.0513e-06,\n 3.9280e-06, 3.4529e-06, 8.1961e-07, 1.1639e-04, 1.0618e-04, 1.3924e-04,\n 1.3476e-04, 6.0390e-05, 5.5459e-05, 1.3877e-04, 1.9087e-04, 4.5239e-06,\n 5.6055e-05, 6.4027e-05, 2.2887e-04, 2.1422e-04, 1.7405e-04, 1.7171e-04,\n 1.3046e-04, 7.8992e-05, 2.0561e-04, 5.6756e-05, 1.6212e-04, 6.1590e-05,\n 1.1942e-04, 4.8147e-05, 1.0807e-04, 1.5405e-04, 8.5730e-05, 1.3142e-04,\n 1.4351e-04, 1.1481e-04, 1.1602e-04, 1.3749e-04, 1.5277e-04, 1.6102e-04,\n 4.9004e-05, 7.3917e-05, 1.4746e-06, 2.4094e-04, 2.0498e-04, 7.0090e-05,\n 1.1606e-04, 1.5974e-04, 1.1282e-04, 1.7416e-04, 1.2365e-04, 1.8325e-04,\n 1.6413e-04, 1.0075e-05, 1.5340e-04, 1.7198e-04, 3.7495e-05, 1.0890e-04,\n 3.2546e-06, 9.5192e-05, 1.6514e-04, 1.4632e-04, 1.3682e-04, 1.1080e-06,\n 6.8253e-07, 6.4819e-05, 1.0894e-05, 1.6991e-04, 5.8200e-05, 6.9377e-05,\n 1.9031e-04, 1.1263e-04, 6.5790e-06, 1.9370e-05, 1.2348e-04, 1.6868e-04,\n 6.1779e-05, 1.9711e-06, 2.4460e-04, 1.2958e-04, 1.2875e-04, 1.5574e-04,\n 1.2438e-04, 1.2424e-04, 1.8478e-04, 1.1652e-04, 1.3442e-04, 1.7498e-04,\n 1.3293e-04, 1.0791e-04, 1.1685e-04, 4.7575e-07, 7.0879e-05, 9.9483e-05,\n 9.2598e-05, 1.3999e-04, 1.3390e-04, 1.5507e-06, 2.2021e-06, 1.2262e-04,\n 3.5282e-05, 3.9577e-05, 1.8776e-04, 2.3607e-05, 1.2914e-04, 9.5425e-06,\n 8.8458e-05, 5.4793e-05, 1.7688e-04, 1.4917e-04, 7.1929e-05, 1.2966e-04,\n 1.1531e-04, 1.4657e-04, 1.4532e-04, 7.1435e-07, 9.3775e-05, 3.5738e-06,\n 1.2525e-04, 9.9462e-05, 1.2356e-04, 1.1832e-04, 1.1851e-04, 1.1907e-04,\n 9.6039e-05, 9.3672e-05, 1.2571e-04, 9.0461e-05, 4.6265e-05, 8.1472e-05,\n 2.8538e-06, 3.9573e-06, 1.8178e-04, 8.5273e-05, 1.1549e-06, 1.1301e-04,\n 9.9930e-06, 2.6556e-04, 9.0106e-05, 1.0476e-04, 1.3779e-04, 4.4612e-07,\n 1.9354e-07, 9.2418e-05, 7.6904e-05, 5.2415e-05, 3.1193e-06, 1.1338e-04,\n 1.2712e-04, 6.7011e-07, 9.0553e-05, 1.9501e-04, 2.1779e-04, 1.0918e-04,\n 7.6809e-05, 5.6993e-07, 1.2559e-04, 1.8947e-07, 2.4857e-05, 1.9147e-04,\n 1.6334e-04, 9.5103e-05, 1.7345e-04, 1.0121e-04, 1.6039e-07, 9.0950e-05,\n 1.2939e-04, 2.5690e-05, 1.5040e-04, 1.4694e-04, 1.0786e-04, 1.0812e-04,\n 1.0765e-04, 1.0414e-04, 1.2522e-04, 1.6548e-04, 1.1310e-04, 4.7277e-05,\n 1.2718e-04, 1.6998e-04, 2.2692e-06, 5.2793e-05, 1.5023e-04, 3.3612e-05,\n 1.9915e-04, 9.5176e-07, 1.2857e-04, 5.6581e-06, 5.1162e-05, 1.4187e-04,\n 7.1108e-06, 1.2574e-04, 9.9547e-05, 8.2938e-05], device='cuda:0')"
14
  },
15
  "2": {
16
  "step": "tensor(1252.)",
17
- "exp_avg": "tensor([[-2.4572e-05, -1.9201e-06, 5.6052e-45, ..., -2.0221e-05,\n -8.0042e-06, 1.2930e-05],\n [ 8.2135e-05, 5.8937e-05, -5.6052e-45, ..., -2.3740e-05,\n 7.0554e-05, -2.9479e-05],\n [ 3.2157e-05, -2.7470e-05, -5.6052e-45, ..., -2.2250e-05,\n 7.4611e-05, 1.1439e-05],\n ...,\n [ 1.5776e-05, 1.4394e-05, -5.6052e-45, ..., -1.4606e-05,\n 1.9324e-05, 1.3889e-04],\n [ 4.4814e-05, 1.0931e-05, -5.6052e-45, ..., -5.8624e-05,\n 1.0031e-04, 1.1417e-04],\n [-4.9805e-05, -2.2688e-05, 5.6052e-45, ..., 1.1320e-05,\n 8.2752e-05, 5.0785e-05]], device='cuda:0')",
18
- "exp_avg_sq": "tensor([[6.1916e-08, 4.0039e-08, 2.8288e-12, ..., 7.2189e-08, 3.4673e-08,\n 3.0847e-08],\n [9.9022e-08, 8.6026e-08, 2.4207e-12, ..., 9.1891e-08, 6.3491e-08,\n 6.3855e-08],\n [6.0957e-08, 4.8856e-08, 1.0245e-11, ..., 6.7222e-08, 6.9665e-08,\n 5.9740e-08],\n ...,\n [1.0218e-07, 7.0578e-08, 3.4236e-11, ..., 1.5361e-07, 6.8790e-08,\n 7.8031e-08],\n [9.7974e-08, 7.2477e-08, 4.8175e-12, ..., 1.2711e-07, 6.6718e-08,\n 9.0619e-08],\n [1.0754e-07, 8.6475e-08, 8.5844e-13, ..., 1.4465e-07, 1.1352e-07,\n 8.2872e-08]], device='cuda:0')"
19
  }
20
  },
21
  "param_groups": [
@@ -218,15 +218,15 @@
218
  ]
219
  },
220
  "metrics": {
221
- "best_val_acc": 71.754,
222
  "best_epoch": 0,
223
  "scale_accuracies": {
224
- "256": 71.754
225
  }
226
  },
227
  "train_config": {
228
  "name": "david_training",
229
- "run_id": "20251012_031919",
230
  "dataset_name": "AbstractPhil/imagenet-clip-features-orderly",
231
  "model_variant": "clip_vit_b16",
232
  "num_classes": 1000,
 
4
  "state": {
5
  "0": {
6
  "step": "tensor(1252.)",
7
+ "exp_avg": "tensor([[ 2.2889e-05, 3.2026e-05, 1.6571e-06, ..., 1.7219e-05,\n 1.1876e-05, -3.7499e-05],\n [-2.1468e-04, -1.3604e-04, 1.3280e-04, ..., -4.3560e-05,\n 2.0309e-04, -2.6094e-04],\n [-6.7956e-05, 7.5952e-05, 9.7297e-05, ..., -4.7797e-05,\n 2.9834e-05, -1.0805e-04],\n ...,\n [-1.1135e-04, 1.5752e-04, -1.0688e-04, ..., 2.3727e-05,\n -6.9641e-05, 1.9441e-05],\n [-1.4223e-19, 4.0510e-20, -7.5370e-20, ..., 1.2587e-19,\n -9.1474e-20, -3.3843e-19],\n [-1.0722e-05, -2.7671e-05, 1.7630e-05, ..., 1.6293e-05,\n -1.6963e-05, -1.2034e-05]], device='cuda:0')",
8
+ "exp_avg_sq": "tensor([[1.1735e-07, 1.2837e-07, 1.1420e-08, ..., 2.4014e-08, 2.3699e-08,\n 6.9322e-09],\n [2.2943e-07, 1.5274e-07, 4.7403e-08, ..., 9.2499e-08, 5.6044e-08,\n 6.6360e-08],\n [2.0946e-07, 3.0776e-07, 6.8965e-08, ..., 7.5621e-08, 5.2727e-08,\n 5.3820e-08],\n ...,\n [5.5617e-07, 3.9251e-07, 6.7908e-08, ..., 6.5855e-08, 5.9912e-08,\n 4.2784e-08],\n [2.1465e-10, 4.9741e-09, 7.8046e-10, ..., 3.2963e-10, 1.0450e-09,\n 6.2219e-10],\n [3.6456e-07, 2.1370e-07, 3.8428e-08, ..., 3.7118e-08, 7.7678e-08,\n 4.0870e-08]], device='cuda:0')"
9
  },
10
  "1": {
11
  "step": "tensor(1252.)",
12
+ "exp_avg": "tensor([-6.0069e-04, -3.3064e-03, -3.0734e-03, -8.6551e-04, -1.1617e-13,\n -1.9131e-04, -3.1353e-04, 1.9033e-03, 4.3359e-05, -9.1803e-04,\n 1.1774e-03, 9.3017e-04, 5.6052e-45, 3.8611e-03, -8.6159e-03,\n -9.7585e-04, -7.5239e-04, -4.9659e-03, 4.8121e-04, 5.6052e-45,\n -6.3107e-05, -2.2051e-03, 1.0329e-03, -1.9065e-03, 8.0956e-34,\n 4.0895e-03, 4.9298e-03, -8.0805e-04, 2.4687e-03, -1.3231e-03,\n -1.3785e-03, -3.6809e-03, -1.2147e-07, 5.6052e-45, 1.2894e-03,\n -5.8629e-05, -4.0794e-04, -1.3202e-05, -1.8225e-04, 2.7894e-03,\n 4.3474e-03, -1.8189e-03, 3.7872e-03, -6.5277e-04, 6.2215e-04,\n -1.5357e-03, 3.2316e-04, -3.0323e-03, 4.6631e-03, -1.0720e-03,\n -7.0228e-03, 5.6052e-45, 7.1771e-35, 5.6052e-45, 2.2352e-04,\n 7.5579e-04, -4.4723e-03, -2.0540e-03, 1.3815e-21, 1.4974e-04,\n -4.9958e-03, -2.7003e-03, 3.7906e-03, -6.1028e-05, 2.5707e-03,\n 3.8245e-04, 2.5648e-03, 5.6052e-45, 2.3466e-03, -1.9835e-04,\n 2.0861e-08, 3.8633e-08, 3.9210e-03, -4.4422e-03, 1.3143e-03,\n -1.9418e-03, -7.5711e-04, 4.5668e-03, 3.5378e-04, -2.4114e-03,\n 1.4986e-03, -4.5153e-03, -7.8498e-05, 1.9901e-04, 4.5906e-03,\n 2.3016e-03, 1.9876e-04, 9.5623e-04, -2.3304e-03, 1.5096e-03,\n 5.6052e-45, 1.7155e-03, 2.4380e-03, -1.3041e-03, -1.4891e-03,\n 1.5806e-03, -3.3790e-03, -7.7564e-05, -2.7520e-03, 4.8316e-04,\n -7.0963e-04, 1.8868e-10, -2.4407e-03, -6.3466e-04, -6.3611e-03,\n 3.7107e-04, -2.2045e-03, -2.7769e-03, -1.1518e-05, -4.6362e-03,\n 2.2827e-03, 7.4211e-04, 5.6052e-45, -2.7134e-03, 1.6550e-09,\n 1.1651e-03, 1.1698e-03, 3.4867e-03, 5.6052e-45, 3.0735e-08,\n 9.0221e-10, 2.0252e-03, 5.6052e-45, 4.1098e-04, 2.3577e-04,\n -2.5428e-04, -6.5745e-05, 5.6052e-45, 1.6520e-03, -1.0316e-03,\n 9.3832e-05, -1.2079e-04, 1.5227e-03, 7.9433e-15, 7.9189e-04,\n -7.9527e-04, 1.5553e-03, -5.0773e-04, 7.7019e-04, -1.1426e-03,\n 5.1381e-03, -7.1637e-04, -1.8527e-03, 2.5450e-03, 8.9379e-03,\n -3.2705e-03, -1.6546e-13, 4.0166e-03, -1.0601e-03, 6.1481e-04,\n 1.8809e-13, -6.7260e-04, 1.1489e-03, 8.6132e-39, -1.4846e-03,\n -4.7213e-04, 2.3243e-23, -9.3133e-04, 2.6049e-03, 2.1563e-03,\n 3.9112e-31, -3.6412e-03, -5.2335e-03, -5.9905e-03, -2.3537e-03,\n -1.3842e-03, -5.9578e-03, -2.2822e-03, 1.1170e-04, -2.1091e-29,\n 5.6052e-45, 3.0544e-03, -5.9425e-05, -4.0994e-03, -2.8030e-03,\n -4.9734e-03, -1.4584e-03, 1.4601e-04, 4.9706e-34, 1.7165e-03,\n 2.3065e-03, 3.6659e-03, 5.6655e-04, 5.6052e-45, 3.5381e-03,\n -2.2904e-03, 4.5980e-03, 2.6798e-03, 4.0761e-03, 5.6052e-45,\n 5.6052e-45, 5.0720e-04, -3.7422e-04, 1.9530e-03, -1.2886e-03,\n -4.0029e-03, 2.1770e-03, 4.1103e-04, 5.6052e-45, -7.1649e-04,\n 7.2740e-04, -1.3782e-03, 2.7222e-03, -5.9347e-04, -1.2909e-03,\n 5.6052e-45, -8.0836e-03, 1.2741e-03, -4.9838e-04, 2.9652e-03,\n 4.9207e-03, 2.5242e-03, 4.6802e-03, 1.4867e-04, 3.1299e-04,\n -2.2740e-03, -2.9689e-03, -5.3209e-04, -2.3417e-03, 1.3715e-04,\n 2.0833e-03, -5.4587e-03, -6.8023e-04, 6.9832e-04, -5.9483e-03,\n 3.2933e-03, -1.6839e-03, -4.2018e-03, -5.3849e-03, 2.9948e-03,\n -4.8168e-03, 3.8610e-03, -1.4261e-03, 3.7585e-09, -3.0871e-03,\n -9.9207e-04, 2.6115e-03, -4.9670e-03, -4.3795e-03, 3.4741e-03,\n 4.4612e-04, -2.7896e-03, 5.7169e-04, 4.8785e-03, -9.7763e-04,\n 3.7314e-03, 2.6435e-03, 1.3079e-03, 2.1492e-03, -4.0522e-03,\n 9.8097e-04, -3.8514e-03, 2.0170e-05, -1.6691e-03, -3.1188e-03,\n -4.4586e-03, 5.6052e-45, 3.6943e-03, -1.2492e-03, 5.2881e-05,\n -7.5173e-04, 1.7691e-03, 7.7236e-03, 1.0483e-03, 4.0832e-04,\n 5.3189e-04, 2.8803e-03, 5.6052e-45, 3.9974e-03, 2.7963e-04,\n -4.9529e-04, -1.2284e-03, 9.8050e-04, 8.9134e-04, -3.3321e-03,\n -2.5986e-17, 3.7972e-03, 5.6052e-45, -2.1032e-03, 7.8734e-04,\n 1.9879e-03, 1.1265e-03, -3.4019e-03, -3.1301e-03, 3.3404e-03,\n -9.8025e-04, 5.6052e-45, -8.3202e-04, 7.9056e-04, 8.0925e-04,\n -6.3958e-13, -2.7826e-03, 1.3710e-03, 3.5263e-03, 1.6505e-03,\n 4.7166e-04, 3.2478e-03, 6.0789e-04, -1.5110e-03, -3.8444e-03,\n -3.0352e-04, -3.0284e-04, 2.6331e-08, -2.5967e-03, -1.9465e-03,\n -9.0765e-12, 3.8184e-03, -1.1051e-09, 5.6052e-45, -3.7817e-03,\n -3.6641e-03, 1.0406e-03, 1.8360e-03, 6.0505e-03, 1.2501e-03,\n 1.1163e-03, 8.2670e-04, -1.5502e-03, 1.2199e-03, -1.8529e-04,\n 1.3050e-04, 6.3554e-03, -6.4259e-03, -2.6184e-03, -1.9043e-03,\n 7.6206e-04, -4.6475e-03, 1.2827e-25, 6.9756e-03, -3.8316e-04,\n 3.1803e-05, 2.8865e-04, 5.3987e-03, 5.5536e-04, 5.6052e-45,\n -5.6030e-04, 7.8950e-04, -9.7610e-05, -1.3669e-03, 1.2413e-03,\n 1.1517e-03, -2.8729e-04, 2.8656e-03, -2.8236e-03, -4.2717e-03,\n -2.1533e-03, 5.6052e-45, -1.4698e-12, 9.4901e-04, -6.9550e-04,\n 6.9772e-04, -4.4212e-03, 1.4552e-03, 1.2531e-03, 2.5615e-03,\n -3.7819e-03, 1.2623e-04, -1.0779e-03, -1.3615e-03, 3.9590e-18,\n 8.6027e-05, -2.0218e-03, 1.9077e-03, -1.2890e-03, 5.5033e-04,\n 1.2863e-03, 4.8764e-04, -1.0874e-03, -7.3269e-04, 2.0846e-03,\n 2.3644e-03, 3.5509e-03, -9.4110e-04, -2.7191e-05, 9.8474e-04,\n 5.4307e-03, -3.7414e-03, 8.9703e-04, 5.6052e-45, 8.7415e-04,\n 1.3296e-08, 5.6052e-45, -6.3380e-04, 3.7691e-03, 3.5902e-03,\n -1.0605e-04, 4.4580e-04, 6.7394e-03, -2.4415e-03, -7.3135e-04,\n 2.0872e-03, -2.1997e-03, 4.1108e-03, -4.3807e-09, 5.6052e-45,\n -4.9648e-04, 2.8766e-03, -1.2014e-03, -2.8814e-03, -5.5966e-05,\n 2.5405e-03, -8.5971e-04, -5.4241e-06, -3.2462e-03, 3.1314e-04,\n -2.5387e-03, 2.4806e-03, 1.4698e-33, -6.4468e-11, -6.2196e-03,\n 8.0881e-14, -6.5373e-10, 5.6052e-45, -1.3717e-03, 2.7646e-03,\n 3.4550e-03, -2.5083e-04, 5.6052e-45, 3.5205e-03, 1.3218e-03,\n 7.1738e-04, -3.0211e-04, 6.9750e-03, 1.2837e-03, -6.4541e-04,\n -3.0453e-33, -3.1030e-03, -8.0829e-13, 2.2259e-03, 2.4388e-19,\n 1.5958e-03, 2.9320e-03, 7.4004e-05, 5.6052e-45, -4.8786e-03,\n -9.6536e-04, -1.1047e-03, 3.5034e-04, 9.7487e-04, 3.5561e-03,\n -1.8258e-03, 1.1405e-03, -4.4571e-03, 5.3981e-04, -1.9415e-03,\n 3.7651e-07, -2.9522e-03, 1.2595e-11, -3.1325e-04, -1.0205e-02,\n 5.6052e-45, -6.9883e-04, -3.1635e-04, 2.1702e-05, -2.1005e-02,\n 1.3513e-10, 7.1958e-05, 2.0322e-04, -2.4389e-03, 5.6052e-45,\n 1.5596e-03, 3.4362e-03, 5.9835e-43, -2.6713e-03, -1.0566e-18,\n -1.8087e-03, -6.2851e-04, 5.6052e-45, -1.2291e-04, -2.5857e-03,\n 1.1538e-03, -4.0428e-03, 5.9601e-04, 1.7805e-03, 7.0921e-04,\n -2.7822e-04, 3.5518e-23, 2.7884e-03, 5.6052e-45, -1.5361e-06,\n 7.0726e-09, 1.6324e-06, 3.7290e-03, 9.7123e-05, 6.5938e-03,\n 2.3920e-03, 3.0546e-03, 5.1159e-04, -5.2809e-03, -6.4831e-03,\n 3.8676e-15, -1.4933e-04, 1.7249e-03, -2.0113e-03, -2.7728e-19,\n 2.6408e-06, -8.0329e-03, 7.7057e-04, 2.2606e-03, -1.2932e-06,\n 9.5648e-05, 5.6052e-45, -1.5404e-08, -3.5735e-03, -5.7265e-04,\n 2.7375e-03, -1.1931e-03, 4.6036e-04, -8.1512e-04, -1.6971e-03,\n 2.8026e-03, 6.1842e-03, -2.0997e-03, -3.4300e-03, 7.6167e-11,\n 1.2152e-18, 5.9221e-03, -1.5254e-03, 1.2840e-03, 1.4807e-03,\n 2.2137e-04, 2.3902e-03, -3.6905e-04, 3.7090e-04, 3.9848e-03,\n 8.4553e-06, -8.6029e-03, 6.3052e-03, -1.4264e-03, 1.7582e-03,\n 2.1909e-22, -7.4063e-04, 6.8185e-05, -1.7367e-04, -7.4308e-08,\n -3.5554e-03, 2.0595e-03, 7.3922e-23, 5.6052e-45, 4.7111e-04,\n 6.7966e-03, -6.9490e-03, -3.4873e-03, -2.8326e-03, 3.1004e-03,\n -4.4247e-04, -5.0340e-03, 3.9281e-03, 3.5720e-03, -3.4490e-03,\n 1.4723e-03, 1.3372e-03, 8.2852e-03, -5.1868e-04, 6.5427e-04,\n -1.0040e-03, 1.9325e-04, 2.7792e-03, 3.1484e-03, -7.3690e-04,\n -7.9488e-04, -5.2024e-03, -5.9283e-04, -1.8571e-04, 1.3465e-21,\n -1.3919e-03, 3.1642e-04, 2.8527e-03, 5.5314e-03, 9.5748e-04,\n -6.3823e-03, 1.1961e-03, -3.7229e-03, 3.6283e-03, 6.2414e-42,\n -7.7902e-16, 5.6052e-45, -3.2896e-03, 3.8389e-03, -2.9575e-04,\n 3.8170e-03, 1.0278e-21, 2.5214e-03, -2.4962e-04, 2.4568e-03,\n 3.4345e-03, 1.0050e-03, -9.1621e-04, 3.8970e-04, -6.1147e-04,\n 1.3594e-03, -2.9058e-03, 2.1731e-03, 4.0486e-03, 4.8792e-04,\n 2.2176e-03, 2.4161e-03, -9.1977e-04, 3.5772e-04, 2.5839e-03,\n 3.2797e-03, -1.7886e-03, 1.6143e-03, -1.6899e-03, 1.8400e-03,\n 2.0042e-03, 1.4821e-03, -3.1434e-04, 1.6967e-03, 9.6830e-04,\n -3.2342e-04, -5.9173e-05, 3.4689e-03, 4.8732e-05, -2.4224e-03,\n -1.1371e-03, -7.5282e-03, 3.2003e-03, 3.0720e-04, -2.8621e-13,\n 5.2720e-31, -8.1575e-18, 4.8461e-04, -5.0260e-03, -1.4113e-03,\n -8.9169e-04, -6.4226e-04, -1.5311e-03, -3.3189e-04, 2.9600e-03,\n -3.4607e-03, 5.0965e-07, -1.7981e-18, 2.3618e-04, -5.6518e-03,\n 1.5403e-03, 2.7384e-03, -6.1458e-04, -5.2167e-18, -9.0002e-04],\n device='cuda:0')",
13
+ "exp_avg_sq": "tensor([3.2507e-05, 1.1724e-04, 8.7974e-05, 6.7685e-05, 1.8961e-06, 1.6011e-05,\n 1.1788e-04, 1.1777e-04, 6.9844e-05, 1.1874e-04, 1.1513e-04, 1.9905e-04,\n 6.4615e-06, 1.0866e-04, 1.1703e-04, 1.2000e-04, 1.8659e-04, 1.9433e-04,\n 7.8171e-06, 1.6823e-06, 7.4718e-05, 1.0555e-04, 8.7074e-05, 1.1808e-04,\n 6.1408e-06, 1.7379e-04, 1.2058e-04, 1.6009e-04, 9.5392e-05, 1.6592e-04,\n 1.2516e-04, 1.7138e-04, 1.1935e-05, 1.0846e-06, 5.2729e-05, 1.1998e-04,\n 1.4447e-04, 9.2601e-05, 5.1950e-05, 1.2680e-04, 1.3692e-04, 4.7013e-05,\n 1.2441e-04, 1.0247e-04, 5.4981e-05, 1.3501e-04, 1.2635e-04, 2.1873e-04,\n 1.6533e-04, 2.4761e-05, 1.7014e-04, 6.4423e-07, 1.0454e-06, 9.7833e-07,\n 1.1844e-04, 2.2787e-04, 8.1590e-05, 8.1723e-05, 3.1593e-06, 1.8851e-04,\n 1.0411e-04, 8.9025e-05, 1.6391e-04, 6.4249e-05, 1.3726e-04, 1.9040e-04,\n 1.2166e-04, 1.1974e-06, 1.3068e-04, 1.3169e-04, 2.6010e-06, 4.8913e-06,\n 1.6314e-04, 8.2426e-05, 8.8617e-06, 1.0488e-04, 1.1895e-04, 1.6822e-04,\n 3.9032e-05, 1.2856e-04, 1.6754e-04, 1.1636e-04, 1.5123e-04, 9.2484e-05,\n 1.3653e-04, 7.5866e-05, 1.4074e-04, 3.2978e-05, 1.1580e-04, 9.9418e-05,\n 7.6357e-06, 1.8128e-04, 1.1747e-04, 5.9849e-05, 1.3040e-04, 2.3896e-05,\n 8.8402e-05, 4.6617e-05, 8.6008e-05, 6.9984e-05, 7.8474e-06, 6.2019e-06,\n 1.3756e-04, 1.5139e-04, 1.6610e-04, 1.4352e-05, 1.1485e-04, 1.7282e-04,\n 9.9013e-07, 2.9003e-05, 1.7810e-04, 2.0762e-04, 5.1625e-07, 9.3318e-05,\n 3.4231e-06, 6.3253e-05, 1.6599e-04, 1.6560e-04, 2.3018e-07, 9.7048e-07,\n 8.3732e-07, 9.4250e-05, 6.6675e-07, 2.6900e-04, 1.1154e-04, 1.9790e-04,\n 1.1683e-04, 1.2542e-07, 3.9549e-05, 1.9470e-04, 9.2241e-05, 7.9176e-05,\n 1.5936e-04, 2.2375e-07, 1.5429e-04, 9.7220e-05, 3.8196e-05, 1.1510e-04,\n 8.2425e-05, 1.2534e-04, 2.0527e-04, 1.5900e-04, 1.5641e-04, 1.2322e-04,\n 1.5682e-04, 1.1042e-04, 9.8737e-06, 1.4441e-04, 1.0458e-04, 8.0399e-05,\n 8.4686e-06, 8.8142e-05, 7.9128e-05, 4.5436e-06, 1.0553e-04, 1.3169e-04,\n 8.9994e-06, 1.6063e-04, 9.3803e-05, 1.4917e-04, 7.5638e-06, 1.2990e-04,\n 2.3577e-04, 9.4472e-05, 1.0972e-04, 9.9431e-05, 2.3060e-04, 7.3299e-05,\n 9.5476e-05, 1.0670e-06, 1.6478e-06, 1.2884e-04, 1.7710e-04, 1.1040e-04,\n 7.9592e-05, 1.5554e-04, 4.1986e-05, 1.4639e-04, 2.9905e-07, 3.7256e-05,\n 9.7225e-05, 1.7506e-04, 6.7457e-07, 2.2003e-06, 1.5172e-04, 1.2292e-04,\n 1.9601e-04, 5.9613e-05, 9.7429e-05, 2.9050e-07, 7.3207e-06, 1.1665e-04,\n 6.0249e-05, 1.2152e-04, 1.3849e-04, 1.1670e-04, 7.3939e-05, 1.3982e-04,\n 1.1539e-06, 1.3118e-04, 5.3802e-05, 5.9900e-05, 2.0751e-04, 3.6520e-05,\n 2.3494e-04, 5.6914e-08, 1.5068e-04, 1.3239e-04, 1.0836e-04, 1.5655e-04,\n 5.6113e-05, 1.1710e-04, 1.3372e-04, 7.8968e-05, 3.2596e-05, 1.1261e-04,\n 6.6086e-05, 1.4019e-04, 1.5585e-04, 6.9301e-05, 1.0123e-04, 1.4779e-04,\n 1.0782e-04, 8.9897e-05, 1.1035e-04, 8.6228e-05, 2.1523e-04, 1.7441e-04,\n 8.3166e-05, 1.8110e-04, 9.4618e-05, 2.0647e-04, 1.5496e-04, 1.4147e-06,\n 1.3028e-04, 6.9138e-05, 1.1595e-04, 9.8562e-05, 2.6164e-04, 9.7953e-05,\n 4.8600e-05, 5.7490e-05, 1.4495e-04, 1.5176e-04, 1.7491e-04, 8.0334e-05,\n 4.1977e-05, 8.6283e-05, 8.5547e-05, 1.2930e-04, 9.6704e-05, 1.1941e-04,\n 8.9328e-05, 1.0880e-04, 1.4305e-04, 1.2733e-04, 6.0956e-06, 1.0217e-04,\n 5.3809e-05, 3.1618e-06, 1.2085e-04, 1.9260e-04, 1.2522e-04, 1.3108e-04,\n 1.2611e-04, 1.4462e-04, 8.4020e-05, 9.0356e-07, 1.1884e-04, 1.5240e-04,\n 7.2876e-05, 1.6757e-04, 1.2694e-04, 6.7720e-06, 1.7029e-04, 1.5517e-06,\n 1.1217e-04, 4.4558e-06, 7.8680e-05, 3.5964e-06, 1.0988e-04, 7.8484e-05,\n 1.9183e-04, 1.3617e-04, 1.6142e-04, 1.3095e-04, 1.8173e-07, 1.1762e-04,\n 1.5120e-04, 7.8412e-05, 2.6337e-06, 1.1580e-04, 1.8360e-04, 1.4545e-04,\n 1.2320e-04, 1.4313e-04, 1.9809e-04, 1.0087e-04, 1.3083e-04, 1.9717e-04,\n 8.9043e-05, 4.9356e-06, 1.2835e-05, 7.3823e-05, 1.4438e-04, 3.8133e-05,\n 1.2614e-04, 1.8736e-07, 3.6950e-06, 1.2990e-04, 1.5428e-04, 8.8410e-05,\n 1.4186e-04, 1.4564e-04, 5.6568e-05, 1.4128e-04, 1.6564e-04, 1.4981e-04,\n 7.7269e-05, 1.4320e-04, 1.4481e-04, 2.0914e-04, 1.7764e-04, 7.9841e-05,\n 1.6716e-05, 1.5881e-04, 1.0352e-04, 3.2232e-06, 8.7772e-05, 1.5606e-04,\n 5.2200e-06, 6.3725e-05, 1.9099e-04, 9.9991e-05, 4.4081e-10, 9.8620e-05,\n 5.8329e-05, 1.7657e-04, 8.5530e-05, 1.0080e-04, 8.0978e-06, 1.4344e-04,\n 1.1621e-04, 1.0616e-04, 1.0820e-04, 1.6679e-04, 6.4509e-06, 1.5713e-05,\n 1.3086e-04, 1.3924e-04, 5.7230e-05, 1.7347e-04, 1.0459e-04, 1.2532e-04,\n 1.9473e-04, 7.8555e-05, 9.9183e-05, 1.0078e-04, 1.6287e-04, 6.1473e-06,\n 6.2829e-05, 6.3714e-05, 1.2282e-04, 1.1346e-04, 1.5332e-04, 2.7345e-04,\n 1.5856e-05, 1.2311e-04, 1.4564e-04, 1.7048e-04, 1.5353e-04, 1.3800e-04,\n 1.1477e-04, 2.7784e-06, 1.2321e-04, 2.1425e-04, 2.5506e-04, 1.9452e-05,\n 2.8083e-06, 1.9102e-04, 4.0009e-06, 1.5322e-05, 1.0637e-04, 2.2128e-04,\n 3.8706e-05, 9.9500e-05, 1.4568e-04, 2.1639e-04, 8.7405e-05, 6.0282e-05,\n 1.4450e-04, 1.3912e-04, 9.9623e-05, 1.5229e-06, 5.0533e-06, 1.6214e-04,\n 1.4565e-04, 1.5037e-04, 1.4981e-04, 6.1761e-05, 8.6326e-05, 9.5113e-05,\n 5.7161e-06, 7.1970e-05, 7.9266e-05, 1.4965e-04, 9.8810e-05, 1.8609e-06,\n 6.2232e-07, 2.6146e-05, 5.3609e-07, 6.4562e-06, 9.3529e-07, 1.8374e-04,\n 1.0017e-04, 2.0571e-05, 6.9488e-05, 2.5251e-06, 4.9152e-05, 1.0061e-04,\n 8.1306e-05, 1.1810e-04, 1.4575e-04, 2.0476e-04, 1.2326e-04, 6.5627e-06,\n 3.4647e-05, 1.9104e-06, 6.4540e-05, 3.5233e-07, 3.7474e-05, 1.2947e-04,\n 1.4519e-04, 1.6220e-06, 7.6871e-05, 1.1438e-04, 1.8536e-04, 1.7969e-04,\n 8.1910e-05, 2.3525e-05, 1.2165e-04, 4.8800e-05, 1.5248e-04, 1.6620e-04,\n 8.4353e-05, 4.3623e-06, 9.5107e-05, 5.4737e-07, 1.1433e-04, 6.0626e-05,\n 1.8163e-05, 1.6771e-05, 9.4185e-05, 5.5767e-06, 1.2817e-04, 8.5737e-07,\n 5.7967e-05, 2.3343e-06, 8.8746e-05, 2.4520e-05, 1.3919e-04, 1.5167e-04,\n 1.5942e-07, 1.0202e-04, 2.0640e-05, 1.5169e-04, 8.0813e-05, 1.3020e-06,\n 1.0727e-04, 7.4665e-05, 2.5416e-04, 1.8834e-04, 8.4547e-05, 1.4440e-06,\n 6.9902e-05, 1.4743e-04, 9.0501e-06, 1.4931e-04, 2.8734e-06, 5.9674e-06,\n 5.0801e-07, 8.4795e-06, 9.1691e-05, 1.5931e-04, 2.0231e-04, 1.4534e-04,\n 7.5968e-05, 1.0432e-04, 1.2185e-04, 9.2049e-05, 1.2056e-06, 1.2896e-04,\n 1.1794e-04, 2.2746e-04, 1.6985e-06, 5.9872e-06, 1.0515e-04, 8.1016e-05,\n 8.1447e-05, 7.6041e-06, 1.1137e-04, 8.9460e-06, 2.0996e-06, 1.9050e-04,\n 1.2343e-04, 1.7245e-04, 1.0255e-04, 1.0953e-04, 1.0919e-04, 5.8683e-05,\n 1.3136e-04, 2.1726e-04, 7.8684e-05, 1.3435e-04, 6.6953e-06, 7.4107e-06,\n 1.6702e-04, 2.5935e-04, 1.7216e-04, 1.1827e-04, 1.4945e-04, 1.4070e-04,\n 1.3730e-04, 1.0282e-04, 1.0497e-04, 2.0012e-05, 1.3467e-04, 1.4184e-04,\n 7.3608e-05, 7.6452e-05, 8.8413e-07, 6.9574e-05, 1.4512e-04, 6.6037e-05,\n 6.7463e-06, 1.1129e-04, 1.2146e-04, 5.4648e-07, 1.6442e-06, 1.2454e-04,\n 1.4420e-04, 1.5347e-04, 7.9989e-05, 1.4221e-04, 7.9842e-05, 1.4321e-04,\n 8.5637e-05, 6.5051e-05, 9.0108e-05, 1.1111e-04, 1.4506e-04, 1.4121e-04,\n 1.6361e-04, 1.2710e-04, 1.2343e-04, 3.8292e-05, 1.1329e-04, 2.9475e-04,\n 1.0576e-04, 9.4500e-05, 5.2959e-05, 1.2773e-04, 1.2505e-04, 2.0023e-04,\n 3.5716e-06, 9.7151e-05, 1.6800e-04, 5.4568e-05, 1.7418e-04, 1.2755e-04,\n 1.0674e-04, 1.2603e-04, 1.3099e-04, 1.8476e-04, 1.5367e-06, 8.5715e-07,\n 9.8105e-06, 1.3796e-04, 1.0924e-04, 1.4638e-04, 1.5233e-04, 1.8672e-05,\n 9.3651e-05, 1.0190e-04, 1.6308e-05, 1.0922e-04, 7.2146e-05, 9.3805e-05,\n 1.6084e-04, 1.4160e-04, 6.4953e-05, 1.3259e-04, 1.1345e-04, 1.7007e-04,\n 1.2662e-04, 7.4785e-05, 1.3804e-04, 1.3471e-04, 2.1403e-04, 1.7911e-04,\n 1.7954e-04, 7.4847e-05, 1.1543e-04, 9.6103e-05, 1.1780e-04, 9.8543e-05,\n 8.7148e-05, 1.3462e-04, 2.5042e-04, 1.8533e-04, 1.9444e-04, 1.8729e-04,\n 1.6371e-04, 3.8871e-05, 3.1880e-05, 1.4484e-04, 1.1660e-04, 1.3105e-04,\n 6.3615e-05, 3.2822e-07, 1.2267e-05, 9.3126e-07, 1.4859e-04, 1.1661e-04,\n 1.2378e-04, 1.9250e-04, 8.5557e-05, 7.5857e-05, 7.2122e-05, 1.3369e-04,\n 7.1680e-05, 2.9975e-06, 9.6274e-09, 1.7516e-04, 9.9866e-05, 1.9206e-04,\n 1.4256e-04, 1.1975e-04, 1.1671e-06, 8.0871e-05], device='cuda:0')"
14
  },
15
  "2": {
16
  "step": "tensor(1252.)",
17
+ "exp_avg": "tensor([[ 6.2244e-06, 1.0123e-04, 2.6873e-06, ..., -5.1794e-05,\n -1.0963e-20, 9.0553e-05],\n [-1.5695e-05, 3.0202e-04, 7.8999e-06, ..., -4.3161e-05,\n -5.0507e-21, -3.3274e-06],\n [ 6.2648e-08, 3.1202e-05, -4.5084e-05, ..., 1.3314e-04,\n -8.1531e-21, -2.5778e-05],\n ...,\n [-2.5402e-05, -9.5713e-06, 8.4876e-05, ..., -1.2755e-05,\n -4.5398e-20, -9.3574e-05],\n [-3.9413e-05, -2.8487e-04, 1.7388e-05, ..., -4.5623e-05,\n 5.0067e-20, -8.3133e-05],\n [-1.7686e-05, -4.0777e-04, -3.5612e-05, ..., -2.5136e-05,\n -1.9603e-20, 6.6686e-06]], device='cuda:0')",
18
+ "exp_avg_sq": "tensor([[2.3771e-08, 5.6179e-08, 3.7151e-08, ..., 4.8737e-08, 6.5373e-13,\n 6.5375e-08],\n [3.1993e-08, 1.1027e-07, 8.7912e-08, ..., 8.8702e-08, 1.2129e-10,\n 7.8001e-08],\n [3.1502e-08, 8.7614e-08, 6.8821e-08, ..., 7.2139e-08, 8.1122e-10,\n 9.5629e-08],\n ...,\n [1.6788e-08, 9.1308e-08, 8.2521e-08, ..., 9.2985e-08, 5.9039e-10,\n 9.7403e-08],\n [5.4341e-08, 1.2883e-07, 1.0161e-07, ..., 1.1026e-07, 5.3329e-12,\n 2.4452e-07],\n [2.9475e-08, 1.0801e-07, 7.2145e-08, ..., 1.3073e-07, 7.4640e-10,\n 6.5312e-08]], device='cuda:0')"
19
  }
20
  },
21
  "param_groups": [
 
218
  ]
219
  },
220
  "metrics": {
221
+ "best_val_acc": 72.356,
222
  "best_epoch": 0,
223
  "scale_accuracies": {
224
+ "256": 72.356
225
  }
226
  },
227
  "train_config": {
228
  "name": "david_training",
229
+ "run_id": "20251012_032356",
230
  "dataset_name": "AbstractPhil/imagenet-clip-features-orderly",
231
  "model_variant": "clip_vit_b16",
232
  "num_classes": 1000,
weights/train_config.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
  "name": "david_training",
3
- "run_id": "20251012_031919",
4
  "dataset_name": "AbstractPhil/imagenet-clip-features-orderly",
5
  "model_variant": "clip_vit_b16",
6
  "num_classes": 1000,
 
1
  {
2
  "name": "david_training",
3
+ "run_id": "20251012_032356",
4
  "dataset_name": "AbstractPhil/imagenet-clip-features-orderly",
5
  "model_variant": "clip_vit_b16",
6
  "num_classes": 1000,