AbstractPhil commited on
Commit
cc3dcad
·
verified ·
1 Parent(s): 87a4443

Upload weights and configs - David-fully_shared-weighted_sum - Run 20251012_132646

Browse files
weights/David-fully_shared-weighted_sum/20251012_132646/best_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:476f73d3a5cb21b1dbe8626e30c4317f0d553b13865341ef37c7f2e9bc815e46
3
  size 2628344
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f49ab08aa1141f7d9ff7772393084c6250114e0069dd401acf0fa0423324beee
3
  size 2628344
weights/David-fully_shared-weighted_sum/20251012_132646/best_model_metadata.json CHANGED
@@ -1,46 +1,46 @@
1
  {
2
- "epoch": 3,
3
  "optimizer_state_dict": {
4
  "state": {
5
  "0": {
6
- "step": "tensor(5008.)",
7
- "exp_avg": "tensor([[-1.1230e-03, -1.6981e-03, 8.8243e-04, ..., -4.8594e-04,\n -3.8148e-04, 4.4194e-05],\n [ 1.7288e-04, 1.0945e-03, -1.5732e-03, ..., 5.1399e-04,\n -2.7085e-04, 2.2907e-04],\n [ 1.4119e-03, 2.9297e-04, -1.2873e-03, ..., 2.2817e-04,\n 2.7465e-04, 6.3447e-04],\n ...,\n [ 3.8322e-04, 2.2759e-03, 8.5259e-04, ..., -2.6006e-04,\n -1.5257e-04, -1.7237e-04],\n [-1.2525e-04, 1.0728e-03, -8.9537e-04, ..., 1.8505e-05,\n -2.1532e-05, 5.1829e-04],\n [-2.6790e-04, -7.9588e-04, 1.4150e-03, ..., -8.8310e-04,\n 2.5351e-04, 2.0954e-04]], device='cuda:0')",
8
- "exp_avg_sq": "tensor([[4.1530e-06, 2.9445e-05, 1.4735e-05, ..., 3.0969e-06, 2.3536e-06,\n 6.0039e-06],\n [1.0254e-05, 3.1427e-05, 1.7271e-05, ..., 3.9719e-06, 2.3369e-06,\n 5.7316e-06],\n [7.9538e-06, 4.7854e-05, 2.1410e-05, ..., 5.6525e-06, 3.0658e-06,\n 7.2611e-06],\n ...,\n [5.8806e-06, 5.2893e-05, 1.8188e-05, ..., 4.7980e-06, 3.0286e-06,\n 3.7597e-06],\n [4.4071e-06, 3.6163e-05, 1.3799e-05, ..., 3.2340e-06, 2.1710e-06,\n 2.5852e-06],\n [2.7648e-06, 1.3295e-05, 1.1579e-05, ..., 2.7398e-06, 1.6352e-06,\n 2.1448e-06]], device='cuda:0')"
9
  },
10
  "1": {
11
- "step": "tensor(5008.)",
12
- "exp_avg": "tensor([ 1.8826e-02, 9.2450e-03, 5.1239e-02, 1.4302e-02, -1.8116e-02,\n 3.1519e-02, 2.6606e-02, 1.4748e-02, -2.9714e-02, 1.7927e-02,\n -1.9756e-02, 6.4592e-03, -1.9618e-02, -1.3739e-02, 2.1586e-02,\n 3.3201e-03, 5.8719e-02, 8.9494e-03, -7.3825e-03, -4.4088e-03,\n -2.2125e-03, -1.4593e-02, -2.3205e-02, -3.3923e-02, 3.2310e-02,\n -1.1489e-02, 1.7067e-02, 4.0224e-02, -2.4282e-02, 1.9949e-03,\n -1.8096e-02, -3.4114e-02, 2.3217e-02, 1.4321e-02, 4.6799e-03,\n -3.3832e-02, -3.5706e-03, 1.5617e-02, -1.7906e-03, 3.8591e-02,\n 2.3137e-02, -3.8120e-02, -2.2585e-02, -3.2190e-02, 4.1643e-03,\n -9.6754e-03, 1.1373e-03, -3.5916e-02, -1.9638e-02, 5.8868e-03,\n -2.9333e-03, 2.5912e-02, -6.2582e-03, 3.0509e-03, -4.2866e-03,\n 1.3562e-02, 8.1266e-03, 3.6935e-03, -8.2579e-03, 5.1590e-03,\n 4.1672e-03, -2.4474e-02, 1.4971e-02, 2.4181e-02, -4.3989e-03,\n 4.3723e-03, -3.1397e-03, -1.7064e-02, 3.7604e-02, 2.0331e-02,\n 3.6293e-03, -1.6623e-02, 1.2822e-02, -1.2813e-02, 3.9621e-02,\n -1.4388e-02, -9.7019e-03, -1.2867e-02, 5.1088e-03, -3.8703e-03,\n 1.2037e-02, -3.4495e-03, -2.3341e-02, -3.6973e-02, 3.8301e-03,\n 2.6073e-02, 2.1087e-02, 2.3079e-02, 3.4341e-02, -1.2640e-02,\n 2.5137e-02, 3.3887e-03, 6.6774e-02, -2.4435e-02, -3.1510e-02,\n 1.3349e-03, -4.6995e-03, 2.8070e-02, 3.3159e-03, 1.7377e-02,\n 7.4447e-03, -3.5620e-03, -2.9688e-02, -1.5222e-02, -9.6429e-03,\n 6.4860e-03, 7.3786e-03, 6.8267e-03, 4.5014e-04, -2.1046e-02,\n -9.0729e-03, -8.3521e-03, -1.5510e-02, -2.9092e-02, -1.5608e-03,\n 1.0956e-02, -6.8351e-03, 3.4580e-03, -1.5578e-02, -2.3133e-02,\n 1.0579e-02, 1.6689e-02, 2.5875e-03, 3.5160e-02, -3.9335e-03,\n 5.4056e-03, -5.7879e-03, 2.7108e-03, 1.7901e-02, -3.3624e-02,\n -1.1064e-02, 2.1946e-02, -1.3397e-02, 6.9708e-03, -2.1429e-02,\n -1.5614e-02, -1.3486e-02, -3.6082e-03, 3.4211e-02, 1.0375e-03,\n 2.0678e-03, 9.6109e-03, 1.8691e-02, 4.8153e-04, -4.8446e-03,\n 1.1434e-02, -6.7119e-02, -1.1511e-02, -4.7919e-03, 3.4753e-02,\n 4.9036e-02, -1.8307e-02, 1.8229e-02, 1.8918e-02, 8.2896e-03,\n 8.2585e-03, -9.2288e-03, -5.7169e-02, 1.3355e-02, 2.4652e-02,\n -1.1623e-02, 1.2202e-03, 3.7813e-03, 6.3779e-03, -1.8253e-02,\n 5.0765e-03, -4.1184e-03, 1.5841e-02, -3.1552e-03, 2.7844e-02,\n 4.0947e-03, -2.6546e-02, 6.6179e-03, -1.1272e-02, -4.3845e-02,\n 2.5156e-02, -3.2176e-02, -5.1441e-04, -3.2315e-03, -2.9269e-03,\n 2.8880e-03, -8.4696e-02, 2.8344e-03, 1.7418e-02, -8.5503e-03,\n -1.2802e-02, 2.7067e-02, 2.8389e-02, -2.9499e-03, -4.3166e-02,\n -1.2561e-03, -1.5049e-03, 1.4530e-02, -2.4177e-02, -4.0094e-02,\n -2.8498e-02, 5.7119e-03, -6.6086e-03, 7.7728e-03, -1.9267e-02,\n -1.5791e-02, 1.2833e-02, -8.7338e-03, -6.9153e-03, -5.3013e-03,\n -1.3133e-02, -2.7093e-02, 3.7075e-03, 1.7775e-02, 3.7392e-03,\n 1.7764e-02, -5.6612e-03, -1.0525e-02, 5.4252e-03, 4.8284e-02,\n -3.8916e-02, -1.4168e-02, -2.1915e-03, -3.2065e-04, 7.2808e-03,\n 1.6518e-02, 2.0289e-02, 3.3099e-03, -1.0053e-02, 4.4124e-02,\n 8.9763e-03, 2.0367e-03, 1.8085e-02, -8.9079e-03, -4.0361e-02,\n 6.3477e-03, -1.1543e-03, -4.6127e-02, -5.6799e-03, 1.2302e-02,\n 9.4722e-03, -4.2716e-02, 4.9635e-03, 6.7600e-03, -1.4022e-02,\n -2.1022e-02, -2.6975e-02, -6.0806e-02, 7.8315e-03, 1.1706e-02,\n -4.3994e-03, 2.1043e-03, -7.2372e-03, -3.3396e-02, -2.5032e-02,\n -1.7885e-02, 1.1947e-03, -2.6102e-02, -8.6965e-03, -1.3452e-02,\n 4.0446e-02, 1.0915e-02, -2.0816e-02, -2.4208e-03, -1.2709e-02,\n -1.3052e-02, -2.2749e-02, -6.1472e-03, 1.9950e-03, 1.3153e-02,\n 2.2318e-03, 2.5194e-02, 3.6230e-03, 7.0193e-03, 5.1776e-03,\n -2.3208e-03, 5.7883e-02, 3.1093e-02, 2.4320e-02, -4.9186e-03,\n 3.1006e-03, -5.0278e-03, 1.4702e-02, 1.0584e-02, -6.6311e-03,\n -2.4885e-03, -2.5256e-02, 2.2617e-02, 2.5140e-02, -1.7339e-02,\n 3.4625e-02, -2.6482e-02, 1.7238e-02, -7.2231e-03, 3.2412e-02,\n -1.2149e-01, -8.3441e-03, 6.1203e-04, -3.2988e-02, -1.1938e-02,\n -2.3012e-02, -2.2362e-02, 2.4986e-02, 1.6660e-02, -1.0288e-02,\n 1.0746e-02, 1.0570e-02, -1.8688e-02, -2.4399e-03, 1.9430e-02,\n 1.2458e-02, 3.5908e-03, 1.4565e-02, 8.5969e-03, 1.8819e-02,\n 1.9277e-02, 2.3331e-02, 1.5028e-02, -1.7221e-02, -3.4583e-02,\n 2.4806e-02, -2.1692e-02, 1.9058e-02, 3.7500e-02, 9.4620e-03,\n -7.2598e-02, 3.0671e-03, -7.7230e-05, 1.3034e-02, 1.4009e-02,\n -2.3234e-02, 2.2420e-02, -1.3788e-02, -2.9124e-02, 2.6816e-02,\n -4.4457e-03, -1.2709e-02, 3.0509e-02, -1.3827e-02, 2.5645e-02,\n -9.8564e-03, 2.0699e-02, 1.6752e-02, -2.2014e-02, 1.0980e-02,\n 1.2349e-02, 1.2173e-02, 1.0898e-02, 5.8900e-03, 3.9373e-02,\n -3.0039e-03, -4.3118e-02, 7.5014e-03, 1.0188e-02, 2.2672e-02,\n -3.0225e-02, -8.6984e-03, 1.6676e-02, 1.6920e-02, 2.9734e-03,\n -3.4277e-02, 1.0660e-03, 3.3736e-02, -1.0036e-02, 9.3334e-04,\n -1.0929e-02, 1.8014e-02, -1.5273e-02, 1.8896e-02, 1.1528e-02,\n 5.3778e-04, -2.6961e-02, -1.2374e-02, -2.8883e-03, 2.9925e-02,\n -5.1151e-02, 3.9963e-02, -7.2218e-03, 2.9892e-03, 1.9375e-02,\n 8.8027e-03, 1.5175e-02, 1.9207e-02, 2.7136e-02, -1.5579e-02,\n 1.0864e-02, -1.3314e-02, -3.2899e-02, 2.6386e-02, -7.0221e-03,\n 1.8596e-02, 5.7813e-03, -1.0817e-02, -1.1234e-02, -1.1643e-03,\n -3.8568e-02, 3.4877e-03, -8.2193e-03, 9.6313e-03, -2.0926e-02,\n 6.3420e-03, 1.9087e-02, -6.0869e-03, 1.3991e-03, 1.3895e-02,\n -7.5625e-03, -2.0593e-02, -1.7436e-02, -2.7332e-02, 6.9042e-03,\n -2.4734e-02, 2.1061e-02, -6.5042e-03, 1.1484e-02, 8.1219e-03,\n -1.3500e-02, -7.4161e-03, 1.9782e-03, -4.9849e-03, 1.1346e-02,\n -3.7154e-02, 2.3436e-02, 1.2989e-02, -1.1469e-02, 1.6544e-02,\n 8.6258e-03, -3.5089e-02, -5.3416e-03, -7.8483e-03, 4.3648e-03,\n 1.0035e-02, -1.0845e-03, 7.2523e-03, 4.3262e-02, 2.2422e-03,\n -7.4405e-03, -6.3825e-04, 2.3108e-02, 1.4278e-02, -1.4173e-03,\n 1.9439e-02, 2.2908e-03, 2.5176e-02, 5.4866e-03, 5.9009e-05,\n 5.7709e-03, -1.9140e-02, -2.1233e-02, -1.7427e-02, -1.2646e-02,\n -4.1329e-02, -1.3818e-02, -1.3989e-02, -3.3200e-02, 7.4491e-03,\n 5.3278e-03, -7.4798e-03, 2.2317e-02, -9.0632e-03, 1.3627e-02,\n 1.6893e-03, 1.1815e-02, -9.0258e-03, 1.0307e-02, -1.6499e-02,\n -2.6021e-02, -1.5008e-02, -1.4901e-02, 2.8010e-02, 1.5537e-03,\n 2.9730e-02, 1.5684e-02, 1.3571e-02, 1.4725e-02, -2.2389e-02,\n 6.6216e-03, -1.0543e-03, 3.1137e-02, -5.0946e-02, -1.3019e-02,\n -1.2717e-02, -8.9111e-03, 3.8591e-03, -6.8286e-03, -2.4602e-02,\n 6.0984e-03, -5.0637e-03, -5.2850e-02, -1.2824e-02, 2.1947e-02,\n 2.4265e-02, 1.3512e-03, 7.2249e-02, -6.4477e-03, -4.9032e-04,\n 2.5237e-02, 9.2552e-03, -2.0605e-02, -5.9785e-03, 4.1271e-02,\n -4.4904e-03, -2.4063e-03, 4.0602e-02, 6.6938e-05, 1.0767e-02,\n 4.1942e-05, -6.4488e-03, -9.9551e-03, 1.1847e-02, -3.6731e-03,\n 8.7070e-03, -1.8285e-02, 6.4866e-03, 5.7810e-02, 1.4422e-02,\n 9.9396e-03, -1.7762e-03], device='cuda:0')",
13
- "exp_avg_sq": "tensor([0.0040, 0.0043, 0.0064, 0.0049, 0.0033, 0.0028, 0.0054, 0.0042, 0.0039,\n 0.0036, 0.0049, 0.0036, 0.0033, 0.0047, 0.0048, 0.0045, 0.0052, 0.0034,\n 0.0030, 0.0041, 0.0058, 0.0035, 0.0030, 0.0033, 0.0056, 0.0040, 0.0039,\n 0.0031, 0.0050, 0.0057, 0.0047, 0.0054, 0.0047, 0.0044, 0.0037, 0.0094,\n 0.0036, 0.0029, 0.0030, 0.0065, 0.0063, 0.0039, 0.0041, 0.0059, 0.0018,\n 0.0060, 0.0018, 0.0039, 0.0035, 0.0022, 0.0034, 0.0026, 0.0046, 0.0043,\n 0.0037, 0.0029, 0.0028, 0.0025, 0.0030, 0.0042, 0.0019, 0.0034, 0.0049,\n 0.0058, 0.0039, 0.0062, 0.0036, 0.0027, 0.0075, 0.0064, 0.0033, 0.0091,\n 0.0032, 0.0036, 0.0036, 0.0044, 0.0037, 0.0017, 0.0029, 0.0056, 0.0032,\n 0.0041, 0.0034, 0.0029, 0.0006, 0.0044, 0.0046, 0.0058, 0.0030, 0.0039,\n 0.0059, 0.0033, 0.0068, 0.0034, 0.0053, 0.0043, 0.0040, 0.0044, 0.0033,\n 0.0052, 0.0035, 0.0037, 0.0052, 0.0048, 0.0025, 0.0051, 0.0024, 0.0048,\n 0.0049, 0.0039, 0.0041, 0.0042, 0.0030, 0.0038, 0.0024, 0.0029, 0.0064,\n 0.0022, 0.0020, 0.0047, 0.0032, 0.0037, 0.0017, 0.0030, 0.0044, 0.0046,\n 0.0066, 0.0035, 0.0048, 0.0040, 0.0049, 0.0017, 0.0025, 0.0037, 0.0024,\n 0.0052, 0.0054, 0.0017, 0.0072, 0.0039, 0.0022, 0.0051, 0.0036, 0.0030,\n 0.0016, 0.0064, 0.0121, 0.0075, 0.0041, 0.0063, 0.0044, 0.0042, 0.0041,\n 0.0036, 0.0046, 0.0058, 0.0031, 0.0038, 0.0019, 0.0034, 0.0049, 0.0063,\n 0.0028, 0.0047, 0.0064, 0.0088, 0.0034, 0.0031, 0.0041, 0.0062, 0.0021,\n 0.0033, 0.0037, 0.0027, 0.0051, 0.0048, 0.0054, 0.0033, 0.0067, 0.0044,\n 0.0063, 0.0041, 0.0076, 0.0041, 0.0050, 0.0055, 0.0044, 0.0036, 0.0032,\n 0.0047, 0.0049, 0.0032, 0.0034, 0.0037, 0.0046, 0.0062, 0.0060, 0.0054,\n 0.0026, 0.0049, 0.0045, 0.0036, 0.0047, 0.0056, 0.0032, 0.0043, 0.0028,\n 0.0047, 0.0033, 0.0090, 0.0037, 0.0035, 0.0058, 0.0045, 0.0065, 0.0039,\n 0.0027, 0.0032, 0.0040, 0.0062, 0.0041, 0.0052, 0.0041, 0.0027, 0.0050,\n 0.0039, 0.0036, 0.0060, 0.0049, 0.0037, 0.0024, 0.0047, 0.0049, 0.0069,\n 0.0045, 0.0031, 0.0035, 0.0062, 0.0046, 0.0065, 0.0023, 0.0045, 0.0046,\n 0.0049, 0.0074, 0.0081, 0.0016, 0.0039, 0.0069, 0.0024, 0.0052, 0.0035,\n 0.0035, 0.0007, 0.0018, 0.0043, 0.0041, 0.0040, 0.0047, 0.0036, 0.0030,\n 0.0038, 0.0051, 0.0045, 0.0035, 0.0048, 0.0053, 0.0040, 0.0022, 0.0040,\n 0.0066, 0.0040, 0.0037, 0.0063, 0.0056, 0.0041, 0.0035, 0.0054, 0.0040,\n 0.0047, 0.0036, 0.0062, 0.0051, 0.0045, 0.0041, 0.0023, 0.0063, 0.0031,\n 0.0036, 0.0057, 0.0057, 0.0042, 0.0023, 0.0056, 0.0040, 0.0083, 0.0048,\n 0.0042, 0.0043, 0.0043, 0.0045, 0.0035, 0.0055, 0.0057, 0.0038, 0.0037,\n 0.0045, 0.0051, 0.0041, 0.0051, 0.0057, 0.0054, 0.0031, 0.0049, 0.0059,\n 0.0028, 0.0039, 0.0042, 0.0038, 0.0024, 0.0048, 0.0021, 0.0036, 0.0054,\n 0.0041, 0.0066, 0.0045, 0.0051, 0.0042, 0.0053, 0.0033, 0.0023, 0.0020,\n 0.0050, 0.0050, 0.0033, 0.0055, 0.0052, 0.0052, 0.0043, 0.0055, 0.0030,\n 0.0043, 0.0036, 0.0027, 0.0043, 0.0050, 0.0042, 0.0029, 0.0048, 0.0025,\n 0.0040, 0.0039, 0.0051, 0.0042, 0.0076, 0.0044, 0.0047, 0.0030, 0.0039,\n 0.0045, 0.0056, 0.0044, 0.0025, 0.0061, 0.0060, 0.0046, 0.0033, 0.0029,\n 0.0066, 0.0054, 0.0055, 0.0025, 0.0032, 0.0041, 0.0040, 0.0038, 0.0052,\n 0.0045, 0.0052, 0.0060, 0.0037, 0.0064, 0.0044, 0.0032, 0.0049, 0.0049,\n 0.0029, 0.0062, 0.0056, 0.0054, 0.0045, 0.0026, 0.0063, 0.0048, 0.0054,\n 0.0046, 0.0058, 0.0043, 0.0040, 0.0018, 0.0032, 0.0031, 0.0064, 0.0023,\n 0.0059, 0.0067, 0.0043, 0.0041, 0.0030, 0.0035, 0.0027, 0.0017, 0.0051,\n 0.0051, 0.0048, 0.0027, 0.0045, 0.0032, 0.0093, 0.0029, 0.0059, 0.0098,\n 0.0023, 0.0050, 0.0048, 0.0037, 0.0056, 0.0040, 0.0033, 0.0037, 0.0047,\n 0.0053, 0.0036, 0.0030, 0.0041, 0.0033, 0.0036, 0.0025, 0.0033, 0.0024,\n 0.0069, 0.0056, 0.0039, 0.0022, 0.0048, 0.0046, 0.0036, 0.0072, 0.0060,\n 0.0034, 0.0038, 0.0038, 0.0044, 0.0042, 0.0039, 0.0040, 0.0018, 0.0023,\n 0.0092, 0.0045, 0.0034, 0.0068, 0.0051, 0.0046, 0.0057, 0.0064, 0.0044,\n 0.0034, 0.0043, 0.0072, 0.0035, 0.0046, 0.0031, 0.0047, 0.0026, 0.0026,\n 0.0063, 0.0037, 0.0046, 0.0073, 0.0037, 0.0049, 0.0020, 0.0033, 0.0032,\n 0.0037, 0.0068, 0.0037, 0.0053, 0.0031, 0.0037, 0.0051, 0.0029, 0.0099,\n 0.0055, 0.0036, 0.0058, 0.0033, 0.0068, 0.0037, 0.0053, 0.0032, 0.0026,\n 0.0049, 0.0027, 0.0065, 0.0038, 0.0095, 0.0046, 0.0036, 0.0029],\n device='cuda:0')"
14
  },
15
  "2": {
16
- "step": "tensor(5008.)",
17
- "exp_avg": "tensor([ 1.5637e-03, 1.1331e-03, 6.3570e-03, 1.5253e-03, -5.2898e-03,\n 8.3879e-03, 2.3779e-03, 2.3403e-03, -3.3713e-03, 3.2798e-03,\n -2.7316e-03, 2.3929e-03, -3.7851e-03, -1.6408e-03, 3.2766e-03,\n 1.8150e-03, 8.8428e-03, 1.7770e-03, -1.6138e-03, -1.2442e-03,\n -1.9715e-04, -3.8505e-03, -5.6693e-03, -9.1981e-03, 3.0765e-03,\n -1.9992e-03, 6.1373e-03, 6.6007e-03, -2.4273e-03, 7.8320e-04,\n -2.1833e-03, -5.5062e-04, 4.3956e-03, 1.6076e-03, -7.4118e-05,\n -3.2350e-03, -1.6134e-03, 3.6158e-03, -3.4705e-04, 5.1396e-03,\n 4.1571e-03, -8.4949e-03, -3.6366e-03, -3.6467e-03, 1.3956e-03,\n -1.3255e-03, 1.2478e-03, -6.8331e-03, -5.4349e-03, 1.7584e-03,\n 5.5563e-04, 5.4039e-03, -2.0392e-03, -1.9413e-04, -7.7759e-04,\n 1.1283e-03, 1.9054e-03, 1.1418e-03, -2.8994e-03, 5.5052e-04,\n 1.2070e-03, -4.9494e-03, 2.5321e-03, 2.5224e-03, -1.7651e-03,\n -5.8677e-04, -1.8712e-03, -4.2110e-03, 4.0981e-03, 3.4653e-03,\n 1.9871e-03, -2.4918e-03, 2.5319e-03, -2.0132e-03, 8.3889e-03,\n -2.5534e-03, -9.9281e-04, -7.1519e-03, 1.1709e-03, -5.4243e-04,\n 2.7622e-03, -1.6514e-03, -3.7645e-03, -7.8327e-03, 1.7744e-02,\n 3.3313e-03, 3.3014e-03, 2.3544e-03, 9.1376e-03, -2.3299e-03,\n 3.9793e-03, -1.5084e-04, 4.8612e-03, -7.9764e-03, -4.4329e-03,\n 1.2382e-03, -6.3019e-04, 4.8229e-03, 9.3515e-04, 3.3755e-03,\n 2.1709e-03, -7.4667e-05, -4.0581e-03, -2.2337e-03, -5.2629e-03,\n 4.4666e-04, 1.5305e-03, 1.1986e-03, 9.7193e-07, -3.7198e-03,\n -1.8105e-03, -1.3496e-03, -2.9405e-03, -5.6836e-03, 3.5774e-04,\n 2.7856e-03, -6.2601e-04, -4.2445e-04, -5.6002e-03, -3.0331e-03,\n 2.2639e-03, 2.4479e-03, 2.6321e-03, 7.9847e-03, -2.4252e-04,\n 1.0002e-03, -7.5899e-04, 3.1623e-04, 2.3828e-03, -5.7131e-03,\n -1.2818e-03, 1.3927e-02, -4.3597e-03, 1.3153e-03, -3.9436e-03,\n -1.0681e-03, -1.7330e-03, 8.8354e-04, 3.6809e-03, -7.6309e-04,\n 3.2238e-03, 1.9947e-04, 4.0161e-03, 1.5780e-03, -1.3455e-03,\n 1.5874e-03, -7.7936e-03, -1.2151e-03, -1.3381e-03, 4.2631e-03,\n 7.8867e-03, -3.4176e-03, 3.4302e-03, 3.5700e-03, 2.0708e-04,\n 3.8596e-04, -3.9538e-03, -1.3080e-02, 4.7764e-03, 5.4275e-03,\n -2.4672e-03, -2.6849e-04, -6.0117e-05, 1.0519e-03, -2.4120e-03,\n 7.9954e-05, -2.1970e-03, 4.6195e-03, 2.2314e-05, 3.6972e-03,\n 4.7364e-04, -2.0202e-03, 1.6837e-03, -1.6608e-03, -5.0006e-03,\n 2.8853e-03, -4.2246e-03, 5.6656e-05, -3.4071e-04, -1.3522e-03,\n 1.5905e-03, -1.1995e-02, 2.3916e-04, 1.8017e-03, -1.1774e-03,\n 2.9518e-04, 2.8723e-03, 5.4799e-03, -7.1523e-04, -4.8157e-03,\n -1.8695e-03, -1.2530e-03, 3.3510e-03, -4.9661e-03, -3.5618e-03,\n -4.6777e-03, 5.8857e-04, -1.8104e-03, 3.3910e-03, -6.3014e-03,\n -6.7493e-04, 1.9431e-03, -1.5187e-03, -2.0627e-03, -7.6643e-04,\n -9.0444e-04, -7.9063e-03, 2.0442e-04, 4.2483e-03, 9.5781e-04,\n 2.9150e-03, -1.6241e-03, -3.9101e-03, 4.0494e-04, 4.7711e-03,\n -6.2297e-03, -5.3865e-03, -2.3949e-03, 2.5871e-04, 1.0842e-03,\n 3.0142e-03, 1.4479e-03, 1.6725e-03, -2.4770e-03, 5.3801e-03,\n 2.9238e-03, -5.1469e-04, 2.2795e-03, 1.6863e-04, -4.7410e-03,\n -2.9515e-03, 7.0501e-04, -7.2585e-03, -7.0893e-04, 7.5173e-04,\n 4.4746e-03, -1.0040e-02, 5.2203e-04, 5.5522e-04, -7.4918e-04,\n -6.6960e-03, -6.5837e-03, -1.1347e-02, 1.2861e-03, 1.6720e-03,\n -2.6619e-03, 1.5145e-03, -3.4372e-04, -4.0455e-03, -8.4521e-03,\n -4.9356e-03, -4.9877e-04, -5.1602e-03, -4.1158e-02, -5.5503e-03,\n 9.5820e-03, 2.4651e-03, -4.5891e-03, -7.7031e-04, -4.9482e-03,\n -3.1116e-03, -4.9030e-03, -1.3765e-03, 1.0995e-03, 2.6602e-03,\n -2.8690e-04, 3.0339e-03, 2.6024e-04, 3.2000e-03, 5.2323e-04,\n -6.2582e-04, 1.2948e-02, 5.4504e-03, 3.7211e-03, -5.5264e-04,\n 2.0485e-04, -1.7893e-03, 2.9001e-03, 1.7439e-03, -1.6614e-04,\n -2.0795e-03, -3.0921e-03, 2.9284e-03, 6.2525e-03, -3.8834e-03,\n 1.2916e-02, -2.0872e-03, 2.5457e-03, -3.3909e-04, 5.3209e-03,\n -1.2311e-02, -1.5753e-03, 8.4622e-04, -5.1752e-03, -2.0433e-03,\n -2.5980e-03, -3.5568e-03, 2.7918e-03, 2.3728e-03, -2.0323e-03,\n 1.4495e-03, 9.6842e-04, -2.4979e-03, -4.4124e-04, 2.9860e-03,\n 9.5480e-04, 5.9629e-04, 1.2403e-03, 5.7443e-04, 2.2416e-03,\n 2.8539e-03, 4.3555e-03, 3.3092e-03, -1.5052e-05, -7.0476e-03,\n 5.2002e-03, -3.4017e-03, 4.8848e-03, 4.5802e-03, 1.9291e-03,\n -1.2934e-02, 1.0005e-03, 1.8790e-04, 9.9918e-04, 2.2771e-03,\n -2.7146e-03, 4.5488e-03, -3.9269e-04, -9.5604e-03, 4.3809e-03,\n -1.1777e-03, -3.8840e-03, 1.4149e-02, -2.0829e-03, 4.7894e-03,\n -4.5252e-03, 3.1743e-03, 6.4039e-03, -1.6988e-03, 1.9086e-03,\n 7.0879e-04, 2.7432e-03, 1.0088e-03, 1.7484e-03, 1.3466e-02,\n 5.6593e-04, -7.4784e-03, 1.7661e-03, 7.1077e-05, 3.1699e-03,\n -8.6904e-03, -2.2616e-03, 3.6547e-03, 2.2356e-03, 6.0370e-04,\n -4.6223e-03, 6.1233e-04, 4.4147e-03, -3.1454e-03, 8.0866e-04,\n -1.6000e-03, 2.3895e-03, -2.4401e-03, 5.0198e-03, 1.4081e-03,\n 5.2904e-05, -2.1126e-03, -4.0217e-03, -1.6847e-04, 4.7040e-03,\n -9.3510e-03, 5.9152e-03, -1.5079e-04, 2.1108e-04, 4.0704e-03,\n 2.7419e-03, 2.0107e-03, 1.9175e-03, 6.1114e-03, -2.3153e-03,\n 9.4298e-04, -2.1065e-03, -3.2045e-03, 7.6808e-03, -1.2134e-03,\n 3.4460e-03, 1.5884e-03, -2.9380e-03, -1.7970e-03, -1.9316e-03,\n -7.3167e-03, 6.8377e-04, -3.7814e-03, 2.4459e-03, -2.6305e-03,\n 2.9982e-03, 1.6166e-03, -1.3900e-04, 1.0294e-05, 2.5463e-03,\n -1.5701e-03, -4.1301e-03, -5.9673e-03, -4.2009e-03, 1.1908e-03,\n -2.3197e-03, 2.0371e-03, -1.2731e-03, 1.3982e-03, 2.2241e-03,\n -3.6285e-03, -4.9339e-03, 3.2035e-03, -4.6974e-04, 1.4820e-03,\n -3.7954e-03, 4.6122e-03, 2.3582e-03, -3.2672e-03, 3.9615e-03,\n 3.2876e-03, -4.1430e-03, -4.4520e-04, -4.5813e-03, 1.9136e-03,\n 1.7037e-03, -2.5789e-04, -5.4252e-04, 1.5001e-02, 4.8935e-04,\n -2.9632e-03, 6.8849e-05, 3.1083e-03, 2.3438e-03, 1.3715e-04,\n 2.2875e-03, 1.2438e-03, 2.4613e-03, -7.1723e-04, -2.6003e-04,\n 2.0538e-03, -1.9543e-03, -2.1281e-03, -1.0952e-03, -8.1909e-03,\n -6.0105e-03, -3.8879e-03, -9.5963e-04, -5.9575e-03, 1.7417e-03,\n 1.7456e-03, -2.4974e-03, 2.2621e-03, -7.7044e-04, 1.9886e-03,\n 9.8562e-04, 1.6273e-03, -1.0239e-02, 3.2646e-03, -3.0718e-03,\n -2.3390e-03, -2.1378e-03, -2.4323e-03, 3.9756e-03, -9.4067e-05,\n 2.0967e-03, 1.3855e-03, 3.5729e-03, 2.6354e-03, -2.2136e-03,\n 6.8377e-04, 3.0151e-05, 5.4546e-03, -1.4087e-02, -2.3797e-03,\n -2.5428e-03, -1.8049e-03, 4.3431e-05, -2.1986e-03, -5.6161e-03,\n 8.0044e-04, -1.6199e-03, -6.9479e-03, -6.6103e-03, 8.1480e-03,\n 6.2698e-03, 1.5187e-03, 1.1297e-02, -2.9504e-04, 2.6824e-04,\n 8.5132e-03, 1.3827e-03, -2.9369e-03, -1.9412e-03, 4.9061e-03,\n -2.1001e-03, 4.7557e-04, 5.4240e-03, -6.8520e-04, 1.3993e-03,\n -8.3853e-04, 6.0229e-04, -9.1813e-04, 4.5081e-03, 2.0948e-03,\n 2.4591e-03, -2.5379e-03, 9.7504e-05, 8.5393e-03, 1.4853e-03,\n 4.5573e-03, -1.4257e-03], device='cuda:0')",
18
- "exp_avg_sq": "tensor([8.5181e-05, 7.6540e-05, 6.9160e-05, 5.8538e-05, 1.7873e-04, 1.6369e-04,\n 5.5226e-05, 5.6506e-05, 7.5931e-05, 9.9937e-05, 8.9579e-05, 2.6836e-04,\n 6.8846e-05, 9.8901e-05, 9.9787e-05, 8.4669e-05, 5.6392e-05, 2.5266e-04,\n 1.5246e-04, 1.1826e-04, 7.0538e-05, 1.4403e-04, 1.7788e-04, 1.4277e-04,\n 5.3319e-05, 8.4194e-05, 2.1612e-04, 7.0942e-05, 5.2329e-05, 8.9419e-05,\n 7.3923e-05, 4.0005e-05, 1.2302e-04, 4.2182e-05, 8.3777e-05, 1.0057e-04,\n 8.4290e-05, 1.3238e-04, 1.5412e-04, 1.1738e-04, 1.4307e-04, 1.1434e-04,\n 1.0897e-04, 7.9403e-05, 1.1551e-04, 1.1009e-04, 3.2317e-04, 1.0975e-04,\n 1.5649e-04, 3.1015e-04, 1.2146e-04, 1.0338e-04, 8.8347e-05, 6.9724e-05,\n 1.0081e-04, 8.8853e-05, 1.1075e-04, 1.7167e-04, 8.4072e-05, 1.3335e-04,\n 1.9454e-04, 1.3711e-04, 1.0672e-04, 6.9389e-05, 1.3600e-04, 5.6569e-05,\n 1.2727e-04, 1.5792e-04, 6.9525e-05, 1.0495e-04, 8.0570e-05, 1.0711e-04,\n 7.3610e-05, 6.8021e-05, 1.1544e-04, 1.1008e-04, 6.5307e-05, 3.8277e-04,\n 2.0406e-04, 5.5952e-05, 2.1824e-04, 9.4292e-05, 8.1942e-05, 1.0774e-04,\n 1.0975e-01, 6.8056e-05, 9.6144e-05, 4.5391e-05, 1.1438e-04, 8.5799e-05,\n 1.3679e-04, 1.0774e-04, 5.0444e-05, 2.2922e-04, 6.3621e-05, 8.2976e-05,\n 9.4708e-05, 8.5147e-05, 1.0316e-04, 1.2862e-04, 8.5365e-05, 6.6713e-05,\n 1.8550e-04, 7.5622e-05, 3.9042e-04, 5.7683e-05, 2.1052e-04, 9.4636e-05,\n 8.2362e-05, 1.0202e-04, 1.2800e-04, 7.9737e-05, 7.7803e-05, 9.6021e-05,\n 1.5262e-04, 1.0941e-04, 1.4592e-04, 2.7731e-04, 2.7086e-04, 1.0332e-04,\n 9.3495e-05, 4.8591e-05, 5.1994e-04, 9.8420e-05, 4.4647e-05, 6.0561e-05,\n 6.3075e-05, 8.4102e-05, 4.3204e-05, 7.2744e-05, 9.8594e-05, 6.2543e-04,\n 1.5396e-04, 7.3329e-05, 8.5270e-05, 5.7911e-05, 6.6661e-05, 3.7964e-04,\n 6.3794e-05, 1.5260e-04, 1.6342e-04, 5.1682e-05, 9.9206e-05, 1.8306e-04,\n 2.8062e-04, 8.7257e-05, 1.2546e-04, 9.2811e-05, 5.2118e-05, 5.6137e-05,\n 1.0631e-04, 8.8958e-05, 9.8355e-05, 8.3003e-05, 5.6856e-05, 8.2253e-05,\n 3.1770e-04, 1.3943e-04, 2.0053e-04, 9.4031e-05, 7.5362e-05, 1.1385e-04,\n 2.7963e-04, 8.5839e-05, 5.5629e-05, 1.0778e-04, 1.7742e-04, 2.1947e-04,\n 8.5615e-05, 9.0991e-05, 2.0305e-04, 1.0731e-04, 1.0874e-04, 1.8500e-04,\n 8.3808e-05, 7.8731e-05, 7.9927e-05, 6.8185e-05, 6.0940e-05, 8.6364e-05,\n 8.9142e-05, 1.2770e-04, 6.4104e-05, 5.2132e-05, 5.9187e-05, 7.8621e-05,\n 9.4734e-05, 1.0262e-04, 9.4835e-05, 1.1780e-04, 2.5116e-04, 1.8043e-04,\n 7.0380e-05, 1.0749e-04, 3.9852e-05, 6.4969e-05, 5.0384e-05, 7.5243e-05,\n 2.3609e-04, 1.2863e-04, 3.6214e-05, 1.0219e-04, 8.6961e-05, 6.0282e-05,\n 7.6318e-05, 6.1607e-05, 1.8889e-04, 7.8364e-05, 2.0820e-04, 1.9055e-04,\n 1.2100e-04, 1.4280e-04, 8.6052e-05, 5.5838e-05, 1.1421e-04, 1.5386e-04,\n 2.6858e-04, 6.4796e-05, 1.0250e-04, 8.2069e-05, 1.4898e-04, 7.4218e-05,\n 9.7484e-05, 1.6798e-04, 6.8435e-05, 1.1001e-04, 1.1639e-04, 5.9624e-05,\n 1.1308e-04, 1.0449e-04, 2.3216e-04, 1.0495e-04, 7.2232e-05, 7.9661e-05,\n 4.7154e-05, 1.8461e-04, 1.3631e-04, 7.8458e-05, 6.0728e-05, 5.9072e-05,\n 2.1917e-04, 1.3997e-04, 1.2691e-04, 5.0728e-05, 7.8870e-05, 8.8276e-05,\n 4.5411e-04, 7.5987e-05, 7.8900e-05, 2.0889e-04, 7.8996e-05, 1.0774e-04,\n 2.7114e-04, 6.9288e-03, 3.0527e-04, 1.0167e-04, 1.3662e-04, 1.2929e-04,\n 6.6372e-05, 1.4790e-04, 1.0635e-04, 1.3523e-04, 7.0672e-05, 7.4412e-05,\n 1.7286e-04, 7.3732e-05, 1.1508e-04, 5.4867e-05, 2.6548e-04, 6.6427e-05,\n 7.4630e-05, 2.0490e-04, 7.3035e-05, 7.9467e-05, 1.1346e-04, 6.1307e-05,\n 2.0775e-04, 5.4481e-05, 4.7012e-05, 7.2863e-05, 9.6463e-05, 4.4750e-05,\n 4.8941e-05, 1.4008e-04, 9.6039e-05, 2.2207e-04, 7.1188e-05, 1.0957e-04,\n 7.8019e-05, 1.2864e-04, 7.7467e-05, 9.4558e-05, 2.0031e-04, 1.2282e-04,\n 8.3006e-05, 7.0955e-05, 1.1043e-04, 7.1206e-05, 8.2549e-05, 5.2150e-05,\n 5.9106e-05, 7.2927e-05, 7.6705e-05, 8.5511e-05, 8.4014e-05, 5.5332e-05,\n 7.1404e-05, 1.3070e-04, 6.1098e-05, 7.9744e-05, 8.5379e-05, 6.7078e-05,\n 1.0844e-04, 5.8691e-05, 8.1497e-05, 1.4583e-04, 1.9364e-04, 1.1972e-04,\n 5.1649e-05, 1.6834e-04, 1.0426e-04, 2.7651e-04, 9.2908e-05, 1.0991e-04,\n 1.7730e-04, 7.8310e-05, 1.1935e-04, 6.5991e-05, 1.7140e-04, 1.4463e-04,\n 1.9471e-04, 1.4845e-04, 3.5586e-04, 6.2301e-05, 1.2379e-04, 1.5848e-04,\n 1.1358e-04, 1.6632e-04, 1.0273e-04, 1.2483e-04, 7.0481e-05, 1.8110e-04,\n 4.5939e-05, 8.9607e-05, 2.0460e-04, 7.0496e-05, 1.0939e-04, 1.0279e-04,\n 1.5531e-04, 1.1121e-04, 1.3447e-04, 1.0933e-04, 1.4408e-04, 7.0176e-05,\n 1.0078e-04, 9.8290e-05, 1.1187e-04, 6.8561e-05, 8.9006e-05, 5.0292e-05,\n 7.9085e-05, 7.2157e-05, 6.2548e-05, 1.8419e-04, 8.0337e-05, 1.8433e-04,\n 5.8556e-05, 2.8369e-04, 1.5772e-04, 6.9203e-05, 1.1821e-04, 1.3874e-04,\n 1.5467e-04, 1.0363e-04, 1.2180e-04, 1.2505e-04, 6.4642e-05, 5.2114e-05,\n 1.1171e-04, 8.1772e-05, 6.4010e-05, 1.5791e-04, 7.0903e-05, 1.6018e-04,\n 1.4143e-04, 2.1900e-04, 6.7894e-05, 1.0575e-04, 1.0790e-04, 1.5127e-04,\n 7.7488e-05, 1.2461e-04, 2.3218e-04, 1.2154e-04, 4.9221e-05, 1.5401e-04,\n 6.5265e-05, 1.8850e-04, 6.2458e-05, 1.9405e-04, 1.6980e-04, 9.7002e-05,\n 2.4445e-04, 9.3908e-05, 2.3616e-04, 7.2644e-05, 8.8782e-05, 6.1520e-05,\n 8.5631e-05, 1.6085e-04, 1.2503e-04, 1.7555e-04, 5.4937e-04, 6.7344e-05,\n 6.2021e-05, 6.0324e-05, 7.7427e-05, 9.5160e-05, 2.0374e-04, 6.2104e-05,\n 7.7439e-05, 8.3824e-05, 5.8404e-05, 3.5826e-04, 9.7618e-05, 1.0263e-04,\n 1.9410e-04, 7.2720e-05, 2.3394e-04, 1.2380e-04, 1.4980e-04, 7.3861e-05,\n 9.8819e-05, 8.7184e-05, 1.0638e-04, 8.4856e-05, 1.5991e-04, 3.8543e-05,\n 2.4692e-04, 6.1860e-05, 1.8556e-04, 5.4125e-05, 3.3263e-05, 4.9241e-05,\n 3.2173e-04, 9.0930e-05, 7.4547e-05, 3.4561e-05, 1.0666e-04, 6.2772e-05,\n 1.1846e-04, 1.0371e-04, 5.9603e-05, 1.0313e-04, 5.9619e-05, 1.5056e-04,\n 8.5241e-05, 6.3958e-04, 3.3623e-04, 8.1319e-05, 7.1386e-05, 7.6726e-05,\n 6.2588e-05, 8.5882e-05, 9.3270e-05, 3.5954e-05, 6.7050e-05, 1.8582e-04,\n 1.0891e-04, 5.8441e-05, 1.1604e-04, 5.6476e-05, 5.3924e-05, 1.8970e-04,\n 5.7692e-05, 1.2145e-04, 1.4310e-04, 7.9222e-05, 1.5206e-04, 6.6541e-05,\n 7.9201e-05, 1.0760e-04, 8.8739e-05, 4.2310e-04, 2.0214e-04, 1.6200e-04,\n 8.5348e-05, 1.0926e-04, 5.5087e-05, 6.5922e-05, 2.1271e-04, 1.6083e-04,\n 9.5037e-05, 1.6130e-04, 1.1298e-04, 8.2289e-05, 1.6394e-04, 5.9827e-05,\n 1.8446e-04, 9.7241e-05, 1.3447e-04, 6.5520e-05, 8.8839e-05, 1.7649e-04,\n 1.1930e-04, 1.8870e-04, 9.2755e-05, 8.2796e-05, 8.8917e-05, 1.0271e-04,\n 2.8899e-04, 2.0131e-04], device='cuda:0')"
19
  },
20
  "3": {
21
- "step": "tensor(5008.)",
22
- "exp_avg": "tensor([ 3.3398e-03, 1.4436e-03, 8.0064e-03, 2.0668e-03, -3.6029e-03,\n 7.1286e-03, 3.1447e-03, 2.1482e-03, -6.2963e-03, 3.4202e-03,\n -4.0272e-03, 2.4285e-03, -3.4062e-03, -2.6609e-03, 4.0964e-03,\n 6.0860e-04, 8.6702e-03, 1.2649e-03, -1.6718e-03, -8.5540e-04,\n -3.2256e-04, -3.4672e-03, -3.2979e-03, -7.2044e-03, 4.8517e-03,\n -1.7859e-03, 4.3538e-03, 7.1305e-03, -3.7853e-03, 4.1843e-04,\n -3.2893e-03, -2.8702e-03, 4.3770e-03, 2.0667e-03, 2.9268e-06,\n -5.2091e-03, -1.7434e-03, 3.2457e-03, -6.7705e-04, 6.7199e-03,\n 4.2421e-03, -7.5485e-03, -4.1551e-03, -6.0736e-03, 1.2553e-03,\n -1.4270e-03, 5.7382e-04, -7.4928e-03, -4.8617e-03, 1.1645e-03,\n -3.1433e-04, 5.2693e-03, -1.1487e-03, 6.6413e-04, -8.5520e-04,\n 3.3720e-03, 1.6537e-03, 7.0514e-04, -1.6705e-03, 4.8992e-04,\n 9.9663e-04, -4.7566e-03, 2.6456e-03, 3.9404e-03, -8.3652e-04,\n 1.7409e-04, -8.1409e-04, -3.6685e-03, 5.6785e-03, 3.8426e-03,\n -1.1910e-04, -2.5474e-03, 2.7215e-03, -1.9656e-03, 7.7194e-03,\n -2.1851e-03, -1.6890e-03, -3.3839e-03, 7.9458e-04, -1.5985e-04,\n 2.4083e-03, -1.0973e-03, -3.9151e-03, -7.2412e-03, 1.1584e-03,\n 4.3022e-03, 3.1098e-03, 3.6643e-03, 7.7558e-03, -2.1422e-03,\n 4.6182e-03, 2.7221e-04, 8.3915e-03, -6.4528e-03, -5.2567e-03,\n 1.8591e-04, -5.0738e-04, 5.0806e-03, 5.0632e-04, 4.0664e-03,\n 1.5855e-03, -2.6474e-04, -4.9788e-03, -2.4805e-03, -3.1280e-03,\n 1.2409e-03, 1.4404e-03, 1.1429e-03, 2.7812e-04, -3.8812e-03,\n -2.1911e-03, -8.9230e-04, -2.7871e-03, -5.3181e-03, 1.6322e-04,\n 2.4339e-03, -8.0754e-04, -3.7450e-05, -3.9658e-03, -3.8371e-03,\n 2.6975e-03, 3.2698e-03, 1.7957e-03, 7.3895e-03, -4.3771e-04,\n 1.1245e-03, -5.8086e-04, 4.7314e-04, 2.9452e-03, -5.8369e-03,\n -2.3787e-03, 7.0435e-03, -2.7697e-03, 1.0462e-03, -4.4072e-03,\n -1.9636e-03, -1.6578e-03, -3.4865e-04, 5.0952e-03, 7.6798e-04,\n 1.9276e-03, 1.3516e-03, 3.3094e-03, 1.2127e-04, -1.2253e-03,\n 2.5227e-03, -8.8820e-03, -2.0733e-03, -1.7010e-03, 5.0755e-03,\n 9.0977e-03, -3.4070e-03, 3.2390e-03, 3.5022e-03, 1.6198e-03,\n 1.4260e-03, -2.6028e-03, -9.8785e-03, 3.5267e-03, 4.4884e-03,\n -1.7884e-03, 1.9769e-04, -1.1192e-04, 1.3499e-03, -2.7584e-03,\n 2.9355e-04, -8.8886e-04, 3.6981e-03, -3.7286e-04, 4.6442e-03,\n 1.3729e-03, -4.1008e-03, 1.1148e-03, -2.0406e-03, -8.1138e-03,\n 3.7234e-03, -5.3597e-03, 3.1074e-04, -4.5101e-04, -1.4665e-04,\n -2.3749e-04, -1.2822e-02, 1.1965e-04, 2.8015e-03, -1.1025e-03,\n -1.9837e-03, 4.1873e-03, 5.2588e-03, -5.8627e-04, -7.5609e-03,\n -2.8515e-04, -5.2145e-04, 2.9457e-03, -4.2299e-03, -5.7356e-03,\n -4.1747e-03, 9.4867e-04, -2.7047e-03, 1.9600e-03, -4.0901e-03,\n -2.0138e-03, 2.1438e-03, -1.7386e-03, -8.0980e-04, -5.9443e-04,\n -2.3274e-03, -5.8341e-03, 5.5808e-04, 3.5288e-03, 3.4049e-04,\n 3.8589e-03, -1.7152e-03, -2.1489e-03, 9.6730e-04, 7.1880e-03,\n -7.8067e-03, -3.2923e-03, -1.0084e-03, -4.3383e-04, 1.3057e-03,\n 3.5486e-03, 3.1019e-03, 8.3562e-04, -1.1630e-03, 6.8783e-03,\n 1.6250e-03, 2.2419e-05, 3.1016e-03, -1.1111e-03, -6.0419e-03,\n 7.1448e-04, 1.4592e-04, -7.7294e-03, -6.7714e-04, 1.7121e-03,\n 2.6262e-03, -9.4446e-03, 7.6053e-04, 1.2040e-03, -1.8781e-03,\n -4.9971e-03, -5.5560e-03, -1.1583e-02, 1.0605e-03, 1.9785e-03,\n -1.3783e-03, 1.0326e-03, -1.0360e-03, -4.9509e-03, -6.5969e-03,\n -3.1702e-03, 2.0128e-04, -5.2555e-03, -7.9476e-03, -3.3455e-03,\n 8.1801e-03, 2.4098e-03, -4.2384e-03, -4.3125e-04, -3.7560e-03,\n -2.6162e-03, -3.8732e-03, -4.0478e-04, 3.0338e-04, 2.4053e-03,\n -1.1722e-04, 3.6771e-03, 6.2642e-04, 1.5170e-03, 6.3792e-04,\n -4.5180e-04, 1.1588e-02, 5.6206e-03, 3.7951e-03, -1.1153e-03,\n -5.2072e-05, -1.6450e-03, 3.1872e-03, 1.3644e-03, -5.3870e-04,\n -1.6229e-03, -2.9160e-03, 3.6268e-03, 4.0034e-03, -3.1500e-03,\n 8.0848e-03, -3.0812e-03, 3.4928e-03, -1.7271e-03, 6.1210e-03,\n -1.7697e-02, -1.3846e-03, 6.4492e-04, -5.6198e-03, -2.5297e-03,\n -3.1794e-03, -4.2447e-03, 4.4220e-03, 3.0400e-03, -2.2566e-03,\n 1.6475e-03, 2.1092e-03, -3.4378e-03, -7.1195e-04, 3.2480e-03,\n 2.0052e-03, 7.0264e-05, 2.8563e-03, 1.4045e-03, 2.8809e-03,\n 2.7495e-03, 3.3671e-03, 3.3069e-03, -9.6387e-04, -5.8567e-03,\n 4.9773e-03, -5.1065e-03, 3.9535e-03, 5.8053e-03, 2.1333e-03,\n -1.1228e-02, 8.8514e-04, 6.2492e-05, 1.6537e-03, 2.1017e-03,\n -3.2407e-03, 3.8196e-03, -1.9032e-03, -5.9224e-03, 5.1425e-03,\n -1.6114e-03, -2.7414e-03, 8.8875e-03, -1.8359e-03, 4.9757e-03,\n -1.6312e-03, 3.9752e-03, 5.8147e-03, -3.8860e-03, 2.1711e-03,\n 2.2833e-03, 3.3543e-03, 1.0797e-03, 1.2454e-03, 9.0082e-03,\n -2.0197e-04, -8.6154e-03, 1.3012e-03, 1.1280e-03, 4.5158e-03,\n -6.6865e-03, -1.2608e-03, 3.7778e-03, 3.0456e-03, 4.6689e-04,\n -7.0062e-03, 7.6051e-04, 5.5898e-03, -2.0944e-03, 3.9263e-04,\n -2.2333e-03, 3.2380e-03, -2.4577e-03, 5.5274e-03, 1.6951e-03,\n -4.3282e-04, -4.3788e-03, -2.4505e-03, -4.5556e-04, 4.0755e-03,\n -7.4525e-03, 7.6729e-03, -9.8688e-04, 7.7359e-04, 3.5337e-03,\n 1.6584e-03, 2.7173e-03, 3.0410e-03, 4.9650e-03, -2.2753e-03,\n 2.6238e-03, -3.3085e-03, -4.8559e-03, 4.2020e-03, -1.8353e-03,\n 3.8161e-03, 9.8887e-04, -2.2070e-03, -1.6843e-03, -7.9262e-04,\n -6.7666e-03, 6.0184e-04, -2.3103e-03, 1.7753e-03, -3.3768e-03,\n 2.5095e-03, 1.8873e-03, -1.8027e-03, 1.1206e-03, 2.5656e-03,\n -1.5520e-03, -3.6715e-03, -4.1316e-03, -4.9327e-03, 1.6249e-03,\n -3.7218e-03, 3.9736e-03, -7.8062e-04, 2.0632e-03, 2.0147e-03,\n -3.3636e-03, -2.4722e-03, 5.7953e-04, -8.3934e-04, 2.2436e-03,\n -6.4266e-03, 5.3912e-03, 2.2860e-03, -2.2876e-03, 3.7697e-03,\n 1.6517e-03, -6.0452e-03, -2.5940e-04, -2.2421e-03, 1.7408e-03,\n 1.7277e-03, -2.3591e-04, 3.2953e-04, 1.0450e-02, 1.2270e-04,\n -2.8497e-03, 4.3121e-04, 3.8621e-03, 2.3367e-03, 3.9182e-04,\n 3.0773e-03, 7.0511e-04, 3.6690e-03, 4.2694e-04, 1.8336e-04,\n 1.2461e-03, -2.3628e-03, -2.7982e-03, -2.1105e-03, -3.9643e-03,\n -7.0765e-03, -3.1041e-03, -1.8921e-03, -5.9365e-03, 1.7454e-03,\n 1.0454e-03, -1.9346e-03, 3.6936e-03, -1.3681e-03, 2.7940e-03,\n 7.8641e-04, 1.8480e-03, -3.2485e-03, 2.6562e-03, -2.4350e-03,\n -3.8484e-03, -2.3453e-03, -2.9160e-03, 4.7605e-03, 1.1637e-03,\n 3.6615e-03, 2.1438e-03, 2.0847e-03, 2.9464e-03, -3.2162e-03,\n 7.1372e-04, -3.4022e-04, 5.5596e-03, -1.1885e-02, -2.3501e-03,\n -2.9144e-03, -1.9083e-03, 2.4979e-04, -8.7368e-04, -3.8590e-03,\n 8.0720e-04, -1.3443e-03, -8.3138e-03, -3.4583e-03, 5.3208e-03,\n 4.0716e-03, 2.3031e-04, 1.1672e-02, -7.0416e-04, -4.8297e-05,\n 7.3178e-03, 1.9291e-03, -3.8061e-03, -1.2856e-03, 6.4063e-03,\n -1.4145e-03, -3.0433e-04, 6.6180e-03, -7.3319e-04, 2.1165e-03,\n -4.0365e-04, -1.9276e-04, -1.5791e-03, 3.0071e-03, -2.5961e-04,\n 1.9443e-03, -4.1760e-03, 1.1718e-03, 1.0029e-02, 2.3954e-03,\n 1.9842e-03, -1.0761e-03], device='cuda:0')",
23
- "exp_avg_sq": "tensor([9.9826e-05, 8.7461e-05, 1.2703e-04, 8.6655e-05, 9.7617e-05, 1.1228e-04,\n 9.4477e-05, 7.0785e-05, 9.1594e-05, 1.0144e-04, 1.1676e-04, 1.7174e-04,\n 6.7153e-05, 1.2427e-04, 1.0852e-04, 1.0611e-04, 9.2445e-05, 1.3209e-04,\n 1.2688e-04, 1.1632e-04, 1.1603e-04, 1.1517e-04, 1.2045e-04, 9.7412e-05,\n 9.1604e-05, 9.6854e-05, 1.6722e-04, 7.3114e-05, 7.7992e-05, 1.1745e-04,\n 9.7939e-05, 7.9389e-05, 1.4367e-04, 6.2088e-05, 8.1728e-05, 1.9333e-04,\n 1.0312e-04, 1.0086e-04, 1.2229e-04, 1.4902e-04, 1.6388e-04, 1.0752e-04,\n 1.0687e-04, 1.4432e-04, 7.1895e-05, 1.4998e-04, 1.1136e-04, 1.2253e-04,\n 1.4137e-04, 1.3507e-04, 1.1208e-04, 9.3687e-05, 1.2427e-04, 9.9270e-05,\n 1.1871e-04, 9.2181e-05, 8.8440e-05, 1.1344e-04, 7.5813e-05, 1.3352e-04,\n 9.1722e-05, 1.1020e-04, 1.1244e-04, 1.2769e-04, 1.0883e-04, 1.0880e-04,\n 1.2289e-04, 1.0137e-04, 1.2469e-04, 1.4650e-04, 9.2339e-05, 1.9323e-04,\n 8.8184e-05, 1.0145e-04, 1.0681e-04, 9.6616e-05, 8.1644e-05, 1.2151e-04,\n 1.1966e-04, 8.0096e-05, 1.3677e-04, 9.9697e-05, 8.8468e-05, 8.5579e-05,\n 3.1883e-04, 8.5769e-05, 1.0279e-04, 9.1006e-05, 1.0099e-04, 1.0354e-04,\n 1.6046e-04, 9.8881e-05, 9.2280e-05, 1.5466e-04, 9.0947e-05, 1.0960e-04,\n 1.1265e-04, 1.0005e-04, 1.0249e-04, 1.6004e-04, 9.7155e-05, 7.4442e-05,\n 1.7004e-04, 9.8206e-05, 1.4927e-04, 8.5658e-05, 1.0897e-04, 1.1522e-04,\n 1.3112e-04, 1.0691e-04, 1.2999e-04, 9.8917e-05, 9.0072e-05, 9.8925e-05,\n 9.1420e-05, 8.6818e-05, 1.6349e-04, 1.1860e-04, 9.7036e-05, 1.2915e-04,\n 9.7685e-05, 7.1845e-05, 1.3532e-04, 9.2007e-05, 7.1104e-05, 9.5092e-05,\n 1.0739e-04, 1.0096e-04, 7.3795e-05, 9.8596e-05, 1.1707e-04, 1.4802e-04,\n 9.0995e-05, 8.3622e-05, 7.3170e-05, 9.6362e-05, 9.6461e-05, 1.1855e-04,\n 1.0988e-04, 1.3571e-04, 9.9285e-05, 8.5173e-05, 9.0970e-05, 1.4239e-04,\n 1.0213e-04, 1.3073e-04, 2.2612e-04, 1.5400e-04, 8.0036e-05, 1.0257e-04,\n 1.2701e-04, 1.0285e-04, 1.1037e-04, 9.4223e-05, 9.5005e-05, 1.1358e-04,\n 1.4831e-04, 1.0544e-04, 1.0403e-04, 9.4811e-05, 9.0976e-05, 1.3665e-04,\n 1.5693e-04, 8.7643e-05, 1.0540e-04, 1.4061e-04, 1.4026e-04, 1.2355e-04,\n 9.4800e-05, 1.4505e-04, 1.1061e-04, 1.0042e-04, 9.2322e-05, 1.1828e-04,\n 1.2248e-04, 7.7095e-05, 1.2057e-04, 8.1187e-05, 1.1860e-04, 1.1428e-04,\n 1.2039e-04, 1.0674e-04, 1.2149e-04, 8.3251e-05, 1.0288e-04, 1.0678e-04,\n 1.1332e-04, 9.0368e-05, 8.2805e-05, 1.2137e-04, 1.6208e-04, 9.7445e-05,\n 8.7017e-05, 9.8339e-05, 6.4365e-05, 1.1595e-04, 8.4987e-05, 1.3157e-04,\n 1.2400e-04, 1.4131e-04, 6.6052e-05, 8.8014e-05, 1.0565e-04, 9.2376e-05,\n 7.5006e-05, 8.8225e-05, 1.1846e-04, 1.0319e-04, 1.2274e-04, 2.3510e-04,\n 1.1698e-04, 1.0592e-04, 1.4749e-04, 8.1353e-05, 1.6208e-04, 1.1644e-04,\n 1.3138e-04, 6.7463e-05, 1.1117e-04, 1.2650e-04, 1.2007e-04, 1.1055e-04,\n 1.0513e-04, 1.1193e-04, 1.0320e-04, 1.0110e-04, 9.8902e-05, 1.0707e-04,\n 1.1056e-04, 9.3269e-05, 1.0873e-04, 1.2240e-04, 1.1162e-04, 1.3385e-04,\n 7.8839e-05, 1.3268e-04, 1.1386e-04, 1.3726e-04, 8.9514e-05, 1.0322e-04,\n 9.7535e-05, 1.3983e-04, 1.4196e-04, 9.3841e-05, 1.3018e-04, 1.5442e-04,\n 1.1651e-04, 9.1555e-05, 1.1348e-04, 1.1333e-04, 1.0273e-04, 1.0184e-04,\n 1.3677e-04, 2.8493e-04, 1.0634e-04, 1.1430e-04, 1.3291e-04, 1.2338e-04,\n 9.8141e-05, 1.2061e-04, 8.1613e-05, 1.1483e-04, 1.0028e-04, 1.0820e-04,\n 1.2956e-04, 1.0288e-04, 1.2554e-04, 7.4934e-05, 1.1174e-04, 9.0657e-05,\n 1.3108e-04, 1.4554e-04, 8.8140e-05, 1.3327e-04, 1.2639e-04, 8.9173e-05,\n 1.3966e-04, 9.7801e-05, 7.7112e-05, 1.0701e-04, 1.0770e-04, 8.2547e-05,\n 8.6797e-05, 1.2446e-04, 1.1357e-04, 1.0681e-04, 1.2237e-04, 1.0648e-04,\n 1.0205e-04, 1.6249e-04, 1.1532e-04, 1.0546e-04, 1.0439e-04, 1.4007e-04,\n 9.1297e-05, 1.2627e-04, 1.2688e-04, 9.7364e-05, 1.0131e-04, 7.8524e-05,\n 1.0115e-04, 8.1170e-05, 1.1999e-04, 1.1175e-04, 8.4374e-05, 7.8094e-05,\n 9.7865e-05, 1.4728e-04, 7.2437e-05, 9.9143e-05, 1.3578e-04, 8.8967e-05,\n 8.5356e-05, 9.4753e-05, 1.2067e-04, 1.1074e-04, 1.6053e-04, 1.1480e-04,\n 7.1649e-05, 9.3638e-05, 1.0988e-04, 1.1859e-04, 8.2119e-05, 1.1602e-04,\n 1.3648e-04, 1.1448e-04, 1.1420e-04, 9.1423e-05, 1.2166e-04, 1.3869e-04,\n 1.3791e-04, 9.4594e-05, 1.3085e-04, 9.8578e-05, 1.2132e-04, 1.0291e-04,\n 1.4459e-04, 1.7955e-04, 1.1519e-04, 1.1814e-04, 9.0068e-05, 1.1218e-04,\n 7.6523e-05, 9.3466e-05, 1.0198e-04, 1.0068e-04, 1.3118e-04, 1.0915e-04,\n 1.0248e-04, 1.4424e-04, 8.7388e-05, 1.0954e-04, 1.2314e-04, 1.0458e-04,\n 1.1034e-04, 1.7857e-04, 1.1531e-04, 9.7351e-05, 8.2279e-05, 7.7565e-05,\n 1.0543e-04, 1.3110e-04, 8.6614e-05, 1.1735e-04, 1.1670e-04, 1.9208e-04,\n 8.9986e-05, 1.5174e-04, 1.0723e-04, 1.0593e-04, 1.3486e-04, 1.5449e-04,\n 9.3422e-05, 1.0991e-04, 1.2922e-04, 9.5732e-05, 8.8752e-05, 1.0038e-04,\n 1.2102e-04, 1.0994e-04, 1.0497e-04, 1.4007e-04, 1.3119e-04, 1.2096e-04,\n 1.0238e-04, 1.7919e-04, 1.0500e-04, 9.0817e-05, 1.3662e-04, 1.6079e-04,\n 1.1826e-04, 1.2797e-04, 1.0715e-04, 1.6772e-04, 9.5188e-05, 1.6731e-04,\n 8.5382e-05, 1.5803e-04, 9.2325e-05, 1.6284e-04, 8.4628e-05, 9.9099e-05,\n 1.4835e-04, 1.5120e-04, 1.1703e-04, 1.0687e-04, 1.2550e-04, 9.7514e-05,\n 9.6812e-05, 1.0003e-04, 1.0962e-04, 1.1042e-04, 1.3148e-04, 1.0794e-04,\n 9.7711e-05, 8.4441e-05, 7.1040e-05, 9.9965e-05, 1.2303e-04, 1.3276e-04,\n 8.4091e-05, 1.4039e-04, 1.3804e-04, 1.5175e-04, 1.1111e-04, 1.1871e-04,\n 1.2931e-04, 1.0340e-04, 1.6959e-04, 9.8317e-05, 1.3463e-04, 9.8137e-05,\n 1.1336e-04, 8.6788e-05, 9.7016e-05, 9.9233e-05, 1.2520e-04, 6.9016e-05,\n 1.4183e-04, 7.6929e-05, 1.0928e-04, 9.7218e-05, 7.7175e-05, 6.7794e-05,\n 1.2668e-04, 9.8011e-05, 9.2959e-05, 6.2169e-05, 1.6302e-04, 1.2339e-04,\n 1.1334e-04, 1.0265e-04, 7.7331e-05, 1.2033e-04, 8.6906e-05, 1.4612e-04,\n 8.8832e-05, 1.3947e-04, 1.3546e-04, 1.6717e-04, 9.0590e-05, 8.0725e-05,\n 1.1216e-04, 1.1912e-04, 1.1121e-04, 7.5490e-05, 1.2054e-04, 1.4256e-04,\n 1.1383e-04, 9.2679e-05, 1.7246e-04, 7.1578e-05, 8.7267e-05, 1.1607e-04,\n 8.0509e-05, 8.2762e-05, 9.7303e-05, 1.3221e-04, 1.4170e-04, 8.3071e-05,\n 1.0790e-04, 1.1575e-04, 1.0333e-04, 1.2824e-04, 1.1253e-04, 1.2951e-04,\n 9.5521e-05, 1.2569e-04, 6.9529e-05, 1.0118e-04, 1.2968e-04, 1.3985e-04,\n 1.2522e-04, 1.1057e-04, 1.7804e-04, 1.1217e-04, 1.3094e-04, 1.1639e-04,\n 1.3332e-04, 1.6328e-04, 1.3025e-04, 1.1350e-04, 8.8102e-05, 1.1165e-04,\n 1.1635e-04, 1.0175e-04, 1.6332e-04, 9.4158e-05, 1.9665e-04, 1.0523e-04,\n 1.3641e-04, 1.2188e-04], device='cuda:0')"
24
  },
25
  "4": {
26
- "step": "tensor(5008.)",
27
- "exp_avg": "tensor([[-1.4001e-04, 5.4738e-04, 2.3948e-05, ..., 4.0728e-05,\n 2.8603e-04, -9.1870e-05],\n [-4.8272e-04, -9.8014e-05, -3.5998e-04, ..., -2.0332e-04,\n 3.3512e-04, -2.9984e-04],\n [ 2.7128e-04, 1.7591e-04, 1.1848e-04, ..., -1.7333e-04,\n -3.0730e-04, 2.6872e-04],\n ...,\n [ 7.7770e-05, 7.5213e-05, 1.3020e-04, ..., -2.1946e-04,\n -1.6273e-04, 4.1114e-04],\n [ 3.6391e-04, -1.0463e-04, -1.6615e-05, ..., -3.6900e-04,\n -1.8721e-04, 4.1951e-04],\n [ 4.6571e-05, -2.9873e-04, -3.4650e-04, ..., -3.8067e-04,\n 3.2387e-04, 8.8552e-05]], device='cuda:0')",
28
- "exp_avg_sq": "tensor([[3.8289e-07, 8.3125e-07, 3.3157e-07, ..., 4.1393e-07, 6.2802e-07,\n 7.2890e-07],\n [9.4104e-07, 4.2653e-07, 1.4974e-06, ..., 1.2301e-06, 1.3744e-06,\n 9.0485e-07],\n [6.5820e-07, 4.4177e-07, 7.3752e-07, ..., 1.3008e-06, 1.0793e-06,\n 6.8083e-07],\n ...,\n [1.1848e-06, 4.9012e-07, 8.2042e-07, ..., 1.1382e-06, 1.4754e-06,\n 2.0402e-06],\n [8.1509e-07, 5.7862e-07, 8.5122e-07, ..., 9.5410e-07, 1.3261e-06,\n 1.5323e-06],\n [7.2540e-07, 7.4291e-07, 1.3010e-06, ..., 1.0042e-06, 1.6732e-06,\n 1.2972e-06]], device='cuda:0')"
29
  },
30
  "5": {
31
- "step": "tensor(5008.)",
32
- "exp_avg": "tensor([[ 1.2971e-05, -1.5414e-05, 4.7145e-06, ..., 2.5809e-05,\n 2.1992e-04, 2.9177e-05],\n [-2.5009e-04, -5.3441e-05, -1.3114e-04, ..., -1.0805e-04,\n 2.3465e-04, -1.1163e-04],\n [ 1.9886e-04, 2.1095e-04, 1.4139e-04, ..., -1.0386e-04,\n -1.8608e-04, 1.0025e-04],\n ...,\n [-9.5128e-05, -2.2244e-04, 3.0045e-04, ..., -2.6538e-04,\n 6.3334e-05, 1.2192e-05],\n [ 9.5096e-06, 3.0840e-04, 1.1355e-04, ..., -1.1462e-04,\n 8.3339e-05, 2.0363e-04],\n [-1.2835e-04, 2.1304e-04, -2.1943e-04, ..., -6.6441e-05,\n -1.9693e-04, 1.9615e-04]], device='cuda:0')",
33
- "exp_avg_sq": "tensor([[1.0915e-07, 6.5623e-08, 1.1653e-07, ..., 1.9666e-07, 2.0179e-07,\n 1.3972e-07],\n [2.7043e-07, 1.2014e-07, 2.4114e-07, ..., 3.6235e-07, 3.5771e-07,\n 3.5681e-07],\n [2.1950e-07, 2.2283e-07, 2.6444e-07, ..., 3.9875e-07, 3.5357e-07,\n 2.4748e-07],\n ...,\n [3.0549e-07, 2.5087e-07, 3.7865e-07, ..., 2.8807e-07, 5.2967e-07,\n 4.8358e-07],\n [2.1021e-07, 3.5204e-07, 3.3291e-07, ..., 3.0386e-07, 4.1230e-07,\n 4.6330e-07],\n [2.6709e-07, 2.5174e-07, 4.0582e-07, ..., 4.2732e-07, 4.8182e-07,\n 3.0534e-07]], device='cuda:0')"
34
  },
35
  "6": {
36
- "step": "tensor(5008.)",
37
- "exp_avg": "tensor([ 0.0008, -0.0008], device='cuda:0')",
38
- "exp_avg_sq": "tensor([1.0196e-05, 1.0196e-05], device='cuda:0')"
39
  }
40
  },
41
  "param_groups": [
42
  {
43
- "lr": 0.0006548539886902864,
44
  "name": "shared",
45
  "betas": [
46
  0.9,
@@ -64,7 +64,7 @@
64
  ]
65
  },
66
  {
67
- "lr": 0.0006548539886902864,
68
  "name": "scale_256",
69
  "betas": [
70
  0.9,
@@ -85,7 +85,7 @@
85
  ]
86
  },
87
  {
88
- "lr": 0.0006548539886902864,
89
  "name": "scale_512",
90
  "betas": [
91
  0.9,
@@ -106,7 +106,7 @@
106
  ]
107
  },
108
  {
109
- "lr": 0.0003275997400965494,
110
  "name": "fusion",
111
  "betas": [
112
  0.9,
@@ -133,30 +133,30 @@
133
  "T_i": 10,
134
  "T_mult": 2,
135
  "eta_min": 1e-06,
136
- "T_cur": 4,
137
  "base_lrs": [
138
  0.001,
139
  0.001,
140
  0.001,
141
  0.0005
142
  ],
143
- "last_epoch": 4,
144
  "_step_count": 0,
145
  "_is_initial": false,
146
  "_get_lr_called_within_step": false,
147
  "_last_lr": [
148
- 0.0006548539886902864,
149
- 0.0006548539886902864,
150
- 0.0006548539886902864,
151
- 0.0003275997400965494
152
  ]
153
  },
154
  "metrics": {
155
- "best_val_acc": 70.614,
156
- "best_epoch": 3,
157
  "scale_accuracies": {
158
- "256": 70.124,
159
- "512": 70.46
160
  }
161
  },
162
  "train_config": {
 
1
  {
2
+ "epoch": 4,
3
  "optimizer_state_dict": {
4
  "state": {
5
  "0": {
6
+ "step": "tensor(6260.)",
7
+ "exp_avg": "tensor([[ 3.1722e-04, 3.1541e-03, 1.0743e-03, ..., 2.9322e-04,\n 5.6603e-04, 5.1939e-04],\n [-5.8773e-04, 2.7085e-03, -8.4152e-05, ..., 3.6830e-04,\n -2.1589e-04, -6.0146e-04],\n [-1.8794e-04, 3.5767e-03, -3.1200e-03, ..., 5.7624e-04,\n 2.0440e-04, -8.9246e-04],\n ...,\n [-1.0678e-03, -1.1239e-03, 7.4526e-05, ..., -2.6899e-04,\n -1.9413e-04, -7.7857e-05],\n [-7.1220e-04, -4.6767e-03, 3.2651e-03, ..., -1.8281e-05,\n 2.7817e-05, 9.0213e-04],\n [ 3.8004e-04, -1.6752e-03, 9.4115e-04, ..., 1.0887e-04,\n -4.9217e-05, -1.1337e-04]], device='cuda:0')",
8
+ "exp_avg_sq": "tensor([[4.0182e-06, 2.6264e-05, 1.5469e-05, ..., 3.1997e-06, 2.6607e-06,\n 6.2000e-06],\n [1.1437e-05, 2.9362e-05, 1.8885e-05, ..., 3.8683e-06, 2.4802e-06,\n 5.4786e-06],\n [7.1391e-06, 4.6127e-05, 2.1583e-05, ..., 5.3447e-06, 2.9660e-06,\n 6.4597e-06],\n ...,\n [5.4480e-06, 4.6049e-05, 1.7139e-05, ..., 4.3088e-06, 2.8427e-06,\n 3.2124e-06],\n [4.5123e-06, 3.4993e-05, 1.5051e-05, ..., 3.0318e-06, 2.1692e-06,\n 2.5714e-06],\n [2.8421e-06, 1.2176e-05, 1.0831e-05, ..., 2.6425e-06, 1.6447e-06,\n 2.0784e-06]], device='cuda:0')"
9
  },
10
  "1": {
11
+ "step": "tensor(6260.)",
12
+ "exp_avg": "tensor([ 3.8287e-02, 7.0744e-03, 4.6278e-03, -4.6743e-02, 7.3604e-04,\n -4.8485e-03, -2.4281e-02, -1.1458e-02, 1.1361e-02, 3.7939e-02,\n 1.0578e-02, -1.1545e-02, -4.1391e-03, -2.1389e-03, -3.7640e-02,\n -5.0695e-02, -4.8609e-02, -4.2825e-02, 9.5611e-03, -2.7086e-03,\n -8.1645e-02, 5.0465e-02, -4.7577e-03, -1.6391e-02, -2.6154e-02,\n 1.4030e-02, -7.6941e-04, 1.6214e-02, -1.1239e-02, -1.0351e-02,\n -1.9110e-02, 2.6022e-02, -4.2750e-03, 2.5497e-02, 3.0964e-02,\n 2.4860e-02, 1.2926e-02, -1.4974e-02, 1.3156e-02, -1.0836e-02,\n 9.6476e-03, 1.7289e-02, -1.8028e-02, -1.1272e-02, -2.0952e-02,\n 3.3801e-02, 5.0331e-03, 7.3461e-03, 8.5710e-04, 3.6008e-03,\n -1.6823e-02, -2.1902e-02, 8.0397e-04, -3.6462e-03, 4.6077e-03,\n 1.8185e-02, -3.4063e-02, -7.9193e-03, 4.4017e-03, -1.3735e-02,\n 6.9905e-03, -4.8321e-03, 4.2993e-03, 3.5981e-03, 1.6529e-02,\n 1.3397e-02, 3.5450e-02, 7.1683e-03, -3.1353e-03, -4.6232e-02,\n -1.1754e-02, 5.9485e-03, 4.7543e-03, 3.1489e-02, -2.9745e-02,\n -1.2485e-03, 2.0774e-02, 1.4253e-02, 6.3192e-03, -5.0772e-03,\n 5.5329e-03, 1.6628e-02, -1.6319e-02, 1.3700e-02, 5.5130e-03,\n -6.1528e-02, -3.9390e-02, 1.3808e-02, -4.0851e-03, 1.7086e-03,\n 2.3253e-03, -3.1091e-03, -1.0949e-02, -2.6634e-02, 6.6016e-03,\n 7.0280e-03, -4.3269e-03, -2.1167e-02, 1.0241e-02, 2.7441e-02,\n 2.5566e-02, -2.9024e-02, -1.9951e-02, -2.3090e-02, 1.8327e-02,\n 3.2079e-03, -8.4656e-03, 4.0309e-02, -1.6775e-02, 4.1465e-03,\n -6.1990e-03, -3.5925e-02, 6.5328e-03, -1.0797e-01, -2.6290e-02,\n -7.1130e-03, -7.1726e-03, 1.9910e-02, 1.2287e-03, 2.6613e-02,\n -1.6972e-02, -1.6264e-02, 1.0138e-02, 1.7948e-02, -1.7570e-02,\n -1.3114e-02, 7.1512e-03, -1.2897e-02, -2.3700e-03, 1.0894e-03,\n 1.1488e-02, -2.1036e-03, -1.0666e-02, -1.3311e-02, -2.5209e-02,\n -3.0498e-03, 3.3425e-02, -2.6824e-02, 2.9714e-02, 1.5678e-02,\n -1.1071e-02, 3.0084e-02, 1.7867e-02, 1.1807e-02, 1.6388e-03,\n -1.3518e-03, -2.6451e-02, -2.0514e-02, -2.0630e-03, 1.3967e-02,\n -5.0451e-03, 1.2406e-03, -1.8563e-02, 6.1663e-03, -2.5807e-02,\n 3.8573e-02, 1.8341e-02, 1.1298e-02, -4.6710e-03, -1.6627e-02,\n -5.9884e-03, 8.0051e-03, 6.1325e-03, 1.3148e-02, -2.0617e-02,\n 9.3196e-03, 4.4715e-03, 7.1958e-03, 7.7074e-03, -1.4054e-03,\n 8.3743e-03, 9.6104e-03, -1.4407e-02, 1.0630e-02, -2.4000e-02,\n 2.1516e-02, -7.1061e-04, 7.3933e-03, -6.3228e-02, 1.6711e-02,\n -1.5630e-02, 3.3160e-03, -1.4658e-02, 2.6277e-02, 1.0896e-02,\n -1.9270e-02, 1.8549e-02, -3.3540e-02, 1.2401e-02, 3.9251e-04,\n 1.4241e-03, -4.4019e-02, -1.0013e-03, 1.9363e-02, 1.6239e-02,\n 4.6009e-02, 3.2435e-02, -5.5079e-02, -5.0769e-03, 2.3695e-02,\n -3.8212e-03, 1.7573e-02, 1.3671e-02, -1.7148e-02, 5.7055e-03,\n 4.1058e-03, -1.2033e-03, 1.5867e-02, 9.6781e-03, -1.0136e-02,\n 9.7165e-03, -9.9817e-03, 7.1484e-04, -7.5623e-03, 8.7494e-03,\n 7.6246e-04, -4.4888e-06, 6.2455e-03, -1.4076e-03, -5.2628e-02,\n -4.8459e-02, -2.8403e-02, -2.3883e-02, -5.8512e-03, -3.5528e-03,\n -1.2671e-02, -1.0262e-02, -1.0329e-02, 1.3604e-02, 1.4568e-02,\n 5.7667e-03, 3.5003e-04, 9.4511e-03, 1.2720e-02, -5.0806e-04,\n 1.1562e-02, -2.2015e-02, 2.9138e-03, -7.2606e-03, -3.1598e-02,\n -1.0548e-03, 3.8577e-02, -8.2498e-03, 1.7948e-03, 2.2289e-02,\n -7.2965e-03, 4.1943e-03, 4.6692e-03, 1.9245e-02, -3.3418e-03,\n 1.4388e-02, 9.6351e-03, 9.2271e-03, 7.5374e-03, -3.5625e-02,\n -7.3475e-03, -8.2203e-03, -5.2415e-04, -6.6258e-03, -3.3096e-03,\n 1.5189e-02, 2.4717e-03, -1.5238e-02, 9.3064e-03, -3.7153e-02,\n -2.4327e-02, 7.9849e-03, -1.0039e-02, 1.6063e-02, 8.3004e-03,\n 2.1386e-02, 4.9097e-02, 2.2039e-02, -9.0948e-02, 4.6477e-03,\n 1.7955e-02, 3.1564e-03, -3.8319e-03, 2.0519e-02, 6.1444e-03,\n -1.7738e-02, -1.9348e-02, 9.6401e-03, 1.6220e-03, -6.4844e-03,\n -5.4217e-03, 4.4311e-03, 6.6548e-03, -2.7304e-03, 2.4047e-02,\n -1.8420e-02, -9.1805e-03, 1.9927e-02, 2.5734e-02, 2.1368e-02,\n 1.7123e-02, -4.4288e-02, -6.7710e-02, 1.1993e-02, -6.4020e-03,\n -3.8266e-03, 2.1033e-02, 1.2275e-02, 1.7655e-02, 3.9573e-03,\n 2.0131e-02, 2.6364e-02, -3.3657e-02, 1.1919e-02, 3.7818e-02,\n 2.1630e-02, -2.2235e-03, 5.9623e-03, 1.2263e-02, 1.8866e-02,\n -1.9704e-02, -1.9742e-02, -4.4306e-02, 9.1872e-03, 1.7408e-02,\n 1.0881e-02, -9.1749e-03, 2.9778e-03, 4.5772e-02, 8.6524e-03,\n -3.0541e-02, 6.9361e-03, 2.0173e-02, 5.7835e-03, 8.9142e-02,\n 8.5473e-03, -2.3475e-02, 2.1740e-02, 1.1176e-02, 6.8983e-03,\n 2.0390e-02, -2.4504e-02, -5.1879e-03, -5.2856e-02, 3.7868e-02,\n -6.6295e-03, -1.3594e-02, -1.5865e-02, 3.5660e-02, -9.8688e-03,\n -2.4674e-03, -6.8197e-02, 4.4329e-02, -9.8988e-03, 7.1389e-05,\n 2.9316e-02, 1.9902e-02, -1.5678e-02, -1.9607e-02, 2.1865e-02,\n -6.8571e-02, -1.0837e-02, 9.3229e-03, 5.9236e-03, 1.7944e-03,\n -7.8694e-03, -2.5341e-02, 1.2404e-03, 2.6575e-02, -7.9784e-03,\n 1.9583e-02, 1.3037e-02, 1.1921e-02, -3.1066e-02, -2.9630e-02,\n -6.1752e-02, -4.5265e-02, 3.2678e-02, -1.1861e-02, 2.7437e-03,\n 1.8793e-02, 7.4700e-03, -6.1178e-03, 3.8862e-02, 1.1419e-02,\n 1.9983e-02, 1.0733e-02, 4.6946e-02, 1.7694e-02, 6.3264e-03,\n -2.6940e-03, 2.2536e-04, -1.6457e-02, -3.1861e-02, 5.1680e-03,\n -1.4922e-03, 2.8381e-02, 1.7341e-02, 1.5049e-02, 6.9486e-03,\n -1.0157e-02, 3.6269e-03, -4.1289e-02, 1.3396e-02, 6.3983e-03,\n -7.7330e-03, 2.2355e-02, 3.6277e-02, 5.9523e-02, -1.6178e-03,\n -3.3730e-02, -1.8006e-02, -9.1209e-04, 3.7044e-02, -1.3934e-02,\n -3.1090e-02, 6.5350e-03, -4.0766e-03, -1.3798e-03, 1.2118e-02,\n -2.9756e-02, -6.7338e-03, 2.0605e-02, -3.5522e-03, 3.0580e-02,\n -1.3392e-03, 2.2960e-03, -4.2043e-02, 5.0153e-03, 1.7484e-02,\n -1.1225e-02, 2.7259e-02, 2.2224e-02, -1.5206e-02, -3.6641e-02,\n -4.8472e-03, -1.2165e-03, -1.9333e-02, 1.3597e-02, -1.0023e-02,\n -6.6633e-03, 7.1999e-03, -7.4278e-03, 2.7650e-03, -1.1078e-02,\n -1.7142e-02, -1.8912e-03, 2.3660e-02, -1.3783e-02, -4.1150e-02,\n 2.6868e-02, -3.2397e-04, -1.4040e-02, 1.3942e-02, 3.8696e-02,\n -1.4583e-02, 6.8208e-03, 2.0938e-02, -3.6576e-03, -1.6154e-02,\n 5.1289e-02, -2.2931e-02, -1.3640e-02, 3.1942e-03, 2.2815e-02,\n -5.1017e-02, -1.0102e-02, 7.1091e-02, 7.6073e-03, 3.3452e-02,\n 1.1638e-02, -5.8458e-02, -7.3556e-03, 3.0164e-02, -3.6774e-04,\n -1.1932e-02, 1.7343e-02, 1.2772e-02, 7.6630e-03, 1.3012e-02,\n -1.7053e-02, 1.4923e-02, 6.2616e-03, -4.3743e-03, 1.8084e-02,\n 8.2520e-03, 1.1635e-02, -1.3706e-02, 4.9977e-03, 1.2277e-03,\n 5.4867e-03, 9.3740e-03, -1.5906e-02, 1.1762e-02, -1.5932e-03,\n 1.7397e-02, 3.2279e-02, 8.4486e-03, -6.0659e-04, -4.2045e-03,\n 2.1770e-02, 3.8335e-02, -4.4980e-02, 1.0806e-02, 3.0911e-02,\n -2.0104e-02, 2.2958e-02, -1.4797e-02, 5.2966e-03, 4.5325e-03,\n 5.5271e-03, 2.7181e-02, -7.6531e-03, 3.3271e-03, -2.7743e-02,\n -3.4526e-02, -7.6148e-03], device='cuda:0')",
13
+ "exp_avg_sq": "tensor([0.0041, 0.0044, 0.0059, 0.0047, 0.0032, 0.0024, 0.0055, 0.0039, 0.0035,\n 0.0034, 0.0047, 0.0034, 0.0030, 0.0044, 0.0047, 0.0044, 0.0045, 0.0038,\n 0.0031, 0.0040, 0.0065, 0.0037, 0.0030, 0.0032, 0.0051, 0.0035, 0.0035,\n 0.0028, 0.0046, 0.0053, 0.0042, 0.0050, 0.0048, 0.0044, 0.0037, 0.0085,\n 0.0036, 0.0029, 0.0026, 0.0062, 0.0065, 0.0037, 0.0039, 0.0055, 0.0017,\n 0.0052, 0.0018, 0.0036, 0.0033, 0.0019, 0.0031, 0.0023, 0.0042, 0.0039,\n 0.0037, 0.0025, 0.0028, 0.0024, 0.0028, 0.0042, 0.0018, 0.0040, 0.0043,\n 0.0048, 0.0039, 0.0056, 0.0034, 0.0026, 0.0065, 0.0056, 0.0031, 0.0086,\n 0.0026, 0.0032, 0.0034, 0.0041, 0.0031, 0.0017, 0.0026, 0.0050, 0.0032,\n 0.0034, 0.0033, 0.0032, 0.0006, 0.0048, 0.0046, 0.0057, 0.0027, 0.0034,\n 0.0062, 0.0030, 0.0059, 0.0030, 0.0048, 0.0037, 0.0042, 0.0037, 0.0035,\n 0.0050, 0.0032, 0.0033, 0.0048, 0.0043, 0.0025, 0.0050, 0.0025, 0.0044,\n 0.0046, 0.0034, 0.0044, 0.0042, 0.0027, 0.0043, 0.0025, 0.0028, 0.0058,\n 0.0023, 0.0020, 0.0047, 0.0033, 0.0033, 0.0017, 0.0028, 0.0038, 0.0040,\n 0.0061, 0.0035, 0.0040, 0.0037, 0.0050, 0.0015, 0.0024, 0.0035, 0.0023,\n 0.0048, 0.0048, 0.0017, 0.0064, 0.0037, 0.0021, 0.0046, 0.0034, 0.0027,\n 0.0014, 0.0058, 0.0118, 0.0074, 0.0039, 0.0059, 0.0045, 0.0041, 0.0041,\n 0.0035, 0.0042, 0.0054, 0.0028, 0.0035, 0.0017, 0.0031, 0.0045, 0.0062,\n 0.0029, 0.0044, 0.0057, 0.0092, 0.0036, 0.0028, 0.0035, 0.0053, 0.0020,\n 0.0030, 0.0036, 0.0026, 0.0044, 0.0044, 0.0048, 0.0033, 0.0064, 0.0043,\n 0.0059, 0.0038, 0.0070, 0.0035, 0.0046, 0.0054, 0.0042, 0.0036, 0.0031,\n 0.0043, 0.0049, 0.0036, 0.0031, 0.0035, 0.0045, 0.0062, 0.0056, 0.0051,\n 0.0025, 0.0044, 0.0041, 0.0034, 0.0043, 0.0054, 0.0032, 0.0042, 0.0025,\n 0.0043, 0.0032, 0.0085, 0.0036, 0.0031, 0.0061, 0.0037, 0.0072, 0.0036,\n 0.0025, 0.0031, 0.0036, 0.0063, 0.0040, 0.0046, 0.0035, 0.0024, 0.0044,\n 0.0038, 0.0036, 0.0051, 0.0048, 0.0035, 0.0024, 0.0046, 0.0042, 0.0061,\n 0.0040, 0.0034, 0.0031, 0.0057, 0.0045, 0.0056, 0.0023, 0.0042, 0.0040,\n 0.0048, 0.0079, 0.0078, 0.0016, 0.0035, 0.0061, 0.0023, 0.0048, 0.0036,\n 0.0035, 0.0007, 0.0017, 0.0038, 0.0038, 0.0038, 0.0044, 0.0034, 0.0030,\n 0.0036, 0.0054, 0.0043, 0.0034, 0.0047, 0.0049, 0.0038, 0.0021, 0.0036,\n 0.0071, 0.0045, 0.0036, 0.0065, 0.0052, 0.0038, 0.0033, 0.0048, 0.0040,\n 0.0042, 0.0035, 0.0057, 0.0046, 0.0041, 0.0040, 0.0021, 0.0062, 0.0028,\n 0.0034, 0.0056, 0.0051, 0.0040, 0.0021, 0.0051, 0.0038, 0.0072, 0.0047,\n 0.0040, 0.0038, 0.0041, 0.0042, 0.0034, 0.0055, 0.0048, 0.0035, 0.0036,\n 0.0040, 0.0048, 0.0039, 0.0052, 0.0057, 0.0050, 0.0028, 0.0043, 0.0059,\n 0.0026, 0.0036, 0.0039, 0.0033, 0.0022, 0.0044, 0.0021, 0.0032, 0.0053,\n 0.0041, 0.0057, 0.0045, 0.0049, 0.0042, 0.0050, 0.0032, 0.0022, 0.0020,\n 0.0045, 0.0048, 0.0030, 0.0052, 0.0052, 0.0053, 0.0039, 0.0056, 0.0028,\n 0.0038, 0.0032, 0.0024, 0.0041, 0.0051, 0.0040, 0.0027, 0.0040, 0.0022,\n 0.0045, 0.0034, 0.0046, 0.0044, 0.0078, 0.0039, 0.0039, 0.0029, 0.0037,\n 0.0036, 0.0053, 0.0038, 0.0023, 0.0055, 0.0059, 0.0044, 0.0030, 0.0028,\n 0.0055, 0.0055, 0.0050, 0.0023, 0.0028, 0.0040, 0.0039, 0.0033, 0.0043,\n 0.0048, 0.0047, 0.0061, 0.0035, 0.0071, 0.0039, 0.0030, 0.0052, 0.0047,\n 0.0027, 0.0063, 0.0058, 0.0046, 0.0042, 0.0026, 0.0058, 0.0042, 0.0057,\n 0.0041, 0.0060, 0.0038, 0.0036, 0.0020, 0.0030, 0.0033, 0.0059, 0.0021,\n 0.0060, 0.0059, 0.0037, 0.0040, 0.0027, 0.0032, 0.0023, 0.0016, 0.0045,\n 0.0046, 0.0043, 0.0025, 0.0046, 0.0031, 0.0089, 0.0026, 0.0061, 0.0089,\n 0.0021, 0.0050, 0.0048, 0.0041, 0.0050, 0.0039, 0.0033, 0.0034, 0.0043,\n 0.0055, 0.0034, 0.0029, 0.0041, 0.0029, 0.0034, 0.0024, 0.0035, 0.0022,\n 0.0069, 0.0053, 0.0035, 0.0022, 0.0044, 0.0044, 0.0035, 0.0069, 0.0060,\n 0.0030, 0.0034, 0.0033, 0.0043, 0.0039, 0.0043, 0.0036, 0.0018, 0.0020,\n 0.0094, 0.0043, 0.0032, 0.0061, 0.0044, 0.0047, 0.0055, 0.0064, 0.0044,\n 0.0032, 0.0040, 0.0067, 0.0034, 0.0041, 0.0028, 0.0047, 0.0025, 0.0025,\n 0.0056, 0.0034, 0.0045, 0.0066, 0.0036, 0.0048, 0.0020, 0.0033, 0.0032,\n 0.0031, 0.0063, 0.0033, 0.0050, 0.0030, 0.0032, 0.0046, 0.0030, 0.0096,\n 0.0054, 0.0038, 0.0050, 0.0030, 0.0065, 0.0037, 0.0047, 0.0030, 0.0024,\n 0.0045, 0.0024, 0.0055, 0.0032, 0.0096, 0.0043, 0.0036, 0.0028],\n device='cuda:0')"
14
  },
15
  "2": {
16
+ "step": "tensor(6260.)",
17
+ "exp_avg": "tensor([ 4.8867e-03, 5.0872e-04, -1.1179e-03, -6.3669e-03, 9.7841e-04,\n -1.2620e-03, -3.2520e-03, -1.2085e-03, 2.0005e-03, 7.2467e-03,\n 2.6847e-03, -5.1920e-03, -3.2815e-04, 1.1350e-03, -5.7392e-03,\n -1.1850e-02, -4.9809e-03, -1.4367e-02, 8.5089e-04, -2.7555e-04,\n -9.9056e-03, 1.3274e-02, -1.8857e-04, -3.3881e-03, -1.8454e-03,\n 2.0691e-03, -9.8235e-04, 2.7665e-03, -1.0355e-03, -1.1666e-03,\n -2.3049e-03, 2.0035e-03, 1.5425e-03, 4.4901e-03, 7.7570e-03,\n 3.9652e-03, 3.4477e-03, -5.4886e-03, 3.4431e-03, -2.7509e-03,\n 2.8473e-04, 3.2787e-03, -4.1174e-03, -2.0651e-03, -6.0493e-03,\n 4.7881e-03, 2.2355e-03, 4.3603e-04, -6.1181e-04, 2.7814e-03,\n -2.4060e-03, -4.4140e-03, 4.5694e-05, 2.6914e-05, 1.5530e-03,\n 3.7221e-03, -6.0255e-03, -1.6161e-03, 3.3332e-04, -3.9637e-03,\n 1.0653e-03, -1.6633e-03, 7.4323e-04, -1.7207e-04, 3.7102e-03,\n 1.6462e-03, 8.2696e-03, 4.0024e-03, -1.3782e-03, -8.3224e-03,\n -2.1287e-03, 1.0655e-03, 1.1073e-03, 5.8886e-03, -6.9749e-03,\n -6.9178e-04, 2.2777e-03, 5.3585e-03, 1.3174e-03, -7.5804e-04,\n 1.6006e-03, 3.1378e-03, -4.8349e-03, 2.9375e-03, 6.2926e-02,\n -4.9597e-03, -7.9912e-03, 1.1522e-03, -1.7965e-03, 9.0977e-04,\n 9.3490e-04, -1.8803e-04, -1.6911e-03, -9.3432e-03, 1.9296e-04,\n 1.7120e-04, -6.0348e-04, -3.6702e-03, 4.4878e-03, 4.8650e-03,\n 5.2098e-03, -5.3342e-03, -4.6895e-03, -2.5844e-03, 6.8568e-03,\n 9.2179e-04, -5.0121e-03, 6.6449e-03, 2.3190e-04, 1.7712e-04,\n -1.8432e-03, -4.7253e-03, 1.7649e-03, -1.5790e-02, -6.2896e-03,\n -2.5629e-03, -1.3048e-03, 7.2159e-03, -1.1316e-03, 4.7814e-03,\n -2.5444e-03, -4.2504e-04, 5.8342e-03, 4.1806e-03, -1.3246e-03,\n -2.0185e-03, 1.4937e-04, -2.3415e-03, -1.0825e-03, 2.0923e-04,\n 1.5273e-03, -2.0230e-03, -3.8851e-03, -1.3077e-03, -7.4009e-03,\n -2.7793e-03, 3.3375e-03, -1.7036e-02, 3.7110e-03, 5.4149e-03,\n -2.8434e-03, 3.0604e-03, 4.0370e-03, 2.6169e-03, -2.2187e-03,\n 9.4422e-04, -2.0355e-03, -2.6657e-03, -4.1957e-04, 3.0747e-03,\n -1.3988e-03, -8.0024e-04, -4.4096e-03, 1.7475e-03, -4.8512e-03,\n 5.2750e-03, 5.6642e-03, 2.7110e-03, -3.2228e-03, -1.6431e-03,\n -6.8941e-04, 6.7973e-04, 2.6017e-03, 2.4595e-03, -1.9450e-03,\n 1.5458e-03, 2.2050e-03, 2.8669e-03, 1.8986e-03, -1.7492e-04,\n 1.8372e-03, 1.7970e-03, -3.0099e-03, 3.5868e-03, -2.7756e-03,\n 3.0318e-03, -1.4662e-03, 3.2855e-04, -8.3113e-03, 2.4346e-03,\n -3.9485e-03, -6.1455e-04, -2.1049e-03, 5.2822e-03, 1.2449e-03,\n -3.5912e-03, 3.5329e-03, -6.7198e-03, 2.7082e-03, -8.1415e-04,\n 8.8920e-04, -6.0166e-03, -6.5106e-04, 2.8041e-03, 1.4105e-03,\n 5.0365e-03, 2.3220e-03, -6.4239e-03, -4.0117e-03, 4.3123e-03,\n -6.8566e-04, 4.3732e-03, 1.9032e-03, -2.4268e-03, -7.1627e-04,\n 1.1084e-04, -1.4613e-03, 2.1403e-03, 2.0373e-03, 1.8801e-03,\n 5.1170e-04, -3.3361e-03, -3.7526e-04, -8.6339e-04, 2.4656e-03,\n -9.6281e-04, -8.2122e-04, 4.2926e-04, -1.4004e-03, -5.5838e-03,\n -1.4807e-02, -4.8923e-03, -4.3213e-03, -2.1803e-03, -5.3398e-04,\n -1.1681e-03, -9.1127e-04, -7.4865e-04, 3.6239e-03, 1.0889e-03,\n 6.5428e-04, -1.0703e-05, 1.1373e-03, 2.1438e-03, -4.1434e-04,\n 4.0449e-03, -4.2720e-03, 1.3878e-04, -1.2676e-03, -3.5601e-03,\n -8.9969e-04, 1.0198e-02, -3.6208e-03, -3.7273e-04, 3.9022e-03,\n -7.5235e-04, 2.4885e-03, -4.0734e-04, 2.4597e-03, -1.4699e-03,\n 1.2869e-03, 2.8020e-03, 1.1916e-03, 2.5705e-02, -1.3206e-02,\n -1.0751e-03, -1.1769e-03, -3.9161e-05, -6.2010e-04, 7.6244e-04,\n 4.3166e-03, 4.7065e-04, -9.5820e-04, 6.7457e-04, -7.9814e-03,\n -2.7726e-03, 1.0704e-03, -1.3961e-03, 6.9104e-03, 1.3303e-03,\n 1.9127e-03, 1.6537e-02, 4.0638e-03, -9.1654e-03, 8.8158e-04,\n 2.9526e-03, 1.0356e-03, -9.7502e-04, 3.0738e-03, 6.4695e-04,\n -3.1488e-03, -1.1554e-03, 1.1232e-03, -2.5902e-04, -1.0267e-03,\n -6.4079e-05, 1.6548e-04, 1.4237e-03, 1.6725e-04, 2.1010e-03,\n -2.1379e-03, -2.0094e-03, 7.9690e-03, 3.4915e-03, 3.3876e-03,\n 2.7499e-03, -5.7693e-03, -9.4365e-03, 2.5063e-03, -1.8646e-03,\n -2.3048e-04, 2.7507e-03, 6.8362e-04, 1.8233e-03, 2.1790e-03,\n 2.2745e-03, 3.6279e-03, -5.3239e-03, 1.2008e-03, 6.9363e-03,\n 2.5056e-03, 4.4390e-04, 1.2272e-03, 1.4655e-03, 3.6269e-03,\n -5.4146e-03, -4.0763e-03, -1.1614e-02, 1.3809e-03, 2.8938e-03,\n 2.0831e-03, -4.8253e-03, 4.0983e-04, 6.7578e-03, 2.1646e-03,\n -3.3930e-03, 1.4760e-03, 4.3051e-03, 7.7662e-04, 1.8646e-02,\n 2.5540e-03, -6.7559e-03, 1.2408e-02, 6.3797e-04, 1.7023e-03,\n 5.9787e-03, -5.2527e-03, -2.3116e-03, -9.1865e-03, 8.9471e-03,\n -1.5752e-03, -4.1685e-03, -1.6283e-03, 7.2006e-03, -3.2105e-03,\n -2.5230e-05, -1.2684e-02, 8.4796e-03, -1.7509e-03, 2.7738e-04,\n 7.3405e-03, 3.4225e-03, -3.3818e-03, -2.9039e-03, 3.8495e-03,\n -8.4090e-03, -2.6074e-03, 1.4745e-03, 1.7347e-03, 3.0088e-04,\n -1.1235e-03, -3.7340e-03, 5.8534e-04, 6.6134e-03, -2.5978e-03,\n 2.8600e-03, 1.2610e-03, 4.3294e-03, -8.8621e-03, -4.9124e-03,\n -7.7673e-03, -8.3438e-03, 8.2868e-03, -2.6217e-03, 1.2684e-03,\n 3.7026e-03, 8.7610e-04, -1.1838e-03, 6.6596e-03, 1.8273e-03,\n 1.5483e-03, 3.0108e-03, 4.9411e-03, 4.1947e-03, -7.1165e-07,\n 2.1385e-03, 2.2143e-03, -2.7983e-03, -4.6172e-03, 1.8923e-03,\n -1.9843e-03, 4.7586e-03, 5.1999e-03, 2.8251e-03, 9.4055e-04,\n -5.4168e-03, 2.7846e-04, -8.8146e-03, 1.1342e-03, 1.0348e-03,\n -3.1423e-03, 3.5030e-03, 1.2380e-02, 7.7151e-03, 3.0760e-04,\n -4.4095e-03, -1.9055e-03, 3.2680e-04, 5.1586e-03, -8.6181e-04,\n -5.4959e-03, 1.7943e-03, -3.6391e-03, 4.1673e-04, 1.0527e-03,\n -5.1937e-03, -1.6752e-03, 3.2007e-03, -1.0697e-03, 3.3488e-03,\n -3.0408e-04, -1.2251e-03, -3.2794e-03, 2.7430e-03, 1.9908e-03,\n -2.0770e-03, 6.8514e-03, 2.3879e-03, -5.0781e-03, -8.4566e-03,\n -2.0373e-03, -1.2098e-03, -2.9571e-03, 2.1479e-03, -1.6534e-03,\n -2.3728e-03, 1.4389e-03, -1.0436e-03, 1.5819e-03, -2.5597e-03,\n -7.3902e-03, -1.3219e-03, 2.7013e-03, -2.2526e-03, -1.6069e-02,\n 3.7173e-03, 4.2608e-04, -1.4553e-03, -1.4548e-04, 4.7333e-03,\n -2.7314e-03, 5.2138e-04, 3.6016e-03, -9.5947e-04, -3.3567e-03,\n 1.2448e-02, -4.6116e-03, -1.0872e-02, 1.5687e-03, 1.5182e-03,\n -7.9019e-03, -2.3635e-03, 9.1619e-03, 2.2213e-03, 4.6617e-03,\n 1.4724e-03, -6.8670e-03, -2.3906e-03, 7.0449e-03, 5.4083e-04,\n -2.2398e-03, 2.9774e-03, 1.2333e-03, 1.0830e-03, 1.1886e-03,\n -4.8377e-03, 2.8849e-03, 3.6970e-04, -4.5830e-04, 2.1080e-03,\n 2.2285e-03, 1.5534e-03, -2.0126e-03, 2.5872e-03, -2.9912e-04,\n 1.3546e-03, 7.1378e-04, -9.3051e-04, 1.3557e-03, -8.4275e-04,\n 4.4472e-03, 7.5092e-03, 8.7805e-04, -1.0514e-03, -9.5651e-04,\n 3.0572e-03, 8.4259e-03, -5.1380e-03, 3.4458e-03, 5.0327e-03,\n -4.3082e-03, 5.9500e-03, -3.2243e-03, 1.8296e-03, 1.3737e-03,\n -3.4129e-05, 2.1228e-03, -1.7475e-03, 5.3503e-04, -4.3082e-03,\n -1.1050e-02, -2.4932e-03], device='cuda:0')",
18
+ "exp_avg_sq": "tensor([1.0792e-04, 9.0773e-05, 7.7478e-05, 7.0284e-05, 2.0606e-04, 1.7382e-04,\n 6.7362e-05, 6.2944e-05, 8.5263e-05, 1.1758e-04, 1.0870e-04, 3.3140e-04,\n 7.9464e-05, 1.1656e-04, 1.1921e-04, 1.0743e-04, 5.9468e-05, 3.4468e-04,\n 1.9544e-04, 1.3167e-04, 9.6660e-05, 2.0093e-04, 2.2937e-04, 1.5615e-04,\n 5.5964e-05, 9.0342e-05, 2.6454e-04, 8.3666e-05, 5.9381e-05, 1.0581e-04,\n 8.1942e-05, 4.5587e-05, 1.5460e-04, 5.1406e-05, 1.0676e-04, 1.0959e-04,\n 1.0808e-04, 1.6558e-04, 1.6960e-04, 1.3375e-04, 1.7639e-04, 1.3367e-04,\n 1.3215e-04, 9.2916e-05, 1.3905e-04, 1.1919e-04, 3.9185e-04, 1.3130e-04,\n 1.8960e-04, 3.6746e-04, 1.4445e-04, 1.1928e-04, 9.7207e-05, 8.1171e-05,\n 1.3278e-04, 9.8138e-05, 1.3436e-04, 2.1676e-04, 1.0071e-04, 1.6460e-04,\n 2.3541e-04, 1.8001e-04, 1.1689e-04, 7.1375e-05, 1.6981e-04, 6.3839e-05,\n 1.4972e-04, 2.0867e-04, 7.1932e-05, 1.1391e-04, 9.8710e-05, 1.2239e-04,\n 8.3071e-05, 7.8341e-05, 1.3802e-04, 1.2147e-04, 6.8727e-05, 5.0341e-04,\n 2.2837e-04, 5.9238e-05, 2.6835e-04, 9.8945e-05, 1.0126e-04, 1.5626e-04,\n 1.8265e-01, 8.5799e-05, 1.1625e-04, 5.2007e-05, 1.3491e-04, 1.0109e-04,\n 1.7189e-04, 1.2908e-04, 4.8529e-05, 2.6843e-04, 6.5262e-05, 9.0394e-05,\n 1.2401e-04, 8.7091e-05, 1.4041e-04, 1.5788e-04, 9.9385e-05, 7.8370e-05,\n 2.1022e-04, 8.3179e-05, 4.9730e-04, 6.7922e-05, 2.7224e-04, 1.0873e-04,\n 9.6273e-05, 1.1185e-04, 1.7513e-04, 9.9811e-05, 9.6998e-05, 1.2109e-04,\n 1.9311e-04, 1.4158e-04, 1.6021e-04, 3.6983e-04, 3.4689e-04, 1.3618e-04,\n 1.2525e-04, 5.4673e-05, 6.8177e-04, 1.0754e-04, 4.9694e-05, 6.9982e-05,\n 7.4220e-05, 1.0672e-04, 4.3816e-05, 8.4941e-05, 1.2389e-04, 6.8842e-04,\n 1.9690e-04, 8.5505e-05, 1.0317e-04, 6.8448e-05, 7.2588e-05, 5.1974e-04,\n 7.0582e-05, 1.9039e-04, 2.0312e-04, 5.6723e-05, 1.1405e-04, 2.2860e-04,\n 3.3016e-04, 9.3178e-05, 1.3381e-04, 1.1165e-04, 6.3504e-05, 6.4653e-05,\n 1.3613e-04, 1.0739e-04, 1.2789e-04, 1.0706e-04, 6.5977e-05, 9.2151e-05,\n 3.6195e-04, 1.5915e-04, 2.3896e-04, 1.0791e-04, 8.5331e-05, 1.2916e-04,\n 3.5238e-04, 9.6609e-05, 5.9611e-05, 1.2944e-04, 2.4423e-04, 2.4205e-04,\n 9.3840e-05, 9.7066e-05, 2.6742e-04, 1.2821e-04, 1.2967e-04, 2.3409e-04,\n 8.8927e-05, 8.8945e-05, 9.6447e-05, 8.9413e-05, 7.0898e-05, 1.0188e-04,\n 1.0641e-04, 1.6001e-04, 6.9191e-05, 5.6665e-05, 6.5863e-05, 9.8997e-05,\n 1.1538e-04, 1.2909e-04, 1.1369e-04, 1.3225e-04, 3.1254e-04, 2.4712e-04,\n 7.8887e-05, 1.2204e-04, 4.8840e-05, 7.4660e-05, 5.5167e-05, 8.8031e-05,\n 2.9919e-04, 1.4351e-04, 4.0146e-05, 1.1328e-04, 1.0609e-04, 7.3102e-05,\n 9.4959e-05, 7.3513e-05, 2.2534e-04, 8.9023e-05, 2.5034e-04, 2.1784e-04,\n 1.4688e-04, 1.6458e-04, 1.1312e-04, 5.7794e-05, 1.5459e-04, 1.7661e-04,\n 2.9837e-04, 7.8849e-05, 1.1800e-04, 1.0241e-04, 1.8850e-04, 8.4100e-05,\n 1.0510e-04, 1.9210e-04, 7.5606e-05, 1.2741e-04, 1.4106e-04, 6.0376e-05,\n 1.3675e-04, 1.2316e-04, 2.8231e-04, 1.2109e-04, 7.8818e-05, 8.5911e-05,\n 5.2847e-05, 2.3495e-04, 1.4444e-04, 8.4533e-05, 7.2124e-05, 6.2424e-05,\n 2.7410e-04, 1.6171e-04, 1.3607e-04, 6.0380e-05, 9.5745e-05, 1.0252e-04,\n 5.4768e-04, 9.2122e-05, 8.5727e-05, 2.5686e-04, 8.5908e-05, 1.3866e-04,\n 3.3664e-04, 9.0643e-03, 3.7432e-04, 1.0873e-04, 1.5788e-04, 1.5483e-04,\n 7.8344e-05, 1.7510e-04, 1.2820e-04, 1.6233e-04, 8.7034e-05, 9.2719e-05,\n 2.1298e-04, 8.9637e-05, 1.2885e-04, 6.3668e-05, 3.3003e-04, 7.5529e-05,\n 9.9450e-05, 2.9308e-04, 8.7183e-05, 9.3543e-05, 1.2998e-04, 7.0202e-05,\n 2.5591e-04, 6.1789e-05, 5.8334e-05, 8.0637e-05, 1.1825e-04, 5.0052e-05,\n 5.6604e-05, 1.5276e-04, 1.1111e-04, 2.5987e-04, 8.1534e-05, 1.3289e-04,\n 1.0164e-04, 1.5643e-04, 8.7080e-05, 1.1466e-04, 2.4778e-04, 1.3974e-04,\n 9.6759e-05, 7.5543e-05, 1.2742e-04, 8.6746e-05, 8.9915e-05, 6.0370e-05,\n 6.8627e-05, 8.5938e-05, 9.4896e-05, 9.2362e-05, 1.0326e-04, 6.8984e-05,\n 8.0581e-05, 1.5293e-04, 7.3110e-05, 1.0483e-04, 1.0117e-04, 7.6617e-05,\n 1.1731e-04, 6.8658e-05, 1.0037e-04, 1.7185e-04, 2.2787e-04, 1.4640e-04,\n 5.8551e-05, 2.0328e-04, 1.0779e-04, 3.7033e-04, 1.0311e-04, 1.3255e-04,\n 2.1325e-04, 8.0628e-05, 1.4747e-04, 8.4007e-05, 2.0089e-04, 1.7388e-04,\n 2.5681e-04, 1.7806e-04, 4.8905e-04, 6.8115e-05, 1.3929e-04, 1.8226e-04,\n 1.3247e-04, 2.0558e-04, 1.3466e-04, 1.3887e-04, 8.4411e-05, 2.1834e-04,\n 5.2822e-05, 1.0176e-04, 2.1825e-04, 8.3836e-05, 1.2652e-04, 1.1945e-04,\n 1.7376e-04, 1.1973e-04, 1.4859e-04, 1.3853e-04, 1.5667e-04, 8.0877e-05,\n 1.3025e-04, 1.2427e-04, 1.3072e-04, 7.1213e-05, 1.0712e-04, 6.1010e-05,\n 7.9518e-05, 8.2784e-05, 6.9502e-05, 2.1214e-04, 8.8811e-05, 2.2914e-04,\n 7.0151e-05, 3.3518e-04, 1.8356e-04, 7.0150e-05, 1.4000e-04, 1.7000e-04,\n 1.7629e-04, 1.1690e-04, 1.4700e-04, 1.5039e-04, 7.0644e-05, 5.3187e-05,\n 1.4254e-04, 8.3098e-05, 7.5045e-05, 2.0402e-04, 9.2433e-05, 1.7278e-04,\n 1.7165e-04, 2.9715e-04, 8.9655e-05, 1.2465e-04, 1.3469e-04, 1.8962e-04,\n 7.9172e-05, 1.4432e-04, 2.8665e-04, 1.3863e-04, 5.6675e-05, 2.0410e-04,\n 7.4273e-05, 2.3233e-04, 7.1642e-05, 2.3668e-04, 2.4007e-04, 1.1151e-04,\n 3.5575e-04, 1.0606e-04, 2.8336e-04, 8.7962e-05, 9.4872e-05, 6.6499e-05,\n 1.0199e-04, 1.8137e-04, 1.4876e-04, 1.9311e-04, 6.7667e-04, 7.7809e-05,\n 6.9968e-05, 6.8193e-05, 9.7806e-05, 1.1829e-04, 2.5237e-04, 7.0415e-05,\n 9.4459e-05, 1.0944e-04, 6.0876e-05, 4.0843e-04, 1.1683e-04, 1.2658e-04,\n 2.5623e-04, 7.9128e-05, 2.8916e-04, 1.5294e-04, 1.7881e-04, 8.6799e-05,\n 1.1889e-04, 1.0089e-04, 1.3520e-04, 1.0283e-04, 1.8143e-04, 4.6377e-05,\n 3.2253e-04, 8.1746e-05, 2.1466e-04, 6.3853e-05, 3.9842e-05, 5.6384e-05,\n 4.0739e-04, 1.0075e-04, 8.7633e-05, 4.4923e-05, 1.2219e-04, 7.2685e-05,\n 1.2746e-04, 1.1325e-04, 6.3969e-05, 1.2327e-04, 6.8187e-05, 2.0386e-04,\n 9.8931e-05, 8.4716e-04, 3.6577e-04, 9.6047e-05, 8.4695e-05, 8.7840e-05,\n 6.8798e-05, 9.6087e-05, 1.2179e-04, 3.9986e-05, 7.7385e-05, 2.3668e-04,\n 1.3526e-04, 6.4968e-05, 1.3383e-04, 6.6248e-05, 5.7501e-05, 2.1494e-04,\n 6.7186e-05, 1.5650e-04, 1.7472e-04, 8.8961e-05, 1.7171e-04, 7.7478e-05,\n 9.0730e-05, 1.3632e-04, 1.0665e-04, 5.3253e-04, 2.5189e-04, 2.0321e-04,\n 9.3765e-05, 1.1508e-04, 6.5757e-05, 7.6875e-05, 2.6611e-04, 1.7254e-04,\n 1.0786e-04, 2.1497e-04, 1.2025e-04, 9.7063e-05, 2.2226e-04, 6.5228e-05,\n 2.1468e-04, 1.1085e-04, 1.6930e-04, 7.4267e-05, 1.1345e-04, 2.0424e-04,\n 1.3223e-04, 2.2672e-04, 1.0070e-04, 9.4908e-05, 1.0856e-04, 1.1736e-04,\n 3.6340e-04, 2.4406e-04], device='cuda:0')"
19
  },
20
  "3": {
21
+ "step": "tensor(6260.)",
22
+ "exp_avg": "tensor([ 6.5936e-03, 1.1896e-03, -5.0563e-04, -7.4915e-03, 2.6546e-04,\n -9.9585e-04, -4.1941e-03, -2.5255e-03, 1.8572e-03, 6.9235e-03,\n 2.2968e-03, -3.4442e-03, -7.3726e-04, 1.5316e-04, -6.0679e-03,\n -1.0157e-02, -8.2887e-03, -9.3257e-03, 1.5103e-03, -3.0279e-04,\n -1.6971e-02, 1.1692e-02, -1.7167e-03, -2.8821e-03, -3.7607e-03,\n 2.4524e-03, 4.2655e-05, 3.0777e-03, -1.8064e-03, -1.3582e-03,\n -3.6452e-03, 4.1541e-03, 1.5816e-03, 3.5059e-03, 5.3233e-03,\n 4.6033e-03, 3.1643e-03, -4.6820e-03, 3.5589e-03, -2.0642e-03,\n 1.3118e-03, 3.3629e-03, -3.5940e-03, -2.6429e-03, -3.9873e-03,\n 5.9555e-03, 2.2178e-03, 1.7363e-03, 1.9350e-04, 9.2571e-04,\n -3.7084e-03, -4.6472e-03, 9.3669e-04, -4.6792e-04, 1.2628e-03,\n 3.5393e-03, -7.0226e-03, -1.1334e-03, 7.7335e-04, -2.9711e-03,\n 1.4594e-03, -1.3083e-03, 1.6890e-04, 6.4026e-04, 3.2287e-03,\n 2.3185e-03, 8.2296e-03, 2.6423e-03, -1.1963e-03, -9.0908e-03,\n -2.8086e-03, 1.2918e-03, 8.0634e-04, 6.5974e-03, -6.5277e-03,\n -6.5682e-04, 3.2977e-03, 4.3411e-03, 4.1987e-04, -9.1263e-04,\n 1.2841e-03, 3.8271e-03, -3.1331e-03, 2.6616e-03, 3.5247e-03,\n -7.5258e-03, -8.3000e-03, 2.0191e-03, -1.0541e-03, -1.1944e-04,\n 1.0101e-03, -1.1438e-03, -1.5252e-03, -7.4187e-03, 7.1159e-04,\n 1.9368e-03, -1.0312e-03, -4.2518e-03, 2.1283e-03, 6.2732e-03,\n 4.8872e-03, -5.8156e-03, -4.0569e-03, -3.3439e-03, 4.2690e-03,\n 7.4194e-04, -2.6519e-03, 7.9385e-03, -2.2503e-03, 6.3317e-04,\n -1.6069e-03, -7.8601e-03, 1.7050e-03, -1.7223e-02, -6.0011e-03,\n -1.2895e-03, -1.7636e-03, 5.2802e-03, -3.5089e-04, 5.3815e-03,\n -3.6036e-03, -3.2066e-03, 3.3231e-03, 3.7462e-03, -1.8971e-03,\n -2.1568e-03, 1.8754e-04, -2.3440e-03, -5.3024e-04, 5.5007e-04,\n 2.3241e-03, -1.1130e-03, -2.3732e-03, -1.7660e-03, -5.7150e-03,\n -1.1365e-03, 5.7380e-03, -8.8755e-03, 4.4198e-03, 4.4902e-03,\n -1.8295e-03, 4.9779e-03, 3.4482e-03, 3.2950e-03, -6.3343e-04,\n 2.1640e-04, -3.5598e-03, -3.1751e-03, -1.4713e-03, 2.5914e-03,\n -1.3604e-03, -7.4860e-05, -3.6553e-03, 1.8916e-03, -4.5745e-03,\n 6.3626e-03, 4.0188e-03, 2.3253e-03, -1.0803e-03, -4.0328e-03,\n -9.2515e-04, 1.6980e-03, 1.0648e-03, 2.0089e-03, -2.8730e-03,\n 1.4450e-03, 1.5035e-03, 1.2080e-03, 1.6250e-03, 3.7270e-04,\n 1.8052e-03, 1.9897e-03, -2.8347e-03, 3.1325e-03, -4.5082e-03,\n 2.8384e-03, 2.6309e-04, 1.5265e-03, -1.1645e-02, 2.5962e-03,\n -3.0479e-03, -3.0059e-04, -3.7233e-03, 5.2628e-03, 1.7481e-03,\n -3.6924e-03, 3.0029e-03, -7.1065e-03, 2.2279e-03, -3.9385e-04,\n 3.1901e-04, -7.1231e-03, -2.3241e-04, 3.8676e-03, 2.3142e-03,\n 7.1210e-03, 4.4992e-03, -1.0707e-02, -2.8359e-03, 4.9074e-03,\n -7.4047e-04, 3.3955e-03, 2.5787e-03, -3.0021e-03, 2.9790e-04,\n 7.0792e-04, 1.1648e-04, 3.0105e-03, 2.0562e-03, -1.3292e-03,\n 1.6110e-03, -2.9840e-03, -2.1809e-04, -5.0096e-04, 1.7456e-03,\n 7.5357e-05, -1.7320e-04, 8.6628e-04, -1.6480e-04, -9.9287e-03,\n -1.0883e-02, -5.9667e-03, -4.8220e-03, -1.7565e-03, -8.5419e-04,\n -2.6408e-03, -1.8273e-03, -1.3795e-03, 2.4250e-03, 2.6066e-03,\n 6.9231e-04, -1.2363e-04, 2.0000e-03, 2.1655e-03, -4.1665e-04,\n 2.5296e-03, -4.7914e-03, 5.2238e-04, -1.1875e-03, -4.2807e-03,\n -1.9132e-04, 8.8770e-03, -2.4273e-03, 3.4417e-04, 4.0713e-03,\n -1.3153e-03, 1.5050e-03, 4.3390e-04, 3.3259e-03, -1.5498e-03,\n 2.2988e-03, 2.1816e-03, 1.8305e-03, 5.2378e-03, -8.1518e-03,\n -1.6015e-03, -1.3515e-03, -4.0487e-04, -2.8048e-04, 1.7408e-04,\n 2.4742e-03, 6.0270e-04, -1.9395e-03, 7.5296e-04, -7.7572e-03,\n -4.2122e-03, 1.7807e-03, -1.4512e-03, 4.5213e-03, 1.5880e-03,\n 3.1325e-03, 1.1604e-02, 4.0154e-03, -1.6928e-02, 2.4390e-04,\n 3.3653e-03, 9.2839e-04, -1.1077e-03, 3.1341e-03, 7.6772e-04,\n -3.6586e-03, -1.9267e-03, 2.0644e-03, -9.7815e-05, -1.6944e-03,\n -6.5447e-04, 2.9358e-04, 1.5196e-03, 8.4775e-05, 4.1781e-03,\n -3.2747e-03, -1.6734e-03, 5.3132e-03, 4.4260e-03, 3.8258e-03,\n 2.1634e-03, -8.1195e-03, -1.2488e-02, 1.6600e-03, -9.2338e-04,\n -9.9431e-04, 3.3417e-03, 1.9330e-03, 3.2097e-03, 1.1007e-03,\n 3.0188e-03, 4.6290e-03, -7.0154e-03, 1.7630e-03, 6.5104e-03,\n 4.2256e-03, -6.5387e-04, 8.5264e-04, 2.1452e-03, 3.2120e-03,\n -5.0989e-03, -4.2399e-03, -9.5398e-03, 1.3750e-03, 3.6652e-03,\n 2.3065e-03, -2.8187e-03, 2.3368e-04, 7.3485e-03, 2.1539e-03,\n -4.9271e-03, 1.3303e-03, 2.9252e-03, 1.2075e-03, 1.7311e-02,\n 1.9609e-03, -6.0004e-03, 7.0697e-03, 1.7806e-03, 1.7983e-03,\n 4.4307e-03, -4.9672e-03, -1.7716e-03, -9.6870e-03, 7.7847e-03,\n -8.6779e-04, -3.8887e-03, -2.7203e-03, 7.0542e-03, -2.3426e-03,\n 1.8489e-04, -1.4084e-02, 8.6603e-03, -2.4365e-03, 9.1543e-05,\n 6.4823e-03, 3.6271e-03, -3.1617e-03, -3.8594e-03, 4.1755e-03,\n -1.2361e-02, -2.2489e-03, 1.9218e-03, 1.3042e-03, 6.0264e-04,\n -1.0475e-03, -5.4257e-03, 4.2230e-05, 5.5030e-03, -1.1079e-03,\n 3.7429e-03, 2.1193e-03, 2.8632e-03, -7.7220e-03, -4.5074e-03,\n -1.1174e-02, -7.5125e-03, 7.1657e-03, -3.3154e-03, 1.0750e-03,\n 3.7191e-03, 1.8097e-03, -8.5331e-04, 7.0096e-03, 2.1095e-03,\n 2.8208e-03, 3.1790e-03, 7.2482e-03, 3.4535e-03, 1.2731e-03,\n -4.9758e-04, 1.1436e-03, -3.1838e-03, -4.8770e-03, 7.7653e-04,\n -1.1670e-03, 5.8724e-03, 3.9518e-03, 2.4306e-03, 1.3322e-03,\n -2.3090e-03, 2.0827e-04, -7.9451e-03, 1.9031e-03, 1.9339e-03,\n -1.9706e-03, 4.2827e-03, 8.9863e-03, 1.0219e-02, 1.4770e-04,\n -5.5539e-03, -3.6721e-03, 6.9482e-05, 7.2983e-03, -2.3164e-03,\n -6.2482e-03, 1.4368e-03, -2.6136e-03, 2.2961e-04, 1.4488e-03,\n -4.7855e-03, -1.5540e-03, 3.5234e-03, -1.1314e-03, 4.3382e-03,\n -4.6037e-04, 1.5632e-04, -6.4678e-03, 9.5986e-04, 3.2047e-03,\n -1.7480e-03, 5.3464e-03, 4.1775e-03, -4.2921e-03, -7.6855e-03,\n -1.3624e-03, -2.3977e-06, -2.8608e-03, 2.1526e-03, -2.1872e-03,\n -1.6377e-03, 1.5019e-03, -1.6374e-03, 9.9057e-04, -2.2022e-03,\n -4.4503e-03, 8.5544e-05, 3.1861e-03, -2.4511e-03, -9.9849e-03,\n 4.1231e-03, 3.4452e-04, -2.2725e-03, 8.1517e-04, 6.3879e-03,\n -3.0817e-03, 9.1640e-04, 3.4646e-03, -6.0133e-04, -3.4296e-03,\n 1.2108e-02, -4.0666e-03, -5.8869e-03, 9.4028e-04, 3.4290e-03,\n -8.2380e-03, -1.6503e-03, 1.2035e-02, 2.3587e-03, 5.3181e-03,\n 1.4879e-03, -9.9646e-03, -1.6769e-03, 7.0585e-03, -7.3951e-05,\n -2.4927e-03, 2.9834e-03, 2.0717e-03, 2.1251e-03, 1.5643e-03,\n -4.0666e-03, 2.6792e-03, 4.8865e-04, -1.1527e-03, 2.8985e-03,\n 1.3729e-03, 1.7010e-03, -2.3779e-03, 1.5440e-03, -7.1371e-04,\n 1.4621e-03, 1.6267e-03, -1.9764e-03, 2.2300e-03, -2.2441e-04,\n 4.0509e-03, 7.5744e-03, 1.6251e-03, -3.0041e-04, -6.1343e-04,\n 3.4326e-03, 8.5691e-03, -7.8756e-03, 2.9864e-03, 4.9767e-03,\n -4.7135e-03, 4.6276e-03, -2.5782e-03, 1.5023e-03, 8.9126e-04,\n 1.5143e-03, 4.6476e-03, -1.8130e-03, 9.7806e-04, -4.8972e-03,\n -8.5198e-03, -1.5693e-03], device='cuda:0')",
23
+ "exp_avg_sq": "tensor([1.2575e-04, 1.1000e-04, 1.4853e-04, 1.0790e-04, 1.1689e-04, 1.1994e-04,\n 1.2042e-04, 8.3786e-05, 1.0066e-04, 1.1758e-04, 1.4321e-04, 2.0947e-04,\n 7.9407e-05, 1.4941e-04, 1.3370e-04, 1.3395e-04, 1.0358e-04, 1.7976e-04,\n 1.6539e-04, 1.3574e-04, 1.7957e-04, 1.6151e-04, 1.5214e-04, 1.0937e-04,\n 1.0507e-04, 1.0668e-04, 1.9472e-04, 8.6102e-05, 9.0176e-05, 1.3947e-04,\n 1.0810e-04, 9.5406e-05, 1.8360e-04, 7.9955e-05, 1.0622e-04, 2.2178e-04,\n 1.3546e-04, 1.2563e-04, 1.3335e-04, 1.7606e-04, 2.0830e-04, 1.2664e-04,\n 1.2977e-04, 1.7466e-04, 8.5656e-05, 1.6422e-04, 1.3602e-04, 1.4659e-04,\n 1.6684e-04, 1.5493e-04, 1.3218e-04, 1.0377e-04, 1.3956e-04, 1.1536e-04,\n 1.4880e-04, 1.0114e-04, 1.1284e-04, 1.4253e-04, 9.0337e-05, 1.6920e-04,\n 1.1017e-04, 1.5402e-04, 1.2568e-04, 1.3139e-04, 1.3772e-04, 1.2733e-04,\n 1.4557e-04, 1.2641e-04, 1.3337e-04, 1.6276e-04, 1.0907e-04, 2.2896e-04,\n 9.2585e-05, 1.1183e-04, 1.2796e-04, 1.1160e-04, 8.3736e-05, 1.5235e-04,\n 1.3562e-04, 9.1302e-05, 1.6880e-04, 1.0571e-04, 1.0654e-04, 1.2084e-04,\n 5.1514e-04, 1.1092e-04, 1.2624e-04, 1.1369e-04, 1.1871e-04, 1.1673e-04,\n 2.1200e-04, 1.1819e-04, 9.4825e-05, 1.7451e-04, 1.0308e-04, 1.2202e-04,\n 1.4866e-04, 1.0438e-04, 1.3927e-04, 1.9917e-04, 1.1133e-04, 8.5160e-05,\n 1.9570e-04, 1.0874e-04, 1.9018e-04, 1.0692e-04, 1.3976e-04, 1.3453e-04,\n 1.5635e-04, 1.1528e-04, 1.7300e-04, 1.2378e-04, 1.0746e-04, 1.3408e-04,\n 1.1785e-04, 1.1193e-04, 1.8323e-04, 1.5437e-04, 1.2366e-04, 1.6786e-04,\n 1.2922e-04, 8.3686e-05, 1.6885e-04, 1.0141e-04, 7.9075e-05, 1.0774e-04,\n 1.2854e-04, 1.2675e-04, 7.7291e-05, 1.1609e-04, 1.5346e-04, 1.5997e-04,\n 1.1358e-04, 9.8705e-05, 8.7336e-05, 1.1353e-04, 1.0783e-04, 1.5747e-04,\n 1.2447e-04, 1.6934e-04, 1.1865e-04, 9.8465e-05, 1.0633e-04, 1.7365e-04,\n 1.1530e-04, 1.4571e-04, 2.6459e-04, 1.9017e-04, 9.8277e-05, 1.1923e-04,\n 1.6173e-04, 1.2335e-04, 1.4261e-04, 1.2066e-04, 1.0987e-04, 1.3121e-04,\n 1.6915e-04, 1.2035e-04, 1.1793e-04, 1.1047e-04, 1.0563e-04, 1.6705e-04,\n 1.9592e-04, 1.0277e-04, 1.1855e-04, 1.7744e-04, 1.9155e-04, 1.3172e-04,\n 1.0166e-04, 1.5879e-04, 1.3906e-04, 1.1632e-04, 1.1341e-04, 1.4606e-04,\n 1.3269e-04, 8.8860e-05, 1.4078e-04, 1.0602e-04, 1.4402e-04, 1.4076e-04,\n 1.4517e-04, 1.2777e-04, 1.4080e-04, 9.1410e-05, 1.1748e-04, 1.3379e-04,\n 1.3527e-04, 1.1644e-04, 1.0026e-04, 1.3877e-04, 1.9976e-04, 1.3400e-04,\n 9.9860e-05, 1.1761e-04, 8.2055e-05, 1.4588e-04, 9.9417e-05, 1.5820e-04,\n 1.5452e-04, 1.6007e-04, 7.6271e-05, 1.0207e-04, 1.2688e-04, 1.1372e-04,\n 9.5097e-05, 1.0875e-04, 1.3613e-04, 1.1886e-04, 1.4595e-04, 2.7612e-04,\n 1.4144e-04, 1.2324e-04, 2.0046e-04, 8.4263e-05, 2.2611e-04, 1.2919e-04,\n 1.4159e-04, 8.1693e-05, 1.2549e-04, 1.6713e-04, 1.4994e-04, 1.2748e-04,\n 1.1321e-04, 1.2718e-04, 1.1452e-04, 1.2561e-04, 1.2411e-04, 1.1358e-04,\n 1.3451e-04, 1.0998e-04, 1.3017e-04, 1.4769e-04, 1.2380e-04, 1.4775e-04,\n 9.1067e-05, 1.7515e-04, 1.2009e-04, 1.6161e-04, 1.0826e-04, 1.0752e-04,\n 1.1786e-04, 1.6453e-04, 1.5385e-04, 1.1798e-04, 1.7141e-04, 1.8763e-04,\n 1.4071e-04, 1.1014e-04, 1.2684e-04, 1.3600e-04, 1.1745e-04, 1.3431e-04,\n 1.6915e-04, 3.5317e-04, 1.2631e-04, 1.2282e-04, 1.5549e-04, 1.5346e-04,\n 1.1445e-04, 1.4159e-04, 1.0035e-04, 1.3886e-04, 1.2890e-04, 1.3108e-04,\n 1.5599e-04, 1.2711e-04, 1.4553e-04, 9.0238e-05, 1.3555e-04, 1.0397e-04,\n 1.7808e-04, 2.0605e-04, 1.0666e-04, 1.7577e-04, 1.4785e-04, 1.0447e-04,\n 1.6971e-04, 1.1103e-04, 9.7360e-05, 1.2040e-04, 1.3565e-04, 9.5824e-05,\n 1.0174e-04, 1.3469e-04, 1.3914e-04, 1.2258e-04, 1.4951e-04, 1.2563e-04,\n 1.2839e-04, 1.9973e-04, 1.3034e-04, 1.2885e-04, 1.2525e-04, 1.6251e-04,\n 1.1228e-04, 1.3803e-04, 1.5723e-04, 1.1917e-04, 1.1137e-04, 9.5429e-05,\n 1.1811e-04, 9.9385e-05, 1.5471e-04, 1.2078e-04, 9.8845e-05, 9.7197e-05,\n 1.0709e-04, 1.7745e-04, 8.9234e-05, 1.3001e-04, 1.6969e-04, 1.0507e-04,\n 9.3495e-05, 1.0687e-04, 1.5229e-04, 1.2995e-04, 1.8916e-04, 1.3661e-04,\n 8.0220e-05, 1.0921e-04, 1.1968e-04, 1.5239e-04, 9.1484e-05, 1.3868e-04,\n 1.6829e-04, 1.2274e-04, 1.4523e-04, 1.1474e-04, 1.5032e-04, 1.6515e-04,\n 1.7835e-04, 1.0880e-04, 1.7595e-04, 1.1059e-04, 1.4168e-04, 1.1741e-04,\n 1.7436e-04, 2.2089e-04, 1.4951e-04, 1.3388e-04, 1.1310e-04, 1.3159e-04,\n 8.8906e-05, 1.0484e-04, 1.1186e-04, 1.2214e-04, 1.6313e-04, 1.2798e-04,\n 1.1798e-04, 1.5698e-04, 9.5005e-05, 1.4566e-04, 1.3568e-04, 1.2314e-04,\n 1.4403e-04, 2.3316e-04, 1.3406e-04, 1.0424e-04, 9.9949e-05, 9.2307e-05,\n 1.0515e-04, 1.5595e-04, 9.7020e-05, 1.3210e-04, 1.2769e-04, 2.4305e-04,\n 1.1027e-04, 1.7642e-04, 1.2912e-04, 1.0851e-04, 1.7292e-04, 1.8084e-04,\n 1.0380e-04, 1.2488e-04, 1.5836e-04, 1.1815e-04, 9.7291e-05, 1.0293e-04,\n 1.5490e-04, 1.2267e-04, 1.2926e-04, 1.7759e-04, 1.8104e-04, 1.3336e-04,\n 1.2224e-04, 2.4573e-04, 1.3035e-04, 1.0638e-04, 1.7288e-04, 2.1376e-04,\n 1.2714e-04, 1.5203e-04, 1.3508e-04, 2.0087e-04, 1.0833e-04, 2.2335e-04,\n 9.6232e-05, 2.0327e-04, 1.0331e-04, 1.9455e-04, 1.1878e-04, 1.1493e-04,\n 2.0433e-04, 1.7636e-04, 1.3180e-04, 1.3527e-04, 1.3676e-04, 1.0270e-04,\n 1.1883e-04, 1.1368e-04, 1.2805e-04, 1.1891e-04, 1.6220e-04, 1.2455e-04,\n 1.1407e-04, 9.5182e-05, 8.4393e-05, 1.2808e-04, 1.4889e-04, 1.6445e-04,\n 9.9863e-05, 1.8467e-04, 1.5592e-04, 1.7429e-04, 1.3614e-04, 1.5140e-04,\n 1.8024e-04, 1.1585e-04, 2.1083e-04, 1.2486e-04, 1.6011e-04, 1.1759e-04,\n 1.4532e-04, 1.0453e-04, 1.2250e-04, 1.2093e-04, 1.3837e-04, 8.4479e-05,\n 1.8112e-04, 1.0243e-04, 1.2245e-04, 1.2267e-04, 9.3212e-05, 7.8245e-05,\n 1.5809e-04, 1.1292e-04, 1.1268e-04, 7.9275e-05, 1.9621e-04, 1.5245e-04,\n 1.2435e-04, 1.1393e-04, 8.4688e-05, 1.4695e-04, 9.7378e-05, 2.0232e-04,\n 1.0383e-04, 1.7800e-04, 1.4327e-04, 2.1578e-04, 1.0945e-04, 9.2735e-05,\n 1.2897e-04, 1.2934e-04, 1.4422e-04, 9.2588e-05, 1.5003e-04, 1.8087e-04,\n 1.3970e-04, 1.0480e-04, 1.9953e-04, 8.8275e-05, 9.7254e-05, 1.3081e-04,\n 1.0098e-04, 1.0231e-04, 1.1759e-04, 1.4872e-04, 1.6157e-04, 1.0221e-04,\n 1.2619e-04, 1.4369e-04, 1.2637e-04, 1.5565e-04, 1.4342e-04, 1.6224e-04,\n 1.0167e-04, 1.4033e-04, 8.0997e-05, 1.1940e-04, 1.5674e-04, 1.5033e-04,\n 1.4426e-04, 1.4225e-04, 2.1080e-04, 1.3861e-04, 1.7826e-04, 1.2386e-04,\n 1.5484e-04, 1.9373e-04, 1.6261e-04, 1.3055e-04, 1.0951e-04, 1.2689e-04,\n 1.2895e-04, 1.1988e-04, 1.7875e-04, 1.0219e-04, 2.5556e-04, 1.2248e-04,\n 1.7413e-04, 1.4658e-04], device='cuda:0')"
24
  },
25
  "4": {
26
+ "step": "tensor(6260.)",
27
+ "exp_avg": "tensor([[-2.4307e-05, 9.4611e-05, 6.3634e-05, ..., 3.6809e-04,\n -7.1694e-04, -9.9097e-05],\n [-1.7877e-04, -7.8264e-05, -7.5887e-05, ..., 3.1284e-05,\n 1.0259e-03, -1.8599e-04],\n [ 2.0717e-04, 1.2593e-04, -2.2736e-04, ..., -3.5495e-04,\n 6.9710e-05, 3.2759e-04],\n ...,\n [ 2.0303e-04, 3.8214e-04, -3.1978e-04, ..., -1.8504e-04,\n 4.5403e-04, 5.4143e-04],\n [ 1.9841e-04, -1.7725e-04, 5.2030e-06, ..., -2.4801e-04,\n 6.9651e-04, 8.8638e-05],\n [ 1.2187e-04, 2.9725e-04, -1.7300e-05, ..., -1.1983e-04,\n 1.2005e-04, -4.0230e-05]], device='cuda:0')",
28
+ "exp_avg_sq": "tensor([[2.4906e-07, 7.0951e-07, 2.5918e-07, ..., 3.2336e-07, 5.3992e-07,\n 5.4305e-07],\n [6.7211e-07, 2.8950e-07, 1.1404e-06, ..., 1.0186e-06, 1.1489e-06,\n 6.5343e-07],\n [4.3169e-07, 3.1296e-07, 5.8489e-07, ..., 1.1070e-06, 8.3938e-07,\n 4.4997e-07],\n ...,\n [9.1299e-07, 3.5147e-07, 6.5943e-07, ..., 9.3078e-07, 1.3141e-06,\n 1.7089e-06],\n [5.3956e-07, 3.9846e-07, 7.0520e-07, ..., 7.1024e-07, 1.1042e-06,\n 1.1504e-06],\n [5.0558e-07, 5.8065e-07, 1.0803e-06, ..., 8.1991e-07, 1.4335e-06,\n 9.7408e-07]], device='cuda:0')"
29
  },
30
  "5": {
31
+ "step": "tensor(6260.)",
32
+ "exp_avg": "tensor([[-1.4470e-04, 3.1142e-05, 4.8491e-06, ..., 1.0279e-04,\n 4.4636e-05, 8.6155e-06],\n [-5.4609e-05, -6.5727e-05, -9.7730e-05, ..., -2.0548e-04,\n 4.1089e-04, -2.9224e-04],\n [ 9.0119e-05, 4.7032e-05, -1.0009e-04, ..., 6.4305e-05,\n -1.6036e-06, 2.2026e-04],\n ...,\n [-3.8610e-05, 9.9904e-05, -3.2030e-04, ..., -1.2563e-04,\n 1.8940e-04, 4.3564e-04],\n [-5.6906e-05, -3.2452e-06, -2.3419e-04, ..., 4.0425e-04,\n -1.0487e-04, -3.1641e-04],\n [-8.1440e-05, -2.7528e-04, -1.7591e-04, ..., 4.8396e-04,\n -1.0290e-04, 2.2857e-05]], device='cuda:0')",
33
+ "exp_avg_sq": "tensor([[7.8768e-08, 4.9331e-08, 1.0050e-07, ..., 1.7118e-07, 1.7352e-07,\n 9.5275e-08],\n [2.1355e-07, 9.0563e-08, 1.9602e-07, ..., 3.1747e-07, 2.9845e-07,\n 2.9380e-07],\n [1.5014e-07, 1.8703e-07, 2.2293e-07, ..., 3.7066e-07, 3.1937e-07,\n 1.6941e-07],\n ...,\n [2.4526e-07, 2.0357e-07, 3.2612e-07, ..., 2.5150e-07, 4.7541e-07,\n 4.0504e-07],\n [1.5069e-07, 2.9833e-07, 2.9376e-07, ..., 2.6648e-07, 3.7469e-07,\n 4.1035e-07],\n [2.0446e-07, 2.1553e-07, 3.8131e-07, ..., 4.3858e-07, 4.2578e-07,\n 2.2549e-07]], device='cuda:0')"
34
  },
35
  "6": {
36
+ "step": "tensor(6260.)",
37
+ "exp_avg": "tensor([ 0.0016, -0.0016], device='cuda:0')",
38
+ "exp_avg_sq": "tensor([9.3679e-06, 9.3679e-06], device='cuda:0')"
39
  }
40
  },
41
  "param_groups": [
42
  {
43
+ "lr": 0.0005005000000000001,
44
  "name": "shared",
45
  "betas": [
46
  0.9,
 
64
  ]
65
  },
66
  {
67
+ "lr": 0.0005005000000000001,
68
  "name": "scale_256",
69
  "betas": [
70
  0.9,
 
85
  ]
86
  },
87
  {
88
+ "lr": 0.0005005000000000001,
89
  "name": "scale_512",
90
  "betas": [
91
  0.9,
 
106
  ]
107
  },
108
  {
109
+ "lr": 0.0002505,
110
  "name": "fusion",
111
  "betas": [
112
  0.9,
 
133
  "T_i": 10,
134
  "T_mult": 2,
135
  "eta_min": 1e-06,
136
+ "T_cur": 5,
137
  "base_lrs": [
138
  0.001,
139
  0.001,
140
  0.001,
141
  0.0005
142
  ],
143
+ "last_epoch": 5,
144
  "_step_count": 0,
145
  "_is_initial": false,
146
  "_get_lr_called_within_step": false,
147
  "_last_lr": [
148
+ 0.0005005000000000001,
149
+ 0.0005005000000000001,
150
+ 0.0005005000000000001,
151
+ 0.0002505
152
  ]
153
  },
154
  "metrics": {
155
+ "best_val_acc": 71.096,
156
+ "best_epoch": 4,
157
  "scale_accuracies": {
158
+ "256": 70.456,
159
+ "512": 70.964
160
  }
161
  },
162
  "train_config": {