Upload weights and configs - David-decoupled-deep_efficiency - Run 20251012_065325
Browse files
weights/David-decoupled-deep_efficiency/20251012_065325/best_model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 59515088
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2f37bf4247645adf0df795b72b8f62941acd742446a82d070425620418d2292d
|
| 3 |
size 59515088
|
weights/David-decoupled-deep_efficiency/20251012_065325/best_model_metadata.json
CHANGED
|
@@ -1,26 +1,26 @@
|
|
| 1 |
{
|
| 2 |
-
"epoch":
|
| 3 |
"optimizer_state_dict": {
|
| 4 |
"state": {
|
| 5 |
"0": {
|
| 6 |
-
"step": "tensor(
|
| 7 |
-
"exp_avg": "tensor([[ 1.
|
| 8 |
-
"exp_avg_sq": "tensor([[1.
|
| 9 |
},
|
| 10 |
"1": {
|
| 11 |
-
"step": "tensor(
|
| 12 |
-
"exp_avg": "tensor([
|
| 13 |
-
"exp_avg_sq": "tensor([0.0019, 0.0019, 0.
|
| 14 |
},
|
| 15 |
"2": {
|
| 16 |
-
"step": "tensor(
|
| 17 |
-
"exp_avg": "tensor([[
|
| 18 |
-
"exp_avg_sq": "tensor([[
|
| 19 |
}
|
| 20 |
},
|
| 21 |
"param_groups": [
|
| 22 |
{
|
| 23 |
-
"lr": 0.
|
| 24 |
"name": "scale_256",
|
| 25 |
"betas": [
|
| 26 |
0.9,
|
|
@@ -43,7 +43,7 @@
|
|
| 43 |
]
|
| 44 |
},
|
| 45 |
{
|
| 46 |
-
"lr": 0.
|
| 47 |
"name": "scale_512",
|
| 48 |
"betas": [
|
| 49 |
0.9,
|
|
@@ -66,7 +66,7 @@
|
|
| 66 |
]
|
| 67 |
},
|
| 68 |
{
|
| 69 |
-
"lr": 0.
|
| 70 |
"name": "scale_768",
|
| 71 |
"betas": [
|
| 72 |
0.9,
|
|
@@ -89,7 +89,7 @@
|
|
| 89 |
]
|
| 90 |
},
|
| 91 |
{
|
| 92 |
-
"lr": 0.
|
| 93 |
"name": "scale_1024",
|
| 94 |
"betas": [
|
| 95 |
0.9,
|
|
@@ -112,7 +112,7 @@
|
|
| 112 |
]
|
| 113 |
},
|
| 114 |
{
|
| 115 |
-
"lr": 0.
|
| 116 |
"name": "scale_1280",
|
| 117 |
"betas": [
|
| 118 |
0.9,
|
|
@@ -135,7 +135,7 @@
|
|
| 135 |
]
|
| 136 |
},
|
| 137 |
{
|
| 138 |
-
"lr": 0.
|
| 139 |
"name": "fusion",
|
| 140 |
"betas": [
|
| 141 |
0.9,
|
|
@@ -195,7 +195,7 @@
|
|
| 195 |
"T_i": 10,
|
| 196 |
"T_mult": 2,
|
| 197 |
"eta_min": 1e-06,
|
| 198 |
-
"T_cur":
|
| 199 |
"base_lrs": [
|
| 200 |
0.001,
|
| 201 |
0.001,
|
|
@@ -204,24 +204,24 @@
|
|
| 204 |
0.001,
|
| 205 |
0.0005
|
| 206 |
],
|
| 207 |
-
"last_epoch":
|
| 208 |
"_step_count": 0,
|
| 209 |
"_is_initial": false,
|
| 210 |
"_get_lr_called_within_step": false,
|
| 211 |
"_last_lr": [
|
| 212 |
-
0.
|
| 213 |
-
0.
|
| 214 |
-
0.
|
| 215 |
-
0.
|
| 216 |
-
0.
|
| 217 |
-
0.
|
| 218 |
]
|
| 219 |
},
|
| 220 |
"metrics": {
|
| 221 |
-
"best_val_acc":
|
| 222 |
-
"best_epoch":
|
| 223 |
"scale_accuracies": {
|
| 224 |
-
"256":
|
| 225 |
}
|
| 226 |
},
|
| 227 |
"train_config": {
|
|
|
|
| 1 |
{
|
| 2 |
+
"epoch": 1,
|
| 3 |
"optimizer_state_dict": {
|
| 4 |
"state": {
|
| 5 |
"0": {
|
| 6 |
+
"step": "tensor(2504.)",
|
| 7 |
+
"exp_avg": "tensor([[ 1.9903e-04, -2.0316e-03, 4.0099e-04, ..., 3.9600e-04,\n -7.7503e-05, -3.2745e-04],\n [ 1.2035e-04, -5.4277e-04, 8.3932e-04, ..., -6.4219e-05,\n -1.1444e-04, 2.8184e-04],\n [-6.7256e-05, 9.3359e-04, -1.2770e-04, ..., 2.4264e-04,\n -4.6260e-04, -2.6548e-04],\n ...,\n [-9.3872e-06, -3.3246e-04, -1.0106e-04, ..., -6.8116e-05,\n -1.0831e-05, -4.9642e-04],\n [-1.2853e-03, -3.1639e-03, 1.6793e-03, ..., 8.5221e-04,\n 2.0776e-04, -5.3517e-04],\n [-6.0768e-04, -1.0425e-03, 2.5003e-04, ..., 1.3259e-04,\n -6.0654e-05, -1.6917e-04]], device='cuda:0')",
|
| 8 |
+
"exp_avg_sq": "tensor([[1.4933e-06, 1.3383e-05, 4.9550e-06, ..., 2.0071e-06, 1.0758e-06,\n 1.6587e-06],\n [3.3611e-06, 9.2764e-06, 9.0210e-06, ..., 2.5916e-06, 9.1690e-07,\n 1.3613e-06],\n [2.5602e-06, 1.6735e-05, 6.9803e-06, ..., 1.5625e-06, 1.0142e-06,\n 1.3210e-06],\n ...,\n [4.2617e-06, 3.2869e-05, 9.4941e-06, ..., 2.8932e-06, 1.9778e-06,\n 1.9807e-06],\n [2.4394e-06, 2.4098e-05, 7.0105e-06, ..., 1.8268e-06, 1.1096e-06,\n 1.5990e-06],\n [2.7173e-06, 1.4306e-05, 5.9305e-06, ..., 1.5879e-06, 1.2643e-06,\n 3.5216e-06]], device='cuda:0')"
|
| 9 |
},
|
| 10 |
"1": {
|
| 11 |
+
"step": "tensor(2504.)",
|
| 12 |
+
"exp_avg": "tensor([ 3.7015e-04, -2.3370e-03, 9.0641e-03, 4.4973e-03, -1.0452e-02,\n 4.3782e-03, -2.0823e-03, -7.3727e-03, -1.1328e-02, -1.8645e-02,\n 2.3319e-02, -7.7803e-03, -4.1483e-03, -1.0812e-02, -1.3694e-02,\n -4.7227e-03, -1.9605e-02, 4.1987e-02, -1.3836e-02, 1.3592e-02,\n -2.3378e-03, -1.4993e-02, -1.2426e-03, 5.2254e-03, -4.8466e-04,\n 5.3871e-03, 3.2941e-03, -3.5580e-03, -4.2602e-03, -7.9428e-03,\n 1.6526e-02, 2.7316e-03, 1.9632e-02, -1.4506e-02, -7.1378e-03,\n -8.1808e-03, 9.0706e-04, -5.7208e-03, 8.3405e-03, -1.1962e-02,\n 2.1529e-03, 2.7002e-03, -9.5559e-03, 2.5858e-03, 1.9019e-02,\n 1.6488e-02, 1.7670e-02, -1.1011e-02, -4.5329e-03, -3.7018e-02,\n 3.7496e-03, 2.4826e-02, 4.9099e-03, -1.8235e-02, 1.4793e-02,\n -2.6602e-02, -1.4454e-02, 1.8537e-02, 4.2614e-04, 8.5051e-03,\n -4.6100e-04, 7.5454e-03, -8.1947e-03, 6.6934e-03, -5.2298e-03,\n 3.7937e-03, 4.4811e-03, 1.1742e-02, -1.3882e-02, -5.8893e-03,\n -2.5940e-03, -1.0937e-02, -4.5452e-03, -1.7575e-02, -3.3608e-03,\n -1.0778e-02, 1.4423e-02, 2.1711e-03, -8.6503e-03, -3.9028e-02,\n -6.9429e-03, 1.0434e-02, -8.4117e-03, -2.5737e-03, -1.9437e-02,\n 1.2141e-02, -8.9491e-03, -1.5660e-02, -7.8207e-03, 2.7758e-03,\n 2.4170e-03, 1.1981e-02, -1.7890e-02, 1.9754e-03, -1.0491e-02,\n -1.7669e-03, -7.6529e-03, 1.7853e-02, -6.1149e-03, 2.9477e-04,\n 2.0961e-02, -2.3410e-02, 1.0970e-02, 1.1934e-02, 2.4891e-03,\n 4.3455e-02, 3.5481e-03, 7.4252e-03, 1.1450e-02, 1.5432e-02,\n -1.8916e-04, -1.9861e-02, 1.5046e-03, -1.1228e-02, -2.7466e-02,\n -6.5935e-04, 6.0407e-03, 3.5843e-03, 6.4985e-03, -5.6037e-03,\n -7.3331e-03, -1.8326e-02, -6.3276e-03, -1.0016e-03, 1.8660e-02,\n 1.3386e-02, 6.2620e-03, 7.7024e-03, -9.7012e-03, 1.3455e-03,\n -2.2261e-03, 1.1020e-03, 5.5393e-03, -4.2593e-03, 1.7430e-02,\n -2.3933e-02, -2.5678e-02, 1.1107e-02, -2.3952e-03, -2.0671e-02,\n 5.0374e-03, 3.1478e-02, -1.2650e-02, 2.3486e-02, -4.7556e-03,\n 2.5522e-03, 2.1172e-03, -1.3519e-02, -2.7345e-03, -1.8219e-02,\n 3.2386e-03, 2.6787e-03, -3.7405e-02, 2.0377e-03, 2.2786e-02,\n -3.7128e-05, -3.9497e-02, 5.3251e-03, 1.3003e-02, 6.6501e-03,\n -3.2034e-02, 3.6701e-02, -2.2223e-04, 1.2996e-02, 1.0601e-02,\n -1.9193e-03, 8.2985e-03, 9.2626e-04, 1.8440e-03, 7.9549e-03,\n 9.4247e-03, 1.7267e-02, -6.2791e-03, 3.8940e-03, 2.0544e-03,\n 1.3940e-03, -1.1052e-02, -8.3617e-03, 7.2351e-03, 4.1323e-03,\n 6.8777e-04, -2.0998e-02, -1.0373e-03, -4.6615e-03, -1.3763e-02,\n -1.1012e-03, -2.8058e-02, 3.5221e-03, 2.3242e-03, -3.7730e-02,\n 4.1052e-03, 9.4342e-03, 7.4152e-03, 2.3496e-02, -3.4740e-03,\n 3.7744e-03, -3.1437e-02, -2.9619e-03, 1.0581e-02, -2.4242e-02,\n -2.8182e-03, 5.5457e-03, -1.0421e-02, 8.6784e-03, -2.8856e-03,\n 5.0659e-04, 9.8441e-03, -3.0326e-04, 3.0359e-03, -9.8104e-03,\n -9.9844e-03, 1.4239e-02, -2.5225e-02, 1.0159e-03, -1.2108e-02,\n 7.0868e-03, -1.2549e-02, 1.4220e-02, 4.4437e-03, 2.0620e-02,\n -2.7853e-03, 2.3273e-02, 9.1179e-03, -1.7696e-02, 1.1397e-02,\n 2.5824e-02, -4.4603e-03, -2.1303e-02, 1.3596e-02, 1.6398e-02,\n 8.5609e-03, -4.6444e-04, 1.5405e-02, 1.8042e-02, -1.0500e-02,\n -6.6665e-02, 1.2047e-02, 2.0606e-02, 2.1219e-02, 1.1406e-02,\n 3.6286e-02, -2.8446e-03, -6.4342e-03, -8.0879e-03, 1.0519e-02,\n 4.8636e-03, -3.1575e-02, 2.8921e-02, 1.4505e-02, -5.5999e-03,\n -6.3928e-03, 1.8554e-03, 1.4512e-02, 4.0229e-03, -3.3347e-02,\n -8.0840e-03, 4.7516e-03, 7.2561e-03, 8.3234e-03, 3.6309e-02,\n -2.2225e-02, -3.1745e-03, -1.3161e-02, 2.3942e-03, -9.7760e-03,\n 4.1599e-03, -5.9595e-03, 8.3747e-03, 7.7639e-03, -7.7427e-03,\n 6.2609e-03, -9.3417e-04, -2.5982e-02, 3.1943e-02, -8.4646e-04,\n 1.3606e-02, 2.8375e-03, -1.2618e-02, 1.3730e-02, -5.0016e-03,\n -1.3591e-02, -5.3509e-03, -1.8622e-02, 1.0042e-02, 1.2241e-03,\n 2.0266e-02, 8.7766e-03, 5.2801e-03, -1.1249e-02, -9.1190e-03,\n 1.8848e-02, 3.4133e-03, 1.9920e-02, 1.5360e-02, -8.1308e-03,\n 9.7479e-03, 2.5615e-03, 3.2904e-04, 5.3236e-03, 1.1275e-02,\n -2.3847e-02, 8.8524e-03, 4.7067e-03, -1.2748e-03, 8.6914e-03,\n 1.6651e-02, 1.2849e-02, 9.0641e-03, 4.8100e-03, 1.8057e-02,\n 6.7364e-03, -1.6841e-03, -1.8297e-02, -3.9983e-03, -1.5536e-02,\n 4.5254e-03, -1.3754e-02, 5.4797e-03, -1.3434e-02, -2.5416e-02,\n 3.6965e-02, 1.0310e-02, -1.0124e-04, 1.7364e-03, -1.0163e-02,\n 1.5583e-02, -3.6903e-03, 2.0873e-02, 8.7366e-03, -3.0092e-02,\n -2.1265e-02, 3.1959e-03, -3.2141e-02, -2.7559e-02, 1.4039e-02,\n 7.3270e-03, -2.5510e-03, 1.8156e-03, 4.2029e-02, 3.1559e-03,\n 3.0051e-02, 4.4247e-03, 6.7175e-03, -1.3601e-02, 2.0102e-03,\n -4.3502e-03, -4.1042e-02, 2.7482e-03, 3.8990e-03, 6.0767e-03,\n -1.8549e-03, 4.3223e-03, 1.2431e-03, 2.5267e-03, 2.1141e-02,\n -5.4905e-03, -1.9051e-02, -2.0751e-03, 2.4948e-03, -1.0516e-02,\n -9.1798e-04, 4.7818e-03, -2.6325e-03, -1.2754e-02, 9.3676e-03,\n 5.5414e-03, 2.0135e-02, -3.3297e-03, -6.5511e-04, -1.5180e-02,\n -6.2350e-02, -2.2458e-02, -4.0152e-03, 1.8771e-02, -2.8697e-03,\n 2.4316e-03, -4.5374e-03, 1.2434e-02, 2.1114e-02, 1.2682e-02,\n 3.0717e-02, 8.1329e-03, 1.7098e-02, 1.1113e-02, -9.7007e-03,\n -3.2172e-03, -9.4604e-03, 1.8473e-03, -1.1092e-02, -9.0469e-04,\n 9.9962e-03, -3.0490e-02, 3.8586e-02, -5.0345e-03, -2.7900e-02,\n 1.4848e-02, 3.8165e-02, 1.9578e-02, -1.4309e-02, 8.1076e-03,\n 4.0688e-03, -1.8150e-02, -1.8551e-02, -6.9978e-03, 7.6080e-03,\n 2.3558e-02, -9.7192e-03, -2.5298e-03, -9.8672e-03, 2.0012e-02,\n 3.3717e-03, 1.5531e-02, -2.3598e-03, -1.4062e-02, 1.8739e-03,\n -6.2653e-04, -1.0313e-02, -1.6515e-03, -3.5710e-03, -1.7260e-02,\n 5.1800e-04, 1.8365e-02, 2.4575e-02, -9.3078e-03, 1.1834e-02,\n 2.6459e-02, 2.3392e-02, -1.8705e-02, -7.9415e-03, -5.7631e-03,\n 2.8511e-02, 1.7752e-02, -1.0011e-02, 7.0031e-03, -2.5317e-02,\n 1.1355e-02, 2.3412e-02, -7.0986e-03, -5.8811e-03, 1.9290e-03,\n -1.0360e-02, -6.3055e-03, -9.6267e-03, 1.4141e-02, 1.8005e-03,\n -1.4323e-02, 1.3786e-02, 1.5624e-02, 1.7800e-02, -1.3349e-02,\n -8.3177e-03, 2.5931e-02, -3.0994e-04, 1.6163e-02, 8.3758e-04,\n 1.1851e-02, 1.8527e-02, 2.5990e-02, 1.1613e-02, -3.6058e-02,\n 3.0730e-03, -1.3725e-02, 2.1578e-03, -1.0197e-02, -2.6884e-02,\n 3.8387e-03, -2.2237e-02, 1.1961e-02, -5.8919e-03, 2.2816e-02,\n 2.4111e-04, -2.4864e-02, -1.2242e-02, -1.0923e-02, -2.8317e-03,\n 5.0746e-04, 1.7315e-02, 2.0425e-03, 6.3374e-03, -6.5011e-03,\n 4.1144e-03, -2.4692e-02, 2.1480e-02, 4.0464e-06, 1.4859e-02,\n -1.8319e-02, 8.1660e-03, -3.7029e-03, 1.8128e-03, -2.7395e-02,\n 1.5815e-02, -4.2541e-03, 2.0555e-03, -1.3953e-02, 7.0785e-04,\n 1.4946e-02, 2.7037e-03, 1.4192e-02, 1.0791e-02, 1.2503e-02,\n 5.7559e-04, -7.3741e-03, -1.0589e-02, 1.2760e-02, 5.7868e-03,\n 7.7232e-03, -1.2102e-02, 1.5461e-02, -2.9322e-02, -3.7516e-02,\n 1.9406e-02, 3.7544e-03, -4.9696e-03, 1.7453e-02, 1.9470e-02,\n 1.9318e-02, 1.2881e-03, 2.6887e-02, -2.3501e-03, -7.0118e-03,\n -1.3360e-02, 1.2180e-03, 4.9717e-03, 3.3087e-02, -1.6251e-02,\n -1.9534e-02, 7.5200e-03, -1.0589e-02, 6.5200e-04, 1.7015e-02,\n 8.2721e-03, 1.4412e-02, -1.6038e-03, 7.1778e-03, 5.6243e-04,\n 3.3249e-03, -3.6018e-03, 1.9255e-02, -1.3330e-03, -5.6798e-03,\n -1.0747e-02, -1.0796e-02, -1.4548e-02, 1.9716e-03, -8.7362e-02,\n 1.7665e-02, 1.8212e-02, -4.2831e-03, 8.6517e-03, 2.0562e-02,\n 5.7245e-03, 1.3288e-04, -3.1388e-02, -7.4862e-03, 1.2812e-05,\n 5.4817e-03, 1.6561e-02, -3.5099e-05, 1.4302e-02, 5.5100e-03,\n 8.0109e-03, -2.0828e-02, 2.6218e-03, 5.5258e-03, 8.2771e-03,\n 4.3478e-03, 1.7280e-02, 3.8516e-05, 5.3053e-04, 2.4896e-02,\n -2.4664e-02, -7.6390e-03, 2.5688e-03, -2.9710e-03, -4.1264e-03,\n -1.6960e-03, 2.2620e-03, 2.5374e-02, 1.3910e-02, -8.4825e-04,\n 1.4985e-03, 1.0969e-04, 4.4948e-03, 1.8173e-02, -2.7873e-02,\n -1.3119e-02, 2.2612e-02, 1.1584e-02, -1.7831e-03, 1.9717e-02,\n -2.0277e-04, 1.6129e-02, 1.1356e-02, -8.4536e-03, 1.0369e-02,\n -2.4749e-02, -6.5893e-03, 4.1463e-04, -8.3810e-04, 1.1518e-02,\n -2.2795e-02, -3.3748e-02, 9.6555e-03, 1.1948e-02, -1.4417e-02,\n 7.2138e-03, -4.5353e-03, -4.5611e-04, 8.8891e-03, 4.3160e-03,\n 3.8857e-03, -3.4371e-02, -7.1428e-03, -8.5142e-03, -4.9979e-03,\n 3.3383e-02, -2.1196e-02, -1.6020e-03, 1.4625e-02, 8.6971e-03,\n -1.3028e-02, -6.6353e-03, 1.2731e-02, 5.4896e-03, -1.0384e-02,\n 8.6397e-03, -4.2818e-04, -8.7563e-03, 9.3405e-03, 5.3446e-03,\n 9.2650e-03, -1.1889e-02, 3.1683e-03, -1.6852e-02, -1.5115e-02,\n -1.8536e-02, -7.4602e-03, -1.6525e-03, -2.8242e-02, -1.4293e-02],\n device='cuda:0')",
|
| 13 |
+
"exp_avg_sq": "tensor([0.0019, 0.0019, 0.0018, 0.0019, 0.0023, 0.0023, 0.0012, 0.0018, 0.0022,\n 0.0023, 0.0031, 0.0029, 0.0029, 0.0029, 0.0016, 0.0019, 0.0020, 0.0029,\n 0.0016, 0.0025, 0.0023, 0.0020, 0.0020, 0.0027, 0.0020, 0.0029, 0.0042,\n 0.0022, 0.0027, 0.0025, 0.0019, 0.0022, 0.0032, 0.0025, 0.0022, 0.0019,\n 0.0018, 0.0021, 0.0029, 0.0020, 0.0022, 0.0014, 0.0024, 0.0021, 0.0020,\n 0.0026, 0.0025, 0.0022, 0.0022, 0.0019, 0.0021, 0.0019, 0.0020, 0.0024,\n 0.0024, 0.0026, 0.0040, 0.0021, 0.0027, 0.0020, 0.0021, 0.0025, 0.0023,\n 0.0031, 0.0029, 0.0021, 0.0033, 0.0028, 0.0025, 0.0024, 0.0031, 0.0018,\n 0.0031, 0.0029, 0.0020, 0.0022, 0.0020, 0.0017, 0.0019, 0.0023, 0.0020,\n 0.0020, 0.0018, 0.0025, 0.0018, 0.0019, 0.0018, 0.0026, 0.0023, 0.0021,\n 0.0023, 0.0034, 0.0023, 0.0017, 0.0026, 0.0021, 0.0019, 0.0020, 0.0018,\n 0.0024, 0.0024, 0.0017, 0.0021, 0.0018, 0.0021, 0.0028, 0.0019, 0.0021,\n 0.0034, 0.0023, 0.0025, 0.0023, 0.0019, 0.0023, 0.0021, 0.0020, 0.0024,\n 0.0023, 0.0020, 0.0036, 0.0027, 0.0030, 0.0019, 0.0020, 0.0025, 0.0025,\n 0.0040, 0.0021, 0.0021, 0.0020, 0.0023, 0.0035, 0.0026, 0.0022, 0.0022,\n 0.0021, 0.0020, 0.0021, 0.0027, 0.0032, 0.0022, 0.0024, 0.0027, 0.0025,\n 0.0025, 0.0021, 0.0017, 0.0023, 0.0023, 0.0017, 0.0022, 0.0020, 0.0033,\n 0.0034, 0.0025, 0.0026, 0.0029, 0.0019, 0.0023, 0.0025, 0.0025, 0.0034,\n 0.0027, 0.0027, 0.0024, 0.0023, 0.0017, 0.0027, 0.0028, 0.0029, 0.0015,\n 0.0017, 0.0019, 0.0020, 0.0028, 0.0029, 0.0025, 0.0019, 0.0017, 0.0021,\n 0.0031, 0.0024, 0.0023, 0.0019, 0.0018, 0.0021, 0.0025, 0.0021, 0.0029,\n 0.0032, 0.0022, 0.0028, 0.0021, 0.0025, 0.0019, 0.0020, 0.0019, 0.0027,\n 0.0022, 0.0025, 0.0022, 0.0025, 0.0033, 0.0037, 0.0024, 0.0021, 0.0027,\n 0.0022, 0.0023, 0.0024, 0.0023, 0.0016, 0.0022, 0.0034, 0.0022, 0.0035,\n 0.0021, 0.0023, 0.0021, 0.0028, 0.0023, 0.0025, 0.0017, 0.0025, 0.0020,\n 0.0020, 0.0030, 0.0021, 0.0027, 0.0023, 0.0024, 0.0023, 0.0026, 0.0020,\n 0.0024, 0.0031, 0.0021, 0.0028, 0.0021, 0.0027, 0.0022, 0.0022, 0.0021,\n 0.0029, 0.0028, 0.0023, 0.0030, 0.0027, 0.0023, 0.0025, 0.0021, 0.0019,\n 0.0036, 0.0028, 0.0021, 0.0022, 0.0025, 0.0020, 0.0018, 0.0022, 0.0019,\n 0.0023, 0.0017, 0.0032, 0.0029, 0.0023, 0.0019, 0.0016, 0.0021, 0.0018,\n 0.0024, 0.0042, 0.0022, 0.0021, 0.0019, 0.0022, 0.0020, 0.0019, 0.0023,\n 0.0020, 0.0023, 0.0029, 0.0033, 0.0027, 0.0021, 0.0024, 0.0023, 0.0020,\n 0.0031, 0.0024, 0.0020, 0.0018, 0.0019, 0.0017, 0.0022, 0.0027, 0.0023,\n 0.0019, 0.0034, 0.0025, 0.0022, 0.0022, 0.0028, 0.0018, 0.0021, 0.0026,\n 0.0021, 0.0023, 0.0020, 0.0023, 0.0021, 0.0022, 0.0015, 0.0030, 0.0035,\n 0.0025, 0.0025, 0.0024, 0.0021, 0.0021, 0.0023, 0.0031, 0.0023, 0.0022,\n 0.0026, 0.0025, 0.0027, 0.0025, 0.0029, 0.0020, 0.0039, 0.0020, 0.0030,\n 0.0022, 0.0036, 0.0030, 0.0021, 0.0020, 0.0034, 0.0024, 0.0025, 0.0023,\n 0.0019, 0.0024, 0.0029, 0.0027, 0.0020, 0.0021, 0.0024, 0.0026, 0.0018,\n 0.0023, 0.0040, 0.0026, 0.0028, 0.0024, 0.0026, 0.0023, 0.0020, 0.0024,\n 0.0017, 0.0019, 0.0019, 0.0024, 0.0031, 0.0028, 0.0028, 0.0032, 0.0021,\n 0.0029, 0.0028, 0.0032, 0.0021, 0.0028, 0.0029, 0.0030, 0.0029, 0.0028,\n 0.0020, 0.0023, 0.0033, 0.0023, 0.0022, 0.0021, 0.0023, 0.0021, 0.0029,\n 0.0025, 0.0022, 0.0023, 0.0021, 0.0028, 0.0024, 0.0028, 0.0022, 0.0022,\n 0.0021, 0.0025, 0.0024, 0.0041, 0.0020, 0.0025, 0.0024, 0.0024, 0.0023,\n 0.0028, 0.0037, 0.0020, 0.0023, 0.0022, 0.0039, 0.0027, 0.0032, 0.0021,\n 0.0023, 0.0018, 0.0020, 0.0018, 0.0020, 0.0019, 0.0032, 0.0022, 0.0026,\n 0.0029, 0.0019, 0.0022, 0.0027, 0.0027, 0.0021, 0.0035, 0.0022, 0.0024,\n 0.0014, 0.0024, 0.0027, 0.0022, 0.0027, 0.0024, 0.0028, 0.0032, 0.0019,\n 0.0019, 0.0018, 0.0031, 0.0033, 0.0025, 0.0027, 0.0026, 0.0020, 0.0030,\n 0.0038, 0.0019, 0.0021, 0.0027, 0.0026, 0.0020, 0.0025, 0.0029, 0.0028,\n 0.0020, 0.0022, 0.0020, 0.0022, 0.0021, 0.0026, 0.0020, 0.0025, 0.0027,\n 0.0018, 0.0024, 0.0024, 0.0028, 0.0016, 0.0035, 0.0020, 0.0029, 0.0027,\n 0.0017, 0.0021, 0.0022, 0.0036, 0.0017, 0.0026, 0.0026, 0.0024, 0.0024,\n 0.0023, 0.0022, 0.0021, 0.0021, 0.0019, 0.0035, 0.0017, 0.0021, 0.0022,\n 0.0020, 0.0024, 0.0019, 0.0033, 0.0020, 0.0020, 0.0021, 0.0019, 0.0024,\n 0.0022, 0.0025, 0.0026, 0.0025, 0.0023, 0.0028, 0.0023, 0.0027, 0.0016,\n 0.0026, 0.0015, 0.0028, 0.0019, 0.0023, 0.0020, 0.0024, 0.0029, 0.0020,\n 0.0021, 0.0019, 0.0026, 0.0024, 0.0018, 0.0021, 0.0024, 0.0025, 0.0024,\n 0.0018, 0.0016, 0.0020, 0.0028, 0.0022, 0.0025, 0.0023, 0.0018, 0.0026,\n 0.0020, 0.0023, 0.0022, 0.0022, 0.0034, 0.0025, 0.0020, 0.0025, 0.0017,\n 0.0015, 0.0026, 0.0024, 0.0023, 0.0023, 0.0020, 0.0023, 0.0024, 0.0025,\n 0.0024, 0.0022, 0.0026, 0.0024, 0.0018, 0.0027, 0.0019, 0.0021, 0.0020,\n 0.0017, 0.0035, 0.0027, 0.0022, 0.0027, 0.0024, 0.0021, 0.0029, 0.0024,\n 0.0022, 0.0038, 0.0018, 0.0031, 0.0025, 0.0032, 0.0029, 0.0024, 0.0020,\n 0.0024, 0.0029, 0.0019, 0.0020, 0.0029, 0.0020, 0.0036, 0.0029, 0.0024,\n 0.0020, 0.0023, 0.0019, 0.0024, 0.0024, 0.0021, 0.0018, 0.0023, 0.0031,\n 0.0024, 0.0019, 0.0021, 0.0023, 0.0021, 0.0025, 0.0023, 0.0023, 0.0026,\n 0.0018, 0.0029, 0.0031, 0.0019, 0.0050, 0.0022, 0.0032, 0.0021, 0.0031,\n 0.0022, 0.0020, 0.0024, 0.0019, 0.0024, 0.0027, 0.0013, 0.0024, 0.0025,\n 0.0024, 0.0034, 0.0020, 0.0028, 0.0028, 0.0022, 0.0027, 0.0027, 0.0021,\n 0.0022], device='cuda:0')"
|
| 14 |
},
|
| 15 |
"2": {
|
| 16 |
+
"step": "tensor(2504.)",
|
| 17 |
+
"exp_avg": "tensor([[ 3.3157e-05, 9.0172e-05, 8.2628e-05, ..., 5.1896e-05,\n 9.1822e-05, -2.2610e-04],\n [-4.5172e-04, -1.2079e-04, 1.8322e-04, ..., -3.3412e-05,\n 1.8097e-04, 1.7297e-04],\n [ 4.6973e-04, -8.3150e-05, -9.6866e-04, ..., -3.8514e-05,\n 1.4621e-04, -6.8942e-05],\n ...,\n [-5.8888e-04, -3.6048e-04, -3.6673e-05, ..., -1.5665e-05,\n -4.0896e-04, 5.4799e-04],\n [-1.2193e-03, -3.9815e-04, 3.8778e-04, ..., -5.7737e-05,\n -7.0575e-05, 2.8701e-05],\n [ 1.0101e-04, 1.1042e-04, 2.3041e-04, ..., 1.5737e-05,\n -3.5228e-04, -4.9031e-05]], device='cuda:0')",
|
| 18 |
+
"exp_avg_sq": "tensor([[8.4538e-07, 6.2770e-07, 8.0637e-07, ..., 3.5103e-07, 8.9550e-07,\n 1.4680e-06],\n [1.2847e-06, 1.6966e-06, 1.4330e-06, ..., 9.8359e-07, 2.4769e-06,\n 2.1182e-06],\n [1.5711e-06, 1.8740e-06, 1.7353e-06, ..., 1.0199e-06, 1.4728e-06,\n 1.2872e-06],\n ...,\n [1.6384e-06, 1.4097e-06, 1.7026e-06, ..., 1.1115e-06, 1.9571e-06,\n 3.8118e-06],\n [1.8098e-06, 2.3717e-06, 1.8668e-06, ..., 8.7579e-07, 1.8769e-06,\n 1.9211e-06],\n [2.0767e-06, 8.3075e-07, 2.4246e-06, ..., 1.2058e-06, 1.8157e-06,\n 2.2155e-06]], device='cuda:0')"
|
| 19 |
}
|
| 20 |
},
|
| 21 |
"param_groups": [
|
| 22 |
{
|
| 23 |
+
"lr": 0.0009046039886902864,
|
| 24 |
"name": "scale_256",
|
| 25 |
"betas": [
|
| 26 |
0.9,
|
|
|
|
| 43 |
]
|
| 44 |
},
|
| 45 |
{
|
| 46 |
+
"lr": 0.0009046039886902864,
|
| 47 |
"name": "scale_512",
|
| 48 |
"betas": [
|
| 49 |
0.9,
|
|
|
|
| 66 |
]
|
| 67 |
},
|
| 68 |
{
|
| 69 |
+
"lr": 0.0009046039886902864,
|
| 70 |
"name": "scale_768",
|
| 71 |
"betas": [
|
| 72 |
0.9,
|
|
|
|
| 89 |
]
|
| 90 |
},
|
| 91 |
{
|
| 92 |
+
"lr": 0.0009046039886902864,
|
| 93 |
"name": "scale_1024",
|
| 94 |
"betas": [
|
| 95 |
0.9,
|
|
|
|
| 112 |
]
|
| 113 |
},
|
| 114 |
{
|
| 115 |
+
"lr": 0.0009046039886902864,
|
| 116 |
"name": "scale_1280",
|
| 117 |
"betas": [
|
| 118 |
0.9,
|
|
|
|
| 135 |
]
|
| 136 |
},
|
| 137 |
{
|
| 138 |
+
"lr": 0.0004523497400965494,
|
| 139 |
"name": "fusion",
|
| 140 |
"betas": [
|
| 141 |
0.9,
|
|
|
|
| 195 |
"T_i": 10,
|
| 196 |
"T_mult": 2,
|
| 197 |
"eta_min": 1e-06,
|
| 198 |
+
"T_cur": 2,
|
| 199 |
"base_lrs": [
|
| 200 |
0.001,
|
| 201 |
0.001,
|
|
|
|
| 204 |
0.001,
|
| 205 |
0.0005
|
| 206 |
],
|
| 207 |
+
"last_epoch": 2,
|
| 208 |
"_step_count": 0,
|
| 209 |
"_is_initial": false,
|
| 210 |
"_get_lr_called_within_step": false,
|
| 211 |
"_last_lr": [
|
| 212 |
+
0.0009046039886902864,
|
| 213 |
+
0.0009046039886902864,
|
| 214 |
+
0.0009046039886902864,
|
| 215 |
+
0.0009046039886902864,
|
| 216 |
+
0.0009046039886902864,
|
| 217 |
+
0.0004523497400965494
|
| 218 |
]
|
| 219 |
},
|
| 220 |
"metrics": {
|
| 221 |
+
"best_val_acc": 71.226,
|
| 222 |
+
"best_epoch": 1,
|
| 223 |
"scale_accuracies": {
|
| 224 |
+
"256": 71.226
|
| 225 |
}
|
| 226 |
},
|
| 227 |
"train_config": {
|