Upload weights and configs - Run 20251012_032356
Browse files
weights/best_model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 59515088
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e3b0c800988cf782b1b9980bc9ac31f9de8953dc7f0e37707281a8e81c83c521
|
| 3 |
size 59515088
|
weights/best_model_metadata.json
CHANGED
|
@@ -1,26 +1,26 @@
|
|
| 1 |
{
|
| 2 |
-
"epoch":
|
| 3 |
"optimizer_state_dict": {
|
| 4 |
"state": {
|
| 5 |
"0": {
|
| 6 |
-
"step": "tensor(
|
| 7 |
-
"exp_avg": "tensor([[
|
| 8 |
-
"exp_avg_sq": "tensor([[
|
| 9 |
},
|
| 10 |
"1": {
|
| 11 |
-
"step": "tensor(
|
| 12 |
-
"exp_avg": "tensor([
|
| 13 |
-
"exp_avg_sq": "tensor([
|
| 14 |
},
|
| 15 |
"2": {
|
| 16 |
-
"step": "tensor(
|
| 17 |
-
"exp_avg": "tensor([[
|
| 18 |
-
"exp_avg_sq": "tensor([[
|
| 19 |
}
|
| 20 |
},
|
| 21 |
"param_groups": [
|
| 22 |
{
|
| 23 |
-
"lr": 0.
|
| 24 |
"name": "scale_256",
|
| 25 |
"betas": [
|
| 26 |
0.9,
|
|
@@ -43,7 +43,7 @@
|
|
| 43 |
]
|
| 44 |
},
|
| 45 |
{
|
| 46 |
-
"lr": 0.
|
| 47 |
"name": "scale_512",
|
| 48 |
"betas": [
|
| 49 |
0.9,
|
|
@@ -66,7 +66,7 @@
|
|
| 66 |
]
|
| 67 |
},
|
| 68 |
{
|
| 69 |
-
"lr": 0.
|
| 70 |
"name": "scale_768",
|
| 71 |
"betas": [
|
| 72 |
0.9,
|
|
@@ -89,7 +89,7 @@
|
|
| 89 |
]
|
| 90 |
},
|
| 91 |
{
|
| 92 |
-
"lr": 0.
|
| 93 |
"name": "scale_1024",
|
| 94 |
"betas": [
|
| 95 |
0.9,
|
|
@@ -112,7 +112,7 @@
|
|
| 112 |
]
|
| 113 |
},
|
| 114 |
{
|
| 115 |
-
"lr": 0.
|
| 116 |
"name": "scale_1280",
|
| 117 |
"betas": [
|
| 118 |
0.9,
|
|
@@ -135,7 +135,7 @@
|
|
| 135 |
]
|
| 136 |
},
|
| 137 |
{
|
| 138 |
-
"lr": 0.
|
| 139 |
"name": "fusion",
|
| 140 |
"betas": [
|
| 141 |
0.9,
|
|
@@ -195,7 +195,7 @@
|
|
| 195 |
"T_i": 10,
|
| 196 |
"T_mult": 2,
|
| 197 |
"eta_min": 1e-06,
|
| 198 |
-
"T_cur":
|
| 199 |
"base_lrs": [
|
| 200 |
0.01,
|
| 201 |
0.01,
|
|
@@ -204,24 +204,24 @@
|
|
| 204 |
0.01,
|
| 205 |
0.005
|
| 206 |
],
|
| 207 |
-
"last_epoch":
|
| 208 |
"_step_count": 0,
|
| 209 |
"_is_initial": false,
|
| 210 |
"_get_lr_called_within_step": false,
|
| 211 |
"_last_lr": [
|
| 212 |
-
0.
|
| 213 |
-
0.
|
| 214 |
-
0.
|
| 215 |
-
0.
|
| 216 |
-
0.
|
| 217 |
-
0.
|
| 218 |
]
|
| 219 |
},
|
| 220 |
"metrics": {
|
| 221 |
-
"best_val_acc":
|
| 222 |
-
"best_epoch":
|
| 223 |
"scale_accuracies": {
|
| 224 |
-
"256":
|
| 225 |
}
|
| 226 |
},
|
| 227 |
"train_config": {
|
|
|
|
| 1 |
{
|
| 2 |
+
"epoch": 2,
|
| 3 |
"optimizer_state_dict": {
|
| 4 |
"state": {
|
| 5 |
"0": {
|
| 6 |
+
"step": "tensor(3756.)",
|
| 7 |
+
"exp_avg": "tensor([[ 1.7831e-05, -4.5677e-05, -1.0656e-05, ..., 2.5515e-05,\n 2.5247e-05, 2.0031e-05],\n [ 2.8097e-05, -8.2606e-05, 2.0928e-05, ..., 5.4769e-06,\n 6.5177e-06, 1.4157e-05],\n [-1.5467e-05, -4.2629e-05, -4.7339e-06, ..., 5.2465e-05,\n 1.1511e-05, 1.5347e-05],\n ...,\n [-2.3319e-04, 1.3111e-04, -6.7066e-05, ..., -8.4160e-05,\n -1.3645e-05, -5.2447e-05],\n [ 2.8317e-32, -3.0252e-32, 3.7288e-32, ..., 1.2018e-33,\n -2.5549e-32, -1.2403e-32],\n [ 2.8868e-04, -2.0421e-04, 5.1263e-05, ..., 1.0802e-04,\n 6.9886e-05, -1.3845e-05]], device='cuda:0')",
|
| 8 |
+
"exp_avg_sq": "tensor([[5.5924e-08, 7.8008e-08, 9.2438e-09, ..., 2.2459e-08, 2.2992e-08,\n 6.1665e-09],\n [1.5358e-07, 1.1598e-07, 3.8675e-08, ..., 7.3238e-08, 3.6567e-08,\n 5.1830e-08],\n [1.1599e-07, 1.4503e-07, 3.3933e-08, ..., 4.0283e-08, 2.8559e-08,\n 3.0028e-08],\n ...,\n [3.0393e-07, 1.8733e-07, 3.2085e-08, ..., 3.6319e-08, 2.9407e-08,\n 1.9908e-08],\n [1.7530e-11, 4.0619e-10, 6.3743e-11, ..., 2.6928e-11, 8.5347e-11,\n 5.0808e-11],\n [1.9579e-07, 1.2667e-07, 1.9311e-08, ..., 2.4558e-08, 4.5792e-08,\n 2.2544e-08]], device='cuda:0')"
|
| 9 |
},
|
| 10 |
"1": {
|
| 11 |
+
"step": "tensor(3756.)",
|
| 12 |
+
"exp_avg": "tensor([ 5.1233e-04, 1.4962e-03, 8.6219e-04, 6.6010e-04, -2.8160e-12,\n 9.4107e-05, 1.1703e-04, 5.3116e-04, 1.1135e-03, 2.2131e-03,\n -7.7125e-04, 3.4627e-03, 5.6052e-45, -6.5682e-04, 1.2157e-03,\n -3.2750e-04, -2.4690e-03, 2.3180e-03, 5.7181e-04, 5.6052e-45,\n -2.4293e-03, -2.9330e-03, -1.1394e-03, -1.1585e-03, 5.6052e-45,\n 2.7927e-03, 1.9219e-04, -7.7537e-04, 1.0711e-03, -2.8580e-03,\n -8.0813e-04, -2.4576e-04, -2.3504e-08, 5.6052e-45, -1.2613e-03,\n 7.3082e-04, 2.2089e-04, -2.8135e-03, -1.7028e-04, -9.0479e-04,\n -3.4984e-03, -2.0797e-03, 3.1206e-04, -1.5827e-03, 1.4216e-03,\n 5.5516e-03, 3.3014e-03, -6.2577e-04, 1.7331e-03, 1.2679e-03,\n -4.2741e-05, 5.6052e-45, -5.6052e-45, 5.6052e-45, -1.2496e-03,\n -9.4733e-04, 1.6383e-03, -4.1002e-04, 3.2997e-09, 3.3793e-03,\n -3.7731e-04, 3.8605e-04, -2.8461e-03, -1.1535e-03, -1.6822e-03,\n -1.6403e-03, 7.6820e-05, 5.6052e-45, 1.1597e-04, 2.3749e-03,\n -2.1615e-04, 5.6052e-45, 3.5370e-03, 3.2385e-03, 2.5593e-04,\n 1.1675e-03, -1.5430e-03, -1.2461e-03, 3.1295e-03, -9.0900e-03,\n 2.0511e-03, -1.5631e-03, 1.7974e-03, -5.7405e-04, 1.3671e-03,\n -8.7397e-04, 2.9302e-03, 1.2321e-03, 1.2652e-03, 2.4025e-03,\n 5.6052e-45, -1.0113e-03, -8.0032e-04, -3.4159e-03, -9.0481e-04,\n -1.8566e-03, 7.8791e-04, 5.2959e-04, -3.0380e-03, -6.7021e-04,\n 7.4207e-04, 6.3742e-04, -1.4810e-03, -1.3313e-03, -4.9065e-04,\n -1.0980e-04, 4.6380e-05, 2.6412e-03, -1.7604e-04, -7.9487e-04,\n 4.2142e-04, -1.7397e-03, 5.6052e-45, 1.0810e-03, -1.6093e-05,\n 1.8620e-03, -1.1098e-03, 4.2065e-03, -5.6052e-45, 1.0830e-05,\n 5.6052e-45, -4.9362e-04, 5.6052e-45, 4.5340e-03, 2.7321e-04,\n 3.2198e-03, -6.2468e-03, 5.6052e-45, 4.0794e-04, -2.9376e-04,\n 2.0729e-03, 1.9686e-03, 2.8169e-03, 9.9771e-25, 1.8688e-03,\n -3.2034e-04, 2.9599e-04, 1.7660e-03, 5.4940e-04, -5.5974e-04,\n 1.7476e-03, 2.0100e-03, 5.2797e-03, 2.3488e-03, 5.5077e-03,\n 2.2498e-03, -8.5076e-13, 4.0588e-03, -4.4685e-04, 2.2580e-03,\n -2.3057e-17, 1.3667e-03, -2.0953e-03, 5.6052e-45, 3.2642e-03,\n 1.1543e-03, 6.5475e-20, 2.3212e-03, 3.4358e-03, -4.1328e-04,\n -1.2298e-03, 4.9247e-04, 6.0939e-04, 3.2708e-03, 2.0755e-04,\n 3.8615e-05, 9.2578e-04, 1.8436e-04, 2.7992e-03, 7.7843e-23,\n 5.6052e-45, -6.7832e-04, -2.2660e-03, 8.3994e-04, -2.6474e-03,\n 5.8393e-04, -7.7083e-04, -2.7944e-03, 5.6052e-45, 1.2081e-03,\n -1.4105e-03, -1.8192e-03, 1.4575e-04, 5.6052e-45, -5.0196e-04,\n 1.1285e-03, -8.7956e-04, -7.5027e-04, -1.9143e-05, 5.6052e-45,\n 5.6052e-45, 2.1472e-03, 2.0672e-03, -4.0834e-03, 1.1510e-04,\n 7.5289e-04, -1.6370e-03, 1.5778e-03, 5.6052e-45, 9.0714e-04,\n 1.8977e-03, -1.8082e-03, 9.2614e-04, -1.9589e-03, -1.1776e-03,\n 5.6052e-45, 3.3800e-04, 3.8359e-04, 1.0382e-03, 1.8186e-03,\n 7.9169e-04, 5.4020e-04, -4.6689e-04, 3.7264e-04, 5.1813e-04,\n -2.6652e-03, 1.9006e-03, -1.2771e-03, -2.5275e-03, -3.0154e-03,\n 5.3493e-04, 2.4243e-04, 1.5057e-03, -1.1234e-03, 2.1051e-03,\n 9.7383e-04, -3.3279e-03, -3.1169e-04, 2.4938e-04, -2.2146e-06,\n 7.9057e-04, -2.7659e-04, -1.0425e-03, 5.6052e-45, -1.8182e-03,\n 3.0576e-03, 2.8684e-03, 4.9024e-04, 1.5073e-03, 2.0503e-03,\n 7.2662e-04, 5.9012e-04, -1.2612e-03, 8.4114e-04, 1.4172e-04,\n 3.8061e-03, -1.0976e-03, -4.4220e-04, -1.6167e-03, 2.3890e-03,\n -3.2845e-03, 3.0843e-03, 1.2070e-04, 1.6564e-03, 5.6408e-04,\n -1.9539e-03, 5.6052e-45, -2.9932e-04, -2.6776e-04, 5.9844e-04,\n -1.4972e-04, 7.2556e-04, -1.3185e-03, 8.6790e-04, -1.6135e-03,\n -5.3571e-04, -2.9040e-04, 5.6052e-45, -2.0915e-03, -2.2987e-03,\n 5.6645e-04, -8.4885e-04, 9.0699e-04, 3.9753e-04, 1.3428e-04,\n 5.6052e-45, 1.8292e-03, 5.6052e-45, -4.4438e-03, 8.0182e-04,\n -1.1643e-03, 4.3945e-03, -2.2254e-03, -5.2929e-03, -3.7621e-04,\n 3.2349e-04, -4.3990e-19, 3.2879e-03, 5.5551e-04, -2.1160e-05,\n -1.6796e-04, 2.1284e-03, 6.7839e-04, 1.9942e-03, -1.7185e-04,\n 2.9146e-03, -5.7036e-03, 4.0484e-03, 3.0776e-03, -6.2567e-04,\n 1.2639e-03, 3.4377e-04, -4.9843e-06, 1.6383e-04, 4.6551e-04,\n 2.1297e-05, -2.2879e-04, 5.6052e-45, 5.6052e-45, 5.6641e-04,\n 1.3571e-03, -3.0112e-03, -5.2022e-04, 1.7431e-03, -8.2426e-04,\n -4.6999e-04, 1.4273e-03, 1.8569e-03, -3.6938e-04, 1.7993e-04,\n 7.7306e-04, -3.0861e-04, -2.5285e-03, -8.6260e-05, 2.4698e-04,\n -1.5429e-03, 1.3110e-03, -5.4266e-04, 1.9959e-05, 1.3702e-03,\n 2.2933e-04, 1.4004e-03, -1.4422e-03, 1.7862e-03, 5.6052e-45,\n -2.2920e-04, 1.7263e-04, -9.7651e-04, 1.5978e-03, -3.9989e-04,\n -6.9877e-04, 1.0665e-03, 3.1147e-03, 9.5281e-04, -1.3571e-03,\n -2.0422e-03, 5.6052e-45, -3.1476e-04, -1.0402e-03, 1.6093e-03,\n 5.0974e-04, -1.3595e-03, 1.8338e-03, 1.0209e-03, -1.0805e-03,\n -6.0864e-03, -4.5676e-04, 2.0731e-03, 2.0280e-03, -1.4483e-03,\n -1.5112e-03, -2.0867e-04, 3.4876e-03, 5.2873e-04, -4.3349e-03,\n 1.6431e-03, 3.3320e-04, -5.3557e-04, -1.1041e-04, 1.0357e-03,\n 3.0968e-03, 7.0172e-04, 2.3487e-04, -1.8611e-03, -1.2893e-03,\n 2.4788e-03, -3.5122e-04, 7.0537e-05, 5.6052e-45, -1.3271e-03,\n -2.2722e-03, 5.6052e-45, -7.8819e-04, -3.5749e-03, 1.7267e-03,\n -1.9830e-03, -1.6744e-03, 2.2860e-03, 1.9861e-04, 2.0112e-04,\n 3.5650e-04, -2.7359e-03, 1.4410e-03, -5.6052e-45, 5.6052e-45,\n -8.9577e-04, 3.5788e-03, 1.2752e-03, 3.6856e-03, -3.6852e-04,\n 2.5619e-04, 2.8084e-04, -1.5861e-03, -4.6875e-04, -5.3986e-04,\n 9.9002e-04, 2.3711e-04, 5.6052e-45, -3.6677e-03, -9.2103e-04,\n 5.6052e-45, -8.7159e-04, 5.6052e-45, -4.0697e-05, -8.5340e-04,\n 3.2206e-04, 7.8644e-04, 5.6052e-45, -1.5146e-03, 3.0435e-03,\n -6.3783e-04, -1.3443e-03, -1.6531e-03, -2.1750e-03, 1.1121e-03,\n 7.2222e-04, -2.5241e-03, 6.5804e-24, -2.7617e-03, 2.8942e-12,\n -6.0669e-04, 2.4579e-04, 6.0150e-04, 5.6052e-45, -6.9064e-05,\n 1.4827e-03, -4.3664e-04, 4.7341e-04, -1.2992e-03, -3.8477e-04,\n 3.5847e-03, -6.8151e-04, 1.3217e-03, -1.0765e-03, -4.6359e-04,\n 7.9395e-04, -2.2083e-03, 5.6052e-45, -2.3358e-03, 4.1295e-03,\n 5.6052e-45, 2.1284e-03, 2.2264e-04, 6.1589e-04, -6.9541e-04,\n 3.0862e-15, -6.7634e-04, 5.3916e-06, 5.7845e-04, 5.6052e-45,\n -8.4421e-04, -6.4071e-03, 5.6052e-45, -6.1570e-04, 1.1874e-10,\n 1.6721e-03, 1.0634e-03, 5.6052e-45, 5.2167e-04, -4.3601e-04,\n 5.2242e-03, 7.0871e-04, -5.1759e-03, -1.8040e-03, -2.1591e-03,\n -5.3001e-05, 5.6052e-45, 3.0465e-03, 5.6052e-45, -2.9522e-04,\n -1.0857e-04, -5.6573e-04, -1.4785e-03, 2.4057e-03, 5.6347e-04,\n -5.0183e-04, 2.1063e-03, -2.7572e-04, -3.3027e-03, 1.9016e-03,\n 5.6052e-45, -9.0800e-04, 7.3842e-04, 1.9143e-03, -5.9897e-04,\n 1.0573e-04, 3.2216e-03, -1.4969e-04, -9.8013e-05, -8.7615e-04,\n 2.4830e-03, 5.6052e-45, -3.5623e-04, 2.7601e-03, -1.5760e-04,\n -6.6513e-04, -4.0614e-06, 6.0204e-04, -2.1472e-03, 2.3123e-03,\n 2.0108e-03, -3.6236e-03, -1.8755e-03, 4.0671e-04, -3.7499e-13,\n 5.6052e-45, -2.5051e-04, -2.9165e-03, -1.5708e-03, 6.8843e-04,\n 1.6382e-03, 2.6966e-03, 2.3469e-03, 8.3923e-04, -6.5503e-04,\n -5.1303e-04, -1.9877e-03, -8.5651e-04, -9.4771e-04, -3.1107e-03,\n 2.7734e-22, 1.8081e-03, 1.3143e-03, 4.3692e-04, -5.6052e-45,\n 6.7914e-04, 1.3574e-05, 5.6052e-45, 5.6052e-45, 1.9418e-03,\n 4.6115e-04, 1.3270e-03, 1.6926e-03, -1.7398e-03, -5.8611e-05,\n -1.4337e-03, 1.4241e-03, 6.2230e-04, 2.5681e-03, 7.9564e-04,\n -7.1825e-04, 2.9431e-04, 8.9161e-04, -5.4874e-04, -1.8233e-03,\n -3.6833e-04, 8.9179e-04, -8.6929e-04, -9.3005e-04, 3.4687e-03,\n 5.7667e-04, 2.3803e-03, -4.0191e-04, 3.5921e-03, 6.4549e-04,\n -2.6844e-03, -3.5730e-03, -4.3390e-04, 3.9128e-04, -9.8408e-04,\n 4.1179e-03, 5.0758e-04, -1.0377e-03, 1.0575e-03, -2.8883e-04,\n -3.8610e-35, 5.6052e-45, -2.5155e-03, -1.5328e-03, 3.0458e-03,\n -8.3949e-04, 5.6052e-45, 1.3146e-03, -5.2305e-03, -1.0560e-03,\n -8.0811e-04, -3.0424e-03, 4.5300e-04, -2.0464e-03, -2.4431e-03,\n 4.9951e-04, 6.8201e-04, -3.1527e-04, -8.7993e-04, -2.9484e-03,\n 4.8691e-04, -1.7727e-03, -7.9813e-04, -2.3738e-03, -2.6145e-05,\n -1.8552e-03, -1.0963e-03, 1.2725e-04, -2.3126e-03, -6.4813e-04,\n 1.9604e-04, -2.7641e-03, 9.3641e-04, 9.5629e-04, 2.4258e-03,\n -1.0593e-03, 1.5176e-03, -2.2232e-04, 1.4156e-03, 3.2536e-04,\n 4.4908e-03, -1.0206e-03, 9.0033e-08, 1.5631e-03, 1.4958e-10,\n 2.7674e-14, -1.5015e-05, 2.3728e-03, 1.6508e-04, -3.3530e-03,\n 2.2802e-03, 7.1558e-04, -6.1278e-04, 1.3469e-03, -4.3877e-04,\n -6.6916e-03, -3.7049e-34, 8.0133e-06, 1.9363e-03, 2.4436e-04,\n -2.1892e-03, -1.7682e-03, -1.6809e-03, 4.8598e-31, 3.1390e-03],\n device='cuda:0')",
|
| 13 |
+
"exp_avg_sq": "tensor([1.8429e-05, 7.8424e-05, 4.1216e-05, 3.2207e-05, 1.5486e-07, 8.1643e-06,\n 5.6661e-05, 5.4997e-05, 3.6809e-05, 5.8048e-05, 5.5900e-05, 1.0907e-04,\n 5.2763e-07, 4.9280e-05, 6.0358e-05, 6.0430e-05, 9.3022e-05, 6.6292e-05,\n 2.2263e-05, 1.3737e-07, 4.6491e-05, 4.1435e-05, 3.8910e-05, 6.2517e-05,\n 5.0144e-07, 8.2325e-05, 5.6426e-05, 7.6278e-05, 5.5761e-05, 6.7651e-05,\n 6.4038e-05, 6.5705e-05, 1.0096e-06, 8.8563e-08, 4.7941e-05, 5.5138e-05,\n 6.3255e-05, 4.0000e-05, 3.1811e-05, 5.8204e-05, 6.2877e-05, 3.0693e-05,\n 5.5385e-05, 4.5257e-05, 4.4873e-05, 6.5875e-05, 5.8716e-05, 9.9101e-05,\n 9.7689e-05, 3.3143e-05, 7.1325e-05, 5.2607e-08, 8.5362e-08, 7.9888e-08,\n 7.1962e-05, 1.1149e-04, 4.4462e-05, 4.1195e-05, 2.5838e-07, 6.9597e-05,\n 5.9119e-05, 4.8329e-05, 9.5072e-05, 3.5547e-05, 6.7055e-05, 7.1558e-05,\n 5.2508e-05, 9.7777e-08, 7.3431e-05, 6.2996e-05, 7.9860e-06, 3.9941e-07,\n 7.2067e-05, 4.6330e-05, 1.3939e-05, 6.3709e-05, 7.0940e-05, 7.1251e-05,\n 3.4550e-05, 7.3103e-05, 9.4840e-05, 5.4518e-05, 7.9089e-05, 4.5982e-05,\n 6.0059e-05, 4.9573e-05, 5.8442e-05, 3.0440e-05, 6.0963e-05, 5.4131e-05,\n 6.2351e-07, 7.2436e-05, 5.1906e-05, 4.2414e-05, 9.1787e-05, 2.1514e-05,\n 5.2725e-05, 4.1873e-05, 4.9157e-05, 3.6346e-05, 2.9048e-05, 5.7960e-06,\n 7.6109e-05, 8.0546e-05, 1.2031e-04, 3.1543e-05, 5.6253e-05, 8.2481e-05,\n 1.2189e-05, 2.6002e-05, 8.6256e-05, 9.0572e-05, 4.2156e-08, 4.1130e-05,\n 5.3011e-07, 4.5521e-05, 6.3898e-05, 9.7266e-05, 1.8796e-08, 9.8546e-08,\n 6.8374e-08, 5.0582e-05, 5.4445e-08, 1.1226e-04, 5.4902e-05, 7.8698e-05,\n 7.3919e-05, 1.0242e-08, 2.3582e-05, 7.7462e-05, 4.4632e-05, 5.0593e-05,\n 7.1332e-05, 1.8271e-08, 6.7731e-05, 5.8945e-05, 3.1110e-05, 5.1993e-05,\n 4.2545e-05, 5.2321e-05, 1.0764e-04, 6.3356e-05, 7.3797e-05, 5.5977e-05,\n 6.8316e-05, 6.1020e-05, 8.0626e-07, 6.7718e-05, 5.7531e-05, 4.4023e-05,\n 6.9153e-07, 3.8952e-05, 4.7206e-05, 3.7102e-07, 4.9116e-05, 7.3234e-05,\n 7.3487e-07, 7.9238e-05, 4.3922e-05, 6.1611e-05, 2.1392e-05, 5.9273e-05,\n 1.4000e-04, 5.4958e-05, 5.5462e-05, 4.1322e-05, 1.0242e-04, 3.5023e-05,\n 5.3783e-05, 8.7312e-08, 1.3455e-07, 6.2080e-05, 8.8259e-05, 4.6051e-05,\n 5.0702e-05, 8.2736e-05, 2.5034e-05, 6.8924e-05, 2.4419e-08, 2.8527e-05,\n 5.2167e-05, 7.3348e-05, 9.0304e-06, 1.7967e-07, 6.7260e-05, 6.1738e-05,\n 8.1591e-05, 3.5377e-05, 4.5612e-05, 5.2171e-08, 5.9779e-07, 5.3762e-05,\n 2.8652e-05, 7.1083e-05, 6.1304e-05, 5.5979e-05, 3.9565e-05, 7.5861e-05,\n 9.4224e-08, 4.8972e-05, 4.0873e-05, 2.9134e-05, 8.5371e-05, 2.5459e-05,\n 1.1806e-04, 4.6474e-09, 5.6294e-05, 6.2230e-05, 4.8022e-05, 6.4653e-05,\n 3.1432e-05, 5.7633e-05, 6.0467e-05, 5.9572e-05, 3.4891e-05, 5.2127e-05,\n 3.9065e-05, 7.4697e-05, 7.3555e-05, 3.6516e-05, 4.0428e-05, 6.5586e-05,\n 4.5840e-05, 5.1340e-05, 5.2006e-05, 5.3998e-05, 8.8808e-05, 9.3350e-05,\n 3.8006e-05, 8.3215e-05, 6.1270e-05, 1.0445e-04, 7.0716e-05, 1.1552e-07,\n 6.6224e-05, 3.3235e-05, 5.2076e-05, 3.9190e-05, 1.3412e-04, 5.7846e-05,\n 3.7738e-05, 5.5868e-05, 5.8193e-05, 5.1935e-05, 9.0579e-05, 3.8098e-05,\n 3.0676e-05, 7.1407e-05, 4.0514e-05, 5.2177e-05, 5.7026e-05, 5.2525e-05,\n 4.3748e-05, 4.9606e-05, 6.8073e-05, 5.4826e-05, 4.9775e-07, 4.4180e-05,\n 3.3553e-05, 1.3345e-05, 5.5598e-05, 8.0616e-05, 6.8480e-05, 6.4118e-05,\n 5.9491e-05, 5.7352e-05, 4.2876e-05, 7.3783e-08, 6.4196e-05, 6.4906e-05,\n 4.3185e-05, 8.3245e-05, 4.9406e-05, 2.4759e-05, 7.4066e-05, 1.2876e-07,\n 5.5531e-05, 3.6385e-07, 4.0812e-05, 1.8832e-05, 5.4092e-05, 4.6169e-05,\n 8.6733e-05, 7.8781e-05, 6.8829e-05, 6.6240e-05, 1.4839e-08, 7.6035e-05,\n 7.8169e-05, 4.0586e-05, 6.9116e-06, 5.9455e-05, 8.6081e-05, 6.8788e-05,\n 4.7999e-05, 9.0710e-05, 9.8244e-05, 5.5921e-05, 5.4694e-05, 1.1449e-04,\n 4.9329e-05, 6.2151e-06, 1.1886e-06, 4.3558e-05, 5.7345e-05, 3.4039e-06,\n 6.2881e-05, 1.5315e-08, 3.0172e-07, 5.8508e-05, 8.4363e-05, 3.9821e-05,\n 6.2632e-05, 7.2649e-05, 5.8004e-05, 5.8830e-05, 6.8701e-05, 5.1764e-05,\n 4.0504e-05, 6.9099e-05, 7.2059e-05, 1.0150e-04, 8.1962e-05, 4.0281e-05,\n 1.9336e-05, 6.2384e-05, 4.9710e-05, 7.0670e-06, 4.2761e-05, 6.5936e-05,\n 1.1104e-05, 3.6789e-05, 7.6847e-05, 7.2629e-05, 3.5995e-11, 5.1730e-05,\n 3.6673e-05, 8.5187e-05, 3.6331e-05, 4.6995e-05, 9.1364e-06, 6.6941e-05,\n 4.9654e-05, 5.2543e-05, 5.2972e-05, 8.5916e-05, 5.2677e-07, 6.7806e-06,\n 5.9184e-05, 5.9994e-05, 4.2475e-05, 6.7451e-05, 4.9160e-05, 5.1374e-05,\n 9.5346e-05, 5.5690e-05, 5.1087e-05, 5.1013e-05, 7.7113e-05, 1.3310e-06,\n 2.9492e-05, 3.7743e-05, 6.4588e-05, 8.8312e-05, 6.5177e-05, 1.4898e-04,\n 1.7569e-05, 6.9014e-05, 7.9805e-05, 6.7745e-05, 6.6396e-05, 4.6284e-05,\n 4.9685e-05, 1.0765e-05, 5.2503e-05, 9.4992e-05, 1.2216e-04, 1.7051e-05,\n 2.2932e-07, 6.6446e-05, 1.9666e-05, 1.2512e-06, 5.0863e-05, 1.0809e-04,\n 4.8287e-05, 4.1113e-05, 5.7037e-05, 7.6571e-05, 4.0140e-05, 3.2797e-05,\n 7.5846e-05, 7.5232e-05, 4.8110e-05, 1.2436e-07, 4.1264e-07, 5.8930e-05,\n 6.4290e-05, 5.9733e-05, 8.5655e-05, 4.2477e-05, 5.1533e-05, 4.0953e-05,\n 1.9062e-05, 4.4839e-05, 4.8009e-05, 8.5967e-05, 4.2455e-05, 1.5196e-07,\n 8.6692e-06, 1.7067e-05, 4.3776e-08, 5.9799e-06, 7.6373e-08, 7.7939e-05,\n 6.6996e-05, 2.2114e-05, 4.4705e-05, 2.0620e-07, 2.7376e-05, 6.1274e-05,\n 3.9801e-05, 6.7514e-05, 7.7499e-05, 8.3942e-05, 5.4821e-05, 3.9531e-06,\n 3.7451e-05, 1.5607e-07, 3.2283e-05, 2.8839e-08, 3.2195e-05, 6.9658e-05,\n 5.9980e-05, 1.3245e-07, 3.5261e-05, 5.4220e-05, 7.9021e-05, 6.9342e-05,\n 4.8851e-05, 3.0698e-05, 7.3776e-05, 3.0239e-05, 6.1269e-05, 8.3531e-05,\n 4.3949e-05, 1.2398e-06, 5.4793e-05, 4.4704e-08, 5.6602e-05, 3.6121e-05,\n 1.4832e-06, 2.8724e-05, 4.3440e-05, 4.2151e-06, 5.2914e-05, 7.0113e-08,\n 3.5470e-05, 5.1513e-06, 4.5728e-05, 2.0023e-06, 5.5838e-05, 9.5254e-05,\n 1.3018e-08, 4.7710e-05, 1.6855e-06, 6.7336e-05, 4.4844e-05, 1.0632e-07,\n 6.9499e-05, 3.8512e-05, 1.1443e-04, 7.7913e-05, 4.8103e-05, 1.9658e-05,\n 3.8010e-05, 5.8789e-05, 7.3901e-07, 6.7558e-05, 2.3464e-07, 9.9241e-06,\n 6.0042e-06, 7.3457e-06, 4.9822e-05, 6.4646e-05, 1.1142e-04, 5.0077e-05,\n 5.9531e-05, 4.5883e-05, 6.5449e-05, 4.9554e-05, 9.8446e-08, 5.5766e-05,\n 5.6535e-05, 1.1022e-04, 7.2413e-06, 2.2127e-05, 4.5780e-05, 3.7642e-05,\n 5.6162e-05, 1.2533e-05, 4.8463e-05, 7.3051e-07, 7.0802e-06, 8.7394e-05,\n 5.1142e-05, 9.3222e-05, 5.9558e-05, 5.3520e-05, 6.2056e-05, 5.1860e-05,\n 6.2345e-05, 1.1813e-04, 4.4469e-05, 6.1378e-05, 5.4675e-07, 6.0514e-07,\n 6.8865e-05, 1.3582e-04, 8.0553e-05, 4.9708e-05, 6.0015e-05, 6.1626e-05,\n 5.5857e-05, 6.6562e-05, 5.0500e-05, 1.0480e-05, 5.3138e-05, 6.2440e-05,\n 4.3975e-05, 4.3015e-05, 1.4075e-07, 4.1689e-05, 6.3768e-05, 3.6194e-05,\n 5.5089e-07, 5.1195e-05, 5.9280e-05, 4.4625e-08, 1.3426e-07, 6.4783e-05,\n 6.1671e-05, 7.4173e-05, 3.5884e-05, 7.4318e-05, 3.4199e-05, 6.2636e-05,\n 4.9733e-05, 3.5539e-05, 3.9190e-05, 6.2689e-05, 6.2631e-05, 5.4694e-05,\n 8.1090e-05, 7.6418e-05, 6.4501e-05, 3.5079e-05, 5.3659e-05, 1.6279e-04,\n 4.1786e-05, 5.2087e-05, 2.7329e-05, 5.4073e-05, 6.3129e-05, 9.9276e-05,\n 1.4463e-06, 4.7581e-05, 7.8885e-05, 3.6910e-05, 7.5648e-05, 5.6108e-05,\n 6.1684e-05, 4.9811e-05, 5.5668e-05, 8.1306e-05, 7.6103e-07, 6.9993e-08,\n 8.0110e-07, 5.5193e-05, 4.9125e-05, 6.7111e-05, 6.0407e-05, 1.5247e-06,\n 5.0229e-05, 5.9279e-05, 2.5739e-05, 5.7219e-05, 4.1998e-05, 4.4227e-05,\n 8.3390e-05, 6.9618e-05, 4.7138e-05, 9.0475e-05, 6.8649e-05, 8.6704e-05,\n 5.7291e-05, 6.2965e-05, 6.1046e-05, 6.3377e-05, 8.6306e-05, 8.9585e-05,\n 8.1385e-05, 4.0861e-05, 5.0476e-05, 5.1084e-05, 5.8064e-05, 4.2190e-05,\n 4.8913e-05, 6.1226e-05, 1.2306e-04, 9.7292e-05, 7.2088e-05, 7.9435e-05,\n 6.0723e-05, 2.1911e-05, 2.4702e-05, 6.3349e-05, 5.6102e-05, 5.9785e-05,\n 3.3363e-05, 3.4988e-08, 1.0017e-06, 7.3015e-07, 6.3292e-05, 4.8849e-05,\n 5.9466e-05, 7.0894e-05, 5.3603e-05, 4.3099e-05, 4.0995e-05, 7.9944e-05,\n 4.0672e-05, 2.5679e-07, 4.2538e-08, 7.4015e-05, 5.2913e-05, 8.9377e-05,\n 6.6951e-05, 5.6542e-05, 9.5307e-08, 4.0459e-05], device='cuda:0')"
|
| 14 |
},
|
| 15 |
"2": {
|
| 16 |
+
"step": "tensor(3756.)",
|
| 17 |
+
"exp_avg": "tensor([[-7.9560e-06, 2.3993e-05, 3.2534e-06, ..., 5.1585e-06,\n -3.0564e-33, 5.7035e-06],\n [-2.3746e-05, -4.0098e-05, -1.1183e-05, ..., 1.7490e-05,\n -2.7885e-33, -3.1322e-05],\n [-2.1273e-05, -1.0974e-05, 1.0933e-06, ..., 1.0596e-05,\n -3.1965e-33, 4.0670e-05],\n ...,\n [-8.9289e-06, 5.3523e-05, -6.5075e-06, ..., 2.6585e-05,\n 4.1366e-34, 2.6323e-05],\n [-2.7970e-06, 3.2530e-05, 6.1558e-06, ..., 4.4867e-05,\n 7.4581e-33, 1.1290e-04],\n [ 8.1028e-06, 1.2931e-05, 5.9366e-08, ..., 1.4795e-05,\n 5.9547e-33, 5.4140e-05]], device='cuda:0')",
|
| 18 |
+
"exp_avg_sq": "tensor([[4.0505e-09, 1.4402e-08, 1.2323e-08, ..., 1.4270e-08, 5.3745e-14,\n 1.2518e-08],\n [8.1800e-09, 3.9253e-08, 2.2590e-08, ..., 2.9301e-08, 9.9092e-12,\n 2.1253e-08],\n [6.0028e-09, 2.6590e-08, 2.3240e-08, ..., 2.0730e-08, 6.6242e-11,\n 2.8640e-08],\n ...,\n [6.7921e-09, 2.7842e-08, 2.6969e-08, ..., 2.5708e-08, 4.8211e-11,\n 3.2653e-08],\n [9.4379e-09, 3.2343e-08, 2.5039e-08, ..., 3.0256e-08, 4.4243e-13,\n 7.4594e-08],\n [8.0911e-09, 3.1045e-08, 2.6019e-08, ..., 3.9526e-08, 6.0953e-11,\n 1.9206e-08]], device='cuda:0')"
|
| 19 |
}
|
| 20 |
},
|
| 21 |
"param_groups": [
|
| 22 |
{
|
| 23 |
+
"lr": 0.00793913236883622,
|
| 24 |
"name": "scale_256",
|
| 25 |
"betas": [
|
| 26 |
0.9,
|
|
|
|
| 43 |
]
|
| 44 |
},
|
| 45 |
{
|
| 46 |
+
"lr": 0.00793913236883622,
|
| 47 |
"name": "scale_512",
|
| 48 |
"betas": [
|
| 49 |
0.9,
|
|
|
|
| 66 |
]
|
| 67 |
},
|
| 68 |
{
|
| 69 |
+
"lr": 0.00793913236883622,
|
| 70 |
"name": "scale_768",
|
| 71 |
"betas": [
|
| 72 |
0.9,
|
|
|
|
| 89 |
]
|
| 90 |
},
|
| 91 |
{
|
| 92 |
+
"lr": 0.00793913236883622,
|
| 93 |
"name": "scale_1024",
|
| 94 |
"betas": [
|
| 95 |
0.9,
|
|
|
|
| 112 |
]
|
| 113 |
},
|
| 114 |
{
|
| 115 |
+
"lr": 0.00793913236883622,
|
| 116 |
"name": "scale_1280",
|
| 117 |
"betas": [
|
| 118 |
0.9,
|
|
|
|
| 135 |
]
|
| 136 |
},
|
| 137 |
{
|
| 138 |
+
"lr": 0.003969669238105037,
|
| 139 |
"name": "fusion",
|
| 140 |
"betas": [
|
| 141 |
0.9,
|
|
|
|
| 195 |
"T_i": 10,
|
| 196 |
"T_mult": 2,
|
| 197 |
"eta_min": 1e-06,
|
| 198 |
+
"T_cur": 3,
|
| 199 |
"base_lrs": [
|
| 200 |
0.01,
|
| 201 |
0.01,
|
|
|
|
| 204 |
0.01,
|
| 205 |
0.005
|
| 206 |
],
|
| 207 |
+
"last_epoch": 3,
|
| 208 |
"_step_count": 0,
|
| 209 |
"_is_initial": false,
|
| 210 |
"_get_lr_called_within_step": false,
|
| 211 |
"_last_lr": [
|
| 212 |
+
0.00793913236883622,
|
| 213 |
+
0.00793913236883622,
|
| 214 |
+
0.00793913236883622,
|
| 215 |
+
0.00793913236883622,
|
| 216 |
+
0.00793913236883622,
|
| 217 |
+
0.003969669238105037
|
| 218 |
]
|
| 219 |
},
|
| 220 |
"metrics": {
|
| 221 |
+
"best_val_acc": 74.29,
|
| 222 |
+
"best_epoch": 2,
|
| 223 |
"scale_accuracies": {
|
| 224 |
+
"256": 74.29
|
| 225 |
}
|
| 226 |
},
|
| 227 |
"train_config": {
|