Upload weights and configs - David-decoupled-deep_efficiency - Run 20251012_065325
Browse files
weights/David-decoupled-deep_efficiency/20251012_065325/best_model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 59515088
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:63da40ca37b1d6dfef6fe878c9795165ecd148a58435169b369b095f7bdf5908
|
| 3 |
size 59515088
|
weights/David-decoupled-deep_efficiency/20251012_065325/best_model_metadata.json
CHANGED
|
@@ -1,26 +1,26 @@
|
|
| 1 |
{
|
| 2 |
-
"epoch":
|
| 3 |
"optimizer_state_dict": {
|
| 4 |
"state": {
|
| 5 |
"0": {
|
| 6 |
-
"step": "tensor(
|
| 7 |
-
"exp_avg": "tensor([[
|
| 8 |
-
"exp_avg_sq": "tensor([[1.
|
| 9 |
},
|
| 10 |
"1": {
|
| 11 |
-
"step": "tensor(
|
| 12 |
-
"exp_avg": "tensor([
|
| 13 |
-
"exp_avg_sq": "tensor([0.
|
| 14 |
},
|
| 15 |
"2": {
|
| 16 |
-
"step": "tensor(
|
| 17 |
-
"exp_avg": "tensor([[
|
| 18 |
-
"exp_avg_sq": "tensor([[
|
| 19 |
}
|
| 20 |
},
|
| 21 |
"param_groups": [
|
| 22 |
{
|
| 23 |
-
"lr": 0.
|
| 24 |
"name": "scale_256",
|
| 25 |
"betas": [
|
| 26 |
0.9,
|
|
@@ -43,7 +43,7 @@
|
|
| 43 |
]
|
| 44 |
},
|
| 45 |
{
|
| 46 |
-
"lr": 0.
|
| 47 |
"name": "scale_512",
|
| 48 |
"betas": [
|
| 49 |
0.9,
|
|
@@ -66,7 +66,7 @@
|
|
| 66 |
]
|
| 67 |
},
|
| 68 |
{
|
| 69 |
-
"lr": 0.
|
| 70 |
"name": "scale_768",
|
| 71 |
"betas": [
|
| 72 |
0.9,
|
|
@@ -89,7 +89,7 @@
|
|
| 89 |
]
|
| 90 |
},
|
| 91 |
{
|
| 92 |
-
"lr": 0.
|
| 93 |
"name": "scale_1024",
|
| 94 |
"betas": [
|
| 95 |
0.9,
|
|
@@ -112,7 +112,7 @@
|
|
| 112 |
]
|
| 113 |
},
|
| 114 |
{
|
| 115 |
-
"lr": 0.
|
| 116 |
"name": "scale_1280",
|
| 117 |
"betas": [
|
| 118 |
0.9,
|
|
@@ -135,7 +135,7 @@
|
|
| 135 |
]
|
| 136 |
},
|
| 137 |
{
|
| 138 |
-
"lr": 0.
|
| 139 |
"name": "fusion",
|
| 140 |
"betas": [
|
| 141 |
0.9,
|
|
@@ -195,7 +195,7 @@
|
|
| 195 |
"T_i": 10,
|
| 196 |
"T_mult": 2,
|
| 197 |
"eta_min": 1e-06,
|
| 198 |
-
"T_cur":
|
| 199 |
"base_lrs": [
|
| 200 |
0.001,
|
| 201 |
0.001,
|
|
@@ -204,24 +204,24 @@
|
|
| 204 |
0.001,
|
| 205 |
0.0005
|
| 206 |
],
|
| 207 |
-
"last_epoch":
|
| 208 |
"_step_count": 0,
|
| 209 |
"_is_initial": false,
|
| 210 |
"_get_lr_called_within_step": false,
|
| 211 |
"_last_lr": [
|
| 212 |
-
0.
|
| 213 |
-
0.
|
| 214 |
-
0.
|
| 215 |
-
0.
|
| 216 |
-
0.
|
| 217 |
-
0.
|
| 218 |
]
|
| 219 |
},
|
| 220 |
"metrics": {
|
| 221 |
-
"best_val_acc": 71.
|
| 222 |
-
"best_epoch":
|
| 223 |
"scale_accuracies": {
|
| 224 |
-
"256": 71.
|
| 225 |
}
|
| 226 |
},
|
| 227 |
"train_config": {
|
|
|
|
| 1 |
{
|
| 2 |
+
"epoch": 2,
|
| 3 |
"optimizer_state_dict": {
|
| 4 |
"state": {
|
| 5 |
"0": {
|
| 6 |
+
"step": "tensor(3756.)",
|
| 7 |
+
"exp_avg": "tensor([[ 6.2482e-05, -1.0957e-03, 1.8610e-04, ..., -6.3775e-05,\n 3.7722e-05, 3.0946e-04],\n [ 4.2669e-04, -4.4703e-04, 4.8625e-05, ..., -5.4459e-04,\n -1.1069e-04, -1.9971e-04],\n [ 2.1516e-04, 4.9376e-04, 1.0133e-03, ..., -5.4277e-04,\n -5.4259e-04, -2.4519e-04],\n ...,\n [ 1.3256e-04, 4.0228e-04, -8.2632e-04, ..., 2.7256e-05,\n -3.2793e-04, 1.5244e-04],\n [-4.2531e-04, -3.0743e-03, 1.4001e-04, ..., -4.0860e-04,\n 4.6036e-04, -1.8925e-04],\n [-1.4353e-04, -1.3795e-04, -6.5146e-04, ..., -1.1998e-04,\n 7.3662e-05, -3.9551e-05]], device='cuda:0')",
|
| 8 |
+
"exp_avg_sq": "tensor([[1.3045e-06, 1.2095e-05, 3.8998e-06, ..., 1.8005e-06, 9.7567e-07,\n 1.2811e-06],\n [3.1867e-06, 7.4417e-06, 8.1910e-06, ..., 2.5037e-06, 8.5574e-07,\n 1.1760e-06],\n [2.4247e-06, 1.5653e-05, 6.0696e-06, ..., 1.4071e-06, 9.6109e-07,\n 1.2029e-06],\n ...,\n [4.4321e-06, 3.4483e-05, 8.9087e-06, ..., 2.7869e-06, 1.6946e-06,\n 1.8854e-06],\n [1.9278e-06, 2.0316e-05, 5.4190e-06, ..., 1.3752e-06, 8.8687e-07,\n 1.3061e-06],\n [2.3611e-06, 1.1804e-05, 4.7666e-06, ..., 1.2768e-06, 1.1256e-06,\n 2.6667e-06]], device='cuda:0')"
|
| 9 |
},
|
| 10 |
"1": {
|
| 11 |
+
"step": "tensor(3756.)",
|
| 12 |
+
"exp_avg": "tensor([ 7.5002e-03, 6.1666e-03, -4.9600e-03, 6.1611e-03, 4.2384e-02,\n -1.9220e-02, -8.3844e-03, 4.7075e-04, 1.0635e-02, -1.0766e-02,\n -8.4952e-04, 1.1064e-03, -7.1118e-03, -1.7303e-02, -1.9323e-02,\n -1.2425e-02, 1.0077e-02, -4.0970e-02, 1.6759e-03, -2.3874e-02,\n 1.6497e-02, -1.2889e-04, 6.9716e-03, 2.6505e-02, 1.5302e-03,\n 1.1848e-02, 1.9951e-02, -8.8258e-03, 3.5513e-03, 1.4729e-02,\n 1.0189e-02, -4.1829e-03, 4.6535e-03, -2.6548e-02, 1.1126e-03,\n -2.9267e-02, -6.5974e-03, 1.0647e-02, -3.9801e-03, -8.8817e-05,\n -1.8313e-02, 6.3268e-03, 5.1648e-03, 3.6987e-03, -8.3055e-03,\n -3.9887e-03, -3.4601e-03, 1.9262e-02, 1.4138e-02, -1.7778e-02,\n -3.2670e-03, 3.1757e-02, 3.8606e-03, -3.3370e-03, 3.0356e-02,\n -1.3397e-02, -2.5703e-03, 1.4614e-02, -3.3291e-02, 8.3999e-04,\n 1.1530e-02, -1.9905e-02, 8.5553e-03, 1.5821e-02, 1.2836e-02,\n -5.8094e-03, -2.4451e-02, 1.0649e-02, 3.0301e-03, 2.4705e-03,\n -4.2230e-02, -1.3881e-02, -1.5045e-02, -5.2605e-03, 1.8229e-02,\n 5.9738e-03, 8.7830e-03, 6.5329e-03, -6.0538e-03, 1.3049e-02,\n -6.7696e-03, -6.8786e-04, 2.6906e-02, 2.2707e-02, -1.9941e-02,\n -1.1775e-02, -1.5720e-02, -1.2808e-02, -3.2262e-03, 2.2056e-02,\n 9.3135e-03, -2.3001e-03, 4.6321e-03, 1.6632e-02, -1.7077e-02,\n 2.4845e-03, 7.0338e-03, -2.0788e-03, 4.1306e-03, -1.8734e-02,\n 4.3794e-03, 1.5470e-02, -2.0499e-03, 7.6800e-03, 2.3201e-03,\n 8.2508e-03, 2.5984e-02, 1.7805e-02, -9.6886e-04, -9.4811e-03,\n -2.1282e-02, 1.0057e-02, 1.6776e-02, 2.8346e-03, -4.4798e-02,\n 1.0172e-02, 6.5314e-03, 1.2147e-02, -7.4831e-03, -8.4042e-03,\n 1.0060e-02, 5.8784e-03, -5.0699e-03, -2.3155e-02, 1.2979e-02,\n -4.0700e-02, 3.8160e-02, -1.5794e-03, -1.9136e-02, 8.3348e-03,\n -5.4544e-03, -6.8930e-03, 1.8212e-03, 3.0208e-03, -7.2003e-03,\n -3.7202e-03, 3.5775e-03, 1.2043e-02, -1.8218e-02, 1.0326e-02,\n -4.7054e-03, 2.6481e-02, -2.2354e-03, -9.7157e-03, -2.0954e-02,\n -2.0589e-02, -3.7296e-03, 8.4174e-03, 7.1278e-03, 1.8315e-03,\n -6.1332e-03, 2.1701e-02, 1.7961e-03, -3.5695e-02, -3.6253e-03,\n 6.3861e-03, -8.7802e-03, 2.5661e-02, -1.4770e-02, 2.3363e-03,\n 4.8627e-06, -3.4831e-03, -1.7585e-02, -1.3600e-02, -4.7705e-03,\n 3.2852e-03, -4.3559e-03, 1.2411e-02, -6.3844e-03, 1.4594e-02,\n -2.1835e-02, 2.2034e-02, 7.4159e-03, -1.9344e-02, -4.2616e-03,\n 5.3107e-03, 1.8573e-02, 3.3974e-03, 8.9747e-03, -2.9110e-02,\n -6.1603e-04, 2.6851e-02, 1.0675e-03, 3.8335e-03, -2.1870e-02,\n -7.2596e-03, 1.3847e-02, 3.5364e-04, -2.6820e-02, 4.1513e-03,\n -5.5434e-03, 8.5315e-03, 9.0884e-03, 6.4947e-03, -2.7338e-03,\n -2.1389e-02, 1.0514e-02, -3.7026e-03, -7.4370e-03, -1.8809e-02,\n -1.1799e-02, -2.1281e-02, -1.3515e-02, 2.7394e-03, -1.8285e-02,\n 2.8042e-03, 6.4321e-04, -3.2111e-02, 1.2037e-02, 2.1382e-03,\n -3.2882e-03, -8.3480e-03, -4.7763e-03, 1.0980e-02, -6.0826e-03,\n 1.2728e-02, 2.0775e-03, -4.6533e-03, -7.1669e-04, 6.6817e-03,\n 8.3459e-03, -5.2075e-03, 1.3601e-02, -7.4524e-03, 6.3202e-03,\n -3.6381e-03, -1.1919e-03, 2.1841e-02, -2.0557e-02, 2.1676e-02,\n 1.1317e-02, -2.5531e-02, 5.8963e-03, 1.7122e-02, -7.2185e-03,\n 5.5723e-04, 4.0023e-03, 7.6886e-03, -6.5542e-03, -1.0972e-04,\n 1.2319e-02, 1.0818e-02, 8.8110e-04, 5.4517e-03, -1.4672e-02,\n 7.6637e-03, -2.2257e-02, -2.4268e-03, 6.0236e-03, 5.7640e-03,\n -9.3002e-03, 6.5061e-03, 9.9962e-03, 7.4713e-03, -2.2215e-02,\n 5.7826e-03, 8.8195e-03, -1.1466e-02, 8.2011e-03, 7.4601e-04,\n 2.2986e-03, -2.8695e-03, -1.6565e-03, 2.7637e-02, 1.7682e-02,\n -1.1140e-02, 8.0441e-03, -1.1175e-02, 1.1836e-02, 3.4923e-03,\n 1.2227e-02, -1.3963e-02, 9.4421e-03, 8.7784e-03, -4.5916e-03,\n 1.3755e-02, -9.8096e-03, -1.0324e-02, -1.0254e-03, 1.3824e-02,\n -5.8864e-03, 2.8100e-02, 1.9033e-02, -1.7944e-03, 5.0956e-04,\n 1.2556e-02, 3.5404e-02, -1.1972e-02, -4.4883e-03, -6.9917e-04,\n 2.7119e-03, -4.3158e-02, 1.9065e-02, 5.5506e-03, 1.8930e-03,\n -1.5561e-02, 2.4375e-02, -3.1385e-03, 2.1630e-02, 2.1765e-03,\n -1.1839e-02, 4.0120e-03, 3.2524e-02, -1.5400e-02, 3.9087e-03,\n 9.0975e-03, -7.9342e-03, 8.9844e-03, 1.1798e-02, -6.3013e-03,\n -6.8291e-03, -3.5375e-03, 6.0614e-03, 3.3835e-02, -1.0973e-02,\n 6.9588e-03, 4.2893e-03, -1.0467e-03, 1.8468e-02, -3.2033e-03,\n -1.6772e-02, -4.8663e-04, 2.1358e-02, 8.8287e-03, -1.2741e-02,\n -9.2074e-03, 3.4563e-03, 1.7435e-02, 1.8690e-03, 2.9876e-04,\n 1.0413e-04, -1.0112e-02, 1.6502e-02, 2.1767e-03, -6.0951e-03,\n 1.9795e-02, 5.1981e-03, 6.8298e-03, -9.1880e-04, -6.1209e-03,\n 1.9639e-02, -7.0725e-03, -8.4911e-04, -3.1936e-03, -8.1469e-03,\n 2.2903e-03, -7.2077e-03, -1.2629e-03, -1.6029e-03, -3.0349e-02,\n 6.3177e-03, -2.2232e-02, -7.8631e-04, -1.0223e-02, -1.4878e-02,\n 1.2067e-03, 1.0516e-02, 7.4746e-03, 2.3452e-04, 1.0757e-02,\n -6.7234e-03, -1.9288e-02, -6.6883e-04, -1.4599e-02, 2.7748e-03,\n -2.7878e-02, 2.2437e-02, -2.1864e-02, -1.3880e-02, -9.6712e-03,\n -1.9037e-03, 5.7162e-03, 1.7645e-02, -9.6087e-03, -4.7373e-03,\n -1.1607e-02, 6.1116e-03, -6.8908e-03, -5.1185e-03, 1.2684e-02,\n 5.2543e-04, 5.7019e-03, -1.6155e-02, 8.7226e-04, -8.4820e-03,\n -4.5337e-03, 1.0811e-02, 1.4901e-02, -1.3097e-02, -1.8544e-02,\n 1.3208e-02, 3.0735e-03, 2.6452e-02, -3.4206e-02, 1.4948e-02,\n -2.2616e-03, -1.4811e-03, -1.4967e-02, 3.1700e-03, -5.1466e-02,\n 9.4068e-03, 3.6288e-03, 5.1295e-03, 6.7509e-03, 5.6759e-03,\n 1.4958e-02, 7.1466e-03, -8.6712e-04, 1.8486e-02, 7.7097e-03,\n 4.0422e-04, 1.0883e-02, 8.9003e-03, 8.4420e-03, -1.3882e-02,\n 1.2395e-02, 4.8072e-03, -4.1003e-03, -2.3001e-03, -8.5254e-03,\n 3.1507e-02, 4.4109e-03, -4.6974e-03, 1.4503e-02, -1.9600e-03,\n -1.5566e-02, -1.4285e-03, 3.3898e-03, 2.0972e-02, -3.7452e-02,\n 9.9496e-03, 1.6657e-02, 1.4277e-02, -4.9693e-04, 1.3667e-02,\n 9.2383e-03, 1.0335e-02, -4.0814e-03, 2.1612e-02, -1.1772e-02,\n 5.7829e-03, 1.9121e-03, 5.4433e-04, -2.1631e-02, -1.0545e-02,\n -1.8550e-02, -1.0206e-02, 6.1815e-03, 2.6431e-04, 6.5531e-03,\n -4.3925e-02, -1.4396e-02, -7.9888e-03, -5.1216e-03, 1.7811e-02,\n 9.3742e-03, -1.0087e-02, -9.3537e-03, 1.0426e-03, 5.4855e-03,\n -8.4249e-03, -7.2711e-04, 1.8274e-02, 8.7232e-03, 3.8414e-03,\n 1.2546e-02, 1.0764e-02, 1.6020e-02, -2.5126e-03, 5.8987e-03,\n 7.1405e-03, -4.8120e-03, -3.5610e-03, -5.2019e-03, -5.7160e-04,\n -5.4134e-03, 2.1359e-02, 7.2265e-03, -9.2278e-03, -2.0810e-03,\n -1.0700e-02, 1.0448e-03, 4.2769e-03, 4.6024e-03, -2.2860e-02,\n 2.1438e-02, 1.9457e-02, 3.5407e-03, -1.2072e-02, -3.5997e-02,\n 4.1577e-03, -5.7400e-03, -1.5299e-02, 1.0582e-02, 4.2529e-03,\n 4.8344e-03, 9.6877e-03, -9.8788e-03, 6.9282e-03, 1.5047e-02,\n -1.8485e-02, 2.0370e-03, -9.5045e-03, -1.1592e-02, 2.2464e-02,\n -1.9486e-02, 1.1776e-02, 3.4814e-03, 1.8949e-02, 1.1111e-02,\n 7.3057e-03, -5.6502e-03, 8.0085e-03, 1.0480e-02, -1.3336e-02,\n -1.5076e-02, -3.6794e-03, -1.1929e-02, 1.0319e-02, 1.8013e-02,\n 1.2966e-02, 4.3545e-03, 1.3252e-02, 1.5814e-02, 9.4098e-03,\n -6.4499e-03, 4.0679e-03, -4.1531e-03, 1.1122e-02, 1.0362e-03,\n -8.7823e-03, 7.8166e-03, -2.3918e-03, 9.2952e-04, 2.0623e-03,\n 5.4402e-03, 2.4221e-02, 1.1807e-02, -3.8971e-03, -3.0831e-02,\n -8.1170e-04, -1.7695e-02, 1.5276e-02, -9.0631e-03, -6.0323e-03,\n -5.6246e-03, -4.6081e-02, 1.5295e-02, -3.0662e-03, 1.4421e-03,\n 3.1950e-03, -1.6876e-02, 1.4467e-03, 1.9590e-02, -3.2373e-02,\n 8.8691e-03, 1.6429e-02, -3.3556e-03, 1.1395e-02, 5.2048e-03,\n -1.0511e-02, -1.3843e-02, -3.9300e-02, 9.6730e-03, 1.2379e-02,\n 2.5041e-04, 1.8809e-02, -2.1314e-03, -2.1516e-02, 2.0708e-03,\n -3.0634e-03, -8.5988e-03, -1.2090e-02, -1.2553e-02, -1.0845e-02,\n 1.0688e-03, 5.1341e-03, 1.4643e-02, -7.8537e-04, 4.6313e-03,\n -1.3006e-02, -4.9244e-03, -1.0704e-02, -4.5927e-03, 1.6731e-03,\n -4.8729e-03, -1.1680e-02, -2.1329e-03, -1.0017e-03, 6.3447e-03,\n -1.9672e-03, 2.6279e-03, -1.8901e-03, 4.0267e-03, 3.6861e-03,\n 1.4563e-02, -3.3208e-03, 4.6089e-03, -8.4111e-03, -1.5482e-02,\n 1.3915e-02, -1.1742e-02, 1.4256e-02, 2.0253e-02, -4.6216e-03,\n -2.3277e-02, -1.2902e-03, 7.1385e-03, 3.1895e-03, 2.5037e-03,\n 3.0609e-03, -2.2982e-03, -1.6950e-02, 1.0686e-02, 1.2337e-02,\n 5.1010e-03, 3.3296e-03, -8.7820e-03, 4.1231e-04, 1.4284e-02,\n 5.2430e-03, 1.3779e-02, 1.1006e-02, 3.4085e-03, 9.4340e-04,\n 1.3037e-02, -6.5691e-03, -5.1768e-03, 5.0331e-03, -3.0340e-02,\n 1.9957e-02, -2.3842e-03, 1.0488e-02, 8.7999e-04, 8.6451e-03,\n 9.6842e-03, 9.2201e-04, 7.2388e-03, -4.3417e-03, 1.7046e-02],\n device='cuda:0')",
|
| 13 |
+
"exp_avg_sq": "tensor([0.0017, 0.0019, 0.0016, 0.0015, 0.0021, 0.0019, 0.0011, 0.0017, 0.0017,\n 0.0018, 0.0026, 0.0026, 0.0028, 0.0024, 0.0014, 0.0016, 0.0017, 0.0026,\n 0.0012, 0.0022, 0.0022, 0.0015, 0.0016, 0.0024, 0.0017, 0.0023, 0.0037,\n 0.0018, 0.0021, 0.0022, 0.0014, 0.0016, 0.0030, 0.0022, 0.0019, 0.0015,\n 0.0013, 0.0020, 0.0025, 0.0017, 0.0016, 0.0011, 0.0021, 0.0017, 0.0017,\n 0.0023, 0.0021, 0.0019, 0.0018, 0.0016, 0.0016, 0.0015, 0.0017, 0.0022,\n 0.0020, 0.0021, 0.0037, 0.0017, 0.0025, 0.0015, 0.0019, 0.0020, 0.0017,\n 0.0025, 0.0025, 0.0017, 0.0032, 0.0023, 0.0021, 0.0019, 0.0028, 0.0015,\n 0.0025, 0.0022, 0.0020, 0.0017, 0.0017, 0.0014, 0.0016, 0.0019, 0.0016,\n 0.0015, 0.0016, 0.0020, 0.0015, 0.0015, 0.0016, 0.0025, 0.0020, 0.0017,\n 0.0018, 0.0027, 0.0017, 0.0016, 0.0027, 0.0018, 0.0013, 0.0016, 0.0015,\n 0.0022, 0.0020, 0.0013, 0.0016, 0.0015, 0.0017, 0.0024, 0.0015, 0.0018,\n 0.0032, 0.0019, 0.0021, 0.0018, 0.0016, 0.0019, 0.0020, 0.0017, 0.0018,\n 0.0018, 0.0017, 0.0031, 0.0027, 0.0022, 0.0017, 0.0017, 0.0025, 0.0024,\n 0.0036, 0.0018, 0.0017, 0.0016, 0.0021, 0.0031, 0.0023, 0.0017, 0.0019,\n 0.0017, 0.0019, 0.0019, 0.0024, 0.0025, 0.0018, 0.0019, 0.0023, 0.0021,\n 0.0021, 0.0016, 0.0014, 0.0018, 0.0019, 0.0015, 0.0016, 0.0018, 0.0027,\n 0.0028, 0.0020, 0.0021, 0.0025, 0.0017, 0.0020, 0.0020, 0.0021, 0.0030,\n 0.0022, 0.0022, 0.0022, 0.0017, 0.0013, 0.0026, 0.0024, 0.0028, 0.0012,\n 0.0015, 0.0017, 0.0018, 0.0025, 0.0024, 0.0021, 0.0014, 0.0015, 0.0017,\n 0.0025, 0.0022, 0.0020, 0.0015, 0.0015, 0.0016, 0.0021, 0.0018, 0.0025,\n 0.0026, 0.0020, 0.0025, 0.0017, 0.0022, 0.0016, 0.0018, 0.0015, 0.0025,\n 0.0016, 0.0021, 0.0019, 0.0020, 0.0032, 0.0033, 0.0020, 0.0017, 0.0020,\n 0.0021, 0.0021, 0.0021, 0.0019, 0.0013, 0.0018, 0.0031, 0.0016, 0.0027,\n 0.0018, 0.0018, 0.0018, 0.0021, 0.0020, 0.0020, 0.0012, 0.0021, 0.0016,\n 0.0018, 0.0025, 0.0015, 0.0023, 0.0020, 0.0020, 0.0021, 0.0019, 0.0016,\n 0.0022, 0.0026, 0.0017, 0.0023, 0.0017, 0.0023, 0.0017, 0.0018, 0.0018,\n 0.0025, 0.0023, 0.0019, 0.0024, 0.0023, 0.0018, 0.0020, 0.0017, 0.0014,\n 0.0035, 0.0021, 0.0015, 0.0017, 0.0022, 0.0017, 0.0015, 0.0017, 0.0015,\n 0.0019, 0.0014, 0.0029, 0.0025, 0.0018, 0.0016, 0.0013, 0.0017, 0.0016,\n 0.0019, 0.0040, 0.0018, 0.0018, 0.0015, 0.0020, 0.0017, 0.0016, 0.0018,\n 0.0017, 0.0016, 0.0025, 0.0027, 0.0024, 0.0017, 0.0019, 0.0019, 0.0015,\n 0.0027, 0.0017, 0.0017, 0.0017, 0.0017, 0.0014, 0.0018, 0.0022, 0.0019,\n 0.0015, 0.0030, 0.0020, 0.0017, 0.0017, 0.0025, 0.0014, 0.0018, 0.0022,\n 0.0017, 0.0018, 0.0017, 0.0021, 0.0015, 0.0019, 0.0012, 0.0026, 0.0028,\n 0.0020, 0.0023, 0.0020, 0.0019, 0.0018, 0.0021, 0.0024, 0.0020, 0.0019,\n 0.0021, 0.0024, 0.0023, 0.0021, 0.0028, 0.0016, 0.0038, 0.0015, 0.0025,\n 0.0018, 0.0028, 0.0027, 0.0019, 0.0015, 0.0028, 0.0020, 0.0019, 0.0020,\n 0.0014, 0.0020, 0.0026, 0.0023, 0.0015, 0.0016, 0.0019, 0.0022, 0.0015,\n 0.0021, 0.0035, 0.0022, 0.0025, 0.0017, 0.0021, 0.0018, 0.0018, 0.0021,\n 0.0014, 0.0015, 0.0017, 0.0021, 0.0028, 0.0023, 0.0024, 0.0028, 0.0019,\n 0.0026, 0.0022, 0.0025, 0.0017, 0.0030, 0.0022, 0.0024, 0.0028, 0.0023,\n 0.0017, 0.0019, 0.0024, 0.0018, 0.0018, 0.0017, 0.0020, 0.0016, 0.0026,\n 0.0025, 0.0018, 0.0019, 0.0017, 0.0020, 0.0020, 0.0025, 0.0017, 0.0018,\n 0.0017, 0.0024, 0.0020, 0.0042, 0.0017, 0.0020, 0.0020, 0.0018, 0.0020,\n 0.0026, 0.0032, 0.0015, 0.0019, 0.0018, 0.0034, 0.0021, 0.0031, 0.0018,\n 0.0020, 0.0015, 0.0016, 0.0015, 0.0016, 0.0017, 0.0028, 0.0018, 0.0023,\n 0.0029, 0.0017, 0.0018, 0.0025, 0.0024, 0.0018, 0.0030, 0.0019, 0.0019,\n 0.0011, 0.0021, 0.0022, 0.0019, 0.0022, 0.0019, 0.0026, 0.0032, 0.0015,\n 0.0015, 0.0014, 0.0031, 0.0031, 0.0024, 0.0023, 0.0020, 0.0016, 0.0026,\n 0.0038, 0.0015, 0.0016, 0.0023, 0.0018, 0.0018, 0.0020, 0.0025, 0.0023,\n 0.0017, 0.0019, 0.0017, 0.0018, 0.0019, 0.0022, 0.0018, 0.0020, 0.0023,\n 0.0016, 0.0022, 0.0021, 0.0024, 0.0013, 0.0030, 0.0018, 0.0022, 0.0024,\n 0.0014, 0.0017, 0.0019, 0.0030, 0.0014, 0.0022, 0.0020, 0.0020, 0.0022,\n 0.0021, 0.0019, 0.0017, 0.0017, 0.0016, 0.0030, 0.0015, 0.0017, 0.0018,\n 0.0015, 0.0019, 0.0014, 0.0029, 0.0019, 0.0015, 0.0018, 0.0015, 0.0022,\n 0.0020, 0.0022, 0.0022, 0.0020, 0.0017, 0.0023, 0.0019, 0.0023, 0.0013,\n 0.0021, 0.0011, 0.0026, 0.0015, 0.0018, 0.0019, 0.0020, 0.0025, 0.0019,\n 0.0017, 0.0016, 0.0020, 0.0019, 0.0015, 0.0017, 0.0021, 0.0021, 0.0019,\n 0.0016, 0.0012, 0.0017, 0.0023, 0.0017, 0.0021, 0.0018, 0.0013, 0.0024,\n 0.0015, 0.0020, 0.0017, 0.0019, 0.0024, 0.0021, 0.0018, 0.0021, 0.0014,\n 0.0013, 0.0019, 0.0019, 0.0021, 0.0018, 0.0018, 0.0020, 0.0023, 0.0020,\n 0.0021, 0.0018, 0.0020, 0.0022, 0.0014, 0.0025, 0.0017, 0.0016, 0.0018,\n 0.0013, 0.0029, 0.0025, 0.0019, 0.0022, 0.0023, 0.0020, 0.0024, 0.0020,\n 0.0021, 0.0036, 0.0016, 0.0028, 0.0022, 0.0027, 0.0025, 0.0019, 0.0018,\n 0.0020, 0.0021, 0.0014, 0.0016, 0.0025, 0.0019, 0.0032, 0.0024, 0.0020,\n 0.0015, 0.0018, 0.0015, 0.0020, 0.0019, 0.0017, 0.0013, 0.0019, 0.0029,\n 0.0021, 0.0018, 0.0018, 0.0021, 0.0017, 0.0022, 0.0019, 0.0019, 0.0021,\n 0.0016, 0.0024, 0.0025, 0.0014, 0.0044, 0.0018, 0.0028, 0.0017, 0.0029,\n 0.0021, 0.0017, 0.0022, 0.0015, 0.0019, 0.0024, 0.0011, 0.0017, 0.0021,\n 0.0022, 0.0031, 0.0017, 0.0023, 0.0024, 0.0018, 0.0025, 0.0025, 0.0015,\n 0.0017], device='cuda:0')"
|
| 14 |
},
|
| 15 |
"2": {
|
| 16 |
+
"step": "tensor(3756.)",
|
| 17 |
+
"exp_avg": "tensor([[-2.0531e-04, 2.6832e-04, -6.0653e-05, ..., -6.8946e-05,\n 1.3081e-04, -3.1265e-04],\n [-1.5010e-04, 2.7194e-05, -4.7230e-05, ..., 1.9473e-05,\n -2.3948e-04, -3.1832e-04],\n [-3.2661e-05, -2.5834e-04, 5.6320e-05, ..., 7.7295e-05,\n -8.1635e-04, 8.1857e-05],\n ...,\n [ 6.3526e-05, -2.0283e-05, -2.0169e-04, ..., -9.2684e-05,\n 2.1288e-04, -1.7126e-04],\n [-1.1934e-04, 1.8057e-04, 3.5367e-04, ..., 1.4586e-05,\n 9.6794e-06, -1.6967e-04],\n [ 1.1826e-05, 4.2725e-04, -3.2022e-04, ..., 7.0693e-05,\n -4.3537e-04, -3.5973e-04]], device='cuda:0')",
|
| 18 |
+
"exp_avg_sq": "tensor([[5.2474e-07, 4.8824e-07, 5.0117e-07, ..., 2.0473e-07, 5.6365e-07,\n 1.4658e-06],\n [9.0473e-07, 1.4383e-06, 8.6538e-07, ..., 5.9647e-07, 1.7928e-06,\n 1.6739e-06],\n [1.1156e-06, 1.5511e-06, 1.1785e-06, ..., 6.4719e-07, 1.0678e-06,\n 9.4882e-07],\n ...,\n [1.1252e-06, 1.0989e-06, 1.0603e-06, ..., 7.4304e-07, 1.2404e-06,\n 2.8223e-06],\n [1.1438e-06, 2.1048e-06, 1.1909e-06, ..., 4.8723e-07, 1.1319e-06,\n 1.8908e-06],\n [1.5152e-06, 6.8419e-07, 1.6502e-06, ..., 7.0794e-07, 1.0720e-06,\n 1.9125e-06]], device='cuda:0')"
|
| 19 |
}
|
| 20 |
},
|
| 21 |
"param_groups": [
|
| 22 |
{
|
| 23 |
+
"lr": 0.0007940987335200904,
|
| 24 |
"name": "scale_256",
|
| 25 |
"betas": [
|
| 26 |
0.9,
|
|
|
|
| 43 |
]
|
| 44 |
},
|
| 45 |
{
|
| 46 |
+
"lr": 0.0007940987335200904,
|
| 47 |
"name": "scale_512",
|
| 48 |
"betas": [
|
| 49 |
0.9,
|
|
|
|
| 66 |
]
|
| 67 |
},
|
| 68 |
{
|
| 69 |
+
"lr": 0.0007940987335200904,
|
| 70 |
"name": "scale_768",
|
| 71 |
"betas": [
|
| 72 |
0.9,
|
|
|
|
| 89 |
]
|
| 90 |
},
|
| 91 |
{
|
| 92 |
+
"lr": 0.0007940987335200904,
|
| 93 |
"name": "scale_1024",
|
| 94 |
"betas": [
|
| 95 |
0.9,
|
|
|
|
| 112 |
]
|
| 113 |
},
|
| 114 |
{
|
| 115 |
+
"lr": 0.0007940987335200904,
|
| 116 |
"name": "scale_1280",
|
| 117 |
"betas": [
|
| 118 |
0.9,
|
|
|
|
| 135 |
]
|
| 136 |
},
|
| 137 |
{
|
| 138 |
+
"lr": 0.00039715242044697206,
|
| 139 |
"name": "fusion",
|
| 140 |
"betas": [
|
| 141 |
0.9,
|
|
|
|
| 195 |
"T_i": 10,
|
| 196 |
"T_mult": 2,
|
| 197 |
"eta_min": 1e-06,
|
| 198 |
+
"T_cur": 3,
|
| 199 |
"base_lrs": [
|
| 200 |
0.001,
|
| 201 |
0.001,
|
|
|
|
| 204 |
0.001,
|
| 205 |
0.0005
|
| 206 |
],
|
| 207 |
+
"last_epoch": 3,
|
| 208 |
"_step_count": 0,
|
| 209 |
"_is_initial": false,
|
| 210 |
"_get_lr_called_within_step": false,
|
| 211 |
"_last_lr": [
|
| 212 |
+
0.0007940987335200904,
|
| 213 |
+
0.0007940987335200904,
|
| 214 |
+
0.0007940987335200904,
|
| 215 |
+
0.0007940987335200904,
|
| 216 |
+
0.0007940987335200904,
|
| 217 |
+
0.00039715242044697206
|
| 218 |
]
|
| 219 |
},
|
| 220 |
"metrics": {
|
| 221 |
+
"best_val_acc": 71.666,
|
| 222 |
+
"best_epoch": 2,
|
| 223 |
"scale_accuracies": {
|
| 224 |
+
"256": 71.666
|
| 225 |
}
|
| 226 |
},
|
| 227 |
"train_config": {
|